diff --git "a/wandb/run-20220310_212039-1nikmzrh/files/wandb-summary.json" "b/wandb/run-20220310_212039-1nikmzrh/files/wandb-summary.json" --- "a/wandb/run-20220310_212039-1nikmzrh/files/wandb-summary.json" +++ "b/wandb/run-20220310_212039-1nikmzrh/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.4112, "train/learning_rate": 2.3978622327790973e-06, "train/epoch": 18.5, "train/global_step": 16500, "_runtime": 98398, "_timestamp": 1647045637, "_step": 16510, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 8.0, 3.0, 10.0, 5.0, 11.0, 14.0, 11.0, 8.0, 17.0, 16.0, 24.0, 20.0, 29.0, 38.0, 25.0, 37.0, 34.0, 44.0, 40.0, 39.0, 31.0, 33.0, 53.0, 43.0, 43.0, 36.0, 42.0, 38.0, 40.0, 31.0, 32.0, 25.0, 11.0, 21.0, 14.0, 11.0, 14.0, 12.0, 8.0, 12.0, 5.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-49.009525299072266, -48.12847137451172, -47.24742126464844, -46.36636734008789, -45.48531723022461, -44.60426330566406, -43.72321319580078, -42.842159271240234, -41.96110534667969, -41.08005142211914, -40.19900131225586, -39.31794738769531, -38.43689727783203, -37.555843353271484, -36.6747932434082, -35.793739318847656, -34.912689208984375, -34.03163528442383, -33.15058517456055, -32.26953125, -31.38848114013672, -30.507427215576172, -29.626375198364258, -28.745323181152344, -27.86427116394043, -26.983219146728516, -26.1021671295166, -25.221115112304688, -24.34006118774414, -23.45901107788086, -22.577957153320312, -21.6969051361084, -20.815853118896484, -19.93480110168457, -19.053749084472656, -18.172697067260742, -17.291645050048828, -16.41059112548828, -15.529539108276367, -14.648487091064453, -13.767434120178223, -12.886382102966309, -12.005329132080078, -11.124277114868164, -10.24322509765625, -9.362173080444336, -8.481121063232422, -7.600068092346191, -6.719016075134277, -5.837964057922363, -4.956911563873291, -4.075859069824219, -3.1948070526123047, -2.3137550354003906, -1.4327025413513184, -0.5516500473022461, 0.32940196990966797, 1.2104542255401611, 2.0915064811706543, 2.9725587368011475, 3.8536109924316406, 4.734663009643555, 5.615715503692627, 6.496767997741699, 7.377820014953613]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 6.0, 2.0, 4.0, 5.0, 12.0, 9.0, 6.0, 12.0, 19.0, 12.0, 16.0, 10.0, 20.0, 29.0, 42.0, 29.0, 32.0, 36.0, 36.0, 37.0, 30.0, 33.0, 47.0, 46.0, 49.0, 32.0, 44.0, 45.0, 34.0, 36.0, 26.0, 29.0, 20.0, 18.0, 22.0, 15.0, 18.0, 13.0, 16.0, 7.0, 22.0, 10.0, 10.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-27.398508071899414, -26.53114128112793, -25.663776397705078, -24.796409606933594, -23.929044723510742, -23.061677932739258, -22.194313049316406, -21.326946258544922, -20.459579467773438, -19.592212677001953, -18.7248477935791, -17.857481002807617, -16.990116119384766, -16.12274932861328, -15.255383491516113, -14.388017654418945, -13.520652770996094, -12.653286933898926, -11.785921096801758, -10.918554306030273, -10.051189422607422, -9.183822631835938, -8.31645679473877, -7.449090957641602, -6.581725120544434, -5.714359283447266, -4.846993446350098, -3.9796271324157715, -3.1122612953186035, -2.2448954582214355, -1.3775291442871094, -0.5101633071899414, 0.3572044372558594, 1.224570393562317, 2.0919363498687744, 2.9593024253845215, 3.8266682624816895, 4.694034099578857, 5.561400413513184, 6.428766250610352, 7.2961320877075195, 8.163497924804688, 9.030863761901855, 9.898229598999023, 10.765596389770508, 11.63296127319336, 12.500328063964844, 13.367693901062012, 14.23505973815918, 15.102425575256348, 15.969791412353516, 16.837158203125, 17.70452308654785, 18.571889877319336, 19.439254760742188, 20.306621551513672, 21.173988342285156, 22.04135513305664, 22.908720016479492, 23.776086807250977, 24.643451690673828, 25.510818481445312, 26.378185272216797, 27.24555015563965, 28.1129150390625]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 6.0, 9.0, 21.0, 19.0, 38.0, 67.0, 107.0, 164.0, 297.0, 437.0, 700.0, 1205.0, 1883.0, 3272.0, 5480.0, 9110.0, 15576.0, 25785.0, 42868.0, 70206.0, 114269.0, 181292.0, 278806.0, 406860.0, 540171.0, 611332.0, 570135.0, 448662.0, 314825.0, 207513.0, 132166.0, 82664.0, 51002.0, 30698.0, 18897.0, 11283.0, 6734.0, 3828.0, 2385.0, 1390.0, 861.0, 492.0, 305.0, 174.0, 120.0, 61.0, 40.0, 31.0, 17.0, 11.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0], "bins": [-45.9375, -44.57275390625, -43.2080078125, -41.84326171875, -40.478515625, -39.11376953125, -37.7490234375, -36.38427734375, -35.01953125, -33.65478515625, -32.2900390625, -30.92529296875, -29.560546875, -28.19580078125, -26.8310546875, -25.46630859375, -24.1015625, -22.73681640625, -21.3720703125, -20.00732421875, -18.642578125, -17.27783203125, -15.9130859375, -14.54833984375, -13.18359375, -11.81884765625, -10.4541015625, -9.08935546875, -7.724609375, -6.35986328125, -4.9951171875, -3.63037109375, -2.265625, -0.90087890625, 0.4638671875, 1.82861328125, 3.193359375, 4.55810546875, 5.9228515625, 7.28759765625, 8.65234375, 10.01708984375, 11.3818359375, 12.74658203125, 14.111328125, 15.47607421875, 16.8408203125, 18.20556640625, 19.5703125, 20.93505859375, 22.2998046875, 23.66455078125, 25.029296875, 26.39404296875, 27.7587890625, 29.12353515625, 30.48828125, 31.85302734375, 33.2177734375, 34.58251953125, 35.947265625, 37.31201171875, 38.6767578125, 40.04150390625, 41.40625]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 4.0, 5.0, 5.0, 4.0, 6.0, 13.0, 12.0, 15.0, 16.0, 20.0, 25.0, 25.0, 24.0, 19.0, 30.0, 36.0, 38.0, 46.0, 46.0, 33.0, 31.0, 44.0, 51.0, 30.0, 48.0, 39.0, 34.0, 36.0, 38.0, 31.0, 27.0, 26.0, 24.0, 14.0, 10.0, 20.0, 14.0, 12.0, 9.0, 12.0, 8.0, 7.0, 7.0, 6.0, 3.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-31.671875, -30.7421875, -29.8125, -28.8828125, -27.953125, -27.0234375, -26.09375, -25.1640625, -24.234375, -23.3046875, -22.375, -21.4453125, -20.515625, -19.5859375, -18.65625, -17.7265625, -16.796875, -15.8671875, -14.9375, -14.0078125, -13.078125, -12.1484375, -11.21875, -10.2890625, -9.359375, -8.4296875, -7.5, -6.5703125, -5.640625, -4.7109375, -3.78125, -2.8515625, -1.921875, -0.9921875, -0.0625, 0.8671875, 1.796875, 2.7265625, 3.65625, 4.5859375, 5.515625, 6.4453125, 7.375, 8.3046875, 9.234375, 10.1640625, 11.09375, 12.0234375, 12.953125, 13.8828125, 14.8125, 15.7421875, 16.671875, 17.6015625, 18.53125, 19.4609375, 20.390625, 21.3203125, 22.25, 23.1796875, 24.109375, 25.0390625, 25.96875, 26.8984375, 27.828125]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 7.0, 7.0, 22.0, 21.0, 40.0, 66.0, 111.0, 155.0, 286.0, 405.0, 704.0, 1224.0, 1914.0, 3069.0, 5090.0, 7900.0, 12633.0, 20051.0, 31047.0, 47586.0, 71945.0, 105910.0, 151656.0, 211409.0, 279482.0, 351691.0, 411712.0, 446630.0, 438420.0, 397264.0, 330931.0, 259629.0, 193063.0, 137478.0, 95461.0, 63406.0, 41915.0, 27504.0, 17285.0, 10921.0, 6969.0, 4301.0, 2667.0, 1632.0, 1024.0, 626.0, 416.0, 239.0, 138.0, 89.0, 55.0, 43.0, 20.0, 12.0, 4.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-29.25, -28.302001953125, -27.35400390625, -26.406005859375, -25.4580078125, -24.510009765625, -23.56201171875, -22.614013671875, -21.666015625, -20.718017578125, -19.77001953125, -18.822021484375, -17.8740234375, -16.926025390625, -15.97802734375, -15.030029296875, -14.08203125, -13.134033203125, -12.18603515625, -11.238037109375, -10.2900390625, -9.342041015625, -8.39404296875, -7.446044921875, -6.498046875, -5.550048828125, -4.60205078125, -3.654052734375, -2.7060546875, -1.758056640625, -0.81005859375, 0.137939453125, 1.0859375, 2.033935546875, 2.98193359375, 3.929931640625, 4.8779296875, 5.825927734375, 6.77392578125, 7.721923828125, 8.669921875, 9.617919921875, 10.56591796875, 11.513916015625, 12.4619140625, 13.409912109375, 14.35791015625, 15.305908203125, 16.25390625, 17.201904296875, 18.14990234375, 19.097900390625, 20.0458984375, 20.993896484375, 21.94189453125, 22.889892578125, 23.837890625, 24.785888671875, 25.73388671875, 26.681884765625, 27.6298828125, 28.577880859375, 29.52587890625, 30.473876953125, 31.421875]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 9.0, 5.0, 12.0, 23.0, 20.0, 29.0, 31.0, 30.0, 49.0, 57.0, 70.0, 94.0, 70.0, 112.0, 130.0, 165.0, 159.0, 169.0, 172.0, 202.0, 191.0, 219.0, 185.0, 191.0, 219.0, 205.0, 190.0, 156.0, 130.0, 118.0, 92.0, 100.0, 101.0, 58.0, 66.0, 35.0, 41.0, 29.0, 24.0, 26.0, 18.0, 15.0, 11.0, 11.0, 11.0, 9.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-14.4765625, -14.010498046875, -13.54443359375, -13.078369140625, -12.6123046875, -12.146240234375, -11.68017578125, -11.214111328125, -10.748046875, -10.281982421875, -9.81591796875, -9.349853515625, -8.8837890625, -8.417724609375, -7.95166015625, -7.485595703125, -7.01953125, -6.553466796875, -6.08740234375, -5.621337890625, -5.1552734375, -4.689208984375, -4.22314453125, -3.757080078125, -3.291015625, -2.824951171875, -2.35888671875, -1.892822265625, -1.4267578125, -0.960693359375, -0.49462890625, -0.028564453125, 0.4375, 0.903564453125, 1.36962890625, 1.835693359375, 2.3017578125, 2.767822265625, 3.23388671875, 3.699951171875, 4.166015625, 4.632080078125, 5.09814453125, 5.564208984375, 6.0302734375, 6.496337890625, 6.96240234375, 7.428466796875, 7.89453125, 8.360595703125, 8.82666015625, 9.292724609375, 9.7587890625, 10.224853515625, 10.69091796875, 11.156982421875, 11.623046875, 12.089111328125, 12.55517578125, 13.021240234375, 13.4873046875, 13.953369140625, 14.41943359375, 14.885498046875, 15.3515625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 3.0, 6.0, 6.0, 15.0, 7.0, 14.0, 16.0, 17.0, 19.0, 15.0, 21.0, 37.0, 32.0, 42.0, 36.0, 35.0, 45.0, 30.0, 38.0, 53.0, 43.0, 44.0, 46.0, 35.0, 41.0, 27.0, 31.0, 30.0, 30.0, 31.0, 17.0, 23.0, 22.0, 18.0, 17.0, 13.0, 9.0, 4.0, 6.0, 5.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.58919906616211, -29.544570922851562, -28.499942779541016, -27.4553165435791, -26.410688400268555, -25.366060256958008, -24.321434020996094, -23.276805877685547, -22.232177734375, -21.187549591064453, -20.142921447753906, -19.098295211791992, -18.053667068481445, -17.0090389251709, -15.964411735534668, -14.919784545898438, -13.87515640258789, -12.830528259277344, -11.785901069641113, -10.741273880004883, -9.696645736694336, -8.652017593383789, -7.607390403747559, -6.56276273727417, -5.518135070800781, -4.473507404327393, -3.428879737854004, -2.3842520713806152, -1.3396244049072266, -0.2949967384338379, 0.7496309280395508, 1.7942585945129395, 2.8388824462890625, 3.883510112762451, 4.92813777923584, 5.9727654457092285, 7.017393112182617, 8.062021255493164, 9.106648445129395, 10.151275634765625, 11.195903778076172, 12.240531921386719, 13.28515911102295, 14.32978630065918, 15.374414443969727, 16.419042587280273, 17.463668823242188, 18.508296966552734, 19.55292510986328, 20.597553253173828, 21.642181396484375, 22.68680763244629, 23.731435775756836, 24.776063919067383, 25.820690155029297, 26.865318298339844, 27.90994644165039, 28.954574584960938, 29.999202728271484, 31.0438289642334, 32.08845520019531, 33.13308334350586, 34.177711486816406, 35.22233963012695, 36.2669677734375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 5.0, 5.0, 6.0, 6.0, 11.0, 10.0, 13.0, 17.0, 24.0, 22.0, 21.0, 27.0, 18.0, 27.0, 30.0, 41.0, 37.0, 37.0, 37.0, 46.0, 47.0, 41.0, 33.0, 36.0, 48.0, 47.0, 36.0, 37.0, 28.0, 28.0, 30.0, 17.0, 24.0, 15.0, 17.0, 12.0, 12.0, 11.0, 11.0, 7.0, 6.0, 9.0, 6.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0], "bins": [-38.14582824707031, -37.04217529296875, -35.93851852416992, -34.83486557006836, -33.73120880126953, -32.62755584716797, -31.523902893066406, -30.42024803161621, -29.316593170166016, -28.21293830871582, -27.109283447265625, -26.005630493164062, -24.901975631713867, -23.798320770263672, -22.69466781616211, -21.591012954711914, -20.48735809326172, -19.383703231811523, -18.280048370361328, -17.176395416259766, -16.07274055480957, -14.969085693359375, -13.865431785583496, -12.761777877807617, -11.658123016357422, -10.554468154907227, -9.450814247131348, -8.347160339355469, -7.243505477905273, -6.139851093292236, -5.036196708679199, -3.932542324066162, -2.828887939453125, -1.725233554840088, -0.6215791702270508, 0.48207521438598633, 1.5857295989990234, 2.6893839836120605, 3.7930383682250977, 4.896692752838135, 6.000347137451172, 7.104001522064209, 8.207655906677246, 9.311309814453125, 10.41496467590332, 11.518619537353516, 12.622273445129395, 13.725927352905273, 14.829582214355469, 15.933237075805664, 17.03689193725586, 18.140544891357422, 19.244199752807617, 20.347854614257812, 21.451507568359375, 22.55516242980957, 23.658817291259766, 24.76247215270996, 25.866127014160156, 26.96977996826172, 28.073434829711914, 29.17708969116211, 30.280742645263672, 31.384397506713867, 32.48805236816406]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 8.0, 10.0, 13.0, 10.0, 20.0, 38.0, 47.0, 64.0, 103.0, 162.0, 240.0, 332.0, 499.0, 752.0, 1162.0, 1698.0, 2641.0, 4173.0, 6679.0, 10765.0, 17489.0, 28411.0, 45766.0, 71443.0, 105652.0, 140669.0, 158895.0, 144181.0, 108280.0, 73638.0, 47074.0, 29163.0, 18038.0, 11168.0, 6833.0, 4341.0, 2814.0, 1725.0, 1141.0, 772.0, 538.0, 352.0, 260.0, 156.0, 119.0, 82.0, 50.0, 30.0, 26.0, 10.0, 8.0, 7.0, 7.0, 2.0, 3.0, 2.0, 3.0], "bins": [-29.859375, -28.968994140625, -28.07861328125, -27.188232421875, -26.2978515625, -25.407470703125, -24.51708984375, -23.626708984375, -22.736328125, -21.845947265625, -20.95556640625, -20.065185546875, -19.1748046875, -18.284423828125, -17.39404296875, -16.503662109375, -15.61328125, -14.722900390625, -13.83251953125, -12.942138671875, -12.0517578125, -11.161376953125, -10.27099609375, -9.380615234375, -8.490234375, -7.599853515625, -6.70947265625, -5.819091796875, -4.9287109375, -4.038330078125, -3.14794921875, -2.257568359375, -1.3671875, -0.476806640625, 0.41357421875, 1.303955078125, 2.1943359375, 3.084716796875, 3.97509765625, 4.865478515625, 5.755859375, 6.646240234375, 7.53662109375, 8.427001953125, 9.3173828125, 10.207763671875, 11.09814453125, 11.988525390625, 12.87890625, 13.769287109375, 14.65966796875, 15.550048828125, 16.4404296875, 17.330810546875, 18.22119140625, 19.111572265625, 20.001953125, 20.892333984375, 21.78271484375, 22.673095703125, 23.5634765625, 24.453857421875, 25.34423828125, 26.234619140625, 27.125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 8.0, 5.0, 5.0, 8.0, 11.0, 10.0, 10.0, 24.0, 19.0, 25.0, 17.0, 28.0, 22.0, 25.0, 36.0, 31.0, 41.0, 43.0, 32.0, 45.0, 45.0, 44.0, 27.0, 44.0, 49.0, 45.0, 41.0, 32.0, 25.0, 34.0, 26.0, 15.0, 28.0, 14.0, 15.0, 10.0, 14.0, 12.0, 8.0, 8.0, 7.0, 8.0, 8.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-38.9375, -37.80810546875, -36.6787109375, -35.54931640625, -34.419921875, -33.29052734375, -32.1611328125, -31.03173828125, -29.90234375, -28.77294921875, -27.6435546875, -26.51416015625, -25.384765625, -24.25537109375, -23.1259765625, -21.99658203125, -20.8671875, -19.73779296875, -18.6083984375, -17.47900390625, -16.349609375, -15.22021484375, -14.0908203125, -12.96142578125, -11.83203125, -10.70263671875, -9.5732421875, -8.44384765625, -7.314453125, -6.18505859375, -5.0556640625, -3.92626953125, -2.796875, -1.66748046875, -0.5380859375, 0.59130859375, 1.720703125, 2.85009765625, 3.9794921875, 5.10888671875, 6.23828125, 7.36767578125, 8.4970703125, 9.62646484375, 10.755859375, 11.88525390625, 13.0146484375, 14.14404296875, 15.2734375, 16.40283203125, 17.5322265625, 18.66162109375, 19.791015625, 20.92041015625, 22.0498046875, 23.17919921875, 24.30859375, 25.43798828125, 26.5673828125, 27.69677734375, 28.826171875, 29.95556640625, 31.0849609375, 32.21435546875, 33.34375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 6.0, 4.0, 6.0, 14.0, 16.0, 23.0, 30.0, 45.0, 61.0, 123.0, 135.0, 210.0, 324.0, 498.0, 875.0, 1458.0, 2687.0, 4978.0, 9987.0, 21707.0, 51755.0, 129811.0, 281034.0, 295229.0, 143481.0, 57063.0, 23727.0, 10990.0, 5378.0, 2815.0, 1572.0, 939.0, 550.0, 350.0, 202.0, 156.0, 106.0, 68.0, 56.0, 30.0, 23.0, 16.0, 11.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.34375, -38.1162109375, -36.888671875, -35.6611328125, -34.43359375, -33.2060546875, -31.978515625, -30.7509765625, -29.5234375, -28.2958984375, -27.068359375, -25.8408203125, -24.61328125, -23.3857421875, -22.158203125, -20.9306640625, -19.703125, -18.4755859375, -17.248046875, -16.0205078125, -14.79296875, -13.5654296875, -12.337890625, -11.1103515625, -9.8828125, -8.6552734375, -7.427734375, -6.2001953125, -4.97265625, -3.7451171875, -2.517578125, -1.2900390625, -0.0625, 1.1650390625, 2.392578125, 3.6201171875, 4.84765625, 6.0751953125, 7.302734375, 8.5302734375, 9.7578125, 10.9853515625, 12.212890625, 13.4404296875, 14.66796875, 15.8955078125, 17.123046875, 18.3505859375, 19.578125, 20.8056640625, 22.033203125, 23.2607421875, 24.48828125, 25.7158203125, 26.943359375, 28.1708984375, 29.3984375, 30.6259765625, 31.853515625, 33.0810546875, 34.30859375, 35.5361328125, 36.763671875, 37.9912109375, 39.21875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 9.0, 10.0, 5.0, 6.0, 11.0, 9.0, 16.0, 17.0, 9.0, 16.0, 19.0, 24.0, 19.0, 21.0, 29.0, 27.0, 38.0, 30.0, 30.0, 45.0, 37.0, 36.0, 41.0, 32.0, 38.0, 52.0, 39.0, 40.0, 32.0, 31.0, 35.0, 20.0, 26.0, 16.0, 28.0, 18.0, 13.0, 12.0, 10.0, 14.0, 9.0, 8.0, 10.0, 3.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.828125, -19.13916015625, -18.4501953125, -17.76123046875, -17.072265625, -16.38330078125, -15.6943359375, -15.00537109375, -14.31640625, -13.62744140625, -12.9384765625, -12.24951171875, -11.560546875, -10.87158203125, -10.1826171875, -9.49365234375, -8.8046875, -8.11572265625, -7.4267578125, -6.73779296875, -6.048828125, -5.35986328125, -4.6708984375, -3.98193359375, -3.29296875, -2.60400390625, -1.9150390625, -1.22607421875, -0.537109375, 0.15185546875, 0.8408203125, 1.52978515625, 2.21875, 2.90771484375, 3.5966796875, 4.28564453125, 4.974609375, 5.66357421875, 6.3525390625, 7.04150390625, 7.73046875, 8.41943359375, 9.1083984375, 9.79736328125, 10.486328125, 11.17529296875, 11.8642578125, 12.55322265625, 13.2421875, 13.93115234375, 14.6201171875, 15.30908203125, 15.998046875, 16.68701171875, 17.3759765625, 18.06494140625, 18.75390625, 19.44287109375, 20.1318359375, 20.82080078125, 21.509765625, 22.19873046875, 22.8876953125, 23.57666015625, 24.265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 2.0, 5.0, 5.0, 10.0, 8.0, 16.0, 32.0, 42.0, 44.0, 48.0, 90.0, 112.0, 166.0, 260.0, 351.0, 534.0, 703.0, 1098.0, 1648.0, 2574.0, 4227.0, 7294.0, 13002.0, 24363.0, 49627.0, 114680.0, 259839.0, 297810.0, 142958.0, 61625.0, 28816.0, 14881.0, 8210.0, 4920.0, 2976.0, 1777.0, 1210.0, 791.0, 555.0, 381.0, 255.0, 177.0, 126.0, 85.0, 67.0, 46.0, 41.0, 20.0, 15.0, 12.0, 9.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0], "bins": [-19.03125, -18.4736328125, -17.916015625, -17.3583984375, -16.80078125, -16.2431640625, -15.685546875, -15.1279296875, -14.5703125, -14.0126953125, -13.455078125, -12.8974609375, -12.33984375, -11.7822265625, -11.224609375, -10.6669921875, -10.109375, -9.5517578125, -8.994140625, -8.4365234375, -7.87890625, -7.3212890625, -6.763671875, -6.2060546875, -5.6484375, -5.0908203125, -4.533203125, -3.9755859375, -3.41796875, -2.8603515625, -2.302734375, -1.7451171875, -1.1875, -0.6298828125, -0.072265625, 0.4853515625, 1.04296875, 1.6005859375, 2.158203125, 2.7158203125, 3.2734375, 3.8310546875, 4.388671875, 4.9462890625, 5.50390625, 6.0615234375, 6.619140625, 7.1767578125, 7.734375, 8.2919921875, 8.849609375, 9.4072265625, 9.96484375, 10.5224609375, 11.080078125, 11.6376953125, 12.1953125, 12.7529296875, 13.310546875, 13.8681640625, 14.42578125, 14.9833984375, 15.541015625, 16.0986328125, 16.65625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 4.0, 2.0, 6.0, 5.0, 6.0, 10.0, 8.0, 13.0, 13.0, 10.0, 19.0, 20.0, 35.0, 46.0, 50.0, 46.0, 45.0, 57.0, 69.0, 67.0, 59.0, 59.0, 70.0, 49.0, 43.0, 31.0, 23.0, 18.0, 19.0, 16.0, 13.0, 7.0, 17.0, 9.0, 6.0, 9.0, 4.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.0010080337524414062, -0.0009749382734298706, -0.000941842794418335, -0.0009087473154067993, -0.0008756518363952637, -0.000842556357383728, -0.0008094608783721924, -0.0007763653993606567, -0.0007432699203491211, -0.0007101744413375854, -0.0006770789623260498, -0.0006439834833145142, -0.0006108880043029785, -0.0005777925252914429, -0.0005446970462799072, -0.0005116015672683716, -0.00047850608825683594, -0.0004454106092453003, -0.00041231513023376465, -0.000379219651222229, -0.00034612417221069336, -0.0003130286931991577, -0.00027993321418762207, -0.0002468377351760864, -0.00021374225616455078, -0.00018064677715301514, -0.0001475512981414795, -0.00011445581912994385, -8.13603401184082e-05, -4.826486110687256e-05, -1.5169382095336914e-05, 1.792609691619873e-05, 5.1021575927734375e-05, 8.411705493927002e-05, 0.00011721253395080566, 0.0001503080129623413, 0.00018340349197387695, 0.0002164989709854126, 0.00024959444999694824, 0.0002826899290084839, 0.00031578540802001953, 0.0003488808870315552, 0.0003819763660430908, 0.00041507184505462646, 0.0004481673240661621, 0.00048126280307769775, 0.0005143582820892334, 0.000547453761100769, 0.0005805492401123047, 0.0006136447191238403, 0.000646740198135376, 0.0006798356771469116, 0.0007129311561584473, 0.0007460266351699829, 0.0007791221141815186, 0.0008122175931930542, 0.0008453130722045898, 0.0008784085512161255, 0.0009115040302276611, 0.0009445995092391968, 0.0009776949882507324, 0.001010790467262268, 0.0010438859462738037, 0.0010769814252853394, 0.001110076904296875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 6.0, 6.0, 3.0, 10.0, 17.0, 20.0, 27.0, 45.0, 52.0, 95.0, 141.0, 212.0, 317.0, 487.0, 729.0, 1138.0, 1715.0, 2758.0, 4255.0, 6913.0, 11509.0, 18917.0, 32146.0, 53880.0, 87407.0, 133084.0, 171461.0, 169688.0, 131720.0, 86885.0, 52732.0, 31283.0, 18776.0, 11374.0, 6919.0, 4214.0, 2731.0, 1669.0, 1091.0, 689.0, 456.0, 307.0, 206.0, 156.0, 92.0, 79.0, 42.0, 26.0, 25.0, 18.0, 15.0, 10.0, 4.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-18.71875, -18.094482421875, -17.47021484375, -16.845947265625, -16.2216796875, -15.597412109375, -14.97314453125, -14.348876953125, -13.724609375, -13.100341796875, -12.47607421875, -11.851806640625, -11.2275390625, -10.603271484375, -9.97900390625, -9.354736328125, -8.73046875, -8.106201171875, -7.48193359375, -6.857666015625, -6.2333984375, -5.609130859375, -4.98486328125, -4.360595703125, -3.736328125, -3.112060546875, -2.48779296875, -1.863525390625, -1.2392578125, -0.614990234375, 0.00927734375, 0.633544921875, 1.2578125, 1.882080078125, 2.50634765625, 3.130615234375, 3.7548828125, 4.379150390625, 5.00341796875, 5.627685546875, 6.251953125, 6.876220703125, 7.50048828125, 8.124755859375, 8.7490234375, 9.373291015625, 9.99755859375, 10.621826171875, 11.24609375, 11.870361328125, 12.49462890625, 13.118896484375, 13.7431640625, 14.367431640625, 14.99169921875, 15.615966796875, 16.240234375, 16.864501953125, 17.48876953125, 18.113037109375, 18.7373046875, 19.361572265625, 19.98583984375, 20.610107421875, 21.234375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 2.0, 10.0, 8.0, 10.0, 13.0, 27.0, 28.0, 30.0, 33.0, 44.0, 40.0, 63.0, 60.0, 52.0, 61.0, 63.0, 79.0, 50.0, 36.0, 55.0, 47.0, 31.0, 28.0, 29.0, 28.0, 14.0, 11.0, 11.0, 10.0, 12.0, 6.0, 6.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.65625, -8.380615234375, -8.10498046875, -7.829345703125, -7.5537109375, -7.278076171875, -7.00244140625, -6.726806640625, -6.451171875, -6.175537109375, -5.89990234375, -5.624267578125, -5.3486328125, -5.072998046875, -4.79736328125, -4.521728515625, -4.24609375, -3.970458984375, -3.69482421875, -3.419189453125, -3.1435546875, -2.867919921875, -2.59228515625, -2.316650390625, -2.041015625, -1.765380859375, -1.48974609375, -1.214111328125, -0.9384765625, -0.662841796875, -0.38720703125, -0.111572265625, 0.1640625, 0.439697265625, 0.71533203125, 0.990966796875, 1.2666015625, 1.542236328125, 1.81787109375, 2.093505859375, 2.369140625, 2.644775390625, 2.92041015625, 3.196044921875, 3.4716796875, 3.747314453125, 4.02294921875, 4.298583984375, 4.57421875, 4.849853515625, 5.12548828125, 5.401123046875, 5.6767578125, 5.952392578125, 6.22802734375, 6.503662109375, 6.779296875, 7.054931640625, 7.33056640625, 7.606201171875, 7.8818359375, 8.157470703125, 8.43310546875, 8.708740234375, 8.984375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 3.0, 0.0, 4.0, 7.0, 4.0, 4.0, 10.0, 15.0, 10.0, 13.0, 11.0, 17.0, 20.0, 29.0, 38.0, 31.0, 32.0, 42.0, 43.0, 42.0, 45.0, 59.0, 53.0, 50.0, 50.0, 43.0, 48.0, 34.0, 32.0, 35.0, 33.0, 29.0, 28.0, 18.0, 17.0, 11.0, 12.0, 7.0, 10.0, 8.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.674945831298828, -29.471168518066406, -28.267391204833984, -27.063613891601562, -25.85983657836914, -24.65605926513672, -23.452281951904297, -22.248504638671875, -21.044727325439453, -19.84095001220703, -18.63717269897461, -17.433395385742188, -16.229618072509766, -15.025840759277344, -13.822063446044922, -12.6182861328125, -11.414508819580078, -10.210731506347656, -9.006954193115234, -7.8031768798828125, -6.599399566650391, -5.395622253417969, -4.191844940185547, -2.988067626953125, -1.7842903137207031, -0.5805130004882812, 0.6232643127441406, 1.8270416259765625, 3.0308189392089844, 4.234596252441406, 5.438373565673828, 6.64215087890625, 7.845924377441406, 9.049701690673828, 10.25347900390625, 11.457256317138672, 12.661033630371094, 13.864810943603516, 15.068588256835938, 16.27236557006836, 17.47614288330078, 18.679920196533203, 19.883697509765625, 21.087474822998047, 22.29125213623047, 23.49502944946289, 24.698806762695312, 25.902584075927734, 27.106361389160156, 28.310138702392578, 29.513916015625, 30.717693328857422, 31.921470642089844, 33.125247955322266, 34.32902526855469, 35.53280258178711, 36.73657989501953, 37.94035720825195, 39.144134521484375, 40.3479118347168, 41.55168914794922, 42.75546646118164, 43.95924377441406, 45.163021087646484, 46.366798400878906]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 6.0, 4.0, 12.0, 8.0, 11.0, 22.0, 18.0, 20.0, 19.0, 27.0, 26.0, 36.0, 34.0, 27.0, 39.0, 39.0, 39.0, 40.0, 54.0, 42.0, 53.0, 39.0, 42.0, 46.0, 41.0, 31.0, 33.0, 24.0, 23.0, 15.0, 14.0, 24.0, 26.0, 10.0, 12.0, 9.0, 8.0, 7.0, 8.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.558223724365234, -38.3369255065918, -37.115623474121094, -35.894325256347656, -34.67302322387695, -33.451725006103516, -32.23042297363281, -31.009124755859375, -29.787824630737305, -28.566524505615234, -27.345224380493164, -26.123924255371094, -24.902626037597656, -23.681324005126953, -22.460025787353516, -21.238725662231445, -20.017425537109375, -18.796125411987305, -17.574825286865234, -16.353525161743164, -15.13222599029541, -13.91092586517334, -12.689626693725586, -11.468326568603516, -10.247026443481445, -9.025726318359375, -7.804426670074463, -6.583127021789551, -5.3618268966674805, -4.14052677154541, -2.919227123260498, -1.697927474975586, -0.4766273498535156, 0.7446725368499756, 1.9659724235534668, 3.187272310256958, 4.408572196960449, 5.6298723220825195, 6.851171970367432, 8.072471618652344, 9.293771743774414, 10.515071868896484, 11.736371994018555, 12.957671165466309, 14.178971290588379, 15.40027141571045, 16.621570587158203, 17.842870712280273, 19.064170837402344, 20.285470962524414, 21.506771087646484, 22.728071212768555, 23.949371337890625, 25.170669555664062, 26.391969680786133, 27.613269805908203, 28.834569931030273, 30.055870056152344, 31.277170181274414, 32.498470306396484, 33.71976852416992, 34.941070556640625, 36.16236877441406, 37.3836669921875, 38.6049690246582]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 10.0, 10.0, 28.0, 33.0, 56.0, 117.0, 213.0, 322.0, 550.0, 988.0, 1656.0, 2811.0, 4587.0, 7472.0, 12015.0, 18744.0, 28517.0, 41716.0, 57543.0, 76400.0, 93251.0, 106852.0, 112957.0, 108683.0, 97310.0, 80999.0, 62257.0, 45189.0, 31419.0, 20824.0, 13625.0, 8409.0, 5384.0, 3142.0, 1840.0, 1058.0, 627.0, 386.0, 241.0, 134.0, 85.0, 39.0, 26.0, 17.0, 6.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0], "bins": [-44.21875, -42.9775390625, -41.736328125, -40.4951171875, -39.25390625, -38.0126953125, -36.771484375, -35.5302734375, -34.2890625, -33.0478515625, -31.806640625, -30.5654296875, -29.32421875, -28.0830078125, -26.841796875, -25.6005859375, -24.359375, -23.1181640625, -21.876953125, -20.6357421875, -19.39453125, -18.1533203125, -16.912109375, -15.6708984375, -14.4296875, -13.1884765625, -11.947265625, -10.7060546875, -9.46484375, -8.2236328125, -6.982421875, -5.7412109375, -4.5, -3.2587890625, -2.017578125, -0.7763671875, 0.46484375, 1.7060546875, 2.947265625, 4.1884765625, 5.4296875, 6.6708984375, 7.912109375, 9.1533203125, 10.39453125, 11.6357421875, 12.876953125, 14.1181640625, 15.359375, 16.6005859375, 17.841796875, 19.0830078125, 20.32421875, 21.5654296875, 22.806640625, 24.0478515625, 25.2890625, 26.5302734375, 27.771484375, 29.0126953125, 30.25390625, 31.4951171875, 32.736328125, 33.9775390625, 35.21875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 6.0, 6.0, 10.0, 9.0, 17.0, 17.0, 17.0, 22.0, 19.0, 28.0, 29.0, 35.0, 34.0, 27.0, 40.0, 39.0, 39.0, 40.0, 58.0, 44.0, 49.0, 35.0, 46.0, 49.0, 32.0, 34.0, 30.0, 27.0, 22.0, 14.0, 19.0, 23.0, 20.0, 11.0, 11.0, 9.0, 7.0, 8.0, 11.0, 3.0, 2.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.125, -37.91162109375, -36.6982421875, -35.48486328125, -34.271484375, -33.05810546875, -31.8447265625, -30.63134765625, -29.41796875, -28.20458984375, -26.9912109375, -25.77783203125, -24.564453125, -23.35107421875, -22.1376953125, -20.92431640625, -19.7109375, -18.49755859375, -17.2841796875, -16.07080078125, -14.857421875, -13.64404296875, -12.4306640625, -11.21728515625, -10.00390625, -8.79052734375, -7.5771484375, -6.36376953125, -5.150390625, -3.93701171875, -2.7236328125, -1.51025390625, -0.296875, 0.91650390625, 2.1298828125, 3.34326171875, 4.556640625, 5.77001953125, 6.9833984375, 8.19677734375, 9.41015625, 10.62353515625, 11.8369140625, 13.05029296875, 14.263671875, 15.47705078125, 16.6904296875, 17.90380859375, 19.1171875, 20.33056640625, 21.5439453125, 22.75732421875, 23.970703125, 25.18408203125, 26.3974609375, 27.61083984375, 28.82421875, 30.03759765625, 31.2509765625, 32.46435546875, 33.677734375, 34.89111328125, 36.1044921875, 37.31787109375, 38.53125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 8.0, 12.0, 8.0, 18.0, 36.0, 42.0, 65.0, 112.0, 206.0, 366.0, 590.0, 882.0, 1515.0, 2496.0, 4154.0, 6753.0, 10693.0, 17508.0, 27082.0, 40956.0, 57994.0, 78664.0, 99364.0, 113304.0, 119454.0, 113942.0, 99020.0, 79689.0, 58914.0, 41130.0, 27509.0, 17666.0, 11232.0, 6814.0, 4087.0, 2381.0, 1499.0, 911.0, 546.0, 337.0, 236.0, 135.0, 85.0, 53.0, 40.0, 24.0, 11.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.25, -38.787109375, -37.32421875, -35.861328125, -34.3984375, -32.935546875, -31.47265625, -30.009765625, -28.546875, -27.083984375, -25.62109375, -24.158203125, -22.6953125, -21.232421875, -19.76953125, -18.306640625, -16.84375, -15.380859375, -13.91796875, -12.455078125, -10.9921875, -9.529296875, -8.06640625, -6.603515625, -5.140625, -3.677734375, -2.21484375, -0.751953125, 0.7109375, 2.173828125, 3.63671875, 5.099609375, 6.5625, 8.025390625, 9.48828125, 10.951171875, 12.4140625, 13.876953125, 15.33984375, 16.802734375, 18.265625, 19.728515625, 21.19140625, 22.654296875, 24.1171875, 25.580078125, 27.04296875, 28.505859375, 29.96875, 31.431640625, 32.89453125, 34.357421875, 35.8203125, 37.283203125, 38.74609375, 40.208984375, 41.671875, 43.134765625, 44.59765625, 46.060546875, 47.5234375, 48.986328125, 50.44921875, 51.912109375, 53.375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 3.0, 4.0, 5.0, 4.0, 4.0, 7.0, 10.0, 15.0, 12.0, 11.0, 19.0, 31.0, 22.0, 24.0, 23.0, 42.0, 42.0, 43.0, 39.0, 40.0, 34.0, 44.0, 49.0, 46.0, 42.0, 41.0, 40.0, 37.0, 27.0, 30.0, 27.0, 30.0, 24.0, 24.0, 14.0, 17.0, 15.0, 11.0, 13.0, 10.0, 6.0, 5.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-29.796875, -28.9296875, -28.0625, -27.1953125, -26.328125, -25.4609375, -24.59375, -23.7265625, -22.859375, -21.9921875, -21.125, -20.2578125, -19.390625, -18.5234375, -17.65625, -16.7890625, -15.921875, -15.0546875, -14.1875, -13.3203125, -12.453125, -11.5859375, -10.71875, -9.8515625, -8.984375, -8.1171875, -7.25, -6.3828125, -5.515625, -4.6484375, -3.78125, -2.9140625, -2.046875, -1.1796875, -0.3125, 0.5546875, 1.421875, 2.2890625, 3.15625, 4.0234375, 4.890625, 5.7578125, 6.625, 7.4921875, 8.359375, 9.2265625, 10.09375, 10.9609375, 11.828125, 12.6953125, 13.5625, 14.4296875, 15.296875, 16.1640625, 17.03125, 17.8984375, 18.765625, 19.6328125, 20.5, 21.3671875, 22.234375, 23.1015625, 23.96875, 24.8359375, 25.703125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 9.0, 21.0, 31.0, 44.0, 72.0, 98.0, 146.0, 239.0, 365.0, 519.0, 875.0, 1353.0, 2207.0, 3522.0, 5714.0, 9355.0, 15650.0, 26208.0, 44409.0, 72573.0, 110322.0, 148104.0, 165316.0, 147907.0, 110745.0, 72536.0, 44025.0, 26204.0, 15680.0, 9337.0, 5483.0, 3472.0, 2250.0, 1366.0, 876.0, 583.0, 328.0, 216.0, 142.0, 81.0, 57.0, 42.0, 41.0, 14.0, 5.0, 6.0, 9.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.234375, -18.66015625, -18.0859375, -17.51171875, -16.9375, -16.36328125, -15.7890625, -15.21484375, -14.640625, -14.06640625, -13.4921875, -12.91796875, -12.34375, -11.76953125, -11.1953125, -10.62109375, -10.046875, -9.47265625, -8.8984375, -8.32421875, -7.75, -7.17578125, -6.6015625, -6.02734375, -5.453125, -4.87890625, -4.3046875, -3.73046875, -3.15625, -2.58203125, -2.0078125, -1.43359375, -0.859375, -0.28515625, 0.2890625, 0.86328125, 1.4375, 2.01171875, 2.5859375, 3.16015625, 3.734375, 4.30859375, 4.8828125, 5.45703125, 6.03125, 6.60546875, 7.1796875, 7.75390625, 8.328125, 8.90234375, 9.4765625, 10.05078125, 10.625, 11.19921875, 11.7734375, 12.34765625, 12.921875, 13.49609375, 14.0703125, 14.64453125, 15.21875, 15.79296875, 16.3671875, 16.94140625, 17.515625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 4.0, 7.0, 6.0, 16.0, 8.0, 13.0, 15.0, 29.0, 32.0, 47.0, 39.0, 49.0, 57.0, 67.0, 64.0, 69.0, 82.0, 63.0, 70.0, 56.0, 35.0, 40.0, 34.0, 13.0, 22.0, 15.0, 7.0, 8.0, 4.0, 6.0, 8.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027446746826171875, -0.0026630163192749023, -0.002581357955932617, -0.002499699592590332, -0.002418041229248047, -0.0023363828659057617, -0.0022547245025634766, -0.0021730661392211914, -0.0020914077758789062, -0.002009749412536621, -0.001928091049194336, -0.0018464326858520508, -0.0017647743225097656, -0.0016831159591674805, -0.0016014575958251953, -0.0015197992324829102, -0.001438140869140625, -0.0013564825057983398, -0.0012748241424560547, -0.0011931657791137695, -0.0011115074157714844, -0.0010298490524291992, -0.0009481906890869141, -0.0008665323257446289, -0.0007848739624023438, -0.0007032155990600586, -0.0006215572357177734, -0.0005398988723754883, -0.0004582405090332031, -0.00037658214569091797, -0.0002949237823486328, -0.00021326541900634766, -0.0001316070556640625, -4.9948692321777344e-05, 3.170967102050781e-05, 0.00011336803436279297, 0.00019502639770507812, 0.0002766847610473633, 0.00035834312438964844, 0.0004400014877319336, 0.0005216598510742188, 0.0006033182144165039, 0.0006849765777587891, 0.0007666349411010742, 0.0008482933044433594, 0.0009299516677856445, 0.0010116100311279297, 0.0010932683944702148, 0.0011749267578125, 0.0012565851211547852, 0.0013382434844970703, 0.0014199018478393555, 0.0015015602111816406, 0.0015832185745239258, 0.001664876937866211, 0.001746535301208496, 0.0018281936645507812, 0.0019098520278930664, 0.0019915103912353516, 0.0020731687545776367, 0.002154827117919922, 0.002236485481262207, 0.002318143844604492, 0.0023998022079467773, 0.0024814605712890625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 9.0, 9.0, 8.0, 24.0, 36.0, 46.0, 64.0, 94.0, 152.0, 224.0, 364.0, 541.0, 926.0, 1341.0, 2330.0, 3641.0, 5963.0, 9610.0, 15236.0, 23618.0, 36120.0, 52984.0, 74690.0, 97094.0, 115548.0, 124195.0, 119958.0, 103842.0, 82618.0, 60292.0, 41725.0, 27565.0, 17960.0, 11172.0, 6912.0, 4335.0, 2672.0, 1690.0, 1062.0, 656.0, 421.0, 279.0, 198.0, 114.0, 81.0, 43.0, 40.0, 22.0, 14.0, 12.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-11.4296875, -11.06884765625, -10.7080078125, -10.34716796875, -9.986328125, -9.62548828125, -9.2646484375, -8.90380859375, -8.54296875, -8.18212890625, -7.8212890625, -7.46044921875, -7.099609375, -6.73876953125, -6.3779296875, -6.01708984375, -5.65625, -5.29541015625, -4.9345703125, -4.57373046875, -4.212890625, -3.85205078125, -3.4912109375, -3.13037109375, -2.76953125, -2.40869140625, -2.0478515625, -1.68701171875, -1.326171875, -0.96533203125, -0.6044921875, -0.24365234375, 0.1171875, 0.47802734375, 0.8388671875, 1.19970703125, 1.560546875, 1.92138671875, 2.2822265625, 2.64306640625, 3.00390625, 3.36474609375, 3.7255859375, 4.08642578125, 4.447265625, 4.80810546875, 5.1689453125, 5.52978515625, 5.890625, 6.25146484375, 6.6123046875, 6.97314453125, 7.333984375, 7.69482421875, 8.0556640625, 8.41650390625, 8.77734375, 9.13818359375, 9.4990234375, 9.85986328125, 10.220703125, 10.58154296875, 10.9423828125, 11.30322265625, 11.6640625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 6.0, 7.0, 8.0, 7.0, 13.0, 12.0, 19.0, 22.0, 34.0, 23.0, 29.0, 40.0, 51.0, 51.0, 36.0, 43.0, 54.0, 60.0, 41.0, 56.0, 51.0, 37.0, 46.0, 40.0, 43.0, 23.0, 21.0, 26.0, 25.0, 18.0, 16.0, 20.0, 7.0, 5.0, 3.0, 3.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.51171875, -5.35382080078125, -5.1959228515625, -5.03802490234375, -4.880126953125, -4.72222900390625, -4.5643310546875, -4.40643310546875, -4.24853515625, -4.09063720703125, -3.9327392578125, -3.77484130859375, -3.616943359375, -3.45904541015625, -3.3011474609375, -3.14324951171875, -2.9853515625, -2.82745361328125, -2.6695556640625, -2.51165771484375, -2.353759765625, -2.19586181640625, -2.0379638671875, -1.88006591796875, -1.72216796875, -1.56427001953125, -1.4063720703125, -1.24847412109375, -1.090576171875, -0.93267822265625, -0.7747802734375, -0.61688232421875, -0.458984375, -0.30108642578125, -0.1431884765625, 0.01470947265625, 0.172607421875, 0.33050537109375, 0.4884033203125, 0.64630126953125, 0.80419921875, 0.96209716796875, 1.1199951171875, 1.27789306640625, 1.435791015625, 1.59368896484375, 1.7515869140625, 1.90948486328125, 2.0673828125, 2.22528076171875, 2.3831787109375, 2.54107666015625, 2.698974609375, 2.85687255859375, 3.0147705078125, 3.17266845703125, 3.33056640625, 3.48846435546875, 3.6463623046875, 3.80426025390625, 3.962158203125, 4.12005615234375, 4.2779541015625, 4.43585205078125, 4.59375]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 9.0, 9.0, 9.0, 6.0, 16.0, 10.0, 22.0, 17.0, 24.0, 12.0, 21.0, 32.0, 33.0, 45.0, 38.0, 51.0, 48.0, 51.0, 37.0, 56.0, 53.0, 55.0, 45.0, 42.0, 23.0, 38.0, 41.0, 26.0, 30.0, 15.0, 13.0, 23.0, 16.0, 9.0, 4.0, 1.0, 5.0, 5.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-39.295684814453125, -38.02851104736328, -36.76133728027344, -35.49415969848633, -34.226985931396484, -32.95981216430664, -31.692638397216797, -30.42546272277832, -29.158287048339844, -27.89111328125, -26.623937606811523, -25.35676383972168, -24.089588165283203, -22.82241439819336, -21.555240631103516, -20.28806495666504, -19.020891189575195, -17.75371742248535, -16.486541748046875, -15.219367980957031, -13.952192306518555, -12.685018539428711, -11.41784381866455, -10.15066909790039, -8.88349437713623, -7.61631965637207, -6.34914493560791, -5.081970691680908, -3.814795970916748, -2.547621250152588, -1.280447006225586, -0.013272285461425781, 1.2539024353027344, 2.5210771560668945, 3.7882516384124756, 5.055426120758057, 6.322600841522217, 7.589775562286377, 8.856949806213379, 10.124124526977539, 11.3912992477417, 12.65847396850586, 13.92564868927002, 15.19282341003418, 16.459997177124023, 17.7271728515625, 18.994346618652344, 20.261520385742188, 21.528696060180664, 22.795869827270508, 24.063045501708984, 25.330219268798828, 26.597394943237305, 27.86456871032715, 29.131744384765625, 30.39891815185547, 31.666091918945312, 32.933265686035156, 34.200439453125, 35.46761703491211, 36.73479080200195, 38.0019645690918, 39.26913833618164, 40.53631591796875, 41.803489685058594]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 3.0, 6.0, 8.0, 8.0, 9.0, 12.0, 16.0, 19.0, 23.0, 19.0, 18.0, 24.0, 32.0, 31.0, 34.0, 32.0, 55.0, 47.0, 39.0, 43.0, 48.0, 44.0, 41.0, 39.0, 40.0, 33.0, 37.0, 29.0, 25.0, 22.0, 13.0, 23.0, 29.0, 18.0, 15.0, 16.0, 12.0, 12.0, 7.0, 7.0, 13.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-43.21232986450195, -41.94058609008789, -40.66884231567383, -39.397098541259766, -38.1253547668457, -36.85361099243164, -35.58186721801758, -34.31011962890625, -33.03837585449219, -31.766632080078125, -30.494888305664062, -29.22314453125, -27.951400756835938, -26.679656982421875, -25.40791130065918, -24.136167526245117, -22.864425659179688, -21.592681884765625, -20.320938110351562, -19.0491943359375, -17.777450561523438, -16.505706787109375, -15.23396110534668, -13.962217330932617, -12.690473556518555, -11.418729782104492, -10.14698600769043, -8.87524127960205, -7.603497505187988, -6.331753730773926, -5.060009479522705, -3.7882652282714844, -2.5165176391601562, -1.2447736263275146, 0.026970386505126953, 1.2987143993377686, 2.57045841217041, 3.8422021865844727, 5.113946437835693, 6.385690689086914, 7.657434463500977, 8.929178237915039, 10.200922012329102, 11.47266674041748, 12.744410514831543, 14.016154289245605, 15.287899017333984, 16.559642791748047, 17.83138656616211, 19.103130340576172, 20.374874114990234, 21.646617889404297, 22.91836166381836, 24.190105438232422, 25.461851119995117, 26.73359489440918, 28.005338668823242, 29.277082443237305, 30.548826217651367, 31.82056999206543, 33.092315673828125, 34.36405944824219, 35.63580322265625, 36.90754699707031, 38.179290771484375]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 9.0, 9.0, 13.0, 19.0, 35.0, 76.0, 131.0, 219.0, 347.0, 558.0, 962.0, 1746.0, 3002.0, 5066.0, 8707.0, 14457.0, 25226.0, 42506.0, 71213.0, 117163.0, 187119.0, 285142.0, 404329.0, 517139.0, 576853.0, 551621.0, 454789.0, 333886.0, 225638.0, 143495.0, 89441.0, 53891.0, 32216.0, 19323.0, 11502.0, 6732.0, 4002.0, 2386.0, 1361.0, 782.0, 479.0, 256.0, 181.0, 90.0, 74.0, 39.0, 29.0, 9.0, 6.0, 6.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-38.34375, -37.095703125, -35.84765625, -34.599609375, -33.3515625, -32.103515625, -30.85546875, -29.607421875, -28.359375, -27.111328125, -25.86328125, -24.615234375, -23.3671875, -22.119140625, -20.87109375, -19.623046875, -18.375, -17.126953125, -15.87890625, -14.630859375, -13.3828125, -12.134765625, -10.88671875, -9.638671875, -8.390625, -7.142578125, -5.89453125, -4.646484375, -3.3984375, -2.150390625, -0.90234375, 0.345703125, 1.59375, 2.841796875, 4.08984375, 5.337890625, 6.5859375, 7.833984375, 9.08203125, 10.330078125, 11.578125, 12.826171875, 14.07421875, 15.322265625, 16.5703125, 17.818359375, 19.06640625, 20.314453125, 21.5625, 22.810546875, 24.05859375, 25.306640625, 26.5546875, 27.802734375, 29.05078125, 30.298828125, 31.546875, 32.794921875, 34.04296875, 35.291015625, 36.5390625, 37.787109375, 39.03515625, 40.283203125, 41.53125]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 7.0, 6.0, 8.0, 9.0, 12.0, 15.0, 26.0, 16.0, 15.0, 20.0, 31.0, 32.0, 24.0, 27.0, 40.0, 40.0, 49.0, 38.0, 43.0, 46.0, 50.0, 45.0, 34.0, 41.0, 33.0, 28.0, 39.0, 22.0, 22.0, 21.0, 16.0, 22.0, 21.0, 19.0, 14.0, 19.0, 13.0, 5.0, 6.0, 14.0, 6.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-36.5625, -35.48876953125, -34.4150390625, -33.34130859375, -32.267578125, -31.19384765625, -30.1201171875, -29.04638671875, -27.97265625, -26.89892578125, -25.8251953125, -24.75146484375, -23.677734375, -22.60400390625, -21.5302734375, -20.45654296875, -19.3828125, -18.30908203125, -17.2353515625, -16.16162109375, -15.087890625, -14.01416015625, -12.9404296875, -11.86669921875, -10.79296875, -9.71923828125, -8.6455078125, -7.57177734375, -6.498046875, -5.42431640625, -4.3505859375, -3.27685546875, -2.203125, -1.12939453125, -0.0556640625, 1.01806640625, 2.091796875, 3.16552734375, 4.2392578125, 5.31298828125, 6.38671875, 7.46044921875, 8.5341796875, 9.60791015625, 10.681640625, 11.75537109375, 12.8291015625, 13.90283203125, 14.9765625, 16.05029296875, 17.1240234375, 18.19775390625, 19.271484375, 20.34521484375, 21.4189453125, 22.49267578125, 23.56640625, 24.64013671875, 25.7138671875, 26.78759765625, 27.861328125, 28.93505859375, 30.0087890625, 31.08251953125, 32.15625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 7.0, 7.0, 7.0, 19.0, 27.0, 35.0, 81.0, 126.0, 209.0, 329.0, 607.0, 1034.0, 1900.0, 3254.0, 5663.0, 9877.0, 16935.0, 29989.0, 50216.0, 83502.0, 132754.0, 203915.0, 295524.0, 395609.0, 484120.0, 528167.0, 510359.0, 439919.0, 339167.0, 243350.0, 162280.0, 103057.0, 62627.0, 37711.0, 22261.0, 12744.0, 7252.0, 4128.0, 2382.0, 1337.0, 739.0, 413.0, 262.0, 168.0, 90.0, 54.0, 29.0, 20.0, 14.0, 7.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-39.59375, -38.3837890625, -37.173828125, -35.9638671875, -34.75390625, -33.5439453125, -32.333984375, -31.1240234375, -29.9140625, -28.7041015625, -27.494140625, -26.2841796875, -25.07421875, -23.8642578125, -22.654296875, -21.4443359375, -20.234375, -19.0244140625, -17.814453125, -16.6044921875, -15.39453125, -14.1845703125, -12.974609375, -11.7646484375, -10.5546875, -9.3447265625, -8.134765625, -6.9248046875, -5.71484375, -4.5048828125, -3.294921875, -2.0849609375, -0.875, 0.3349609375, 1.544921875, 2.7548828125, 3.96484375, 5.1748046875, 6.384765625, 7.5947265625, 8.8046875, 10.0146484375, 11.224609375, 12.4345703125, 13.64453125, 14.8544921875, 16.064453125, 17.2744140625, 18.484375, 19.6943359375, 20.904296875, 22.1142578125, 23.32421875, 24.5341796875, 25.744140625, 26.9541015625, 28.1640625, 29.3740234375, 30.583984375, 31.7939453125, 33.00390625, 34.2138671875, 35.423828125, 36.6337890625, 37.84375]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 5.0, 4.0, 7.0, 8.0, 17.0, 17.0, 14.0, 31.0, 32.0, 41.0, 45.0, 53.0, 74.0, 99.0, 107.0, 113.0, 144.0, 139.0, 176.0, 201.0, 176.0, 187.0, 204.0, 201.0, 225.0, 182.0, 207.0, 181.0, 170.0, 161.0, 129.0, 119.0, 120.0, 91.0, 69.0, 67.0, 63.0, 48.0, 34.0, 27.0, 20.0, 20.0, 15.0, 14.0, 6.0, 3.0, 3.0, 4.0, 4.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-16.953125, -16.419677734375, -15.88623046875, -15.352783203125, -14.8193359375, -14.285888671875, -13.75244140625, -13.218994140625, -12.685546875, -12.152099609375, -11.61865234375, -11.085205078125, -10.5517578125, -10.018310546875, -9.48486328125, -8.951416015625, -8.41796875, -7.884521484375, -7.35107421875, -6.817626953125, -6.2841796875, -5.750732421875, -5.21728515625, -4.683837890625, -4.150390625, -3.616943359375, -3.08349609375, -2.550048828125, -2.0166015625, -1.483154296875, -0.94970703125, -0.416259765625, 0.1171875, 0.650634765625, 1.18408203125, 1.717529296875, 2.2509765625, 2.784423828125, 3.31787109375, 3.851318359375, 4.384765625, 4.918212890625, 5.45166015625, 5.985107421875, 6.5185546875, 7.052001953125, 7.58544921875, 8.118896484375, 8.65234375, 9.185791015625, 9.71923828125, 10.252685546875, 10.7861328125, 11.319580078125, 11.85302734375, 12.386474609375, 12.919921875, 13.453369140625, 13.98681640625, 14.520263671875, 15.0537109375, 15.587158203125, 16.12060546875, 16.654052734375, 17.1875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 3.0, 4.0, 12.0, 12.0, 11.0, 7.0, 16.0, 19.0, 13.0, 18.0, 19.0, 33.0, 19.0, 30.0, 33.0, 37.0, 35.0, 47.0, 44.0, 37.0, 44.0, 58.0, 45.0, 41.0, 28.0, 41.0, 30.0, 30.0, 23.0, 23.0, 23.0, 24.0, 23.0, 24.0, 15.0, 12.0, 15.0, 11.0, 10.0, 11.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-33.89326477050781, -32.73695373535156, -31.580642700195312, -30.424331665039062, -29.26801872253418, -28.11170768737793, -26.95539665222168, -25.799083709716797, -24.642772674560547, -23.486461639404297, -22.330150604248047, -21.173839569091797, -20.017526626586914, -18.861215591430664, -17.704904556274414, -16.54859161376953, -15.392282485961914, -14.235971450805664, -13.079659461975098, -11.923348426818848, -10.767036437988281, -9.610725402832031, -8.454414367675781, -7.298102378845215, -6.141791343688965, -4.985479831695557, -3.8291685581207275, -2.6728572845458984, -1.5165457725524902, -0.36023426055908203, 0.796076774597168, 1.9523887634277344, 3.1086997985839844, 4.265011310577393, 5.421322822570801, 6.577633857727051, 7.733945369720459, 8.890256881713867, 10.046567916870117, 11.202879905700684, 12.359190940856934, 13.515501976013184, 14.67181396484375, 15.828125, 16.98443603515625, 18.1407470703125, 19.29705810546875, 20.453371047973633, 21.609682083129883, 22.765993118286133, 23.922304153442383, 25.078617095947266, 26.234928131103516, 27.391239166259766, 28.547550201416016, 29.703861236572266, 30.860172271728516, 32.016483306884766, 33.172794342041016, 34.329105377197266, 35.485416412353516, 36.64173126220703, 37.79804229736328, 38.95435333251953, 40.11066436767578]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 4.0, 4.0, 6.0, 5.0, 4.0, 2.0, 17.0, 12.0, 20.0, 15.0, 15.0, 19.0, 13.0, 25.0, 24.0, 25.0, 33.0, 36.0, 31.0, 24.0, 40.0, 38.0, 33.0, 40.0, 35.0, 40.0, 39.0, 34.0, 30.0, 24.0, 30.0, 35.0, 19.0, 26.0, 24.0, 25.0, 21.0, 16.0, 17.0, 18.0, 10.0, 7.0, 10.0, 5.0, 8.0, 5.0, 10.0, 6.0, 4.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-34.078948974609375, -33.02825164794922, -31.97755241394043, -30.92685317993164, -29.87615394592285, -28.825454711914062, -27.774757385253906, -26.724058151245117, -25.673358917236328, -24.62265968322754, -23.571962356567383, -22.521263122558594, -21.470563888549805, -20.419864654541016, -19.36916732788086, -18.31846809387207, -17.267770767211914, -16.217071533203125, -15.166373252868652, -14.11567497253418, -13.06497573852539, -12.014277458190918, -10.963579177856445, -9.912879943847656, -8.862181663513184, -7.811482906341553, -6.760784149169922, -5.710085868835449, -4.659387111663818, -3.6086883544921875, -2.557990074157715, -1.507291316986084, -0.4565925598144531, 0.5941060781478882, 1.6448047161102295, 2.6955032348632812, 3.746201992034912, 4.796900749206543, 5.847599029541016, 6.8982977867126465, 7.948996543884277, 8.99969482421875, 10.050394058227539, 11.101092338562012, 12.151790618896484, 13.202489852905273, 14.253188133239746, 15.303886413574219, 16.354585647583008, 17.405284881591797, 18.455982208251953, 19.506681442260742, 20.55738067626953, 21.608078002929688, 22.658777236938477, 23.709476470947266, 24.760173797607422, 25.81087303161621, 26.861570358276367, 27.912269592285156, 28.962968826293945, 30.013668060302734, 31.06436538696289, 32.11506271362305, 33.16576385498047]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 9.0, 7.0, 15.0, 17.0, 13.0, 41.0, 52.0, 72.0, 102.0, 171.0, 284.0, 423.0, 745.0, 1428.0, 2532.0, 4776.0, 8666.0, 16604.0, 31564.0, 57895.0, 103174.0, 163499.0, 203724.0, 179943.0, 121201.0, 70118.0, 37642.0, 20188.0, 10728.0, 5727.0, 3089.0, 1672.0, 1000.0, 528.0, 317.0, 208.0, 114.0, 95.0, 45.0, 48.0, 26.0, 20.0, 13.0, 9.0, 5.0, 4.0, 1.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0], "bins": [-48.9375, -47.4833984375, -46.029296875, -44.5751953125, -43.12109375, -41.6669921875, -40.212890625, -38.7587890625, -37.3046875, -35.8505859375, -34.396484375, -32.9423828125, -31.48828125, -30.0341796875, -28.580078125, -27.1259765625, -25.671875, -24.2177734375, -22.763671875, -21.3095703125, -19.85546875, -18.4013671875, -16.947265625, -15.4931640625, -14.0390625, -12.5849609375, -11.130859375, -9.6767578125, -8.22265625, -6.7685546875, -5.314453125, -3.8603515625, -2.40625, -0.9521484375, 0.501953125, 1.9560546875, 3.41015625, 4.8642578125, 6.318359375, 7.7724609375, 9.2265625, 10.6806640625, 12.134765625, 13.5888671875, 15.04296875, 16.4970703125, 17.951171875, 19.4052734375, 20.859375, 22.3134765625, 23.767578125, 25.2216796875, 26.67578125, 28.1298828125, 29.583984375, 31.0380859375, 32.4921875, 33.9462890625, 35.400390625, 36.8544921875, 38.30859375, 39.7626953125, 41.216796875, 42.6708984375, 44.125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 6.0, 3.0, 7.0, 3.0, 6.0, 5.0, 1.0, 14.0, 11.0, 22.0, 11.0, 17.0, 21.0, 17.0, 17.0, 29.0, 23.0, 32.0, 33.0, 22.0, 37.0, 35.0, 40.0, 34.0, 36.0, 31.0, 48.0, 33.0, 34.0, 34.0, 28.0, 29.0, 31.0, 26.0, 20.0, 29.0, 21.0, 20.0, 22.0, 11.0, 20.0, 9.0, 13.0, 6.0, 8.0, 8.0, 5.0, 10.0, 5.0, 6.0, 5.0, 5.0, 5.0, 3.0, 1.0, 0.0, 3.0], "bins": [-34.46875, -33.41259765625, -32.3564453125, -31.30029296875, -30.244140625, -29.18798828125, -28.1318359375, -27.07568359375, -26.01953125, -24.96337890625, -23.9072265625, -22.85107421875, -21.794921875, -20.73876953125, -19.6826171875, -18.62646484375, -17.5703125, -16.51416015625, -15.4580078125, -14.40185546875, -13.345703125, -12.28955078125, -11.2333984375, -10.17724609375, -9.12109375, -8.06494140625, -7.0087890625, -5.95263671875, -4.896484375, -3.84033203125, -2.7841796875, -1.72802734375, -0.671875, 0.38427734375, 1.4404296875, 2.49658203125, 3.552734375, 4.60888671875, 5.6650390625, 6.72119140625, 7.77734375, 8.83349609375, 9.8896484375, 10.94580078125, 12.001953125, 13.05810546875, 14.1142578125, 15.17041015625, 16.2265625, 17.28271484375, 18.3388671875, 19.39501953125, 20.451171875, 21.50732421875, 22.5634765625, 23.61962890625, 24.67578125, 25.73193359375, 26.7880859375, 27.84423828125, 28.900390625, 29.95654296875, 31.0126953125, 32.06884765625, 33.125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 8.0, 7.0, 16.0, 19.0, 16.0, 30.0, 27.0, 47.0, 62.0, 72.0, 98.0, 140.0, 178.0, 219.0, 319.0, 473.0, 738.0, 1066.0, 1746.0, 2914.0, 5169.0, 9344.0, 18361.0, 37894.0, 84895.0, 185909.0, 293098.0, 214913.0, 100114.0, 44131.0, 20948.0, 10668.0, 5813.0, 3344.0, 1924.0, 1207.0, 778.0, 555.0, 355.0, 245.0, 182.0, 155.0, 87.0, 70.0, 53.0, 42.0, 23.0, 14.0, 13.0, 16.0, 12.0, 8.0, 8.0, 5.0, 5.0, 3.0, 2.0, 1.0], "bins": [-50.71875, -49.1630859375, -47.607421875, -46.0517578125, -44.49609375, -42.9404296875, -41.384765625, -39.8291015625, -38.2734375, -36.7177734375, -35.162109375, -33.6064453125, -32.05078125, -30.4951171875, -28.939453125, -27.3837890625, -25.828125, -24.2724609375, -22.716796875, -21.1611328125, -19.60546875, -18.0498046875, -16.494140625, -14.9384765625, -13.3828125, -11.8271484375, -10.271484375, -8.7158203125, -7.16015625, -5.6044921875, -4.048828125, -2.4931640625, -0.9375, 0.6181640625, 2.173828125, 3.7294921875, 5.28515625, 6.8408203125, 8.396484375, 9.9521484375, 11.5078125, 13.0634765625, 14.619140625, 16.1748046875, 17.73046875, 19.2861328125, 20.841796875, 22.3974609375, 23.953125, 25.5087890625, 27.064453125, 28.6201171875, 30.17578125, 31.7314453125, 33.287109375, 34.8427734375, 36.3984375, 37.9541015625, 39.509765625, 41.0654296875, 42.62109375, 44.1767578125, 45.732421875, 47.2880859375, 48.84375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 11.0, 3.0, 7.0, 9.0, 12.0, 11.0, 15.0, 16.0, 16.0, 18.0, 15.0, 20.0, 27.0, 13.0, 25.0, 35.0, 33.0, 33.0, 34.0, 42.0, 39.0, 32.0, 36.0, 42.0, 37.0, 47.0, 38.0, 29.0, 28.0, 28.0, 29.0, 38.0, 23.0, 15.0, 22.0, 20.0, 13.0, 12.0, 15.0, 10.0, 15.0, 10.0, 6.0, 3.0, 6.0, 1.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-22.59375, -21.875732421875, -21.15771484375, -20.439697265625, -19.7216796875, -19.003662109375, -18.28564453125, -17.567626953125, -16.849609375, -16.131591796875, -15.41357421875, -14.695556640625, -13.9775390625, -13.259521484375, -12.54150390625, -11.823486328125, -11.10546875, -10.387451171875, -9.66943359375, -8.951416015625, -8.2333984375, -7.515380859375, -6.79736328125, -6.079345703125, -5.361328125, -4.643310546875, -3.92529296875, -3.207275390625, -2.4892578125, -1.771240234375, -1.05322265625, -0.335205078125, 0.3828125, 1.100830078125, 1.81884765625, 2.536865234375, 3.2548828125, 3.972900390625, 4.69091796875, 5.408935546875, 6.126953125, 6.844970703125, 7.56298828125, 8.281005859375, 8.9990234375, 9.717041015625, 10.43505859375, 11.153076171875, 11.87109375, 12.589111328125, 13.30712890625, 14.025146484375, 14.7431640625, 15.461181640625, 16.17919921875, 16.897216796875, 17.615234375, 18.333251953125, 19.05126953125, 19.769287109375, 20.4873046875, 21.205322265625, 21.92333984375, 22.641357421875, 23.359375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 6.0, 4.0, 11.0, 5.0, 11.0, 20.0, 29.0, 47.0, 58.0, 78.0, 113.0, 180.0, 266.0, 363.0, 585.0, 914.0, 1487.0, 2397.0, 4015.0, 7101.0, 12955.0, 25007.0, 51051.0, 108887.0, 221186.0, 279226.0, 171002.0, 80018.0, 38047.0, 19174.0, 9949.0, 5683.0, 3171.0, 2007.0, 1185.0, 780.0, 507.0, 358.0, 219.0, 126.0, 92.0, 77.0, 42.0, 43.0, 21.0, 21.0, 10.0, 14.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.75, -16.2314453125, -15.712890625, -15.1943359375, -14.67578125, -14.1572265625, -13.638671875, -13.1201171875, -12.6015625, -12.0830078125, -11.564453125, -11.0458984375, -10.52734375, -10.0087890625, -9.490234375, -8.9716796875, -8.453125, -7.9345703125, -7.416015625, -6.8974609375, -6.37890625, -5.8603515625, -5.341796875, -4.8232421875, -4.3046875, -3.7861328125, -3.267578125, -2.7490234375, -2.23046875, -1.7119140625, -1.193359375, -0.6748046875, -0.15625, 0.3623046875, 0.880859375, 1.3994140625, 1.91796875, 2.4365234375, 2.955078125, 3.4736328125, 3.9921875, 4.5107421875, 5.029296875, 5.5478515625, 6.06640625, 6.5849609375, 7.103515625, 7.6220703125, 8.140625, 8.6591796875, 9.177734375, 9.6962890625, 10.21484375, 10.7333984375, 11.251953125, 11.7705078125, 12.2890625, 12.8076171875, 13.326171875, 13.8447265625, 14.36328125, 14.8818359375, 15.400390625, 15.9189453125, 16.4375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 6.0, 4.0, 4.0, 6.0, 9.0, 7.0, 10.0, 14.0, 13.0, 15.0, 18.0, 27.0, 39.0, 41.0, 47.0, 46.0, 38.0, 54.0, 61.0, 62.0, 74.0, 66.0, 62.0, 44.0, 32.0, 41.0, 29.0, 25.0, 24.0, 19.0, 18.0, 9.0, 3.0, 7.0, 5.0, 1.0, 10.0, 2.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0009183883666992188, -0.0008790194988250732, -0.0008396506309509277, -0.0008002817630767822, -0.0007609128952026367, -0.0007215440273284912, -0.0006821751594543457, -0.0006428062915802002, -0.0006034374237060547, -0.0005640685558319092, -0.0005246996879577637, -0.00048533082008361816, -0.00044596195220947266, -0.00040659308433532715, -0.00036722421646118164, -0.00032785534858703613, -0.0002884864807128906, -0.0002491176128387451, -0.0002097487449645996, -0.0001703798770904541, -0.0001310110092163086, -9.164214134216309e-05, -5.227327346801758e-05, -1.290440559387207e-05, 2.6464462280273438e-05, 6.583333015441895e-05, 0.00010520219802856445, 0.00014457106590270996, 0.00018393993377685547, 0.00022330880165100098, 0.0002626776695251465, 0.000302046537399292, 0.0003414154052734375, 0.000380784273147583, 0.0004201531410217285, 0.000459522008895874, 0.0004988908767700195, 0.000538259744644165, 0.0005776286125183105, 0.0006169974803924561, 0.0006563663482666016, 0.0006957352161407471, 0.0007351040840148926, 0.0007744729518890381, 0.0008138418197631836, 0.0008532106876373291, 0.0008925795555114746, 0.0009319484233856201, 0.0009713172912597656, 0.0010106861591339111, 0.0010500550270080566, 0.0010894238948822021, 0.0011287927627563477, 0.0011681616306304932, 0.0012075304985046387, 0.0012468993663787842, 0.0012862682342529297, 0.0013256371021270752, 0.0013650059700012207, 0.0014043748378753662, 0.0014437437057495117, 0.0014831125736236572, 0.0015224814414978027, 0.0015618503093719482, 0.0016012191772460938]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 0.0, 8.0, 16.0, 12.0, 20.0, 25.0, 43.0, 56.0, 76.0, 146.0, 207.0, 288.0, 408.0, 561.0, 824.0, 1260.0, 1827.0, 2693.0, 4102.0, 6087.0, 9307.0, 13802.0, 20975.0, 32175.0, 48238.0, 70709.0, 98532.0, 125026.0, 137582.0, 130282.0, 105485.0, 78175.0, 53705.0, 35858.0, 23403.0, 15613.0, 10330.0, 6822.0, 4404.0, 3044.0, 2019.0, 1385.0, 946.0, 648.0, 414.0, 319.0, 226.0, 145.0, 109.0, 75.0, 45.0, 40.0, 19.0, 18.0, 9.0, 9.0, 5.0, 6.0, 3.0], "bins": [-15.125, -14.67529296875, -14.2255859375, -13.77587890625, -13.326171875, -12.87646484375, -12.4267578125, -11.97705078125, -11.52734375, -11.07763671875, -10.6279296875, -10.17822265625, -9.728515625, -9.27880859375, -8.8291015625, -8.37939453125, -7.9296875, -7.47998046875, -7.0302734375, -6.58056640625, -6.130859375, -5.68115234375, -5.2314453125, -4.78173828125, -4.33203125, -3.88232421875, -3.4326171875, -2.98291015625, -2.533203125, -2.08349609375, -1.6337890625, -1.18408203125, -0.734375, -0.28466796875, 0.1650390625, 0.61474609375, 1.064453125, 1.51416015625, 1.9638671875, 2.41357421875, 2.86328125, 3.31298828125, 3.7626953125, 4.21240234375, 4.662109375, 5.11181640625, 5.5615234375, 6.01123046875, 6.4609375, 6.91064453125, 7.3603515625, 7.81005859375, 8.259765625, 8.70947265625, 9.1591796875, 9.60888671875, 10.05859375, 10.50830078125, 10.9580078125, 11.40771484375, 11.857421875, 12.30712890625, 12.7568359375, 13.20654296875, 13.65625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 4.0, 10.0, 9.0, 12.0, 13.0, 14.0, 21.0, 15.0, 23.0, 24.0, 26.0, 25.0, 31.0, 37.0, 45.0, 46.0, 38.0, 46.0, 37.0, 38.0, 47.0, 41.0, 43.0, 40.0, 36.0, 31.0, 30.0, 33.0, 32.0, 22.0, 27.0, 16.0, 21.0, 10.0, 11.0, 13.0, 11.0, 7.0, 3.0, 4.0, 5.0, 5.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.44921875, -5.2933349609375, -5.137451171875, -4.9815673828125, -4.82568359375, -4.6697998046875, -4.513916015625, -4.3580322265625, -4.2021484375, -4.0462646484375, -3.890380859375, -3.7344970703125, -3.57861328125, -3.4227294921875, -3.266845703125, -3.1109619140625, -2.955078125, -2.7991943359375, -2.643310546875, -2.4874267578125, -2.33154296875, -2.1756591796875, -2.019775390625, -1.8638916015625, -1.7080078125, -1.5521240234375, -1.396240234375, -1.2403564453125, -1.08447265625, -0.9285888671875, -0.772705078125, -0.6168212890625, -0.4609375, -0.3050537109375, -0.149169921875, 0.0067138671875, 0.16259765625, 0.3184814453125, 0.474365234375, 0.6302490234375, 0.7861328125, 0.9420166015625, 1.097900390625, 1.2537841796875, 1.40966796875, 1.5655517578125, 1.721435546875, 1.8773193359375, 2.033203125, 2.1890869140625, 2.344970703125, 2.5008544921875, 2.65673828125, 2.8126220703125, 2.968505859375, 3.1243896484375, 3.2802734375, 3.4361572265625, 3.592041015625, 3.7479248046875, 3.90380859375, 4.0596923828125, 4.215576171875, 4.3714599609375, 4.52734375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 3.0, 6.0, 3.0, 12.0, 10.0, 11.0, 11.0, 9.0, 22.0, 17.0, 17.0, 16.0, 21.0, 27.0, 25.0, 32.0, 42.0, 47.0, 50.0, 44.0, 57.0, 43.0, 51.0, 53.0, 33.0, 46.0, 21.0, 35.0, 23.0, 27.0, 13.0, 25.0, 20.0, 23.0, 17.0, 18.0, 13.0, 8.0, 18.0, 9.0, 7.0, 2.0, 8.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-37.495628356933594, -36.27681350708008, -35.05799865722656, -33.83917999267578, -32.620365142822266, -31.40155029296875, -30.1827335357666, -28.963916778564453, -27.745101928710938, -26.526287078857422, -25.307470321655273, -24.088653564453125, -22.86983871459961, -21.651023864746094, -20.432207107543945, -19.213390350341797, -17.99457550048828, -16.775760650634766, -15.556943893432617, -14.338128089904785, -13.119312286376953, -11.900496482849121, -10.681680679321289, -9.462864875793457, -8.244049072265625, -7.025233268737793, -5.806417465209961, -4.587601661682129, -3.368785858154297, -2.149970054626465, -0.9311542510986328, 0.2876615524291992, 1.5064773559570312, 2.7252931594848633, 3.9441089630126953, 5.162924766540527, 6.381740570068359, 7.600556373596191, 8.819372177124023, 10.038187980651855, 11.257003784179688, 12.47581958770752, 13.694635391235352, 14.913451194763184, 16.132266998291016, 17.35108184814453, 18.56989860534668, 19.788715362548828, 21.007530212402344, 22.22634506225586, 23.445161819458008, 24.663978576660156, 25.882793426513672, 27.101608276367188, 28.320425033569336, 29.539241790771484, 30.758056640625, 31.976871490478516, 33.19568634033203, 34.41450500488281, 35.63331985473633, 36.852134704589844, 38.070953369140625, 39.28976821899414, 40.508583068847656]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 4.0, 2.0, 4.0, 4.0, 8.0, 4.0, 9.0, 4.0, 11.0, 21.0, 18.0, 18.0, 15.0, 23.0, 21.0, 18.0, 27.0, 33.0, 37.0, 32.0, 34.0, 38.0, 46.0, 35.0, 34.0, 38.0, 40.0, 32.0, 39.0, 26.0, 33.0, 37.0, 22.0, 26.0, 22.0, 25.0, 24.0, 22.0, 22.0, 13.0, 8.0, 11.0, 9.0, 7.0, 7.0, 6.0, 10.0, 8.0, 4.0, 8.0, 1.0, 6.0, 1.0, 0.0, 3.0, 1.0], "bins": [-36.65275573730469, -35.549339294433594, -34.445926666259766, -33.34251022338867, -32.23909378051758, -31.135679244995117, -30.032264709472656, -28.928848266601562, -27.82543182373047, -26.722017288208008, -25.618600845336914, -24.515186309814453, -23.41176986694336, -22.3083553314209, -21.204940795898438, -20.101524353027344, -18.998109817504883, -17.894695281982422, -16.791278839111328, -15.687864303588867, -14.584447860717773, -13.481033325195312, -12.377617835998535, -11.274202346801758, -10.17078685760498, -9.067371368408203, -7.963955879211426, -6.860540866851807, -5.757125377655029, -4.653709888458252, -3.550294876098633, -2.4468793869018555, -1.3434638977050781, -0.24004852771759033, 0.8633668422698975, 1.9667820930480957, 3.070197582244873, 4.17361307144165, 5.2770280838012695, 6.380443572998047, 7.483859062194824, 8.587274551391602, 9.690690040588379, 10.794105529785156, 11.897520065307617, 13.000936508178711, 14.104351043701172, 15.20776653289795, 16.311182022094727, 17.414596557617188, 18.51801300048828, 19.621427536010742, 20.724843978881836, 21.828258514404297, 22.93167495727539, 24.03508949279785, 25.138504028320312, 26.241918563842773, 27.345335006713867, 28.448749542236328, 29.552165985107422, 30.655580520629883, 31.758995056152344, 32.86241149902344, 33.96582794189453]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 12.0, 8.0, 14.0, 29.0, 37.0, 65.0, 122.0, 180.0, 277.0, 484.0, 791.0, 1404.0, 2427.0, 3885.0, 6419.0, 10394.0, 16748.0, 25977.0, 38873.0, 54763.0, 73815.0, 92391.0, 107035.0, 114552.0, 112133.0, 101452.0, 83856.0, 64446.0, 47257.0, 32588.0, 21081.0, 13694.0, 8499.0, 5274.0, 2969.0, 1811.0, 1134.0, 669.0, 409.0, 216.0, 133.0, 90.0, 49.0, 36.0, 29.0, 7.0, 9.0, 5.0, 1.0, 1.0, 5.0, 2.0, 3.0], "bins": [-45.28125, -43.97900390625, -42.6767578125, -41.37451171875, -40.072265625, -38.77001953125, -37.4677734375, -36.16552734375, -34.86328125, -33.56103515625, -32.2587890625, -30.95654296875, -29.654296875, -28.35205078125, -27.0498046875, -25.74755859375, -24.4453125, -23.14306640625, -21.8408203125, -20.53857421875, -19.236328125, -17.93408203125, -16.6318359375, -15.32958984375, -14.02734375, -12.72509765625, -11.4228515625, -10.12060546875, -8.818359375, -7.51611328125, -6.2138671875, -4.91162109375, -3.609375, -2.30712890625, -1.0048828125, 0.29736328125, 1.599609375, 2.90185546875, 4.2041015625, 5.50634765625, 6.80859375, 8.11083984375, 9.4130859375, 10.71533203125, 12.017578125, 13.31982421875, 14.6220703125, 15.92431640625, 17.2265625, 18.52880859375, 19.8310546875, 21.13330078125, 22.435546875, 23.73779296875, 25.0400390625, 26.34228515625, 27.64453125, 28.94677734375, 30.2490234375, 31.55126953125, 32.853515625, 34.15576171875, 35.4580078125, 36.76025390625, 38.0625]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 4.0, 2.0, 4.0, 3.0, 7.0, 5.0, 4.0, 9.0, 8.0, 14.0, 23.0, 18.0, 12.0, 29.0, 15.0, 19.0, 20.0, 36.0, 33.0, 29.0, 38.0, 31.0, 49.0, 36.0, 32.0, 38.0, 35.0, 38.0, 37.0, 34.0, 27.0, 32.0, 31.0, 25.0, 27.0, 19.0, 26.0, 24.0, 23.0, 19.0, 10.0, 9.0, 12.0, 7.0, 8.0, 6.0, 10.0, 7.0, 6.0, 5.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-34.71875, -33.66064453125, -32.6025390625, -31.54443359375, -30.486328125, -29.42822265625, -28.3701171875, -27.31201171875, -26.25390625, -25.19580078125, -24.1376953125, -23.07958984375, -22.021484375, -20.96337890625, -19.9052734375, -18.84716796875, -17.7890625, -16.73095703125, -15.6728515625, -14.61474609375, -13.556640625, -12.49853515625, -11.4404296875, -10.38232421875, -9.32421875, -8.26611328125, -7.2080078125, -6.14990234375, -5.091796875, -4.03369140625, -2.9755859375, -1.91748046875, -0.859375, 0.19873046875, 1.2568359375, 2.31494140625, 3.373046875, 4.43115234375, 5.4892578125, 6.54736328125, 7.60546875, 8.66357421875, 9.7216796875, 10.77978515625, 11.837890625, 12.89599609375, 13.9541015625, 15.01220703125, 16.0703125, 17.12841796875, 18.1865234375, 19.24462890625, 20.302734375, 21.36083984375, 22.4189453125, 23.47705078125, 24.53515625, 25.59326171875, 26.6513671875, 27.70947265625, 28.767578125, 29.82568359375, 30.8837890625, 31.94189453125, 33.0]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 13.0, 20.0, 20.0, 36.0, 58.0, 90.0, 133.0, 207.0, 377.0, 606.0, 1040.0, 1644.0, 2949.0, 5125.0, 9014.0, 15421.0, 25970.0, 42304.0, 64453.0, 90587.0, 117230.0, 133666.0, 135484.0, 121120.0, 95656.0, 69629.0, 46030.0, 28711.0, 17347.0, 10016.0, 5684.0, 3308.0, 1873.0, 1051.0, 666.0, 373.0, 223.0, 159.0, 93.0, 65.0, 34.0, 35.0, 10.0, 16.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.6875, -49.00341796875, -47.3193359375, -45.63525390625, -43.951171875, -42.26708984375, -40.5830078125, -38.89892578125, -37.21484375, -35.53076171875, -33.8466796875, -32.16259765625, -30.478515625, -28.79443359375, -27.1103515625, -25.42626953125, -23.7421875, -22.05810546875, -20.3740234375, -18.68994140625, -17.005859375, -15.32177734375, -13.6376953125, -11.95361328125, -10.26953125, -8.58544921875, -6.9013671875, -5.21728515625, -3.533203125, -1.84912109375, -0.1650390625, 1.51904296875, 3.203125, 4.88720703125, 6.5712890625, 8.25537109375, 9.939453125, 11.62353515625, 13.3076171875, 14.99169921875, 16.67578125, 18.35986328125, 20.0439453125, 21.72802734375, 23.412109375, 25.09619140625, 26.7802734375, 28.46435546875, 30.1484375, 31.83251953125, 33.5166015625, 35.20068359375, 36.884765625, 38.56884765625, 40.2529296875, 41.93701171875, 43.62109375, 45.30517578125, 46.9892578125, 48.67333984375, 50.357421875, 52.04150390625, 53.7255859375, 55.40966796875, 57.09375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 7.0, 5.0, 11.0, 9.0, 7.0, 13.0, 14.0, 8.0, 20.0, 17.0, 22.0, 24.0, 27.0, 34.0, 42.0, 26.0, 42.0, 41.0, 37.0, 43.0, 37.0, 24.0, 47.0, 27.0, 45.0, 36.0, 34.0, 35.0, 30.0, 37.0, 31.0, 24.0, 17.0, 24.0, 21.0, 13.0, 14.0, 14.0, 8.0, 13.0, 10.0, 7.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-27.421875, -26.603759765625, -25.78564453125, -24.967529296875, -24.1494140625, -23.331298828125, -22.51318359375, -21.695068359375, -20.876953125, -20.058837890625, -19.24072265625, -18.422607421875, -17.6044921875, -16.786376953125, -15.96826171875, -15.150146484375, -14.33203125, -13.513916015625, -12.69580078125, -11.877685546875, -11.0595703125, -10.241455078125, -9.42333984375, -8.605224609375, -7.787109375, -6.968994140625, -6.15087890625, -5.332763671875, -4.5146484375, -3.696533203125, -2.87841796875, -2.060302734375, -1.2421875, -0.424072265625, 0.39404296875, 1.212158203125, 2.0302734375, 2.848388671875, 3.66650390625, 4.484619140625, 5.302734375, 6.120849609375, 6.93896484375, 7.757080078125, 8.5751953125, 9.393310546875, 10.21142578125, 11.029541015625, 11.84765625, 12.665771484375, 13.48388671875, 14.302001953125, 15.1201171875, 15.938232421875, 16.75634765625, 17.574462890625, 18.392578125, 19.210693359375, 20.02880859375, 20.846923828125, 21.6650390625, 22.483154296875, 23.30126953125, 24.119384765625, 24.9375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 7.0, 4.0, 8.0, 12.0, 33.0, 49.0, 67.0, 88.0, 127.0, 207.0, 301.0, 431.0, 667.0, 1026.0, 1527.0, 2433.0, 3805.0, 6156.0, 9785.0, 16064.0, 26127.0, 41775.0, 63815.0, 92129.0, 120363.0, 138235.0, 139225.0, 119412.0, 91532.0, 63695.0, 41228.0, 25659.0, 15796.0, 9758.0, 6164.0, 3729.0, 2456.0, 1590.0, 1024.0, 675.0, 457.0, 289.0, 224.0, 129.0, 89.0, 70.0, 42.0, 27.0, 13.0, 13.0, 10.0, 11.0, 4.0, 0.0, 1.0, 2.0], "bins": [-17.0, -16.4998779296875, -15.999755859375, -15.4996337890625, -14.99951171875, -14.4993896484375, -13.999267578125, -13.4991455078125, -12.9990234375, -12.4989013671875, -11.998779296875, -11.4986572265625, -10.99853515625, -10.4984130859375, -9.998291015625, -9.4981689453125, -8.998046875, -8.4979248046875, -7.997802734375, -7.4976806640625, -6.99755859375, -6.4974365234375, -5.997314453125, -5.4971923828125, -4.9970703125, -4.4969482421875, -3.996826171875, -3.4967041015625, -2.99658203125, -2.4964599609375, -1.996337890625, -1.4962158203125, -0.99609375, -0.4959716796875, 0.004150390625, 0.5042724609375, 1.00439453125, 1.5045166015625, 2.004638671875, 2.5047607421875, 3.0048828125, 3.5050048828125, 4.005126953125, 4.5052490234375, 5.00537109375, 5.5054931640625, 6.005615234375, 6.5057373046875, 7.005859375, 7.5059814453125, 8.006103515625, 8.5062255859375, 9.00634765625, 9.5064697265625, 10.006591796875, 10.5067138671875, 11.0068359375, 11.5069580078125, 12.007080078125, 12.5072021484375, 13.00732421875, 13.5074462890625, 14.007568359375, 14.5076904296875, 15.0078125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 3.0, 6.0, 6.0, 7.0, 11.0, 15.0, 10.0, 21.0, 33.0, 27.0, 29.0, 38.0, 45.0, 60.0, 46.0, 58.0, 79.0, 75.0, 55.0, 62.0, 71.0, 59.0, 35.0, 39.0, 20.0, 19.0, 14.0, 23.0, 9.0, 5.0, 8.0, 6.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.002964019775390625, -0.002888202667236328, -0.0028123855590820312, -0.0027365684509277344, -0.0026607513427734375, -0.0025849342346191406, -0.0025091171264648438, -0.002433300018310547, -0.00235748291015625, -0.002281665802001953, -0.0022058486938476562, -0.0021300315856933594, -0.0020542144775390625, -0.0019783973693847656, -0.0019025802612304688, -0.0018267631530761719, -0.001750946044921875, -0.0016751289367675781, -0.0015993118286132812, -0.0015234947204589844, -0.0014476776123046875, -0.0013718605041503906, -0.0012960433959960938, -0.0012202262878417969, -0.0011444091796875, -0.0010685920715332031, -0.0009927749633789062, -0.0009169578552246094, -0.0008411407470703125, -0.0007653236389160156, -0.0006895065307617188, -0.0006136894226074219, -0.000537872314453125, -0.0004620552062988281, -0.00038623809814453125, -0.0003104209899902344, -0.0002346038818359375, -0.00015878677368164062, -8.296966552734375e-05, -7.152557373046875e-06, 6.866455078125e-05, 0.00014448165893554688, 0.00022029876708984375, 0.0002961158752441406, 0.0003719329833984375, 0.0004477500915527344, 0.0005235671997070312, 0.0005993843078613281, 0.000675201416015625, 0.0007510185241699219, 0.0008268356323242188, 0.0009026527404785156, 0.0009784698486328125, 0.0010542869567871094, 0.0011301040649414062, 0.0012059211730957031, 0.00128173828125, 0.0013575553894042969, 0.0014333724975585938, 0.0015091896057128906, 0.0015850067138671875, 0.0016608238220214844, 0.0017366409301757812, 0.0018124580383300781, 0.001888275146484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 6.0, 6.0, 12.0, 14.0, 19.0, 39.0, 36.0, 56.0, 73.0, 124.0, 162.0, 237.0, 356.0, 541.0, 773.0, 1220.0, 2012.0, 3394.0, 5831.0, 10434.0, 19373.0, 34303.0, 58626.0, 93085.0, 129575.0, 156809.0, 158591.0, 133104.0, 95232.0, 61246.0, 36302.0, 20109.0, 11073.0, 6309.0, 3538.0, 2074.0, 1270.0, 874.0, 555.0, 374.0, 243.0, 161.0, 112.0, 101.0, 59.0, 31.0, 31.0, 21.0, 9.0, 11.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.53125, -16.984130859375, -16.43701171875, -15.889892578125, -15.3427734375, -14.795654296875, -14.24853515625, -13.701416015625, -13.154296875, -12.607177734375, -12.06005859375, -11.512939453125, -10.9658203125, -10.418701171875, -9.87158203125, -9.324462890625, -8.77734375, -8.230224609375, -7.68310546875, -7.135986328125, -6.5888671875, -6.041748046875, -5.49462890625, -4.947509765625, -4.400390625, -3.853271484375, -3.30615234375, -2.759033203125, -2.2119140625, -1.664794921875, -1.11767578125, -0.570556640625, -0.0234375, 0.523681640625, 1.07080078125, 1.617919921875, 2.1650390625, 2.712158203125, 3.25927734375, 3.806396484375, 4.353515625, 4.900634765625, 5.44775390625, 5.994873046875, 6.5419921875, 7.089111328125, 7.63623046875, 8.183349609375, 8.73046875, 9.277587890625, 9.82470703125, 10.371826171875, 10.9189453125, 11.466064453125, 12.01318359375, 12.560302734375, 13.107421875, 13.654541015625, 14.20166015625, 14.748779296875, 15.2958984375, 15.843017578125, 16.39013671875, 16.937255859375, 17.484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 7.0, 5.0, 13.0, 21.0, 15.0, 30.0, 24.0, 30.0, 46.0, 39.0, 38.0, 45.0, 54.0, 39.0, 55.0, 39.0, 54.0, 48.0, 59.0, 48.0, 44.0, 37.0, 39.0, 23.0, 28.0, 22.0, 13.0, 17.0, 9.0, 14.0, 6.0, 6.0, 8.0, 6.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.06640625, -6.86944580078125, -6.6724853515625, -6.47552490234375, -6.278564453125, -6.08160400390625, -5.8846435546875, -5.68768310546875, -5.49072265625, -5.29376220703125, -5.0968017578125, -4.89984130859375, -4.702880859375, -4.50592041015625, -4.3089599609375, -4.11199951171875, -3.9150390625, -3.71807861328125, -3.5211181640625, -3.32415771484375, -3.127197265625, -2.93023681640625, -2.7332763671875, -2.53631591796875, -2.33935546875, -2.14239501953125, -1.9454345703125, -1.74847412109375, -1.551513671875, -1.35455322265625, -1.1575927734375, -0.96063232421875, -0.763671875, -0.56671142578125, -0.3697509765625, -0.17279052734375, 0.024169921875, 0.22113037109375, 0.4180908203125, 0.61505126953125, 0.81201171875, 1.00897216796875, 1.2059326171875, 1.40289306640625, 1.599853515625, 1.79681396484375, 1.9937744140625, 2.19073486328125, 2.3876953125, 2.58465576171875, 2.7816162109375, 2.97857666015625, 3.175537109375, 3.37249755859375, 3.5694580078125, 3.76641845703125, 3.96337890625, 4.16033935546875, 4.3572998046875, 4.55426025390625, 4.751220703125, 4.94818115234375, 5.1451416015625, 5.34210205078125, 5.5390625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 11.0, 7.0, 5.0, 13.0, 16.0, 17.0, 13.0, 14.0, 21.0, 24.0, 23.0, 36.0, 22.0, 37.0, 45.0, 34.0, 42.0, 52.0, 38.0, 42.0, 45.0, 41.0, 44.0, 39.0, 32.0, 35.0, 33.0, 25.0, 17.0, 26.0, 23.0, 20.0, 19.0, 15.0, 13.0, 12.0, 9.0, 3.0, 11.0, 3.0, 5.0, 4.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-35.001365661621094, -33.795631408691406, -32.58989334106445, -31.384157180786133, -30.178421020507812, -28.972686767578125, -27.766950607299805, -26.561214447021484, -25.355478286743164, -24.149742126464844, -22.944005966186523, -21.738269805908203, -20.532535552978516, -19.326797485351562, -18.121063232421875, -16.915327072143555, -15.709590911865234, -14.503854751586914, -13.298118591308594, -12.09238338470459, -10.88664722442627, -9.68091106414795, -8.475175857543945, -7.269439697265625, -6.063703536987305, -4.857967376708984, -3.6522316932678223, -2.446495771408081, -1.2407598495483398, -0.03502368927001953, 1.1707119941711426, 2.3764476776123047, 3.582183837890625, 4.787919998168945, 5.993655681610107, 7.1993913650512695, 8.40512752532959, 9.61086368560791, 10.816598892211914, 12.022335052490234, 13.228071212768555, 14.433807373046875, 15.639543533325195, 16.845279693603516, 18.051013946533203, 19.256752014160156, 20.462486267089844, 21.668222427368164, 22.873958587646484, 24.079694747924805, 25.285430908203125, 26.491167068481445, 27.696903228759766, 28.902637481689453, 30.108373641967773, 31.314109802246094, 32.51984405517578, 33.72557830810547, 34.93131637573242, 36.13705062866211, 37.34278869628906, 38.54852294921875, 39.7542610168457, 40.95999526977539, 42.165733337402344]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 5.0, 3.0, 6.0, 7.0, 8.0, 9.0, 15.0, 13.0, 14.0, 12.0, 16.0, 27.0, 21.0, 19.0, 34.0, 29.0, 31.0, 41.0, 27.0, 32.0, 40.0, 42.0, 38.0, 43.0, 34.0, 40.0, 29.0, 35.0, 32.0, 27.0, 26.0, 28.0, 27.0, 15.0, 20.0, 22.0, 18.0, 7.0, 26.0, 16.0, 11.0, 13.0, 11.0, 7.0, 10.0, 4.0, 3.0, 7.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-37.75242233276367, -36.604209899902344, -35.455997467041016, -34.30778503417969, -33.15957260131836, -32.01136016845703, -30.863149642944336, -29.714937210083008, -28.56672477722168, -27.41851234436035, -26.270299911499023, -25.122087478637695, -23.973876953125, -22.825664520263672, -21.677452087402344, -20.529239654541016, -19.381027221679688, -18.23281478881836, -17.08460235595703, -15.93639087677002, -14.788178443908691, -13.639966011047363, -12.491754531860352, -11.343542098999023, -10.195329666137695, -9.047117233276367, -7.898905277252197, -6.750693321228027, -5.602480888366699, -4.454268455505371, -3.306056499481201, -2.1578445434570312, -1.0096282958984375, 0.13858389854431152, 1.2867960929870605, 2.4350082874298096, 3.5832204818725586, 4.731432914733887, 5.879644870758057, 7.027856826782227, 8.176069259643555, 9.324281692504883, 10.472494125366211, 11.620705604553223, 12.76891803741455, 13.917130470275879, 15.06534194946289, 16.21355438232422, 17.361766815185547, 18.509979248046875, 19.658191680908203, 20.80640411376953, 21.95461654663086, 23.102828979492188, 24.251039505004883, 25.39925193786621, 26.54746437072754, 27.695676803588867, 28.843889236450195, 29.992101669311523, 31.14031219482422, 32.28852462768555, 33.436737060546875, 34.5849494934082, 35.73316192626953]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 4.0, 10.0, 15.0, 17.0, 40.0, 56.0, 94.0, 153.0, 233.0, 385.0, 635.0, 943.0, 1516.0, 2414.0, 3743.0, 5956.0, 9110.0, 14232.0, 22163.0, 34570.0, 52294.0, 80038.0, 118582.0, 173557.0, 242471.0, 326287.0, 407901.0, 465268.0, 478396.0, 443668.0, 373286.0, 288972.0, 210864.0, 146796.0, 99514.0, 66165.0, 43496.0, 28639.0, 18335.0, 11937.0, 7785.0, 5075.0, 3093.0, 2011.0, 1260.0, 814.0, 560.0, 335.0, 217.0, 151.0, 100.0, 55.0, 31.0, 21.0, 18.0, 7.0, 5.0, 3.0, 1.0, 2.0], "bins": [-34.0, -32.94677734375, -31.8935546875, -30.84033203125, -29.787109375, -28.73388671875, -27.6806640625, -26.62744140625, -25.57421875, -24.52099609375, -23.4677734375, -22.41455078125, -21.361328125, -20.30810546875, -19.2548828125, -18.20166015625, -17.1484375, -16.09521484375, -15.0419921875, -13.98876953125, -12.935546875, -11.88232421875, -10.8291015625, -9.77587890625, -8.72265625, -7.66943359375, -6.6162109375, -5.56298828125, -4.509765625, -3.45654296875, -2.4033203125, -1.35009765625, -0.296875, 0.75634765625, 1.8095703125, 2.86279296875, 3.916015625, 4.96923828125, 6.0224609375, 7.07568359375, 8.12890625, 9.18212890625, 10.2353515625, 11.28857421875, 12.341796875, 13.39501953125, 14.4482421875, 15.50146484375, 16.5546875, 17.60791015625, 18.6611328125, 19.71435546875, 20.767578125, 21.82080078125, 22.8740234375, 23.92724609375, 24.98046875, 26.03369140625, 27.0869140625, 28.14013671875, 29.193359375, 30.24658203125, 31.2998046875, 32.35302734375, 33.40625]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 3.0, 7.0, 13.0, 8.0, 14.0, 12.0, 14.0, 20.0, 18.0, 19.0, 18.0, 30.0, 26.0, 43.0, 27.0, 38.0, 28.0, 46.0, 47.0, 34.0, 30.0, 44.0, 32.0, 38.0, 33.0, 38.0, 32.0, 24.0, 28.0, 28.0, 21.0, 19.0, 23.0, 18.0, 21.0, 12.0, 15.0, 13.0, 9.0, 14.0, 10.0, 8.0, 4.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-33.34375, -32.30419921875, -31.2646484375, -30.22509765625, -29.185546875, -28.14599609375, -27.1064453125, -26.06689453125, -25.02734375, -23.98779296875, -22.9482421875, -21.90869140625, -20.869140625, -19.82958984375, -18.7900390625, -17.75048828125, -16.7109375, -15.67138671875, -14.6318359375, -13.59228515625, -12.552734375, -11.51318359375, -10.4736328125, -9.43408203125, -8.39453125, -7.35498046875, -6.3154296875, -5.27587890625, -4.236328125, -3.19677734375, -2.1572265625, -1.11767578125, -0.078125, 0.96142578125, 2.0009765625, 3.04052734375, 4.080078125, 5.11962890625, 6.1591796875, 7.19873046875, 8.23828125, 9.27783203125, 10.3173828125, 11.35693359375, 12.396484375, 13.43603515625, 14.4755859375, 15.51513671875, 16.5546875, 17.59423828125, 18.6337890625, 19.67333984375, 20.712890625, 21.75244140625, 22.7919921875, 23.83154296875, 24.87109375, 25.91064453125, 26.9501953125, 27.98974609375, 29.029296875, 30.06884765625, 31.1083984375, 32.14794921875, 33.1875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 7.0, 5.0, 13.0, 13.0, 20.0, 29.0, 60.0, 92.0, 177.0, 281.0, 494.0, 750.0, 1296.0, 2238.0, 3638.0, 6296.0, 10391.0, 16962.0, 27496.0, 43943.0, 70815.0, 108385.0, 160513.0, 228352.0, 307720.0, 387336.0, 448116.0, 474764.0, 454602.0, 398108.0, 319101.0, 239548.0, 170508.0, 114852.0, 74025.0, 47650.0, 29800.0, 18347.0, 11208.0, 6623.0, 3882.0, 2370.0, 1411.0, 833.0, 517.0, 287.0, 178.0, 89.0, 66.0, 40.0, 21.0, 13.0, 9.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.375, -36.2275390625, -35.080078125, -33.9326171875, -32.78515625, -31.6376953125, -30.490234375, -29.3427734375, -28.1953125, -27.0478515625, -25.900390625, -24.7529296875, -23.60546875, -22.4580078125, -21.310546875, -20.1630859375, -19.015625, -17.8681640625, -16.720703125, -15.5732421875, -14.42578125, -13.2783203125, -12.130859375, -10.9833984375, -9.8359375, -8.6884765625, -7.541015625, -6.3935546875, -5.24609375, -4.0986328125, -2.951171875, -1.8037109375, -0.65625, 0.4912109375, 1.638671875, 2.7861328125, 3.93359375, 5.0810546875, 6.228515625, 7.3759765625, 8.5234375, 9.6708984375, 10.818359375, 11.9658203125, 13.11328125, 14.2607421875, 15.408203125, 16.5556640625, 17.703125, 18.8505859375, 19.998046875, 21.1455078125, 22.29296875, 23.4404296875, 24.587890625, 25.7353515625, 26.8828125, 28.0302734375, 29.177734375, 30.3251953125, 31.47265625, 32.6201171875, 33.767578125, 34.9150390625, 36.0625]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 3.0, 7.0, 3.0, 3.0, 5.0, 12.0, 21.0, 17.0, 18.0, 33.0, 53.0, 48.0, 59.0, 78.0, 77.0, 99.0, 122.0, 143.0, 170.0, 202.0, 171.0, 194.0, 202.0, 213.0, 204.0, 197.0, 204.0, 201.0, 176.0, 179.0, 157.0, 130.0, 109.0, 120.0, 85.0, 64.0, 57.0, 47.0, 53.0, 21.0, 20.0, 28.0, 25.0, 14.0, 15.0, 5.0, 2.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.375, -17.810302734375, -17.24560546875, -16.680908203125, -16.1162109375, -15.551513671875, -14.98681640625, -14.422119140625, -13.857421875, -13.292724609375, -12.72802734375, -12.163330078125, -11.5986328125, -11.033935546875, -10.46923828125, -9.904541015625, -9.33984375, -8.775146484375, -8.21044921875, -7.645751953125, -7.0810546875, -6.516357421875, -5.95166015625, -5.386962890625, -4.822265625, -4.257568359375, -3.69287109375, -3.128173828125, -2.5634765625, -1.998779296875, -1.43408203125, -0.869384765625, -0.3046875, 0.260009765625, 0.82470703125, 1.389404296875, 1.9541015625, 2.518798828125, 3.08349609375, 3.648193359375, 4.212890625, 4.777587890625, 5.34228515625, 5.906982421875, 6.4716796875, 7.036376953125, 7.60107421875, 8.165771484375, 8.73046875, 9.295166015625, 9.85986328125, 10.424560546875, 10.9892578125, 11.553955078125, 12.11865234375, 12.683349609375, 13.248046875, 13.812744140625, 14.37744140625, 14.942138671875, 15.5068359375, 16.071533203125, 16.63623046875, 17.200927734375, 17.765625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 3.0, 5.0, 14.0, 9.0, 11.0, 14.0, 11.0, 16.0, 26.0, 28.0, 27.0, 32.0, 32.0, 48.0, 37.0, 49.0, 29.0, 45.0, 38.0, 42.0, 38.0, 42.0, 49.0, 39.0, 36.0, 46.0, 35.0, 34.0, 23.0, 14.0, 21.0, 13.0, 12.0, 9.0, 17.0, 7.0, 9.0, 8.0, 8.0, 10.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-42.77632522583008, -41.45649719238281, -40.13666915893555, -38.81684112548828, -37.49701690673828, -36.177188873291016, -34.85736083984375, -33.537532806396484, -32.21770477294922, -30.897876739501953, -29.578048706054688, -28.258222579956055, -26.93839454650879, -25.618566513061523, -24.29874038696289, -22.978912353515625, -21.65908432006836, -20.339256286621094, -19.019428253173828, -17.699602127075195, -16.37977409362793, -15.059946060180664, -13.740118980407715, -12.420291900634766, -11.1004638671875, -9.780635833740234, -8.460808753967285, -7.140981197357178, -5.82115364074707, -4.501326084136963, -3.1814985275268555, -1.8616714477539062, -0.5418434143066406, 0.7779841423034668, 2.097811698913574, 3.4176392555236816, 4.737466812133789, 6.0572943687438965, 7.377121925354004, 8.696949005126953, 10.016777038574219, 11.336605072021484, 12.656432151794434, 13.976259231567383, 15.296087265014648, 16.615915298461914, 17.935741424560547, 19.255569458007812, 20.575397491455078, 21.895225524902344, 23.21505355834961, 24.534879684448242, 25.854707717895508, 27.174535751342773, 28.494361877441406, 29.814189910888672, 31.134017944335938, 32.4538459777832, 33.77367401123047, 35.093502044677734, 36.413330078125, 37.733154296875, 39.052982330322266, 40.37281036376953, 41.6926383972168]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 2.0, 6.0, 8.0, 4.0, 11.0, 17.0, 23.0, 12.0, 13.0, 27.0, 26.0, 25.0, 31.0, 20.0, 28.0, 40.0, 42.0, 55.0, 37.0, 36.0, 37.0, 38.0, 35.0, 35.0, 29.0, 39.0, 30.0, 39.0, 28.0, 19.0, 23.0, 25.0, 24.0, 16.0, 22.0, 20.0, 16.0, 9.0, 7.0, 12.0, 11.0, 11.0, 3.0, 5.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-39.52040100097656, -38.30002975463867, -37.07966232299805, -35.859291076660156, -34.638919830322266, -33.418548583984375, -32.19818115234375, -30.97780990600586, -29.7574405670166, -28.537071228027344, -27.316699981689453, -26.096330642700195, -24.875961303710938, -23.655590057373047, -22.43522071838379, -21.21485137939453, -19.99448013305664, -18.774110794067383, -17.553739547729492, -16.333370208740234, -15.11299991607666, -13.892629623413086, -12.672260284423828, -11.451889991760254, -10.23151969909668, -9.011149406433105, -7.7907795906066895, -6.570409774780273, -5.350039482116699, -4.129669189453125, -2.909299373626709, -1.688929557800293, -0.46855926513671875, 0.7518107891082764, 1.9721808433532715, 3.1925508975982666, 4.412920951843262, 5.633291244506836, 6.853661060333252, 8.074030876159668, 9.294401168823242, 10.514771461486816, 11.73514175415039, 12.955511093139648, 14.175881385803223, 15.396251678466797, 16.616621017456055, 17.836990356445312, 19.057361602783203, 20.27773094177246, 21.49810218811035, 22.71847152709961, 23.9388427734375, 25.159212112426758, 26.379581451416016, 27.599952697753906, 28.820322036743164, 30.040691375732422, 31.261062622070312, 32.4814338684082, 33.70180130004883, 34.92217254638672, 36.14254379272461, 37.362911224365234, 38.583282470703125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 5.0, 4.0, 7.0, 8.0, 15.0, 27.0, 34.0, 45.0, 68.0, 100.0, 118.0, 147.0, 231.0, 317.0, 438.0, 654.0, 861.0, 1330.0, 1790.0, 2694.0, 4121.0, 6194.0, 10194.0, 17250.0, 30396.0, 56079.0, 102272.0, 165535.0, 207482.0, 177789.0, 112966.0, 63362.0, 34554.0, 19292.0, 11365.0, 6967.0, 4395.0, 2809.0, 1929.0, 1388.0, 939.0, 666.0, 477.0, 375.0, 241.0, 170.0, 151.0, 93.0, 70.0, 40.0, 25.0, 28.0, 20.0, 14.0, 8.0, 10.0, 7.0, 1.0, 1.0, 4.0], "bins": [-46.78125, -45.34619140625, -43.9111328125, -42.47607421875, -41.041015625, -39.60595703125, -38.1708984375, -36.73583984375, -35.30078125, -33.86572265625, -32.4306640625, -30.99560546875, -29.560546875, -28.12548828125, -26.6904296875, -25.25537109375, -23.8203125, -22.38525390625, -20.9501953125, -19.51513671875, -18.080078125, -16.64501953125, -15.2099609375, -13.77490234375, -12.33984375, -10.90478515625, -9.4697265625, -8.03466796875, -6.599609375, -5.16455078125, -3.7294921875, -2.29443359375, -0.859375, 0.57568359375, 2.0107421875, 3.44580078125, 4.880859375, 6.31591796875, 7.7509765625, 9.18603515625, 10.62109375, 12.05615234375, 13.4912109375, 14.92626953125, 16.361328125, 17.79638671875, 19.2314453125, 20.66650390625, 22.1015625, 23.53662109375, 24.9716796875, 26.40673828125, 27.841796875, 29.27685546875, 30.7119140625, 32.14697265625, 33.58203125, 35.01708984375, 36.4521484375, 37.88720703125, 39.322265625, 40.75732421875, 42.1923828125, 43.62744140625, 45.0625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 7.0, 6.0, 13.0, 20.0, 17.0, 14.0, 17.0, 24.0, 25.0, 23.0, 35.0, 18.0, 32.0, 35.0, 47.0, 50.0, 37.0, 38.0, 38.0, 33.0, 35.0, 39.0, 28.0, 36.0, 29.0, 40.0, 27.0, 19.0, 24.0, 24.0, 25.0, 13.0, 25.0, 19.0, 17.0, 10.0, 5.0, 11.0, 13.0, 11.0, 2.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-38.59375, -37.39501953125, -36.1962890625, -34.99755859375, -33.798828125, -32.60009765625, -31.4013671875, -30.20263671875, -29.00390625, -27.80517578125, -26.6064453125, -25.40771484375, -24.208984375, -23.01025390625, -21.8115234375, -20.61279296875, -19.4140625, -18.21533203125, -17.0166015625, -15.81787109375, -14.619140625, -13.42041015625, -12.2216796875, -11.02294921875, -9.82421875, -8.62548828125, -7.4267578125, -6.22802734375, -5.029296875, -3.83056640625, -2.6318359375, -1.43310546875, -0.234375, 0.96435546875, 2.1630859375, 3.36181640625, 4.560546875, 5.75927734375, 6.9580078125, 8.15673828125, 9.35546875, 10.55419921875, 11.7529296875, 12.95166015625, 14.150390625, 15.34912109375, 16.5478515625, 17.74658203125, 18.9453125, 20.14404296875, 21.3427734375, 22.54150390625, 23.740234375, 24.93896484375, 26.1376953125, 27.33642578125, 28.53515625, 29.73388671875, 30.9326171875, 32.13134765625, 33.330078125, 34.52880859375, 35.7275390625, 36.92626953125, 38.125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 8.0, 16.0, 17.0, 18.0, 17.0, 48.0, 72.0, 108.0, 168.0, 234.0, 322.0, 545.0, 751.0, 1182.0, 1998.0, 3300.0, 5964.0, 11450.0, 24538.0, 64145.0, 205213.0, 414530.0, 201346.0, 62693.0, 24097.0, 11097.0, 5871.0, 3366.0, 1946.0, 1215.0, 746.0, 489.0, 345.0, 211.0, 144.0, 99.0, 76.0, 56.0, 33.0, 24.0, 22.0, 12.0, 13.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-71.5, -69.2294921875, -66.958984375, -64.6884765625, -62.41796875, -60.1474609375, -57.876953125, -55.6064453125, -53.3359375, -51.0654296875, -48.794921875, -46.5244140625, -44.25390625, -41.9833984375, -39.712890625, -37.4423828125, -35.171875, -32.9013671875, -30.630859375, -28.3603515625, -26.08984375, -23.8193359375, -21.548828125, -19.2783203125, -17.0078125, -14.7373046875, -12.466796875, -10.1962890625, -7.92578125, -5.6552734375, -3.384765625, -1.1142578125, 1.15625, 3.4267578125, 5.697265625, 7.9677734375, 10.23828125, 12.5087890625, 14.779296875, 17.0498046875, 19.3203125, 21.5908203125, 23.861328125, 26.1318359375, 28.40234375, 30.6728515625, 32.943359375, 35.2138671875, 37.484375, 39.7548828125, 42.025390625, 44.2958984375, 46.56640625, 48.8369140625, 51.107421875, 53.3779296875, 55.6484375, 57.9189453125, 60.189453125, 62.4599609375, 64.73046875, 67.0009765625, 69.271484375, 71.5419921875, 73.8125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 9.0, 7.0, 10.0, 8.0, 11.0, 17.0, 20.0, 20.0, 10.0, 35.0, 28.0, 35.0, 39.0, 30.0, 31.0, 50.0, 45.0, 42.0, 34.0, 42.0, 40.0, 33.0, 36.0, 47.0, 48.0, 25.0, 31.0, 33.0, 23.0, 28.0, 25.0, 24.0, 20.0, 9.0, 13.0, 10.0, 4.0, 6.0, 5.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.78125, -23.93701171875, -23.0927734375, -22.24853515625, -21.404296875, -20.56005859375, -19.7158203125, -18.87158203125, -18.02734375, -17.18310546875, -16.3388671875, -15.49462890625, -14.650390625, -13.80615234375, -12.9619140625, -12.11767578125, -11.2734375, -10.42919921875, -9.5849609375, -8.74072265625, -7.896484375, -7.05224609375, -6.2080078125, -5.36376953125, -4.51953125, -3.67529296875, -2.8310546875, -1.98681640625, -1.142578125, -0.29833984375, 0.5458984375, 1.39013671875, 2.234375, 3.07861328125, 3.9228515625, 4.76708984375, 5.611328125, 6.45556640625, 7.2998046875, 8.14404296875, 8.98828125, 9.83251953125, 10.6767578125, 11.52099609375, 12.365234375, 13.20947265625, 14.0537109375, 14.89794921875, 15.7421875, 16.58642578125, 17.4306640625, 18.27490234375, 19.119140625, 19.96337890625, 20.8076171875, 21.65185546875, 22.49609375, 23.34033203125, 24.1845703125, 25.02880859375, 25.873046875, 26.71728515625, 27.5615234375, 28.40576171875, 29.25]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 3.0, 7.0, 11.0, 11.0, 24.0, 37.0, 42.0, 38.0, 67.0, 94.0, 129.0, 209.0, 270.0, 349.0, 556.0, 703.0, 1062.0, 1499.0, 2295.0, 3505.0, 5748.0, 9741.0, 19026.0, 41305.0, 102081.0, 258369.0, 331060.0, 152829.0, 59028.0, 25496.0, 12840.0, 7239.0, 4330.0, 2825.0, 1788.0, 1149.0, 810.0, 589.0, 404.0, 281.0, 189.0, 140.0, 105.0, 63.0, 61.0, 44.0, 31.0, 24.0, 17.0, 11.0, 11.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-21.453125, -20.80712890625, -20.1611328125, -19.51513671875, -18.869140625, -18.22314453125, -17.5771484375, -16.93115234375, -16.28515625, -15.63916015625, -14.9931640625, -14.34716796875, -13.701171875, -13.05517578125, -12.4091796875, -11.76318359375, -11.1171875, -10.47119140625, -9.8251953125, -9.17919921875, -8.533203125, -7.88720703125, -7.2412109375, -6.59521484375, -5.94921875, -5.30322265625, -4.6572265625, -4.01123046875, -3.365234375, -2.71923828125, -2.0732421875, -1.42724609375, -0.78125, -0.13525390625, 0.5107421875, 1.15673828125, 1.802734375, 2.44873046875, 3.0947265625, 3.74072265625, 4.38671875, 5.03271484375, 5.6787109375, 6.32470703125, 6.970703125, 7.61669921875, 8.2626953125, 8.90869140625, 9.5546875, 10.20068359375, 10.8466796875, 11.49267578125, 12.138671875, 12.78466796875, 13.4306640625, 14.07666015625, 14.72265625, 15.36865234375, 16.0146484375, 16.66064453125, 17.306640625, 17.95263671875, 18.5986328125, 19.24462890625, 19.890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 8.0, 5.0, 10.0, 20.0, 28.0, 33.0, 82.0, 124.0, 156.0, 154.0, 133.0, 91.0, 66.0, 41.0, 19.0, 9.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00304412841796875, -0.0029400289058685303, -0.0028359293937683105, -0.002731829881668091, -0.002627730369567871, -0.0025236308574676514, -0.0024195313453674316, -0.002315431833267212, -0.002211332321166992, -0.0021072328090667725, -0.0020031332969665527, -0.001899033784866333, -0.0017949342727661133, -0.0016908347606658936, -0.0015867352485656738, -0.001482635736465454, -0.0013785362243652344, -0.0012744367122650146, -0.001170337200164795, -0.0010662376880645752, -0.0009621381759643555, -0.0008580386638641357, -0.000753939151763916, -0.0006498396396636963, -0.0005457401275634766, -0.00044164061546325684, -0.0003375411033630371, -0.00023344159126281738, -0.00012934207916259766, -2.524256706237793e-05, 7.88569450378418e-05, 0.00018295645713806152, 0.00028705596923828125, 0.000391155481338501, 0.0004952549934387207, 0.0005993545055389404, 0.0007034540176391602, 0.0008075535297393799, 0.0009116530418395996, 0.0010157525539398193, 0.001119852066040039, 0.0012239515781402588, 0.0013280510902404785, 0.0014321506023406982, 0.001536250114440918, 0.0016403496265411377, 0.0017444491386413574, 0.0018485486507415771, 0.0019526481628417969, 0.0020567476749420166, 0.0021608471870422363, 0.002264946699142456, 0.0023690462112426758, 0.0024731457233428955, 0.0025772452354431152, 0.002681344747543335, 0.0027854442596435547, 0.0028895437717437744, 0.002993643283843994, 0.003097742795944214, 0.0032018423080444336, 0.0033059418201446533, 0.003410041332244873, 0.0035141408443450928, 0.0036182403564453125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 6.0, 6.0, 18.0, 7.0, 14.0, 28.0, 40.0, 54.0, 80.0, 110.0, 197.0, 261.0, 366.0, 553.0, 805.0, 1185.0, 1732.0, 2644.0, 4184.0, 6678.0, 10825.0, 17589.0, 30631.0, 54207.0, 98357.0, 163911.0, 209755.0, 179265.0, 113362.0, 63169.0, 35204.0, 20245.0, 12014.0, 7282.0, 4675.0, 3049.0, 2042.0, 1350.0, 840.0, 543.0, 376.0, 272.0, 215.0, 127.0, 93.0, 70.0, 46.0, 27.0, 22.0, 16.0, 8.0, 4.0, 7.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.109375, -18.4853515625, -17.861328125, -17.2373046875, -16.61328125, -15.9892578125, -15.365234375, -14.7412109375, -14.1171875, -13.4931640625, -12.869140625, -12.2451171875, -11.62109375, -10.9970703125, -10.373046875, -9.7490234375, -9.125, -8.5009765625, -7.876953125, -7.2529296875, -6.62890625, -6.0048828125, -5.380859375, -4.7568359375, -4.1328125, -3.5087890625, -2.884765625, -2.2607421875, -1.63671875, -1.0126953125, -0.388671875, 0.2353515625, 0.859375, 1.4833984375, 2.107421875, 2.7314453125, 3.35546875, 3.9794921875, 4.603515625, 5.2275390625, 5.8515625, 6.4755859375, 7.099609375, 7.7236328125, 8.34765625, 8.9716796875, 9.595703125, 10.2197265625, 10.84375, 11.4677734375, 12.091796875, 12.7158203125, 13.33984375, 13.9638671875, 14.587890625, 15.2119140625, 15.8359375, 16.4599609375, 17.083984375, 17.7080078125, 18.33203125, 18.9560546875, 19.580078125, 20.2041015625, 20.828125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 3.0, 3.0, 9.0, 3.0, 8.0, 6.0, 21.0, 18.0, 31.0, 33.0, 49.0, 56.0, 73.0, 88.0, 113.0, 96.0, 81.0, 87.0, 51.0, 51.0, 30.0, 21.0, 13.0, 17.0, 9.0, 6.0, 9.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.375, -11.064697265625, -10.75439453125, -10.444091796875, -10.1337890625, -9.823486328125, -9.51318359375, -9.202880859375, -8.892578125, -8.582275390625, -8.27197265625, -7.961669921875, -7.6513671875, -7.341064453125, -7.03076171875, -6.720458984375, -6.41015625, -6.099853515625, -5.78955078125, -5.479248046875, -5.1689453125, -4.858642578125, -4.54833984375, -4.238037109375, -3.927734375, -3.617431640625, -3.30712890625, -2.996826171875, -2.6865234375, -2.376220703125, -2.06591796875, -1.755615234375, -1.4453125, -1.135009765625, -0.82470703125, -0.514404296875, -0.2041015625, 0.106201171875, 0.41650390625, 0.726806640625, 1.037109375, 1.347412109375, 1.65771484375, 1.968017578125, 2.2783203125, 2.588623046875, 2.89892578125, 3.209228515625, 3.51953125, 3.829833984375, 4.14013671875, 4.450439453125, 4.7607421875, 5.071044921875, 5.38134765625, 5.691650390625, 6.001953125, 6.312255859375, 6.62255859375, 6.932861328125, 7.2431640625, 7.553466796875, 7.86376953125, 8.174072265625, 8.484375]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 5.0, 4.0, 4.0, 2.0, 8.0, 9.0, 12.0, 9.0, 12.0, 10.0, 16.0, 22.0, 28.0, 25.0, 27.0, 37.0, 22.0, 36.0, 51.0, 40.0, 39.0, 40.0, 50.0, 32.0, 47.0, 38.0, 42.0, 30.0, 33.0, 32.0, 34.0, 35.0, 23.0, 21.0, 17.0, 16.0, 11.0, 14.0, 9.0, 6.0, 18.0, 8.0, 9.0, 8.0, 3.0, 3.0, 3.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-42.1766471862793, -40.90530014038086, -39.63395309448242, -38.36260986328125, -37.09126281738281, -35.819915771484375, -34.54856872558594, -33.2772216796875, -32.00587463378906, -30.734527587890625, -29.46318244934082, -28.191835403442383, -26.920490264892578, -25.64914321899414, -24.377796173095703, -23.106449127197266, -21.835105895996094, -20.563758850097656, -19.29241371154785, -18.021066665649414, -16.74972152709961, -15.478374481201172, -14.207027435302734, -12.935681343078613, -11.664335250854492, -10.392989158630371, -9.12164306640625, -7.8502960205078125, -6.578949928283691, -5.30760383605957, -4.036257266998291, -2.7649106979370117, -1.4935646057128906, -0.22221827507019043, 1.0491280555725098, 2.32047438621521, 3.59182071685791, 4.863166809082031, 6.1345133781433105, 7.40585994720459, 8.677206039428711, 9.948552131652832, 11.219898223876953, 12.49124526977539, 13.762591361999512, 15.033937454223633, 16.30528450012207, 17.576629638671875, 18.847976684570312, 20.11932373046875, 21.390668869018555, 22.662015914916992, 23.933361053466797, 25.204708099365234, 26.476055145263672, 27.74740219116211, 29.018747329711914, 30.29009437561035, 31.561439514160156, 32.832786560058594, 34.10413360595703, 35.37548065185547, 36.64682388305664, 37.91817092895508, 39.189517974853516]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 9.0, 6.0, 17.0, 15.0, 13.0, 21.0, 20.0, 20.0, 24.0, 23.0, 16.0, 32.0, 30.0, 37.0, 41.0, 28.0, 40.0, 34.0, 37.0, 42.0, 29.0, 36.0, 25.0, 42.0, 26.0, 30.0, 36.0, 33.0, 24.0, 18.0, 25.0, 10.0, 22.0, 16.0, 17.0, 20.0, 15.0, 15.0, 8.0, 8.0, 7.0, 9.0, 3.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-38.038238525390625, -36.883705139160156, -35.72916793823242, -34.57463455200195, -33.42009735107422, -32.26556396484375, -31.11103057861328, -29.95649528503418, -28.801959991455078, -27.647424697875977, -26.492889404296875, -25.338356018066406, -24.183820724487305, -23.029285430908203, -21.874752044677734, -20.720216751098633, -19.56568145751953, -18.41114616394043, -17.256610870361328, -16.10207748413086, -14.947542190551758, -13.793006896972656, -12.638472557067871, -11.483938217163086, -10.329402923583984, -9.174867630004883, -8.020333290100098, -6.865798473358154, -5.711263656616211, -4.556728839874268, -3.402194023132324, -2.247659683227539, -1.0931282043457031, 0.061406612396240234, 1.2159414291381836, 2.370476245880127, 3.5250110626220703, 4.679545879364014, 5.834080696105957, 6.988615036010742, 8.143150329589844, 9.297685623168945, 10.45221996307373, 11.606754302978516, 12.761289596557617, 13.915824890136719, 15.070359230041504, 16.22489356994629, 17.37942886352539, 18.533964157104492, 19.688499450683594, 20.843032836914062, 21.997568130493164, 23.152103424072266, 24.306636810302734, 25.461172103881836, 26.615707397460938, 27.77024269104004, 28.92477798461914, 30.07931137084961, 31.23384666442871, 32.38838195800781, 33.54291534423828, 34.69744873046875, 35.851985931396484]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 8.0, 4.0, 11.0, 19.0, 24.0, 31.0, 55.0, 86.0, 134.0, 211.0, 345.0, 609.0, 938.0, 1589.0, 2777.0, 4636.0, 7857.0, 12841.0, 20517.0, 32172.0, 48978.0, 67936.0, 89445.0, 109061.0, 121225.0, 120876.0, 109752.0, 90500.0, 69443.0, 49362.0, 33110.0, 21164.0, 13203.0, 7980.0, 4652.0, 2848.0, 1619.0, 977.0, 570.0, 364.0, 244.0, 143.0, 91.0, 57.0, 36.0, 16.0, 13.0, 5.0, 10.0, 3.0, 3.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-42.71875, -41.341796875, -39.96484375, -38.587890625, -37.2109375, -35.833984375, -34.45703125, -33.080078125, -31.703125, -30.326171875, -28.94921875, -27.572265625, -26.1953125, -24.818359375, -23.44140625, -22.064453125, -20.6875, -19.310546875, -17.93359375, -16.556640625, -15.1796875, -13.802734375, -12.42578125, -11.048828125, -9.671875, -8.294921875, -6.91796875, -5.541015625, -4.1640625, -2.787109375, -1.41015625, -0.033203125, 1.34375, 2.720703125, 4.09765625, 5.474609375, 6.8515625, 8.228515625, 9.60546875, 10.982421875, 12.359375, 13.736328125, 15.11328125, 16.490234375, 17.8671875, 19.244140625, 20.62109375, 21.998046875, 23.375, 24.751953125, 26.12890625, 27.505859375, 28.8828125, 30.259765625, 31.63671875, 33.013671875, 34.390625, 35.767578125, 37.14453125, 38.521484375, 39.8984375, 41.275390625, 42.65234375, 44.029296875, 45.40625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 5.0, 11.0, 12.0, 17.0, 18.0, 18.0, 21.0, 16.0, 28.0, 24.0, 24.0, 19.0, 42.0, 33.0, 38.0, 30.0, 39.0, 34.0, 41.0, 45.0, 26.0, 32.0, 36.0, 33.0, 28.0, 31.0, 31.0, 28.0, 21.0, 25.0, 20.0, 18.0, 18.0, 20.0, 11.0, 17.0, 16.0, 13.0, 9.0, 8.0, 8.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-35.3125, -34.23291015625, -33.1533203125, -32.07373046875, -30.994140625, -29.91455078125, -28.8349609375, -27.75537109375, -26.67578125, -25.59619140625, -24.5166015625, -23.43701171875, -22.357421875, -21.27783203125, -20.1982421875, -19.11865234375, -18.0390625, -16.95947265625, -15.8798828125, -14.80029296875, -13.720703125, -12.64111328125, -11.5615234375, -10.48193359375, -9.40234375, -8.32275390625, -7.2431640625, -6.16357421875, -5.083984375, -4.00439453125, -2.9248046875, -1.84521484375, -0.765625, 0.31396484375, 1.3935546875, 2.47314453125, 3.552734375, 4.63232421875, 5.7119140625, 6.79150390625, 7.87109375, 8.95068359375, 10.0302734375, 11.10986328125, 12.189453125, 13.26904296875, 14.3486328125, 15.42822265625, 16.5078125, 17.58740234375, 18.6669921875, 19.74658203125, 20.826171875, 21.90576171875, 22.9853515625, 24.06494140625, 25.14453125, 26.22412109375, 27.3037109375, 28.38330078125, 29.462890625, 30.54248046875, 31.6220703125, 32.70166015625, 33.78125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 6.0, 9.0, 18.0, 19.0, 28.0, 44.0, 77.0, 135.0, 226.0, 342.0, 597.0, 993.0, 1666.0, 2991.0, 5229.0, 8466.0, 14896.0, 24631.0, 39650.0, 59962.0, 84936.0, 110527.0, 129074.0, 134250.0, 123076.0, 100312.0, 74136.0, 50818.0, 32536.0, 20031.0, 12049.0, 6907.0, 4156.0, 2334.0, 1399.0, 800.0, 482.0, 267.0, 175.0, 99.0, 66.0, 37.0, 32.0, 23.0, 20.0, 13.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.71875, -49.1953125, -47.671875, -46.1484375, -44.625, -43.1015625, -41.578125, -40.0546875, -38.53125, -37.0078125, -35.484375, -33.9609375, -32.4375, -30.9140625, -29.390625, -27.8671875, -26.34375, -24.8203125, -23.296875, -21.7734375, -20.25, -18.7265625, -17.203125, -15.6796875, -14.15625, -12.6328125, -11.109375, -9.5859375, -8.0625, -6.5390625, -5.015625, -3.4921875, -1.96875, -0.4453125, 1.078125, 2.6015625, 4.125, 5.6484375, 7.171875, 8.6953125, 10.21875, 11.7421875, 13.265625, 14.7890625, 16.3125, 17.8359375, 19.359375, 20.8828125, 22.40625, 23.9296875, 25.453125, 26.9765625, 28.5, 30.0234375, 31.546875, 33.0703125, 34.59375, 36.1171875, 37.640625, 39.1640625, 40.6875, 42.2109375, 43.734375, 45.2578125, 46.78125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 3.0, 10.0, 10.0, 17.0, 12.0, 12.0, 12.0, 17.0, 24.0, 18.0, 23.0, 14.0, 28.0, 24.0, 25.0, 30.0, 27.0, 39.0, 32.0, 44.0, 43.0, 38.0, 41.0, 38.0, 36.0, 33.0, 33.0, 27.0, 32.0, 22.0, 16.0, 28.0, 23.0, 22.0, 24.0, 11.0, 17.0, 14.0, 11.0, 16.0, 9.0, 11.0, 9.0, 6.0, 6.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.125, -21.37451171875, -20.6240234375, -19.87353515625, -19.123046875, -18.37255859375, -17.6220703125, -16.87158203125, -16.12109375, -15.37060546875, -14.6201171875, -13.86962890625, -13.119140625, -12.36865234375, -11.6181640625, -10.86767578125, -10.1171875, -9.36669921875, -8.6162109375, -7.86572265625, -7.115234375, -6.36474609375, -5.6142578125, -4.86376953125, -4.11328125, -3.36279296875, -2.6123046875, -1.86181640625, -1.111328125, -0.36083984375, 0.3896484375, 1.14013671875, 1.890625, 2.64111328125, 3.3916015625, 4.14208984375, 4.892578125, 5.64306640625, 6.3935546875, 7.14404296875, 7.89453125, 8.64501953125, 9.3955078125, 10.14599609375, 10.896484375, 11.64697265625, 12.3974609375, 13.14794921875, 13.8984375, 14.64892578125, 15.3994140625, 16.14990234375, 16.900390625, 17.65087890625, 18.4013671875, 19.15185546875, 19.90234375, 20.65283203125, 21.4033203125, 22.15380859375, 22.904296875, 23.65478515625, 24.4052734375, 25.15576171875, 25.90625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 9.0, 4.0, 5.0, 14.0, 16.0, 30.0, 40.0, 41.0, 56.0, 122.0, 146.0, 252.0, 353.0, 589.0, 848.0, 1404.0, 2311.0, 3839.0, 6565.0, 10999.0, 18650.0, 30631.0, 49231.0, 74311.0, 103149.0, 128833.0, 140874.0, 134683.0, 112119.0, 82876.0, 55976.0, 35807.0, 21495.0, 12744.0, 7634.0, 4602.0, 2732.0, 1656.0, 1031.0, 622.0, 424.0, 237.0, 179.0, 132.0, 85.0, 66.0, 45.0, 27.0, 22.0, 18.0, 10.0, 6.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0], "bins": [-15.8515625, -15.3660888671875, -14.880615234375, -14.3951416015625, -13.90966796875, -13.4241943359375, -12.938720703125, -12.4532470703125, -11.9677734375, -11.4822998046875, -10.996826171875, -10.5113525390625, -10.02587890625, -9.5404052734375, -9.054931640625, -8.5694580078125, -8.083984375, -7.5985107421875, -7.113037109375, -6.6275634765625, -6.14208984375, -5.6566162109375, -5.171142578125, -4.6856689453125, -4.2001953125, -3.7147216796875, -3.229248046875, -2.7437744140625, -2.25830078125, -1.7728271484375, -1.287353515625, -0.8018798828125, -0.31640625, 0.1690673828125, 0.654541015625, 1.1400146484375, 1.62548828125, 2.1109619140625, 2.596435546875, 3.0819091796875, 3.5673828125, 4.0528564453125, 4.538330078125, 5.0238037109375, 5.50927734375, 5.9947509765625, 6.480224609375, 6.9656982421875, 7.451171875, 7.9366455078125, 8.422119140625, 8.9075927734375, 9.39306640625, 9.8785400390625, 10.364013671875, 10.8494873046875, 11.3349609375, 11.8204345703125, 12.305908203125, 12.7913818359375, 13.27685546875, 13.7623291015625, 14.247802734375, 14.7332763671875, 15.21875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 6.0, 8.0, 6.0, 10.0, 18.0, 14.0, 21.0, 16.0, 15.0, 26.0, 23.0, 36.0, 57.0, 49.0, 50.0, 66.0, 58.0, 67.0, 73.0, 72.0, 44.0, 49.0, 37.0, 37.0, 26.0, 16.0, 23.0, 14.0, 19.0, 8.0, 11.0, 10.0, 5.0, 4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0022602081298828125, -0.0022002607583999634, -0.0021403133869171143, -0.002080366015434265, -0.002020418643951416, -0.001960471272468567, -0.0019005239009857178, -0.0018405765295028687, -0.0017806291580200195, -0.0017206817865371704, -0.0016607344150543213, -0.0016007870435714722, -0.001540839672088623, -0.001480892300605774, -0.0014209449291229248, -0.0013609975576400757, -0.0013010501861572266, -0.0012411028146743774, -0.0011811554431915283, -0.0011212080717086792, -0.00106126070022583, -0.001001313328742981, -0.0009413659572601318, -0.0008814185857772827, -0.0008214712142944336, -0.0007615238428115845, -0.0007015764713287354, -0.0006416290998458862, -0.0005816817283630371, -0.000521734356880188, -0.00046178698539733887, -0.00040183961391448975, -0.0003418922424316406, -0.0002819448709487915, -0.00022199749946594238, -0.00016205012798309326, -0.00010210275650024414, -4.215538501739502e-05, 1.77919864654541e-05, 7.773935794830322e-05, 0.00013768672943115234, 0.00019763410091400146, 0.0002575814723968506, 0.0003175288438796997, 0.00037747621536254883, 0.00043742358684539795, 0.0004973709583282471, 0.0005573183298110962, 0.0006172657012939453, 0.0006772130727767944, 0.0007371604442596436, 0.0007971078157424927, 0.0008570551872253418, 0.0009170025587081909, 0.00097694993019104, 0.0010368973016738892, 0.0010968446731567383, 0.0011567920446395874, 0.0012167394161224365, 0.0012766867876052856, 0.0013366341590881348, 0.0013965815305709839, 0.001456528902053833, 0.0015164762735366821, 0.0015764236450195312]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 5.0, 3.0, 8.0, 6.0, 12.0, 13.0, 19.0, 26.0, 56.0, 86.0, 123.0, 186.0, 335.0, 476.0, 833.0, 1457.0, 2590.0, 4386.0, 7901.0, 13843.0, 24378.0, 41345.0, 65480.0, 97113.0, 127300.0, 147060.0, 145428.0, 123172.0, 92410.0, 61814.0, 38173.0, 22470.0, 12798.0, 7414.0, 4134.0, 2361.0, 1287.0, 802.0, 477.0, 282.0, 182.0, 115.0, 52.0, 59.0, 31.0, 20.0, 15.0, 10.0, 8.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.15625, -14.63232421875, -14.1083984375, -13.58447265625, -13.060546875, -12.53662109375, -12.0126953125, -11.48876953125, -10.96484375, -10.44091796875, -9.9169921875, -9.39306640625, -8.869140625, -8.34521484375, -7.8212890625, -7.29736328125, -6.7734375, -6.24951171875, -5.7255859375, -5.20166015625, -4.677734375, -4.15380859375, -3.6298828125, -3.10595703125, -2.58203125, -2.05810546875, -1.5341796875, -1.01025390625, -0.486328125, 0.03759765625, 0.5615234375, 1.08544921875, 1.609375, 2.13330078125, 2.6572265625, 3.18115234375, 3.705078125, 4.22900390625, 4.7529296875, 5.27685546875, 5.80078125, 6.32470703125, 6.8486328125, 7.37255859375, 7.896484375, 8.42041015625, 8.9443359375, 9.46826171875, 9.9921875, 10.51611328125, 11.0400390625, 11.56396484375, 12.087890625, 12.61181640625, 13.1357421875, 13.65966796875, 14.18359375, 14.70751953125, 15.2314453125, 15.75537109375, 16.279296875, 16.80322265625, 17.3271484375, 17.85107421875, 18.375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 5.0, 9.0, 10.0, 6.0, 23.0, 19.0, 25.0, 19.0, 32.0, 44.0, 43.0, 55.0, 70.0, 58.0, 50.0, 62.0, 55.0, 59.0, 49.0, 51.0, 48.0, 32.0, 45.0, 27.0, 22.0, 20.0, 22.0, 10.0, 14.0, 4.0, 8.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.5703125, -8.33721923828125, -8.1041259765625, -7.87103271484375, -7.637939453125, -7.40484619140625, -7.1717529296875, -6.93865966796875, -6.70556640625, -6.47247314453125, -6.2393798828125, -6.00628662109375, -5.773193359375, -5.54010009765625, -5.3070068359375, -5.07391357421875, -4.8408203125, -4.60772705078125, -4.3746337890625, -4.14154052734375, -3.908447265625, -3.67535400390625, -3.4422607421875, -3.20916748046875, -2.97607421875, -2.74298095703125, -2.5098876953125, -2.27679443359375, -2.043701171875, -1.81060791015625, -1.5775146484375, -1.34442138671875, -1.111328125, -0.87823486328125, -0.6451416015625, -0.41204833984375, -0.178955078125, 0.05413818359375, 0.2872314453125, 0.52032470703125, 0.75341796875, 0.98651123046875, 1.2196044921875, 1.45269775390625, 1.685791015625, 1.91888427734375, 2.1519775390625, 2.38507080078125, 2.6181640625, 2.85125732421875, 3.0843505859375, 3.31744384765625, 3.550537109375, 3.78363037109375, 4.0167236328125, 4.24981689453125, 4.48291015625, 4.71600341796875, 4.9490966796875, 5.18218994140625, 5.415283203125, 5.64837646484375, 5.8814697265625, 6.11456298828125, 6.34765625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 0.0, 1.0, 2.0, 5.0, 8.0, 8.0, 5.0, 10.0, 13.0, 21.0, 20.0, 13.0, 14.0, 18.0, 20.0, 33.0, 36.0, 28.0, 40.0, 33.0, 39.0, 49.0, 44.0, 42.0, 41.0, 41.0, 33.0, 44.0, 32.0, 29.0, 35.0, 32.0, 27.0, 20.0, 27.0, 20.0, 19.0, 16.0, 10.0, 11.0, 14.0, 6.0, 7.0, 11.0, 5.0, 3.0, 6.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-41.918182373046875, -40.69587707519531, -39.47357177734375, -38.25126647949219, -37.028961181640625, -35.80665588378906, -34.5843505859375, -33.36204528808594, -32.139739990234375, -30.917434692382812, -29.69512939453125, -28.472824096679688, -27.250518798828125, -26.028213500976562, -24.805910110473633, -23.58360481262207, -22.36130142211914, -21.138996124267578, -19.916690826416016, -18.694385528564453, -17.47208023071289, -16.249774932861328, -15.027471542358398, -13.805166244506836, -12.582860946655273, -11.360555648803711, -10.138250350952148, -8.915946006774902, -7.69364070892334, -6.471335411071777, -5.249030590057373, -4.026725769042969, -2.804424285888672, -1.5821192264556885, -0.3598141670227051, 0.8624908924102783, 2.0847959518432617, 3.307101249694824, 4.5294060707092285, 5.751710891723633, 6.974016189575195, 8.196321487426758, 9.41862678527832, 10.640931129455566, 11.863236427307129, 13.085541725158691, 14.307846069335938, 15.5301513671875, 16.752456665039062, 17.974761962890625, 19.197067260742188, 20.41937255859375, 21.641677856445312, 22.863983154296875, 24.086286544799805, 25.308591842651367, 26.53089714050293, 27.753202438354492, 28.975507736206055, 30.197813034057617, 31.420116424560547, 32.64242172241211, 33.86472702026367, 35.087032318115234, 36.3093376159668]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 7.0, 5.0, 8.0, 2.0, 6.0, 11.0, 15.0, 10.0, 9.0, 17.0, 31.0, 22.0, 25.0, 24.0, 36.0, 37.0, 39.0, 33.0, 41.0, 33.0, 37.0, 43.0, 36.0, 31.0, 33.0, 35.0, 32.0, 30.0, 33.0, 28.0, 22.0, 33.0, 31.0, 24.0, 17.0, 14.0, 23.0, 16.0, 16.0, 14.0, 10.0, 9.0, 6.0, 7.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-36.795631408691406, -35.632545471191406, -34.46946334838867, -33.30638122558594, -32.14329528808594, -30.98021125793457, -29.817127227783203, -28.654043197631836, -27.49095916748047, -26.3278751373291, -25.164791107177734, -24.001707077026367, -22.838623046875, -21.675539016723633, -20.512454986572266, -19.3493709564209, -18.18628692626953, -17.023202896118164, -15.860118865966797, -14.69703483581543, -13.533950805664062, -12.370866775512695, -11.207782745361328, -10.044698715209961, -8.881614685058594, -7.718530654907227, -6.555446624755859, -5.392362594604492, -4.229278564453125, -3.066194534301758, -1.9031105041503906, -0.7400264739990234, 0.4230613708496094, 1.5861454010009766, 2.7492294311523438, 3.912313461303711, 5.075397491455078, 6.238481521606445, 7.4015655517578125, 8.56464958190918, 9.727733612060547, 10.890817642211914, 12.053901672363281, 13.216985702514648, 14.380069732666016, 15.543153762817383, 16.70623779296875, 17.869321823120117, 19.032405853271484, 20.19548988342285, 21.35857391357422, 22.521657943725586, 23.684741973876953, 24.84782600402832, 26.010910034179688, 27.173994064331055, 28.337078094482422, 29.50016212463379, 30.663246154785156, 31.826330184936523, 32.98941421508789, 34.152496337890625, 35.315582275390625, 36.478668212890625, 37.64175033569336]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 5.0, 6.0, 17.0, 13.0, 37.0, 55.0, 75.0, 133.0, 202.0, 329.0, 507.0, 812.0, 1294.0, 2067.0, 3276.0, 5490.0, 8396.0, 13371.0, 21229.0, 32960.0, 50656.0, 76541.0, 113685.0, 162921.0, 226843.0, 298542.0, 369479.0, 425468.0, 448901.0, 436078.0, 384889.0, 316457.0, 243047.0, 178391.0, 124837.0, 85676.0, 56965.0, 37389.0, 24513.0, 15676.0, 9947.0, 6325.0, 3996.0, 2564.0, 1649.0, 987.0, 630.0, 356.0, 243.0, 137.0, 101.0, 58.0, 23.0, 25.0, 10.0, 6.0, 8.0, 1.0, 3.0, 0.0, 1.0], "bins": [-31.34375, -30.35302734375, -29.3623046875, -28.37158203125, -27.380859375, -26.39013671875, -25.3994140625, -24.40869140625, -23.41796875, -22.42724609375, -21.4365234375, -20.44580078125, -19.455078125, -18.46435546875, -17.4736328125, -16.48291015625, -15.4921875, -14.50146484375, -13.5107421875, -12.52001953125, -11.529296875, -10.53857421875, -9.5478515625, -8.55712890625, -7.56640625, -6.57568359375, -5.5849609375, -4.59423828125, -3.603515625, -2.61279296875, -1.6220703125, -0.63134765625, 0.359375, 1.35009765625, 2.3408203125, 3.33154296875, 4.322265625, 5.31298828125, 6.3037109375, 7.29443359375, 8.28515625, 9.27587890625, 10.2666015625, 11.25732421875, 12.248046875, 13.23876953125, 14.2294921875, 15.22021484375, 16.2109375, 17.20166015625, 18.1923828125, 19.18310546875, 20.173828125, 21.16455078125, 22.1552734375, 23.14599609375, 24.13671875, 25.12744140625, 26.1181640625, 27.10888671875, 28.099609375, 29.09033203125, 30.0810546875, 31.07177734375, 32.0625]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 2.0, 2.0, 7.0, 2.0, 9.0, 9.0, 6.0, 10.0, 8.0, 9.0, 15.0, 19.0, 19.0, 20.0, 23.0, 32.0, 36.0, 29.0, 32.0, 39.0, 30.0, 40.0, 42.0, 41.0, 39.0, 30.0, 32.0, 38.0, 34.0, 32.0, 27.0, 33.0, 28.0, 22.0, 31.0, 28.0, 17.0, 21.0, 21.0, 11.0, 15.0, 12.0, 14.0, 11.0, 11.0, 2.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0], "bins": [-32.5, -31.48193359375, -30.4638671875, -29.44580078125, -28.427734375, -27.40966796875, -26.3916015625, -25.37353515625, -24.35546875, -23.33740234375, -22.3193359375, -21.30126953125, -20.283203125, -19.26513671875, -18.2470703125, -17.22900390625, -16.2109375, -15.19287109375, -14.1748046875, -13.15673828125, -12.138671875, -11.12060546875, -10.1025390625, -9.08447265625, -8.06640625, -7.04833984375, -6.0302734375, -5.01220703125, -3.994140625, -2.97607421875, -1.9580078125, -0.93994140625, 0.078125, 1.09619140625, 2.1142578125, 3.13232421875, 4.150390625, 5.16845703125, 6.1865234375, 7.20458984375, 8.22265625, 9.24072265625, 10.2587890625, 11.27685546875, 12.294921875, 13.31298828125, 14.3310546875, 15.34912109375, 16.3671875, 17.38525390625, 18.4033203125, 19.42138671875, 20.439453125, 21.45751953125, 22.4755859375, 23.49365234375, 24.51171875, 25.52978515625, 26.5478515625, 27.56591796875, 28.583984375, 29.60205078125, 30.6201171875, 31.63818359375, 32.65625]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 8.0, 8.0, 10.0, 23.0, 39.0, 73.0, 86.0, 191.0, 312.0, 545.0, 859.0, 1445.0, 2277.0, 3847.0, 6370.0, 10222.0, 16285.0, 25825.0, 39505.0, 60588.0, 88646.0, 127240.0, 176005.0, 232235.0, 292202.0, 348356.0, 391085.0, 410486.0, 401422.0, 364220.0, 312480.0, 251832.0, 193253.0, 142282.0, 100479.0, 68427.0, 45319.0, 29919.0, 18988.0, 11947.0, 7372.0, 4506.0, 2780.0, 1665.0, 1050.0, 637.0, 371.0, 228.0, 132.0, 81.0, 53.0, 29.0, 20.0, 14.0, 11.0, 5.0, 2.0, 1.0], "bins": [-33.65625, -32.656494140625, -31.65673828125, -30.656982421875, -29.6572265625, -28.657470703125, -27.65771484375, -26.657958984375, -25.658203125, -24.658447265625, -23.65869140625, -22.658935546875, -21.6591796875, -20.659423828125, -19.65966796875, -18.659912109375, -17.66015625, -16.660400390625, -15.66064453125, -14.660888671875, -13.6611328125, -12.661376953125, -11.66162109375, -10.661865234375, -9.662109375, -8.662353515625, -7.66259765625, -6.662841796875, -5.6630859375, -4.663330078125, -3.66357421875, -2.663818359375, -1.6640625, -0.664306640625, 0.33544921875, 1.335205078125, 2.3349609375, 3.334716796875, 4.33447265625, 5.334228515625, 6.333984375, 7.333740234375, 8.33349609375, 9.333251953125, 10.3330078125, 11.332763671875, 12.33251953125, 13.332275390625, 14.33203125, 15.331787109375, 16.33154296875, 17.331298828125, 18.3310546875, 19.330810546875, 20.33056640625, 21.330322265625, 22.330078125, 23.329833984375, 24.32958984375, 25.329345703125, 26.3291015625, 27.328857421875, 28.32861328125, 29.328369140625, 30.328125]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 5.0, 9.0, 12.0, 10.0, 17.0, 17.0, 31.0, 30.0, 49.0, 52.0, 66.0, 86.0, 113.0, 122.0, 130.0, 139.0, 156.0, 179.0, 190.0, 202.0, 214.0, 199.0, 206.0, 216.0, 229.0, 169.0, 202.0, 165.0, 133.0, 111.0, 140.0, 98.0, 81.0, 74.0, 50.0, 32.0, 40.0, 27.0, 26.0, 13.0, 18.0, 9.0, 4.0, 3.0, 6.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.984375, -18.42626953125, -17.8681640625, -17.31005859375, -16.751953125, -16.19384765625, -15.6357421875, -15.07763671875, -14.51953125, -13.96142578125, -13.4033203125, -12.84521484375, -12.287109375, -11.72900390625, -11.1708984375, -10.61279296875, -10.0546875, -9.49658203125, -8.9384765625, -8.38037109375, -7.822265625, -7.26416015625, -6.7060546875, -6.14794921875, -5.58984375, -5.03173828125, -4.4736328125, -3.91552734375, -3.357421875, -2.79931640625, -2.2412109375, -1.68310546875, -1.125, -0.56689453125, -0.0087890625, 0.54931640625, 1.107421875, 1.66552734375, 2.2236328125, 2.78173828125, 3.33984375, 3.89794921875, 4.4560546875, 5.01416015625, 5.572265625, 6.13037109375, 6.6884765625, 7.24658203125, 7.8046875, 8.36279296875, 8.9208984375, 9.47900390625, 10.037109375, 10.59521484375, 11.1533203125, 11.71142578125, 12.26953125, 12.82763671875, 13.3857421875, 13.94384765625, 14.501953125, 15.06005859375, 15.6181640625, 16.17626953125, 16.734375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 7.0, 7.0, 4.0, 7.0, 11.0, 9.0, 17.0, 15.0, 32.0, 19.0, 32.0, 26.0, 25.0, 34.0, 32.0, 35.0, 50.0, 41.0, 42.0, 43.0, 42.0, 39.0, 49.0, 43.0, 30.0, 29.0, 26.0, 40.0, 31.0, 21.0, 16.0, 21.0, 32.0, 16.0, 13.0, 7.0, 11.0, 10.0, 6.0, 8.0, 3.0, 6.0, 3.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.564903259277344, -36.2888298034668, -35.012760162353516, -33.73668670654297, -32.46061325073242, -31.184541702270508, -29.908470153808594, -28.632396697998047, -27.3563232421875, -26.080251693725586, -24.80417823791504, -23.528106689453125, -22.252033233642578, -20.975961685180664, -19.69989013671875, -18.423816680908203, -17.14774513244629, -15.871672630310059, -14.595600128173828, -13.319528579711914, -12.043455123901367, -10.767383575439453, -9.491311073303223, -8.215238571166992, -6.939166069030762, -5.663093566894531, -4.387021064758301, -3.1109490394592285, -1.834876537322998, -0.5588040351867676, 0.7172679901123047, 1.9933404922485352, 3.2694129943847656, 4.545485496520996, 5.821557998657227, 7.097630023956299, 8.373703002929688, 9.649774551391602, 10.925847053527832, 12.201919555664062, 13.477992057800293, 14.754064559936523, 16.030136108398438, 17.306209564208984, 18.5822811126709, 19.858354568481445, 21.13442611694336, 22.410499572753906, 23.68657112121582, 24.962642669677734, 26.23871612548828, 27.514787673950195, 28.790861129760742, 30.066932678222656, 31.343006134033203, 32.61907958984375, 33.89514923095703, 35.17122268676758, 36.44729232788086, 37.723365783691406, 38.99943923950195, 40.2755126953125, 41.55158233642578, 42.82765579223633, 44.103729248046875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 0.0, 4.0, 5.0, 7.0, 11.0, 6.0, 15.0, 10.0, 11.0, 13.0, 19.0, 15.0, 20.0, 25.0, 12.0, 20.0, 18.0, 29.0, 31.0, 33.0, 34.0, 43.0, 44.0, 38.0, 34.0, 31.0, 37.0, 35.0, 52.0, 31.0, 34.0, 31.0, 27.0, 28.0, 15.0, 27.0, 22.0, 28.0, 16.0, 12.0, 15.0, 9.0, 10.0, 10.0, 11.0, 9.0, 4.0, 3.0, 5.0, 3.0, 7.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-36.58451843261719, -35.48551940917969, -34.38652038574219, -33.28752136230469, -32.18852233886719, -31.089523315429688, -29.99052619934082, -28.89152717590332, -27.79252815246582, -26.69352912902832, -25.59453010559082, -24.49553108215332, -23.396533966064453, -22.297534942626953, -21.198535919189453, -20.099536895751953, -19.000537872314453, -17.901538848876953, -16.802539825439453, -15.70354175567627, -14.60454273223877, -13.50554370880127, -12.406545639038086, -11.307546615600586, -10.208547592163086, -9.109548568725586, -8.010549545288086, -6.911551475524902, -5.812552452087402, -4.713553428649902, -3.6145548820495605, -2.5155563354492188, -1.4165611267089844, -0.3175623416900635, 0.7814364433288574, 1.8804352283477783, 2.979434013366699, 4.078433036804199, 5.177431583404541, 6.276430130004883, 7.375429153442383, 8.474428176879883, 9.573427200317383, 10.672425270080566, 11.771424293518066, 12.870423316955566, 13.96942138671875, 15.06842041015625, 16.16741943359375, 17.26641845703125, 18.36541748046875, 19.46441650390625, 20.56341552734375, 21.66241455078125, 22.761411666870117, 23.860410690307617, 24.959409713745117, 26.058408737182617, 27.157407760620117, 28.256406784057617, 29.355403900146484, 30.454402923583984, 31.553401947021484, 32.652400970458984, 33.751399993896484]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 4.0, 5.0, 6.0, 10.0, 14.0, 11.0, 37.0, 38.0, 52.0, 72.0, 120.0, 178.0, 263.0, 383.0, 571.0, 898.0, 1352.0, 2079.0, 3277.0, 4927.0, 7826.0, 12896.0, 20900.0, 33691.0, 54164.0, 82712.0, 117559.0, 145695.0, 152684.0, 131329.0, 97970.0, 65895.0, 41378.0, 26071.0, 15953.0, 9982.0, 6231.0, 3894.0, 2522.0, 1633.0, 1091.0, 718.0, 498.0, 298.0, 225.0, 154.0, 100.0, 62.0, 47.0, 27.0, 26.0, 10.0, 10.0, 8.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-28.953125, -28.02587890625, -27.0986328125, -26.17138671875, -25.244140625, -24.31689453125, -23.3896484375, -22.46240234375, -21.53515625, -20.60791015625, -19.6806640625, -18.75341796875, -17.826171875, -16.89892578125, -15.9716796875, -15.04443359375, -14.1171875, -13.18994140625, -12.2626953125, -11.33544921875, -10.408203125, -9.48095703125, -8.5537109375, -7.62646484375, -6.69921875, -5.77197265625, -4.8447265625, -3.91748046875, -2.990234375, -2.06298828125, -1.1357421875, -0.20849609375, 0.71875, 1.64599609375, 2.5732421875, 3.50048828125, 4.427734375, 5.35498046875, 6.2822265625, 7.20947265625, 8.13671875, 9.06396484375, 9.9912109375, 10.91845703125, 11.845703125, 12.77294921875, 13.7001953125, 14.62744140625, 15.5546875, 16.48193359375, 17.4091796875, 18.33642578125, 19.263671875, 20.19091796875, 21.1181640625, 22.04541015625, 22.97265625, 23.89990234375, 24.8271484375, 25.75439453125, 26.681640625, 27.60888671875, 28.5361328125, 29.46337890625, 30.390625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 0.0, 3.0, 6.0, 7.0, 11.0, 8.0, 13.0, 10.0, 11.0, 16.0, 16.0, 14.0, 22.0, 22.0, 17.0, 17.0, 23.0, 26.0, 30.0, 32.0, 32.0, 42.0, 48.0, 37.0, 31.0, 34.0, 37.0, 36.0, 47.0, 35.0, 28.0, 35.0, 31.0, 23.0, 20.0, 25.0, 25.0, 20.0, 20.0, 13.0, 14.0, 9.0, 11.0, 9.0, 11.0, 9.0, 7.0, 1.0, 4.0, 4.0, 7.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-36.09375, -35.00537109375, -33.9169921875, -32.82861328125, -31.740234375, -30.65185546875, -29.5634765625, -28.47509765625, -27.38671875, -26.29833984375, -25.2099609375, -24.12158203125, -23.033203125, -21.94482421875, -20.8564453125, -19.76806640625, -18.6796875, -17.59130859375, -16.5029296875, -15.41455078125, -14.326171875, -13.23779296875, -12.1494140625, -11.06103515625, -9.97265625, -8.88427734375, -7.7958984375, -6.70751953125, -5.619140625, -4.53076171875, -3.4423828125, -2.35400390625, -1.265625, -0.17724609375, 0.9111328125, 1.99951171875, 3.087890625, 4.17626953125, 5.2646484375, 6.35302734375, 7.44140625, 8.52978515625, 9.6181640625, 10.70654296875, 11.794921875, 12.88330078125, 13.9716796875, 15.06005859375, 16.1484375, 17.23681640625, 18.3251953125, 19.41357421875, 20.501953125, 21.59033203125, 22.6787109375, 23.76708984375, 24.85546875, 25.94384765625, 27.0322265625, 28.12060546875, 29.208984375, 30.29736328125, 31.3857421875, 32.47412109375, 33.5625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 6.0, 8.0, 19.0, 35.0, 42.0, 45.0, 67.0, 80.0, 130.0, 201.0, 246.0, 354.0, 514.0, 718.0, 1262.0, 1978.0, 3352.0, 5676.0, 10568.0, 21720.0, 50146.0, 125707.0, 287918.0, 298830.0, 135733.0, 53514.0, 23289.0, 11134.0, 5858.0, 3410.0, 2111.0, 1316.0, 813.0, 534.0, 346.0, 265.0, 187.0, 125.0, 97.0, 56.0, 34.0, 33.0, 21.0, 25.0, 17.0, 6.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-54.625, -52.9716796875, -51.318359375, -49.6650390625, -48.01171875, -46.3583984375, -44.705078125, -43.0517578125, -41.3984375, -39.7451171875, -38.091796875, -36.4384765625, -34.78515625, -33.1318359375, -31.478515625, -29.8251953125, -28.171875, -26.5185546875, -24.865234375, -23.2119140625, -21.55859375, -19.9052734375, -18.251953125, -16.5986328125, -14.9453125, -13.2919921875, -11.638671875, -9.9853515625, -8.33203125, -6.6787109375, -5.025390625, -3.3720703125, -1.71875, -0.0654296875, 1.587890625, 3.2412109375, 4.89453125, 6.5478515625, 8.201171875, 9.8544921875, 11.5078125, 13.1611328125, 14.814453125, 16.4677734375, 18.12109375, 19.7744140625, 21.427734375, 23.0810546875, 24.734375, 26.3876953125, 28.041015625, 29.6943359375, 31.34765625, 33.0009765625, 34.654296875, 36.3076171875, 37.9609375, 39.6142578125, 41.267578125, 42.9208984375, 44.57421875, 46.2275390625, 47.880859375, 49.5341796875, 51.1875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 2.0, 4.0, 5.0, 10.0, 11.0, 9.0, 5.0, 15.0, 14.0, 18.0, 25.0, 31.0, 26.0, 29.0, 34.0, 40.0, 53.0, 51.0, 35.0, 49.0, 50.0, 50.0, 37.0, 37.0, 50.0, 47.0, 41.0, 28.0, 36.0, 26.0, 17.0, 22.0, 30.0, 22.0, 7.0, 9.0, 5.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.984375, -27.11669921875, -26.2490234375, -25.38134765625, -24.513671875, -23.64599609375, -22.7783203125, -21.91064453125, -21.04296875, -20.17529296875, -19.3076171875, -18.43994140625, -17.572265625, -16.70458984375, -15.8369140625, -14.96923828125, -14.1015625, -13.23388671875, -12.3662109375, -11.49853515625, -10.630859375, -9.76318359375, -8.8955078125, -8.02783203125, -7.16015625, -6.29248046875, -5.4248046875, -4.55712890625, -3.689453125, -2.82177734375, -1.9541015625, -1.08642578125, -0.21875, 0.64892578125, 1.5166015625, 2.38427734375, 3.251953125, 4.11962890625, 4.9873046875, 5.85498046875, 6.72265625, 7.59033203125, 8.4580078125, 9.32568359375, 10.193359375, 11.06103515625, 11.9287109375, 12.79638671875, 13.6640625, 14.53173828125, 15.3994140625, 16.26708984375, 17.134765625, 18.00244140625, 18.8701171875, 19.73779296875, 20.60546875, 21.47314453125, 22.3408203125, 23.20849609375, 24.076171875, 24.94384765625, 25.8115234375, 26.67919921875, 27.546875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 18.0, 25.0, 20.0, 47.0, 48.0, 80.0, 115.0, 135.0, 223.0, 289.0, 421.0, 616.0, 839.0, 1325.0, 2017.0, 3224.0, 5633.0, 10298.0, 21305.0, 50115.0, 136898.0, 343794.0, 288429.0, 103948.0, 39425.0, 17426.0, 8723.0, 4708.0, 2828.0, 1818.0, 1139.0, 780.0, 546.0, 392.0, 273.0, 184.0, 122.0, 102.0, 63.0, 47.0, 35.0, 21.0, 21.0, 10.0, 9.0, 8.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-23.1875, -22.4599609375, -21.732421875, -21.0048828125, -20.27734375, -19.5498046875, -18.822265625, -18.0947265625, -17.3671875, -16.6396484375, -15.912109375, -15.1845703125, -14.45703125, -13.7294921875, -13.001953125, -12.2744140625, -11.546875, -10.8193359375, -10.091796875, -9.3642578125, -8.63671875, -7.9091796875, -7.181640625, -6.4541015625, -5.7265625, -4.9990234375, -4.271484375, -3.5439453125, -2.81640625, -2.0888671875, -1.361328125, -0.6337890625, 0.09375, 0.8212890625, 1.548828125, 2.2763671875, 3.00390625, 3.7314453125, 4.458984375, 5.1865234375, 5.9140625, 6.6416015625, 7.369140625, 8.0966796875, 8.82421875, 9.5517578125, 10.279296875, 11.0068359375, 11.734375, 12.4619140625, 13.189453125, 13.9169921875, 14.64453125, 15.3720703125, 16.099609375, 16.8271484375, 17.5546875, 18.2822265625, 19.009765625, 19.7373046875, 20.46484375, 21.1923828125, 21.919921875, 22.6474609375, 23.375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 2.0, 3.0, 3.0, 2.0, 8.0, 7.0, 7.0, 19.0, 17.0, 23.0, 16.0, 28.0, 34.0, 46.0, 56.0, 40.0, 68.0, 62.0, 52.0, 83.0, 52.0, 64.0, 57.0, 59.0, 50.0, 40.0, 28.0, 22.0, 19.0, 9.0, 7.0, 5.0, 7.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0013790130615234375, -0.0013393014669418335, -0.0012995898723602295, -0.0012598782777786255, -0.0012201666831970215, -0.0011804550886154175, -0.0011407434940338135, -0.0011010318994522095, -0.0010613203048706055, -0.0010216087102890015, -0.0009818971157073975, -0.0009421855211257935, -0.0009024739265441895, -0.0008627623319625854, -0.0008230507373809814, -0.0007833391427993774, -0.0007436275482177734, -0.0007039159536361694, -0.0006642043590545654, -0.0006244927644729614, -0.0005847811698913574, -0.0005450695753097534, -0.0005053579807281494, -0.0004656463861465454, -0.0004259347915649414, -0.0003862231969833374, -0.0003465116024017334, -0.0003068000078201294, -0.0002670884132385254, -0.0002273768186569214, -0.00018766522407531738, -0.00014795362949371338, -0.00010824203491210938, -6.853044033050537e-05, -2.8818845748901367e-05, 1.0892748832702637e-05, 5.060434341430664e-05, 9.031593799591064e-05, 0.00013002753257751465, 0.00016973912715911865, 0.00020945072174072266, 0.00024916231632232666, 0.00028887391090393066, 0.00032858550548553467, 0.00036829710006713867, 0.0004080086946487427, 0.0004477202892303467, 0.0004874318838119507, 0.0005271434783935547, 0.0005668550729751587, 0.0006065666675567627, 0.0006462782621383667, 0.0006859898567199707, 0.0007257014513015747, 0.0007654130458831787, 0.0008051246404647827, 0.0008448362350463867, 0.0008845478296279907, 0.0009242594242095947, 0.0009639710187911987, 0.0010036826133728027, 0.0010433942079544067, 0.0010831058025360107, 0.0011228173971176147, 0.0011625289916992188]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 5.0, 13.0, 12.0, 18.0, 20.0, 43.0, 44.0, 67.0, 101.0, 144.0, 204.0, 286.0, 408.0, 608.0, 801.0, 1292.0, 1971.0, 3139.0, 5839.0, 11233.0, 24455.0, 57736.0, 134866.0, 254459.0, 269870.0, 155542.0, 67870.0, 28141.0, 12921.0, 6472.0, 3427.0, 2152.0, 1303.0, 892.0, 687.0, 466.0, 313.0, 222.0, 143.0, 115.0, 99.0, 45.0, 36.0, 22.0, 18.0, 10.0, 8.0, 5.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-32.0, -30.9365234375, -29.873046875, -28.8095703125, -27.74609375, -26.6826171875, -25.619140625, -24.5556640625, -23.4921875, -22.4287109375, -21.365234375, -20.3017578125, -19.23828125, -18.1748046875, -17.111328125, -16.0478515625, -14.984375, -13.9208984375, -12.857421875, -11.7939453125, -10.73046875, -9.6669921875, -8.603515625, -7.5400390625, -6.4765625, -5.4130859375, -4.349609375, -3.2861328125, -2.22265625, -1.1591796875, -0.095703125, 0.9677734375, 2.03125, 3.0947265625, 4.158203125, 5.2216796875, 6.28515625, 7.3486328125, 8.412109375, 9.4755859375, 10.5390625, 11.6025390625, 12.666015625, 13.7294921875, 14.79296875, 15.8564453125, 16.919921875, 17.9833984375, 19.046875, 20.1103515625, 21.173828125, 22.2373046875, 23.30078125, 24.3642578125, 25.427734375, 26.4912109375, 27.5546875, 28.6181640625, 29.681640625, 30.7451171875, 31.80859375, 32.8720703125, 33.935546875, 34.9990234375, 36.0625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 3.0, 7.0, 5.0, 7.0, 17.0, 17.0, 24.0, 25.0, 35.0, 51.0, 72.0, 75.0, 103.0, 84.0, 84.0, 80.0, 62.0, 54.0, 37.0, 28.0, 27.0, 41.0, 13.0, 9.0, 7.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.234375, -11.850341796875, -11.46630859375, -11.082275390625, -10.6982421875, -10.314208984375, -9.93017578125, -9.546142578125, -9.162109375, -8.778076171875, -8.39404296875, -8.010009765625, -7.6259765625, -7.241943359375, -6.85791015625, -6.473876953125, -6.08984375, -5.705810546875, -5.32177734375, -4.937744140625, -4.5537109375, -4.169677734375, -3.78564453125, -3.401611328125, -3.017578125, -2.633544921875, -2.24951171875, -1.865478515625, -1.4814453125, -1.097412109375, -0.71337890625, -0.329345703125, 0.0546875, 0.438720703125, 0.82275390625, 1.206787109375, 1.5908203125, 1.974853515625, 2.35888671875, 2.742919921875, 3.126953125, 3.510986328125, 3.89501953125, 4.279052734375, 4.6630859375, 5.047119140625, 5.43115234375, 5.815185546875, 6.19921875, 6.583251953125, 6.96728515625, 7.351318359375, 7.7353515625, 8.119384765625, 8.50341796875, 8.887451171875, 9.271484375, 9.655517578125, 10.03955078125, 10.423583984375, 10.8076171875, 11.191650390625, 11.57568359375, 11.959716796875, 12.34375]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 4.0, 5.0, 6.0, 12.0, 12.0, 13.0, 16.0, 27.0, 25.0, 27.0, 31.0, 32.0, 28.0, 37.0, 48.0, 48.0, 52.0, 49.0, 45.0, 56.0, 49.0, 35.0, 35.0, 41.0, 38.0, 25.0, 32.0, 29.0, 16.0, 22.0, 18.0, 21.0, 10.0, 11.0, 10.0, 6.0, 8.0, 6.0, 5.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.994632720947266, -40.575931549072266, -39.157230377197266, -37.738529205322266, -36.319828033447266, -34.901126861572266, -33.48242950439453, -32.06372833251953, -30.6450252532959, -29.2263240814209, -27.8076229095459, -26.38892364501953, -24.97022247314453, -23.55152130126953, -22.13282012939453, -20.71411895751953, -19.29541778564453, -17.87671661376953, -16.45801544189453, -15.039315223693848, -13.620614051818848, -12.201912879943848, -10.783212661743164, -9.364511489868164, -7.945810317993164, -6.527109146118164, -5.108408451080322, -3.6897077560424805, -2.2710065841674805, -0.8523054122924805, 0.5663948059082031, 1.9850959777832031, 3.4037933349609375, 4.8224945068359375, 6.241195201873779, 7.659895896911621, 9.078597068786621, 10.497298240661621, 11.915998458862305, 13.334699630737305, 14.753400802612305, 16.172101974487305, 17.590803146362305, 19.009502410888672, 20.428203582763672, 21.846904754638672, 23.265605926513672, 24.684307098388672, 26.103008270263672, 27.521709442138672, 28.940410614013672, 30.359111785888672, 31.777812957763672, 33.19651412963867, 34.615211486816406, 36.033912658691406, 37.452613830566406, 38.871315002441406, 40.290016174316406, 41.708717346191406, 43.127418518066406, 44.546119689941406, 45.964820861816406, 47.383522033691406, 48.802223205566406]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 2.0, 3.0, 11.0, 9.0, 9.0, 5.0, 9.0, 16.0, 26.0, 12.0, 15.0, 20.0, 21.0, 36.0, 22.0, 30.0, 22.0, 31.0, 33.0, 51.0, 49.0, 34.0, 41.0, 37.0, 42.0, 33.0, 45.0, 32.0, 31.0, 26.0, 33.0, 33.0, 32.0, 27.0, 21.0, 23.0, 9.0, 11.0, 6.0, 12.0, 11.0, 9.0, 8.0, 5.0, 5.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-39.43608093261719, -38.23658752441406, -37.03709030151367, -35.83759689331055, -34.638099670410156, -33.43860626220703, -32.239112854003906, -31.03961753845215, -29.84012222290039, -28.640626907348633, -27.441131591796875, -26.24163818359375, -25.042142868041992, -23.842647552490234, -22.64315414428711, -21.44365882873535, -20.244163513183594, -19.044668197631836, -17.845172882080078, -16.645679473876953, -15.446184158325195, -14.246688842773438, -13.047194480895996, -11.847700119018555, -10.648204803466797, -9.448709487915039, -8.249215126037598, -7.049720287322998, -5.850225448608398, -4.650730609893799, -3.451235771179199, -2.251741409301758, -1.0522499084472656, 0.14724493026733398, 1.3467397689819336, 2.546234607696533, 3.745729446411133, 4.945224285125732, 6.144719123840332, 7.344213485717773, 8.543708801269531, 9.743204116821289, 10.94269847869873, 12.142192840576172, 13.34168815612793, 14.541183471679688, 15.740677833557129, 16.94017219543457, 18.139667510986328, 19.339162826538086, 20.538658142089844, 21.73815155029297, 22.937646865844727, 24.137142181396484, 25.33663558959961, 26.536130905151367, 27.735626220703125, 28.935121536254883, 30.13461685180664, 31.334110260009766, 32.533607482910156, 33.73310089111328, 34.932594299316406, 36.13208770751953, 37.33158493041992]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 8.0, 8.0, 23.0, 22.0, 37.0, 72.0, 128.0, 198.0, 300.0, 455.0, 681.0, 1151.0, 1831.0, 2808.0, 4236.0, 6130.0, 9438.0, 13674.0, 19339.0, 26317.0, 35959.0, 46128.0, 58024.0, 69048.0, 78596.0, 86588.0, 89645.0, 87911.0, 82623.0, 73186.0, 62676.0, 50953.0, 40077.0, 30015.0, 22172.0, 15829.0, 10719.0, 7354.0, 4877.0, 3344.0, 2185.0, 1463.0, 872.0, 501.0, 344.0, 218.0, 137.0, 97.0, 63.0, 46.0, 22.0, 20.0, 9.0, 7.0, 2.0, 0.0, 1.0, 1.0], "bins": [-32.96875, -31.960693359375, -30.95263671875, -29.944580078125, -28.9365234375, -27.928466796875, -26.92041015625, -25.912353515625, -24.904296875, -23.896240234375, -22.88818359375, -21.880126953125, -20.8720703125, -19.864013671875, -18.85595703125, -17.847900390625, -16.83984375, -15.831787109375, -14.82373046875, -13.815673828125, -12.8076171875, -11.799560546875, -10.79150390625, -9.783447265625, -8.775390625, -7.767333984375, -6.75927734375, -5.751220703125, -4.7431640625, -3.735107421875, -2.72705078125, -1.718994140625, -0.7109375, 0.297119140625, 1.30517578125, 2.313232421875, 3.3212890625, 4.329345703125, 5.33740234375, 6.345458984375, 7.353515625, 8.361572265625, 9.36962890625, 10.377685546875, 11.3857421875, 12.393798828125, 13.40185546875, 14.409912109375, 15.41796875, 16.426025390625, 17.43408203125, 18.442138671875, 19.4501953125, 20.458251953125, 21.46630859375, 22.474365234375, 23.482421875, 24.490478515625, 25.49853515625, 26.506591796875, 27.5146484375, 28.522705078125, 29.53076171875, 30.538818359375, 31.546875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 1.0, 13.0, 9.0, 7.0, 7.0, 10.0, 14.0, 22.0, 16.0, 13.0, 18.0, 17.0, 34.0, 25.0, 31.0, 20.0, 26.0, 40.0, 42.0, 49.0, 41.0, 37.0, 38.0, 40.0, 31.0, 39.0, 41.0, 34.0, 33.0, 23.0, 30.0, 37.0, 24.0, 20.0, 32.0, 11.0, 9.0, 8.0, 12.0, 10.0, 10.0, 9.0, 6.0, 3.0, 9.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.90625, -36.76416015625, -35.6220703125, -34.47998046875, -33.337890625, -32.19580078125, -31.0537109375, -29.91162109375, -28.76953125, -27.62744140625, -26.4853515625, -25.34326171875, -24.201171875, -23.05908203125, -21.9169921875, -20.77490234375, -19.6328125, -18.49072265625, -17.3486328125, -16.20654296875, -15.064453125, -13.92236328125, -12.7802734375, -11.63818359375, -10.49609375, -9.35400390625, -8.2119140625, -7.06982421875, -5.927734375, -4.78564453125, -3.6435546875, -2.50146484375, -1.359375, -0.21728515625, 0.9248046875, 2.06689453125, 3.208984375, 4.35107421875, 5.4931640625, 6.63525390625, 7.77734375, 8.91943359375, 10.0615234375, 11.20361328125, 12.345703125, 13.48779296875, 14.6298828125, 15.77197265625, 16.9140625, 18.05615234375, 19.1982421875, 20.34033203125, 21.482421875, 22.62451171875, 23.7666015625, 24.90869140625, 26.05078125, 27.19287109375, 28.3349609375, 29.47705078125, 30.619140625, 31.76123046875, 32.9033203125, 34.04541015625, 35.1875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [7.0, 2.0, 3.0, 2.0, 6.0, 2.0, 10.0, 19.0, 27.0, 44.0, 60.0, 96.0, 134.0, 236.0, 373.0, 676.0, 1183.0, 2051.0, 3538.0, 6009.0, 10170.0, 16749.0, 26641.0, 40676.0, 58557.0, 79607.0, 100097.0, 115287.0, 120723.0, 115562.0, 101052.0, 79947.0, 59288.0, 41153.0, 26737.0, 16874.0, 10425.0, 6028.0, 3531.0, 2045.0, 1214.0, 749.0, 372.0, 247.0, 136.0, 91.0, 56.0, 24.0, 24.0, 13.0, 9.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.96875, -38.56689453125, -37.1650390625, -35.76318359375, -34.361328125, -32.95947265625, -31.5576171875, -30.15576171875, -28.75390625, -27.35205078125, -25.9501953125, -24.54833984375, -23.146484375, -21.74462890625, -20.3427734375, -18.94091796875, -17.5390625, -16.13720703125, -14.7353515625, -13.33349609375, -11.931640625, -10.52978515625, -9.1279296875, -7.72607421875, -6.32421875, -4.92236328125, -3.5205078125, -2.11865234375, -0.716796875, 0.68505859375, 2.0869140625, 3.48876953125, 4.890625, 6.29248046875, 7.6943359375, 9.09619140625, 10.498046875, 11.89990234375, 13.3017578125, 14.70361328125, 16.10546875, 17.50732421875, 18.9091796875, 20.31103515625, 21.712890625, 23.11474609375, 24.5166015625, 25.91845703125, 27.3203125, 28.72216796875, 30.1240234375, 31.52587890625, 32.927734375, 34.32958984375, 35.7314453125, 37.13330078125, 38.53515625, 39.93701171875, 41.3388671875, 42.74072265625, 44.142578125, 45.54443359375, 46.9462890625, 48.34814453125, 49.75]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 10.0, 9.0, 15.0, 8.0, 10.0, 19.0, 17.0, 11.0, 19.0, 19.0, 26.0, 17.0, 18.0, 32.0, 32.0, 56.0, 49.0, 31.0, 39.0, 39.0, 38.0, 37.0, 46.0, 31.0, 45.0, 41.0, 27.0, 34.0, 23.0, 25.0, 28.0, 25.0, 15.0, 16.0, 22.0, 14.0, 13.0, 11.0, 7.0, 6.0, 3.0, 8.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.734375, -20.9638671875, -20.193359375, -19.4228515625, -18.65234375, -17.8818359375, -17.111328125, -16.3408203125, -15.5703125, -14.7998046875, -14.029296875, -13.2587890625, -12.48828125, -11.7177734375, -10.947265625, -10.1767578125, -9.40625, -8.6357421875, -7.865234375, -7.0947265625, -6.32421875, -5.5537109375, -4.783203125, -4.0126953125, -3.2421875, -2.4716796875, -1.701171875, -0.9306640625, -0.16015625, 0.6103515625, 1.380859375, 2.1513671875, 2.921875, 3.6923828125, 4.462890625, 5.2333984375, 6.00390625, 6.7744140625, 7.544921875, 8.3154296875, 9.0859375, 9.8564453125, 10.626953125, 11.3974609375, 12.16796875, 12.9384765625, 13.708984375, 14.4794921875, 15.25, 16.0205078125, 16.791015625, 17.5615234375, 18.33203125, 19.1025390625, 19.873046875, 20.6435546875, 21.4140625, 22.1845703125, 22.955078125, 23.7255859375, 24.49609375, 25.2666015625, 26.037109375, 26.8076171875, 27.578125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 8.0, 16.0, 28.0, 35.0, 57.0, 70.0, 115.0, 164.0, 243.0, 413.0, 642.0, 949.0, 1582.0, 2785.0, 4953.0, 8880.0, 16062.0, 29102.0, 51084.0, 84363.0, 124056.0, 157686.0, 165659.0, 143268.0, 103140.0, 65568.0, 38750.0, 21444.0, 11804.0, 6538.0, 3684.0, 2082.0, 1209.0, 761.0, 485.0, 279.0, 185.0, 148.0, 92.0, 58.0, 36.0, 26.0, 12.0, 11.0, 7.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.609375, -19.94970703125, -19.2900390625, -18.63037109375, -17.970703125, -17.31103515625, -16.6513671875, -15.99169921875, -15.33203125, -14.67236328125, -14.0126953125, -13.35302734375, -12.693359375, -12.03369140625, -11.3740234375, -10.71435546875, -10.0546875, -9.39501953125, -8.7353515625, -8.07568359375, -7.416015625, -6.75634765625, -6.0966796875, -5.43701171875, -4.77734375, -4.11767578125, -3.4580078125, -2.79833984375, -2.138671875, -1.47900390625, -0.8193359375, -0.15966796875, 0.5, 1.15966796875, 1.8193359375, 2.47900390625, 3.138671875, 3.79833984375, 4.4580078125, 5.11767578125, 5.77734375, 6.43701171875, 7.0966796875, 7.75634765625, 8.416015625, 9.07568359375, 9.7353515625, 10.39501953125, 11.0546875, 11.71435546875, 12.3740234375, 13.03369140625, 13.693359375, 14.35302734375, 15.0126953125, 15.67236328125, 16.33203125, 16.99169921875, 17.6513671875, 18.31103515625, 18.970703125, 19.63037109375, 20.2900390625, 20.94970703125, 21.609375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 1.0, 1.0, 7.0, 10.0, 13.0, 23.0, 17.0, 21.0, 31.0, 41.0, 55.0, 53.0, 83.0, 68.0, 79.0, 58.0, 63.0, 66.0, 52.0, 45.0, 49.0, 39.0, 38.0, 20.0, 18.0, 12.0, 17.0, 2.0, 10.0, 2.0, 8.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.00323486328125, -0.003147721290588379, -0.003060579299926758, -0.0029734373092651367, -0.0028862953186035156, -0.0027991533279418945, -0.0027120113372802734, -0.0026248693466186523, -0.0025377273559570312, -0.00245058536529541, -0.002363443374633789, -0.002276301383972168, -0.002189159393310547, -0.0021020174026489258, -0.0020148754119873047, -0.0019277334213256836, -0.0018405914306640625, -0.0017534494400024414, -0.0016663074493408203, -0.0015791654586791992, -0.0014920234680175781, -0.001404881477355957, -0.001317739486694336, -0.0012305974960327148, -0.0011434555053710938, -0.0010563135147094727, -0.0009691715240478516, -0.0008820295333862305, -0.0007948875427246094, -0.0007077455520629883, -0.0006206035614013672, -0.0005334615707397461, -0.000446319580078125, -0.0003591775894165039, -0.0002720355987548828, -0.00018489360809326172, -9.775161743164062e-05, -1.0609626770019531e-05, 7.653236389160156e-05, 0.00016367435455322266, 0.00025081634521484375, 0.00033795833587646484, 0.00042510032653808594, 0.000512242317199707, 0.0005993843078613281, 0.0006865262985229492, 0.0007736682891845703, 0.0008608102798461914, 0.0009479522705078125, 0.0010350942611694336, 0.0011222362518310547, 0.0012093782424926758, 0.0012965202331542969, 0.001383662223815918, 0.001470804214477539, 0.0015579462051391602, 0.0016450881958007812, 0.0017322301864624023, 0.0018193721771240234, 0.0019065141677856445, 0.0019936561584472656, 0.0020807981491088867, 0.002167940139770508, 0.002255082130432129, 0.00234222412109375]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 6.0, 16.0, 21.0, 30.0, 38.0, 53.0, 98.0, 115.0, 199.0, 309.0, 498.0, 733.0, 1248.0, 2012.0, 3873.0, 7375.0, 14645.0, 29584.0, 57642.0, 103140.0, 158337.0, 192940.0, 179961.0, 131539.0, 78648.0, 41577.0, 21074.0, 10378.0, 5312.0, 2914.0, 1676.0, 873.0, 569.0, 418.0, 218.0, 154.0, 110.0, 62.0, 42.0, 39.0, 22.0, 17.0, 15.0, 6.0, 3.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-27.828125, -27.003662109375, -26.17919921875, -25.354736328125, -24.5302734375, -23.705810546875, -22.88134765625, -22.056884765625, -21.232421875, -20.407958984375, -19.58349609375, -18.759033203125, -17.9345703125, -17.110107421875, -16.28564453125, -15.461181640625, -14.63671875, -13.812255859375, -12.98779296875, -12.163330078125, -11.3388671875, -10.514404296875, -9.68994140625, -8.865478515625, -8.041015625, -7.216552734375, -6.39208984375, -5.567626953125, -4.7431640625, -3.918701171875, -3.09423828125, -2.269775390625, -1.4453125, -0.620849609375, 0.20361328125, 1.028076171875, 1.8525390625, 2.677001953125, 3.50146484375, 4.325927734375, 5.150390625, 5.974853515625, 6.79931640625, 7.623779296875, 8.4482421875, 9.272705078125, 10.09716796875, 10.921630859375, 11.74609375, 12.570556640625, 13.39501953125, 14.219482421875, 15.0439453125, 15.868408203125, 16.69287109375, 17.517333984375, 18.341796875, 19.166259765625, 19.99072265625, 20.815185546875, 21.6396484375, 22.464111328125, 23.28857421875, 24.113037109375, 24.9375]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 5.0, 1.0, 5.0, 4.0, 16.0, 13.0, 19.0, 34.0, 41.0, 50.0, 63.0, 83.0, 99.0, 84.0, 97.0, 90.0, 75.0, 54.0, 58.0, 28.0, 27.0, 18.0, 7.0, 11.0, 7.0, 8.0, 4.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0, -12.580810546875, -12.16162109375, -11.742431640625, -11.3232421875, -10.904052734375, -10.48486328125, -10.065673828125, -9.646484375, -9.227294921875, -8.80810546875, -8.388916015625, -7.9697265625, -7.550537109375, -7.13134765625, -6.712158203125, -6.29296875, -5.873779296875, -5.45458984375, -5.035400390625, -4.6162109375, -4.197021484375, -3.77783203125, -3.358642578125, -2.939453125, -2.520263671875, -2.10107421875, -1.681884765625, -1.2626953125, -0.843505859375, -0.42431640625, -0.005126953125, 0.4140625, 0.833251953125, 1.25244140625, 1.671630859375, 2.0908203125, 2.510009765625, 2.92919921875, 3.348388671875, 3.767578125, 4.186767578125, 4.60595703125, 5.025146484375, 5.4443359375, 5.863525390625, 6.28271484375, 6.701904296875, 7.12109375, 7.540283203125, 7.95947265625, 8.378662109375, 8.7978515625, 9.217041015625, 9.63623046875, 10.055419921875, 10.474609375, 10.893798828125, 11.31298828125, 11.732177734375, 12.1513671875, 12.570556640625, 12.98974609375, 13.408935546875, 13.828125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 7.0, 7.0, 8.0, 6.0, 7.0, 4.0, 13.0, 10.0, 25.0, 24.0, 23.0, 27.0, 34.0, 34.0, 34.0, 37.0, 52.0, 56.0, 48.0, 52.0, 46.0, 48.0, 42.0, 32.0, 49.0, 39.0, 42.0, 38.0, 25.0, 22.0, 19.0, 19.0, 24.0, 10.0, 8.0, 8.0, 9.0, 5.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.97378158569336, -39.521446228027344, -38.069114685058594, -36.61677932739258, -35.16444778442383, -33.71211242675781, -32.25978088378906, -30.807445526123047, -29.355112075805664, -27.90277862548828, -26.4504451751709, -24.998111724853516, -23.5457763671875, -22.09344482421875, -20.641109466552734, -19.18877601623535, -17.73644256591797, -16.284109115600586, -14.831775665283203, -13.379441261291504, -11.927107810974121, -10.474774360656738, -9.022439956665039, -7.570106506347656, -6.117773056030273, -4.665439605712891, -3.2131056785583496, -1.7607717514038086, -0.3084383010864258, 1.143895149230957, 2.5962295532226562, 4.048563003540039, 5.500896453857422, 6.953229904174805, 8.405563354492188, 9.857897758483887, 11.31023120880127, 12.762564659118652, 14.214899063110352, 15.667232513427734, 17.119565963745117, 18.5718994140625, 20.024232864379883, 21.476566314697266, 22.92890167236328, 24.38123321533203, 25.833568572998047, 27.28590202331543, 28.738235473632812, 30.190568923950195, 31.642902374267578, 33.095237731933594, 34.547569274902344, 35.99990463256836, 37.452239990234375, 38.904571533203125, 40.356903076171875, 41.80923843383789, 43.26156997680664, 44.713905334472656, 46.166236877441406, 47.61857223510742, 49.07090759277344, 50.52323913574219, 51.9755744934082]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 4.0, 9.0, 6.0, 9.0, 15.0, 14.0, 18.0, 15.0, 15.0, 15.0, 22.0, 27.0, 22.0, 36.0, 35.0, 33.0, 34.0, 41.0, 33.0, 36.0, 40.0, 43.0, 42.0, 32.0, 38.0, 34.0, 33.0, 38.0, 39.0, 35.0, 20.0, 25.0, 23.0, 20.0, 18.0, 16.0, 10.0, 11.0, 10.0, 7.0, 5.0, 9.0, 5.0, 1.0, 2.0, 5.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-39.057952880859375, -37.83039474487305, -36.60283279418945, -35.375274658203125, -34.14771270751953, -32.9201545715332, -31.692594528198242, -30.46503448486328, -29.23747444152832, -28.00991439819336, -26.7823543548584, -25.554794311523438, -24.32723617553711, -23.099674224853516, -21.872116088867188, -20.644556045532227, -19.416996002197266, -18.189435958862305, -16.961875915527344, -15.7343168258667, -14.506756782531738, -13.279196739196777, -12.051637649536133, -10.824077606201172, -9.596517562866211, -8.36895751953125, -7.141397953033447, -5.9138383865356445, -4.686278343200684, -3.4587182998657227, -2.23115873336792, -1.0035991668701172, 0.22396087646484375, 1.4515206813812256, 2.6790804862976074, 3.9066402912139893, 5.134200096130371, 6.361760139465332, 7.589319705963135, 8.816879272460938, 10.044439315795898, 11.27199935913086, 12.49955940246582, 13.727118492126465, 14.954678535461426, 16.182239532470703, 17.40979766845703, 18.637357711791992, 19.864917755126953, 21.092477798461914, 22.320037841796875, 23.547597885131836, 24.775157928466797, 26.002716064453125, 27.230276107788086, 28.457836151123047, 29.685396194458008, 30.91295623779297, 32.1405143737793, 33.36807632446289, 34.59563446044922, 35.82319641113281, 37.05075454711914, 38.27831268310547, 39.50587463378906]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 2.0, 9.0, 19.0, 18.0, 34.0, 62.0, 122.0, 193.0, 339.0, 556.0, 941.0, 1801.0, 3158.0, 5418.0, 9725.0, 16928.0, 28719.0, 48506.0, 80247.0, 127349.0, 195392.0, 283286.0, 380189.0, 467473.0, 518892.0, 507689.0, 444876.0, 353702.0, 256352.0, 175230.0, 113199.0, 70483.0, 42925.0, 25472.0, 14880.0, 8526.0, 5016.0, 2804.0, 1634.0, 923.0, 498.0, 276.0, 166.0, 89.0, 65.0, 45.0, 28.0, 12.0, 14.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-39.03125, -37.84375, -36.65625, -35.46875, -34.28125, -33.09375, -31.90625, -30.71875, -29.53125, -28.34375, -27.15625, -25.96875, -24.78125, -23.59375, -22.40625, -21.21875, -20.03125, -18.84375, -17.65625, -16.46875, -15.28125, -14.09375, -12.90625, -11.71875, -10.53125, -9.34375, -8.15625, -6.96875, -5.78125, -4.59375, -3.40625, -2.21875, -1.03125, 0.15625, 1.34375, 2.53125, 3.71875, 4.90625, 6.09375, 7.28125, 8.46875, 9.65625, 10.84375, 12.03125, 13.21875, 14.40625, 15.59375, 16.78125, 17.96875, 19.15625, 20.34375, 21.53125, 22.71875, 23.90625, 25.09375, 26.28125, 27.46875, 28.65625, 29.84375, 31.03125, 32.21875, 33.40625, 34.59375, 35.78125, 36.96875]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 7.0, 11.0, 7.0, 10.0, 20.0, 16.0, 12.0, 17.0, 18.0, 16.0, 19.0, 29.0, 19.0, 35.0, 40.0, 39.0, 35.0, 41.0, 40.0, 31.0, 35.0, 34.0, 42.0, 27.0, 42.0, 37.0, 31.0, 35.0, 43.0, 34.0, 28.0, 15.0, 19.0, 18.0, 12.0, 21.0, 14.0, 5.0, 10.0, 6.0, 9.0, 7.0, 3.0, 2.0, 5.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-33.6875, -32.60498046875, -31.5224609375, -30.43994140625, -29.357421875, -28.27490234375, -27.1923828125, -26.10986328125, -25.02734375, -23.94482421875, -22.8623046875, -21.77978515625, -20.697265625, -19.61474609375, -18.5322265625, -17.44970703125, -16.3671875, -15.28466796875, -14.2021484375, -13.11962890625, -12.037109375, -10.95458984375, -9.8720703125, -8.78955078125, -7.70703125, -6.62451171875, -5.5419921875, -4.45947265625, -3.376953125, -2.29443359375, -1.2119140625, -0.12939453125, 0.953125, 2.03564453125, 3.1181640625, 4.20068359375, 5.283203125, 6.36572265625, 7.4482421875, 8.53076171875, 9.61328125, 10.69580078125, 11.7783203125, 12.86083984375, 13.943359375, 15.02587890625, 16.1083984375, 17.19091796875, 18.2734375, 19.35595703125, 20.4384765625, 21.52099609375, 22.603515625, 23.68603515625, 24.7685546875, 25.85107421875, 26.93359375, 28.01611328125, 29.0986328125, 30.18115234375, 31.263671875, 32.34619140625, 33.4287109375, 34.51123046875, 35.59375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 4.0, 8.0, 10.0, 10.0, 22.0, 41.0, 62.0, 112.0, 156.0, 311.0, 504.0, 876.0, 1491.0, 2345.0, 3836.0, 6353.0, 10422.0, 16556.0, 25944.0, 39726.0, 59642.0, 86987.0, 123505.0, 169561.0, 222461.0, 278887.0, 333652.0, 375090.0, 396261.0, 391614.0, 364570.0, 318290.0, 263049.0, 206309.0, 155252.0, 112335.0, 78619.0, 53195.0, 35521.0, 22776.0, 14653.0, 9119.0, 5614.0, 3483.0, 2060.0, 1224.0, 726.0, 420.0, 241.0, 155.0, 93.0, 59.0, 42.0, 18.0, 12.0, 4.0, 3.0, 1.0, 3.0, 2.0], "bins": [-32.90625, -31.90478515625, -30.9033203125, -29.90185546875, -28.900390625, -27.89892578125, -26.8974609375, -25.89599609375, -24.89453125, -23.89306640625, -22.8916015625, -21.89013671875, -20.888671875, -19.88720703125, -18.8857421875, -17.88427734375, -16.8828125, -15.88134765625, -14.8798828125, -13.87841796875, -12.876953125, -11.87548828125, -10.8740234375, -9.87255859375, -8.87109375, -7.86962890625, -6.8681640625, -5.86669921875, -4.865234375, -3.86376953125, -2.8623046875, -1.86083984375, -0.859375, 0.14208984375, 1.1435546875, 2.14501953125, 3.146484375, 4.14794921875, 5.1494140625, 6.15087890625, 7.15234375, 8.15380859375, 9.1552734375, 10.15673828125, 11.158203125, 12.15966796875, 13.1611328125, 14.16259765625, 15.1640625, 16.16552734375, 17.1669921875, 18.16845703125, 19.169921875, 20.17138671875, 21.1728515625, 22.17431640625, 23.17578125, 24.17724609375, 25.1787109375, 26.18017578125, 27.181640625, 28.18310546875, 29.1845703125, 30.18603515625, 31.1875]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 13.0, 13.0, 14.0, 18.0, 24.0, 38.0, 38.0, 52.0, 85.0, 97.0, 102.0, 103.0, 126.0, 168.0, 156.0, 195.0, 204.0, 235.0, 225.0, 243.0, 221.0, 215.0, 224.0, 192.0, 176.0, 174.0, 133.0, 115.0, 93.0, 79.0, 79.0, 58.0, 39.0, 40.0, 30.0, 13.0, 9.0, 11.0, 6.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.234375, -16.626953125, -16.01953125, -15.412109375, -14.8046875, -14.197265625, -13.58984375, -12.982421875, -12.375, -11.767578125, -11.16015625, -10.552734375, -9.9453125, -9.337890625, -8.73046875, -8.123046875, -7.515625, -6.908203125, -6.30078125, -5.693359375, -5.0859375, -4.478515625, -3.87109375, -3.263671875, -2.65625, -2.048828125, -1.44140625, -0.833984375, -0.2265625, 0.380859375, 0.98828125, 1.595703125, 2.203125, 2.810546875, 3.41796875, 4.025390625, 4.6328125, 5.240234375, 5.84765625, 6.455078125, 7.0625, 7.669921875, 8.27734375, 8.884765625, 9.4921875, 10.099609375, 10.70703125, 11.314453125, 11.921875, 12.529296875, 13.13671875, 13.744140625, 14.3515625, 14.958984375, 15.56640625, 16.173828125, 16.78125, 17.388671875, 17.99609375, 18.603515625, 19.2109375, 19.818359375, 20.42578125, 21.033203125, 21.640625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 13.0, 5.0, 4.0, 8.0, 9.0, 11.0, 12.0, 22.0, 12.0, 10.0, 23.0, 21.0, 41.0, 32.0, 24.0, 38.0, 33.0, 34.0, 40.0, 31.0, 32.0, 31.0, 32.0, 36.0, 43.0, 37.0, 42.0, 24.0, 39.0, 26.0, 35.0, 26.0, 24.0, 26.0, 19.0, 12.0, 13.0, 12.0, 14.0, 11.0, 11.0, 2.0, 6.0, 2.0, 5.0, 8.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.383460998535156, -36.183631896972656, -34.98379898071289, -33.78396987915039, -32.584136962890625, -31.384307861328125, -30.184476852416992, -28.98464584350586, -27.78481674194336, -26.584985733032227, -25.385154724121094, -24.185325622558594, -22.98549461364746, -21.785663604736328, -20.585832595825195, -19.386001586914062, -18.18617057800293, -16.986339569091797, -15.78650951385498, -14.586678504943848, -13.386848449707031, -12.187017440795898, -10.987186431884766, -9.78735637664795, -8.587525367736816, -7.387694835662842, -6.187864303588867, -4.988033294677734, -3.7882027626037598, -2.588372230529785, -1.3885412216186523, -0.18871116638183594, 1.0111198425292969, 2.2109503746032715, 3.410781145095825, 4.610611915588379, 5.8104424476623535, 7.010272979736328, 8.210103988647461, 9.409934043884277, 10.60976505279541, 11.809596061706543, 13.00942611694336, 14.209257125854492, 15.409088134765625, 16.608917236328125, 17.80875015258789, 19.00857925415039, 20.208410263061523, 21.408241271972656, 22.60807228088379, 23.807903289794922, 25.007732391357422, 26.207563400268555, 27.407394409179688, 28.607223510742188, 29.807056427001953, 31.006887435913086, 32.20671844482422, 33.40654754638672, 34.606380462646484, 35.806209564208984, 37.00604248046875, 38.20587158203125, 39.40570068359375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 7.0, 4.0, 8.0, 8.0, 2.0, 5.0, 16.0, 10.0, 12.0, 22.0, 14.0, 17.0, 26.0, 40.0, 40.0, 33.0, 27.0, 28.0, 34.0, 44.0, 40.0, 31.0, 36.0, 55.0, 50.0, 42.0, 29.0, 38.0, 35.0, 21.0, 32.0, 25.0, 27.0, 12.0, 17.0, 20.0, 19.0, 13.0, 8.0, 9.0, 14.0, 15.0, 5.0, 2.0, 5.0, 7.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.1006965637207, -37.86515808105469, -36.629615783691406, -35.39407730102539, -34.158538818359375, -32.922996520996094, -31.687458038330078, -30.45191764831543, -29.21637725830078, -27.980836868286133, -26.745298385620117, -25.50975799560547, -24.27421760559082, -23.038677215576172, -21.803138732910156, -20.567598342895508, -19.332059860229492, -18.096519470214844, -16.860980987548828, -15.62544059753418, -14.389900207519531, -13.1543607711792, -11.918821334838867, -10.683280944824219, -9.447741508483887, -8.212202072143555, -6.976661682128906, -5.741122245788574, -4.505582332611084, -3.2700424194335938, -2.0345029830932617, -0.7989625930786133, 0.43657684326171875, 1.6721166372299194, 2.90765643119812, 4.143196105957031, 5.3787360191345215, 6.614275932312012, 7.849815368652344, 9.085355758666992, 10.320895195007324, 11.556434631347656, 12.791975021362305, 14.027514457702637, 15.263053894042969, 16.498594284057617, 17.734134674072266, 18.96967315673828, 20.20521354675293, 21.440753936767578, 22.676292419433594, 23.911832809448242, 25.14737319946289, 26.382911682128906, 27.618452072143555, 28.853992462158203, 30.08953094482422, 31.325071334838867, 32.560611724853516, 33.79615020751953, 35.03168869018555, 36.26723098754883, 37.502769470214844, 38.738311767578125, 39.97385025024414]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 1.0, 2.0, 6.0, 6.0, 11.0, 19.0, 18.0, 39.0, 50.0, 72.0, 110.0, 167.0, 225.0, 332.0, 489.0, 772.0, 1152.0, 1820.0, 2870.0, 4596.0, 7467.0, 12882.0, 22496.0, 40150.0, 71903.0, 121610.0, 176368.0, 194909.0, 156625.0, 98450.0, 56350.0, 31452.0, 17900.0, 10388.0, 6135.0, 3883.0, 2393.0, 1569.0, 986.0, 646.0, 394.0, 248.0, 181.0, 138.0, 83.0, 65.0, 49.0, 30.0, 19.0, 15.0, 8.0, 6.0, 7.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.1875, -31.125, -30.0625, -29.0, -27.9375, -26.875, -25.8125, -24.75, -23.6875, -22.625, -21.5625, -20.5, -19.4375, -18.375, -17.3125, -16.25, -15.1875, -14.125, -13.0625, -12.0, -10.9375, -9.875, -8.8125, -7.75, -6.6875, -5.625, -4.5625, -3.5, -2.4375, -1.375, -0.3125, 0.75, 1.8125, 2.875, 3.9375, 5.0, 6.0625, 7.125, 8.1875, 9.25, 10.3125, 11.375, 12.4375, 13.5, 14.5625, 15.625, 16.6875, 17.75, 18.8125, 19.875, 20.9375, 22.0, 23.0625, 24.125, 25.1875, 26.25, 27.3125, 28.375, 29.4375, 30.5, 31.5625, 32.625, 33.6875, 34.75, 35.8125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 8.0, 4.0, 5.0, 8.0, 7.0, 1.0, 12.0, 12.0, 13.0, 10.0, 21.0, 18.0, 14.0, 33.0, 35.0, 40.0, 36.0, 25.0, 23.0, 40.0, 44.0, 39.0, 31.0, 41.0, 52.0, 47.0, 38.0, 32.0, 36.0, 34.0, 27.0, 25.0, 29.0, 22.0, 12.0, 19.0, 18.0, 19.0, 14.0, 6.0, 9.0, 16.0, 16.0, 3.0, 3.0, 4.0, 7.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.28125, -37.0654296875, -35.849609375, -34.6337890625, -33.41796875, -32.2021484375, -30.986328125, -29.7705078125, -28.5546875, -27.3388671875, -26.123046875, -24.9072265625, -23.69140625, -22.4755859375, -21.259765625, -20.0439453125, -18.828125, -17.6123046875, -16.396484375, -15.1806640625, -13.96484375, -12.7490234375, -11.533203125, -10.3173828125, -9.1015625, -7.8857421875, -6.669921875, -5.4541015625, -4.23828125, -3.0224609375, -1.806640625, -0.5908203125, 0.625, 1.8408203125, 3.056640625, 4.2724609375, 5.48828125, 6.7041015625, 7.919921875, 9.1357421875, 10.3515625, 11.5673828125, 12.783203125, 13.9990234375, 15.21484375, 16.4306640625, 17.646484375, 18.8623046875, 20.078125, 21.2939453125, 22.509765625, 23.7255859375, 24.94140625, 26.1572265625, 27.373046875, 28.5888671875, 29.8046875, 31.0205078125, 32.236328125, 33.4521484375, 34.66796875, 35.8837890625, 37.099609375, 38.3154296875, 39.53125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 8.0, 4.0, 11.0, 10.0, 10.0, 21.0, 29.0, 38.0, 39.0, 72.0, 84.0, 100.0, 161.0, 248.0, 294.0, 518.0, 724.0, 1142.0, 1824.0, 2832.0, 4752.0, 8511.0, 16492.0, 35588.0, 87754.0, 220392.0, 329816.0, 194454.0, 75884.0, 31725.0, 15040.0, 7742.0, 4481.0, 2662.0, 1632.0, 1113.0, 723.0, 474.0, 337.0, 232.0, 156.0, 104.0, 83.0, 58.0, 34.0, 36.0, 27.0, 18.0, 27.0, 16.0, 8.0, 7.0, 4.0, 2.0, 2.0, 8.0], "bins": [-51.65625, -50.15576171875, -48.6552734375, -47.15478515625, -45.654296875, -44.15380859375, -42.6533203125, -41.15283203125, -39.65234375, -38.15185546875, -36.6513671875, -35.15087890625, -33.650390625, -32.14990234375, -30.6494140625, -29.14892578125, -27.6484375, -26.14794921875, -24.6474609375, -23.14697265625, -21.646484375, -20.14599609375, -18.6455078125, -17.14501953125, -15.64453125, -14.14404296875, -12.6435546875, -11.14306640625, -9.642578125, -8.14208984375, -6.6416015625, -5.14111328125, -3.640625, -2.14013671875, -0.6396484375, 0.86083984375, 2.361328125, 3.86181640625, 5.3623046875, 6.86279296875, 8.36328125, 9.86376953125, 11.3642578125, 12.86474609375, 14.365234375, 15.86572265625, 17.3662109375, 18.86669921875, 20.3671875, 21.86767578125, 23.3681640625, 24.86865234375, 26.369140625, 27.86962890625, 29.3701171875, 30.87060546875, 32.37109375, 33.87158203125, 35.3720703125, 36.87255859375, 38.373046875, 39.87353515625, 41.3740234375, 42.87451171875, 44.375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 7.0, 6.0, 2.0, 2.0, 11.0, 11.0, 11.0, 11.0, 4.0, 14.0, 19.0, 20.0, 22.0, 25.0, 32.0, 29.0, 27.0, 31.0, 29.0, 38.0, 37.0, 44.0, 52.0, 36.0, 48.0, 42.0, 37.0, 28.0, 36.0, 37.0, 27.0, 25.0, 27.0, 28.0, 12.0, 31.0, 12.0, 21.0, 7.0, 10.0, 8.0, 10.0, 13.0, 6.0, 6.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-25.171875, -24.415771484375, -23.65966796875, -22.903564453125, -22.1474609375, -21.391357421875, -20.63525390625, -19.879150390625, -19.123046875, -18.366943359375, -17.61083984375, -16.854736328125, -16.0986328125, -15.342529296875, -14.58642578125, -13.830322265625, -13.07421875, -12.318115234375, -11.56201171875, -10.805908203125, -10.0498046875, -9.293701171875, -8.53759765625, -7.781494140625, -7.025390625, -6.269287109375, -5.51318359375, -4.757080078125, -4.0009765625, -3.244873046875, -2.48876953125, -1.732666015625, -0.9765625, -0.220458984375, 0.53564453125, 1.291748046875, 2.0478515625, 2.803955078125, 3.56005859375, 4.316162109375, 5.072265625, 5.828369140625, 6.58447265625, 7.340576171875, 8.0966796875, 8.852783203125, 9.60888671875, 10.364990234375, 11.12109375, 11.877197265625, 12.63330078125, 13.389404296875, 14.1455078125, 14.901611328125, 15.65771484375, 16.413818359375, 17.169921875, 17.926025390625, 18.68212890625, 19.438232421875, 20.1943359375, 20.950439453125, 21.70654296875, 22.462646484375, 23.21875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [8.0, 6.0, 4.0, 10.0, 11.0, 11.0, 20.0, 39.0, 30.0, 43.0, 61.0, 82.0, 123.0, 151.0, 216.0, 300.0, 478.0, 619.0, 959.0, 1360.0, 2141.0, 3372.0, 5441.0, 9002.0, 15937.0, 29730.0, 59151.0, 127237.0, 253622.0, 263712.0, 136204.0, 63745.0, 31547.0, 16873.0, 9895.0, 5690.0, 3533.0, 2303.0, 1471.0, 985.0, 679.0, 496.0, 372.0, 277.0, 171.0, 129.0, 83.0, 72.0, 45.0, 26.0, 27.0, 18.0, 15.0, 13.0, 7.0, 5.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0], "bins": [-15.203125, -14.6796875, -14.15625, -13.6328125, -13.109375, -12.5859375, -12.0625, -11.5390625, -11.015625, -10.4921875, -9.96875, -9.4453125, -8.921875, -8.3984375, -7.875, -7.3515625, -6.828125, -6.3046875, -5.78125, -5.2578125, -4.734375, -4.2109375, -3.6875, -3.1640625, -2.640625, -2.1171875, -1.59375, -1.0703125, -0.546875, -0.0234375, 0.5, 1.0234375, 1.546875, 2.0703125, 2.59375, 3.1171875, 3.640625, 4.1640625, 4.6875, 5.2109375, 5.734375, 6.2578125, 6.78125, 7.3046875, 7.828125, 8.3515625, 8.875, 9.3984375, 9.921875, 10.4453125, 10.96875, 11.4921875, 12.015625, 12.5390625, 13.0625, 13.5859375, 14.109375, 14.6328125, 15.15625, 15.6796875, 16.203125, 16.7265625, 17.25, 17.7734375, 18.296875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 2.0, 4.0, 4.0, 4.0, 11.0, 14.0, 27.0, 31.0, 40.0, 58.0, 67.0, 88.0, 114.0, 108.0, 103.0, 89.0, 74.0, 47.0, 36.0, 33.0, 17.0, 12.0, 7.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013828277587890625, -0.0013264119625091553, -0.001269996166229248, -0.0012135803699493408, -0.0011571645736694336, -0.0011007487773895264, -0.0010443329811096191, -0.000987917184829712, -0.0009315013885498047, -0.0008750855922698975, -0.0008186697959899902, -0.000762253999710083, -0.0007058382034301758, -0.0006494224071502686, -0.0005930066108703613, -0.0005365908145904541, -0.0004801750183105469, -0.00042375922203063965, -0.0003673434257507324, -0.0003109276294708252, -0.00025451183319091797, -0.00019809603691101074, -0.00014168024063110352, -8.526444435119629e-05, -2.8848648071289062e-05, 2.7567148208618164e-05, 8.398294448852539e-05, 0.00014039874076843262, 0.00019681453704833984, 0.00025323033332824707, 0.0003096461296081543, 0.0003660619258880615, 0.00042247772216796875, 0.000478893518447876, 0.0005353093147277832, 0.0005917251110076904, 0.0006481409072875977, 0.0007045567035675049, 0.0007609724998474121, 0.0008173882961273193, 0.0008738040924072266, 0.0009302198886871338, 0.000986635684967041, 0.0010430514812469482, 0.0010994672775268555, 0.0011558830738067627, 0.00121229887008667, 0.0012687146663665771, 0.0013251304626464844, 0.0013815462589263916, 0.0014379620552062988, 0.001494377851486206, 0.0015507936477661133, 0.0016072094440460205, 0.0016636252403259277, 0.001720041036605835, 0.0017764568328857422, 0.0018328726291656494, 0.0018892884254455566, 0.0019457042217254639, 0.002002120018005371, 0.0020585358142852783, 0.0021149516105651855, 0.0021713674068450928, 0.002227783203125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 9.0, 15.0, 25.0, 26.0, 67.0, 89.0, 138.0, 191.0, 358.0, 570.0, 983.0, 1603.0, 2725.0, 4591.0, 7739.0, 13222.0, 22691.0, 39622.0, 67813.0, 111759.0, 165796.0, 190712.0, 160039.0, 106015.0, 63404.0, 36812.0, 21233.0, 12311.0, 7274.0, 4351.0, 2506.0, 1520.0, 938.0, 524.0, 348.0, 209.0, 130.0, 87.0, 32.0, 31.0, 19.0, 12.0, 5.0, 3.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.609375, -20.963134765625, -20.31689453125, -19.670654296875, -19.0244140625, -18.378173828125, -17.73193359375, -17.085693359375, -16.439453125, -15.793212890625, -15.14697265625, -14.500732421875, -13.8544921875, -13.208251953125, -12.56201171875, -11.915771484375, -11.26953125, -10.623291015625, -9.97705078125, -9.330810546875, -8.6845703125, -8.038330078125, -7.39208984375, -6.745849609375, -6.099609375, -5.453369140625, -4.80712890625, -4.160888671875, -3.5146484375, -2.868408203125, -2.22216796875, -1.575927734375, -0.9296875, -0.283447265625, 0.36279296875, 1.009033203125, 1.6552734375, 2.301513671875, 2.94775390625, 3.593994140625, 4.240234375, 4.886474609375, 5.53271484375, 6.178955078125, 6.8251953125, 7.471435546875, 8.11767578125, 8.763916015625, 9.41015625, 10.056396484375, 10.70263671875, 11.348876953125, 11.9951171875, 12.641357421875, 13.28759765625, 13.933837890625, 14.580078125, 15.226318359375, 15.87255859375, 16.518798828125, 17.1650390625, 17.811279296875, 18.45751953125, 19.103759765625, 19.75]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 5.0, 7.0, 7.0, 8.0, 14.0, 14.0, 14.0, 18.0, 17.0, 32.0, 43.0, 33.0, 48.0, 51.0, 47.0, 50.0, 45.0, 58.0, 51.0, 52.0, 42.0, 43.0, 46.0, 41.0, 34.0, 32.0, 24.0, 21.0, 20.0, 20.0, 12.0, 16.0, 7.0, 12.0, 6.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.3515625, -8.13232421875, -7.9130859375, -7.69384765625, -7.474609375, -7.25537109375, -7.0361328125, -6.81689453125, -6.59765625, -6.37841796875, -6.1591796875, -5.93994140625, -5.720703125, -5.50146484375, -5.2822265625, -5.06298828125, -4.84375, -4.62451171875, -4.4052734375, -4.18603515625, -3.966796875, -3.74755859375, -3.5283203125, -3.30908203125, -3.08984375, -2.87060546875, -2.6513671875, -2.43212890625, -2.212890625, -1.99365234375, -1.7744140625, -1.55517578125, -1.3359375, -1.11669921875, -0.8974609375, -0.67822265625, -0.458984375, -0.23974609375, -0.0205078125, 0.19873046875, 0.41796875, 0.63720703125, 0.8564453125, 1.07568359375, 1.294921875, 1.51416015625, 1.7333984375, 1.95263671875, 2.171875, 2.39111328125, 2.6103515625, 2.82958984375, 3.048828125, 3.26806640625, 3.4873046875, 3.70654296875, 3.92578125, 4.14501953125, 4.3642578125, 4.58349609375, 4.802734375, 5.02197265625, 5.2412109375, 5.46044921875, 5.6796875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 3.0, 4.0, 4.0, 5.0, 11.0, 13.0, 7.0, 23.0, 14.0, 17.0, 18.0, 17.0, 25.0, 30.0, 30.0, 34.0, 28.0, 31.0, 31.0, 33.0, 41.0, 27.0, 31.0, 40.0, 40.0, 37.0, 35.0, 41.0, 29.0, 27.0, 32.0, 23.0, 24.0, 36.0, 27.0, 16.0, 21.0, 15.0, 12.0, 13.0, 7.0, 10.0, 6.0, 4.0, 3.0, 6.0, 6.0, 0.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-37.576820373535156, -36.40310287475586, -35.22938919067383, -34.05567169189453, -32.8819580078125, -31.708240509033203, -30.53452491760254, -29.360809326171875, -28.187091827392578, -27.013376235961914, -25.83966064453125, -24.665943145751953, -23.49222755432129, -22.318511962890625, -21.14479637145996, -19.971080780029297, -18.797365188598633, -17.62364959716797, -16.449934005737305, -15.276217460632324, -14.102500915527344, -12.92878532409668, -11.755069732666016, -10.581353187561035, -9.407637596130371, -8.233922004699707, -7.060205459594727, -5.8864898681640625, -4.71277379989624, -3.539057731628418, -2.365342140197754, -1.1916255950927734, -0.017910003662109375, 1.1558059453964233, 2.329521894454956, 3.503237724304199, 4.6769537925720215, 5.850669860839844, 7.024385452270508, 8.198101997375488, 9.371817588806152, 10.545533180236816, 11.719249725341797, 12.892965316772461, 14.066680908203125, 15.240397453308105, 16.414112091064453, 17.58782958984375, 18.761545181274414, 19.935260772705078, 21.108976364135742, 22.282691955566406, 23.456409454345703, 24.630125045776367, 25.80384063720703, 26.977558135986328, 28.15127182006836, 29.324987411499023, 30.498703002929688, 31.672420501708984, 32.846134185791016, 34.01985168457031, 35.193565368652344, 36.36728286743164, 37.54100036621094]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 6.0, 2.0, 8.0, 6.0, 7.0, 11.0, 5.0, 12.0, 18.0, 17.0, 23.0, 16.0, 12.0, 42.0, 40.0, 42.0, 24.0, 31.0, 39.0, 40.0, 36.0, 38.0, 41.0, 56.0, 37.0, 42.0, 38.0, 35.0, 32.0, 33.0, 24.0, 28.0, 20.0, 17.0, 10.0, 22.0, 19.0, 14.0, 14.0, 10.0, 10.0, 11.0, 2.0, 5.0, 6.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.58220672607422, -38.32613754272461, -37.070068359375, -35.81399917602539, -34.55792999267578, -33.30186462402344, -32.04579544067383, -30.78972625732422, -29.53365707397461, -28.277587890625, -27.02151870727539, -25.765451431274414, -24.509382247924805, -23.253313064575195, -21.99724578857422, -20.74117660522461, -19.485107421875, -18.22903823852539, -16.97296905517578, -15.716901779174805, -14.460832595825195, -13.204763412475586, -11.948695182800293, -10.692626953125, -9.43655776977539, -8.180488586425781, -6.924420356750488, -5.668351650238037, -4.412282943725586, -3.1562142372131348, -1.9001455307006836, -0.6440773010253906, 0.6119918823242188, 1.86806058883667, 3.124129295349121, 4.380198001861572, 5.636266708374023, 6.892335414886475, 8.148404121398926, 9.404472351074219, 10.660541534423828, 11.916610717773438, 13.17267894744873, 14.428747177124023, 15.684816360473633, 16.940885543823242, 18.19695281982422, 19.453022003173828, 20.709091186523438, 21.965160369873047, 23.221229553222656, 24.477296829223633, 25.733366012573242, 26.98943519592285, 28.245502471923828, 29.501571655273438, 30.757640838623047, 32.013710021972656, 33.269779205322266, 34.525848388671875, 35.78191375732422, 37.03798294067383, 38.29405212402344, 39.55012130737305, 40.806190490722656]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 12.0, 25.0, 23.0, 54.0, 74.0, 118.0, 255.0, 447.0, 677.0, 1235.0, 1961.0, 3466.0, 5717.0, 9136.0, 14521.0, 22266.0, 32992.0, 46269.0, 62977.0, 79645.0, 94432.0, 105083.0, 107657.0, 103594.0, 91952.0, 75914.0, 58846.0, 43523.0, 30714.0, 20691.0, 13273.0, 8265.0, 5192.0, 3144.0, 1861.0, 1080.0, 619.0, 339.0, 230.0, 108.0, 52.0, 49.0, 29.0, 11.0, 19.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-37.375, -36.1455078125, -34.916015625, -33.6865234375, -32.45703125, -31.2275390625, -29.998046875, -28.7685546875, -27.5390625, -26.3095703125, -25.080078125, -23.8505859375, -22.62109375, -21.3916015625, -20.162109375, -18.9326171875, -17.703125, -16.4736328125, -15.244140625, -14.0146484375, -12.78515625, -11.5556640625, -10.326171875, -9.0966796875, -7.8671875, -6.6376953125, -5.408203125, -4.1787109375, -2.94921875, -1.7197265625, -0.490234375, 0.7392578125, 1.96875, 3.1982421875, 4.427734375, 5.6572265625, 6.88671875, 8.1162109375, 9.345703125, 10.5751953125, 11.8046875, 13.0341796875, 14.263671875, 15.4931640625, 16.72265625, 17.9521484375, 19.181640625, 20.4111328125, 21.640625, 22.8701171875, 24.099609375, 25.3291015625, 26.55859375, 27.7880859375, 29.017578125, 30.2470703125, 31.4765625, 32.7060546875, 33.935546875, 35.1650390625, 36.39453125, 37.6240234375, 38.853515625, 40.0830078125, 41.3125]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 3.0, 6.0, 5.0, 8.0, 5.0, 12.0, 4.0, 16.0, 13.0, 17.0, 25.0, 15.0, 18.0, 34.0, 43.0, 44.0, 21.0, 31.0, 38.0, 42.0, 35.0, 33.0, 52.0, 44.0, 40.0, 42.0, 37.0, 38.0, 34.0, 33.0, 21.0, 27.0, 20.0, 20.0, 12.0, 17.0, 18.0, 20.0, 10.0, 14.0, 9.0, 10.0, 3.0, 4.0, 8.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.03125, -36.826171875, -35.62109375, -34.416015625, -33.2109375, -32.005859375, -30.80078125, -29.595703125, -28.390625, -27.185546875, -25.98046875, -24.775390625, -23.5703125, -22.365234375, -21.16015625, -19.955078125, -18.75, -17.544921875, -16.33984375, -15.134765625, -13.9296875, -12.724609375, -11.51953125, -10.314453125, -9.109375, -7.904296875, -6.69921875, -5.494140625, -4.2890625, -3.083984375, -1.87890625, -0.673828125, 0.53125, 1.736328125, 2.94140625, 4.146484375, 5.3515625, 6.556640625, 7.76171875, 8.966796875, 10.171875, 11.376953125, 12.58203125, 13.787109375, 14.9921875, 16.197265625, 17.40234375, 18.607421875, 19.8125, 21.017578125, 22.22265625, 23.427734375, 24.6328125, 25.837890625, 27.04296875, 28.248046875, 29.453125, 30.658203125, 31.86328125, 33.068359375, 34.2734375, 35.478515625, 36.68359375, 37.888671875, 39.09375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 17.0, 12.0, 24.0, 49.0, 71.0, 123.0, 176.0, 292.0, 512.0, 812.0, 1326.0, 2156.0, 3530.0, 5528.0, 8546.0, 12987.0, 19655.0, 28790.0, 39918.0, 54301.0, 69155.0, 84006.0, 95723.0, 102106.0, 101788.0, 95164.0, 82296.0, 67591.0, 52753.0, 38629.0, 27204.0, 18841.0, 12779.0, 8046.0, 5187.0, 3263.0, 2007.0, 1250.0, 734.0, 457.0, 304.0, 160.0, 113.0, 65.0, 35.0, 32.0, 15.0, 7.0, 9.0, 3.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-36.5625, -35.380859375, -34.19921875, -33.017578125, -31.8359375, -30.654296875, -29.47265625, -28.291015625, -27.109375, -25.927734375, -24.74609375, -23.564453125, -22.3828125, -21.201171875, -20.01953125, -18.837890625, -17.65625, -16.474609375, -15.29296875, -14.111328125, -12.9296875, -11.748046875, -10.56640625, -9.384765625, -8.203125, -7.021484375, -5.83984375, -4.658203125, -3.4765625, -2.294921875, -1.11328125, 0.068359375, 1.25, 2.431640625, 3.61328125, 4.794921875, 5.9765625, 7.158203125, 8.33984375, 9.521484375, 10.703125, 11.884765625, 13.06640625, 14.248046875, 15.4296875, 16.611328125, 17.79296875, 18.974609375, 20.15625, 21.337890625, 22.51953125, 23.701171875, 24.8828125, 26.064453125, 27.24609375, 28.427734375, 29.609375, 30.791015625, 31.97265625, 33.154296875, 34.3359375, 35.517578125, 36.69921875, 37.880859375, 39.0625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 2.0, 6.0, 8.0, 5.0, 13.0, 13.0, 9.0, 14.0, 17.0, 20.0, 22.0, 29.0, 29.0, 24.0, 16.0, 50.0, 30.0, 43.0, 44.0, 27.0, 40.0, 54.0, 30.0, 46.0, 36.0, 28.0, 35.0, 33.0, 27.0, 32.0, 31.0, 23.0, 14.0, 22.0, 11.0, 14.0, 21.0, 11.0, 10.0, 15.0, 10.0, 7.0, 12.0, 5.0, 3.0, 4.0, 0.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-25.828125, -25.0478515625, -24.267578125, -23.4873046875, -22.70703125, -21.9267578125, -21.146484375, -20.3662109375, -19.5859375, -18.8056640625, -18.025390625, -17.2451171875, -16.46484375, -15.6845703125, -14.904296875, -14.1240234375, -13.34375, -12.5634765625, -11.783203125, -11.0029296875, -10.22265625, -9.4423828125, -8.662109375, -7.8818359375, -7.1015625, -6.3212890625, -5.541015625, -4.7607421875, -3.98046875, -3.2001953125, -2.419921875, -1.6396484375, -0.859375, -0.0791015625, 0.701171875, 1.4814453125, 2.26171875, 3.0419921875, 3.822265625, 4.6025390625, 5.3828125, 6.1630859375, 6.943359375, 7.7236328125, 8.50390625, 9.2841796875, 10.064453125, 10.8447265625, 11.625, 12.4052734375, 13.185546875, 13.9658203125, 14.74609375, 15.5263671875, 16.306640625, 17.0869140625, 17.8671875, 18.6474609375, 19.427734375, 20.2080078125, 20.98828125, 21.7685546875, 22.548828125, 23.3291015625, 24.109375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 5.0, 5.0, 14.0, 16.0, 27.0, 25.0, 51.0, 102.0, 166.0, 257.0, 364.0, 574.0, 1023.0, 1699.0, 2750.0, 4529.0, 7422.0, 12063.0, 19741.0, 30773.0, 45974.0, 66784.0, 89556.0, 109957.0, 123321.0, 124509.0, 111935.0, 91917.0, 68964.0, 48473.0, 31870.0, 20659.0, 13015.0, 7811.0, 4820.0, 2902.0, 1742.0, 1009.0, 689.0, 403.0, 235.0, 136.0, 91.0, 61.0, 37.0, 30.0, 16.0, 13.0, 12.0, 7.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-16.25, -15.7728271484375, -15.295654296875, -14.8184814453125, -14.34130859375, -13.8641357421875, -13.386962890625, -12.9097900390625, -12.4326171875, -11.9554443359375, -11.478271484375, -11.0010986328125, -10.52392578125, -10.0467529296875, -9.569580078125, -9.0924072265625, -8.615234375, -8.1380615234375, -7.660888671875, -7.1837158203125, -6.70654296875, -6.2293701171875, -5.752197265625, -5.2750244140625, -4.7978515625, -4.3206787109375, -3.843505859375, -3.3663330078125, -2.88916015625, -2.4119873046875, -1.934814453125, -1.4576416015625, -0.98046875, -0.5032958984375, -0.026123046875, 0.4510498046875, 0.92822265625, 1.4053955078125, 1.882568359375, 2.3597412109375, 2.8369140625, 3.3140869140625, 3.791259765625, 4.2684326171875, 4.74560546875, 5.2227783203125, 5.699951171875, 6.1771240234375, 6.654296875, 7.1314697265625, 7.608642578125, 8.0858154296875, 8.56298828125, 9.0401611328125, 9.517333984375, 9.9945068359375, 10.4716796875, 10.9488525390625, 11.426025390625, 11.9031982421875, 12.38037109375, 12.8575439453125, 13.334716796875, 13.8118896484375, 14.2890625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 3.0, 10.0, 15.0, 10.0, 13.0, 15.0, 24.0, 27.0, 29.0, 44.0, 48.0, 43.0, 36.0, 45.0, 60.0, 53.0, 64.0, 57.0, 49.0, 52.0, 59.0, 42.0, 38.0, 27.0, 30.0, 20.0, 21.0, 9.0, 6.0, 7.0, 12.0, 6.0, 6.0, 5.0, 4.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0023746490478515625, -0.0023070871829986572, -0.002239525318145752, -0.0021719634532928467, -0.0021044015884399414, -0.002036839723587036, -0.001969277858734131, -0.0019017159938812256, -0.0018341541290283203, -0.001766592264175415, -0.0016990303993225098, -0.0016314685344696045, -0.0015639066696166992, -0.001496344804763794, -0.0014287829399108887, -0.0013612210750579834, -0.0012936592102050781, -0.0012260973453521729, -0.0011585354804992676, -0.0010909736156463623, -0.001023411750793457, -0.0009558498859405518, -0.0008882880210876465, -0.0008207261562347412, -0.0007531642913818359, -0.0006856024265289307, -0.0006180405616760254, -0.0005504786968231201, -0.00048291683197021484, -0.00041535496711730957, -0.0003477931022644043, -0.000280231237411499, -0.00021266937255859375, -0.00014510750770568848, -7.75456428527832e-05, -9.98377799987793e-06, 5.7578086853027344e-05, 0.00012513995170593262, 0.0001927018165588379, 0.00026026368141174316, 0.00032782554626464844, 0.0003953874111175537, 0.000462949275970459, 0.0005305111408233643, 0.0005980730056762695, 0.0006656348705291748, 0.0007331967353820801, 0.0008007586002349854, 0.0008683204650878906, 0.0009358823299407959, 0.0010034441947937012, 0.0010710060596466064, 0.0011385679244995117, 0.001206129789352417, 0.0012736916542053223, 0.0013412535190582275, 0.0014088153839111328, 0.001476377248764038, 0.0015439391136169434, 0.0016115009784698486, 0.001679062843322754, 0.0017466247081756592, 0.0018141865730285645, 0.0018817484378814697, 0.001949310302734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 18.0, 33.0, 36.0, 59.0, 89.0, 162.0, 206.0, 325.0, 513.0, 834.0, 1369.0, 2130.0, 3468.0, 5568.0, 9130.0, 14654.0, 22978.0, 35019.0, 51959.0, 72703.0, 94470.0, 113351.0, 122253.0, 119306.0, 106006.0, 85036.0, 63196.0, 44213.0, 29338.0, 19089.0, 11660.0, 7305.0, 4517.0, 2794.0, 1743.0, 1145.0, 673.0, 441.0, 271.0, 167.0, 119.0, 77.0, 46.0, 23.0, 24.0, 15.0, 9.0, 5.0, 4.0, 4.0, 0.0, 1.0], "bins": [-17.34375, -16.8450927734375, -16.346435546875, -15.8477783203125, -15.34912109375, -14.8504638671875, -14.351806640625, -13.8531494140625, -13.3544921875, -12.8558349609375, -12.357177734375, -11.8585205078125, -11.35986328125, -10.8612060546875, -10.362548828125, -9.8638916015625, -9.365234375, -8.8665771484375, -8.367919921875, -7.8692626953125, -7.37060546875, -6.8719482421875, -6.373291015625, -5.8746337890625, -5.3759765625, -4.8773193359375, -4.378662109375, -3.8800048828125, -3.38134765625, -2.8826904296875, -2.384033203125, -1.8853759765625, -1.38671875, -0.8880615234375, -0.389404296875, 0.1092529296875, 0.60791015625, 1.1065673828125, 1.605224609375, 2.1038818359375, 2.6025390625, 3.1011962890625, 3.599853515625, 4.0985107421875, 4.59716796875, 5.0958251953125, 5.594482421875, 6.0931396484375, 6.591796875, 7.0904541015625, 7.589111328125, 8.0877685546875, 8.58642578125, 9.0850830078125, 9.583740234375, 10.0823974609375, 10.5810546875, 11.0797119140625, 11.578369140625, 12.0770263671875, 12.57568359375, 13.0743408203125, 13.572998046875, 14.0716552734375, 14.5703125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 4.0, 5.0, 5.0, 11.0, 7.0, 8.0, 15.0, 12.0, 27.0, 29.0, 21.0, 26.0, 33.0, 30.0, 39.0, 41.0, 37.0, 51.0, 40.0, 38.0, 58.0, 45.0, 49.0, 53.0, 45.0, 39.0, 33.0, 36.0, 21.0, 21.0, 28.0, 14.0, 14.0, 9.0, 14.0, 7.0, 5.0, 9.0, 5.0, 6.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-6.37109375, -6.18170166015625, -5.9923095703125, -5.80291748046875, -5.613525390625, -5.42413330078125, -5.2347412109375, -5.04534912109375, -4.85595703125, -4.66656494140625, -4.4771728515625, -4.28778076171875, -4.098388671875, -3.90899658203125, -3.7196044921875, -3.53021240234375, -3.3408203125, -3.15142822265625, -2.9620361328125, -2.77264404296875, -2.583251953125, -2.39385986328125, -2.2044677734375, -2.01507568359375, -1.82568359375, -1.63629150390625, -1.4468994140625, -1.25750732421875, -1.068115234375, -0.87872314453125, -0.6893310546875, -0.49993896484375, -0.310546875, -0.12115478515625, 0.0682373046875, 0.25762939453125, 0.447021484375, 0.63641357421875, 0.8258056640625, 1.01519775390625, 1.20458984375, 1.39398193359375, 1.5833740234375, 1.77276611328125, 1.962158203125, 2.15155029296875, 2.3409423828125, 2.53033447265625, 2.7197265625, 2.90911865234375, 3.0985107421875, 3.28790283203125, 3.477294921875, 3.66668701171875, 3.8560791015625, 4.04547119140625, 4.23486328125, 4.42425537109375, 4.6136474609375, 4.80303955078125, 4.992431640625, 5.18182373046875, 5.3712158203125, 5.56060791015625, 5.75]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 0.0, 3.0, 3.0, 8.0, 3.0, 4.0, 7.0, 15.0, 14.0, 14.0, 13.0, 19.0, 19.0, 20.0, 34.0, 29.0, 21.0, 32.0, 41.0, 28.0, 45.0, 42.0, 35.0, 36.0, 33.0, 28.0, 45.0, 28.0, 49.0, 31.0, 32.0, 29.0, 30.0, 26.0, 30.0, 25.0, 22.0, 14.0, 21.0, 15.0, 12.0, 6.0, 12.0, 6.0, 8.0, 3.0, 3.0, 2.0, 1.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-38.880313873291016, -37.65155029296875, -36.42278289794922, -35.19401931762695, -33.96525192260742, -32.736488342285156, -31.507722854614258, -30.27895736694336, -29.05019187927246, -27.821426391601562, -26.592660903930664, -25.363895416259766, -24.1351318359375, -22.90636444091797, -21.677600860595703, -20.448835372924805, -19.220069885253906, -17.991304397583008, -16.76253890991211, -15.533774375915527, -14.305008888244629, -13.07624340057373, -11.847478866577148, -10.61871337890625, -9.389947891235352, -8.161182403564453, -6.932417392730713, -5.703652381896973, -4.474886894226074, -3.246121406555176, -2.0173563957214355, -0.7885913848876953, 0.4401741027832031, 1.6689393520355225, 2.897704601287842, 4.126469612121582, 5.3552350997924805, 6.584000587463379, 7.812765598297119, 9.04153060913086, 10.270296096801758, 11.499061584472656, 12.727827072143555, 13.956591606140137, 15.185357093811035, 16.41412353515625, 17.642887115478516, 18.871652603149414, 20.100418090820312, 21.32918357849121, 22.55794906616211, 23.786714553833008, 25.015480041503906, 26.244243621826172, 27.47300910949707, 28.70177459716797, 29.930540084838867, 31.159305572509766, 32.38806915283203, 33.61683654785156, 34.84560012817383, 36.07436752319336, 37.303131103515625, 38.531898498535156, 39.76066207885742]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 6.0, 2.0, 6.0, 13.0, 6.0, 10.0, 15.0, 10.0, 11.0, 16.0, 14.0, 21.0, 24.0, 26.0, 33.0, 41.0, 46.0, 39.0, 35.0, 25.0, 45.0, 64.0, 39.0, 42.0, 49.0, 40.0, 37.0, 33.0, 34.0, 31.0, 25.0, 24.0, 29.0, 13.0, 18.0, 9.0, 15.0, 13.0, 10.0, 9.0, 8.0, 6.0, 6.0, 2.0, 3.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.3790397644043, -38.07585144042969, -36.772666931152344, -35.469478607177734, -34.166290283203125, -32.86310577392578, -31.559917449951172, -30.256729125976562, -28.953542709350586, -27.65035629272461, -26.34716796875, -25.043981552124023, -23.740795135498047, -22.437606811523438, -21.13442039489746, -19.831233978271484, -18.528045654296875, -17.2248592376709, -15.921670913696289, -14.618484497070312, -13.31529712677002, -12.012109756469727, -10.70892333984375, -9.405735969543457, -8.102548599243164, -6.799361228942871, -5.496174335479736, -4.192987442016602, -2.8898000717163086, -1.5866127014160156, -0.28342580795288086, 1.019761085510254, 2.3229446411132812, 3.626131772994995, 4.929318904876709, 6.232505798339844, 7.535693168640137, 8.83888053894043, 10.142066955566406, 11.4452543258667, 12.748441696166992, 14.051629066467285, 15.354816436767578, 16.658002853393555, 17.96118927001953, 19.26437759399414, 20.567564010620117, 21.870750427246094, 23.173938751220703, 24.47712516784668, 25.78031349182129, 27.083499908447266, 28.386688232421875, 29.68987464904785, 30.993061065673828, 32.29624938964844, 33.59943389892578, 34.90262222290039, 36.205806732177734, 37.508995056152344, 38.81218338012695, 40.11537170410156, 41.418556213378906, 42.721744537353516, 44.024932861328125]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 5.0, 9.0, 21.0, 37.0, 43.0, 69.0, 122.0, 197.0, 328.0, 511.0, 789.0, 1330.0, 2203.0, 3514.0, 5527.0, 8948.0, 13911.0, 22286.0, 33783.0, 51948.0, 77660.0, 113603.0, 160943.0, 217176.0, 284154.0, 347193.0, 399776.0, 425069.0, 420916.0, 384744.0, 325920.0, 260207.0, 196675.0, 142689.0, 99033.0, 67138.0, 44928.0, 29654.0, 18653.0, 12077.0, 7749.0, 4800.0, 2909.0, 1889.0, 1216.0, 736.0, 431.0, 282.0, 186.0, 98.0, 74.0, 50.0, 28.0, 23.0, 19.0, 6.0, 4.0, 2.0, 2.0, 2.0], "bins": [-31.375, -30.38916015625, -29.4033203125, -28.41748046875, -27.431640625, -26.44580078125, -25.4599609375, -24.47412109375, -23.48828125, -22.50244140625, -21.5166015625, -20.53076171875, -19.544921875, -18.55908203125, -17.5732421875, -16.58740234375, -15.6015625, -14.61572265625, -13.6298828125, -12.64404296875, -11.658203125, -10.67236328125, -9.6865234375, -8.70068359375, -7.71484375, -6.72900390625, -5.7431640625, -4.75732421875, -3.771484375, -2.78564453125, -1.7998046875, -0.81396484375, 0.171875, 1.15771484375, 2.1435546875, 3.12939453125, 4.115234375, 5.10107421875, 6.0869140625, 7.07275390625, 8.05859375, 9.04443359375, 10.0302734375, 11.01611328125, 12.001953125, 12.98779296875, 13.9736328125, 14.95947265625, 15.9453125, 16.93115234375, 17.9169921875, 18.90283203125, 19.888671875, 20.87451171875, 21.8603515625, 22.84619140625, 23.83203125, 24.81787109375, 25.8037109375, 26.78955078125, 27.775390625, 28.76123046875, 29.7470703125, 30.73291015625, 31.71875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 6.0, 9.0, 6.0, 7.0, 8.0, 10.0, 15.0, 10.0, 19.0, 10.0, 15.0, 31.0, 27.0, 35.0, 38.0, 33.0, 30.0, 40.0, 45.0, 33.0, 55.0, 41.0, 47.0, 48.0, 42.0, 40.0, 39.0, 22.0, 29.0, 34.0, 25.0, 26.0, 23.0, 12.0, 14.0, 13.0, 12.0, 14.0, 11.0, 5.0, 6.0, 7.0, 6.0, 2.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.15625, -32.99365234375, -31.8310546875, -30.66845703125, -29.505859375, -28.34326171875, -27.1806640625, -26.01806640625, -24.85546875, -23.69287109375, -22.5302734375, -21.36767578125, -20.205078125, -19.04248046875, -17.8798828125, -16.71728515625, -15.5546875, -14.39208984375, -13.2294921875, -12.06689453125, -10.904296875, -9.74169921875, -8.5791015625, -7.41650390625, -6.25390625, -5.09130859375, -3.9287109375, -2.76611328125, -1.603515625, -0.44091796875, 0.7216796875, 1.88427734375, 3.046875, 4.20947265625, 5.3720703125, 6.53466796875, 7.697265625, 8.85986328125, 10.0224609375, 11.18505859375, 12.34765625, 13.51025390625, 14.6728515625, 15.83544921875, 16.998046875, 18.16064453125, 19.3232421875, 20.48583984375, 21.6484375, 22.81103515625, 23.9736328125, 25.13623046875, 26.298828125, 27.46142578125, 28.6240234375, 29.78662109375, 30.94921875, 32.11181640625, 33.2744140625, 34.43701171875, 35.599609375, 36.76220703125, 37.9248046875, 39.08740234375, 40.25]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 8.0, 10.0, 29.0, 60.0, 81.0, 155.0, 244.0, 455.0, 708.0, 1172.0, 1949.0, 3233.0, 5295.0, 8228.0, 13036.0, 20925.0, 31522.0, 48341.0, 70733.0, 101225.0, 140097.0, 187990.0, 240874.0, 293985.0, 341255.0, 374177.0, 387596.0, 376186.0, 344830.0, 299055.0, 246126.0, 192670.0, 143539.0, 104280.0, 73016.0, 49840.0, 33244.0, 21826.0, 13778.0, 8724.0, 5462.0, 3326.0, 1890.0, 1222.0, 795.0, 457.0, 250.0, 158.0, 89.0, 60.0, 34.0, 15.0, 13.0, 6.0, 6.0, 3.0, 4.0], "bins": [-33.25, -32.2587890625, -31.267578125, -30.2763671875, -29.28515625, -28.2939453125, -27.302734375, -26.3115234375, -25.3203125, -24.3291015625, -23.337890625, -22.3466796875, -21.35546875, -20.3642578125, -19.373046875, -18.3818359375, -17.390625, -16.3994140625, -15.408203125, -14.4169921875, -13.42578125, -12.4345703125, -11.443359375, -10.4521484375, -9.4609375, -8.4697265625, -7.478515625, -6.4873046875, -5.49609375, -4.5048828125, -3.513671875, -2.5224609375, -1.53125, -0.5400390625, 0.451171875, 1.4423828125, 2.43359375, 3.4248046875, 4.416015625, 5.4072265625, 6.3984375, 7.3896484375, 8.380859375, 9.3720703125, 10.36328125, 11.3544921875, 12.345703125, 13.3369140625, 14.328125, 15.3193359375, 16.310546875, 17.3017578125, 18.29296875, 19.2841796875, 20.275390625, 21.2666015625, 22.2578125, 23.2490234375, 24.240234375, 25.2314453125, 26.22265625, 27.2138671875, 28.205078125, 29.1962890625, 30.1875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 2.0, 3.0, 8.0, 7.0, 12.0, 9.0, 13.0, 28.0, 28.0, 40.0, 41.0, 66.0, 78.0, 93.0, 89.0, 119.0, 126.0, 155.0, 172.0, 160.0, 204.0, 188.0, 175.0, 197.0, 184.0, 180.0, 159.0, 210.0, 162.0, 156.0, 155.0, 138.0, 113.0, 102.0, 80.0, 87.0, 80.0, 58.0, 34.0, 37.0, 29.0, 27.0, 26.0, 12.0, 11.0, 6.0, 8.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0, -14.47314453125, -13.9462890625, -13.41943359375, -12.892578125, -12.36572265625, -11.8388671875, -11.31201171875, -10.78515625, -10.25830078125, -9.7314453125, -9.20458984375, -8.677734375, -8.15087890625, -7.6240234375, -7.09716796875, -6.5703125, -6.04345703125, -5.5166015625, -4.98974609375, -4.462890625, -3.93603515625, -3.4091796875, -2.88232421875, -2.35546875, -1.82861328125, -1.3017578125, -0.77490234375, -0.248046875, 0.27880859375, 0.8056640625, 1.33251953125, 1.859375, 2.38623046875, 2.9130859375, 3.43994140625, 3.966796875, 4.49365234375, 5.0205078125, 5.54736328125, 6.07421875, 6.60107421875, 7.1279296875, 7.65478515625, 8.181640625, 8.70849609375, 9.2353515625, 9.76220703125, 10.2890625, 10.81591796875, 11.3427734375, 11.86962890625, 12.396484375, 12.92333984375, 13.4501953125, 13.97705078125, 14.50390625, 15.03076171875, 15.5576171875, 16.08447265625, 16.611328125, 17.13818359375, 17.6650390625, 18.19189453125, 18.71875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 5.0, 4.0, 2.0, 4.0, 8.0, 6.0, 11.0, 6.0, 9.0, 12.0, 11.0, 17.0, 19.0, 16.0, 32.0, 25.0, 30.0, 33.0, 29.0, 36.0, 41.0, 41.0, 45.0, 41.0, 34.0, 42.0, 42.0, 45.0, 34.0, 36.0, 35.0, 38.0, 27.0, 25.0, 28.0, 19.0, 17.0, 15.0, 13.0, 15.0, 12.0, 12.0, 5.0, 4.0, 8.0, 5.0, 4.0, 1.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-40.19083023071289, -38.88701248168945, -37.58319091796875, -36.27937316894531, -34.975555419921875, -33.67173767089844, -32.367916107177734, -31.064098358154297, -29.76028060913086, -28.45646095275879, -27.15264320373535, -25.84882354736328, -24.545005798339844, -23.241186141967773, -21.937366485595703, -20.633548736572266, -19.329729080200195, -18.025909423828125, -16.722091674804688, -15.418272018432617, -14.11445426940918, -12.81063461303711, -11.506815910339355, -10.202997207641602, -8.899178504943848, -7.595359802246094, -6.29154109954834, -4.987721920013428, -3.683903217315674, -2.38008451461792, -1.0762653350830078, 0.2275533676147461, 1.5313720703125, 2.835190773010254, 4.139009475708008, 5.44282865524292, 6.746647357940674, 8.050466537475586, 9.35428524017334, 10.658103942871094, 11.961922645568848, 13.265741348266602, 14.569560050964355, 15.87337875366211, 17.17719841003418, 18.481016159057617, 19.784835815429688, 21.088653564453125, 22.392473220825195, 23.696292877197266, 25.000110626220703, 26.303930282592773, 27.60774803161621, 28.91156768798828, 30.21538543701172, 31.51920509338379, 32.82302474975586, 34.1268424987793, 35.4306640625, 36.73448181152344, 38.038299560546875, 39.34211730957031, 40.645938873291016, 41.94975662231445, 43.25357437133789]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 4.0, 3.0, 3.0, 3.0, 7.0, 6.0, 14.0, 11.0, 10.0, 8.0, 14.0, 17.0, 23.0, 23.0, 27.0, 28.0, 31.0, 30.0, 21.0, 36.0, 33.0, 36.0, 56.0, 40.0, 38.0, 34.0, 36.0, 44.0, 39.0, 28.0, 28.0, 32.0, 34.0, 32.0, 25.0, 21.0, 14.0, 17.0, 10.0, 6.0, 14.0, 24.0, 6.0, 6.0, 8.0, 5.0, 3.0, 8.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-35.97538757324219, -34.80400466918945, -33.63262176513672, -32.46123504638672, -31.289852142333984, -30.11846923828125, -28.947084426879883, -27.775699615478516, -26.60431671142578, -25.432933807373047, -24.26154899597168, -23.090164184570312, -21.918781280517578, -20.747398376464844, -19.576013565063477, -18.40462875366211, -17.233245849609375, -16.06186294555664, -14.890478134155273, -13.719094276428223, -12.547710418701172, -11.376326560974121, -10.20494270324707, -9.03355884552002, -7.862174987792969, -6.690791130065918, -5.519407272338867, -4.348023414611816, -3.1766395568847656, -2.005255699157715, -0.8338718414306641, 0.3375120162963867, 1.5088996887207031, 2.680283546447754, 3.8516674041748047, 5.0230512619018555, 6.194435119628906, 7.365818977355957, 8.537202835083008, 9.708586692810059, 10.87997055053711, 12.05135440826416, 13.222738265991211, 14.394122123718262, 15.565505981445312, 16.736888885498047, 17.908273696899414, 19.07965850830078, 20.251041412353516, 21.42242431640625, 22.593809127807617, 23.765193939208984, 24.93657684326172, 26.107959747314453, 27.27934455871582, 28.450729370117188, 29.622112274169922, 30.793495178222656, 31.964879989624023, 33.13626480102539, 34.307647705078125, 35.47903060913086, 36.650413513183594, 37.821800231933594, 38.99318313598633]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 4.0, 2.0, 4.0, 7.0, 13.0, 12.0, 36.0, 35.0, 36.0, 94.0, 106.0, 192.0, 226.0, 382.0, 564.0, 807.0, 1280.0, 1987.0, 2988.0, 4866.0, 7765.0, 12461.0, 19288.0, 30304.0, 46018.0, 66667.0, 92601.0, 116090.0, 130843.0, 129235.0, 112619.0, 88158.0, 62834.0, 42766.0, 28152.0, 17849.0, 11373.0, 7179.0, 4536.0, 2878.0, 1808.0, 1200.0, 799.0, 479.0, 325.0, 234.0, 154.0, 115.0, 63.0, 50.0, 31.0, 23.0, 10.0, 15.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-21.65625, -20.998291015625, -20.34033203125, -19.682373046875, -19.0244140625, -18.366455078125, -17.70849609375, -17.050537109375, -16.392578125, -15.734619140625, -15.07666015625, -14.418701171875, -13.7607421875, -13.102783203125, -12.44482421875, -11.786865234375, -11.12890625, -10.470947265625, -9.81298828125, -9.155029296875, -8.4970703125, -7.839111328125, -7.18115234375, -6.523193359375, -5.865234375, -5.207275390625, -4.54931640625, -3.891357421875, -3.2333984375, -2.575439453125, -1.91748046875, -1.259521484375, -0.6015625, 0.056396484375, 0.71435546875, 1.372314453125, 2.0302734375, 2.688232421875, 3.34619140625, 4.004150390625, 4.662109375, 5.320068359375, 5.97802734375, 6.635986328125, 7.2939453125, 7.951904296875, 8.60986328125, 9.267822265625, 9.92578125, 10.583740234375, 11.24169921875, 11.899658203125, 12.5576171875, 13.215576171875, 13.87353515625, 14.531494140625, 15.189453125, 15.847412109375, 16.50537109375, 17.163330078125, 17.8212890625, 18.479248046875, 19.13720703125, 19.795166015625, 20.453125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 3.0, 5.0, 3.0, 3.0, 5.0, 8.0, 10.0, 14.0, 8.0, 10.0, 14.0, 15.0, 24.0, 23.0, 25.0, 28.0, 29.0, 33.0, 20.0, 38.0, 28.0, 37.0, 58.0, 40.0, 35.0, 36.0, 39.0, 41.0, 38.0, 32.0, 29.0, 29.0, 36.0, 33.0, 26.0, 16.0, 20.0, 16.0, 8.0, 8.0, 15.0, 21.0, 8.0, 7.0, 6.0, 6.0, 3.0, 8.0, 4.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-35.96875, -34.80029296875, -33.6318359375, -32.46337890625, -31.294921875, -30.12646484375, -28.9580078125, -27.78955078125, -26.62109375, -25.45263671875, -24.2841796875, -23.11572265625, -21.947265625, -20.77880859375, -19.6103515625, -18.44189453125, -17.2734375, -16.10498046875, -14.9365234375, -13.76806640625, -12.599609375, -11.43115234375, -10.2626953125, -9.09423828125, -7.92578125, -6.75732421875, -5.5888671875, -4.42041015625, -3.251953125, -2.08349609375, -0.9150390625, 0.25341796875, 1.421875, 2.59033203125, 3.7587890625, 4.92724609375, 6.095703125, 7.26416015625, 8.4326171875, 9.60107421875, 10.76953125, 11.93798828125, 13.1064453125, 14.27490234375, 15.443359375, 16.61181640625, 17.7802734375, 18.94873046875, 20.1171875, 21.28564453125, 22.4541015625, 23.62255859375, 24.791015625, 25.95947265625, 27.1279296875, 28.29638671875, 29.46484375, 30.63330078125, 31.8017578125, 32.97021484375, 34.138671875, 35.30712890625, 36.4755859375, 37.64404296875, 38.8125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 6.0, 12.0, 18.0, 15.0, 25.0, 39.0, 58.0, 79.0, 135.0, 223.0, 334.0, 564.0, 859.0, 1467.0, 2644.0, 4893.0, 9445.0, 19328.0, 42344.0, 96175.0, 199905.0, 279653.0, 205313.0, 99567.0, 43785.0, 20232.0, 9782.0, 5032.0, 2697.0, 1504.0, 883.0, 579.0, 334.0, 214.0, 140.0, 95.0, 60.0, 38.0, 36.0, 20.0, 16.0, 8.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.1875, -31.09716796875, -30.0068359375, -28.91650390625, -27.826171875, -26.73583984375, -25.6455078125, -24.55517578125, -23.46484375, -22.37451171875, -21.2841796875, -20.19384765625, -19.103515625, -18.01318359375, -16.9228515625, -15.83251953125, -14.7421875, -13.65185546875, -12.5615234375, -11.47119140625, -10.380859375, -9.29052734375, -8.2001953125, -7.10986328125, -6.01953125, -4.92919921875, -3.8388671875, -2.74853515625, -1.658203125, -0.56787109375, 0.5224609375, 1.61279296875, 2.703125, 3.79345703125, 4.8837890625, 5.97412109375, 7.064453125, 8.15478515625, 9.2451171875, 10.33544921875, 11.42578125, 12.51611328125, 13.6064453125, 14.69677734375, 15.787109375, 16.87744140625, 17.9677734375, 19.05810546875, 20.1484375, 21.23876953125, 22.3291015625, 23.41943359375, 24.509765625, 25.60009765625, 26.6904296875, 27.78076171875, 28.87109375, 29.96142578125, 31.0517578125, 32.14208984375, 33.232421875, 34.32275390625, 35.4130859375, 36.50341796875, 37.59375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 9.0, 7.0, 7.0, 7.0, 16.0, 9.0, 14.0, 23.0, 17.0, 22.0, 20.0, 21.0, 37.0, 41.0, 41.0, 39.0, 42.0, 46.0, 51.0, 44.0, 31.0, 50.0, 54.0, 44.0, 41.0, 36.0, 32.0, 35.0, 27.0, 30.0, 20.0, 15.0, 12.0, 12.0, 10.0, 17.0, 3.0, 6.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.75, -24.908935546875, -24.06787109375, -23.226806640625, -22.3857421875, -21.544677734375, -20.70361328125, -19.862548828125, -19.021484375, -18.180419921875, -17.33935546875, -16.498291015625, -15.6572265625, -14.816162109375, -13.97509765625, -13.134033203125, -12.29296875, -11.451904296875, -10.61083984375, -9.769775390625, -8.9287109375, -8.087646484375, -7.24658203125, -6.405517578125, -5.564453125, -4.723388671875, -3.88232421875, -3.041259765625, -2.2001953125, -1.359130859375, -0.51806640625, 0.322998046875, 1.1640625, 2.005126953125, 2.84619140625, 3.687255859375, 4.5283203125, 5.369384765625, 6.21044921875, 7.051513671875, 7.892578125, 8.733642578125, 9.57470703125, 10.415771484375, 11.2568359375, 12.097900390625, 12.93896484375, 13.780029296875, 14.62109375, 15.462158203125, 16.30322265625, 17.144287109375, 17.9853515625, 18.826416015625, 19.66748046875, 20.508544921875, 21.349609375, 22.190673828125, 23.03173828125, 23.872802734375, 24.7138671875, 25.554931640625, 26.39599609375, 27.237060546875, 28.078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 10.0, 13.0, 19.0, 29.0, 36.0, 82.0, 89.0, 153.0, 247.0, 398.0, 708.0, 1139.0, 2039.0, 4100.0, 7443.0, 15465.0, 33370.0, 78748.0, 200555.0, 351096.0, 206064.0, 80551.0, 33992.0, 15564.0, 7622.0, 3864.0, 2116.0, 1211.0, 706.0, 389.0, 248.0, 157.0, 112.0, 77.0, 43.0, 27.0, 24.0, 14.0, 9.0, 8.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-21.875, -21.2412109375, -20.607421875, -19.9736328125, -19.33984375, -18.7060546875, -18.072265625, -17.4384765625, -16.8046875, -16.1708984375, -15.537109375, -14.9033203125, -14.26953125, -13.6357421875, -13.001953125, -12.3681640625, -11.734375, -11.1005859375, -10.466796875, -9.8330078125, -9.19921875, -8.5654296875, -7.931640625, -7.2978515625, -6.6640625, -6.0302734375, -5.396484375, -4.7626953125, -4.12890625, -3.4951171875, -2.861328125, -2.2275390625, -1.59375, -0.9599609375, -0.326171875, 0.3076171875, 0.94140625, 1.5751953125, 2.208984375, 2.8427734375, 3.4765625, 4.1103515625, 4.744140625, 5.3779296875, 6.01171875, 6.6455078125, 7.279296875, 7.9130859375, 8.546875, 9.1806640625, 9.814453125, 10.4482421875, 11.08203125, 11.7158203125, 12.349609375, 12.9833984375, 13.6171875, 14.2509765625, 14.884765625, 15.5185546875, 16.15234375, 16.7861328125, 17.419921875, 18.0537109375, 18.6875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 6.0, 4.0, 15.0, 14.0, 27.0, 35.0, 54.0, 59.0, 67.0, 70.0, 90.0, 85.0, 102.0, 76.0, 67.0, 46.0, 51.0, 36.0, 25.0, 24.0, 12.0, 12.0, 7.0, 4.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012264251708984375, -0.0011851489543914795, -0.0011438727378845215, -0.0011025965213775635, -0.0010613203048706055, -0.0010200440883636475, -0.0009787678718566895, -0.0009374916553497314, -0.0008962154388427734, -0.0008549392223358154, -0.0008136630058288574, -0.0007723867893218994, -0.0007311105728149414, -0.0006898343563079834, -0.0006485581398010254, -0.0006072819232940674, -0.0005660057067871094, -0.0005247294902801514, -0.00048345327377319336, -0.00044217705726623535, -0.00040090084075927734, -0.00035962462425231934, -0.00031834840774536133, -0.0002770721912384033, -0.0002357959747314453, -0.0001945197582244873, -0.0001532435417175293, -0.00011196732521057129, -7.069110870361328e-05, -2.9414892196655273e-05, 1.1861324310302734e-05, 5.313754081726074e-05, 9.441375732421875e-05, 0.00013568997383117676, 0.00017696619033813477, 0.00021824240684509277, 0.0002595186233520508, 0.0003007948398590088, 0.0003420710563659668, 0.0003833472728729248, 0.0004246234893798828, 0.0004658997058868408, 0.0005071759223937988, 0.0005484521389007568, 0.0005897283554077148, 0.0006310045719146729, 0.0006722807884216309, 0.0007135570049285889, 0.0007548332214355469, 0.0007961094379425049, 0.0008373856544494629, 0.0008786618709564209, 0.0009199380874633789, 0.0009612143039703369, 0.001002490520477295, 0.001043766736984253, 0.001085042953491211, 0.001126319169998169, 0.001167595386505127, 0.001208871603012085, 0.001250147819519043, 0.001291424036026001, 0.001332700252532959, 0.001373976469039917, 0.001415252685546875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 7.0, 3.0, 5.0, 7.0, 14.0, 17.0, 18.0, 38.0, 64.0, 106.0, 124.0, 173.0, 270.0, 410.0, 603.0, 909.0, 1344.0, 2028.0, 3149.0, 4655.0, 7223.0, 11033.0, 16570.0, 25070.0, 38496.0, 56436.0, 79375.0, 105615.0, 125519.0, 131363.0, 119380.0, 97497.0, 72179.0, 50086.0, 33657.0, 22080.0, 14670.0, 9466.0, 6557.0, 4135.0, 2740.0, 1856.0, 1186.0, 799.0, 540.0, 346.0, 243.0, 162.0, 114.0, 65.0, 52.0, 36.0, 29.0, 17.0, 17.0, 7.0, 5.0, 4.0, 2.0, 0.0, 0.0, 3.0], "bins": [-14.390625, -13.9315185546875, -13.472412109375, -13.0133056640625, -12.55419921875, -12.0950927734375, -11.635986328125, -11.1768798828125, -10.7177734375, -10.2586669921875, -9.799560546875, -9.3404541015625, -8.88134765625, -8.4222412109375, -7.963134765625, -7.5040283203125, -7.044921875, -6.5858154296875, -6.126708984375, -5.6676025390625, -5.20849609375, -4.7493896484375, -4.290283203125, -3.8311767578125, -3.3720703125, -2.9129638671875, -2.453857421875, -1.9947509765625, -1.53564453125, -1.0765380859375, -0.617431640625, -0.1583251953125, 0.30078125, 0.7598876953125, 1.218994140625, 1.6781005859375, 2.13720703125, 2.5963134765625, 3.055419921875, 3.5145263671875, 3.9736328125, 4.4327392578125, 4.891845703125, 5.3509521484375, 5.81005859375, 6.2691650390625, 6.728271484375, 7.1873779296875, 7.646484375, 8.1055908203125, 8.564697265625, 9.0238037109375, 9.48291015625, 9.9420166015625, 10.401123046875, 10.8602294921875, 11.3193359375, 11.7784423828125, 12.237548828125, 12.6966552734375, 13.15576171875, 13.6148681640625, 14.073974609375, 14.5330810546875, 14.9921875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 8.0, 5.0, 9.0, 16.0, 10.0, 13.0, 13.0, 18.0, 37.0, 40.0, 30.0, 52.0, 57.0, 57.0, 59.0, 51.0, 60.0, 74.0, 65.0, 58.0, 38.0, 51.0, 38.0, 37.0, 22.0, 20.0, 9.0, 15.0, 12.0, 5.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-9.03125, -8.78802490234375, -8.5447998046875, -8.30157470703125, -8.058349609375, -7.81512451171875, -7.5718994140625, -7.32867431640625, -7.08544921875, -6.84222412109375, -6.5989990234375, -6.35577392578125, -6.112548828125, -5.86932373046875, -5.6260986328125, -5.38287353515625, -5.1396484375, -4.89642333984375, -4.6531982421875, -4.40997314453125, -4.166748046875, -3.92352294921875, -3.6802978515625, -3.43707275390625, -3.19384765625, -2.95062255859375, -2.7073974609375, -2.46417236328125, -2.220947265625, -1.97772216796875, -1.7344970703125, -1.49127197265625, -1.248046875, -1.00482177734375, -0.7615966796875, -0.51837158203125, -0.275146484375, -0.03192138671875, 0.2113037109375, 0.45452880859375, 0.69775390625, 0.94097900390625, 1.1842041015625, 1.42742919921875, 1.670654296875, 1.91387939453125, 2.1571044921875, 2.40032958984375, 2.6435546875, 2.88677978515625, 3.1300048828125, 3.37322998046875, 3.616455078125, 3.85968017578125, 4.1029052734375, 4.34613037109375, 4.58935546875, 4.83258056640625, 5.0758056640625, 5.31903076171875, 5.562255859375, 5.80548095703125, 6.0487060546875, 6.29193115234375, 6.53515625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 6.0, 1.0, 7.0, 5.0, 8.0, 6.0, 5.0, 11.0, 7.0, 8.0, 13.0, 21.0, 15.0, 29.0, 22.0, 30.0, 29.0, 34.0, 33.0, 47.0, 39.0, 51.0, 34.0, 33.0, 48.0, 44.0, 48.0, 31.0, 35.0, 44.0, 34.0, 34.0, 33.0, 20.0, 18.0, 18.0, 17.0, 16.0, 15.0, 13.0, 12.0, 7.0, 5.0, 7.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-40.58571243286133, -39.239959716796875, -37.894203186035156, -36.5484504699707, -35.20269775390625, -33.85694122314453, -32.51118850708008, -31.165433883666992, -29.819679260253906, -28.47392463684082, -27.128170013427734, -25.78241729736328, -24.436662673950195, -23.09090805053711, -21.745155334472656, -20.39940071105957, -19.053646087646484, -17.7078914642334, -16.362136840820312, -15.01638412475586, -13.670629501342773, -12.324874877929688, -10.979121208190918, -9.633367538452148, -8.287612915039062, -6.941858768463135, -5.596104621887207, -4.250350475311279, -2.9045963287353516, -1.5588421821594238, -0.2130880355834961, 1.1326656341552734, 2.478424072265625, 3.8241782188415527, 5.1699323654174805, 6.515686511993408, 7.861440658569336, 9.207195281982422, 10.552948951721191, 11.898702621459961, 13.244457244873047, 14.590211868286133, 15.935965538024902, 17.281719207763672, 18.627473831176758, 19.973228454589844, 21.318981170654297, 22.664735794067383, 24.01049041748047, 25.356245040893555, 26.70199966430664, 28.047752380371094, 29.39350700378418, 30.739261627197266, 32.08501434326172, 33.43077087402344, 34.77652359008789, 36.122276306152344, 37.46803283691406, 38.813785552978516, 40.15953826904297, 41.50529479980469, 42.85104751586914, 44.196800231933594, 45.54255676269531]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 3.0, 9.0, 1.0, 8.0, 7.0, 11.0, 13.0, 12.0, 10.0, 15.0, 22.0, 19.0, 22.0, 33.0, 31.0, 30.0, 32.0, 30.0, 31.0, 36.0, 46.0, 50.0, 31.0, 38.0, 36.0, 39.0, 35.0, 40.0, 36.0, 26.0, 32.0, 35.0, 22.0, 30.0, 20.0, 10.0, 17.0, 8.0, 15.0, 9.0, 11.0, 13.0, 4.0, 5.0, 6.0, 4.0, 3.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.22665786743164, -36.025390625, -34.82412338256836, -33.62285614013672, -32.42158889770508, -31.220321655273438, -30.019054412841797, -28.817787170410156, -27.616519927978516, -26.415252685546875, -25.213985443115234, -24.012718200683594, -22.811450958251953, -21.610183715820312, -20.408916473388672, -19.20764923095703, -18.006383895874023, -16.805116653442383, -15.603849411010742, -14.402582168579102, -13.201314926147461, -12.00004768371582, -10.798781394958496, -9.597514152526855, -8.396246910095215, -7.194979667663574, -5.993712425231934, -4.792445659637451, -3.5911784172058105, -2.38991117477417, -1.1886444091796875, 0.012622833251953125, 1.2138900756835938, 2.4151573181152344, 3.616424322128296, 4.817691326141357, 6.018958568572998, 7.220225811004639, 8.421492576599121, 9.622759819030762, 10.824027061462402, 12.025294303894043, 13.226561546325684, 14.427827835083008, 15.629095077514648, 16.83036231994629, 18.03162956237793, 19.23289680480957, 20.43416404724121, 21.63543128967285, 22.836698532104492, 24.037965774536133, 25.239233016967773, 26.440500259399414, 27.641765594482422, 28.843032836914062, 30.044300079345703, 31.245567321777344, 32.446834564208984, 33.648101806640625, 34.849369049072266, 36.050636291503906, 37.25190353393555, 38.45317077636719, 39.65443801879883]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 10.0, 14.0, 21.0, 44.0, 69.0, 94.0, 150.0, 235.0, 402.0, 668.0, 1021.0, 1567.0, 2464.0, 3825.0, 5708.0, 8712.0, 12820.0, 18185.0, 25036.0, 33777.0, 43932.0, 55342.0, 66230.0, 76866.0, 84264.0, 88878.0, 87896.0, 83191.0, 75587.0, 65380.0, 53884.0, 42392.0, 32273.0, 24289.0, 17267.0, 12005.0, 8445.0, 5472.0, 3656.0, 2386.0, 1480.0, 971.0, 627.0, 383.0, 235.0, 156.0, 87.0, 63.0, 37.0, 20.0, 20.0, 13.0, 6.0, 0.0, 0.0, 1.0, 2.0], "bins": [-32.125, -31.149658203125, -30.17431640625, -29.198974609375, -28.2236328125, -27.248291015625, -26.27294921875, -25.297607421875, -24.322265625, -23.346923828125, -22.37158203125, -21.396240234375, -20.4208984375, -19.445556640625, -18.47021484375, -17.494873046875, -16.51953125, -15.544189453125, -14.56884765625, -13.593505859375, -12.6181640625, -11.642822265625, -10.66748046875, -9.692138671875, -8.716796875, -7.741455078125, -6.76611328125, -5.790771484375, -4.8154296875, -3.840087890625, -2.86474609375, -1.889404296875, -0.9140625, 0.061279296875, 1.03662109375, 2.011962890625, 2.9873046875, 3.962646484375, 4.93798828125, 5.913330078125, 6.888671875, 7.864013671875, 8.83935546875, 9.814697265625, 10.7900390625, 11.765380859375, 12.74072265625, 13.716064453125, 14.69140625, 15.666748046875, 16.64208984375, 17.617431640625, 18.5927734375, 19.568115234375, 20.54345703125, 21.518798828125, 22.494140625, 23.469482421875, 24.44482421875, 25.420166015625, 26.3955078125, 27.370849609375, 28.34619140625, 29.321533203125, 30.296875]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 1.0, 7.0, 3.0, 8.0, 5.0, 12.0, 12.0, 14.0, 13.0, 13.0, 18.0, 21.0, 29.0, 24.0, 36.0, 32.0, 30.0, 32.0, 27.0, 32.0, 44.0, 56.0, 30.0, 42.0, 32.0, 39.0, 32.0, 42.0, 36.0, 30.0, 33.0, 31.0, 24.0, 32.0, 18.0, 11.0, 16.0, 9.0, 14.0, 8.0, 14.0, 9.0, 6.0, 6.0, 4.0, 5.0, 5.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.125, -34.9619140625, -33.798828125, -32.6357421875, -31.47265625, -30.3095703125, -29.146484375, -27.9833984375, -26.8203125, -25.6572265625, -24.494140625, -23.3310546875, -22.16796875, -21.0048828125, -19.841796875, -18.6787109375, -17.515625, -16.3525390625, -15.189453125, -14.0263671875, -12.86328125, -11.7001953125, -10.537109375, -9.3740234375, -8.2109375, -7.0478515625, -5.884765625, -4.7216796875, -3.55859375, -2.3955078125, -1.232421875, -0.0693359375, 1.09375, 2.2568359375, 3.419921875, 4.5830078125, 5.74609375, 6.9091796875, 8.072265625, 9.2353515625, 10.3984375, 11.5615234375, 12.724609375, 13.8876953125, 15.05078125, 16.2138671875, 17.376953125, 18.5400390625, 19.703125, 20.8662109375, 22.029296875, 23.1923828125, 24.35546875, 25.5185546875, 26.681640625, 27.8447265625, 29.0078125, 30.1708984375, 31.333984375, 32.4970703125, 33.66015625, 34.8232421875, 35.986328125, 37.1494140625, 38.3125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 8.0, 8.0, 13.0, 20.0, 46.0, 87.0, 112.0, 193.0, 314.0, 523.0, 952.0, 1650.0, 2813.0, 4542.0, 7506.0, 12351.0, 19452.0, 28824.0, 41877.0, 57613.0, 73979.0, 89934.0, 102441.0, 108002.0, 106419.0, 96716.0, 81596.0, 65046.0, 48773.0, 34126.0, 23380.0, 15126.0, 9554.0, 5841.0, 3536.0, 2150.0, 1202.0, 734.0, 419.0, 264.0, 153.0, 101.0, 52.0, 42.0, 21.0, 20.0, 12.0, 4.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.8125, -33.6416015625, -32.470703125, -31.2998046875, -30.12890625, -28.9580078125, -27.787109375, -26.6162109375, -25.4453125, -24.2744140625, -23.103515625, -21.9326171875, -20.76171875, -19.5908203125, -18.419921875, -17.2490234375, -16.078125, -14.9072265625, -13.736328125, -12.5654296875, -11.39453125, -10.2236328125, -9.052734375, -7.8818359375, -6.7109375, -5.5400390625, -4.369140625, -3.1982421875, -2.02734375, -0.8564453125, 0.314453125, 1.4853515625, 2.65625, 3.8271484375, 4.998046875, 6.1689453125, 7.33984375, 8.5107421875, 9.681640625, 10.8525390625, 12.0234375, 13.1943359375, 14.365234375, 15.5361328125, 16.70703125, 17.8779296875, 19.048828125, 20.2197265625, 21.390625, 22.5615234375, 23.732421875, 24.9033203125, 26.07421875, 27.2451171875, 28.416015625, 29.5869140625, 30.7578125, 31.9287109375, 33.099609375, 34.2705078125, 35.44140625, 36.6123046875, 37.783203125, 38.9541015625, 40.125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 2.0, 11.0, 12.0, 14.0, 15.0, 15.0, 22.0, 22.0, 24.0, 14.0, 20.0, 25.0, 31.0, 31.0, 32.0, 27.0, 37.0, 40.0, 35.0, 36.0, 24.0, 45.0, 27.0, 32.0, 38.0, 33.0, 37.0, 25.0, 29.0, 33.0, 31.0, 25.0, 23.0, 19.0, 18.0, 21.0, 6.0, 11.0, 8.0, 9.0, 7.0, 8.0, 4.0, 4.0, 6.0, 0.0, 3.0, 4.0, 3.0, 0.0, 2.0], "bins": [-25.46875, -24.71533203125, -23.9619140625, -23.20849609375, -22.455078125, -21.70166015625, -20.9482421875, -20.19482421875, -19.44140625, -18.68798828125, -17.9345703125, -17.18115234375, -16.427734375, -15.67431640625, -14.9208984375, -14.16748046875, -13.4140625, -12.66064453125, -11.9072265625, -11.15380859375, -10.400390625, -9.64697265625, -8.8935546875, -8.14013671875, -7.38671875, -6.63330078125, -5.8798828125, -5.12646484375, -4.373046875, -3.61962890625, -2.8662109375, -2.11279296875, -1.359375, -0.60595703125, 0.1474609375, 0.90087890625, 1.654296875, 2.40771484375, 3.1611328125, 3.91455078125, 4.66796875, 5.42138671875, 6.1748046875, 6.92822265625, 7.681640625, 8.43505859375, 9.1884765625, 9.94189453125, 10.6953125, 11.44873046875, 12.2021484375, 12.95556640625, 13.708984375, 14.46240234375, 15.2158203125, 15.96923828125, 16.72265625, 17.47607421875, 18.2294921875, 18.98291015625, 19.736328125, 20.48974609375, 21.2431640625, 21.99658203125, 22.75]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 5.0, 3.0, 6.0, 15.0, 8.0, 35.0, 34.0, 51.0, 78.0, 99.0, 175.0, 300.0, 489.0, 860.0, 1742.0, 3666.0, 8516.0, 20152.0, 46090.0, 94406.0, 159790.0, 209390.0, 202414.0, 146733.0, 82925.0, 39574.0, 17179.0, 7273.0, 3167.0, 1506.0, 735.0, 442.0, 246.0, 163.0, 102.0, 66.0, 33.0, 24.0, 26.0, 14.0, 9.0, 4.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.03125, -22.205810546875, -21.38037109375, -20.554931640625, -19.7294921875, -18.904052734375, -18.07861328125, -17.253173828125, -16.427734375, -15.602294921875, -14.77685546875, -13.951416015625, -13.1259765625, -12.300537109375, -11.47509765625, -10.649658203125, -9.82421875, -8.998779296875, -8.17333984375, -7.347900390625, -6.5224609375, -5.697021484375, -4.87158203125, -4.046142578125, -3.220703125, -2.395263671875, -1.56982421875, -0.744384765625, 0.0810546875, 0.906494140625, 1.73193359375, 2.557373046875, 3.3828125, 4.208251953125, 5.03369140625, 5.859130859375, 6.6845703125, 7.510009765625, 8.33544921875, 9.160888671875, 9.986328125, 10.811767578125, 11.63720703125, 12.462646484375, 13.2880859375, 14.113525390625, 14.93896484375, 15.764404296875, 16.58984375, 17.415283203125, 18.24072265625, 19.066162109375, 19.8916015625, 20.717041015625, 21.54248046875, 22.367919921875, 23.193359375, 24.018798828125, 24.84423828125, 25.669677734375, 26.4951171875, 27.320556640625, 28.14599609375, 28.971435546875, 29.796875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 3.0, 3.0, 6.0, 6.0, 7.0, 9.0, 11.0, 15.0, 17.0, 18.0, 17.0, 29.0, 25.0, 36.0, 30.0, 25.0, 42.0, 35.0, 47.0, 40.0, 46.0, 45.0, 50.0, 55.0, 40.0, 43.0, 36.0, 38.0, 27.0, 31.0, 29.0, 16.0, 24.0, 12.0, 20.0, 13.0, 11.0, 11.0, 6.0, 12.0, 3.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.0017099380493164062, -0.0016562491655349731, -0.00160256028175354, -0.001548871397972107, -0.0014951825141906738, -0.0014414936304092407, -0.0013878047466278076, -0.0013341158628463745, -0.0012804269790649414, -0.0012267380952835083, -0.0011730492115020752, -0.001119360327720642, -0.001065671443939209, -0.0010119825601577759, -0.0009582936763763428, -0.0009046047925949097, -0.0008509159088134766, -0.0007972270250320435, -0.0007435381412506104, -0.0006898492574691772, -0.0006361603736877441, -0.000582471489906311, -0.0005287826061248779, -0.0004750937223434448, -0.0004214048385620117, -0.0003677159547805786, -0.0003140270709991455, -0.0002603381872177124, -0.0002066493034362793, -0.0001529604196548462, -9.927153587341309e-05, -4.558265209197998e-05, 8.106231689453125e-06, 6.179511547088623e-05, 0.00011548399925231934, 0.00016917288303375244, 0.00022286176681518555, 0.00027655065059661865, 0.00033023953437805176, 0.00038392841815948486, 0.00043761730194091797, 0.0004913061857223511, 0.0005449950695037842, 0.0005986839532852173, 0.0006523728370666504, 0.0007060617208480835, 0.0007597506046295166, 0.0008134394884109497, 0.0008671283721923828, 0.0009208172559738159, 0.000974506139755249, 0.0010281950235366821, 0.0010818839073181152, 0.0011355727910995483, 0.0011892616748809814, 0.0012429505586624146, 0.0012966394424438477, 0.0013503283262252808, 0.0014040172100067139, 0.001457706093788147, 0.00151139497756958, 0.0015650838613510132, 0.0016187727451324463, 0.0016724616289138794, 0.0017261505126953125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 6.0, 1.0, 3.0, 5.0, 9.0, 10.0, 18.0, 21.0, 41.0, 42.0, 77.0, 103.0, 128.0, 222.0, 347.0, 531.0, 837.0, 1320.0, 2392.0, 3925.0, 7053.0, 12617.0, 22277.0, 38659.0, 64425.0, 98022.0, 132160.0, 154048.0, 151126.0, 126089.0, 91040.0, 58956.0, 35096.0, 20047.0, 11236.0, 6505.0, 3639.0, 2094.0, 1286.0, 748.0, 474.0, 308.0, 188.0, 131.0, 103.0, 55.0, 41.0, 31.0, 13.0, 23.0, 13.0, 13.0, 1.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-21.4375, -20.765625, -20.09375, -19.421875, -18.75, -18.078125, -17.40625, -16.734375, -16.0625, -15.390625, -14.71875, -14.046875, -13.375, -12.703125, -12.03125, -11.359375, -10.6875, -10.015625, -9.34375, -8.671875, -8.0, -7.328125, -6.65625, -5.984375, -5.3125, -4.640625, -3.96875, -3.296875, -2.625, -1.953125, -1.28125, -0.609375, 0.0625, 0.734375, 1.40625, 2.078125, 2.75, 3.421875, 4.09375, 4.765625, 5.4375, 6.109375, 6.78125, 7.453125, 8.125, 8.796875, 9.46875, 10.140625, 10.8125, 11.484375, 12.15625, 12.828125, 13.5, 14.171875, 14.84375, 15.515625, 16.1875, 16.859375, 17.53125, 18.203125, 18.875, 19.546875, 20.21875, 20.890625, 21.5625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 5.0, 7.0, 8.0, 8.0, 17.0, 12.0, 21.0, 28.0, 23.0, 29.0, 45.0, 41.0, 38.0, 36.0, 42.0, 46.0, 47.0, 42.0, 49.0, 52.0, 55.0, 47.0, 29.0, 38.0, 35.0, 34.0, 30.0, 29.0, 24.0, 19.0, 15.0, 7.0, 6.0, 5.0, 5.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.74609375, -7.50140380859375, -7.2567138671875, -7.01202392578125, -6.767333984375, -6.52264404296875, -6.2779541015625, -6.03326416015625, -5.78857421875, -5.54388427734375, -5.2991943359375, -5.05450439453125, -4.809814453125, -4.56512451171875, -4.3204345703125, -4.07574462890625, -3.8310546875, -3.58636474609375, -3.3416748046875, -3.09698486328125, -2.852294921875, -2.60760498046875, -2.3629150390625, -2.11822509765625, -1.87353515625, -1.62884521484375, -1.3841552734375, -1.13946533203125, -0.894775390625, -0.65008544921875, -0.4053955078125, -0.16070556640625, 0.083984375, 0.32867431640625, 0.5733642578125, 0.81805419921875, 1.062744140625, 1.30743408203125, 1.5521240234375, 1.79681396484375, 2.04150390625, 2.28619384765625, 2.5308837890625, 2.77557373046875, 3.020263671875, 3.26495361328125, 3.5096435546875, 3.75433349609375, 3.9990234375, 4.24371337890625, 4.4884033203125, 4.73309326171875, 4.977783203125, 5.22247314453125, 5.4671630859375, 5.71185302734375, 5.95654296875, 6.20123291015625, 6.4459228515625, 6.69061279296875, 6.935302734375, 7.17999267578125, 7.4246826171875, 7.66937255859375, 7.9140625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 6.0, 1.0, 6.0, 7.0, 7.0, 4.0, 7.0, 8.0, 8.0, 22.0, 14.0, 21.0, 27.0, 36.0, 24.0, 40.0, 42.0, 34.0, 37.0, 36.0, 40.0, 40.0, 56.0, 62.0, 48.0, 41.0, 48.0, 31.0, 45.0, 29.0, 30.0, 20.0, 26.0, 26.0, 11.0, 15.0, 7.0, 15.0, 7.0, 3.0, 6.0, 4.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-42.8323974609375, -41.37943649291992, -39.92647933959961, -38.47351837158203, -37.02056121826172, -35.56760025024414, -34.11463928222656, -32.66168212890625, -31.208721160888672, -29.755762100219727, -28.30280303955078, -26.849842071533203, -25.396883010864258, -23.943923950195312, -22.490962982177734, -21.03800392150879, -19.585044860839844, -18.1320858001709, -16.679126739501953, -15.226165771484375, -13.77320671081543, -12.320247650146484, -10.867287635803223, -9.414327621459961, -7.961368560791016, -6.508409023284912, -5.055449485778809, -3.602489948272705, -2.1495304107666016, -0.696570873260498, 0.7563886642456055, 2.209348678588867, 3.662303924560547, 5.11526346206665, 6.568222999572754, 8.021183013916016, 9.474142074584961, 10.927101135253906, 12.380061149597168, 13.83302116394043, 15.285980224609375, 16.73893928527832, 18.191898345947266, 19.644859313964844, 21.09781837463379, 22.550777435302734, 24.003738403320312, 25.456697463989258, 26.909656524658203, 28.36261558532715, 29.815574645996094, 31.268535614013672, 32.72149658203125, 34.17445373535156, 35.62741470336914, 37.08037567138672, 38.53333282470703, 39.98629379272461, 41.43925094604492, 42.8922119140625, 44.34516906738281, 45.79813003540039, 47.25109100341797, 48.70404815673828, 50.15700912475586]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 5.0, 7.0, 7.0, 8.0, 4.0, 13.0, 14.0, 20.0, 17.0, 30.0, 16.0, 19.0, 22.0, 30.0, 35.0, 38.0, 34.0, 40.0, 29.0, 40.0, 35.0, 39.0, 42.0, 43.0, 33.0, 29.0, 36.0, 26.0, 36.0, 30.0, 29.0, 26.0, 23.0, 24.0, 25.0, 12.0, 10.0, 10.0, 13.0, 10.0, 10.0, 11.0, 6.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-36.750152587890625, -35.5157356262207, -34.28131866455078, -33.046905517578125, -31.812488555908203, -30.57807159423828, -29.34365463256836, -28.10923957824707, -26.87482452392578, -25.64040756225586, -24.40599250793457, -23.17157554626465, -21.93716049194336, -20.702743530273438, -19.468326568603516, -18.233911514282227, -16.999494552612305, -15.7650785446167, -14.530662536621094, -13.296245574951172, -12.061830520629883, -10.827413558959961, -9.592997550964355, -8.35858154296875, -7.1241655349731445, -5.889749526977539, -4.655333518981934, -3.42091703414917, -2.1865010261535645, -0.952085018157959, 0.2823314666748047, 1.5167474746704102, 2.7511634826660156, 3.985579490661621, 5.219995498657227, 6.45441198348999, 7.688827991485596, 8.92324447631836, 10.157660484313965, 11.39207649230957, 12.626492500305176, 13.860908508300781, 15.095324516296387, 16.329740524291992, 17.564157485961914, 18.798572540283203, 20.032989501953125, 21.267406463623047, 22.501821517944336, 23.736238479614258, 24.970653533935547, 26.20507049560547, 27.439485549926758, 28.67390251159668, 29.90831756591797, 31.14273452758789, 32.37715148925781, 33.611568450927734, 34.845985412597656, 36.08039855957031, 37.314815521240234, 38.549232482910156, 39.78364944458008, 41.01806640625, 42.252479553222656]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [6.0, 3.0, 12.0, 21.0, 17.0, 34.0, 64.0, 87.0, 134.0, 262.0, 422.0, 602.0, 1036.0, 1594.0, 2650.0, 4061.0, 6443.0, 9570.0, 15016.0, 22193.0, 33392.0, 48258.0, 69379.0, 97424.0, 133398.0, 175756.0, 224451.0, 273992.0, 320130.0, 354786.0, 371870.0, 367802.0, 342548.0, 302699.0, 255287.0, 205433.0, 158638.0, 118609.0, 86227.0, 61222.0, 42916.0, 29062.0, 19978.0, 12743.0, 8590.0, 5554.0, 3593.0, 2364.0, 1507.0, 919.0, 543.0, 390.0, 234.0, 129.0, 103.0, 58.0, 40.0, 23.0, 13.0, 6.0, 5.0, 3.0, 2.0, 1.0], "bins": [-27.328125, -26.44140625, -25.5546875, -24.66796875, -23.78125, -22.89453125, -22.0078125, -21.12109375, -20.234375, -19.34765625, -18.4609375, -17.57421875, -16.6875, -15.80078125, -14.9140625, -14.02734375, -13.140625, -12.25390625, -11.3671875, -10.48046875, -9.59375, -8.70703125, -7.8203125, -6.93359375, -6.046875, -5.16015625, -4.2734375, -3.38671875, -2.5, -1.61328125, -0.7265625, 0.16015625, 1.046875, 1.93359375, 2.8203125, 3.70703125, 4.59375, 5.48046875, 6.3671875, 7.25390625, 8.140625, 9.02734375, 9.9140625, 10.80078125, 11.6875, 12.57421875, 13.4609375, 14.34765625, 15.234375, 16.12109375, 17.0078125, 17.89453125, 18.78125, 19.66796875, 20.5546875, 21.44140625, 22.328125, 23.21484375, 24.1015625, 24.98828125, 25.875, 26.76171875, 27.6484375, 28.53515625, 29.421875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 3.0, 6.0, 4.0, 11.0, 7.0, 6.0, 12.0, 18.0, 22.0, 24.0, 18.0, 22.0, 18.0, 21.0, 37.0, 37.0, 39.0, 40.0, 36.0, 29.0, 40.0, 37.0, 43.0, 41.0, 33.0, 35.0, 28.0, 29.0, 38.0, 34.0, 26.0, 24.0, 30.0, 24.0, 22.0, 18.0, 13.0, 8.0, 14.0, 13.0, 7.0, 9.0, 10.0, 8.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-34.15625, -33.03369140625, -31.9111328125, -30.78857421875, -29.666015625, -28.54345703125, -27.4208984375, -26.29833984375, -25.17578125, -24.05322265625, -22.9306640625, -21.80810546875, -20.685546875, -19.56298828125, -18.4404296875, -17.31787109375, -16.1953125, -15.07275390625, -13.9501953125, -12.82763671875, -11.705078125, -10.58251953125, -9.4599609375, -8.33740234375, -7.21484375, -6.09228515625, -4.9697265625, -3.84716796875, -2.724609375, -1.60205078125, -0.4794921875, 0.64306640625, 1.765625, 2.88818359375, 4.0107421875, 5.13330078125, 6.255859375, 7.37841796875, 8.5009765625, 9.62353515625, 10.74609375, 11.86865234375, 12.9912109375, 14.11376953125, 15.236328125, 16.35888671875, 17.4814453125, 18.60400390625, 19.7265625, 20.84912109375, 21.9716796875, 23.09423828125, 24.216796875, 25.33935546875, 26.4619140625, 27.58447265625, 28.70703125, 29.82958984375, 30.9521484375, 32.07470703125, 33.197265625, 34.31982421875, 35.4423828125, 36.56494140625, 37.6875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 12.0, 11.0, 40.0, 47.0, 80.0, 187.0, 316.0, 503.0, 930.0, 1631.0, 2811.0, 4885.0, 8121.0, 13628.0, 22503.0, 35537.0, 55377.0, 83809.0, 122556.0, 171686.0, 229483.0, 289896.0, 347312.0, 390185.0, 411643.0, 404652.0, 373954.0, 321127.0, 261643.0, 201698.0, 147447.0, 103217.0, 69427.0, 45506.0, 28663.0, 17715.0, 10835.0, 6447.0, 3838.0, 2091.0, 1224.0, 703.0, 430.0, 233.0, 110.0, 58.0, 30.0, 25.0, 14.0, 7.0, 2.0, 2.0, 2.0, 3.0], "bins": [-37.59375, -36.512451171875, -35.43115234375, -34.349853515625, -33.2685546875, -32.187255859375, -31.10595703125, -30.024658203125, -28.943359375, -27.862060546875, -26.78076171875, -25.699462890625, -24.6181640625, -23.536865234375, -22.45556640625, -21.374267578125, -20.29296875, -19.211669921875, -18.13037109375, -17.049072265625, -15.9677734375, -14.886474609375, -13.80517578125, -12.723876953125, -11.642578125, -10.561279296875, -9.47998046875, -8.398681640625, -7.3173828125, -6.236083984375, -5.15478515625, -4.073486328125, -2.9921875, -1.910888671875, -0.82958984375, 0.251708984375, 1.3330078125, 2.414306640625, 3.49560546875, 4.576904296875, 5.658203125, 6.739501953125, 7.82080078125, 8.902099609375, 9.9833984375, 11.064697265625, 12.14599609375, 13.227294921875, 14.30859375, 15.389892578125, 16.47119140625, 17.552490234375, 18.6337890625, 19.715087890625, 20.79638671875, 21.877685546875, 22.958984375, 24.040283203125, 25.12158203125, 26.202880859375, 27.2841796875, 28.365478515625, 29.44677734375, 30.528076171875, 31.609375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 8.0, 10.0, 12.0, 13.0, 23.0, 28.0, 35.0, 45.0, 61.0, 64.0, 79.0, 77.0, 105.0, 147.0, 114.0, 145.0, 150.0, 187.0, 184.0, 172.0, 201.0, 192.0, 221.0, 186.0, 195.0, 187.0, 168.0, 158.0, 146.0, 121.0, 136.0, 95.0, 73.0, 67.0, 72.0, 42.0, 51.0, 25.0, 25.0, 14.0, 13.0, 11.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.1875, -15.623046875, -15.05859375, -14.494140625, -13.9296875, -13.365234375, -12.80078125, -12.236328125, -11.671875, -11.107421875, -10.54296875, -9.978515625, -9.4140625, -8.849609375, -8.28515625, -7.720703125, -7.15625, -6.591796875, -6.02734375, -5.462890625, -4.8984375, -4.333984375, -3.76953125, -3.205078125, -2.640625, -2.076171875, -1.51171875, -0.947265625, -0.3828125, 0.181640625, 0.74609375, 1.310546875, 1.875, 2.439453125, 3.00390625, 3.568359375, 4.1328125, 4.697265625, 5.26171875, 5.826171875, 6.390625, 6.955078125, 7.51953125, 8.083984375, 8.6484375, 9.212890625, 9.77734375, 10.341796875, 10.90625, 11.470703125, 12.03515625, 12.599609375, 13.1640625, 13.728515625, 14.29296875, 14.857421875, 15.421875, 15.986328125, 16.55078125, 17.115234375, 17.6796875, 18.244140625, 18.80859375, 19.373046875, 19.9375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 5.0, 5.0, 3.0, 9.0, 10.0, 13.0, 13.0, 8.0, 18.0, 16.0, 11.0, 23.0, 18.0, 14.0, 36.0, 34.0, 26.0, 39.0, 38.0, 40.0, 28.0, 39.0, 30.0, 40.0, 44.0, 36.0, 35.0, 42.0, 27.0, 39.0, 29.0, 23.0, 26.0, 20.0, 25.0, 17.0, 18.0, 15.0, 16.0, 16.0, 10.0, 8.0, 4.0, 8.0, 5.0, 5.0, 3.0, 6.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-39.685359954833984, -38.46506881713867, -37.244781494140625, -36.02449035644531, -34.80419921875, -33.58390808105469, -32.363616943359375, -31.143329620361328, -29.923038482666016, -28.702747344970703, -27.482458114624023, -26.262168884277344, -25.04187774658203, -23.82158660888672, -22.60129737854004, -21.38100814819336, -20.160717010498047, -18.940425872802734, -17.720136642456055, -16.499847412109375, -15.279556274414062, -14.059266090393066, -12.83897590637207, -11.618685722351074, -10.398395538330078, -9.178105354309082, -7.957815170288086, -6.73752498626709, -5.517234802246094, -4.296944618225098, -3.0766544342041016, -1.8563642501831055, -0.6360702514648438, 0.5842199325561523, 1.8045101165771484, 3.0248003005981445, 4.245090484619141, 5.465380668640137, 6.685670852661133, 7.905961036682129, 9.126251220703125, 10.346541404724121, 11.566831588745117, 12.787121772766113, 14.00741195678711, 15.227702140808105, 16.4479923248291, 17.66828155517578, 18.888572692871094, 20.108863830566406, 21.329153060913086, 22.549442291259766, 23.769733428955078, 24.99002456665039, 26.21031379699707, 27.43060302734375, 28.650894165039062, 29.871185302734375, 31.091474533081055, 32.311763763427734, 33.53205490112305, 34.75234603881836, 35.972633361816406, 37.19292449951172, 38.41321563720703]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 5.0, 6.0, 8.0, 10.0, 9.0, 15.0, 8.0, 12.0, 24.0, 18.0, 11.0, 26.0, 30.0, 35.0, 31.0, 40.0, 32.0, 35.0, 41.0, 44.0, 31.0, 42.0, 36.0, 31.0, 39.0, 37.0, 39.0, 30.0, 32.0, 24.0, 29.0, 27.0, 21.0, 22.0, 17.0, 17.0, 17.0, 14.0, 11.0, 9.0, 7.0, 3.0, 2.0, 4.0, 4.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-36.868553161621094, -35.66728210449219, -34.46601486206055, -33.26474380493164, -32.063472747802734, -30.86220359802246, -29.660934448242188, -28.45966339111328, -27.258392333984375, -26.0571231842041, -24.855852127075195, -23.654582977294922, -22.453311920166016, -21.252042770385742, -20.05077362060547, -18.849502563476562, -17.64823341369629, -16.446964263916016, -15.24569320678711, -14.044424057006836, -12.84315299987793, -11.641883850097656, -10.440613746643066, -9.239343643188477, -8.038073539733887, -6.836803436279297, -5.635533332824707, -4.434263706207275, -3.2329936027526855, -2.0317234992980957, -0.8304538726806641, 0.3708162307739258, 1.5720863342285156, 2.7733564376831055, 3.974626302719116, 5.175896167755127, 6.377166271209717, 7.578436374664307, 8.779706001281738, 9.980976104736328, 11.182246208190918, 12.383516311645508, 13.584786415100098, 14.786056518554688, 15.987325668334961, 17.188596725463867, 18.38986587524414, 19.591136932373047, 20.79240608215332, 21.993675231933594, 23.1949462890625, 24.396215438842773, 25.59748649597168, 26.798755645751953, 28.00002670288086, 29.201295852661133, 30.402565002441406, 31.60383415222168, 32.80510330200195, 34.00637435913086, 35.207645416259766, 36.40891647338867, 37.61018371582031, 38.81145477294922, 40.012725830078125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 8.0, 10.0, 17.0, 22.0, 48.0, 67.0, 99.0, 123.0, 227.0, 266.0, 466.0, 688.0, 969.0, 1622.0, 2601.0, 4127.0, 6936.0, 11892.0, 19862.0, 33587.0, 56175.0, 87460.0, 126518.0, 155400.0, 159654.0, 132689.0, 94020.0, 60897.0, 37011.0, 22218.0, 12755.0, 7593.0, 4664.0, 2843.0, 1777.0, 1128.0, 714.0, 468.0, 328.0, 185.0, 150.0, 90.0, 66.0, 49.0, 29.0, 18.0, 4.0, 8.0, 10.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.390625, -21.646484375, -20.90234375, -20.158203125, -19.4140625, -18.669921875, -17.92578125, -17.181640625, -16.4375, -15.693359375, -14.94921875, -14.205078125, -13.4609375, -12.716796875, -11.97265625, -11.228515625, -10.484375, -9.740234375, -8.99609375, -8.251953125, -7.5078125, -6.763671875, -6.01953125, -5.275390625, -4.53125, -3.787109375, -3.04296875, -2.298828125, -1.5546875, -0.810546875, -0.06640625, 0.677734375, 1.421875, 2.166015625, 2.91015625, 3.654296875, 4.3984375, 5.142578125, 5.88671875, 6.630859375, 7.375, 8.119140625, 8.86328125, 9.607421875, 10.3515625, 11.095703125, 11.83984375, 12.583984375, 13.328125, 14.072265625, 14.81640625, 15.560546875, 16.3046875, 17.048828125, 17.79296875, 18.537109375, 19.28125, 20.025390625, 20.76953125, 21.513671875, 22.2578125, 23.001953125, 23.74609375, 24.490234375, 25.234375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 5.0, 6.0, 6.0, 12.0, 8.0, 15.0, 8.0, 11.0, 23.0, 19.0, 12.0, 27.0, 26.0, 36.0, 33.0, 37.0, 30.0, 42.0, 37.0, 42.0, 35.0, 40.0, 35.0, 35.0, 38.0, 37.0, 38.0, 32.0, 30.0, 27.0, 25.0, 30.0, 18.0, 22.0, 21.0, 12.0, 22.0, 13.0, 11.0, 10.0, 7.0, 3.0, 2.0, 3.0, 5.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-37.1875, -35.98486328125, -34.7822265625, -33.57958984375, -32.376953125, -31.17431640625, -29.9716796875, -28.76904296875, -27.56640625, -26.36376953125, -25.1611328125, -23.95849609375, -22.755859375, -21.55322265625, -20.3505859375, -19.14794921875, -17.9453125, -16.74267578125, -15.5400390625, -14.33740234375, -13.134765625, -11.93212890625, -10.7294921875, -9.52685546875, -8.32421875, -7.12158203125, -5.9189453125, -4.71630859375, -3.513671875, -2.31103515625, -1.1083984375, 0.09423828125, 1.296875, 2.49951171875, 3.7021484375, 4.90478515625, 6.107421875, 7.31005859375, 8.5126953125, 9.71533203125, 10.91796875, 12.12060546875, 13.3232421875, 14.52587890625, 15.728515625, 16.93115234375, 18.1337890625, 19.33642578125, 20.5390625, 21.74169921875, 22.9443359375, 24.14697265625, 25.349609375, 26.55224609375, 27.7548828125, 28.95751953125, 30.16015625, 31.36279296875, 32.5654296875, 33.76806640625, 34.970703125, 36.17333984375, 37.3759765625, 38.57861328125, 39.78125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 7.0, 6.0, 11.0, 18.0, 17.0, 25.0, 45.0, 60.0, 108.0, 174.0, 230.0, 367.0, 538.0, 920.0, 1627.0, 2748.0, 4990.0, 10039.0, 20660.0, 46988.0, 110787.0, 231588.0, 290905.0, 179609.0, 79186.0, 34249.0, 15418.0, 7598.0, 3968.0, 2250.0, 1280.0, 775.0, 482.0, 303.0, 209.0, 124.0, 81.0, 51.0, 45.0, 18.0, 15.0, 12.0, 9.0, 5.0, 3.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0], "bins": [-36.28125, -35.19189453125, -34.1025390625, -33.01318359375, -31.923828125, -30.83447265625, -29.7451171875, -28.65576171875, -27.56640625, -26.47705078125, -25.3876953125, -24.29833984375, -23.208984375, -22.11962890625, -21.0302734375, -19.94091796875, -18.8515625, -17.76220703125, -16.6728515625, -15.58349609375, -14.494140625, -13.40478515625, -12.3154296875, -11.22607421875, -10.13671875, -9.04736328125, -7.9580078125, -6.86865234375, -5.779296875, -4.68994140625, -3.6005859375, -2.51123046875, -1.421875, -0.33251953125, 0.7568359375, 1.84619140625, 2.935546875, 4.02490234375, 5.1142578125, 6.20361328125, 7.29296875, 8.38232421875, 9.4716796875, 10.56103515625, 11.650390625, 12.73974609375, 13.8291015625, 14.91845703125, 16.0078125, 17.09716796875, 18.1865234375, 19.27587890625, 20.365234375, 21.45458984375, 22.5439453125, 23.63330078125, 24.72265625, 25.81201171875, 26.9013671875, 27.99072265625, 29.080078125, 30.16943359375, 31.2587890625, 32.34814453125, 33.4375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 6.0, 12.0, 6.0, 6.0, 11.0, 14.0, 24.0, 15.0, 25.0, 25.0, 33.0, 24.0, 41.0, 42.0, 42.0, 43.0, 30.0, 52.0, 32.0, 39.0, 46.0, 54.0, 37.0, 44.0, 36.0, 39.0, 39.0, 27.0, 26.0, 23.0, 18.0, 21.0, 14.0, 14.0, 14.0, 6.0, 10.0, 4.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.28125, -25.384033203125, -24.48681640625, -23.589599609375, -22.6923828125, -21.795166015625, -20.89794921875, -20.000732421875, -19.103515625, -18.206298828125, -17.30908203125, -16.411865234375, -15.5146484375, -14.617431640625, -13.72021484375, -12.822998046875, -11.92578125, -11.028564453125, -10.13134765625, -9.234130859375, -8.3369140625, -7.439697265625, -6.54248046875, -5.645263671875, -4.748046875, -3.850830078125, -2.95361328125, -2.056396484375, -1.1591796875, -0.261962890625, 0.63525390625, 1.532470703125, 2.4296875, 3.326904296875, 4.22412109375, 5.121337890625, 6.0185546875, 6.915771484375, 7.81298828125, 8.710205078125, 9.607421875, 10.504638671875, 11.40185546875, 12.299072265625, 13.1962890625, 14.093505859375, 14.99072265625, 15.887939453125, 16.78515625, 17.682373046875, 18.57958984375, 19.476806640625, 20.3740234375, 21.271240234375, 22.16845703125, 23.065673828125, 23.962890625, 24.860107421875, 25.75732421875, 26.654541015625, 27.5517578125, 28.448974609375, 29.34619140625, 30.243408203125, 31.140625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 5.0, 5.0, 6.0, 11.0, 5.0, 15.0, 25.0, 33.0, 51.0, 84.0, 98.0, 159.0, 224.0, 363.0, 528.0, 847.0, 1156.0, 1805.0, 2928.0, 4462.0, 7607.0, 13232.0, 25012.0, 50976.0, 113499.0, 249615.0, 292059.0, 148600.0, 64307.0, 30843.0, 15990.0, 9090.0, 5500.0, 3345.0, 2093.0, 1327.0, 839.0, 611.0, 373.0, 258.0, 192.0, 120.0, 70.0, 62.0, 43.0, 25.0, 21.0, 11.0, 10.0, 6.0, 6.0, 2.0, 7.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.3125, -14.787353515625, -14.26220703125, -13.737060546875, -13.2119140625, -12.686767578125, -12.16162109375, -11.636474609375, -11.111328125, -10.586181640625, -10.06103515625, -9.535888671875, -9.0107421875, -8.485595703125, -7.96044921875, -7.435302734375, -6.91015625, -6.385009765625, -5.85986328125, -5.334716796875, -4.8095703125, -4.284423828125, -3.75927734375, -3.234130859375, -2.708984375, -2.183837890625, -1.65869140625, -1.133544921875, -0.6083984375, -0.083251953125, 0.44189453125, 0.967041015625, 1.4921875, 2.017333984375, 2.54248046875, 3.067626953125, 3.5927734375, 4.117919921875, 4.64306640625, 5.168212890625, 5.693359375, 6.218505859375, 6.74365234375, 7.268798828125, 7.7939453125, 8.319091796875, 8.84423828125, 9.369384765625, 9.89453125, 10.419677734375, 10.94482421875, 11.469970703125, 11.9951171875, 12.520263671875, 13.04541015625, 13.570556640625, 14.095703125, 14.620849609375, 15.14599609375, 15.671142578125, 16.1962890625, 16.721435546875, 17.24658203125, 17.771728515625, 18.296875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 4.0, 11.0, 8.0, 12.0, 6.0, 10.0, 13.0, 13.0, 19.0, 27.0, 30.0, 36.0, 40.0, 42.0, 53.0, 45.0, 67.0, 56.0, 63.0, 51.0, 59.0, 50.0, 50.0, 47.0, 43.0, 23.0, 18.0, 24.0, 18.0, 12.0, 17.0, 7.0, 6.0, 6.0, 7.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006880760192871094, -0.000661902129650116, -0.0006357282400131226, -0.0006095543503761292, -0.0005833804607391357, -0.0005572065711021423, -0.0005310326814651489, -0.0005048587918281555, -0.0004786849021911621, -0.0004525110125541687, -0.0004263371229171753, -0.0004001632332801819, -0.0003739893436431885, -0.00034781545400619507, -0.00032164156436920166, -0.00029546767473220825, -0.00026929378509521484, -0.00024311989545822144, -0.00021694600582122803, -0.00019077211618423462, -0.0001645982265472412, -0.0001384243369102478, -0.0001122504472732544, -8.607655763626099e-05, -5.990266799926758e-05, -3.372877836227417e-05, -7.554888725280762e-06, 1.8619000911712646e-05, 4.4792890548706055e-05, 7.096678018569946e-05, 9.714066982269287e-05, 0.00012331455945968628, 0.0001494884490966797, 0.0001756623387336731, 0.0002018362283706665, 0.0002280101180076599, 0.0002541840076446533, 0.00028035789728164673, 0.00030653178691864014, 0.00033270567655563354, 0.00035887956619262695, 0.00038505345582962036, 0.00041122734546661377, 0.0004374012351036072, 0.0004635751247406006, 0.000489749014377594, 0.0005159229040145874, 0.0005420967936515808, 0.0005682706832885742, 0.0005944445729255676, 0.000620618462562561, 0.0006467923521995544, 0.0006729662418365479, 0.0006991401314735413, 0.0007253140211105347, 0.0007514879107475281, 0.0007776618003845215, 0.0008038356900215149, 0.0008300095796585083, 0.0008561834692955017, 0.0008823573589324951, 0.0009085312485694885, 0.0009347051382064819, 0.0009608790278434753, 0.0009870529174804688]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 3.0, 8.0, 6.0, 20.0, 30.0, 49.0, 63.0, 78.0, 148.0, 165.0, 241.0, 340.0, 534.0, 773.0, 1152.0, 1647.0, 2428.0, 3705.0, 5655.0, 8478.0, 13311.0, 20342.0, 32355.0, 49443.0, 74263.0, 104213.0, 132362.0, 144146.0, 132173.0, 104790.0, 74291.0, 49662.0, 32033.0, 20545.0, 13339.0, 8580.0, 5816.0, 3729.0, 2447.0, 1601.0, 1135.0, 761.0, 528.0, 379.0, 263.0, 151.0, 123.0, 79.0, 56.0, 44.0, 26.0, 21.0, 14.0, 8.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-15.84375, -15.3408203125, -14.837890625, -14.3349609375, -13.83203125, -13.3291015625, -12.826171875, -12.3232421875, -11.8203125, -11.3173828125, -10.814453125, -10.3115234375, -9.80859375, -9.3056640625, -8.802734375, -8.2998046875, -7.796875, -7.2939453125, -6.791015625, -6.2880859375, -5.78515625, -5.2822265625, -4.779296875, -4.2763671875, -3.7734375, -3.2705078125, -2.767578125, -2.2646484375, -1.76171875, -1.2587890625, -0.755859375, -0.2529296875, 0.25, 0.7529296875, 1.255859375, 1.7587890625, 2.26171875, 2.7646484375, 3.267578125, 3.7705078125, 4.2734375, 4.7763671875, 5.279296875, 5.7822265625, 6.28515625, 6.7880859375, 7.291015625, 7.7939453125, 8.296875, 8.7998046875, 9.302734375, 9.8056640625, 10.30859375, 10.8115234375, 11.314453125, 11.8173828125, 12.3203125, 12.8232421875, 13.326171875, 13.8291015625, 14.33203125, 14.8349609375, 15.337890625, 15.8408203125, 16.34375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 3.0, 4.0, 8.0, 8.0, 3.0, 8.0, 7.0, 12.0, 19.0, 16.0, 32.0, 27.0, 42.0, 33.0, 51.0, 48.0, 55.0, 48.0, 57.0, 63.0, 61.0, 57.0, 56.0, 39.0, 32.0, 36.0, 36.0, 25.0, 19.0, 12.0, 16.0, 11.0, 6.0, 13.0, 7.0, 3.0, 7.0, 5.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.3671875, -6.182373046875, -5.99755859375, -5.812744140625, -5.6279296875, -5.443115234375, -5.25830078125, -5.073486328125, -4.888671875, -4.703857421875, -4.51904296875, -4.334228515625, -4.1494140625, -3.964599609375, -3.77978515625, -3.594970703125, -3.41015625, -3.225341796875, -3.04052734375, -2.855712890625, -2.6708984375, -2.486083984375, -2.30126953125, -2.116455078125, -1.931640625, -1.746826171875, -1.56201171875, -1.377197265625, -1.1923828125, -1.007568359375, -0.82275390625, -0.637939453125, -0.453125, -0.268310546875, -0.08349609375, 0.101318359375, 0.2861328125, 0.470947265625, 0.65576171875, 0.840576171875, 1.025390625, 1.210205078125, 1.39501953125, 1.579833984375, 1.7646484375, 1.949462890625, 2.13427734375, 2.319091796875, 2.50390625, 2.688720703125, 2.87353515625, 3.058349609375, 3.2431640625, 3.427978515625, 3.61279296875, 3.797607421875, 3.982421875, 4.167236328125, 4.35205078125, 4.536865234375, 4.7216796875, 4.906494140625, 5.09130859375, 5.276123046875, 5.4609375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 2.0, 4.0, 3.0, 7.0, 4.0, 12.0, 13.0, 17.0, 10.0, 10.0, 14.0, 17.0, 18.0, 21.0, 28.0, 26.0, 27.0, 41.0, 52.0, 22.0, 41.0, 31.0, 31.0, 44.0, 35.0, 42.0, 36.0, 44.0, 32.0, 45.0, 27.0, 26.0, 21.0, 28.0, 23.0, 24.0, 25.0, 10.0, 14.0, 17.0, 5.0, 8.0, 10.0, 8.0, 7.0, 6.0, 2.0, 6.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0], "bins": [-40.318756103515625, -39.06785583496094, -37.81695556640625, -36.5660514831543, -35.31515121459961, -34.06425094604492, -32.813350677490234, -31.562450408935547, -30.311548233032227, -29.06064796447754, -27.80974578857422, -26.55884552001953, -25.307945251464844, -24.057043075561523, -22.806142807006836, -21.555240631103516, -20.304340362548828, -19.05344009399414, -17.80253791809082, -16.551637649536133, -15.300736427307129, -14.049835205078125, -12.798934936523438, -11.548033714294434, -10.29713249206543, -9.046231269836426, -7.79533052444458, -6.544429779052734, -5.2935285568237305, -4.042627334594727, -2.791726589202881, -1.5408258438110352, -0.2899284362792969, 0.9609725475311279, 2.2118735313415527, 3.4627745151519775, 4.713675498962402, 5.964576721191406, 7.215477466583252, 8.466378211975098, 9.717279434204102, 10.968180656433105, 12.21908187866211, 13.469982147216797, 14.7208833694458, 15.971784591674805, 17.222684860229492, 18.473587036132812, 19.7244873046875, 20.975387573242188, 22.226289749145508, 23.477190017700195, 24.728092193603516, 25.978992462158203, 27.22989273071289, 28.480792999267578, 29.7316951751709, 30.982595443725586, 32.233497619628906, 33.484397888183594, 34.73529815673828, 35.98619842529297, 37.23710250854492, 38.48800277709961, 39.7389030456543]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 7.0, 1.0, 7.0, 10.0, 14.0, 9.0, 11.0, 9.0, 12.0, 22.0, 18.0, 19.0, 27.0, 24.0, 32.0, 37.0, 29.0, 32.0, 41.0, 33.0, 44.0, 39.0, 38.0, 32.0, 36.0, 40.0, 40.0, 34.0, 27.0, 28.0, 34.0, 32.0, 20.0, 23.0, 16.0, 19.0, 18.0, 15.0, 18.0, 9.0, 10.0, 7.0, 4.0, 4.0, 3.0, 5.0, 2.0, 4.0, 1.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-35.19147491455078, -34.01076889038086, -32.83006286621094, -31.64935302734375, -30.468647003173828, -29.287940979003906, -28.10723304748535, -26.926525115966797, -25.745819091796875, -24.565113067626953, -23.3844051361084, -22.203697204589844, -21.022991180419922, -19.84228515625, -18.661577224731445, -17.48086929321289, -16.30016326904297, -15.11945629119873, -13.938749313354492, -12.758042335510254, -11.577335357666016, -10.396628379821777, -9.215921401977539, -8.0352144241333, -6.8545074462890625, -5.673800468444824, -4.493093490600586, -3.3123865127563477, -2.1316795349121094, -0.9509725570678711, 0.2297344207763672, 1.4104413986206055, 2.591144561767578, 3.7718515396118164, 4.952558517456055, 6.133265495300293, 7.313972473144531, 8.49467945098877, 9.675386428833008, 10.856093406677246, 12.036800384521484, 13.217507362365723, 14.398214340209961, 15.5789213180542, 16.759628295898438, 17.94033432006836, 19.121042251586914, 20.30175018310547, 21.48245620727539, 22.663162231445312, 23.843870162963867, 25.024578094482422, 26.205284118652344, 27.385990142822266, 28.56669807434082, 29.747406005859375, 30.928112030029297, 32.10881805419922, 33.289527893066406, 34.47023391723633, 35.65093994140625, 36.83164596557617, 38.012351989746094, 39.19306182861328, 40.3737678527832]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 6.0, 11.0, 11.0, 10.0, 24.0, 42.0, 58.0, 80.0, 135.0, 224.0, 327.0, 499.0, 800.0, 1198.0, 1903.0, 2859.0, 4361.0, 6273.0, 9113.0, 13293.0, 18676.0, 25022.0, 33693.0, 42884.0, 53121.0, 63857.0, 73513.0, 80974.0, 84479.0, 85061.0, 81398.0, 74727.0, 65357.0, 54941.0, 44748.0, 34829.0, 26354.0, 19569.0, 13971.0, 9861.0, 6929.0, 4662.0, 2938.0, 2012.0, 1372.0, 849.0, 562.0, 368.0, 227.0, 139.0, 88.0, 63.0, 43.0, 20.0, 15.0, 5.0, 3.0, 3.0, 7.0, 4.0, 0.0, 1.0], "bins": [-29.640625, -28.68701171875, -27.7333984375, -26.77978515625, -25.826171875, -24.87255859375, -23.9189453125, -22.96533203125, -22.01171875, -21.05810546875, -20.1044921875, -19.15087890625, -18.197265625, -17.24365234375, -16.2900390625, -15.33642578125, -14.3828125, -13.42919921875, -12.4755859375, -11.52197265625, -10.568359375, -9.61474609375, -8.6611328125, -7.70751953125, -6.75390625, -5.80029296875, -4.8466796875, -3.89306640625, -2.939453125, -1.98583984375, -1.0322265625, -0.07861328125, 0.875, 1.82861328125, 2.7822265625, 3.73583984375, 4.689453125, 5.64306640625, 6.5966796875, 7.55029296875, 8.50390625, 9.45751953125, 10.4111328125, 11.36474609375, 12.318359375, 13.27197265625, 14.2255859375, 15.17919921875, 16.1328125, 17.08642578125, 18.0400390625, 18.99365234375, 19.947265625, 20.90087890625, 21.8544921875, 22.80810546875, 23.76171875, 24.71533203125, 25.6689453125, 26.62255859375, 27.576171875, 28.52978515625, 29.4833984375, 30.43701171875, 31.390625]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 8.0, 1.0, 7.0, 13.0, 12.0, 7.0, 11.0, 12.0, 11.0, 20.0, 15.0, 25.0, 27.0, 23.0, 35.0, 36.0, 33.0, 27.0, 44.0, 39.0, 43.0, 39.0, 35.0, 28.0, 42.0, 40.0, 37.0, 36.0, 26.0, 25.0, 37.0, 30.0, 25.0, 20.0, 16.0, 15.0, 17.0, 19.0, 15.0, 9.0, 8.0, 8.0, 4.0, 2.0, 3.0, 6.0, 1.0, 4.0, 1.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-33.96875, -32.82373046875, -31.6787109375, -30.53369140625, -29.388671875, -28.24365234375, -27.0986328125, -25.95361328125, -24.80859375, -23.66357421875, -22.5185546875, -21.37353515625, -20.228515625, -19.08349609375, -17.9384765625, -16.79345703125, -15.6484375, -14.50341796875, -13.3583984375, -12.21337890625, -11.068359375, -9.92333984375, -8.7783203125, -7.63330078125, -6.48828125, -5.34326171875, -4.1982421875, -3.05322265625, -1.908203125, -0.76318359375, 0.3818359375, 1.52685546875, 2.671875, 3.81689453125, 4.9619140625, 6.10693359375, 7.251953125, 8.39697265625, 9.5419921875, 10.68701171875, 11.83203125, 12.97705078125, 14.1220703125, 15.26708984375, 16.412109375, 17.55712890625, 18.7021484375, 19.84716796875, 20.9921875, 22.13720703125, 23.2822265625, 24.42724609375, 25.572265625, 26.71728515625, 27.8623046875, 29.00732421875, 30.15234375, 31.29736328125, 32.4423828125, 33.58740234375, 34.732421875, 35.87744140625, 37.0224609375, 38.16748046875, 39.3125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 9.0, 10.0, 15.0, 31.0, 39.0, 75.0, 142.0, 221.0, 345.0, 559.0, 891.0, 1408.0, 2044.0, 3231.0, 4890.0, 7122.0, 10389.0, 14729.0, 20714.0, 28296.0, 36994.0, 47075.0, 57444.0, 68494.0, 76683.0, 83043.0, 85577.0, 84768.0, 80355.0, 71064.0, 61781.0, 50770.0, 40697.0, 31355.0, 23485.0, 17162.0, 12000.0, 8264.0, 5628.0, 3829.0, 2490.0, 1602.0, 1042.0, 678.0, 414.0, 262.0, 177.0, 111.0, 68.0, 44.0, 22.0, 9.0, 7.0, 6.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.96875, -29.023193359375, -28.07763671875, -27.132080078125, -26.1865234375, -25.240966796875, -24.29541015625, -23.349853515625, -22.404296875, -21.458740234375, -20.51318359375, -19.567626953125, -18.6220703125, -17.676513671875, -16.73095703125, -15.785400390625, -14.83984375, -13.894287109375, -12.94873046875, -12.003173828125, -11.0576171875, -10.112060546875, -9.16650390625, -8.220947265625, -7.275390625, -6.329833984375, -5.38427734375, -4.438720703125, -3.4931640625, -2.547607421875, -1.60205078125, -0.656494140625, 0.2890625, 1.234619140625, 2.18017578125, 3.125732421875, 4.0712890625, 5.016845703125, 5.96240234375, 6.907958984375, 7.853515625, 8.799072265625, 9.74462890625, 10.690185546875, 11.6357421875, 12.581298828125, 13.52685546875, 14.472412109375, 15.41796875, 16.363525390625, 17.30908203125, 18.254638671875, 19.2001953125, 20.145751953125, 21.09130859375, 22.036865234375, 22.982421875, 23.927978515625, 24.87353515625, 25.819091796875, 26.7646484375, 27.710205078125, 28.65576171875, 29.601318359375, 30.546875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 5.0, 6.0, 7.0, 8.0, 7.0, 17.0, 13.0, 13.0, 15.0, 27.0, 31.0, 25.0, 32.0, 29.0, 35.0, 40.0, 30.0, 41.0, 50.0, 35.0, 46.0, 39.0, 45.0, 45.0, 39.0, 31.0, 58.0, 32.0, 33.0, 20.0, 34.0, 11.0, 15.0, 18.0, 15.0, 14.0, 4.0, 10.0, 8.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.5, -27.634765625, -26.76953125, -25.904296875, -25.0390625, -24.173828125, -23.30859375, -22.443359375, -21.578125, -20.712890625, -19.84765625, -18.982421875, -18.1171875, -17.251953125, -16.38671875, -15.521484375, -14.65625, -13.791015625, -12.92578125, -12.060546875, -11.1953125, -10.330078125, -9.46484375, -8.599609375, -7.734375, -6.869140625, -6.00390625, -5.138671875, -4.2734375, -3.408203125, -2.54296875, -1.677734375, -0.8125, 0.052734375, 0.91796875, 1.783203125, 2.6484375, 3.513671875, 4.37890625, 5.244140625, 6.109375, 6.974609375, 7.83984375, 8.705078125, 9.5703125, 10.435546875, 11.30078125, 12.166015625, 13.03125, 13.896484375, 14.76171875, 15.626953125, 16.4921875, 17.357421875, 18.22265625, 19.087890625, 19.953125, 20.818359375, 21.68359375, 22.548828125, 23.4140625, 24.279296875, 25.14453125, 26.009765625, 26.875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 10.0, 8.0, 20.0, 27.0, 49.0, 87.0, 127.0, 230.0, 416.0, 610.0, 1084.0, 1822.0, 3155.0, 5462.0, 9070.0, 14868.0, 23886.0, 36973.0, 54590.0, 76167.0, 97731.0, 115073.0, 122670.0, 119296.0, 104340.0, 83320.0, 61850.0, 42827.0, 28356.0, 17798.0, 10961.0, 6477.0, 3794.0, 2214.0, 1295.0, 789.0, 416.0, 277.0, 154.0, 101.0, 61.0, 38.0, 25.0, 12.0, 9.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.7734375, -15.2755126953125, -14.777587890625, -14.2796630859375, -13.78173828125, -13.2838134765625, -12.785888671875, -12.2879638671875, -11.7900390625, -11.2921142578125, -10.794189453125, -10.2962646484375, -9.79833984375, -9.3004150390625, -8.802490234375, -8.3045654296875, -7.806640625, -7.3087158203125, -6.810791015625, -6.3128662109375, -5.81494140625, -5.3170166015625, -4.819091796875, -4.3211669921875, -3.8232421875, -3.3253173828125, -2.827392578125, -2.3294677734375, -1.83154296875, -1.3336181640625, -0.835693359375, -0.3377685546875, 0.16015625, 0.6580810546875, 1.156005859375, 1.6539306640625, 2.15185546875, 2.6497802734375, 3.147705078125, 3.6456298828125, 4.1435546875, 4.6414794921875, 5.139404296875, 5.6373291015625, 6.13525390625, 6.6331787109375, 7.131103515625, 7.6290283203125, 8.126953125, 8.6248779296875, 9.122802734375, 9.6207275390625, 10.11865234375, 10.6165771484375, 11.114501953125, 11.6124267578125, 12.1103515625, 12.6082763671875, 13.106201171875, 13.6041259765625, 14.10205078125, 14.5999755859375, 15.097900390625, 15.5958251953125, 16.09375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 7.0, 5.0, 5.0, 2.0, 10.0, 15.0, 22.0, 14.0, 19.0, 28.0, 21.0, 31.0, 25.0, 29.0, 35.0, 44.0, 36.0, 42.0, 49.0, 43.0, 51.0, 41.0, 53.0, 30.0, 41.0, 40.0, 38.0, 45.0, 22.0, 23.0, 29.0, 22.0, 16.0, 17.0, 14.0, 11.0, 7.0, 7.0, 4.0, 6.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.002002716064453125, -0.001947358250617981, -0.001892000436782837, -0.0018366426229476929, -0.0017812848091125488, -0.0017259269952774048, -0.0016705691814422607, -0.0016152113676071167, -0.0015598535537719727, -0.0015044957399368286, -0.0014491379261016846, -0.0013937801122665405, -0.0013384222984313965, -0.0012830644845962524, -0.0012277066707611084, -0.0011723488569259644, -0.0011169910430908203, -0.0010616332292556763, -0.0010062754154205322, -0.0009509176015853882, -0.0008955597877502441, -0.0008402019739151001, -0.0007848441600799561, -0.000729486346244812, -0.000674128532409668, -0.0006187707185745239, -0.0005634129047393799, -0.0005080550909042358, -0.0004526972770690918, -0.00039733946323394775, -0.0003419816493988037, -0.00028662383556365967, -0.00023126602172851562, -0.00017590820789337158, -0.00012055039405822754, -6.51925802230835e-05, -9.834766387939453e-06, 4.552304744720459e-05, 0.00010088086128234863, 0.00015623867511749268, 0.00021159648895263672, 0.00026695430278778076, 0.0003223121166229248, 0.00037766993045806885, 0.0004330277442932129, 0.0004883855581283569, 0.000543743371963501, 0.000599101185798645, 0.0006544589996337891, 0.0007098168134689331, 0.0007651746273040771, 0.0008205324411392212, 0.0008758902549743652, 0.0009312480688095093, 0.0009866058826446533, 0.0010419636964797974, 0.0010973215103149414, 0.0011526793241500854, 0.0012080371379852295, 0.0012633949518203735, 0.0013187527656555176, 0.0013741105794906616, 0.0014294683933258057, 0.0014848262071609497, 0.0015401840209960938]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 5.0, 2.0, 4.0, 12.0, 20.0, 22.0, 50.0, 71.0, 74.0, 147.0, 232.0, 299.0, 476.0, 823.0, 1237.0, 2006.0, 3391.0, 5317.0, 8189.0, 13356.0, 20449.0, 31074.0, 44688.0, 61906.0, 80729.0, 97591.0, 109126.0, 112434.0, 107326.0, 94017.0, 75855.0, 57447.0, 41210.0, 28082.0, 18668.0, 12052.0, 7392.0, 4783.0, 3038.0, 1746.0, 1111.0, 738.0, 475.0, 294.0, 216.0, 132.0, 85.0, 51.0, 42.0, 24.0, 17.0, 16.0, 8.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-15.703125, -15.186279296875, -14.66943359375, -14.152587890625, -13.6357421875, -13.118896484375, -12.60205078125, -12.085205078125, -11.568359375, -11.051513671875, -10.53466796875, -10.017822265625, -9.5009765625, -8.984130859375, -8.46728515625, -7.950439453125, -7.43359375, -6.916748046875, -6.39990234375, -5.883056640625, -5.3662109375, -4.849365234375, -4.33251953125, -3.815673828125, -3.298828125, -2.781982421875, -2.26513671875, -1.748291015625, -1.2314453125, -0.714599609375, -0.19775390625, 0.319091796875, 0.8359375, 1.352783203125, 1.86962890625, 2.386474609375, 2.9033203125, 3.420166015625, 3.93701171875, 4.453857421875, 4.970703125, 5.487548828125, 6.00439453125, 6.521240234375, 7.0380859375, 7.554931640625, 8.07177734375, 8.588623046875, 9.10546875, 9.622314453125, 10.13916015625, 10.656005859375, 11.1728515625, 11.689697265625, 12.20654296875, 12.723388671875, 13.240234375, 13.757080078125, 14.27392578125, 14.790771484375, 15.3076171875, 15.824462890625, 16.34130859375, 16.858154296875, 17.375]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 3.0, 8.0, 8.0, 9.0, 10.0, 18.0, 12.0, 30.0, 34.0, 31.0, 36.0, 46.0, 45.0, 35.0, 54.0, 44.0, 56.0, 59.0, 44.0, 56.0, 56.0, 46.0, 34.0, 50.0, 32.0, 31.0, 20.0, 17.0, 18.0, 12.0, 6.0, 9.0, 9.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.1953125, -8.90771484375, -8.6201171875, -8.33251953125, -8.044921875, -7.75732421875, -7.4697265625, -7.18212890625, -6.89453125, -6.60693359375, -6.3193359375, -6.03173828125, -5.744140625, -5.45654296875, -5.1689453125, -4.88134765625, -4.59375, -4.30615234375, -4.0185546875, -3.73095703125, -3.443359375, -3.15576171875, -2.8681640625, -2.58056640625, -2.29296875, -2.00537109375, -1.7177734375, -1.43017578125, -1.142578125, -0.85498046875, -0.5673828125, -0.27978515625, 0.0078125, 0.29541015625, 0.5830078125, 0.87060546875, 1.158203125, 1.44580078125, 1.7333984375, 2.02099609375, 2.30859375, 2.59619140625, 2.8837890625, 3.17138671875, 3.458984375, 3.74658203125, 4.0341796875, 4.32177734375, 4.609375, 4.89697265625, 5.1845703125, 5.47216796875, 5.759765625, 6.04736328125, 6.3349609375, 6.62255859375, 6.91015625, 7.19775390625, 7.4853515625, 7.77294921875, 8.060546875, 8.34814453125, 8.6357421875, 8.92333984375, 9.2109375]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 3.0, 8.0, 6.0, 7.0, 13.0, 16.0, 12.0, 24.0, 20.0, 15.0, 28.0, 25.0, 25.0, 35.0, 41.0, 30.0, 37.0, 38.0, 47.0, 44.0, 39.0, 42.0, 50.0, 39.0, 38.0, 40.0, 42.0, 33.0, 27.0, 29.0, 21.0, 17.0, 15.0, 19.0, 10.0, 17.0, 5.0, 9.0, 5.0, 7.0, 4.0, 5.0, 6.0, 0.0, 1.0, 7.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-44.46174240112305, -43.09592056274414, -41.73009490966797, -40.36427307128906, -38.99844741821289, -37.632625579833984, -36.26679992675781, -34.900978088378906, -33.535152435302734, -32.16933059692383, -30.803504943847656, -29.437681198120117, -28.071857452392578, -26.70603370666504, -25.3402099609375, -23.974388122558594, -22.608564376831055, -21.242740631103516, -19.876916885375977, -18.511093139648438, -17.1452693939209, -15.77944564819336, -14.413622856140137, -13.047799110412598, -11.681975364685059, -10.31615161895752, -8.95032787322998, -7.5845046043396, -6.2186808586120605, -4.8528571128845215, -3.4870338439941406, -2.1212100982666016, -0.7553863525390625, 0.610437273979187, 1.9762609004974365, 3.3420844078063965, 4.7079081535339355, 6.073731899261475, 7.4395551681518555, 8.805378913879395, 10.171202659606934, 11.537026405334473, 12.902850151062012, 14.268672943115234, 15.634496688842773, 17.000320434570312, 18.36614418029785, 19.73196792602539, 21.09779167175293, 22.46361541748047, 23.829439163208008, 25.195262908935547, 26.561086654663086, 27.926910400390625, 29.29273223876953, 30.658557891845703, 32.02437973022461, 33.390201568603516, 34.75602722167969, 36.121849060058594, 37.487674713134766, 38.85349655151367, 40.219322204589844, 41.58514404296875, 42.95096969604492]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 11.0, 5.0, 3.0, 4.0, 9.0, 8.0, 12.0, 14.0, 9.0, 17.0, 19.0, 19.0, 25.0, 31.0, 28.0, 37.0, 38.0, 40.0, 32.0, 33.0, 34.0, 36.0, 36.0, 33.0, 46.0, 44.0, 35.0, 32.0, 35.0, 28.0, 32.0, 33.0, 17.0, 28.0, 22.0, 26.0, 16.0, 13.0, 13.0, 10.0, 8.0, 5.0, 7.0, 5.0, 5.0, 6.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.35667037963867, -35.100257873535156, -33.843841552734375, -32.58742904663086, -31.331016540527344, -30.074602127075195, -28.818187713623047, -27.56177520751953, -26.305360794067383, -25.048946380615234, -23.79253387451172, -22.53611946105957, -21.279705047607422, -20.023292541503906, -18.766878128051758, -17.51046371459961, -16.254051208496094, -14.997637748718262, -13.74122428894043, -12.484809875488281, -11.22839641571045, -9.971982955932617, -8.715568542480469, -7.459155082702637, -6.202741622924805, -4.946328163146973, -3.6899142265319824, -2.4335005283355713, -1.1770868301391602, 0.07932662963867188, 1.335740566253662, 2.5921545028686523, 3.8485641479492188, 5.104977607727051, 6.361391544342041, 7.617805480957031, 8.874218940734863, 10.130632400512695, 11.387046813964844, 12.643460273742676, 13.899873733520508, 15.15628719329834, 16.412700653076172, 17.66911506652832, 18.92552947998047, 20.181941986083984, 21.438356399536133, 22.69477081298828, 23.951183319091797, 25.207597732543945, 26.46401023864746, 27.72042465209961, 28.976837158203125, 30.233251571655273, 31.489665985107422, 32.74607849121094, 34.00249481201172, 35.258907318115234, 36.515323638916016, 37.77173614501953, 39.02814865112305, 40.28456115722656, 41.540977478027344, 42.79738998413086, 44.053802490234375]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 7.0, 10.0, 11.0, 22.0, 27.0, 42.0, 66.0, 157.0, 239.0, 350.0, 581.0, 1022.0, 1576.0, 2628.0, 4164.0, 6582.0, 10410.0, 16688.0, 25036.0, 38956.0, 57826.0, 83629.0, 120497.0, 162631.0, 217779.0, 273754.0, 328901.0, 372383.0, 395266.0, 394390.0, 367521.0, 321819.0, 265596.0, 209748.0, 157444.0, 115487.0, 80660.0, 55445.0, 37280.0, 24457.0, 15790.0, 10008.0, 6687.0, 4097.0, 2533.0, 1599.0, 988.0, 587.0, 316.0, 245.0, 135.0, 87.0, 50.0, 27.0, 24.0, 13.0, 7.0, 10.0, 3.0, 3.0], "bins": [-31.34375, -30.392333984375, -29.44091796875, -28.489501953125, -27.5380859375, -26.586669921875, -25.63525390625, -24.683837890625, -23.732421875, -22.781005859375, -21.82958984375, -20.878173828125, -19.9267578125, -18.975341796875, -18.02392578125, -17.072509765625, -16.12109375, -15.169677734375, -14.21826171875, -13.266845703125, -12.3154296875, -11.364013671875, -10.41259765625, -9.461181640625, -8.509765625, -7.558349609375, -6.60693359375, -5.655517578125, -4.7041015625, -3.752685546875, -2.80126953125, -1.849853515625, -0.8984375, 0.052978515625, 1.00439453125, 1.955810546875, 2.9072265625, 3.858642578125, 4.81005859375, 5.761474609375, 6.712890625, 7.664306640625, 8.61572265625, 9.567138671875, 10.5185546875, 11.469970703125, 12.42138671875, 13.372802734375, 14.32421875, 15.275634765625, 16.22705078125, 17.178466796875, 18.1298828125, 19.081298828125, 20.03271484375, 20.984130859375, 21.935546875, 22.886962890625, 23.83837890625, 24.789794921875, 25.7412109375, 26.692626953125, 27.64404296875, 28.595458984375, 29.546875]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 9.0, 7.0, 2.0, 4.0, 9.0, 10.0, 14.0, 12.0, 10.0, 18.0, 21.0, 26.0, 22.0, 26.0, 36.0, 35.0, 41.0, 34.0, 33.0, 36.0, 32.0, 32.0, 45.0, 36.0, 42.0, 42.0, 28.0, 36.0, 29.0, 33.0, 32.0, 28.0, 18.0, 28.0, 27.0, 16.0, 22.0, 11.0, 13.0, 8.0, 7.0, 7.0, 7.0, 3.0, 5.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.4375, -31.30712890625, -30.1767578125, -29.04638671875, -27.916015625, -26.78564453125, -25.6552734375, -24.52490234375, -23.39453125, -22.26416015625, -21.1337890625, -20.00341796875, -18.873046875, -17.74267578125, -16.6123046875, -15.48193359375, -14.3515625, -13.22119140625, -12.0908203125, -10.96044921875, -9.830078125, -8.69970703125, -7.5693359375, -6.43896484375, -5.30859375, -4.17822265625, -3.0478515625, -1.91748046875, -0.787109375, 0.34326171875, 1.4736328125, 2.60400390625, 3.734375, 4.86474609375, 5.9951171875, 7.12548828125, 8.255859375, 9.38623046875, 10.5166015625, 11.64697265625, 12.77734375, 13.90771484375, 15.0380859375, 16.16845703125, 17.298828125, 18.42919921875, 19.5595703125, 20.68994140625, 21.8203125, 22.95068359375, 24.0810546875, 25.21142578125, 26.341796875, 27.47216796875, 28.6025390625, 29.73291015625, 30.86328125, 31.99365234375, 33.1240234375, 34.25439453125, 35.384765625, 36.51513671875, 37.6455078125, 38.77587890625, 39.90625]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [2.0, 5.0, 2.0, 1.0, 3.0, 6.0, 17.0, 34.0, 50.0, 81.0, 156.0, 281.0, 502.0, 778.0, 1237.0, 2073.0, 3541.0, 5637.0, 9108.0, 14192.0, 22413.0, 33883.0, 50600.0, 73149.0, 102942.0, 140927.0, 184717.0, 233642.0, 281146.0, 324385.0, 355442.0, 368440.0, 363159.0, 338570.0, 300234.0, 252557.0, 203795.0, 156376.0, 116858.0, 84079.0, 58136.0, 39661.0, 26034.0, 17058.0, 10960.0, 6764.0, 4311.0, 2578.0, 1505.0, 948.0, 550.0, 308.0, 203.0, 109.0, 67.0, 39.0, 30.0, 8.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0], "bins": [-30.6875, -29.71923828125, -28.7509765625, -27.78271484375, -26.814453125, -25.84619140625, -24.8779296875, -23.90966796875, -22.94140625, -21.97314453125, -21.0048828125, -20.03662109375, -19.068359375, -18.10009765625, -17.1318359375, -16.16357421875, -15.1953125, -14.22705078125, -13.2587890625, -12.29052734375, -11.322265625, -10.35400390625, -9.3857421875, -8.41748046875, -7.44921875, -6.48095703125, -5.5126953125, -4.54443359375, -3.576171875, -2.60791015625, -1.6396484375, -0.67138671875, 0.296875, 1.26513671875, 2.2333984375, 3.20166015625, 4.169921875, 5.13818359375, 6.1064453125, 7.07470703125, 8.04296875, 9.01123046875, 9.9794921875, 10.94775390625, 11.916015625, 12.88427734375, 13.8525390625, 14.82080078125, 15.7890625, 16.75732421875, 17.7255859375, 18.69384765625, 19.662109375, 20.63037109375, 21.5986328125, 22.56689453125, 23.53515625, 24.50341796875, 25.4716796875, 26.43994140625, 27.408203125, 28.37646484375, 29.3447265625, 30.31298828125, 31.28125]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 6.0, 10.0, 11.0, 14.0, 14.0, 19.0, 26.0, 25.0, 44.0, 44.0, 60.0, 69.0, 80.0, 79.0, 117.0, 132.0, 126.0, 149.0, 133.0, 158.0, 160.0, 164.0, 167.0, 197.0, 174.0, 201.0, 162.0, 181.0, 144.0, 158.0, 135.0, 140.0, 113.0, 111.0, 88.0, 91.0, 78.0, 54.0, 39.0, 51.0, 37.0, 33.0, 21.0, 13.0, 12.0, 11.0, 6.0, 7.0, 2.0, 0.0, 2.0, 4.0, 0.0, 4.0, 1.0], "bins": [-16.90625, -16.393310546875, -15.88037109375, -15.367431640625, -14.8544921875, -14.341552734375, -13.82861328125, -13.315673828125, -12.802734375, -12.289794921875, -11.77685546875, -11.263916015625, -10.7509765625, -10.238037109375, -9.72509765625, -9.212158203125, -8.69921875, -8.186279296875, -7.67333984375, -7.160400390625, -6.6474609375, -6.134521484375, -5.62158203125, -5.108642578125, -4.595703125, -4.082763671875, -3.56982421875, -3.056884765625, -2.5439453125, -2.031005859375, -1.51806640625, -1.005126953125, -0.4921875, 0.020751953125, 0.53369140625, 1.046630859375, 1.5595703125, 2.072509765625, 2.58544921875, 3.098388671875, 3.611328125, 4.124267578125, 4.63720703125, 5.150146484375, 5.6630859375, 6.176025390625, 6.68896484375, 7.201904296875, 7.71484375, 8.227783203125, 8.74072265625, 9.253662109375, 9.7666015625, 10.279541015625, 10.79248046875, 11.305419921875, 11.818359375, 12.331298828125, 12.84423828125, 13.357177734375, 13.8701171875, 14.383056640625, 14.89599609375, 15.408935546875, 15.921875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 5.0, 8.0, 13.0, 11.0, 16.0, 18.0, 18.0, 16.0, 25.0, 26.0, 28.0, 25.0, 26.0, 30.0, 34.0, 40.0, 37.0, 45.0, 32.0, 30.0, 45.0, 34.0, 35.0, 39.0, 46.0, 36.0, 31.0, 31.0, 29.0, 21.0, 23.0, 24.0, 24.0, 10.0, 15.0, 11.0, 11.0, 8.0, 12.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0], "bins": [-43.5806999206543, -42.294368743896484, -41.00803756713867, -39.72170639038086, -38.43537521362305, -37.149044036865234, -35.86271286010742, -34.576385498046875, -33.29005432128906, -32.00372314453125, -30.717391967773438, -29.431060791015625, -28.144729614257812, -26.8583984375, -25.57206916809082, -24.285737991333008, -22.999404907226562, -21.71307373046875, -20.426742553710938, -19.140411376953125, -17.854080200195312, -16.5677490234375, -15.28141975402832, -13.995088577270508, -12.708757400512695, -11.422426223754883, -10.13609504699707, -8.849764823913574, -7.563433647155762, -6.277102470397949, -4.990771770477295, -3.7044410705566406, -2.4181060791015625, -1.131775140762329, 0.1545557975769043, 1.4408867359161377, 2.727217674255371, 4.013548851013184, 5.299879550933838, 6.586210250854492, 7.872541427612305, 9.158872604370117, 10.44520378112793, 11.731534004211426, 13.017865180969238, 14.30419635772705, 15.590526580810547, 16.87685775756836, 18.163188934326172, 19.449520111083984, 20.735851287841797, 22.02218246459961, 23.308513641357422, 24.594844818115234, 25.881174087524414, 27.167505264282227, 28.45383644104004, 29.74016761779785, 31.026498794555664, 32.312828063964844, 33.599159240722656, 34.88549041748047, 36.17182159423828, 37.458152770996094, 38.744483947753906]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 8.0, 9.0, 7.0, 9.0, 10.0, 13.0, 12.0, 13.0, 22.0, 23.0, 22.0, 30.0, 32.0, 26.0, 35.0, 30.0, 35.0, 42.0, 43.0, 42.0, 37.0, 37.0, 43.0, 34.0, 43.0, 33.0, 24.0, 30.0, 33.0, 16.0, 28.0, 26.0, 23.0, 17.0, 15.0, 17.0, 11.0, 11.0, 16.0, 8.0, 3.0, 7.0, 4.0, 6.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-35.58380126953125, -34.40702819824219, -33.230255126953125, -32.05348205566406, -30.876707077026367, -29.699934005737305, -28.52315902709961, -27.346385955810547, -26.169612884521484, -24.992839813232422, -23.81606674194336, -22.639291763305664, -21.4625186920166, -20.28574562072754, -19.108970642089844, -17.93219757080078, -16.75542449951172, -15.578651428222656, -14.401877403259277, -13.225103378295898, -12.048330307006836, -10.871557235717773, -9.694783210754395, -8.518009185791016, -7.341236114501953, -6.164462566375732, -4.987689018249512, -3.810915470123291, -2.6341419219970703, -1.4573683738708496, -0.2805948257446289, 0.89617919921875, 2.072948455810547, 3.2497220039367676, 4.426495552062988, 5.603269100189209, 6.78004264831543, 7.95681619644165, 9.133589744567871, 10.31036376953125, 11.487136840820312, 12.663909912109375, 13.840683937072754, 15.017457962036133, 16.194231033325195, 17.371004104614258, 18.547779083251953, 19.724552154541016, 20.901325225830078, 22.07809829711914, 23.254871368408203, 24.4316463470459, 25.60841941833496, 26.785192489624023, 27.96196746826172, 29.13874053955078, 30.315513610839844, 31.492286682128906, 32.66905975341797, 33.84583282470703, 35.022605895996094, 36.19938278198242, 37.376155853271484, 38.55292892456055, 39.72970199584961]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 5.0, 6.0, 11.0, 18.0, 22.0, 40.0, 66.0, 96.0, 161.0, 232.0, 376.0, 578.0, 954.0, 1409.0, 2377.0, 3657.0, 5717.0, 9006.0, 14239.0, 21641.0, 32975.0, 47549.0, 67105.0, 89346.0, 107849.0, 120805.0, 120099.0, 108267.0, 88553.0, 66062.0, 47268.0, 32378.0, 21374.0, 14016.0, 8921.0, 5545.0, 3566.0, 2324.0, 1445.0, 922.0, 576.0, 364.0, 233.0, 137.0, 90.0, 67.0, 46.0, 24.0, 11.0, 13.0, 6.0, 5.0, 3.0, 3.0, 2.0, 5.0], "bins": [-17.40625, -16.89404296875, -16.3818359375, -15.86962890625, -15.357421875, -14.84521484375, -14.3330078125, -13.82080078125, -13.30859375, -12.79638671875, -12.2841796875, -11.77197265625, -11.259765625, -10.74755859375, -10.2353515625, -9.72314453125, -9.2109375, -8.69873046875, -8.1865234375, -7.67431640625, -7.162109375, -6.64990234375, -6.1376953125, -5.62548828125, -5.11328125, -4.60107421875, -4.0888671875, -3.57666015625, -3.064453125, -2.55224609375, -2.0400390625, -1.52783203125, -1.015625, -0.50341796875, 0.0087890625, 0.52099609375, 1.033203125, 1.54541015625, 2.0576171875, 2.56982421875, 3.08203125, 3.59423828125, 4.1064453125, 4.61865234375, 5.130859375, 5.64306640625, 6.1552734375, 6.66748046875, 7.1796875, 7.69189453125, 8.2041015625, 8.71630859375, 9.228515625, 9.74072265625, 10.2529296875, 10.76513671875, 11.27734375, 11.78955078125, 12.3017578125, 12.81396484375, 13.326171875, 13.83837890625, 14.3505859375, 14.86279296875, 15.375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 7.0, 9.0, 6.0, 11.0, 8.0, 15.0, 10.0, 16.0, 21.0, 27.0, 20.0, 30.0, 33.0, 22.0, 38.0, 33.0, 37.0, 36.0, 45.0, 43.0, 37.0, 38.0, 40.0, 38.0, 37.0, 34.0, 26.0, 32.0, 31.0, 12.0, 36.0, 19.0, 22.0, 17.0, 16.0, 15.0, 13.0, 11.0, 16.0, 5.0, 4.0, 6.0, 3.0, 10.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.3125, -34.1396484375, -32.966796875, -31.7939453125, -30.62109375, -29.4482421875, -28.275390625, -27.1025390625, -25.9296875, -24.7568359375, -23.583984375, -22.4111328125, -21.23828125, -20.0654296875, -18.892578125, -17.7197265625, -16.546875, -15.3740234375, -14.201171875, -13.0283203125, -11.85546875, -10.6826171875, -9.509765625, -8.3369140625, -7.1640625, -5.9912109375, -4.818359375, -3.6455078125, -2.47265625, -1.2998046875, -0.126953125, 1.0458984375, 2.21875, 3.3916015625, 4.564453125, 5.7373046875, 6.91015625, 8.0830078125, 9.255859375, 10.4287109375, 11.6015625, 12.7744140625, 13.947265625, 15.1201171875, 16.29296875, 17.4658203125, 18.638671875, 19.8115234375, 20.984375, 22.1572265625, 23.330078125, 24.5029296875, 25.67578125, 26.8486328125, 28.021484375, 29.1943359375, 30.3671875, 31.5400390625, 32.712890625, 33.8857421875, 35.05859375, 36.2314453125, 37.404296875, 38.5771484375, 39.75]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 9.0, 9.0, 8.0, 27.0, 41.0, 69.0, 111.0, 190.0, 277.0, 384.0, 679.0, 1103.0, 1749.0, 2841.0, 4948.0, 8546.0, 15268.0, 27135.0, 49170.0, 86989.0, 143922.0, 194657.0, 189902.0, 135560.0, 81243.0, 45054.0, 24880.0, 14051.0, 7883.0, 4566.0, 2807.0, 1705.0, 1047.0, 659.0, 360.0, 256.0, 173.0, 78.0, 60.0, 43.0, 42.0, 25.0, 12.0, 3.0, 7.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-21.9375, -21.25048828125, -20.5634765625, -19.87646484375, -19.189453125, -18.50244140625, -17.8154296875, -17.12841796875, -16.44140625, -15.75439453125, -15.0673828125, -14.38037109375, -13.693359375, -13.00634765625, -12.3193359375, -11.63232421875, -10.9453125, -10.25830078125, -9.5712890625, -8.88427734375, -8.197265625, -7.51025390625, -6.8232421875, -6.13623046875, -5.44921875, -4.76220703125, -4.0751953125, -3.38818359375, -2.701171875, -2.01416015625, -1.3271484375, -0.64013671875, 0.046875, 0.73388671875, 1.4208984375, 2.10791015625, 2.794921875, 3.48193359375, 4.1689453125, 4.85595703125, 5.54296875, 6.22998046875, 6.9169921875, 7.60400390625, 8.291015625, 8.97802734375, 9.6650390625, 10.35205078125, 11.0390625, 11.72607421875, 12.4130859375, 13.10009765625, 13.787109375, 14.47412109375, 15.1611328125, 15.84814453125, 16.53515625, 17.22216796875, 17.9091796875, 18.59619140625, 19.283203125, 19.97021484375, 20.6572265625, 21.34423828125, 22.03125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 5.0, 12.0, 8.0, 15.0, 9.0, 12.0, 13.0, 15.0, 18.0, 19.0, 22.0, 20.0, 21.0, 36.0, 34.0, 41.0, 26.0, 33.0, 38.0, 45.0, 47.0, 47.0, 41.0, 35.0, 49.0, 36.0, 43.0, 17.0, 31.0, 22.0, 22.0, 22.0, 27.0, 18.0, 18.0, 14.0, 13.0, 12.0, 14.0, 11.0, 5.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.140625, -24.372314453125, -23.60400390625, -22.835693359375, -22.0673828125, -21.299072265625, -20.53076171875, -19.762451171875, -18.994140625, -18.225830078125, -17.45751953125, -16.689208984375, -15.9208984375, -15.152587890625, -14.38427734375, -13.615966796875, -12.84765625, -12.079345703125, -11.31103515625, -10.542724609375, -9.7744140625, -9.006103515625, -8.23779296875, -7.469482421875, -6.701171875, -5.932861328125, -5.16455078125, -4.396240234375, -3.6279296875, -2.859619140625, -2.09130859375, -1.322998046875, -0.5546875, 0.213623046875, 0.98193359375, 1.750244140625, 2.5185546875, 3.286865234375, 4.05517578125, 4.823486328125, 5.591796875, 6.360107421875, 7.12841796875, 7.896728515625, 8.6650390625, 9.433349609375, 10.20166015625, 10.969970703125, 11.73828125, 12.506591796875, 13.27490234375, 14.043212890625, 14.8115234375, 15.579833984375, 16.34814453125, 17.116455078125, 17.884765625, 18.653076171875, 19.42138671875, 20.189697265625, 20.9580078125, 21.726318359375, 22.49462890625, 23.262939453125, 24.03125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 7.0, 6.0, 12.0, 10.0, 19.0, 20.0, 29.0, 45.0, 68.0, 90.0, 115.0, 162.0, 216.0, 329.0, 519.0, 709.0, 1109.0, 1615.0, 2578.0, 3937.0, 6415.0, 10482.0, 18104.0, 32893.0, 61982.0, 123300.0, 227438.0, 247301.0, 145886.0, 73232.0, 37566.0, 20723.0, 11875.0, 7069.0, 4416.0, 2766.0, 1823.0, 1168.0, 756.0, 506.0, 350.0, 281.0, 208.0, 134.0, 85.0, 54.0, 44.0, 30.0, 31.0, 17.0, 9.0, 7.0, 8.0, 5.0, 6.0, 3.0, 2.0, 1.0], "bins": [-13.265625, -12.8651123046875, -12.464599609375, -12.0640869140625, -11.66357421875, -11.2630615234375, -10.862548828125, -10.4620361328125, -10.0615234375, -9.6610107421875, -9.260498046875, -8.8599853515625, -8.45947265625, -8.0589599609375, -7.658447265625, -7.2579345703125, -6.857421875, -6.4569091796875, -6.056396484375, -5.6558837890625, -5.25537109375, -4.8548583984375, -4.454345703125, -4.0538330078125, -3.6533203125, -3.2528076171875, -2.852294921875, -2.4517822265625, -2.05126953125, -1.6507568359375, -1.250244140625, -0.8497314453125, -0.44921875, -0.0487060546875, 0.351806640625, 0.7523193359375, 1.15283203125, 1.5533447265625, 1.953857421875, 2.3543701171875, 2.7548828125, 3.1553955078125, 3.555908203125, 3.9564208984375, 4.35693359375, 4.7574462890625, 5.157958984375, 5.5584716796875, 5.958984375, 6.3594970703125, 6.760009765625, 7.1605224609375, 7.56103515625, 7.9615478515625, 8.362060546875, 8.7625732421875, 9.1630859375, 9.5635986328125, 9.964111328125, 10.3646240234375, 10.76513671875, 11.1656494140625, 11.566162109375, 11.9666748046875, 12.3671875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 10.0, 3.0, 12.0, 11.0, 11.0, 20.0, 22.0, 11.0, 35.0, 18.0, 23.0, 28.0, 35.0, 54.0, 49.0, 51.0, 65.0, 43.0, 55.0, 39.0, 38.0, 38.0, 46.0, 35.0, 35.0, 32.0, 36.0, 37.0, 15.0, 20.0, 13.0, 12.0, 15.0, 8.0, 8.0, 9.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0007367134094238281, -0.0007161125540733337, -0.0006955116987228394, -0.000674910843372345, -0.0006543099880218506, -0.0006337091326713562, -0.0006131082773208618, -0.0005925074219703674, -0.000571906566619873, -0.0005513057112693787, -0.0005307048559188843, -0.0005101040005683899, -0.0004895031452178955, -0.0004689022898674011, -0.00044830143451690674, -0.00042770057916641235, -0.00040709972381591797, -0.0003864988684654236, -0.0003658980131149292, -0.0003452971577644348, -0.00032469630241394043, -0.00030409544706344604, -0.00028349459171295166, -0.0002628937363624573, -0.0002422928810119629, -0.0002216920256614685, -0.00020109117031097412, -0.00018049031496047974, -0.00015988945960998535, -0.00013928860425949097, -0.00011868774890899658, -9.80868935585022e-05, -7.748603820800781e-05, -5.688518285751343e-05, -3.628432750701904e-05, -1.5683472156524658e-05, 4.9173831939697266e-06, 2.551823854446411e-05, 4.6119093894958496e-05, 6.671994924545288e-05, 8.732080459594727e-05, 0.00010792165994644165, 0.00012852251529693604, 0.00014912337064743042, 0.0001697242259979248, 0.0001903250813484192, 0.00021092593669891357, 0.00023152679204940796, 0.00025212764739990234, 0.00027272850275039673, 0.0002933293581008911, 0.0003139302134513855, 0.0003345310688018799, 0.00035513192415237427, 0.00037573277950286865, 0.00039633363485336304, 0.0004169344902038574, 0.0004375353455543518, 0.0004581362009048462, 0.0004787370562553406, 0.000499337911605835, 0.0005199387669563293, 0.0005405396223068237, 0.0005611404776573181, 0.0005817413330078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 6.0, 5.0, 6.0, 12.0, 26.0, 31.0, 44.0, 75.0, 120.0, 179.0, 292.0, 433.0, 587.0, 898.0, 1440.0, 2266.0, 3426.0, 5415.0, 8228.0, 12547.0, 19476.0, 29733.0, 43659.0, 63442.0, 88069.0, 112150.0, 128827.0, 129430.0, 113643.0, 89054.0, 63971.0, 44617.0, 29904.0, 19814.0, 12864.0, 8287.0, 5511.0, 3503.0, 2239.0, 1508.0, 948.0, 618.0, 445.0, 267.0, 197.0, 126.0, 85.0, 52.0, 28.0, 25.0, 15.0, 13.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-12.5546875, -12.136474609375, -11.71826171875, -11.300048828125, -10.8818359375, -10.463623046875, -10.04541015625, -9.627197265625, -9.208984375, -8.790771484375, -8.37255859375, -7.954345703125, -7.5361328125, -7.117919921875, -6.69970703125, -6.281494140625, -5.86328125, -5.445068359375, -5.02685546875, -4.608642578125, -4.1904296875, -3.772216796875, -3.35400390625, -2.935791015625, -2.517578125, -2.099365234375, -1.68115234375, -1.262939453125, -0.8447265625, -0.426513671875, -0.00830078125, 0.409912109375, 0.828125, 1.246337890625, 1.66455078125, 2.082763671875, 2.5009765625, 2.919189453125, 3.33740234375, 3.755615234375, 4.173828125, 4.592041015625, 5.01025390625, 5.428466796875, 5.8466796875, 6.264892578125, 6.68310546875, 7.101318359375, 7.51953125, 7.937744140625, 8.35595703125, 8.774169921875, 9.1923828125, 9.610595703125, 10.02880859375, 10.447021484375, 10.865234375, 11.283447265625, 11.70166015625, 12.119873046875, 12.5380859375, 12.956298828125, 13.37451171875, 13.792724609375, 14.2109375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 10.0, 6.0, 9.0, 9.0, 11.0, 10.0, 17.0, 16.0, 28.0, 38.0, 31.0, 38.0, 43.0, 57.0, 49.0, 49.0, 61.0, 57.0, 63.0, 67.0, 43.0, 47.0, 42.0, 31.0, 25.0, 25.0, 25.0, 19.0, 17.0, 14.0, 11.0, 5.0, 4.0, 5.0, 9.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-6.16015625, -5.960205078125, -5.76025390625, -5.560302734375, -5.3603515625, -5.160400390625, -4.96044921875, -4.760498046875, -4.560546875, -4.360595703125, -4.16064453125, -3.960693359375, -3.7607421875, -3.560791015625, -3.36083984375, -3.160888671875, -2.9609375, -2.760986328125, -2.56103515625, -2.361083984375, -2.1611328125, -1.961181640625, -1.76123046875, -1.561279296875, -1.361328125, -1.161376953125, -0.96142578125, -0.761474609375, -0.5615234375, -0.361572265625, -0.16162109375, 0.038330078125, 0.23828125, 0.438232421875, 0.63818359375, 0.838134765625, 1.0380859375, 1.238037109375, 1.43798828125, 1.637939453125, 1.837890625, 2.037841796875, 2.23779296875, 2.437744140625, 2.6376953125, 2.837646484375, 3.03759765625, 3.237548828125, 3.4375, 3.637451171875, 3.83740234375, 4.037353515625, 4.2373046875, 4.437255859375, 4.63720703125, 4.837158203125, 5.037109375, 5.237060546875, 5.43701171875, 5.636962890625, 5.8369140625, 6.036865234375, 6.23681640625, 6.436767578125, 6.63671875]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 1.0, 7.0, 7.0, 11.0, 17.0, 16.0, 20.0, 19.0, 19.0, 25.0, 19.0, 26.0, 34.0, 23.0, 24.0, 31.0, 43.0, 33.0, 40.0, 35.0, 36.0, 32.0, 37.0, 33.0, 37.0, 46.0, 34.0, 37.0, 27.0, 25.0, 27.0, 28.0, 29.0, 16.0, 15.0, 15.0, 10.0, 14.0, 7.0, 9.0, 6.0, 6.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0], "bins": [-42.819190979003906, -41.55305099487305, -40.28690719604492, -39.02076721191406, -37.75462341308594, -36.48848342895508, -35.22234344482422, -33.956199645996094, -32.690059661865234, -31.423917770385742, -30.15777587890625, -28.89163589477539, -27.6254940032959, -26.359352111816406, -25.093212127685547, -23.827070236206055, -22.560928344726562, -21.29478645324707, -20.028644561767578, -18.76250457763672, -17.496362686157227, -16.230220794677734, -14.964079856872559, -13.697938919067383, -12.43179702758789, -11.165655136108398, -9.899514198303223, -8.633373260498047, -7.367231369018555, -6.101089954376221, -4.834948539733887, -3.568807601928711, -2.302661895751953, -1.0365204811096191, 0.22962093353271484, 1.4957623481750488, 2.761903762817383, 4.028045177459717, 5.294186592102051, 6.560327529907227, 7.826469421386719, 9.092611312866211, 10.358752250671387, 11.624893188476562, 12.891035079956055, 14.157176971435547, 15.423317909240723, 16.6894588470459, 17.95560073852539, 19.221742630004883, 20.487884521484375, 21.754024505615234, 23.020166397094727, 24.28630828857422, 25.552448272705078, 26.81859016418457, 28.084732055664062, 29.350873947143555, 30.617015838623047, 31.883155822753906, 33.14929962158203, 34.41543960571289, 35.68157958984375, 36.947723388671875, 38.213863372802734]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 7.0, 8.0, 11.0, 9.0, 10.0, 15.0, 13.0, 20.0, 27.0, 31.0, 27.0, 30.0, 30.0, 27.0, 31.0, 37.0, 33.0, 50.0, 42.0, 32.0, 45.0, 37.0, 43.0, 38.0, 31.0, 36.0, 31.0, 27.0, 20.0, 21.0, 27.0, 15.0, 20.0, 17.0, 17.0, 12.0, 8.0, 14.0, 5.0, 7.0, 8.0, 3.0, 5.0, 5.0, 6.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-35.8571662902832, -34.66831970214844, -33.479469299316406, -32.29062271118164, -31.101776123046875, -29.91292953491211, -28.72408103942871, -27.535232543945312, -26.346385955810547, -25.15753936767578, -23.968690872192383, -22.779842376708984, -21.59099578857422, -20.402149200439453, -19.213300704956055, -18.024452209472656, -16.83560562133789, -15.646758079528809, -14.457910537719727, -13.269062995910645, -12.080215454101562, -10.89136791229248, -9.702520370483398, -8.513672828674316, -7.324825286865234, -6.135977745056152, -4.94713020324707, -3.7582826614379883, -2.5694351196289062, -1.3805875778198242, -0.1917400360107422, 0.9971075057983398, 2.1859588623046875, 3.3748064041137695, 4.563653945922852, 5.752501487731934, 6.941349029541016, 8.130196571350098, 9.31904411315918, 10.507891654968262, 11.696739196777344, 12.885586738586426, 14.074434280395508, 15.26328182220459, 16.452129364013672, 17.640975952148438, 18.829824447631836, 20.018672943115234, 21.20751953125, 22.396366119384766, 23.585214614868164, 24.774063110351562, 25.962909698486328, 27.151756286621094, 28.340604782104492, 29.52945327758789, 30.718299865722656, 31.907146453857422, 33.09599304199219, 34.28484344482422, 35.473690032958984, 36.66253662109375, 37.85138702392578, 39.04023361206055, 40.22908020019531]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 5.0, 7.0, 8.0, 20.0, 38.0, 51.0, 86.0, 129.0, 216.0, 360.0, 520.0, 897.0, 1339.0, 2084.0, 3074.0, 4524.0, 6537.0, 9653.0, 13294.0, 18607.0, 24910.0, 32327.0, 41703.0, 50605.0, 59866.0, 68899.0, 76089.0, 80557.0, 81552.0, 78746.0, 74139.0, 66332.0, 57414.0, 47937.0, 38517.0, 29869.0, 22534.0, 16751.0, 12151.0, 8556.0, 5919.0, 4105.0, 2717.0, 1766.0, 1135.0, 763.0, 445.0, 305.0, 208.0, 114.0, 78.0, 49.0, 23.0, 14.0, 6.0, 6.0, 6.0, 3.0, 0.0, 4.0], "bins": [-28.671875, -27.785400390625, -26.89892578125, -26.012451171875, -25.1259765625, -24.239501953125, -23.35302734375, -22.466552734375, -21.580078125, -20.693603515625, -19.80712890625, -18.920654296875, -18.0341796875, -17.147705078125, -16.26123046875, -15.374755859375, -14.48828125, -13.601806640625, -12.71533203125, -11.828857421875, -10.9423828125, -10.055908203125, -9.16943359375, -8.282958984375, -7.396484375, -6.510009765625, -5.62353515625, -4.737060546875, -3.8505859375, -2.964111328125, -2.07763671875, -1.191162109375, -0.3046875, 0.581787109375, 1.46826171875, 2.354736328125, 3.2412109375, 4.127685546875, 5.01416015625, 5.900634765625, 6.787109375, 7.673583984375, 8.56005859375, 9.446533203125, 10.3330078125, 11.219482421875, 12.10595703125, 12.992431640625, 13.87890625, 14.765380859375, 15.65185546875, 16.538330078125, 17.4248046875, 18.311279296875, 19.19775390625, 20.084228515625, 20.970703125, 21.857177734375, 22.74365234375, 23.630126953125, 24.5166015625, 25.403076171875, 26.28955078125, 27.176025390625, 28.0625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 6.0, 6.0, 10.0, 10.0, 8.0, 11.0, 15.0, 15.0, 23.0, 25.0, 25.0, 31.0, 29.0, 29.0, 26.0, 37.0, 34.0, 34.0, 51.0, 37.0, 40.0, 40.0, 38.0, 43.0, 39.0, 40.0, 22.0, 35.0, 29.0, 17.0, 23.0, 21.0, 22.0, 15.0, 19.0, 17.0, 13.0, 7.0, 11.0, 7.0, 6.0, 8.0, 5.0, 4.0, 6.0, 5.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-34.5, -33.353515625, -32.20703125, -31.060546875, -29.9140625, -28.767578125, -27.62109375, -26.474609375, -25.328125, -24.181640625, -23.03515625, -21.888671875, -20.7421875, -19.595703125, -18.44921875, -17.302734375, -16.15625, -15.009765625, -13.86328125, -12.716796875, -11.5703125, -10.423828125, -9.27734375, -8.130859375, -6.984375, -5.837890625, -4.69140625, -3.544921875, -2.3984375, -1.251953125, -0.10546875, 1.041015625, 2.1875, 3.333984375, 4.48046875, 5.626953125, 6.7734375, 7.919921875, 9.06640625, 10.212890625, 11.359375, 12.505859375, 13.65234375, 14.798828125, 15.9453125, 17.091796875, 18.23828125, 19.384765625, 20.53125, 21.677734375, 22.82421875, 23.970703125, 25.1171875, 26.263671875, 27.41015625, 28.556640625, 29.703125, 30.849609375, 31.99609375, 33.142578125, 34.2890625, 35.435546875, 36.58203125, 37.728515625, 38.875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 9.0, 13.0, 16.0, 22.0, 34.0, 67.0, 86.0, 124.0, 210.0, 332.0, 514.0, 831.0, 1350.0, 2109.0, 3015.0, 4781.0, 7003.0, 10201.0, 14693.0, 20309.0, 27629.0, 36965.0, 46917.0, 57123.0, 68414.0, 76704.0, 83080.0, 85942.0, 85640.0, 80150.0, 72081.0, 62121.0, 51365.0, 40974.0, 31204.0, 23230.0, 16783.0, 11926.0, 8345.0, 5679.0, 3772.0, 2475.0, 1552.0, 1019.0, 647.0, 411.0, 253.0, 153.0, 109.0, 57.0, 45.0, 30.0, 25.0, 7.0, 11.0, 5.0, 5.0, 0.0, 2.0], "bins": [-29.734375, -28.825439453125, -27.91650390625, -27.007568359375, -26.0986328125, -25.189697265625, -24.28076171875, -23.371826171875, -22.462890625, -21.553955078125, -20.64501953125, -19.736083984375, -18.8271484375, -17.918212890625, -17.00927734375, -16.100341796875, -15.19140625, -14.282470703125, -13.37353515625, -12.464599609375, -11.5556640625, -10.646728515625, -9.73779296875, -8.828857421875, -7.919921875, -7.010986328125, -6.10205078125, -5.193115234375, -4.2841796875, -3.375244140625, -2.46630859375, -1.557373046875, -0.6484375, 0.260498046875, 1.16943359375, 2.078369140625, 2.9873046875, 3.896240234375, 4.80517578125, 5.714111328125, 6.623046875, 7.531982421875, 8.44091796875, 9.349853515625, 10.2587890625, 11.167724609375, 12.07666015625, 12.985595703125, 13.89453125, 14.803466796875, 15.71240234375, 16.621337890625, 17.5302734375, 18.439208984375, 19.34814453125, 20.257080078125, 21.166015625, 22.074951171875, 22.98388671875, 23.892822265625, 24.8017578125, 25.710693359375, 26.61962890625, 27.528564453125, 28.4375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 6.0, 2.0, 8.0, 7.0, 9.0, 10.0, 12.0, 11.0, 25.0, 26.0, 29.0, 27.0, 31.0, 28.0, 20.0, 35.0, 42.0, 40.0, 28.0, 39.0, 51.0, 38.0, 41.0, 34.0, 50.0, 42.0, 35.0, 30.0, 32.0, 28.0, 28.0, 25.0, 26.0, 24.0, 14.0, 7.0, 9.0, 8.0, 11.0, 10.0, 8.0, 9.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.09375, -25.288330078125, -24.48291015625, -23.677490234375, -22.8720703125, -22.066650390625, -21.26123046875, -20.455810546875, -19.650390625, -18.844970703125, -18.03955078125, -17.234130859375, -16.4287109375, -15.623291015625, -14.81787109375, -14.012451171875, -13.20703125, -12.401611328125, -11.59619140625, -10.790771484375, -9.9853515625, -9.179931640625, -8.37451171875, -7.569091796875, -6.763671875, -5.958251953125, -5.15283203125, -4.347412109375, -3.5419921875, -2.736572265625, -1.93115234375, -1.125732421875, -0.3203125, 0.485107421875, 1.29052734375, 2.095947265625, 2.9013671875, 3.706787109375, 4.51220703125, 5.317626953125, 6.123046875, 6.928466796875, 7.73388671875, 8.539306640625, 9.3447265625, 10.150146484375, 10.95556640625, 11.760986328125, 12.56640625, 13.371826171875, 14.17724609375, 14.982666015625, 15.7880859375, 16.593505859375, 17.39892578125, 18.204345703125, 19.009765625, 19.815185546875, 20.62060546875, 21.426025390625, 22.2314453125, 23.036865234375, 23.84228515625, 24.647705078125, 25.453125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 6.0, 9.0, 17.0, 29.0, 37.0, 61.0, 81.0, 154.0, 252.0, 452.0, 830.0, 1652.0, 3098.0, 5878.0, 10717.0, 19460.0, 33794.0, 54141.0, 81708.0, 110914.0, 132626.0, 141591.0, 133189.0, 109276.0, 79954.0, 53749.0, 32912.0, 19158.0, 10496.0, 5706.0, 3044.0, 1584.0, 896.0, 452.0, 271.0, 131.0, 79.0, 54.0, 34.0, 27.0, 11.0, 8.0, 8.0, 7.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.5625, -16.986328125, -16.41015625, -15.833984375, -15.2578125, -14.681640625, -14.10546875, -13.529296875, -12.953125, -12.376953125, -11.80078125, -11.224609375, -10.6484375, -10.072265625, -9.49609375, -8.919921875, -8.34375, -7.767578125, -7.19140625, -6.615234375, -6.0390625, -5.462890625, -4.88671875, -4.310546875, -3.734375, -3.158203125, -2.58203125, -2.005859375, -1.4296875, -0.853515625, -0.27734375, 0.298828125, 0.875, 1.451171875, 2.02734375, 2.603515625, 3.1796875, 3.755859375, 4.33203125, 4.908203125, 5.484375, 6.060546875, 6.63671875, 7.212890625, 7.7890625, 8.365234375, 8.94140625, 9.517578125, 10.09375, 10.669921875, 11.24609375, 11.822265625, 12.3984375, 12.974609375, 13.55078125, 14.126953125, 14.703125, 15.279296875, 15.85546875, 16.431640625, 17.0078125, 17.583984375, 18.16015625, 18.736328125, 19.3125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 5.0, 16.0, 9.0, 14.0, 15.0, 17.0, 18.0, 27.0, 34.0, 20.0, 27.0, 35.0, 35.0, 45.0, 54.0, 46.0, 48.0, 54.0, 59.0, 37.0, 46.0, 43.0, 37.0, 49.0, 32.0, 34.0, 21.0, 17.0, 26.0, 11.0, 14.0, 11.0, 10.0, 8.0, 7.0, 8.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002010345458984375, -0.001952141523361206, -0.0018939375877380371, -0.0018357336521148682, -0.0017775297164916992, -0.0017193257808685303, -0.0016611218452453613, -0.0016029179096221924, -0.0015447139739990234, -0.0014865100383758545, -0.0014283061027526855, -0.0013701021671295166, -0.0013118982315063477, -0.0012536942958831787, -0.0011954903602600098, -0.0011372864246368408, -0.0010790824890136719, -0.001020878553390503, -0.000962674617767334, -0.000904470682144165, -0.0008462667465209961, -0.0007880628108978271, -0.0007298588752746582, -0.0006716549396514893, -0.0006134510040283203, -0.0005552470684051514, -0.0004970431327819824, -0.0004388391971588135, -0.00038063526153564453, -0.0003224313259124756, -0.00026422739028930664, -0.0002060234546661377, -0.00014781951904296875, -8.96155834197998e-05, -3.141164779663086e-05, 2.6792287826538086e-05, 8.499622344970703e-05, 0.00014320015907287598, 0.00020140409469604492, 0.00025960803031921387, 0.0003178119659423828, 0.00037601590156555176, 0.0004342198371887207, 0.0004924237728118896, 0.0005506277084350586, 0.0006088316440582275, 0.0006670355796813965, 0.0007252395153045654, 0.0007834434509277344, 0.0008416473865509033, 0.0008998513221740723, 0.0009580552577972412, 0.0010162591934204102, 0.001074463129043579, 0.001132667064666748, 0.001190871000289917, 0.001249074935913086, 0.0013072788715362549, 0.0013654828071594238, 0.0014236867427825928, 0.0014818906784057617, 0.0015400946140289307, 0.0015982985496520996, 0.0016565024852752686, 0.0017147064208984375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 5.0, 13.0, 11.0, 29.0, 36.0, 59.0, 84.0, 154.0, 218.0, 367.0, 590.0, 968.0, 1637.0, 2725.0, 4418.0, 7372.0, 12244.0, 19228.0, 30370.0, 45603.0, 64734.0, 85174.0, 104771.0, 117197.0, 119316.0, 111232.0, 94123.0, 73719.0, 53564.0, 36251.0, 24110.0, 14999.0, 9336.0, 5460.0, 3321.0, 2004.0, 1158.0, 736.0, 449.0, 278.0, 187.0, 117.0, 76.0, 40.0, 25.0, 13.0, 16.0, 10.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-18.390625, -17.81982421875, -17.2490234375, -16.67822265625, -16.107421875, -15.53662109375, -14.9658203125, -14.39501953125, -13.82421875, -13.25341796875, -12.6826171875, -12.11181640625, -11.541015625, -10.97021484375, -10.3994140625, -9.82861328125, -9.2578125, -8.68701171875, -8.1162109375, -7.54541015625, -6.974609375, -6.40380859375, -5.8330078125, -5.26220703125, -4.69140625, -4.12060546875, -3.5498046875, -2.97900390625, -2.408203125, -1.83740234375, -1.2666015625, -0.69580078125, -0.125, 0.44580078125, 1.0166015625, 1.58740234375, 2.158203125, 2.72900390625, 3.2998046875, 3.87060546875, 4.44140625, 5.01220703125, 5.5830078125, 6.15380859375, 6.724609375, 7.29541015625, 7.8662109375, 8.43701171875, 9.0078125, 9.57861328125, 10.1494140625, 10.72021484375, 11.291015625, 11.86181640625, 12.4326171875, 13.00341796875, 13.57421875, 14.14501953125, 14.7158203125, 15.28662109375, 15.857421875, 16.42822265625, 16.9990234375, 17.56982421875, 18.140625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 6.0, 10.0, 14.0, 18.0, 19.0, 13.0, 30.0, 41.0, 24.0, 39.0, 37.0, 43.0, 49.0, 47.0, 54.0, 50.0, 63.0, 64.0, 58.0, 37.0, 46.0, 41.0, 32.0, 37.0, 28.0, 27.0, 18.0, 13.0, 7.0, 5.0, 8.0, 8.0, 7.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.92578125, -7.63787841796875, -7.3499755859375, -7.06207275390625, -6.774169921875, -6.48626708984375, -6.1983642578125, -5.91046142578125, -5.62255859375, -5.33465576171875, -5.0467529296875, -4.75885009765625, -4.470947265625, -4.18304443359375, -3.8951416015625, -3.60723876953125, -3.3193359375, -3.03143310546875, -2.7435302734375, -2.45562744140625, -2.167724609375, -1.87982177734375, -1.5919189453125, -1.30401611328125, -1.01611328125, -0.72821044921875, -0.4403076171875, -0.15240478515625, 0.135498046875, 0.42340087890625, 0.7113037109375, 0.99920654296875, 1.287109375, 1.57501220703125, 1.8629150390625, 2.15081787109375, 2.438720703125, 2.72662353515625, 3.0145263671875, 3.30242919921875, 3.59033203125, 3.87823486328125, 4.1661376953125, 4.45404052734375, 4.741943359375, 5.02984619140625, 5.3177490234375, 5.60565185546875, 5.8935546875, 6.18145751953125, 6.4693603515625, 6.75726318359375, 7.045166015625, 7.33306884765625, 7.6209716796875, 7.90887451171875, 8.19677734375, 8.48468017578125, 8.7725830078125, 9.06048583984375, 9.348388671875, 9.63629150390625, 9.9241943359375, 10.21209716796875, 10.5]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 6.0, 7.0, 6.0, 7.0, 11.0, 18.0, 22.0, 14.0, 18.0, 13.0, 24.0, 28.0, 22.0, 22.0, 33.0, 34.0, 30.0, 30.0, 26.0, 47.0, 33.0, 30.0, 31.0, 35.0, 37.0, 39.0, 38.0, 28.0, 28.0, 36.0, 39.0, 25.0, 20.0, 27.0, 22.0, 13.0, 15.0, 19.0, 14.0, 13.0, 3.0, 6.0, 5.0, 11.0, 2.0, 6.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-38.93421936035156, -37.695472717285156, -36.456729888916016, -35.21798324584961, -33.97924041748047, -32.74049377441406, -31.501747131347656, -30.263002395629883, -29.02425765991211, -27.785512924194336, -26.546768188476562, -25.308021545410156, -24.069276809692383, -22.83053207397461, -21.591785430908203, -20.35304069519043, -19.114295959472656, -17.875551223754883, -16.63680648803711, -15.398059844970703, -14.15931510925293, -12.920570373535156, -11.681824684143066, -10.443078994750977, -9.204334259033203, -7.9655890464782715, -6.72684383392334, -5.488098621368408, -4.249353408813477, -3.010608196258545, -1.7718629837036133, -0.5331172943115234, 0.7056312561035156, 1.9443764686584473, 3.183121681213379, 4.4218668937683105, 5.660612106323242, 6.899357318878174, 8.138102531433105, 9.376848220825195, 10.615592956542969, 11.854337692260742, 13.093083381652832, 14.331829071044922, 15.570573806762695, 16.80931854248047, 18.048065185546875, 19.28680992126465, 20.525554656982422, 21.764299392700195, 23.00304412841797, 24.241790771484375, 25.48053550720215, 26.719280242919922, 27.958026885986328, 29.1967716217041, 30.435516357421875, 31.67426109313965, 32.91300582885742, 34.15175247192383, 35.39049530029297, 36.629241943359375, 37.86798858642578, 39.10673522949219, 40.34547805786133]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 0.0, 6.0, 3.0, 6.0, 10.0, 10.0, 15.0, 14.0, 16.0, 23.0, 28.0, 29.0, 37.0, 29.0, 50.0, 44.0, 44.0, 50.0, 44.0, 46.0, 43.0, 51.0, 39.0, 42.0, 53.0, 41.0, 29.0, 34.0, 32.0, 16.0, 19.0, 24.0, 14.0, 19.0, 13.0, 9.0, 4.0, 2.0, 4.0, 3.0, 3.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.21979904174805, -41.74457550048828, -40.269351959228516, -38.79412841796875, -37.31890106201172, -35.84367752075195, -34.36845397949219, -32.89323043823242, -31.418006896972656, -29.94278335571289, -28.467559814453125, -26.992334365844727, -25.51711082458496, -24.041887283325195, -22.566661834716797, -21.09143829345703, -19.616214752197266, -18.1409912109375, -16.665767669677734, -15.190542221069336, -13.71531867980957, -12.240095138549805, -10.764870643615723, -9.28964614868164, -7.814422607421875, -6.339198589324951, -4.863974571228027, -3.3887505531311035, -1.9135265350341797, -0.43830251693725586, 1.036921501159668, 2.51214599609375, 3.9873695373535156, 5.4625935554504395, 6.937817573547363, 8.413042068481445, 9.888265609741211, 11.363489151000977, 12.838713645935059, 14.31393814086914, 15.789161682128906, 17.264385223388672, 18.739608764648438, 20.214834213256836, 21.6900577545166, 23.165281295776367, 24.640506744384766, 26.11573028564453, 27.590953826904297, 29.066177368164062, 30.541400909423828, 32.016624450683594, 33.491851806640625, 34.96707534790039, 36.442298889160156, 37.91752243041992, 39.39274597167969, 40.86796951293945, 42.34319305419922, 43.818416595458984, 45.29364013671875, 46.76886749267578, 48.24409103393555, 49.71931457519531, 51.19453811645508]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [4.0, 6.0, 4.0, 3.0, 10.0, 22.0, 46.0, 76.0, 98.0, 188.0, 293.0, 505.0, 845.0, 1374.0, 2357.0, 3727.0, 6037.0, 9750.0, 15637.0, 24403.0, 37338.0, 56305.0, 82569.0, 117415.0, 163358.0, 214192.0, 270792.0, 326770.0, 369180.0, 394742.0, 393637.0, 369039.0, 325811.0, 270583.0, 214845.0, 161847.0, 118096.0, 82782.0, 56541.0, 37436.0, 24153.0, 15589.0, 10026.0, 6078.0, 3840.0, 2360.0, 1408.0, 854.0, 533.0, 307.0, 198.0, 115.0, 74.0, 35.0, 32.0, 17.0, 11.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-28.84375, -27.88232421875, -26.9208984375, -25.95947265625, -24.998046875, -24.03662109375, -23.0751953125, -22.11376953125, -21.15234375, -20.19091796875, -19.2294921875, -18.26806640625, -17.306640625, -16.34521484375, -15.3837890625, -14.42236328125, -13.4609375, -12.49951171875, -11.5380859375, -10.57666015625, -9.615234375, -8.65380859375, -7.6923828125, -6.73095703125, -5.76953125, -4.80810546875, -3.8466796875, -2.88525390625, -1.923828125, -0.96240234375, -0.0009765625, 0.96044921875, 1.921875, 2.88330078125, 3.8447265625, 4.80615234375, 5.767578125, 6.72900390625, 7.6904296875, 8.65185546875, 9.61328125, 10.57470703125, 11.5361328125, 12.49755859375, 13.458984375, 14.42041015625, 15.3818359375, 16.34326171875, 17.3046875, 18.26611328125, 19.2275390625, 20.18896484375, 21.150390625, 22.11181640625, 23.0732421875, 24.03466796875, 24.99609375, 25.95751953125, 26.9189453125, 27.88037109375, 28.841796875, 29.80322265625, 30.7646484375, 31.72607421875, 32.6875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 0.0, 2.0, 5.0, 7.0, 9.0, 13.0, 12.0, 10.0, 15.0, 25.0, 21.0, 38.0, 29.0, 37.0, 45.0, 47.0, 46.0, 47.0, 43.0, 49.0, 45.0, 50.0, 38.0, 49.0, 46.0, 40.0, 34.0, 25.0, 34.0, 23.0, 20.0, 22.0, 15.0, 18.0, 9.0, 13.0, 6.0, 0.0, 6.0, 1.0, 7.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.25, -37.91015625, -36.5703125, -35.23046875, -33.890625, -32.55078125, -31.2109375, -29.87109375, -28.53125, -27.19140625, -25.8515625, -24.51171875, -23.171875, -21.83203125, -20.4921875, -19.15234375, -17.8125, -16.47265625, -15.1328125, -13.79296875, -12.453125, -11.11328125, -9.7734375, -8.43359375, -7.09375, -5.75390625, -4.4140625, -3.07421875, -1.734375, -0.39453125, 0.9453125, 2.28515625, 3.625, 4.96484375, 6.3046875, 7.64453125, 8.984375, 10.32421875, 11.6640625, 13.00390625, 14.34375, 15.68359375, 17.0234375, 18.36328125, 19.703125, 21.04296875, 22.3828125, 23.72265625, 25.0625, 26.40234375, 27.7421875, 29.08203125, 30.421875, 31.76171875, 33.1015625, 34.44140625, 35.78125, 37.12109375, 38.4609375, 39.80078125, 41.140625, 42.48046875, 43.8203125, 45.16015625, 46.5]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 4.0, 7.0, 12.0, 19.0, 45.0, 64.0, 129.0, 182.0, 330.0, 544.0, 910.0, 1502.0, 2621.0, 4024.0, 6587.0, 10437.0, 16120.0, 24707.0, 36770.0, 53579.0, 76806.0, 106400.0, 142327.0, 184667.0, 229785.0, 273558.0, 312857.0, 341654.0, 355435.0, 351434.0, 330073.0, 295845.0, 253059.0, 207054.0, 163573.0, 124581.0, 91853.0, 64268.0, 44912.0, 30339.0, 20163.0, 13128.0, 8329.0, 5337.0, 3369.0, 1934.0, 1217.0, 712.0, 422.0, 268.0, 145.0, 79.0, 51.0, 32.0, 13.0, 18.0, 3.0, 2.0, 1.0, 2.0], "bins": [-30.984375, -30.03857421875, -29.0927734375, -28.14697265625, -27.201171875, -26.25537109375, -25.3095703125, -24.36376953125, -23.41796875, -22.47216796875, -21.5263671875, -20.58056640625, -19.634765625, -18.68896484375, -17.7431640625, -16.79736328125, -15.8515625, -14.90576171875, -13.9599609375, -13.01416015625, -12.068359375, -11.12255859375, -10.1767578125, -9.23095703125, -8.28515625, -7.33935546875, -6.3935546875, -5.44775390625, -4.501953125, -3.55615234375, -2.6103515625, -1.66455078125, -0.71875, 0.22705078125, 1.1728515625, 2.11865234375, 3.064453125, 4.01025390625, 4.9560546875, 5.90185546875, 6.84765625, 7.79345703125, 8.7392578125, 9.68505859375, 10.630859375, 11.57666015625, 12.5224609375, 13.46826171875, 14.4140625, 15.35986328125, 16.3056640625, 17.25146484375, 18.197265625, 19.14306640625, 20.0888671875, 21.03466796875, 21.98046875, 22.92626953125, 23.8720703125, 24.81787109375, 25.763671875, 26.70947265625, 27.6552734375, 28.60107421875, 29.546875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 2.0, 3.0, 4.0, 4.0, 7.0, 12.0, 28.0, 22.0, 25.0, 34.0, 39.0, 60.0, 52.0, 72.0, 90.0, 86.0, 109.0, 129.0, 141.0, 147.0, 160.0, 140.0, 196.0, 178.0, 222.0, 204.0, 180.0, 202.0, 194.0, 164.0, 187.0, 151.0, 141.0, 111.0, 93.0, 91.0, 83.0, 59.0, 51.0, 45.0, 40.0, 30.0, 18.0, 20.0, 16.0, 9.0, 11.0, 6.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.0, -16.455078125, -15.91015625, -15.365234375, -14.8203125, -14.275390625, -13.73046875, -13.185546875, -12.640625, -12.095703125, -11.55078125, -11.005859375, -10.4609375, -9.916015625, -9.37109375, -8.826171875, -8.28125, -7.736328125, -7.19140625, -6.646484375, -6.1015625, -5.556640625, -5.01171875, -4.466796875, -3.921875, -3.376953125, -2.83203125, -2.287109375, -1.7421875, -1.197265625, -0.65234375, -0.107421875, 0.4375, 0.982421875, 1.52734375, 2.072265625, 2.6171875, 3.162109375, 3.70703125, 4.251953125, 4.796875, 5.341796875, 5.88671875, 6.431640625, 6.9765625, 7.521484375, 8.06640625, 8.611328125, 9.15625, 9.701171875, 10.24609375, 10.791015625, 11.3359375, 11.880859375, 12.42578125, 12.970703125, 13.515625, 14.060546875, 14.60546875, 15.150390625, 15.6953125, 16.240234375, 16.78515625, 17.330078125, 17.875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 10.0, 5.0, 8.0, 7.0, 13.0, 9.0, 15.0, 24.0, 23.0, 32.0, 23.0, 32.0, 30.0, 32.0, 31.0, 43.0, 38.0, 58.0, 55.0, 41.0, 42.0, 53.0, 37.0, 51.0, 33.0, 39.0, 29.0, 37.0, 27.0, 23.0, 20.0, 19.0, 13.0, 15.0, 11.0, 9.0, 2.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-47.768611907958984, -46.28770065307617, -44.80678939819336, -43.32587814331055, -41.844966888427734, -40.36405563354492, -38.88314437866211, -37.4022331237793, -35.921321868896484, -34.44041061401367, -32.95949935913086, -31.478588104248047, -29.997676849365234, -28.516765594482422, -27.03585433959961, -25.554943084716797, -24.07402992248535, -22.59311866760254, -21.112207412719727, -19.631296157836914, -18.1503849029541, -16.66947364807129, -15.18856143951416, -13.707650184631348, -12.226738929748535, -10.745827674865723, -9.26491641998291, -7.7840046882629395, -6.303093433380127, -4.8221821784973145, -3.3412704467773438, -1.8603591918945312, -0.37944793701171875, 1.1014634370803833, 2.5823748111724854, 4.063286304473877, 5.5441975593566895, 7.025108814239502, 8.506020545959473, 9.986931800842285, 11.467843055725098, 12.94875431060791, 14.429665565490723, 15.910577774047852, 17.391489028930664, 18.872400283813477, 20.35331153869629, 21.8342227935791, 23.315134048461914, 24.796045303344727, 26.27695655822754, 27.75786781311035, 29.238779067993164, 30.719690322875977, 32.20060348510742, 33.681514739990234, 35.16242599487305, 36.64333724975586, 38.12424850463867, 39.605159759521484, 41.0860710144043, 42.56698226928711, 44.04789352416992, 45.528804779052734, 47.00971603393555]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 7.0, 3.0, 9.0, 8.0, 15.0, 16.0, 16.0, 21.0, 25.0, 33.0, 25.0, 37.0, 47.0, 38.0, 47.0, 47.0, 39.0, 53.0, 33.0, 46.0, 53.0, 42.0, 41.0, 38.0, 36.0, 23.0, 28.0, 21.0, 23.0, 15.0, 26.0, 14.0, 20.0, 9.0, 9.0, 5.0, 9.0, 7.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.65757369995117, -38.266448974609375, -36.87532043457031, -35.484195709228516, -34.09307098388672, -32.70194625854492, -31.310819625854492, -29.919692993164062, -28.528568267822266, -27.13744354248047, -25.74631690979004, -24.35519027709961, -22.964065551757812, -21.572940826416016, -20.181814193725586, -18.790687561035156, -17.39956283569336, -16.008438110351562, -14.617311477661133, -13.22618579864502, -11.835060119628906, -10.443934440612793, -9.05280876159668, -7.661683082580566, -6.270557403564453, -4.87943172454834, -3.4883060455322266, -2.0971803665161133, -0.7060546875, 0.6850709915161133, 2.0761966705322266, 3.46732234954834, 4.858448028564453, 6.249573707580566, 7.64069938659668, 9.031825065612793, 10.422950744628906, 11.81407642364502, 13.205202102661133, 14.596327781677246, 15.98745346069336, 17.378578186035156, 18.769704818725586, 20.160831451416016, 21.551956176757812, 22.94308090209961, 24.33420753479004, 25.72533416748047, 27.116458892822266, 28.507583618164062, 29.898710250854492, 31.289836883544922, 32.68096160888672, 34.072086334228516, 35.46321105957031, 36.854339599609375, 38.24546432495117, 39.63658905029297, 41.02771759033203, 42.41884231567383, 43.809967041015625, 45.20109176635742, 46.59221649169922, 47.98334503173828, 49.37446975708008]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 9.0, 8.0, 19.0, 30.0, 47.0, 67.0, 112.0, 170.0, 254.0, 374.0, 608.0, 915.0, 1533.0, 2468.0, 3814.0, 6134.0, 9870.0, 15569.0, 24969.0, 38463.0, 57565.0, 81280.0, 107172.0, 127657.0, 134155.0, 122018.0, 98679.0, 72970.0, 50918.0, 33447.0, 21156.0, 13557.0, 8297.0, 5260.0, 3341.0, 2098.0, 1322.0, 816.0, 508.0, 332.0, 209.0, 133.0, 85.0, 51.0, 37.0, 23.0, 18.0, 13.0, 5.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.5, -16.923095703125, -16.34619140625, -15.769287109375, -15.1923828125, -14.615478515625, -14.03857421875, -13.461669921875, -12.884765625, -12.307861328125, -11.73095703125, -11.154052734375, -10.5771484375, -10.000244140625, -9.42333984375, -8.846435546875, -8.26953125, -7.692626953125, -7.11572265625, -6.538818359375, -5.9619140625, -5.385009765625, -4.80810546875, -4.231201171875, -3.654296875, -3.077392578125, -2.50048828125, -1.923583984375, -1.3466796875, -0.769775390625, -0.19287109375, 0.384033203125, 0.9609375, 1.537841796875, 2.11474609375, 2.691650390625, 3.2685546875, 3.845458984375, 4.42236328125, 4.999267578125, 5.576171875, 6.153076171875, 6.72998046875, 7.306884765625, 7.8837890625, 8.460693359375, 9.03759765625, 9.614501953125, 10.19140625, 10.768310546875, 11.34521484375, 11.922119140625, 12.4990234375, 13.075927734375, 13.65283203125, 14.229736328125, 14.806640625, 15.383544921875, 15.96044921875, 16.537353515625, 17.1142578125, 17.691162109375, 18.26806640625, 18.844970703125, 19.421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 7.0, 4.0, 8.0, 9.0, 13.0, 16.0, 15.0, 23.0, 26.0, 34.0, 21.0, 40.0, 46.0, 37.0, 47.0, 44.0, 45.0, 49.0, 34.0, 48.0, 50.0, 45.0, 39.0, 39.0, 38.0, 23.0, 25.0, 24.0, 19.0, 21.0, 23.0, 12.0, 21.0, 10.0, 9.0, 5.0, 9.0, 7.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.71875, -38.3271484375, -36.935546875, -35.5439453125, -34.15234375, -32.7607421875, -31.369140625, -29.9775390625, -28.5859375, -27.1943359375, -25.802734375, -24.4111328125, -23.01953125, -21.6279296875, -20.236328125, -18.8447265625, -17.453125, -16.0615234375, -14.669921875, -13.2783203125, -11.88671875, -10.4951171875, -9.103515625, -7.7119140625, -6.3203125, -4.9287109375, -3.537109375, -2.1455078125, -0.75390625, 0.6376953125, 2.029296875, 3.4208984375, 4.8125, 6.2041015625, 7.595703125, 8.9873046875, 10.37890625, 11.7705078125, 13.162109375, 14.5537109375, 15.9453125, 17.3369140625, 18.728515625, 20.1201171875, 21.51171875, 22.9033203125, 24.294921875, 25.6865234375, 27.078125, 28.4697265625, 29.861328125, 31.2529296875, 32.64453125, 34.0361328125, 35.427734375, 36.8193359375, 38.2109375, 39.6025390625, 40.994140625, 42.3857421875, 43.77734375, 45.1689453125, 46.560546875, 47.9521484375, 49.34375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 6.0, 6.0, 10.0, 16.0, 19.0, 25.0, 51.0, 52.0, 90.0, 151.0, 173.0, 280.0, 484.0, 692.0, 1099.0, 1875.0, 3152.0, 5306.0, 9540.0, 17390.0, 32360.0, 61795.0, 113204.0, 185300.0, 221147.0, 172126.0, 101497.0, 54763.0, 28869.0, 15751.0, 8694.0, 4993.0, 2832.0, 1704.0, 1085.0, 695.0, 412.0, 307.0, 180.0, 146.0, 86.0, 76.0, 39.0, 41.0, 10.0, 10.0, 9.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0], "bins": [-25.578125, -24.788818359375, -23.99951171875, -23.210205078125, -22.4208984375, -21.631591796875, -20.84228515625, -20.052978515625, -19.263671875, -18.474365234375, -17.68505859375, -16.895751953125, -16.1064453125, -15.317138671875, -14.52783203125, -13.738525390625, -12.94921875, -12.159912109375, -11.37060546875, -10.581298828125, -9.7919921875, -9.002685546875, -8.21337890625, -7.424072265625, -6.634765625, -5.845458984375, -5.05615234375, -4.266845703125, -3.4775390625, -2.688232421875, -1.89892578125, -1.109619140625, -0.3203125, 0.468994140625, 1.25830078125, 2.047607421875, 2.8369140625, 3.626220703125, 4.41552734375, 5.204833984375, 5.994140625, 6.783447265625, 7.57275390625, 8.362060546875, 9.1513671875, 9.940673828125, 10.72998046875, 11.519287109375, 12.30859375, 13.097900390625, 13.88720703125, 14.676513671875, 15.4658203125, 16.255126953125, 17.04443359375, 17.833740234375, 18.623046875, 19.412353515625, 20.20166015625, 20.990966796875, 21.7802734375, 22.569580078125, 23.35888671875, 24.148193359375, 24.9375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 4.0, 9.0, 4.0, 3.0, 10.0, 7.0, 7.0, 12.0, 15.0, 16.0, 15.0, 17.0, 18.0, 21.0, 27.0, 35.0, 32.0, 38.0, 43.0, 35.0, 51.0, 40.0, 43.0, 40.0, 40.0, 41.0, 39.0, 29.0, 45.0, 34.0, 28.0, 24.0, 22.0, 26.0, 18.0, 18.0, 11.0, 15.0, 14.0, 13.0, 10.0, 7.0, 5.0, 8.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.03125, -25.239013671875, -24.44677734375, -23.654541015625, -22.8623046875, -22.070068359375, -21.27783203125, -20.485595703125, -19.693359375, -18.901123046875, -18.10888671875, -17.316650390625, -16.5244140625, -15.732177734375, -14.93994140625, -14.147705078125, -13.35546875, -12.563232421875, -11.77099609375, -10.978759765625, -10.1865234375, -9.394287109375, -8.60205078125, -7.809814453125, -7.017578125, -6.225341796875, -5.43310546875, -4.640869140625, -3.8486328125, -3.056396484375, -2.26416015625, -1.471923828125, -0.6796875, 0.112548828125, 0.90478515625, 1.697021484375, 2.4892578125, 3.281494140625, 4.07373046875, 4.865966796875, 5.658203125, 6.450439453125, 7.24267578125, 8.034912109375, 8.8271484375, 9.619384765625, 10.41162109375, 11.203857421875, 11.99609375, 12.788330078125, 13.58056640625, 14.372802734375, 15.1650390625, 15.957275390625, 16.74951171875, 17.541748046875, 18.333984375, 19.126220703125, 19.91845703125, 20.710693359375, 21.5029296875, 22.295166015625, 23.08740234375, 23.879638671875, 24.671875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 6.0, 7.0, 18.0, 19.0, 39.0, 50.0, 63.0, 85.0, 151.0, 234.0, 318.0, 470.0, 682.0, 1071.0, 1723.0, 2727.0, 4379.0, 7423.0, 13039.0, 23662.0, 44945.0, 91920.0, 189667.0, 280013.0, 190193.0, 92449.0, 45308.0, 24126.0, 13440.0, 7879.0, 4538.0, 2746.0, 1737.0, 1107.0, 758.0, 499.0, 359.0, 204.0, 143.0, 109.0, 62.0, 58.0, 37.0, 32.0, 20.0, 12.0, 9.0, 5.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-15.03125, -14.56884765625, -14.1064453125, -13.64404296875, -13.181640625, -12.71923828125, -12.2568359375, -11.79443359375, -11.33203125, -10.86962890625, -10.4072265625, -9.94482421875, -9.482421875, -9.02001953125, -8.5576171875, -8.09521484375, -7.6328125, -7.17041015625, -6.7080078125, -6.24560546875, -5.783203125, -5.32080078125, -4.8583984375, -4.39599609375, -3.93359375, -3.47119140625, -3.0087890625, -2.54638671875, -2.083984375, -1.62158203125, -1.1591796875, -0.69677734375, -0.234375, 0.22802734375, 0.6904296875, 1.15283203125, 1.615234375, 2.07763671875, 2.5400390625, 3.00244140625, 3.46484375, 3.92724609375, 4.3896484375, 4.85205078125, 5.314453125, 5.77685546875, 6.2392578125, 6.70166015625, 7.1640625, 7.62646484375, 8.0888671875, 8.55126953125, 9.013671875, 9.47607421875, 9.9384765625, 10.40087890625, 10.86328125, 11.32568359375, 11.7880859375, 12.25048828125, 12.712890625, 13.17529296875, 13.6376953125, 14.10009765625, 14.5625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 0.0, 3.0, 2.0, 1.0, 0.0, 6.0, 6.0, 8.0, 9.0, 10.0, 20.0, 28.0, 26.0, 43.0, 31.0, 52.0, 49.0, 62.0, 63.0, 67.0, 85.0, 65.0, 58.0, 44.0, 56.0, 48.0, 39.0, 32.0, 20.0, 13.0, 15.0, 8.0, 12.0, 4.0, 4.0, 2.0, 3.0, 5.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0009813308715820312, -0.0009529963135719299, -0.0009246617555618286, -0.0008963271975517273, -0.000867992639541626, -0.0008396580815315247, -0.0008113235235214233, -0.000782988965511322, -0.0007546544075012207, -0.0007263198494911194, -0.0006979852914810181, -0.0006696507334709167, -0.0006413161754608154, -0.0006129816174507141, -0.0005846470594406128, -0.0005563125014305115, -0.0005279779434204102, -0.0004996433854103088, -0.0004713088274002075, -0.0004429742693901062, -0.0004146397113800049, -0.00038630515336990356, -0.00035797059535980225, -0.00032963603734970093, -0.0003013014793395996, -0.0002729669213294983, -0.00024463236331939697, -0.00021629780530929565, -0.00018796324729919434, -0.00015962868928909302, -0.0001312941312789917, -0.00010295957326889038, -7.462501525878906e-05, -4.6290457248687744e-05, -1.7955899238586426e-05, 1.0378658771514893e-05, 3.871321678161621e-05, 6.704777479171753e-05, 9.538233280181885e-05, 0.00012371689081192017, 0.00015205144882202148, 0.0001803860068321228, 0.00020872056484222412, 0.00023705512285232544, 0.00026538968086242676, 0.0002937242388725281, 0.0003220587968826294, 0.0003503933548927307, 0.00037872791290283203, 0.00040706247091293335, 0.00043539702892303467, 0.000463731586933136, 0.0004920661449432373, 0.0005204007029533386, 0.0005487352609634399, 0.0005770698189735413, 0.0006054043769836426, 0.0006337389349937439, 0.0006620734930038452, 0.0006904080510139465, 0.0007187426090240479, 0.0007470771670341492, 0.0007754117250442505, 0.0008037462830543518, 0.0008320808410644531]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 7.0, 5.0, 5.0, 14.0, 26.0, 43.0, 44.0, 72.0, 122.0, 206.0, 341.0, 444.0, 663.0, 1175.0, 1730.0, 2709.0, 4414.0, 6706.0, 10700.0, 17282.0, 26813.0, 42017.0, 63960.0, 91402.0, 119939.0, 137727.0, 137427.0, 118130.0, 89707.0, 62044.0, 40960.0, 26170.0, 16668.0, 10350.0, 6664.0, 4239.0, 2698.0, 1723.0, 1136.0, 736.0, 485.0, 301.0, 194.0, 129.0, 85.0, 60.0, 51.0, 15.0, 11.0, 5.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0], "bins": [-15.953125, -15.4835205078125, -15.013916015625, -14.5443115234375, -14.07470703125, -13.6051025390625, -13.135498046875, -12.6658935546875, -12.1962890625, -11.7266845703125, -11.257080078125, -10.7874755859375, -10.31787109375, -9.8482666015625, -9.378662109375, -8.9090576171875, -8.439453125, -7.9698486328125, -7.500244140625, -7.0306396484375, -6.56103515625, -6.0914306640625, -5.621826171875, -5.1522216796875, -4.6826171875, -4.2130126953125, -3.743408203125, -3.2738037109375, -2.80419921875, -2.3345947265625, -1.864990234375, -1.3953857421875, -0.92578125, -0.4561767578125, 0.013427734375, 0.4830322265625, 0.95263671875, 1.4222412109375, 1.891845703125, 2.3614501953125, 2.8310546875, 3.3006591796875, 3.770263671875, 4.2398681640625, 4.70947265625, 5.1790771484375, 5.648681640625, 6.1182861328125, 6.587890625, 7.0574951171875, 7.527099609375, 7.9967041015625, 8.46630859375, 8.9359130859375, 9.405517578125, 9.8751220703125, 10.3447265625, 10.8143310546875, 11.283935546875, 11.7535400390625, 12.22314453125, 12.6927490234375, 13.162353515625, 13.6319580078125, 14.1015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 7.0, 8.0, 9.0, 12.0, 10.0, 13.0, 17.0, 22.0, 22.0, 23.0, 38.0, 47.0, 62.0, 49.0, 70.0, 63.0, 48.0, 68.0, 62.0, 50.0, 42.0, 46.0, 33.0, 35.0, 23.0, 22.0, 30.0, 17.0, 15.0, 9.0, 9.0, 6.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.046875, -5.86163330078125, -5.6763916015625, -5.49114990234375, -5.305908203125, -5.12066650390625, -4.9354248046875, -4.75018310546875, -4.56494140625, -4.37969970703125, -4.1944580078125, -4.00921630859375, -3.823974609375, -3.63873291015625, -3.4534912109375, -3.26824951171875, -3.0830078125, -2.89776611328125, -2.7125244140625, -2.52728271484375, -2.342041015625, -2.15679931640625, -1.9715576171875, -1.78631591796875, -1.60107421875, -1.41583251953125, -1.2305908203125, -1.04534912109375, -0.860107421875, -0.67486572265625, -0.4896240234375, -0.30438232421875, -0.119140625, 0.06610107421875, 0.2513427734375, 0.43658447265625, 0.621826171875, 0.80706787109375, 0.9923095703125, 1.17755126953125, 1.36279296875, 1.54803466796875, 1.7332763671875, 1.91851806640625, 2.103759765625, 2.28900146484375, 2.4742431640625, 2.65948486328125, 2.8447265625, 3.02996826171875, 3.2152099609375, 3.40045166015625, 3.585693359375, 3.77093505859375, 3.9561767578125, 4.14141845703125, 4.32666015625, 4.51190185546875, 4.6971435546875, 4.88238525390625, 5.067626953125, 5.25286865234375, 5.4381103515625, 5.62335205078125, 5.80859375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 7.0, 9.0, 8.0, 8.0, 8.0, 12.0, 16.0, 18.0, 27.0, 32.0, 24.0, 32.0, 25.0, 29.0, 32.0, 45.0, 33.0, 54.0, 53.0, 42.0, 48.0, 38.0, 48.0, 34.0, 45.0, 36.0, 48.0, 24.0, 25.0, 23.0, 24.0, 19.0, 20.0, 15.0, 13.0, 8.0, 6.0, 3.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-46.073143005371094, -44.606754302978516, -43.14036560058594, -41.673980712890625, -40.20759201049805, -38.74120330810547, -37.27481460571289, -35.80842590332031, -34.342041015625, -32.87565231323242, -31.409265518188477, -29.9428768157959, -28.476490020751953, -27.010101318359375, -25.543712615966797, -24.07732391357422, -22.61093521118164, -21.144546508789062, -19.678159713745117, -18.21177101135254, -16.745384216308594, -15.278995513916016, -13.812606811523438, -12.346219062805176, -10.879831314086914, -9.413443565368652, -7.947055339813232, -6.4806671142578125, -5.014279365539551, -3.547891616821289, -2.081502914428711, -0.6151151657104492, 0.8512725830078125, 2.3176605701446533, 3.784048557281494, 5.250436782836914, 6.716824531555176, 8.183212280273438, 9.649600982666016, 11.115988731384277, 12.582376480102539, 14.0487642288208, 15.515151977539062, 16.98154067993164, 18.44792938232422, 19.914316177368164, 21.380704879760742, 22.847091674804688, 24.313480377197266, 25.779869079589844, 27.24625587463379, 28.712644577026367, 30.179031372070312, 31.64542007446289, 33.11180877685547, 34.57819747924805, 36.044586181640625, 37.5109748840332, 38.97736358642578, 40.443748474121094, 41.91013717651367, 43.37652587890625, 44.84291458129883, 46.309303283691406, 47.77568817138672]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 6.0, 5.0, 4.0, 6.0, 13.0, 17.0, 14.0, 19.0, 21.0, 25.0, 29.0, 29.0, 46.0, 41.0, 43.0, 37.0, 46.0, 48.0, 40.0, 50.0, 36.0, 50.0, 42.0, 41.0, 42.0, 33.0, 26.0, 25.0, 26.0, 27.0, 19.0, 11.0, 17.0, 16.0, 10.0, 10.0, 4.0, 12.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.1818733215332, -36.783782958984375, -35.38568878173828, -33.98759460449219, -32.58950424194336, -31.1914119720459, -29.793319702148438, -28.395227432250977, -26.997135162353516, -25.599042892456055, -24.200950622558594, -22.802858352661133, -21.404766082763672, -20.00667381286621, -18.60858154296875, -17.21048927307129, -15.812397003173828, -14.414304733276367, -13.016212463378906, -11.618120193481445, -10.220027923583984, -8.821935653686523, -7.4238433837890625, -6.025751113891602, -4.627658843994141, -3.2295665740966797, -1.8314743041992188, -0.4333820343017578, 0.9647102355957031, 2.362802505493164, 3.760894775390625, 5.158987045288086, 6.557075500488281, 7.955167770385742, 9.353260040283203, 10.751352310180664, 12.149444580078125, 13.547536849975586, 14.945629119873047, 16.343721389770508, 17.74181365966797, 19.13990592956543, 20.53799819946289, 21.93609046936035, 23.334182739257812, 24.732275009155273, 26.130367279052734, 27.528459548950195, 28.926551818847656, 30.324644088745117, 31.722736358642578, 33.120826721191406, 34.5189208984375, 35.917015075683594, 37.31510543823242, 38.71319580078125, 40.111289978027344, 41.50938415527344, 42.907474517822266, 44.305564880371094, 45.70365905761719, 47.10175323486328, 48.49984359741211, 49.89793395996094, 51.29602813720703]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 11.0, 10.0, 17.0, 30.0, 67.0, 94.0, 139.0, 244.0, 371.0, 617.0, 1001.0, 1556.0, 2324.0, 3580.0, 5521.0, 8065.0, 12039.0, 16410.0, 22920.0, 30337.0, 39907.0, 49899.0, 60306.0, 70236.0, 78276.0, 83147.0, 84677.0, 82957.0, 77446.0, 68772.0, 59274.0, 48641.0, 38431.0, 29447.0, 21986.0, 16027.0, 11106.0, 7835.0, 5165.0, 3545.0, 2277.0, 1451.0, 903.0, 563.0, 362.0, 224.0, 155.0, 76.0, 48.0, 31.0, 17.0, 9.0, 9.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-29.53125, -28.620849609375, -27.71044921875, -26.800048828125, -25.8896484375, -24.979248046875, -24.06884765625, -23.158447265625, -22.248046875, -21.337646484375, -20.42724609375, -19.516845703125, -18.6064453125, -17.696044921875, -16.78564453125, -15.875244140625, -14.96484375, -14.054443359375, -13.14404296875, -12.233642578125, -11.3232421875, -10.412841796875, -9.50244140625, -8.592041015625, -7.681640625, -6.771240234375, -5.86083984375, -4.950439453125, -4.0400390625, -3.129638671875, -2.21923828125, -1.308837890625, -0.3984375, 0.511962890625, 1.42236328125, 2.332763671875, 3.2431640625, 4.153564453125, 5.06396484375, 5.974365234375, 6.884765625, 7.795166015625, 8.70556640625, 9.615966796875, 10.5263671875, 11.436767578125, 12.34716796875, 13.257568359375, 14.16796875, 15.078369140625, 15.98876953125, 16.899169921875, 17.8095703125, 18.719970703125, 19.63037109375, 20.540771484375, 21.451171875, 22.361572265625, 23.27197265625, 24.182373046875, 25.0927734375, 26.003173828125, 26.91357421875, 27.823974609375, 28.734375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 6.0, 5.0, 7.0, 11.0, 18.0, 12.0, 22.0, 24.0, 21.0, 29.0, 31.0, 47.0, 41.0, 42.0, 40.0, 51.0, 42.0, 39.0, 47.0, 43.0, 53.0, 34.0, 45.0, 42.0, 27.0, 32.0, 25.0, 24.0, 27.0, 16.0, 15.0, 16.0, 14.0, 11.0, 7.0, 7.0, 10.0, 2.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.84375, -35.48681640625, -34.1298828125, -32.77294921875, -31.416015625, -30.05908203125, -28.7021484375, -27.34521484375, -25.98828125, -24.63134765625, -23.2744140625, -21.91748046875, -20.560546875, -19.20361328125, -17.8466796875, -16.48974609375, -15.1328125, -13.77587890625, -12.4189453125, -11.06201171875, -9.705078125, -8.34814453125, -6.9912109375, -5.63427734375, -4.27734375, -2.92041015625, -1.5634765625, -0.20654296875, 1.150390625, 2.50732421875, 3.8642578125, 5.22119140625, 6.578125, 7.93505859375, 9.2919921875, 10.64892578125, 12.005859375, 13.36279296875, 14.7197265625, 16.07666015625, 17.43359375, 18.79052734375, 20.1474609375, 21.50439453125, 22.861328125, 24.21826171875, 25.5751953125, 26.93212890625, 28.2890625, 29.64599609375, 31.0029296875, 32.35986328125, 33.716796875, 35.07373046875, 36.4306640625, 37.78759765625, 39.14453125, 40.50146484375, 41.8583984375, 43.21533203125, 44.572265625, 45.92919921875, 47.2861328125, 48.64306640625, 50.0]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 7.0, 1.0, 5.0, 7.0, 11.0, 15.0, 28.0, 55.0, 74.0, 136.0, 236.0, 360.0, 565.0, 916.0, 1553.0, 2325.0, 3351.0, 5125.0, 7765.0, 11166.0, 15747.0, 21787.0, 29772.0, 38703.0, 48744.0, 59506.0, 69401.0, 78005.0, 83598.0, 85467.0, 83874.0, 78653.0, 69584.0, 59953.0, 49181.0, 39287.0, 30186.0, 22599.0, 16186.0, 11533.0, 7843.0, 5359.0, 3503.0, 2325.0, 1452.0, 1029.0, 588.0, 364.0, 256.0, 169.0, 74.0, 68.0, 37.0, 17.0, 5.0, 6.0, 5.0, 4.0, 0.0, 0.0, 2.0], "bins": [-28.609375, -27.72998046875, -26.8505859375, -25.97119140625, -25.091796875, -24.21240234375, -23.3330078125, -22.45361328125, -21.57421875, -20.69482421875, -19.8154296875, -18.93603515625, -18.056640625, -17.17724609375, -16.2978515625, -15.41845703125, -14.5390625, -13.65966796875, -12.7802734375, -11.90087890625, -11.021484375, -10.14208984375, -9.2626953125, -8.38330078125, -7.50390625, -6.62451171875, -5.7451171875, -4.86572265625, -3.986328125, -3.10693359375, -2.2275390625, -1.34814453125, -0.46875, 0.41064453125, 1.2900390625, 2.16943359375, 3.048828125, 3.92822265625, 4.8076171875, 5.68701171875, 6.56640625, 7.44580078125, 8.3251953125, 9.20458984375, 10.083984375, 10.96337890625, 11.8427734375, 12.72216796875, 13.6015625, 14.48095703125, 15.3603515625, 16.23974609375, 17.119140625, 17.99853515625, 18.8779296875, 19.75732421875, 20.63671875, 21.51611328125, 22.3955078125, 23.27490234375, 24.154296875, 25.03369140625, 25.9130859375, 26.79248046875, 27.671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 7.0, 9.0, 6.0, 10.0, 9.0, 12.0, 12.0, 13.0, 22.0, 23.0, 22.0, 21.0, 33.0, 39.0, 30.0, 23.0, 37.0, 40.0, 40.0, 44.0, 35.0, 47.0, 37.0, 30.0, 43.0, 43.0, 33.0, 32.0, 23.0, 27.0, 34.0, 27.0, 17.0, 19.0, 14.0, 18.0, 18.0, 10.0, 13.0, 7.0, 5.0, 7.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.796875, -23.01123046875, -22.2255859375, -21.43994140625, -20.654296875, -19.86865234375, -19.0830078125, -18.29736328125, -17.51171875, -16.72607421875, -15.9404296875, -15.15478515625, -14.369140625, -13.58349609375, -12.7978515625, -12.01220703125, -11.2265625, -10.44091796875, -9.6552734375, -8.86962890625, -8.083984375, -7.29833984375, -6.5126953125, -5.72705078125, -4.94140625, -4.15576171875, -3.3701171875, -2.58447265625, -1.798828125, -1.01318359375, -0.2275390625, 0.55810546875, 1.34375, 2.12939453125, 2.9150390625, 3.70068359375, 4.486328125, 5.27197265625, 6.0576171875, 6.84326171875, 7.62890625, 8.41455078125, 9.2001953125, 9.98583984375, 10.771484375, 11.55712890625, 12.3427734375, 13.12841796875, 13.9140625, 14.69970703125, 15.4853515625, 16.27099609375, 17.056640625, 17.84228515625, 18.6279296875, 19.41357421875, 20.19921875, 20.98486328125, 21.7705078125, 22.55615234375, 23.341796875, 24.12744140625, 24.9130859375, 25.69873046875, 26.484375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 8.0, 7.0, 9.0, 8.0, 17.0, 33.0, 51.0, 50.0, 137.0, 243.0, 394.0, 712.0, 1161.0, 2018.0, 3617.0, 6042.0, 10166.0, 16307.0, 26092.0, 39452.0, 56239.0, 76326.0, 94213.0, 109787.0, 116606.0, 113734.0, 101823.0, 82984.0, 63998.0, 45259.0, 30973.0, 19837.0, 12339.0, 7416.0, 4362.0, 2569.0, 1545.0, 868.0, 484.0, 270.0, 151.0, 101.0, 58.0, 44.0, 19.0, 12.0, 12.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.3359375, -12.8712158203125, -12.406494140625, -11.9417724609375, -11.47705078125, -11.0123291015625, -10.547607421875, -10.0828857421875, -9.6181640625, -9.1534423828125, -8.688720703125, -8.2239990234375, -7.75927734375, -7.2945556640625, -6.829833984375, -6.3651123046875, -5.900390625, -5.4356689453125, -4.970947265625, -4.5062255859375, -4.04150390625, -3.5767822265625, -3.112060546875, -2.6473388671875, -2.1826171875, -1.7178955078125, -1.253173828125, -0.7884521484375, -0.32373046875, 0.1409912109375, 0.605712890625, 1.0704345703125, 1.53515625, 1.9998779296875, 2.464599609375, 2.9293212890625, 3.39404296875, 3.8587646484375, 4.323486328125, 4.7882080078125, 5.2529296875, 5.7176513671875, 6.182373046875, 6.6470947265625, 7.11181640625, 7.5765380859375, 8.041259765625, 8.5059814453125, 8.970703125, 9.4354248046875, 9.900146484375, 10.3648681640625, 10.82958984375, 11.2943115234375, 11.759033203125, 12.2237548828125, 12.6884765625, 13.1531982421875, 13.617919921875, 14.0826416015625, 14.54736328125, 15.0120849609375, 15.476806640625, 15.9415283203125, 16.40625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 7.0, 7.0, 5.0, 6.0, 15.0, 12.0, 24.0, 14.0, 16.0, 23.0, 22.0, 31.0, 22.0, 27.0, 26.0, 45.0, 53.0, 40.0, 46.0, 51.0, 38.0, 41.0, 37.0, 34.0, 39.0, 36.0, 30.0, 36.0, 34.0, 22.0, 27.0, 28.0, 16.0, 21.0, 15.0, 13.0, 9.0, 7.0, 6.0, 7.0, 7.0, 7.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.0018205642700195312, -0.0017708837985992432, -0.001721203327178955, -0.001671522855758667, -0.001621842384338379, -0.0015721619129180908, -0.0015224814414978027, -0.0014728009700775146, -0.0014231204986572266, -0.0013734400272369385, -0.0013237595558166504, -0.0012740790843963623, -0.0012243986129760742, -0.0011747181415557861, -0.001125037670135498, -0.00107535719871521, -0.0010256767272949219, -0.0009759962558746338, -0.0009263157844543457, -0.0008766353130340576, -0.0008269548416137695, -0.0007772743701934814, -0.0007275938987731934, -0.0006779134273529053, -0.0006282329559326172, -0.0005785524845123291, -0.000528872013092041, -0.00047919154167175293, -0.00042951107025146484, -0.00037983059883117676, -0.00033015012741088867, -0.0002804696559906006, -0.0002307891845703125, -0.00018110871315002441, -0.00013142824172973633, -8.174777030944824e-05, -3.2067298889160156e-05, 1.761317253112793e-05, 6.729364395141602e-05, 0.0001169741153717041, 0.0001666545867919922, 0.00021633505821228027, 0.00026601552963256836, 0.00031569600105285645, 0.00036537647247314453, 0.0004150569438934326, 0.0004647374153137207, 0.0005144178867340088, 0.0005640983581542969, 0.000613778829574585, 0.000663459300994873, 0.0007131397724151611, 0.0007628202438354492, 0.0008125007152557373, 0.0008621811866760254, 0.0009118616580963135, 0.0009615421295166016, 0.0010112226009368896, 0.0010609030723571777, 0.0011105835437774658, 0.001160264015197754, 0.001209944486618042, 0.00125962495803833, 0.0013093054294586182, 0.0013589859008789062]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 9.0, 15.0, 12.0, 16.0, 35.0, 66.0, 106.0, 163.0, 271.0, 450.0, 751.0, 1410.0, 2393.0, 4265.0, 7106.0, 12178.0, 19908.0, 31658.0, 48398.0, 68954.0, 91989.0, 111839.0, 124149.0, 123224.0, 111917.0, 91545.0, 68318.0, 47774.0, 31213.0, 19660.0, 11898.0, 7099.0, 4092.0, 2446.0, 1261.0, 811.0, 480.0, 278.0, 152.0, 106.0, 55.0, 27.0, 25.0, 15.0, 6.0, 5.0, 7.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.46875, -17.891357421875, -17.31396484375, -16.736572265625, -16.1591796875, -15.581787109375, -15.00439453125, -14.427001953125, -13.849609375, -13.272216796875, -12.69482421875, -12.117431640625, -11.5400390625, -10.962646484375, -10.38525390625, -9.807861328125, -9.23046875, -8.653076171875, -8.07568359375, -7.498291015625, -6.9208984375, -6.343505859375, -5.76611328125, -5.188720703125, -4.611328125, -4.033935546875, -3.45654296875, -2.879150390625, -2.3017578125, -1.724365234375, -1.14697265625, -0.569580078125, 0.0078125, 0.585205078125, 1.16259765625, 1.739990234375, 2.3173828125, 2.894775390625, 3.47216796875, 4.049560546875, 4.626953125, 5.204345703125, 5.78173828125, 6.359130859375, 6.9365234375, 7.513916015625, 8.09130859375, 8.668701171875, 9.24609375, 9.823486328125, 10.40087890625, 10.978271484375, 11.5556640625, 12.133056640625, 12.71044921875, 13.287841796875, 13.865234375, 14.442626953125, 15.02001953125, 15.597412109375, 16.1748046875, 16.752197265625, 17.32958984375, 17.906982421875, 18.484375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 4.0, 1.0, 5.0, 3.0, 12.0, 10.0, 12.0, 6.0, 15.0, 10.0, 17.0, 17.0, 28.0, 30.0, 34.0, 31.0, 35.0, 34.0, 38.0, 45.0, 40.0, 44.0, 44.0, 37.0, 38.0, 43.0, 38.0, 39.0, 42.0, 31.0, 34.0, 27.0, 26.0, 18.0, 19.0, 12.0, 13.0, 13.0, 8.0, 10.0, 7.0, 4.0, 7.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0], "bins": [-7.00390625, -6.80194091796875, -6.5999755859375, -6.39801025390625, -6.196044921875, -5.99407958984375, -5.7921142578125, -5.59014892578125, -5.38818359375, -5.18621826171875, -4.9842529296875, -4.78228759765625, -4.580322265625, -4.37835693359375, -4.1763916015625, -3.97442626953125, -3.7724609375, -3.57049560546875, -3.3685302734375, -3.16656494140625, -2.964599609375, -2.76263427734375, -2.5606689453125, -2.35870361328125, -2.15673828125, -1.95477294921875, -1.7528076171875, -1.55084228515625, -1.348876953125, -1.14691162109375, -0.9449462890625, -0.74298095703125, -0.541015625, -0.33905029296875, -0.1370849609375, 0.06488037109375, 0.266845703125, 0.46881103515625, 0.6707763671875, 0.87274169921875, 1.07470703125, 1.27667236328125, 1.4786376953125, 1.68060302734375, 1.882568359375, 2.08453369140625, 2.2864990234375, 2.48846435546875, 2.6904296875, 2.89239501953125, 3.0943603515625, 3.29632568359375, 3.498291015625, 3.70025634765625, 3.9022216796875, 4.10418701171875, 4.30615234375, 4.50811767578125, 4.7100830078125, 4.91204833984375, 5.114013671875, 5.31597900390625, 5.5179443359375, 5.71990966796875, 5.921875]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 4.0, 7.0, 8.0, 13.0, 7.0, 8.0, 11.0, 13.0, 25.0, 25.0, 28.0, 26.0, 40.0, 31.0, 30.0, 34.0, 39.0, 42.0, 36.0, 39.0, 45.0, 45.0, 48.0, 36.0, 47.0, 52.0, 40.0, 25.0, 34.0, 16.0, 22.0, 28.0, 23.0, 19.0, 12.0, 13.0, 11.0, 6.0, 8.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-42.42247772216797, -40.99325942993164, -39.56404113769531, -38.134822845458984, -36.705604553222656, -35.276390075683594, -33.847171783447266, -32.41795349121094, -30.98873519897461, -29.55951690673828, -28.130298614501953, -26.701082229614258, -25.27186393737793, -23.8426456451416, -22.413429260253906, -20.984210968017578, -19.55499267578125, -18.125774383544922, -16.696556091308594, -15.267339706420898, -13.83812141418457, -12.408903121948242, -10.97968578338623, -9.550468444824219, -8.12125015258789, -6.692032337188721, -5.262814521789551, -3.833596706390381, -2.404378890991211, -0.975161075592041, 0.4540567398071289, 1.8832740783691406, 3.3124961853027344, 4.741714000701904, 6.170931816101074, 7.600149631500244, 9.029367446899414, 10.458585739135742, 11.887803077697754, 13.317020416259766, 14.746238708496094, 16.175457000732422, 17.60467529296875, 19.033891677856445, 20.463109970092773, 21.8923282623291, 23.321544647216797, 24.750762939453125, 26.179981231689453, 27.60919952392578, 29.03841781616211, 30.467634201049805, 31.896852493286133, 33.32606887817383, 34.755287170410156, 36.184505462646484, 37.61372375488281, 39.04294204711914, 40.47216033935547, 41.9013786315918, 43.330596923828125, 44.75981140136719, 46.189029693603516, 47.618247985839844, 49.04746627807617]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 8.0, 8.0, 6.0, 14.0, 13.0, 18.0, 18.0, 24.0, 20.0, 27.0, 41.0, 33.0, 36.0, 38.0, 36.0, 44.0, 38.0, 49.0, 46.0, 56.0, 40.0, 40.0, 31.0, 29.0, 29.0, 37.0, 23.0, 23.0, 24.0, 22.0, 22.0, 20.0, 16.0, 16.0, 10.0, 10.0, 13.0, 6.0, 7.0, 6.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.5181884765625, -41.14090347290039, -39.76361846923828, -38.38633728027344, -37.00905227661133, -35.63176727294922, -34.254486083984375, -32.877201080322266, -31.499916076660156, -30.122631072998047, -28.74534797668457, -27.368064880371094, -25.990779876708984, -24.613494873046875, -23.2362117767334, -21.858928680419922, -20.481643676757812, -19.104358673095703, -17.727075576782227, -16.34979248046875, -14.97250747680664, -13.595223426818848, -12.217939376831055, -10.840655326843262, -9.463371276855469, -8.086087226867676, -6.708803176879883, -5.33151912689209, -3.954235076904297, -2.576951026916504, -1.199666976928711, 0.17761707305908203, 1.5548973083496094, 2.9321813583374023, 4.309465408325195, 5.686749458312988, 7.064033508300781, 8.441317558288574, 9.818601608276367, 11.19588565826416, 12.573169708251953, 13.950453758239746, 15.327737808227539, 16.705020904541016, 18.082305908203125, 19.459590911865234, 20.83687400817871, 22.214157104492188, 23.591442108154297, 24.968727111816406, 26.346010208129883, 27.72329330444336, 29.10057830810547, 30.477863311767578, 31.855146408081055, 33.23242950439453, 34.60971450805664, 35.98699951171875, 37.364280700683594, 38.7415657043457, 40.11885070800781, 41.49613571166992, 42.87342071533203, 44.250701904296875, 45.627986907958984]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 9.0, 5.0, 15.0, 24.0, 24.0, 56.0, 89.0, 127.0, 239.0, 378.0, 613.0, 1011.0, 1540.0, 2537.0, 3885.0, 6116.0, 9319.0, 14180.0, 21429.0, 32227.0, 46749.0, 67245.0, 94639.0, 128306.0, 170141.0, 216310.0, 265252.0, 309037.0, 342911.0, 362062.0, 361366.0, 342265.0, 308317.0, 264317.0, 216421.0, 169893.0, 129595.0, 95408.0, 68332.0, 46971.0, 32770.0, 21598.0, 14349.0, 9479.0, 6113.0, 3876.0, 2519.0, 1620.0, 938.0, 662.0, 386.0, 241.0, 155.0, 99.0, 57.0, 31.0, 24.0, 11.0, 8.0, 3.0], "bins": [-30.96875, -30.05810546875, -29.1474609375, -28.23681640625, -27.326171875, -26.41552734375, -25.5048828125, -24.59423828125, -23.68359375, -22.77294921875, -21.8623046875, -20.95166015625, -20.041015625, -19.13037109375, -18.2197265625, -17.30908203125, -16.3984375, -15.48779296875, -14.5771484375, -13.66650390625, -12.755859375, -11.84521484375, -10.9345703125, -10.02392578125, -9.11328125, -8.20263671875, -7.2919921875, -6.38134765625, -5.470703125, -4.56005859375, -3.6494140625, -2.73876953125, -1.828125, -0.91748046875, -0.0068359375, 0.90380859375, 1.814453125, 2.72509765625, 3.6357421875, 4.54638671875, 5.45703125, 6.36767578125, 7.2783203125, 8.18896484375, 9.099609375, 10.01025390625, 10.9208984375, 11.83154296875, 12.7421875, 13.65283203125, 14.5634765625, 15.47412109375, 16.384765625, 17.29541015625, 18.2060546875, 19.11669921875, 20.02734375, 20.93798828125, 21.8486328125, 22.75927734375, 23.669921875, 24.58056640625, 25.4912109375, 26.40185546875, 27.3125]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 9.0, 9.0, 7.0, 11.0, 16.0, 20.0, 21.0, 15.0, 28.0, 21.0, 50.0, 34.0, 38.0, 30.0, 49.0, 37.0, 45.0, 47.0, 58.0, 42.0, 39.0, 40.0, 30.0, 33.0, 30.0, 30.0, 24.0, 25.0, 20.0, 25.0, 17.0, 22.0, 11.0, 17.0, 14.0, 8.0, 8.0, 7.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.59375, -37.3271484375, -36.060546875, -34.7939453125, -33.52734375, -32.2607421875, -30.994140625, -29.7275390625, -28.4609375, -27.1943359375, -25.927734375, -24.6611328125, -23.39453125, -22.1279296875, -20.861328125, -19.5947265625, -18.328125, -17.0615234375, -15.794921875, -14.5283203125, -13.26171875, -11.9951171875, -10.728515625, -9.4619140625, -8.1953125, -6.9287109375, -5.662109375, -4.3955078125, -3.12890625, -1.8623046875, -0.595703125, 0.6708984375, 1.9375, 3.2041015625, 4.470703125, 5.7373046875, 7.00390625, 8.2705078125, 9.537109375, 10.8037109375, 12.0703125, 13.3369140625, 14.603515625, 15.8701171875, 17.13671875, 18.4033203125, 19.669921875, 20.9365234375, 22.203125, 23.4697265625, 24.736328125, 26.0029296875, 27.26953125, 28.5361328125, 29.802734375, 31.0693359375, 32.3359375, 33.6025390625, 34.869140625, 36.1357421875, 37.40234375, 38.6689453125, 39.935546875, 41.2021484375, 42.46875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 4.0, 5.0, 15.0, 30.0, 37.0, 61.0, 110.0, 206.0, 284.0, 492.0, 847.0, 1403.0, 2197.0, 3401.0, 5584.0, 8621.0, 13305.0, 19903.0, 29816.0, 43891.0, 62158.0, 86317.0, 117253.0, 151737.0, 193043.0, 234999.0, 275035.0, 309343.0, 332521.0, 341030.0, 335258.0, 315754.0, 282131.0, 244011.0, 200628.0, 160339.0, 123126.0, 91851.0, 66346.0, 46847.0, 32515.0, 21871.0, 14416.0, 9424.0, 5972.0, 3816.0, 2479.0, 1470.0, 919.0, 589.0, 361.0, 194.0, 131.0, 87.0, 42.0, 34.0, 16.0, 10.0, 7.0, 2.0, 2.0], "bins": [-30.15625, -29.231201171875, -28.30615234375, -27.381103515625, -26.4560546875, -25.531005859375, -24.60595703125, -23.680908203125, -22.755859375, -21.830810546875, -20.90576171875, -19.980712890625, -19.0556640625, -18.130615234375, -17.20556640625, -16.280517578125, -15.35546875, -14.430419921875, -13.50537109375, -12.580322265625, -11.6552734375, -10.730224609375, -9.80517578125, -8.880126953125, -7.955078125, -7.030029296875, -6.10498046875, -5.179931640625, -4.2548828125, -3.329833984375, -2.40478515625, -1.479736328125, -0.5546875, 0.370361328125, 1.29541015625, 2.220458984375, 3.1455078125, 4.070556640625, 4.99560546875, 5.920654296875, 6.845703125, 7.770751953125, 8.69580078125, 9.620849609375, 10.5458984375, 11.470947265625, 12.39599609375, 13.321044921875, 14.24609375, 15.171142578125, 16.09619140625, 17.021240234375, 17.9462890625, 18.871337890625, 19.79638671875, 20.721435546875, 21.646484375, 22.571533203125, 23.49658203125, 24.421630859375, 25.3466796875, 26.271728515625, 27.19677734375, 28.121826171875, 29.046875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 2.0, 6.0, 4.0, 6.0, 9.0, 22.0, 23.0, 19.0, 32.0, 47.0, 49.0, 57.0, 65.0, 67.0, 102.0, 98.0, 135.0, 112.0, 146.0, 183.0, 163.0, 184.0, 200.0, 191.0, 184.0, 181.0, 205.0, 175.0, 189.0, 157.0, 150.0, 139.0, 112.0, 119.0, 93.0, 77.0, 82.0, 62.0, 40.0, 32.0, 27.0, 25.0, 30.0, 22.0, 12.0, 13.0, 7.0, 7.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-17.734375, -17.19140625, -16.6484375, -16.10546875, -15.5625, -15.01953125, -14.4765625, -13.93359375, -13.390625, -12.84765625, -12.3046875, -11.76171875, -11.21875, -10.67578125, -10.1328125, -9.58984375, -9.046875, -8.50390625, -7.9609375, -7.41796875, -6.875, -6.33203125, -5.7890625, -5.24609375, -4.703125, -4.16015625, -3.6171875, -3.07421875, -2.53125, -1.98828125, -1.4453125, -0.90234375, -0.359375, 0.18359375, 0.7265625, 1.26953125, 1.8125, 2.35546875, 2.8984375, 3.44140625, 3.984375, 4.52734375, 5.0703125, 5.61328125, 6.15625, 6.69921875, 7.2421875, 7.78515625, 8.328125, 8.87109375, 9.4140625, 9.95703125, 10.5, 11.04296875, 11.5859375, 12.12890625, 12.671875, 13.21484375, 13.7578125, 14.30078125, 14.84375, 15.38671875, 15.9296875, 16.47265625, 17.015625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 8.0, 2.0, 6.0, 10.0, 20.0, 17.0, 19.0, 38.0, 27.0, 31.0, 31.0, 47.0, 53.0, 45.0, 35.0, 51.0, 47.0, 54.0, 39.0, 46.0, 37.0, 39.0, 38.0, 32.0, 39.0, 38.0, 30.0, 16.0, 20.0, 12.0, 18.0, 11.0, 7.0, 9.0, 5.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-47.53585433959961, -45.968074798583984, -44.400291442871094, -42.83251190185547, -41.26472854614258, -39.69694900512695, -38.12916564941406, -36.56138610839844, -34.99360656738281, -33.42582702636719, -31.858043670654297, -30.290264129638672, -28.72248077392578, -27.154701232910156, -25.5869197845459, -24.01913833618164, -22.45135498046875, -20.883573532104492, -19.315792083740234, -17.74801254272461, -16.18022918701172, -14.612448692321777, -13.044668197631836, -11.476886749267578, -9.90910530090332, -8.341323852539062, -6.773542881011963, -5.205761909484863, -3.6379804611206055, -2.0701990127563477, -0.5024185180664062, 1.0653629302978516, 2.633148193359375, 4.200929641723633, 5.768710613250732, 7.336491584777832, 8.90427303314209, 10.472054481506348, 12.039834976196289, 13.607616424560547, 15.175397872924805, 16.743179321289062, 18.31096076965332, 19.878742218017578, 21.446521759033203, 23.014305114746094, 24.58208465576172, 26.149866104125977, 27.717647552490234, 29.285429000854492, 30.85321044921875, 32.420989990234375, 33.988773345947266, 35.55655288696289, 37.12433624267578, 38.692115783691406, 40.25989532470703, 41.827674865722656, 43.39545822143555, 44.96323776245117, 46.53102111816406, 48.09880065917969, 49.66658020019531, 51.2343635559082, 52.802146911621094]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 6.0, 8.0, 14.0, 11.0, 12.0, 18.0, 20.0, 24.0, 23.0, 30.0, 39.0, 29.0, 35.0, 36.0, 40.0, 57.0, 32.0, 46.0, 48.0, 53.0, 44.0, 38.0, 42.0, 25.0, 31.0, 33.0, 30.0, 21.0, 23.0, 20.0, 12.0, 12.0, 12.0, 14.0, 10.0, 7.0, 8.0, 12.0, 5.0, 7.0, 2.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.12860107421875, -40.748653411865234, -39.36870574951172, -37.98876190185547, -36.60881423950195, -35.22886657714844, -33.84891891479492, -32.468971252441406, -31.089025497436523, -29.709077835083008, -28.329132080078125, -26.94918441772461, -25.569236755371094, -24.18929100036621, -22.809343338012695, -21.429397583007812, -20.049449920654297, -18.66950225830078, -17.2895565032959, -15.909608840942383, -14.529662132263184, -13.149715423583984, -11.769767761230469, -10.38982105255127, -9.00987434387207, -7.629927635192871, -6.249980449676514, -4.870033264160156, -3.490086555480957, -2.110139846801758, -0.7301921844482422, 0.649754524230957, 2.029705047607422, 3.4096519947052, 4.7895989418029785, 6.169546127319336, 7.549492835998535, 8.929439544677734, 10.30938720703125, 11.68933391571045, 13.069280624389648, 14.449227333068848, 15.829174041748047, 17.209121704101562, 18.589069366455078, 19.96901512145996, 21.348962783813477, 22.72890853881836, 24.108856201171875, 25.48880386352539, 26.868749618530273, 28.24869728088379, 29.628643035888672, 31.008590698242188, 32.3885383605957, 33.76848602294922, 35.14842987060547, 36.528377532958984, 37.9083251953125, 39.28826904296875, 40.668216705322266, 42.04816436767578, 43.4281120300293, 44.80805969238281, 46.18800735473633]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 2.0, 8.0, 8.0, 7.0, 23.0, 23.0, 19.0, 43.0, 51.0, 56.0, 106.0, 163.0, 260.0, 449.0, 761.0, 1462.0, 2788.0, 5667.0, 12113.0, 25738.0, 55697.0, 111395.0, 185206.0, 227837.0, 190363.0, 116167.0, 58825.0, 27763.0, 12845.0, 5990.0, 3004.0, 1521.0, 879.0, 492.0, 287.0, 190.0, 114.0, 58.0, 59.0, 33.0, 18.0, 20.0, 17.0, 8.0, 6.0, 5.0, 6.0, 4.0, 4.0, 1.0, 1.0], "bins": [-35.59375, -34.61962890625, -33.6455078125, -32.67138671875, -31.697265625, -30.72314453125, -29.7490234375, -28.77490234375, -27.80078125, -26.82666015625, -25.8525390625, -24.87841796875, -23.904296875, -22.93017578125, -21.9560546875, -20.98193359375, -20.0078125, -19.03369140625, -18.0595703125, -17.08544921875, -16.111328125, -15.13720703125, -14.1630859375, -13.18896484375, -12.21484375, -11.24072265625, -10.2666015625, -9.29248046875, -8.318359375, -7.34423828125, -6.3701171875, -5.39599609375, -4.421875, -3.44775390625, -2.4736328125, -1.49951171875, -0.525390625, 0.44873046875, 1.4228515625, 2.39697265625, 3.37109375, 4.34521484375, 5.3193359375, 6.29345703125, 7.267578125, 8.24169921875, 9.2158203125, 10.18994140625, 11.1640625, 12.13818359375, 13.1123046875, 14.08642578125, 15.060546875, 16.03466796875, 17.0087890625, 17.98291015625, 18.95703125, 19.93115234375, 20.9052734375, 21.87939453125, 22.853515625, 23.82763671875, 24.8017578125, 25.77587890625, 26.75]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 3.0, 5.0, 6.0, 8.0, 14.0, 12.0, 11.0, 19.0, 19.0, 23.0, 24.0, 31.0, 41.0, 28.0, 33.0, 35.0, 44.0, 56.0, 35.0, 44.0, 46.0, 58.0, 37.0, 38.0, 45.0, 25.0, 31.0, 30.0, 32.0, 23.0, 20.0, 19.0, 15.0, 12.0, 12.0, 14.0, 8.0, 10.0, 5.0, 12.0, 5.0, 7.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.84375, -40.46435546875, -39.0849609375, -37.70556640625, -36.326171875, -34.94677734375, -33.5673828125, -32.18798828125, -30.80859375, -29.42919921875, -28.0498046875, -26.67041015625, -25.291015625, -23.91162109375, -22.5322265625, -21.15283203125, -19.7734375, -18.39404296875, -17.0146484375, -15.63525390625, -14.255859375, -12.87646484375, -11.4970703125, -10.11767578125, -8.73828125, -7.35888671875, -5.9794921875, -4.60009765625, -3.220703125, -1.84130859375, -0.4619140625, 0.91748046875, 2.296875, 3.67626953125, 5.0556640625, 6.43505859375, 7.814453125, 9.19384765625, 10.5732421875, 11.95263671875, 13.33203125, 14.71142578125, 16.0908203125, 17.47021484375, 18.849609375, 20.22900390625, 21.6083984375, 22.98779296875, 24.3671875, 25.74658203125, 27.1259765625, 28.50537109375, 29.884765625, 31.26416015625, 32.6435546875, 34.02294921875, 35.40234375, 36.78173828125, 38.1611328125, 39.54052734375, 40.919921875, 42.29931640625, 43.6787109375, 45.05810546875, 46.4375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 4.0, 2.0, 8.0, 6.0, 16.0, 28.0, 36.0, 54.0, 81.0, 105.0, 143.0, 195.0, 351.0, 517.0, 790.0, 1204.0, 2033.0, 3615.0, 6615.0, 12831.0, 27476.0, 60026.0, 129522.0, 236801.0, 260048.0, 160593.0, 75891.0, 34353.0, 16421.0, 8065.0, 4285.0, 2463.0, 1372.0, 832.0, 587.0, 346.0, 247.0, 176.0, 119.0, 86.0, 52.0, 38.0, 33.0, 24.0, 14.0, 17.0, 19.0, 7.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-27.1875, -26.2216796875, -25.255859375, -24.2900390625, -23.32421875, -22.3583984375, -21.392578125, -20.4267578125, -19.4609375, -18.4951171875, -17.529296875, -16.5634765625, -15.59765625, -14.6318359375, -13.666015625, -12.7001953125, -11.734375, -10.7685546875, -9.802734375, -8.8369140625, -7.87109375, -6.9052734375, -5.939453125, -4.9736328125, -4.0078125, -3.0419921875, -2.076171875, -1.1103515625, -0.14453125, 0.8212890625, 1.787109375, 2.7529296875, 3.71875, 4.6845703125, 5.650390625, 6.6162109375, 7.58203125, 8.5478515625, 9.513671875, 10.4794921875, 11.4453125, 12.4111328125, 13.376953125, 14.3427734375, 15.30859375, 16.2744140625, 17.240234375, 18.2060546875, 19.171875, 20.1376953125, 21.103515625, 22.0693359375, 23.03515625, 24.0009765625, 24.966796875, 25.9326171875, 26.8984375, 27.8642578125, 28.830078125, 29.7958984375, 30.76171875, 31.7275390625, 32.693359375, 33.6591796875, 34.625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 6.0, 3.0, 5.0, 10.0, 7.0, 11.0, 22.0, 13.0, 15.0, 18.0, 34.0, 32.0, 43.0, 48.0, 37.0, 40.0, 46.0, 49.0, 44.0, 36.0, 34.0, 47.0, 37.0, 37.0, 48.0, 53.0, 42.0, 26.0, 30.0, 20.0, 22.0, 11.0, 13.0, 10.0, 6.0, 7.0, 9.0, 8.0, 5.0, 8.0, 5.0, 3.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.34375, -25.39599609375, -24.4482421875, -23.50048828125, -22.552734375, -21.60498046875, -20.6572265625, -19.70947265625, -18.76171875, -17.81396484375, -16.8662109375, -15.91845703125, -14.970703125, -14.02294921875, -13.0751953125, -12.12744140625, -11.1796875, -10.23193359375, -9.2841796875, -8.33642578125, -7.388671875, -6.44091796875, -5.4931640625, -4.54541015625, -3.59765625, -2.64990234375, -1.7021484375, -0.75439453125, 0.193359375, 1.14111328125, 2.0888671875, 3.03662109375, 3.984375, 4.93212890625, 5.8798828125, 6.82763671875, 7.775390625, 8.72314453125, 9.6708984375, 10.61865234375, 11.56640625, 12.51416015625, 13.4619140625, 14.40966796875, 15.357421875, 16.30517578125, 17.2529296875, 18.20068359375, 19.1484375, 20.09619140625, 21.0439453125, 21.99169921875, 22.939453125, 23.88720703125, 24.8349609375, 25.78271484375, 26.73046875, 27.67822265625, 28.6259765625, 29.57373046875, 30.521484375, 31.46923828125, 32.4169921875, 33.36474609375, 34.3125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 3.0, 10.0, 6.0, 12.0, 23.0, 22.0, 44.0, 60.0, 102.0, 147.0, 193.0, 254.0, 381.0, 536.0, 842.0, 1170.0, 1904.0, 2901.0, 4536.0, 7694.0, 13307.0, 24110.0, 47700.0, 103065.0, 225124.0, 296161.0, 162727.0, 73690.0, 35169.0, 19001.0, 10357.0, 6312.0, 3845.0, 2365.0, 1544.0, 1071.0, 664.0, 459.0, 342.0, 225.0, 154.0, 105.0, 56.0, 47.0, 40.0, 31.0, 15.0, 14.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.5625, -16.0794677734375, -15.596435546875, -15.1134033203125, -14.63037109375, -14.1473388671875, -13.664306640625, -13.1812744140625, -12.6982421875, -12.2152099609375, -11.732177734375, -11.2491455078125, -10.76611328125, -10.2830810546875, -9.800048828125, -9.3170166015625, -8.833984375, -8.3509521484375, -7.867919921875, -7.3848876953125, -6.90185546875, -6.4188232421875, -5.935791015625, -5.4527587890625, -4.9697265625, -4.4866943359375, -4.003662109375, -3.5206298828125, -3.03759765625, -2.5545654296875, -2.071533203125, -1.5885009765625, -1.10546875, -0.6224365234375, -0.139404296875, 0.3436279296875, 0.82666015625, 1.3096923828125, 1.792724609375, 2.2757568359375, 2.7587890625, 3.2418212890625, 3.724853515625, 4.2078857421875, 4.69091796875, 5.1739501953125, 5.656982421875, 6.1400146484375, 6.623046875, 7.1060791015625, 7.589111328125, 8.0721435546875, 8.55517578125, 9.0382080078125, 9.521240234375, 10.0042724609375, 10.4873046875, 10.9703369140625, 11.453369140625, 11.9364013671875, 12.41943359375, 12.9024658203125, 13.385498046875, 13.8685302734375, 14.3515625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 4.0, 4.0, 8.0, 7.0, 11.0, 8.0, 14.0, 13.0, 18.0, 28.0, 27.0, 30.0, 27.0, 30.0, 52.0, 47.0, 53.0, 59.0, 56.0, 60.0, 66.0, 58.0, 61.0, 36.0, 36.0, 25.0, 31.0, 26.0, 18.0, 15.0, 15.0, 17.0, 11.0, 13.0, 6.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007386207580566406, -0.0007161125540733337, -0.0006936043500900269, -0.00067109614610672, -0.0006485879421234131, -0.0006260797381401062, -0.0006035715341567993, -0.0005810633301734924, -0.0005585551261901855, -0.0005360469222068787, -0.0005135387182235718, -0.0004910305142402649, -0.000468522310256958, -0.0004460141062736511, -0.00042350590229034424, -0.00040099769830703735, -0.00037848949432373047, -0.0003559812903404236, -0.0003334730863571167, -0.0003109648823738098, -0.00028845667839050293, -0.00026594847440719604, -0.00024344027042388916, -0.00022093206644058228, -0.0001984238624572754, -0.0001759156584739685, -0.00015340745449066162, -0.00013089925050735474, -0.00010839104652404785, -8.588284254074097e-05, -6.337463855743408e-05, -4.08664345741272e-05, -1.8358230590820312e-05, 4.149973392486572e-06, 2.6658177375793457e-05, 4.916638135910034e-05, 7.167458534240723e-05, 9.418278932571411e-05, 0.000116690993309021, 0.00013919919729232788, 0.00016170740127563477, 0.00018421560525894165, 0.00020672380924224854, 0.00022923201322555542, 0.0002517402172088623, 0.0002742484211921692, 0.0002967566251754761, 0.00031926482915878296, 0.00034177303314208984, 0.00036428123712539673, 0.0003867894411087036, 0.0004092976450920105, 0.0004318058490753174, 0.00045431405305862427, 0.00047682225704193115, 0.000499330461025238, 0.0005218386650085449, 0.0005443468689918518, 0.0005668550729751587, 0.0005893632769584656, 0.0006118714809417725, 0.0006343796849250793, 0.0006568878889083862, 0.0006793960928916931, 0.000701904296875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 8.0, 12.0, 9.0, 28.0, 36.0, 55.0, 92.0, 157.0, 207.0, 367.0, 557.0, 872.0, 1457.0, 2331.0, 3917.0, 6514.0, 11283.0, 19623.0, 34432.0, 59053.0, 97675.0, 145681.0, 177331.0, 168147.0, 125233.0, 80666.0, 47311.0, 27081.0, 15534.0, 9224.0, 5308.0, 3178.0, 1926.0, 1167.0, 790.0, 485.0, 293.0, 176.0, 114.0, 82.0, 50.0, 33.0, 20.0, 20.0, 9.0, 7.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.265625, -17.652587890625, -17.03955078125, -16.426513671875, -15.8134765625, -15.200439453125, -14.58740234375, -13.974365234375, -13.361328125, -12.748291015625, -12.13525390625, -11.522216796875, -10.9091796875, -10.296142578125, -9.68310546875, -9.070068359375, -8.45703125, -7.843994140625, -7.23095703125, -6.617919921875, -6.0048828125, -5.391845703125, -4.77880859375, -4.165771484375, -3.552734375, -2.939697265625, -2.32666015625, -1.713623046875, -1.1005859375, -0.487548828125, 0.12548828125, 0.738525390625, 1.3515625, 1.964599609375, 2.57763671875, 3.190673828125, 3.8037109375, 4.416748046875, 5.02978515625, 5.642822265625, 6.255859375, 6.868896484375, 7.48193359375, 8.094970703125, 8.7080078125, 9.321044921875, 9.93408203125, 10.547119140625, 11.16015625, 11.773193359375, 12.38623046875, 12.999267578125, 13.6123046875, 14.225341796875, 14.83837890625, 15.451416015625, 16.064453125, 16.677490234375, 17.29052734375, 17.903564453125, 18.5166015625, 19.129638671875, 19.74267578125, 20.355712890625, 20.96875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 7.0, 18.0, 9.0, 8.0, 16.0, 24.0, 26.0, 23.0, 33.0, 38.0, 26.0, 45.0, 44.0, 47.0, 54.0, 55.0, 51.0, 50.0, 50.0, 56.0, 48.0, 36.0, 40.0, 33.0, 21.0, 27.0, 23.0, 16.0, 11.0, 18.0, 10.0, 12.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.203125, -6.02398681640625, -5.8448486328125, -5.66571044921875, -5.486572265625, -5.30743408203125, -5.1282958984375, -4.94915771484375, -4.77001953125, -4.59088134765625, -4.4117431640625, -4.23260498046875, -4.053466796875, -3.87432861328125, -3.6951904296875, -3.51605224609375, -3.3369140625, -3.15777587890625, -2.9786376953125, -2.79949951171875, -2.620361328125, -2.44122314453125, -2.2620849609375, -2.08294677734375, -1.90380859375, -1.72467041015625, -1.5455322265625, -1.36639404296875, -1.187255859375, -1.00811767578125, -0.8289794921875, -0.64984130859375, -0.470703125, -0.29156494140625, -0.1124267578125, 0.06671142578125, 0.245849609375, 0.42498779296875, 0.6041259765625, 0.78326416015625, 0.96240234375, 1.14154052734375, 1.3206787109375, 1.49981689453125, 1.678955078125, 1.85809326171875, 2.0372314453125, 2.21636962890625, 2.3955078125, 2.57464599609375, 2.7537841796875, 2.93292236328125, 3.112060546875, 3.29119873046875, 3.4703369140625, 3.64947509765625, 3.82861328125, 4.00775146484375, 4.1868896484375, 4.36602783203125, 4.545166015625, 4.72430419921875, 4.9034423828125, 5.08258056640625, 5.26171875]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 7.0, 4.0, 5.0, 8.0, 6.0, 10.0, 8.0, 4.0, 21.0, 27.0, 28.0, 25.0, 31.0, 32.0, 34.0, 46.0, 39.0, 37.0, 43.0, 40.0, 66.0, 46.0, 39.0, 37.0, 48.0, 34.0, 29.0, 35.0, 41.0, 29.0, 23.0, 25.0, 20.0, 13.0, 14.0, 16.0, 7.0, 11.0, 4.0, 6.0, 3.0, 0.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-45.06380844116211, -43.56110382080078, -42.05839538574219, -40.55569076538086, -39.05298614501953, -37.55027770996094, -36.04757308959961, -34.54486846923828, -33.04216003417969, -31.539453506469727, -30.036746978759766, -28.534042358398438, -27.031335830688477, -25.528629302978516, -24.025924682617188, -22.523218154907227, -21.020511627197266, -19.517805099487305, -18.015098571777344, -16.512393951416016, -15.009687423706055, -13.506980895996094, -12.00427532196045, -10.501569747924805, -8.998863220214844, -7.496157169342041, -5.993451118469238, -4.4907450675964355, -2.988039016723633, -1.48533296585083, 0.017373085021972656, 1.5200786590576172, 3.022785186767578, 4.525491237640381, 6.028197288513184, 7.530903339385986, 9.033609390258789, 10.53631591796875, 12.039021492004395, 13.541727066040039, 15.04443359375, 16.54714012145996, 18.049846649169922, 19.55255126953125, 21.05525779724121, 22.557964324951172, 24.0606689453125, 25.56337547302246, 27.066082000732422, 28.568788528442383, 30.071495056152344, 31.574199676513672, 33.076904296875, 34.579612731933594, 36.08231735229492, 37.58502197265625, 39.087730407714844, 40.59043502807617, 42.093143463134766, 43.595848083496094, 45.09855651855469, 46.601261138916016, 48.103965759277344, 49.60667419433594, 51.109378814697266]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 9.0, 3.0, 12.0, 10.0, 11.0, 14.0, 20.0, 21.0, 18.0, 27.0, 34.0, 29.0, 40.0, 40.0, 39.0, 38.0, 46.0, 45.0, 50.0, 35.0, 50.0, 50.0, 41.0, 35.0, 35.0, 23.0, 33.0, 33.0, 20.0, 19.0, 15.0, 16.0, 10.0, 18.0, 10.0, 9.0, 9.0, 8.0, 6.0, 5.0, 8.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.128089904785156, -40.725746154785156, -39.32340621948242, -37.92106246948242, -36.51872253417969, -35.11637878417969, -33.71403503417969, -32.31169509887695, -30.909353256225586, -29.50701141357422, -28.10466957092285, -26.702327728271484, -25.299983978271484, -23.89764404296875, -22.49530029296875, -21.092958450317383, -19.690616607666016, -18.28827476501465, -16.88593292236328, -15.483590126037598, -14.08124828338623, -12.678906440734863, -11.27656364440918, -9.874221801757812, -8.471879959106445, -7.069538116455078, -5.667195796966553, -4.264853477478027, -2.86251163482666, -1.460169792175293, -0.057826995849609375, 1.3445148468017578, 2.7468605041503906, 4.149202346801758, 5.551544666290283, 6.953886985778809, 8.356228828430176, 9.758570671081543, 11.160913467407227, 12.563255310058594, 13.965597152709961, 15.367938995361328, 16.770280838012695, 18.172622680664062, 19.574966430664062, 20.977306365966797, 22.379650115966797, 23.781991958618164, 25.18433380126953, 26.5866756439209, 27.989017486572266, 29.391361236572266, 30.793701171875, 32.196044921875, 33.598388671875, 35.000728607177734, 36.40306854248047, 37.80541229248047, 39.2077522277832, 40.6100959777832, 42.01243591308594, 43.41477966308594, 44.81712341308594, 46.21946334838867, 47.62180709838867]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 11.0, 21.0, 39.0, 62.0, 97.0, 183.0, 317.0, 438.0, 802.0, 1169.0, 1781.0, 2742.0, 4277.0, 6489.0, 9072.0, 13040.0, 18125.0, 24536.0, 32453.0, 41928.0, 51373.0, 61300.0, 70767.0, 77531.0, 81814.0, 82450.0, 80481.0, 74754.0, 66861.0, 57388.0, 47271.0, 37786.0, 29113.0, 21584.0, 15812.0, 11315.0, 7922.0, 5257.0, 3615.0, 2387.0, 1533.0, 1001.0, 613.0, 405.0, 234.0, 174.0, 96.0, 64.0, 29.0, 22.0, 15.0, 3.0, 3.0, 1.0, 2.0, 3.0], "bins": [-29.8125, -28.9169921875, -28.021484375, -27.1259765625, -26.23046875, -25.3349609375, -24.439453125, -23.5439453125, -22.6484375, -21.7529296875, -20.857421875, -19.9619140625, -19.06640625, -18.1708984375, -17.275390625, -16.3798828125, -15.484375, -14.5888671875, -13.693359375, -12.7978515625, -11.90234375, -11.0068359375, -10.111328125, -9.2158203125, -8.3203125, -7.4248046875, -6.529296875, -5.6337890625, -4.73828125, -3.8427734375, -2.947265625, -2.0517578125, -1.15625, -0.2607421875, 0.634765625, 1.5302734375, 2.42578125, 3.3212890625, 4.216796875, 5.1123046875, 6.0078125, 6.9033203125, 7.798828125, 8.6943359375, 9.58984375, 10.4853515625, 11.380859375, 12.2763671875, 13.171875, 14.0673828125, 14.962890625, 15.8583984375, 16.75390625, 17.6494140625, 18.544921875, 19.4404296875, 20.3359375, 21.2314453125, 22.126953125, 23.0224609375, 23.91796875, 24.8134765625, 25.708984375, 26.6044921875, 27.5]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 6.0, 8.0, 10.0, 12.0, 16.0, 17.0, 23.0, 17.0, 28.0, 37.0, 31.0, 35.0, 44.0, 37.0, 43.0, 45.0, 39.0, 51.0, 37.0, 55.0, 44.0, 38.0, 41.0, 34.0, 23.0, 33.0, 30.0, 22.0, 16.0, 18.0, 14.0, 12.0, 14.0, 12.0, 8.0, 9.0, 8.0, 7.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.5625, -39.2080078125, -37.853515625, -36.4990234375, -35.14453125, -33.7900390625, -32.435546875, -31.0810546875, -29.7265625, -28.3720703125, -27.017578125, -25.6630859375, -24.30859375, -22.9541015625, -21.599609375, -20.2451171875, -18.890625, -17.5361328125, -16.181640625, -14.8271484375, -13.47265625, -12.1181640625, -10.763671875, -9.4091796875, -8.0546875, -6.7001953125, -5.345703125, -3.9912109375, -2.63671875, -1.2822265625, 0.072265625, 1.4267578125, 2.78125, 4.1357421875, 5.490234375, 6.8447265625, 8.19921875, 9.5537109375, 10.908203125, 12.2626953125, 13.6171875, 14.9716796875, 16.326171875, 17.6806640625, 19.03515625, 20.3896484375, 21.744140625, 23.0986328125, 24.453125, 25.8076171875, 27.162109375, 28.5166015625, 29.87109375, 31.2255859375, 32.580078125, 33.9345703125, 35.2890625, 36.6435546875, 37.998046875, 39.3525390625, 40.70703125, 42.0615234375, 43.416015625, 44.7705078125, 46.125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 10.0, 9.0, 14.0, 16.0, 32.0, 40.0, 83.0, 129.0, 193.0, 309.0, 461.0, 715.0, 1101.0, 1664.0, 2670.0, 3914.0, 5915.0, 8168.0, 11802.0, 16326.0, 22148.0, 28989.0, 37135.0, 46542.0, 55946.0, 65013.0, 72698.0, 78151.0, 81060.0, 79610.0, 76131.0, 70147.0, 61659.0, 52167.0, 42558.0, 33544.0, 26091.0, 19606.0, 14259.0, 10039.0, 7042.0, 4785.0, 3252.0, 2286.0, 1518.0, 925.0, 575.0, 430.0, 256.0, 182.0, 88.0, 69.0, 38.0, 18.0, 21.0, 9.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-25.859375, -25.01953125, -24.1796875, -23.33984375, -22.5, -21.66015625, -20.8203125, -19.98046875, -19.140625, -18.30078125, -17.4609375, -16.62109375, -15.78125, -14.94140625, -14.1015625, -13.26171875, -12.421875, -11.58203125, -10.7421875, -9.90234375, -9.0625, -8.22265625, -7.3828125, -6.54296875, -5.703125, -4.86328125, -4.0234375, -3.18359375, -2.34375, -1.50390625, -0.6640625, 0.17578125, 1.015625, 1.85546875, 2.6953125, 3.53515625, 4.375, 5.21484375, 6.0546875, 6.89453125, 7.734375, 8.57421875, 9.4140625, 10.25390625, 11.09375, 11.93359375, 12.7734375, 13.61328125, 14.453125, 15.29296875, 16.1328125, 16.97265625, 17.8125, 18.65234375, 19.4921875, 20.33203125, 21.171875, 22.01171875, 22.8515625, 23.69140625, 24.53125, 25.37109375, 26.2109375, 27.05078125, 27.890625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 6.0, 7.0, 10.0, 9.0, 16.0, 14.0, 19.0, 11.0, 14.0, 25.0, 23.0, 21.0, 23.0, 27.0, 30.0, 43.0, 29.0, 39.0, 42.0, 38.0, 20.0, 29.0, 45.0, 31.0, 39.0, 39.0, 24.0, 36.0, 21.0, 20.0, 28.0, 36.0, 20.0, 20.0, 18.0, 11.0, 15.0, 15.0, 10.0, 14.0, 9.0, 10.0, 13.0, 5.0, 4.0, 4.0, 3.0, 3.0, 5.0, 1.0, 2.0, 0.0, 3.0], "bins": [-24.09375, -23.337158203125, -22.58056640625, -21.823974609375, -21.0673828125, -20.310791015625, -19.55419921875, -18.797607421875, -18.041015625, -17.284423828125, -16.52783203125, -15.771240234375, -15.0146484375, -14.258056640625, -13.50146484375, -12.744873046875, -11.98828125, -11.231689453125, -10.47509765625, -9.718505859375, -8.9619140625, -8.205322265625, -7.44873046875, -6.692138671875, -5.935546875, -5.178955078125, -4.42236328125, -3.665771484375, -2.9091796875, -2.152587890625, -1.39599609375, -0.639404296875, 0.1171875, 0.873779296875, 1.63037109375, 2.386962890625, 3.1435546875, 3.900146484375, 4.65673828125, 5.413330078125, 6.169921875, 6.926513671875, 7.68310546875, 8.439697265625, 9.1962890625, 9.952880859375, 10.70947265625, 11.466064453125, 12.22265625, 12.979248046875, 13.73583984375, 14.492431640625, 15.2490234375, 16.005615234375, 16.76220703125, 17.518798828125, 18.275390625, 19.031982421875, 19.78857421875, 20.545166015625, 21.3017578125, 22.058349609375, 22.81494140625, 23.571533203125, 24.328125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 13.0, 17.0, 21.0, 45.0, 71.0, 93.0, 138.0, 206.0, 359.0, 561.0, 863.0, 1342.0, 2033.0, 3326.0, 4989.0, 7640.0, 11248.0, 16596.0, 23680.0, 32704.0, 44123.0, 57683.0, 70140.0, 82879.0, 91637.0, 95777.0, 93647.0, 87481.0, 77139.0, 63975.0, 50809.0, 38597.0, 28116.0, 19955.0, 13744.0, 9246.0, 6139.0, 4064.0, 2646.0, 1680.0, 1121.0, 720.0, 447.0, 303.0, 185.0, 123.0, 82.0, 57.0, 33.0, 20.0, 14.0, 14.0, 4.0, 6.0, 3.0, 1.0], "bins": [-14.265625, -13.843017578125, -13.42041015625, -12.997802734375, -12.5751953125, -12.152587890625, -11.72998046875, -11.307373046875, -10.884765625, -10.462158203125, -10.03955078125, -9.616943359375, -9.1943359375, -8.771728515625, -8.34912109375, -7.926513671875, -7.50390625, -7.081298828125, -6.65869140625, -6.236083984375, -5.8134765625, -5.390869140625, -4.96826171875, -4.545654296875, -4.123046875, -3.700439453125, -3.27783203125, -2.855224609375, -2.4326171875, -2.010009765625, -1.58740234375, -1.164794921875, -0.7421875, -0.319580078125, 0.10302734375, 0.525634765625, 0.9482421875, 1.370849609375, 1.79345703125, 2.216064453125, 2.638671875, 3.061279296875, 3.48388671875, 3.906494140625, 4.3291015625, 4.751708984375, 5.17431640625, 5.596923828125, 6.01953125, 6.442138671875, 6.86474609375, 7.287353515625, 7.7099609375, 8.132568359375, 8.55517578125, 8.977783203125, 9.400390625, 9.822998046875, 10.24560546875, 10.668212890625, 11.0908203125, 11.513427734375, 11.93603515625, 12.358642578125, 12.78125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 4.0, 6.0, 9.0, 9.0, 14.0, 15.0, 17.0, 22.0, 15.0, 22.0, 25.0, 38.0, 25.0, 41.0, 25.0, 45.0, 44.0, 42.0, 40.0, 40.0, 39.0, 42.0, 38.0, 40.0, 47.0, 36.0, 30.0, 31.0, 31.0, 29.0, 26.0, 14.0, 14.0, 18.0, 15.0, 9.0, 10.0, 6.0, 10.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0016088485717773438, -0.0015544891357421875, -0.0015001296997070312, -0.001445770263671875, -0.0013914108276367188, -0.0013370513916015625, -0.0012826919555664062, -0.00122833251953125, -0.0011739730834960938, -0.0011196136474609375, -0.0010652542114257812, -0.001010894775390625, -0.0009565353393554688, -0.0009021759033203125, -0.0008478164672851562, -0.00079345703125, -0.0007390975952148438, -0.0006847381591796875, -0.0006303787231445312, -0.000576019287109375, -0.0005216598510742188, -0.0004673004150390625, -0.00041294097900390625, -0.00035858154296875, -0.00030422210693359375, -0.0002498626708984375, -0.00019550323486328125, -0.000141143798828125, -8.678436279296875e-05, -3.24249267578125e-05, 2.193450927734375e-05, 7.62939453125e-05, 0.00013065338134765625, 0.0001850128173828125, 0.00023937225341796875, 0.000293731689453125, 0.00034809112548828125, 0.0004024505615234375, 0.00045680999755859375, 0.00051116943359375, 0.0005655288696289062, 0.0006198883056640625, 0.0006742477416992188, 0.000728607177734375, 0.0007829666137695312, 0.0008373260498046875, 0.0008916854858398438, 0.000946044921875, 0.0010004043579101562, 0.0010547637939453125, 0.0011091232299804688, 0.001163482666015625, 0.0012178421020507812, 0.0012722015380859375, 0.0013265609741210938, 0.00138092041015625, 0.0014352798461914062, 0.0014896392822265625, 0.0015439987182617188, 0.001598358154296875, 0.0016527175903320312, 0.0017070770263671875, 0.0017614364624023438, 0.0018157958984375, 0.0018701553344726562]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 12.0, 6.0, 14.0, 24.0, 33.0, 60.0, 90.0, 142.0, 182.0, 330.0, 518.0, 818.0, 1219.0, 1795.0, 3012.0, 4565.0, 7075.0, 11159.0, 16552.0, 24359.0, 34634.0, 47811.0, 62763.0, 78314.0, 91461.0, 100740.0, 103408.0, 99190.0, 87560.0, 73660.0, 57972.0, 43907.0, 31467.0, 21828.0, 14843.0, 9606.0, 6387.0, 4073.0, 2534.0, 1570.0, 1063.0, 623.0, 426.0, 252.0, 160.0, 128.0, 75.0, 29.0, 36.0, 27.0, 16.0, 12.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0], "bins": [-17.375, -16.837890625, -16.30078125, -15.763671875, -15.2265625, -14.689453125, -14.15234375, -13.615234375, -13.078125, -12.541015625, -12.00390625, -11.466796875, -10.9296875, -10.392578125, -9.85546875, -9.318359375, -8.78125, -8.244140625, -7.70703125, -7.169921875, -6.6328125, -6.095703125, -5.55859375, -5.021484375, -4.484375, -3.947265625, -3.41015625, -2.873046875, -2.3359375, -1.798828125, -1.26171875, -0.724609375, -0.1875, 0.349609375, 0.88671875, 1.423828125, 1.9609375, 2.498046875, 3.03515625, 3.572265625, 4.109375, 4.646484375, 5.18359375, 5.720703125, 6.2578125, 6.794921875, 7.33203125, 7.869140625, 8.40625, 8.943359375, 9.48046875, 10.017578125, 10.5546875, 11.091796875, 11.62890625, 12.166015625, 12.703125, 13.240234375, 13.77734375, 14.314453125, 14.8515625, 15.388671875, 15.92578125, 16.462890625, 17.0]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 7.0, 8.0, 5.0, 13.0, 13.0, 13.0, 19.0, 14.0, 14.0, 20.0, 28.0, 40.0, 35.0, 36.0, 40.0, 41.0, 37.0, 50.0, 49.0, 52.0, 40.0, 50.0, 46.0, 48.0, 51.0, 33.0, 26.0, 18.0, 22.0, 22.0, 18.0, 12.0, 16.0, 10.0, 12.0, 5.0, 7.0, 9.0, 5.0, 8.0, 0.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-8.5703125, -8.3048095703125, -8.039306640625, -7.7738037109375, -7.50830078125, -7.2427978515625, -6.977294921875, -6.7117919921875, -6.4462890625, -6.1807861328125, -5.915283203125, -5.6497802734375, -5.38427734375, -5.1187744140625, -4.853271484375, -4.5877685546875, -4.322265625, -4.0567626953125, -3.791259765625, -3.5257568359375, -3.26025390625, -2.9947509765625, -2.729248046875, -2.4637451171875, -2.1982421875, -1.9327392578125, -1.667236328125, -1.4017333984375, -1.13623046875, -0.8707275390625, -0.605224609375, -0.3397216796875, -0.07421875, 0.1912841796875, 0.456787109375, 0.7222900390625, 0.98779296875, 1.2532958984375, 1.518798828125, 1.7843017578125, 2.0498046875, 2.3153076171875, 2.580810546875, 2.8463134765625, 3.11181640625, 3.3773193359375, 3.642822265625, 3.9083251953125, 4.173828125, 4.4393310546875, 4.704833984375, 4.9703369140625, 5.23583984375, 5.5013427734375, 5.766845703125, 6.0323486328125, 6.2978515625, 6.5633544921875, 6.828857421875, 7.0943603515625, 7.35986328125, 7.6253662109375, 7.890869140625, 8.1563720703125, 8.421875]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 2.0, 11.0, 14.0, 13.0, 15.0, 16.0, 22.0, 26.0, 28.0, 24.0, 55.0, 30.0, 41.0, 40.0, 40.0, 47.0, 48.0, 36.0, 33.0, 43.0, 42.0, 40.0, 37.0, 40.0, 28.0, 16.0, 33.0, 29.0, 31.0, 19.0, 25.0, 11.0, 12.0, 13.0, 7.0, 6.0, 3.0, 6.0, 7.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-44.92041778564453, -43.47650909423828, -42.0326042175293, -40.58869552612305, -39.1447868347168, -37.70087814331055, -36.25697326660156, -34.81306457519531, -33.36915588378906, -31.925249099731445, -30.481340408325195, -29.037433624267578, -27.593524932861328, -26.14961814880371, -24.705711364746094, -23.261802673339844, -21.817895889282227, -20.37398910522461, -18.93008041381836, -17.486173629760742, -16.042264938354492, -14.598358154296875, -13.154450416564941, -11.710542678833008, -10.266634941101074, -8.82272720336914, -7.378819465637207, -5.934912204742432, -4.491004467010498, -3.0470967292785645, -1.603189468383789, -0.15928173065185547, 1.2846260070800781, 2.7285337448120117, 4.172441482543945, 5.616348743438721, 7.060256481170654, 8.50416374206543, 9.948071479797363, 11.391979217529297, 12.83588695526123, 14.279794692993164, 15.723702430725098, 17.16761016845703, 18.61151695251465, 20.0554256439209, 21.499332427978516, 22.943241119384766, 24.387147903442383, 25.8310546875, 27.27496337890625, 28.718870162963867, 30.162778854370117, 31.606685638427734, 33.050594329833984, 34.49449920654297, 35.93840789794922, 37.38231658935547, 38.82622146606445, 40.2701301574707, 41.71403884887695, 43.1579475402832, 44.60185241699219, 46.04576110839844, 47.48966979980469]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 2.0, 8.0, 5.0, 10.0, 9.0, 13.0, 14.0, 8.0, 23.0, 22.0, 27.0, 29.0, 25.0, 30.0, 26.0, 23.0, 44.0, 21.0, 49.0, 45.0, 34.0, 45.0, 47.0, 42.0, 47.0, 35.0, 29.0, 32.0, 24.0, 34.0, 23.0, 24.0, 18.0, 18.0, 17.0, 16.0, 14.0, 10.0, 9.0, 10.0, 6.0, 7.0, 3.0, 7.0, 2.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-42.56993865966797, -41.2236213684082, -39.87730407714844, -38.530982971191406, -37.18466567993164, -35.838348388671875, -34.492027282714844, -33.14570999145508, -31.799392700195312, -30.453075408935547, -29.10675621032715, -27.76043701171875, -26.414119720458984, -25.06780242919922, -23.72148323059082, -22.375164031982422, -21.028846740722656, -19.68252944946289, -18.336210250854492, -16.989891052246094, -15.643573760986328, -14.297255516052246, -12.950937271118164, -11.604619026184082, -10.25830078125, -8.911982536315918, -7.565664291381836, -6.219346046447754, -4.873027801513672, -3.52670955657959, -2.180391311645508, -0.8340730667114258, 0.5122413635253906, 1.8585596084594727, 3.2048778533935547, 4.551196098327637, 5.897514343261719, 7.243832588195801, 8.590150833129883, 9.936469078063965, 11.282787322998047, 12.629105567932129, 13.975423812866211, 15.321742057800293, 16.668060302734375, 18.01437759399414, 19.36069679260254, 20.707015991210938, 22.053333282470703, 23.39965057373047, 24.745969772338867, 26.092288970947266, 27.43860626220703, 28.784923553466797, 30.131242752075195, 31.477561950683594, 32.82387924194336, 34.170196533203125, 35.516517639160156, 36.86283493041992, 38.20915222167969, 39.55546951293945, 40.90178680419922, 42.24810791015625, 43.594425201416016]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 13.0, 21.0, 38.0, 60.0, 100.0, 174.0, 296.0, 508.0, 894.0, 1466.0, 2624.0, 4396.0, 7132.0, 11816.0, 18709.0, 29483.0, 44674.0, 66779.0, 96969.0, 136621.0, 184058.0, 238704.0, 293091.0, 341689.0, 376760.0, 390350.0, 382224.0, 351269.0, 304728.0, 250363.0, 196417.0, 146504.0, 105650.0, 73881.0, 49015.0, 32889.0, 20627.0, 13125.0, 7907.0, 5070.0, 2943.0, 1780.0, 976.0, 595.0, 390.0, 217.0, 134.0, 70.0, 39.0, 25.0, 11.0, 6.0, 3.0, 5.0, 3.0], "bins": [-35.5625, -34.53515625, -33.5078125, -32.48046875, -31.453125, -30.42578125, -29.3984375, -28.37109375, -27.34375, -26.31640625, -25.2890625, -24.26171875, -23.234375, -22.20703125, -21.1796875, -20.15234375, -19.125, -18.09765625, -17.0703125, -16.04296875, -15.015625, -13.98828125, -12.9609375, -11.93359375, -10.90625, -9.87890625, -8.8515625, -7.82421875, -6.796875, -5.76953125, -4.7421875, -3.71484375, -2.6875, -1.66015625, -0.6328125, 0.39453125, 1.421875, 2.44921875, 3.4765625, 4.50390625, 5.53125, 6.55859375, 7.5859375, 8.61328125, 9.640625, 10.66796875, 11.6953125, 12.72265625, 13.75, 14.77734375, 15.8046875, 16.83203125, 17.859375, 18.88671875, 19.9140625, 20.94140625, 21.96875, 22.99609375, 24.0234375, 25.05078125, 26.078125, 27.10546875, 28.1328125, 29.16015625, 30.1875]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 8.0, 5.0, 10.0, 10.0, 9.0, 15.0, 12.0, 23.0, 25.0, 21.0, 32.0, 30.0, 26.0, 24.0, 26.0, 40.0, 34.0, 41.0, 44.0, 37.0, 40.0, 49.0, 46.0, 47.0, 32.0, 31.0, 35.0, 18.0, 34.0, 26.0, 20.0, 19.0, 22.0, 13.0, 15.0, 14.0, 5.0, 13.0, 8.0, 8.0, 6.0, 2.0, 7.0, 3.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-39.21875, -37.9658203125, -36.712890625, -35.4599609375, -34.20703125, -32.9541015625, -31.701171875, -30.4482421875, -29.1953125, -27.9423828125, -26.689453125, -25.4365234375, -24.18359375, -22.9306640625, -21.677734375, -20.4248046875, -19.171875, -17.9189453125, -16.666015625, -15.4130859375, -14.16015625, -12.9072265625, -11.654296875, -10.4013671875, -9.1484375, -7.8955078125, -6.642578125, -5.3896484375, -4.13671875, -2.8837890625, -1.630859375, -0.3779296875, 0.875, 2.1279296875, 3.380859375, 4.6337890625, 5.88671875, 7.1396484375, 8.392578125, 9.6455078125, 10.8984375, 12.1513671875, 13.404296875, 14.6572265625, 15.91015625, 17.1630859375, 18.416015625, 19.6689453125, 20.921875, 22.1748046875, 23.427734375, 24.6806640625, 25.93359375, 27.1865234375, 28.439453125, 29.6923828125, 30.9453125, 32.1982421875, 33.451171875, 34.7041015625, 35.95703125, 37.2099609375, 38.462890625, 39.7158203125, 40.96875]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 12.0, 16.0, 33.0, 67.0, 118.0, 205.0, 351.0, 645.0, 1254.0, 2143.0, 3637.0, 6330.0, 10763.0, 17837.0, 28675.0, 45596.0, 69505.0, 102683.0, 144563.0, 196542.0, 253359.0, 310438.0, 357516.0, 389956.0, 399203.0, 385385.0, 347778.0, 297407.0, 240534.0, 184377.0, 134203.0, 93529.0, 63500.0, 41216.0, 26103.0, 15948.0, 9632.0, 5659.0, 3261.0, 1864.0, 1090.0, 624.0, 342.0, 193.0, 100.0, 42.0, 27.0, 13.0, 11.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.6875, -35.5546875, -34.421875, -33.2890625, -32.15625, -31.0234375, -29.890625, -28.7578125, -27.625, -26.4921875, -25.359375, -24.2265625, -23.09375, -21.9609375, -20.828125, -19.6953125, -18.5625, -17.4296875, -16.296875, -15.1640625, -14.03125, -12.8984375, -11.765625, -10.6328125, -9.5, -8.3671875, -7.234375, -6.1015625, -4.96875, -3.8359375, -2.703125, -1.5703125, -0.4375, 0.6953125, 1.828125, 2.9609375, 4.09375, 5.2265625, 6.359375, 7.4921875, 8.625, 9.7578125, 10.890625, 12.0234375, 13.15625, 14.2890625, 15.421875, 16.5546875, 17.6875, 18.8203125, 19.953125, 21.0859375, 22.21875, 23.3515625, 24.484375, 25.6171875, 26.75, 27.8828125, 29.015625, 30.1484375, 31.28125, 32.4140625, 33.546875, 34.6796875, 35.8125]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 8.0, 5.0, 10.0, 14.0, 21.0, 27.0, 40.0, 47.0, 74.0, 95.0, 126.0, 97.0, 146.0, 129.0, 175.0, 169.0, 204.0, 215.0, 228.0, 221.0, 230.0, 260.0, 220.0, 194.0, 190.0, 169.0, 140.0, 115.0, 110.0, 79.0, 66.0, 70.0, 48.0, 47.0, 28.0, 28.0, 8.0, 5.0, 12.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.859375, -18.157958984375, -17.45654296875, -16.755126953125, -16.0537109375, -15.352294921875, -14.65087890625, -13.949462890625, -13.248046875, -12.546630859375, -11.84521484375, -11.143798828125, -10.4423828125, -9.740966796875, -9.03955078125, -8.338134765625, -7.63671875, -6.935302734375, -6.23388671875, -5.532470703125, -4.8310546875, -4.129638671875, -3.42822265625, -2.726806640625, -2.025390625, -1.323974609375, -0.62255859375, 0.078857421875, 0.7802734375, 1.481689453125, 2.18310546875, 2.884521484375, 3.5859375, 4.287353515625, 4.98876953125, 5.690185546875, 6.3916015625, 7.093017578125, 7.79443359375, 8.495849609375, 9.197265625, 9.898681640625, 10.60009765625, 11.301513671875, 12.0029296875, 12.704345703125, 13.40576171875, 14.107177734375, 14.80859375, 15.510009765625, 16.21142578125, 16.912841796875, 17.6142578125, 18.315673828125, 19.01708984375, 19.718505859375, 20.419921875, 21.121337890625, 21.82275390625, 22.524169921875, 23.2255859375, 23.927001953125, 24.62841796875, 25.329833984375, 26.03125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 4.0, 10.0, 8.0, 11.0, 13.0, 16.0, 24.0, 7.0, 21.0, 31.0, 37.0, 45.0, 36.0, 39.0, 47.0, 41.0, 50.0, 51.0, 55.0, 44.0, 47.0, 46.0, 45.0, 46.0, 35.0, 31.0, 17.0, 23.0, 16.0, 17.0, 19.0, 13.0, 12.0, 10.0, 8.0, 7.0, 5.0, 5.0, 3.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.83346176147461, -46.1873779296875, -44.541290283203125, -42.895206451416016, -41.249122619628906, -39.60303497314453, -37.95695114135742, -36.31086730957031, -34.66477966308594, -33.01869583129883, -31.372610092163086, -29.726524353027344, -28.0804386138916, -26.43435287475586, -24.78826904296875, -23.142183303833008, -21.4960994720459, -19.850013732910156, -18.203929901123047, -16.557844161987305, -14.911758422851562, -13.265673637390137, -11.619588851928711, -9.973503112792969, -8.327418327331543, -6.681333065032959, -5.035247802734375, -3.389163017272949, -1.7430777549743652, -0.09699249267578125, 1.5490922927856445, 3.1951780319213867, 4.8412628173828125, 6.4873480796813965, 8.13343334197998, 9.779518127441406, 11.425603866577148, 13.071688652038574, 14.7177734375, 16.363859176635742, 18.009944915771484, 19.656030654907227, 21.302114486694336, 22.948200225830078, 24.59428596496582, 26.240371704101562, 27.886455535888672, 29.532541275024414, 31.178625106811523, 32.824710845947266, 34.470794677734375, 36.11688232421875, 37.76296615600586, 39.40904998779297, 41.055137634277344, 42.70122146606445, 44.34730529785156, 45.99338912963867, 47.63947677612305, 49.285560607910156, 50.931644439697266, 52.57773208618164, 54.22381591796875, 55.869903564453125, 57.515987396240234]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 4.0, 11.0, 4.0, 9.0, 6.0, 10.0, 18.0, 12.0, 20.0, 26.0, 21.0, 16.0, 33.0, 32.0, 35.0, 20.0, 30.0, 29.0, 43.0, 41.0, 34.0, 49.0, 43.0, 30.0, 40.0, 40.0, 30.0, 36.0, 29.0, 27.0, 24.0, 25.0, 19.0, 19.0, 17.0, 18.0, 14.0, 14.0, 7.0, 16.0, 9.0, 11.0, 4.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-40.360687255859375, -38.97404479980469, -37.58740234375, -36.20075988769531, -34.814117431640625, -33.42747497558594, -32.04083251953125, -30.654191970825195, -29.267549514770508, -27.88090705871582, -26.494264602661133, -25.107624053955078, -23.72098159790039, -22.334339141845703, -20.947696685791016, -19.561054229736328, -18.17441177368164, -16.787769317626953, -15.401126861572266, -14.014485359191895, -12.627842903137207, -11.24120044708252, -9.854558944702148, -8.467916488647461, -7.081274032592773, -5.694631576538086, -4.307989597320557, -2.9213476181030273, -1.5347051620483398, -0.14806270599365234, 1.2385787963867188, 2.6252212524414062, 4.011863708496094, 5.398506164550781, 6.7851481437683105, 8.17179012298584, 9.558432579040527, 10.945075035095215, 12.331716537475586, 13.718358993530273, 15.105001449584961, 16.49164390563965, 17.878286361694336, 19.26492691040039, 20.651569366455078, 22.038211822509766, 23.424854278564453, 24.81149673461914, 26.198139190673828, 27.584781646728516, 28.971424102783203, 30.35806655883789, 31.744709014892578, 33.131351470947266, 34.51799011230469, 35.904632568359375, 37.29127502441406, 38.67791748046875, 40.06455993652344, 41.451202392578125, 42.83784484863281, 44.2244873046875, 45.61112976074219, 46.997772216796875, 48.38441467285156]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 9.0, 6.0, 16.0, 23.0, 39.0, 44.0, 58.0, 90.0, 131.0, 192.0, 311.0, 482.0, 741.0, 1241.0, 2034.0, 3412.0, 5733.0, 9939.0, 16620.0, 28077.0, 45822.0, 70478.0, 101233.0, 131025.0, 147325.0, 140903.0, 115228.0, 83881.0, 55910.0, 35097.0, 21222.0, 12766.0, 7405.0, 4372.0, 2562.0, 1516.0, 970.0, 568.0, 387.0, 226.0, 150.0, 102.0, 73.0, 53.0, 25.0, 24.0, 16.0, 9.0, 5.0, 5.0, 1.0, 4.0, 2.0, 3.0, 1.0], "bins": [-21.984375, -21.33251953125, -20.6806640625, -20.02880859375, -19.376953125, -18.72509765625, -18.0732421875, -17.42138671875, -16.76953125, -16.11767578125, -15.4658203125, -14.81396484375, -14.162109375, -13.51025390625, -12.8583984375, -12.20654296875, -11.5546875, -10.90283203125, -10.2509765625, -9.59912109375, -8.947265625, -8.29541015625, -7.6435546875, -6.99169921875, -6.33984375, -5.68798828125, -5.0361328125, -4.38427734375, -3.732421875, -3.08056640625, -2.4287109375, -1.77685546875, -1.125, -0.47314453125, 0.1787109375, 0.83056640625, 1.482421875, 2.13427734375, 2.7861328125, 3.43798828125, 4.08984375, 4.74169921875, 5.3935546875, 6.04541015625, 6.697265625, 7.34912109375, 8.0009765625, 8.65283203125, 9.3046875, 9.95654296875, 10.6083984375, 11.26025390625, 11.912109375, 12.56396484375, 13.2158203125, 13.86767578125, 14.51953125, 15.17138671875, 15.8232421875, 16.47509765625, 17.126953125, 17.77880859375, 18.4306640625, 19.08251953125, 19.734375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 5.0, 2.0, 3.0, 4.0, 12.0, 4.0, 7.0, 4.0, 12.0, 17.0, 15.0, 16.0, 26.0, 22.0, 17.0, 33.0, 34.0, 33.0, 22.0, 26.0, 32.0, 41.0, 42.0, 33.0, 51.0, 42.0, 31.0, 42.0, 39.0, 29.0, 39.0, 28.0, 24.0, 27.0, 23.0, 19.0, 20.0, 18.0, 19.0, 12.0, 14.0, 7.0, 17.0, 8.0, 11.0, 4.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-40.34375, -38.955078125, -37.56640625, -36.177734375, -34.7890625, -33.400390625, -32.01171875, -30.623046875, -29.234375, -27.845703125, -26.45703125, -25.068359375, -23.6796875, -22.291015625, -20.90234375, -19.513671875, -18.125, -16.736328125, -15.34765625, -13.958984375, -12.5703125, -11.181640625, -9.79296875, -8.404296875, -7.015625, -5.626953125, -4.23828125, -2.849609375, -1.4609375, -0.072265625, 1.31640625, 2.705078125, 4.09375, 5.482421875, 6.87109375, 8.259765625, 9.6484375, 11.037109375, 12.42578125, 13.814453125, 15.203125, 16.591796875, 17.98046875, 19.369140625, 20.7578125, 22.146484375, 23.53515625, 24.923828125, 26.3125, 27.701171875, 29.08984375, 30.478515625, 31.8671875, 33.255859375, 34.64453125, 36.033203125, 37.421875, 38.810546875, 40.19921875, 41.587890625, 42.9765625, 44.365234375, 45.75390625, 47.142578125, 48.53125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 12.0, 6.0, 10.0, 19.0, 29.0, 32.0, 46.0, 65.0, 100.0, 176.0, 219.0, 322.0, 566.0, 865.0, 1548.0, 2604.0, 4389.0, 7830.0, 15132.0, 29292.0, 57575.0, 111696.0, 188563.0, 231944.0, 179690.0, 103094.0, 53605.0, 27076.0, 14127.0, 7523.0, 4175.0, 2367.0, 1443.0, 819.0, 530.0, 329.0, 235.0, 159.0, 100.0, 79.0, 47.0, 34.0, 21.0, 20.0, 11.0, 8.0, 5.0, 2.0, 5.0, 2.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-25.734375, -24.8603515625, -23.986328125, -23.1123046875, -22.23828125, -21.3642578125, -20.490234375, -19.6162109375, -18.7421875, -17.8681640625, -16.994140625, -16.1201171875, -15.24609375, -14.3720703125, -13.498046875, -12.6240234375, -11.75, -10.8759765625, -10.001953125, -9.1279296875, -8.25390625, -7.3798828125, -6.505859375, -5.6318359375, -4.7578125, -3.8837890625, -3.009765625, -2.1357421875, -1.26171875, -0.3876953125, 0.486328125, 1.3603515625, 2.234375, 3.1083984375, 3.982421875, 4.8564453125, 5.73046875, 6.6044921875, 7.478515625, 8.3525390625, 9.2265625, 10.1005859375, 10.974609375, 11.8486328125, 12.72265625, 13.5966796875, 14.470703125, 15.3447265625, 16.21875, 17.0927734375, 17.966796875, 18.8408203125, 19.71484375, 20.5888671875, 21.462890625, 22.3369140625, 23.2109375, 24.0849609375, 24.958984375, 25.8330078125, 26.70703125, 27.5810546875, 28.455078125, 29.3291015625, 30.203125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 4.0, 6.0, 2.0, 2.0, 4.0, 10.0, 8.0, 10.0, 13.0, 25.0, 13.0, 30.0, 31.0, 42.0, 32.0, 30.0, 37.0, 32.0, 46.0, 37.0, 46.0, 61.0, 42.0, 45.0, 40.0, 40.0, 34.0, 31.0, 40.0, 29.0, 20.0, 36.0, 22.0, 24.0, 15.0, 19.0, 15.0, 8.0, 10.0, 4.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.53125, -31.46875, -30.40625, -29.34375, -28.28125, -27.21875, -26.15625, -25.09375, -24.03125, -22.96875, -21.90625, -20.84375, -19.78125, -18.71875, -17.65625, -16.59375, -15.53125, -14.46875, -13.40625, -12.34375, -11.28125, -10.21875, -9.15625, -8.09375, -7.03125, -5.96875, -4.90625, -3.84375, -2.78125, -1.71875, -0.65625, 0.40625, 1.46875, 2.53125, 3.59375, 4.65625, 5.71875, 6.78125, 7.84375, 8.90625, 9.96875, 11.03125, 12.09375, 13.15625, 14.21875, 15.28125, 16.34375, 17.40625, 18.46875, 19.53125, 20.59375, 21.65625, 22.71875, 23.78125, 24.84375, 25.90625, 26.96875, 28.03125, 29.09375, 30.15625, 31.21875, 32.28125, 33.34375, 34.40625, 35.46875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 9.0, 10.0, 15.0, 20.0, 16.0, 43.0, 52.0, 103.0, 137.0, 177.0, 268.0, 433.0, 653.0, 1030.0, 1581.0, 2499.0, 3998.0, 6609.0, 11481.0, 20885.0, 39819.0, 83119.0, 180948.0, 296990.0, 204414.0, 93993.0, 44802.0, 23214.0, 12272.0, 7200.0, 4374.0, 2674.0, 1706.0, 1060.0, 663.0, 433.0, 304.0, 188.0, 118.0, 68.0, 61.0, 47.0, 27.0, 13.0, 10.0, 9.0, 8.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.1953125, -14.6983642578125, -14.201416015625, -13.7044677734375, -13.20751953125, -12.7105712890625, -12.213623046875, -11.7166748046875, -11.2197265625, -10.7227783203125, -10.225830078125, -9.7288818359375, -9.23193359375, -8.7349853515625, -8.238037109375, -7.7410888671875, -7.244140625, -6.7471923828125, -6.250244140625, -5.7532958984375, -5.25634765625, -4.7593994140625, -4.262451171875, -3.7655029296875, -3.2685546875, -2.7716064453125, -2.274658203125, -1.7777099609375, -1.28076171875, -0.7838134765625, -0.286865234375, 0.2100830078125, 0.70703125, 1.2039794921875, 1.700927734375, 2.1978759765625, 2.69482421875, 3.1917724609375, 3.688720703125, 4.1856689453125, 4.6826171875, 5.1795654296875, 5.676513671875, 6.1734619140625, 6.67041015625, 7.1673583984375, 7.664306640625, 8.1612548828125, 8.658203125, 9.1551513671875, 9.652099609375, 10.1490478515625, 10.64599609375, 11.1429443359375, 11.639892578125, 12.1368408203125, 12.6337890625, 13.1307373046875, 13.627685546875, 14.1246337890625, 14.62158203125, 15.1185302734375, 15.615478515625, 16.1124267578125, 16.609375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 1.0, 7.0, 9.0, 13.0, 15.0, 27.0, 24.0, 28.0, 26.0, 31.0, 52.0, 42.0, 54.0, 72.0, 66.0, 63.0, 58.0, 79.0, 45.0, 51.0, 45.0, 37.0, 32.0, 29.0, 21.0, 20.0, 15.0, 10.0, 5.0, 7.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008072853088378906, -0.0007821023464202881, -0.0007569193840026855, -0.000731736421585083, -0.0007065534591674805, -0.0006813704967498779, -0.0006561875343322754, -0.0006310045719146729, -0.0006058216094970703, -0.0005806386470794678, -0.0005554556846618652, -0.0005302727222442627, -0.0005050897598266602, -0.0004799067974090576, -0.0004547238349914551, -0.00042954087257385254, -0.00040435791015625, -0.00037917494773864746, -0.0003539919853210449, -0.0003288090229034424, -0.00030362606048583984, -0.0002784430980682373, -0.00025326013565063477, -0.00022807717323303223, -0.0002028942108154297, -0.00017771124839782715, -0.0001525282859802246, -0.00012734532356262207, -0.00010216236114501953, -7.697939872741699e-05, -5.179643630981445e-05, -2.6613473892211914e-05, -1.430511474609375e-06, 2.3752450942993164e-05, 4.89354133605957e-05, 7.411837577819824e-05, 9.930133819580078e-05, 0.00012448430061340332, 0.00014966726303100586, 0.0001748502254486084, 0.00020003318786621094, 0.00022521615028381348, 0.000250399112701416, 0.00027558207511901855, 0.0003007650375366211, 0.00032594799995422363, 0.00035113096237182617, 0.0003763139247894287, 0.00040149688720703125, 0.0004266798496246338, 0.00045186281204223633, 0.00047704577445983887, 0.0005022287368774414, 0.0005274116992950439, 0.0005525946617126465, 0.000577777624130249, 0.0006029605865478516, 0.0006281435489654541, 0.0006533265113830566, 0.0006785094738006592, 0.0007036924362182617, 0.0007288753986358643, 0.0007540583610534668, 0.0007792413234710693, 0.0008044242858886719]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 5.0, 4.0, 16.0, 20.0, 21.0, 35.0, 58.0, 87.0, 135.0, 239.0, 309.0, 513.0, 851.0, 1292.0, 2176.0, 3651.0, 5864.0, 9328.0, 15201.0, 24446.0, 39426.0, 61976.0, 94849.0, 131502.0, 156083.0, 151589.0, 120801.0, 84060.0, 54609.0, 33630.0, 21252.0, 13053.0, 8232.0, 5082.0, 3101.0, 1932.0, 1190.0, 747.0, 430.0, 293.0, 162.0, 108.0, 79.0, 47.0, 26.0, 14.0, 15.0, 8.0, 4.0, 4.0, 5.0, 4.0, 0.0, 3.0, 0.0, 1.0], "bins": [-18.421875, -17.861083984375, -17.30029296875, -16.739501953125, -16.1787109375, -15.617919921875, -15.05712890625, -14.496337890625, -13.935546875, -13.374755859375, -12.81396484375, -12.253173828125, -11.6923828125, -11.131591796875, -10.57080078125, -10.010009765625, -9.44921875, -8.888427734375, -8.32763671875, -7.766845703125, -7.2060546875, -6.645263671875, -6.08447265625, -5.523681640625, -4.962890625, -4.402099609375, -3.84130859375, -3.280517578125, -2.7197265625, -2.158935546875, -1.59814453125, -1.037353515625, -0.4765625, 0.084228515625, 0.64501953125, 1.205810546875, 1.7666015625, 2.327392578125, 2.88818359375, 3.448974609375, 4.009765625, 4.570556640625, 5.13134765625, 5.692138671875, 6.2529296875, 6.813720703125, 7.37451171875, 7.935302734375, 8.49609375, 9.056884765625, 9.61767578125, 10.178466796875, 10.7392578125, 11.300048828125, 11.86083984375, 12.421630859375, 12.982421875, 13.543212890625, 14.10400390625, 14.664794921875, 15.2255859375, 15.786376953125, 16.34716796875, 16.907958984375, 17.46875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 5.0, 4.0, 5.0, 6.0, 9.0, 12.0, 15.0, 23.0, 7.0, 21.0, 22.0, 32.0, 31.0, 28.0, 32.0, 34.0, 39.0, 35.0, 49.0, 47.0, 58.0, 48.0, 46.0, 48.0, 35.0, 35.0, 36.0, 30.0, 34.0, 22.0, 25.0, 18.0, 8.0, 12.0, 16.0, 7.0, 6.0, 6.0, 8.0, 8.0, 9.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-6.3828125, -6.18646240234375, -5.9901123046875, -5.79376220703125, -5.597412109375, -5.40106201171875, -5.2047119140625, -5.00836181640625, -4.81201171875, -4.61566162109375, -4.4193115234375, -4.22296142578125, -4.026611328125, -3.83026123046875, -3.6339111328125, -3.43756103515625, -3.2412109375, -3.04486083984375, -2.8485107421875, -2.65216064453125, -2.455810546875, -2.25946044921875, -2.0631103515625, -1.86676025390625, -1.67041015625, -1.47406005859375, -1.2777099609375, -1.08135986328125, -0.885009765625, -0.68865966796875, -0.4923095703125, -0.29595947265625, -0.099609375, 0.09674072265625, 0.2930908203125, 0.48944091796875, 0.685791015625, 0.88214111328125, 1.0784912109375, 1.27484130859375, 1.47119140625, 1.66754150390625, 1.8638916015625, 2.06024169921875, 2.256591796875, 2.45294189453125, 2.6492919921875, 2.84564208984375, 3.0419921875, 3.23834228515625, 3.4346923828125, 3.63104248046875, 3.827392578125, 4.02374267578125, 4.2200927734375, 4.41644287109375, 4.61279296875, 4.80914306640625, 5.0054931640625, 5.20184326171875, 5.398193359375, 5.59454345703125, 5.7908935546875, 5.98724365234375, 6.18359375]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 2.0, 5.0, 8.0, 6.0, 3.0, 11.0, 9.0, 15.0, 10.0, 15.0, 19.0, 16.0, 22.0, 36.0, 42.0, 41.0, 27.0, 40.0, 46.0, 50.0, 39.0, 47.0, 56.0, 37.0, 43.0, 46.0, 50.0, 23.0, 38.0, 28.0, 32.0, 12.0, 22.0, 14.0, 15.0, 16.0, 10.0, 7.0, 8.0, 12.0, 8.0, 8.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-43.74151611328125, -42.22362518310547, -40.70573425292969, -39.18784713745117, -37.66995620727539, -36.15206527709961, -34.634178161621094, -33.11628723144531, -31.59839630126953, -30.08050537109375, -28.5626163482666, -27.044727325439453, -25.526836395263672, -24.00894546508789, -22.491056442260742, -20.973167419433594, -19.455276489257812, -17.93738555908203, -16.419496536254883, -14.901606559753418, -13.383716583251953, -11.865826606750488, -10.347936630249023, -8.830046653747559, -7.312156677246094, -5.794266700744629, -4.276376724243164, -2.758486747741699, -1.2405967712402344, 0.27729320526123047, 1.7951831817626953, 3.31307315826416, 4.830963134765625, 6.34885311126709, 7.866743087768555, 9.38463306427002, 10.902523040771484, 12.42041301727295, 13.938302993774414, 15.456192970275879, 16.974082946777344, 18.491973876953125, 20.009862899780273, 21.527751922607422, 23.045642852783203, 24.563533782958984, 26.081422805786133, 27.59931182861328, 29.117202758789062, 30.635093688964844, 32.152984619140625, 33.67087173461914, 35.18876266479492, 36.7066535949707, 38.22454071044922, 39.742431640625, 41.26032257080078, 42.77821350097656, 44.296104431152344, 45.81399154663086, 47.33188247680664, 48.84977340698242, 50.36766052246094, 51.88555145263672, 53.4034423828125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 5.0, 3.0, 2.0, 6.0, 6.0, 6.0, 7.0, 4.0, 11.0, 13.0, 10.0, 23.0, 24.0, 14.0, 29.0, 23.0, 26.0, 25.0, 26.0, 24.0, 38.0, 31.0, 41.0, 31.0, 41.0, 45.0, 47.0, 34.0, 35.0, 32.0, 40.0, 36.0, 26.0, 29.0, 26.0, 23.0, 19.0, 19.0, 15.0, 14.0, 21.0, 12.0, 9.0, 14.0, 13.0, 4.0, 6.0, 0.0, 6.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0], "bins": [-41.411251068115234, -40.02577209472656, -38.64029312133789, -37.25481414794922, -35.86933135986328, -34.48385238647461, -33.09837341308594, -31.712894439697266, -30.32741355895996, -28.94193458557129, -27.556453704833984, -26.170974731445312, -24.78549575805664, -23.400014877319336, -22.014535903930664, -20.62905502319336, -19.243576049804688, -17.858097076416016, -16.47261619567871, -15.087137222290039, -13.70165729522705, -12.316177368164062, -10.93069839477539, -9.545218467712402, -8.159738540649414, -6.774258613586426, -5.388779163360596, -4.003299713134766, -2.6178197860717773, -1.232339859008789, 0.1531391143798828, 1.538619041442871, 2.924102783203125, 4.309582710266113, 5.695062160491943, 7.080541610717773, 8.466021537780762, 9.85150146484375, 11.236980438232422, 12.62246036529541, 14.007940292358398, 15.393420219421387, 16.778900146484375, 18.164379119873047, 19.54985809326172, 20.935338973999023, 22.320817947387695, 23.706298828125, 25.091777801513672, 26.477256774902344, 27.86273765563965, 29.24821662902832, 30.633697509765625, 32.0191764831543, 33.40465545654297, 34.79013442993164, 36.17561340332031, 37.561092376708984, 38.946571350097656, 40.332054138183594, 41.717533111572266, 43.10301208496094, 44.48849105834961, 45.87397003173828, 47.25945281982422]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 7.0, 18.0, 34.0, 34.0, 80.0, 110.0, 150.0, 291.0, 406.0, 651.0, 977.0, 1631.0, 2364.0, 3598.0, 5328.0, 7634.0, 10805.0, 14912.0, 20438.0, 27072.0, 34603.0, 42843.0, 51930.0, 61134.0, 68215.0, 74842.0, 78494.0, 78767.0, 76880.0, 71145.0, 64345.0, 55372.0, 46622.0, 37679.0, 29775.0, 22857.0, 16963.0, 12309.0, 8893.0, 6139.0, 4255.0, 2746.0, 1864.0, 1198.0, 763.0, 526.0, 299.0, 223.0, 125.0, 84.0, 58.0, 27.0, 21.0, 15.0, 5.0, 6.0, 4.0], "bins": [-30.75, -29.850830078125, -28.95166015625, -28.052490234375, -27.1533203125, -26.254150390625, -25.35498046875, -24.455810546875, -23.556640625, -22.657470703125, -21.75830078125, -20.859130859375, -19.9599609375, -19.060791015625, -18.16162109375, -17.262451171875, -16.36328125, -15.464111328125, -14.56494140625, -13.665771484375, -12.7666015625, -11.867431640625, -10.96826171875, -10.069091796875, -9.169921875, -8.270751953125, -7.37158203125, -6.472412109375, -5.5732421875, -4.674072265625, -3.77490234375, -2.875732421875, -1.9765625, -1.077392578125, -0.17822265625, 0.720947265625, 1.6201171875, 2.519287109375, 3.41845703125, 4.317626953125, 5.216796875, 6.115966796875, 7.01513671875, 7.914306640625, 8.8134765625, 9.712646484375, 10.61181640625, 11.510986328125, 12.41015625, 13.309326171875, 14.20849609375, 15.107666015625, 16.0068359375, 16.906005859375, 17.80517578125, 18.704345703125, 19.603515625, 20.502685546875, 21.40185546875, 22.301025390625, 23.2001953125, 24.099365234375, 24.99853515625, 25.897705078125, 26.796875]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 3.0, 3.0, 8.0, 5.0, 9.0, 4.0, 9.0, 11.0, 9.0, 18.0, 29.0, 13.0, 25.0, 26.0, 20.0, 33.0, 24.0, 22.0, 40.0, 30.0, 36.0, 31.0, 47.0, 44.0, 44.0, 37.0, 32.0, 35.0, 41.0, 33.0, 33.0, 28.0, 28.0, 21.0, 17.0, 22.0, 19.0, 9.0, 20.0, 15.0, 14.0, 9.0, 14.0, 6.0, 5.0, 1.0, 4.0, 6.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 4.0], "bins": [-40.6875, -39.33935546875, -37.9912109375, -36.64306640625, -35.294921875, -33.94677734375, -32.5986328125, -31.25048828125, -29.90234375, -28.55419921875, -27.2060546875, -25.85791015625, -24.509765625, -23.16162109375, -21.8134765625, -20.46533203125, -19.1171875, -17.76904296875, -16.4208984375, -15.07275390625, -13.724609375, -12.37646484375, -11.0283203125, -9.68017578125, -8.33203125, -6.98388671875, -5.6357421875, -4.28759765625, -2.939453125, -1.59130859375, -0.2431640625, 1.10498046875, 2.453125, 3.80126953125, 5.1494140625, 6.49755859375, 7.845703125, 9.19384765625, 10.5419921875, 11.89013671875, 13.23828125, 14.58642578125, 15.9345703125, 17.28271484375, 18.630859375, 19.97900390625, 21.3271484375, 22.67529296875, 24.0234375, 25.37158203125, 26.7197265625, 28.06787109375, 29.416015625, 30.76416015625, 32.1123046875, 33.46044921875, 34.80859375, 36.15673828125, 37.5048828125, 38.85302734375, 40.201171875, 41.54931640625, 42.8974609375, 44.24560546875, 45.59375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 13.0, 31.0, 35.0, 52.0, 97.0, 144.0, 228.0, 399.0, 649.0, 1042.0, 1775.0, 2800.0, 4218.0, 6880.0, 10462.0, 15032.0, 21974.0, 30769.0, 40836.0, 52462.0, 64968.0, 76533.0, 85711.0, 91366.0, 91725.0, 88312.0, 80101.0, 69071.0, 56817.0, 44688.0, 34022.0, 24569.0, 17341.0, 11779.0, 7996.0, 5110.0, 3236.0, 1953.0, 1288.0, 834.0, 494.0, 274.0, 186.0, 120.0, 69.0, 37.0, 23.0, 12.0, 9.0, 8.0, 3.0, 4.0, 1.0, 2.0], "bins": [-34.40625, -33.3994140625, -32.392578125, -31.3857421875, -30.37890625, -29.3720703125, -28.365234375, -27.3583984375, -26.3515625, -25.3447265625, -24.337890625, -23.3310546875, -22.32421875, -21.3173828125, -20.310546875, -19.3037109375, -18.296875, -17.2900390625, -16.283203125, -15.2763671875, -14.26953125, -13.2626953125, -12.255859375, -11.2490234375, -10.2421875, -9.2353515625, -8.228515625, -7.2216796875, -6.21484375, -5.2080078125, -4.201171875, -3.1943359375, -2.1875, -1.1806640625, -0.173828125, 0.8330078125, 1.83984375, 2.8466796875, 3.853515625, 4.8603515625, 5.8671875, 6.8740234375, 7.880859375, 8.8876953125, 9.89453125, 10.9013671875, 11.908203125, 12.9150390625, 13.921875, 14.9287109375, 15.935546875, 16.9423828125, 17.94921875, 18.9560546875, 19.962890625, 20.9697265625, 21.9765625, 22.9833984375, 23.990234375, 24.9970703125, 26.00390625, 27.0107421875, 28.017578125, 29.0244140625, 30.03125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 2.0, 4.0, 6.0, 9.0, 11.0, 11.0, 5.0, 13.0, 15.0, 19.0, 20.0, 32.0, 28.0, 36.0, 36.0, 33.0, 47.0, 46.0, 47.0, 45.0, 37.0, 47.0, 61.0, 39.0, 38.0, 28.0, 33.0, 34.0, 26.0, 28.0, 28.0, 22.0, 21.0, 14.0, 18.0, 14.0, 12.0, 5.0, 9.0, 8.0, 6.0, 4.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0], "bins": [-38.46875, -37.432373046875, -36.39599609375, -35.359619140625, -34.3232421875, -33.286865234375, -32.25048828125, -31.214111328125, -30.177734375, -29.141357421875, -28.10498046875, -27.068603515625, -26.0322265625, -24.995849609375, -23.95947265625, -22.923095703125, -21.88671875, -20.850341796875, -19.81396484375, -18.777587890625, -17.7412109375, -16.704833984375, -15.66845703125, -14.632080078125, -13.595703125, -12.559326171875, -11.52294921875, -10.486572265625, -9.4501953125, -8.413818359375, -7.37744140625, -6.341064453125, -5.3046875, -4.268310546875, -3.23193359375, -2.195556640625, -1.1591796875, -0.122802734375, 0.91357421875, 1.949951171875, 2.986328125, 4.022705078125, 5.05908203125, 6.095458984375, 7.1318359375, 8.168212890625, 9.20458984375, 10.240966796875, 11.27734375, 12.313720703125, 13.35009765625, 14.386474609375, 15.4228515625, 16.459228515625, 17.49560546875, 18.531982421875, 19.568359375, 20.604736328125, 21.64111328125, 22.677490234375, 23.7138671875, 24.750244140625, 25.78662109375, 26.822998046875, 27.859375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 13.0, 27.0, 23.0, 59.0, 90.0, 135.0, 229.0, 369.0, 609.0, 952.0, 1535.0, 2424.0, 3919.0, 6104.0, 9273.0, 13843.0, 20152.0, 28558.0, 39316.0, 51833.0, 65201.0, 78177.0, 89443.0, 95449.0, 96615.0, 92295.0, 82326.0, 69879.0, 56551.0, 43140.0, 32069.0, 22780.0, 15771.0, 10411.0, 7066.0, 4499.0, 2733.0, 1828.0, 1084.0, 688.0, 399.0, 255.0, 201.0, 86.0, 58.0, 31.0, 24.0, 21.0, 8.0, 7.0, 0.0, 3.0, 1.0], "bins": [-16.703125, -16.2281494140625, -15.753173828125, -15.2781982421875, -14.80322265625, -14.3282470703125, -13.853271484375, -13.3782958984375, -12.9033203125, -12.4283447265625, -11.953369140625, -11.4783935546875, -11.00341796875, -10.5284423828125, -10.053466796875, -9.5784912109375, -9.103515625, -8.6285400390625, -8.153564453125, -7.6785888671875, -7.20361328125, -6.7286376953125, -6.253662109375, -5.7786865234375, -5.3037109375, -4.8287353515625, -4.353759765625, -3.8787841796875, -3.40380859375, -2.9288330078125, -2.453857421875, -1.9788818359375, -1.50390625, -1.0289306640625, -0.553955078125, -0.0789794921875, 0.39599609375, 0.8709716796875, 1.345947265625, 1.8209228515625, 2.2958984375, 2.7708740234375, 3.245849609375, 3.7208251953125, 4.19580078125, 4.6707763671875, 5.145751953125, 5.6207275390625, 6.095703125, 6.5706787109375, 7.045654296875, 7.5206298828125, 7.99560546875, 8.4705810546875, 8.945556640625, 9.4205322265625, 9.8955078125, 10.3704833984375, 10.845458984375, 11.3204345703125, 11.79541015625, 12.2703857421875, 12.745361328125, 13.2203369140625, 13.6953125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 3.0, 6.0, 7.0, 9.0, 8.0, 11.0, 10.0, 24.0, 21.0, 14.0, 28.0, 26.0, 29.0, 46.0, 41.0, 67.0, 51.0, 67.0, 47.0, 48.0, 57.0, 51.0, 43.0, 47.0, 35.0, 27.0, 31.0, 34.0, 25.0, 28.0, 16.0, 5.0, 10.0, 6.0, 5.0, 8.0, 3.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0021915435791015625, -0.0021154582500457764, -0.0020393729209899902, -0.001963287591934204, -0.001887202262878418, -0.0018111169338226318, -0.0017350316047668457, -0.0016589462757110596, -0.0015828609466552734, -0.0015067756175994873, -0.0014306902885437012, -0.001354604959487915, -0.001278519630432129, -0.0012024343013763428, -0.0011263489723205566, -0.0010502636432647705, -0.0009741783142089844, -0.0008980929851531982, -0.0008220076560974121, -0.000745922327041626, -0.0006698369979858398, -0.0005937516689300537, -0.0005176663398742676, -0.00044158101081848145, -0.0003654956817626953, -0.0002894103527069092, -0.00021332502365112305, -0.00013723969459533691, -6.115436553955078e-05, 1.4930963516235352e-05, 9.101629257202148e-05, 0.00016710162162780762, 0.00024318695068359375, 0.0003192722797393799, 0.000395357608795166, 0.00047144293785095215, 0.0005475282669067383, 0.0006236135959625244, 0.0006996989250183105, 0.0007757842540740967, 0.0008518695831298828, 0.0009279549121856689, 0.001004040241241455, 0.0010801255702972412, 0.0011562108993530273, 0.0012322962284088135, 0.0013083815574645996, 0.0013844668865203857, 0.0014605522155761719, 0.001536637544631958, 0.0016127228736877441, 0.0016888082027435303, 0.0017648935317993164, 0.0018409788608551025, 0.0019170641899108887, 0.001993149518966675, 0.002069234848022461, 0.002145320177078247, 0.002221405506134033, 0.0022974908351898193, 0.0023735761642456055, 0.0024496614933013916, 0.0025257468223571777, 0.002601832151412964, 0.00267791748046875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 10.0, 7.0, 16.0, 18.0, 25.0, 42.0, 79.0, 114.0, 178.0, 277.0, 447.0, 748.0, 1162.0, 1991.0, 3166.0, 5000.0, 8120.0, 12427.0, 18914.0, 27904.0, 39817.0, 54128.0, 69974.0, 85398.0, 97108.0, 104229.0, 104096.0, 96138.0, 83282.0, 67491.0, 51849.0, 38076.0, 26780.0, 17869.0, 11749.0, 7551.0, 4735.0, 3040.0, 1775.0, 1089.0, 681.0, 377.0, 256.0, 159.0, 106.0, 60.0, 35.0, 23.0, 17.0, 15.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-19.09375, -18.513916015625, -17.93408203125, -17.354248046875, -16.7744140625, -16.194580078125, -15.61474609375, -15.034912109375, -14.455078125, -13.875244140625, -13.29541015625, -12.715576171875, -12.1357421875, -11.555908203125, -10.97607421875, -10.396240234375, -9.81640625, -9.236572265625, -8.65673828125, -8.076904296875, -7.4970703125, -6.917236328125, -6.33740234375, -5.757568359375, -5.177734375, -4.597900390625, -4.01806640625, -3.438232421875, -2.8583984375, -2.278564453125, -1.69873046875, -1.118896484375, -0.5390625, 0.040771484375, 0.62060546875, 1.200439453125, 1.7802734375, 2.360107421875, 2.93994140625, 3.519775390625, 4.099609375, 4.679443359375, 5.25927734375, 5.839111328125, 6.4189453125, 6.998779296875, 7.57861328125, 8.158447265625, 8.73828125, 9.318115234375, 9.89794921875, 10.477783203125, 11.0576171875, 11.637451171875, 12.21728515625, 12.797119140625, 13.376953125, 13.956787109375, 14.53662109375, 15.116455078125, 15.6962890625, 16.276123046875, 16.85595703125, 17.435791015625, 18.015625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 7.0, 5.0, 8.0, 5.0, 6.0, 11.0, 16.0, 15.0, 16.0, 17.0, 20.0, 23.0, 38.0, 30.0, 31.0, 29.0, 35.0, 48.0, 44.0, 51.0, 47.0, 58.0, 45.0, 47.0, 41.0, 39.0, 42.0, 25.0, 33.0, 25.0, 29.0, 18.0, 14.0, 9.0, 10.0, 11.0, 13.0, 8.0, 10.0, 10.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.046875, -7.78662109375, -7.5263671875, -7.26611328125, -7.005859375, -6.74560546875, -6.4853515625, -6.22509765625, -5.96484375, -5.70458984375, -5.4443359375, -5.18408203125, -4.923828125, -4.66357421875, -4.4033203125, -4.14306640625, -3.8828125, -3.62255859375, -3.3623046875, -3.10205078125, -2.841796875, -2.58154296875, -2.3212890625, -2.06103515625, -1.80078125, -1.54052734375, -1.2802734375, -1.02001953125, -0.759765625, -0.49951171875, -0.2392578125, 0.02099609375, 0.28125, 0.54150390625, 0.8017578125, 1.06201171875, 1.322265625, 1.58251953125, 1.8427734375, 2.10302734375, 2.36328125, 2.62353515625, 2.8837890625, 3.14404296875, 3.404296875, 3.66455078125, 3.9248046875, 4.18505859375, 4.4453125, 4.70556640625, 4.9658203125, 5.22607421875, 5.486328125, 5.74658203125, 6.0068359375, 6.26708984375, 6.52734375, 6.78759765625, 7.0478515625, 7.30810546875, 7.568359375, 7.82861328125, 8.0888671875, 8.34912109375, 8.609375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 5.0, 2.0, 5.0, 8.0, 5.0, 10.0, 24.0, 22.0, 16.0, 20.0, 33.0, 26.0, 33.0, 28.0, 37.0, 41.0, 49.0, 53.0, 39.0, 47.0, 49.0, 38.0, 43.0, 39.0, 50.0, 37.0, 34.0, 30.0, 28.0, 21.0, 19.0, 18.0, 18.0, 19.0, 11.0, 4.0, 11.0, 14.0, 8.0, 1.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.055877685546875, -46.465736389160156, -44.87559509277344, -43.28545379638672, -41.6953125, -40.105167388916016, -38.5150260925293, -36.92488479614258, -35.33474349975586, -33.74460220336914, -32.15446090698242, -30.56431770324707, -28.97417640686035, -27.384035110473633, -25.79389190673828, -24.203750610351562, -22.613609313964844, -21.023468017578125, -19.433326721191406, -17.843183517456055, -16.253042221069336, -14.662900924682617, -13.072758674621582, -11.482616424560547, -9.892475128173828, -8.30233383178711, -6.712191581726074, -5.122049808502197, -3.5319080352783203, -1.9417662620544434, -0.3516244888305664, 1.2385177612304688, 2.828662872314453, 4.41880464553833, 6.008946418762207, 7.599088191986084, 9.189229965209961, 10.77937126159668, 12.369513511657715, 13.95965576171875, 15.549797058105469, 17.139938354492188, 18.730079650878906, 20.320222854614258, 21.910364151000977, 23.500505447387695, 25.090648651123047, 26.680789947509766, 28.270931243896484, 29.861072540283203, 31.451213836669922, 33.04135513305664, 34.631500244140625, 36.221641540527344, 37.81178283691406, 39.40192413330078, 40.9920654296875, 42.58220672607422, 44.17234802246094, 45.762489318847656, 47.352630615234375, 48.94277572631836, 50.53291702270508, 52.1230583190918, 53.713199615478516]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 5.0, 5.0, 3.0, 5.0, 11.0, 11.0, 8.0, 8.0, 11.0, 24.0, 21.0, 21.0, 19.0, 23.0, 35.0, 35.0, 46.0, 41.0, 33.0, 44.0, 62.0, 32.0, 47.0, 35.0, 45.0, 32.0, 33.0, 36.0, 36.0, 39.0, 36.0, 21.0, 27.0, 18.0, 16.0, 10.0, 17.0, 8.0, 13.0, 6.0, 8.0, 2.0, 6.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-49.87618637084961, -48.218204498291016, -46.56022262573242, -44.90224075317383, -43.244258880615234, -41.58627700805664, -39.92829132080078, -38.27030944824219, -36.612327575683594, -34.954345703125, -33.296363830566406, -31.638381958007812, -29.98040008544922, -28.322418212890625, -26.6644344329834, -25.006452560424805, -23.348472595214844, -21.69049072265625, -20.032508850097656, -18.374526977539062, -16.71654510498047, -15.058562278747559, -13.400579452514648, -11.742597579956055, -10.084615707397461, -8.426633834838867, -6.768651485443115, -5.110669136047363, -3.4526872634887695, -1.7947053909301758, -0.13672256469726562, 1.5212593078613281, 3.179241180419922, 4.837223052978516, 6.495205402374268, 8.15318775177002, 9.811169624328613, 11.469151496887207, 13.127134323120117, 14.785116195678711, 16.443098068237305, 18.1010799407959, 19.759061813354492, 21.41704559326172, 23.075027465820312, 24.733009338378906, 26.3909912109375, 28.048973083496094, 29.706954956054688, 31.36493682861328, 33.022918701171875, 34.68090057373047, 36.33888244628906, 37.996864318847656, 39.65484619140625, 41.312828063964844, 42.97080993652344, 44.62879180908203, 46.286773681640625, 47.94475555419922, 49.60273742675781, 51.260719299316406, 52.918701171875, 54.576683044433594, 56.23466873168945]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 10.0, 8.0, 20.0, 46.0, 86.0, 148.0, 206.0, 365.0, 606.0, 931.0, 1560.0, 2587.0, 3989.0, 6512.0, 10237.0, 15534.0, 24431.0, 36609.0, 53517.0, 78296.0, 110165.0, 150811.0, 197814.0, 247393.0, 298873.0, 342089.0, 370475.0, 379481.0, 365350.0, 333067.0, 287964.0, 236496.0, 185057.0, 139804.0, 101428.0, 71578.0, 48984.0, 32666.0, 21266.0, 14202.0, 8874.0, 5682.0, 3476.0, 2169.0, 1345.0, 844.0, 479.0, 286.0, 207.0, 106.0, 69.0, 46.0, 22.0, 10.0, 12.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-31.8125, -30.76513671875, -29.7177734375, -28.67041015625, -27.623046875, -26.57568359375, -25.5283203125, -24.48095703125, -23.43359375, -22.38623046875, -21.3388671875, -20.29150390625, -19.244140625, -18.19677734375, -17.1494140625, -16.10205078125, -15.0546875, -14.00732421875, -12.9599609375, -11.91259765625, -10.865234375, -9.81787109375, -8.7705078125, -7.72314453125, -6.67578125, -5.62841796875, -4.5810546875, -3.53369140625, -2.486328125, -1.43896484375, -0.3916015625, 0.65576171875, 1.703125, 2.75048828125, 3.7978515625, 4.84521484375, 5.892578125, 6.93994140625, 7.9873046875, 9.03466796875, 10.08203125, 11.12939453125, 12.1767578125, 13.22412109375, 14.271484375, 15.31884765625, 16.3662109375, 17.41357421875, 18.4609375, 19.50830078125, 20.5556640625, 21.60302734375, 22.650390625, 23.69775390625, 24.7451171875, 25.79248046875, 26.83984375, 27.88720703125, 28.9345703125, 29.98193359375, 31.029296875, 32.07666015625, 33.1240234375, 34.17138671875, 35.21875]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 6.0, 5.0, 2.0, 7.0, 10.0, 10.0, 7.0, 9.0, 12.0, 24.0, 23.0, 14.0, 21.0, 26.0, 32.0, 37.0, 38.0, 53.0, 29.0, 49.0, 57.0, 36.0, 39.0, 39.0, 41.0, 35.0, 41.0, 35.0, 36.0, 29.0, 31.0, 31.0, 25.0, 19.0, 16.0, 11.0, 13.0, 13.0, 7.0, 10.0, 7.0, 4.0, 5.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-48.375, -46.7724609375, -45.169921875, -43.5673828125, -41.96484375, -40.3623046875, -38.759765625, -37.1572265625, -35.5546875, -33.9521484375, -32.349609375, -30.7470703125, -29.14453125, -27.5419921875, -25.939453125, -24.3369140625, -22.734375, -21.1318359375, -19.529296875, -17.9267578125, -16.32421875, -14.7216796875, -13.119140625, -11.5166015625, -9.9140625, -8.3115234375, -6.708984375, -5.1064453125, -3.50390625, -1.9013671875, -0.298828125, 1.3037109375, 2.90625, 4.5087890625, 6.111328125, 7.7138671875, 9.31640625, 10.9189453125, 12.521484375, 14.1240234375, 15.7265625, 17.3291015625, 18.931640625, 20.5341796875, 22.13671875, 23.7392578125, 25.341796875, 26.9443359375, 28.546875, 30.1494140625, 31.751953125, 33.3544921875, 34.95703125, 36.5595703125, 38.162109375, 39.7646484375, 41.3671875, 42.9697265625, 44.572265625, 46.1748046875, 47.77734375, 49.3798828125, 50.982421875, 52.5849609375, 54.1875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 3.0, 6.0, 8.0, 14.0, 22.0, 29.0, 66.0, 122.0, 191.0, 288.0, 501.0, 858.0, 1372.0, 2338.0, 3764.0, 5994.0, 9621.0, 15022.0, 22766.0, 35054.0, 51722.0, 72690.0, 101891.0, 137946.0, 178833.0, 225041.0, 269869.0, 311560.0, 341380.0, 355828.0, 353649.0, 332935.0, 301079.0, 258719.0, 212352.0, 167640.0, 128321.0, 93974.0, 67016.0, 46231.0, 31150.0, 20898.0, 13368.0, 8438.0, 5341.0, 3297.0, 2048.0, 1230.0, 726.0, 467.0, 255.0, 164.0, 102.0, 38.0, 29.0, 14.0, 7.0, 9.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-33.6875, -32.59619140625, -31.5048828125, -30.41357421875, -29.322265625, -28.23095703125, -27.1396484375, -26.04833984375, -24.95703125, -23.86572265625, -22.7744140625, -21.68310546875, -20.591796875, -19.50048828125, -18.4091796875, -17.31787109375, -16.2265625, -15.13525390625, -14.0439453125, -12.95263671875, -11.861328125, -10.77001953125, -9.6787109375, -8.58740234375, -7.49609375, -6.40478515625, -5.3134765625, -4.22216796875, -3.130859375, -2.03955078125, -0.9482421875, 0.14306640625, 1.234375, 2.32568359375, 3.4169921875, 4.50830078125, 5.599609375, 6.69091796875, 7.7822265625, 8.87353515625, 9.96484375, 11.05615234375, 12.1474609375, 13.23876953125, 14.330078125, 15.42138671875, 16.5126953125, 17.60400390625, 18.6953125, 19.78662109375, 20.8779296875, 21.96923828125, 23.060546875, 24.15185546875, 25.2431640625, 26.33447265625, 27.42578125, 28.51708984375, 29.6083984375, 30.69970703125, 31.791015625, 32.88232421875, 33.9736328125, 35.06494140625, 36.15625]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 10.0, 12.0, 13.0, 16.0, 21.0, 39.0, 35.0, 39.0, 54.0, 61.0, 83.0, 101.0, 97.0, 120.0, 142.0, 153.0, 197.0, 168.0, 189.0, 195.0, 193.0, 222.0, 190.0, 201.0, 192.0, 199.0, 161.0, 130.0, 130.0, 124.0, 104.0, 83.0, 82.0, 71.0, 59.0, 44.0, 32.0, 30.0, 17.0, 16.0, 14.0, 8.0, 8.0, 5.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.0, -20.30908203125, -19.6181640625, -18.92724609375, -18.236328125, -17.54541015625, -16.8544921875, -16.16357421875, -15.47265625, -14.78173828125, -14.0908203125, -13.39990234375, -12.708984375, -12.01806640625, -11.3271484375, -10.63623046875, -9.9453125, -9.25439453125, -8.5634765625, -7.87255859375, -7.181640625, -6.49072265625, -5.7998046875, -5.10888671875, -4.41796875, -3.72705078125, -3.0361328125, -2.34521484375, -1.654296875, -0.96337890625, -0.2724609375, 0.41845703125, 1.109375, 1.80029296875, 2.4912109375, 3.18212890625, 3.873046875, 4.56396484375, 5.2548828125, 5.94580078125, 6.63671875, 7.32763671875, 8.0185546875, 8.70947265625, 9.400390625, 10.09130859375, 10.7822265625, 11.47314453125, 12.1640625, 12.85498046875, 13.5458984375, 14.23681640625, 14.927734375, 15.61865234375, 16.3095703125, 17.00048828125, 17.69140625, 18.38232421875, 19.0732421875, 19.76416015625, 20.455078125, 21.14599609375, 21.8369140625, 22.52783203125, 23.21875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 5.0, 3.0, 10.0, 7.0, 9.0, 9.0, 16.0, 17.0, 23.0, 19.0, 30.0, 41.0, 48.0, 31.0, 37.0, 36.0, 31.0, 43.0, 42.0, 48.0, 55.0, 49.0, 31.0, 43.0, 38.0, 35.0, 35.0, 21.0, 29.0, 24.0, 23.0, 19.0, 16.0, 18.0, 11.0, 11.0, 12.0, 4.0, 4.0, 2.0, 4.0, 7.0, 2.0, 4.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-53.021820068359375, -51.36710739135742, -49.71239471435547, -48.057682037353516, -46.40296936035156, -44.748260498046875, -43.09354782104492, -41.43883514404297, -39.784122467041016, -38.12940979003906, -36.47469711303711, -34.819984436035156, -33.16527557373047, -31.510560989379883, -29.855850219726562, -28.20113754272461, -26.546424865722656, -24.891712188720703, -23.23699951171875, -21.58228874206543, -19.927576065063477, -18.272863388061523, -16.618152618408203, -14.96343994140625, -13.308727264404297, -11.654014587402344, -9.999302864074707, -8.34459114074707, -6.689878463745117, -5.035165786743164, -3.3804540634155273, -1.7257423400878906, -0.07102584838867188, 1.583686351776123, 3.238398551940918, 4.893110752105713, 6.547822952270508, 8.202535629272461, 9.857247352600098, 11.511959075927734, 13.166671752929688, 14.82138442993164, 16.476097106933594, 18.130807876586914, 19.785520553588867, 21.44023323059082, 23.09494400024414, 24.749656677246094, 26.404369354248047, 28.05908203125, 29.713794708251953, 31.368505477905273, 33.023216247558594, 34.67793273925781, 36.3326416015625, 37.98735427856445, 39.642066955566406, 41.29677963256836, 42.95149230957031, 44.606204986572266, 46.26091766357422, 47.915626525878906, 49.57033920288086, 51.22505187988281, 52.879764556884766]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 6.0, 1.0, 5.0, 10.0, 7.0, 7.0, 10.0, 14.0, 18.0, 16.0, 25.0, 27.0, 31.0, 18.0, 43.0, 28.0, 36.0, 41.0, 59.0, 48.0, 53.0, 41.0, 46.0, 48.0, 42.0, 40.0, 36.0, 42.0, 28.0, 33.0, 21.0, 25.0, 21.0, 9.0, 14.0, 6.0, 14.0, 6.0, 7.0, 8.0, 7.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.673866271972656, -56.72898864746094, -54.78411102294922, -52.8392333984375, -50.89435958862305, -48.94948196411133, -47.00460433959961, -45.05972671508789, -43.11484909057617, -41.16997146606445, -39.225093841552734, -37.28022003173828, -35.33534240722656, -33.390464782714844, -31.445587158203125, -29.500709533691406, -27.55583381652832, -25.6109561920166, -23.666080474853516, -21.721202850341797, -19.776325225830078, -17.83144760131836, -15.886571884155273, -13.941694259643555, -11.996817588806152, -10.05194091796875, -8.107063293457031, -6.162186622619629, -4.217309474945068, -2.272432327270508, -0.32755565643310547, 1.6173219680786133, 3.5621986389160156, 5.507075786590576, 7.451952934265137, 9.396829605102539, 11.341707229614258, 13.28658390045166, 15.231460571289062, 17.17633819580078, 19.1212158203125, 21.06609344482422, 23.010969161987305, 24.955846786499023, 26.900724411010742, 28.845600128173828, 30.790477752685547, 32.735355377197266, 34.68022918701172, 36.62510681152344, 38.569984436035156, 40.514862060546875, 42.45973587036133, 44.40461349487305, 46.349491119384766, 48.294368743896484, 50.2392463684082, 52.18412399291992, 54.12900161743164, 56.073875427246094, 58.01875305175781, 59.96363067626953, 61.90850830078125, 63.85338592529297, 65.79826354980469]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 4.0, 4.0, 9.0, 10.0, 17.0, 15.0, 25.0, 32.0, 53.0, 77.0, 134.0, 193.0, 297.0, 449.0, 682.0, 1166.0, 1828.0, 2809.0, 4284.0, 6600.0, 10415.0, 15971.0, 24069.0, 35105.0, 50850.0, 69076.0, 88592.0, 105742.0, 116300.0, 115300.0, 103539.0, 85229.0, 65190.0, 47872.0, 32979.0, 22203.0, 14644.0, 9543.0, 6211.0, 3922.0, 2541.0, 1653.0, 1047.0, 678.0, 432.0, 271.0, 174.0, 123.0, 70.0, 52.0, 39.0, 22.0, 10.0, 9.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.015625, -15.513671875, -15.01171875, -14.509765625, -14.0078125, -13.505859375, -13.00390625, -12.501953125, -12.0, -11.498046875, -10.99609375, -10.494140625, -9.9921875, -9.490234375, -8.98828125, -8.486328125, -7.984375, -7.482421875, -6.98046875, -6.478515625, -5.9765625, -5.474609375, -4.97265625, -4.470703125, -3.96875, -3.466796875, -2.96484375, -2.462890625, -1.9609375, -1.458984375, -0.95703125, -0.455078125, 0.046875, 0.548828125, 1.05078125, 1.552734375, 2.0546875, 2.556640625, 3.05859375, 3.560546875, 4.0625, 4.564453125, 5.06640625, 5.568359375, 6.0703125, 6.572265625, 7.07421875, 7.576171875, 8.078125, 8.580078125, 9.08203125, 9.583984375, 10.0859375, 10.587890625, 11.08984375, 11.591796875, 12.09375, 12.595703125, 13.09765625, 13.599609375, 14.1015625, 14.603515625, 15.10546875, 15.607421875, 16.109375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 3.0, 3.0, 10.0, 7.0, 7.0, 11.0, 13.0, 18.0, 16.0, 27.0, 27.0, 31.0, 15.0, 43.0, 29.0, 36.0, 40.0, 60.0, 50.0, 53.0, 38.0, 46.0, 53.0, 36.0, 43.0, 35.0, 41.0, 31.0, 28.0, 24.0, 25.0, 21.0, 9.0, 14.0, 6.0, 14.0, 6.0, 8.0, 7.0, 7.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.53125, -56.58642578125, -54.6416015625, -52.69677734375, -50.751953125, -48.80712890625, -46.8623046875, -44.91748046875, -42.97265625, -41.02783203125, -39.0830078125, -37.13818359375, -35.193359375, -33.24853515625, -31.3037109375, -29.35888671875, -27.4140625, -25.46923828125, -23.5244140625, -21.57958984375, -19.634765625, -17.68994140625, -15.7451171875, -13.80029296875, -11.85546875, -9.91064453125, -7.9658203125, -6.02099609375, -4.076171875, -2.13134765625, -0.1865234375, 1.75830078125, 3.703125, 5.64794921875, 7.5927734375, 9.53759765625, 11.482421875, 13.42724609375, 15.3720703125, 17.31689453125, 19.26171875, 21.20654296875, 23.1513671875, 25.09619140625, 27.041015625, 28.98583984375, 30.9306640625, 32.87548828125, 34.8203125, 36.76513671875, 38.7099609375, 40.65478515625, 42.599609375, 44.54443359375, 46.4892578125, 48.43408203125, 50.37890625, 52.32373046875, 54.2685546875, 56.21337890625, 58.158203125, 60.10302734375, 62.0478515625, 63.99267578125, 65.9375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 4.0, 8.0, 15.0, 18.0, 23.0, 43.0, 45.0, 74.0, 102.0, 170.0, 250.0, 412.0, 598.0, 1004.0, 1547.0, 2711.0, 4599.0, 8199.0, 15124.0, 28433.0, 53095.0, 95644.0, 155678.0, 203179.0, 187463.0, 127875.0, 73481.0, 39972.0, 21559.0, 11437.0, 6402.0, 3603.0, 2193.0, 1305.0, 845.0, 480.0, 292.0, 210.0, 141.0, 86.0, 67.0, 47.0, 28.0, 24.0, 24.0, 10.0, 12.0, 10.0, 2.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-25.046875, -24.23291015625, -23.4189453125, -22.60498046875, -21.791015625, -20.97705078125, -20.1630859375, -19.34912109375, -18.53515625, -17.72119140625, -16.9072265625, -16.09326171875, -15.279296875, -14.46533203125, -13.6513671875, -12.83740234375, -12.0234375, -11.20947265625, -10.3955078125, -9.58154296875, -8.767578125, -7.95361328125, -7.1396484375, -6.32568359375, -5.51171875, -4.69775390625, -3.8837890625, -3.06982421875, -2.255859375, -1.44189453125, -0.6279296875, 0.18603515625, 1.0, 1.81396484375, 2.6279296875, 3.44189453125, 4.255859375, 5.06982421875, 5.8837890625, 6.69775390625, 7.51171875, 8.32568359375, 9.1396484375, 9.95361328125, 10.767578125, 11.58154296875, 12.3955078125, 13.20947265625, 14.0234375, 14.83740234375, 15.6513671875, 16.46533203125, 17.279296875, 18.09326171875, 18.9072265625, 19.72119140625, 20.53515625, 21.34912109375, 22.1630859375, 22.97705078125, 23.791015625, 24.60498046875, 25.4189453125, 26.23291015625, 27.046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 2.0, 9.0, 12.0, 8.0, 12.0, 14.0, 10.0, 21.0, 19.0, 26.0, 30.0, 26.0, 54.0, 42.0, 31.0, 43.0, 41.0, 34.0, 30.0, 41.0, 41.0, 47.0, 46.0, 36.0, 33.0, 23.0, 25.0, 30.0, 23.0, 22.0, 18.0, 24.0, 16.0, 21.0, 19.0, 18.0, 10.0, 7.0, 10.0, 4.0, 5.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-32.875, -31.74267578125, -30.6103515625, -29.47802734375, -28.345703125, -27.21337890625, -26.0810546875, -24.94873046875, -23.81640625, -22.68408203125, -21.5517578125, -20.41943359375, -19.287109375, -18.15478515625, -17.0224609375, -15.89013671875, -14.7578125, -13.62548828125, -12.4931640625, -11.36083984375, -10.228515625, -9.09619140625, -7.9638671875, -6.83154296875, -5.69921875, -4.56689453125, -3.4345703125, -2.30224609375, -1.169921875, -0.03759765625, 1.0947265625, 2.22705078125, 3.359375, 4.49169921875, 5.6240234375, 6.75634765625, 7.888671875, 9.02099609375, 10.1533203125, 11.28564453125, 12.41796875, 13.55029296875, 14.6826171875, 15.81494140625, 16.947265625, 18.07958984375, 19.2119140625, 20.34423828125, 21.4765625, 22.60888671875, 23.7412109375, 24.87353515625, 26.005859375, 27.13818359375, 28.2705078125, 29.40283203125, 30.53515625, 31.66748046875, 32.7998046875, 33.93212890625, 35.064453125, 36.19677734375, 37.3291015625, 38.46142578125, 39.59375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 5.0, 4.0, 18.0, 13.0, 18.0, 32.0, 28.0, 39.0, 63.0, 117.0, 136.0, 221.0, 346.0, 458.0, 718.0, 1203.0, 1962.0, 3310.0, 5826.0, 10676.0, 21075.0, 46018.0, 110373.0, 259373.0, 314596.0, 151085.0, 62122.0, 27643.0, 13837.0, 7104.0, 3967.0, 2263.0, 1404.0, 865.0, 533.0, 336.0, 231.0, 155.0, 115.0, 72.0, 58.0, 40.0, 25.0, 23.0, 20.0, 13.0, 8.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.6875, -18.106689453125, -17.52587890625, -16.945068359375, -16.3642578125, -15.783447265625, -15.20263671875, -14.621826171875, -14.041015625, -13.460205078125, -12.87939453125, -12.298583984375, -11.7177734375, -11.136962890625, -10.55615234375, -9.975341796875, -9.39453125, -8.813720703125, -8.23291015625, -7.652099609375, -7.0712890625, -6.490478515625, -5.90966796875, -5.328857421875, -4.748046875, -4.167236328125, -3.58642578125, -3.005615234375, -2.4248046875, -1.843994140625, -1.26318359375, -0.682373046875, -0.1015625, 0.479248046875, 1.06005859375, 1.640869140625, 2.2216796875, 2.802490234375, 3.38330078125, 3.964111328125, 4.544921875, 5.125732421875, 5.70654296875, 6.287353515625, 6.8681640625, 7.448974609375, 8.02978515625, 8.610595703125, 9.19140625, 9.772216796875, 10.35302734375, 10.933837890625, 11.5146484375, 12.095458984375, 12.67626953125, 13.257080078125, 13.837890625, 14.418701171875, 14.99951171875, 15.580322265625, 16.1611328125, 16.741943359375, 17.32275390625, 17.903564453125, 18.484375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 5.0, 2.0, 5.0, 8.0, 4.0, 12.0, 7.0, 8.0, 9.0, 13.0, 24.0, 24.0, 30.0, 34.0, 33.0, 46.0, 46.0, 66.0, 49.0, 59.0, 55.0, 42.0, 42.0, 48.0, 44.0, 47.0, 38.0, 37.0, 23.0, 21.0, 22.0, 20.0, 13.0, 17.0, 10.0, 13.0, 5.0, 4.0, 4.0, 4.0, 6.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0007476806640625, -0.0007245838642120361, -0.0007014870643615723, -0.0006783902645111084, -0.0006552934646606445, -0.0006321966648101807, -0.0006090998649597168, -0.0005860030651092529, -0.0005629062652587891, -0.0005398094654083252, -0.0005167126655578613, -0.0004936158657073975, -0.0004705190658569336, -0.0004474222660064697, -0.00042432546615600586, -0.000401228666305542, -0.0003781318664550781, -0.00035503506660461426, -0.0003319382667541504, -0.0003088414669036865, -0.00028574466705322266, -0.0002626478672027588, -0.00023955106735229492, -0.00021645426750183105, -0.0001933574676513672, -0.00017026066780090332, -0.00014716386795043945, -0.00012406706809997559, -0.00010097026824951172, -7.787346839904785e-05, -5.4776668548583984e-05, -3.167986869812012e-05, -8.58306884765625e-06, 1.4513731002807617e-05, 3.7610530853271484e-05, 6.070733070373535e-05, 8.380413055419922e-05, 0.00010690093040466309, 0.00012999773025512695, 0.00015309453010559082, 0.0001761913299560547, 0.00019928812980651855, 0.00022238492965698242, 0.0002454817295074463, 0.00026857852935791016, 0.000291675329208374, 0.0003147721290588379, 0.00033786892890930176, 0.0003609657287597656, 0.0003840625286102295, 0.00040715932846069336, 0.0004302561283111572, 0.0004533529281616211, 0.00047644972801208496, 0.0004995465278625488, 0.0005226433277130127, 0.0005457401275634766, 0.0005688369274139404, 0.0005919337272644043, 0.0006150305271148682, 0.000638127326965332, 0.0006612241268157959, 0.0006843209266662598, 0.0007074177265167236, 0.0007305145263671875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 0.0, 5.0, 6.0, 7.0, 14.0, 15.0, 21.0, 51.0, 55.0, 85.0, 134.0, 206.0, 282.0, 391.0, 635.0, 960.0, 1616.0, 2508.0, 4264.0, 7659.0, 14027.0, 26037.0, 47588.0, 85708.0, 139270.0, 186684.0, 189028.0, 142572.0, 88590.0, 49860.0, 26421.0, 14167.0, 7981.0, 4576.0, 2578.0, 1584.0, 970.0, 654.0, 447.0, 307.0, 206.0, 148.0, 90.0, 54.0, 33.0, 23.0, 14.0, 12.0, 10.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.703125, -17.09326171875, -16.4833984375, -15.87353515625, -15.263671875, -14.65380859375, -14.0439453125, -13.43408203125, -12.82421875, -12.21435546875, -11.6044921875, -10.99462890625, -10.384765625, -9.77490234375, -9.1650390625, -8.55517578125, -7.9453125, -7.33544921875, -6.7255859375, -6.11572265625, -5.505859375, -4.89599609375, -4.2861328125, -3.67626953125, -3.06640625, -2.45654296875, -1.8466796875, -1.23681640625, -0.626953125, -0.01708984375, 0.5927734375, 1.20263671875, 1.8125, 2.42236328125, 3.0322265625, 3.64208984375, 4.251953125, 4.86181640625, 5.4716796875, 6.08154296875, 6.69140625, 7.30126953125, 7.9111328125, 8.52099609375, 9.130859375, 9.74072265625, 10.3505859375, 10.96044921875, 11.5703125, 12.18017578125, 12.7900390625, 13.39990234375, 14.009765625, 14.61962890625, 15.2294921875, 15.83935546875, 16.44921875, 17.05908203125, 17.6689453125, 18.27880859375, 18.888671875, 19.49853515625, 20.1083984375, 20.71826171875, 21.328125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 1.0, 14.0, 9.0, 9.0, 16.0, 19.0, 29.0, 28.0, 30.0, 32.0, 48.0, 40.0, 49.0, 62.0, 45.0, 51.0, 64.0, 56.0, 50.0, 42.0, 52.0, 48.0, 37.0, 45.0, 20.0, 15.0, 20.0, 12.0, 10.0, 8.0, 7.0, 4.0, 4.0, 3.0, 8.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.54296875, -5.33001708984375, -5.1170654296875, -4.90411376953125, -4.691162109375, -4.47821044921875, -4.2652587890625, -4.05230712890625, -3.83935546875, -3.62640380859375, -3.4134521484375, -3.20050048828125, -2.987548828125, -2.77459716796875, -2.5616455078125, -2.34869384765625, -2.1357421875, -1.92279052734375, -1.7098388671875, -1.49688720703125, -1.283935546875, -1.07098388671875, -0.8580322265625, -0.64508056640625, -0.43212890625, -0.21917724609375, -0.0062255859375, 0.20672607421875, 0.419677734375, 0.63262939453125, 0.8455810546875, 1.05853271484375, 1.271484375, 1.48443603515625, 1.6973876953125, 1.91033935546875, 2.123291015625, 2.33624267578125, 2.5491943359375, 2.76214599609375, 2.97509765625, 3.18804931640625, 3.4010009765625, 3.61395263671875, 3.826904296875, 4.03985595703125, 4.2528076171875, 4.46575927734375, 4.6787109375, 4.89166259765625, 5.1046142578125, 5.31756591796875, 5.530517578125, 5.74346923828125, 5.9564208984375, 6.16937255859375, 6.38232421875, 6.59527587890625, 6.8082275390625, 7.02117919921875, 7.234130859375, 7.44708251953125, 7.6600341796875, 7.87298583984375, 8.0859375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 5.0, 7.0, 7.0, 12.0, 9.0, 23.0, 22.0, 28.0, 27.0, 24.0, 40.0, 34.0, 40.0, 36.0, 41.0, 51.0, 32.0, 41.0, 47.0, 50.0, 43.0, 34.0, 47.0, 32.0, 18.0, 34.0, 33.0, 21.0, 33.0, 20.0, 20.0, 8.0, 15.0, 9.0, 13.0, 7.0, 5.0, 6.0, 6.0, 2.0, 3.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-53.210025787353516, -51.56853485107422, -49.92704772949219, -48.28555679321289, -46.64406967163086, -45.00257873535156, -43.36109161376953, -41.719600677490234, -40.07810974121094, -38.43661880493164, -36.79513168334961, -35.15364074707031, -33.51215362548828, -31.870662689208984, -30.22917366027832, -28.587684631347656, -26.946197509765625, -25.30470848083496, -23.663219451904297, -22.021728515625, -20.38024139404297, -18.738750457763672, -17.097261428833008, -15.455772399902344, -13.81428337097168, -12.172794342041016, -10.531305313110352, -8.889815330505371, -7.248326301574707, -5.606837272644043, -3.9653472900390625, -2.3238582611083984, -0.682373046875, 0.9591162204742432, 2.6006054878234863, 4.242094993591309, 5.883584022521973, 7.525073051452637, 9.166563034057617, 10.808052062988281, 12.449541091918945, 14.09103012084961, 15.732519149780273, 17.374008178710938, 19.015499114990234, 20.656986236572266, 22.298477172851562, 23.939966201782227, 25.58145523071289, 27.222944259643555, 28.86443328857422, 30.505924224853516, 32.14741134643555, 33.788902282714844, 35.430389404296875, 37.07188034057617, 38.71337127685547, 40.354862213134766, 41.9963493347168, 43.637840270996094, 45.279327392578125, 46.92081832885742, 48.56230926513672, 50.20379638671875, 51.84528350830078]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 4.0, 10.0, 4.0, 10.0, 10.0, 13.0, 18.0, 19.0, 26.0, 19.0, 30.0, 25.0, 43.0, 23.0, 36.0, 39.0, 54.0, 52.0, 47.0, 45.0, 50.0, 44.0, 42.0, 38.0, 33.0, 49.0, 36.0, 21.0, 21.0, 25.0, 25.0, 11.0, 18.0, 5.0, 11.0, 9.0, 4.0, 11.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.333404541015625, -56.407047271728516, -54.480690002441406, -52.5543327331543, -50.62797546386719, -48.70161819458008, -46.77526092529297, -44.848899841308594, -42.92254638671875, -40.99618911743164, -39.06983184814453, -37.14347457885742, -35.21711730957031, -33.2907600402832, -31.36440086364746, -29.43804359436035, -27.51168441772461, -25.5853271484375, -23.65896987915039, -21.73261260986328, -19.806255340576172, -17.879898071289062, -15.95353889465332, -14.027181625366211, -12.100824356079102, -10.174467086791992, -8.248109817504883, -6.321751594543457, -4.395394325256348, -2.4690370559692383, -0.5426788330078125, 1.3836784362792969, 3.3100357055664062, 5.236392974853516, 7.162750720977783, 9.08910846710205, 11.01546573638916, 12.94182300567627, 14.868181228637695, 16.794538497924805, 18.720895767211914, 20.647253036499023, 22.573610305786133, 24.499969482421875, 26.426326751708984, 28.352684020996094, 30.279041290283203, 32.20539855957031, 34.13175582885742, 36.05811309814453, 37.98447036743164, 39.91082763671875, 41.83718490600586, 43.76354217529297, 45.689903259277344, 47.61625671386719, 49.54261779785156, 51.46897506713867, 53.39533233642578, 55.32168960571289, 57.248046875, 59.17440414428711, 61.10076141357422, 63.027122497558594, 64.95347595214844]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 8.0, 4.0, 18.0, 19.0, 23.0, 24.0, 56.0, 69.0, 119.0, 175.0, 285.0, 475.0, 753.0, 1341.0, 2176.0, 3554.0, 5726.0, 9214.0, 14390.0, 22152.0, 32090.0, 45433.0, 60847.0, 77074.0, 91840.0, 101422.0, 105220.0, 101684.0, 91915.0, 77637.0, 61700.0, 46254.0, 32901.0, 22557.0, 14755.0, 9442.0, 5790.0, 3657.0, 2262.0, 1326.0, 803.0, 493.0, 310.0, 192.0, 128.0, 91.0, 48.0, 34.0, 31.0, 19.0, 14.0, 11.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-41.5, -40.18359375, -38.8671875, -37.55078125, -36.234375, -34.91796875, -33.6015625, -32.28515625, -30.96875, -29.65234375, -28.3359375, -27.01953125, -25.703125, -24.38671875, -23.0703125, -21.75390625, -20.4375, -19.12109375, -17.8046875, -16.48828125, -15.171875, -13.85546875, -12.5390625, -11.22265625, -9.90625, -8.58984375, -7.2734375, -5.95703125, -4.640625, -3.32421875, -2.0078125, -0.69140625, 0.625, 1.94140625, 3.2578125, 4.57421875, 5.890625, 7.20703125, 8.5234375, 9.83984375, 11.15625, 12.47265625, 13.7890625, 15.10546875, 16.421875, 17.73828125, 19.0546875, 20.37109375, 21.6875, 23.00390625, 24.3203125, 25.63671875, 26.953125, 28.26953125, 29.5859375, 30.90234375, 32.21875, 33.53515625, 34.8515625, 36.16796875, 37.484375, 38.80078125, 40.1171875, 41.43359375, 42.75]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 1.0, 5.0, 10.0, 4.0, 13.0, 4.0, 17.0, 16.0, 23.0, 22.0, 23.0, 28.0, 25.0, 43.0, 25.0, 35.0, 34.0, 58.0, 51.0, 47.0, 42.0, 51.0, 46.0, 40.0, 39.0, 34.0, 48.0, 33.0, 25.0, 23.0, 24.0, 27.0, 8.0, 18.0, 3.0, 12.0, 10.0, 5.0, 10.0, 5.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.8125, -55.9033203125, -53.994140625, -52.0849609375, -50.17578125, -48.2666015625, -46.357421875, -44.4482421875, -42.5390625, -40.6298828125, -38.720703125, -36.8115234375, -34.90234375, -32.9931640625, -31.083984375, -29.1748046875, -27.265625, -25.3564453125, -23.447265625, -21.5380859375, -19.62890625, -17.7197265625, -15.810546875, -13.9013671875, -11.9921875, -10.0830078125, -8.173828125, -6.2646484375, -4.35546875, -2.4462890625, -0.537109375, 1.3720703125, 3.28125, 5.1904296875, 7.099609375, 9.0087890625, 10.91796875, 12.8271484375, 14.736328125, 16.6455078125, 18.5546875, 20.4638671875, 22.373046875, 24.2822265625, 26.19140625, 28.1005859375, 30.009765625, 31.9189453125, 33.828125, 35.7373046875, 37.646484375, 39.5556640625, 41.46484375, 43.3740234375, 45.283203125, 47.1923828125, 49.1015625, 51.0107421875, 52.919921875, 54.8291015625, 56.73828125, 58.6474609375, 60.556640625, 62.4658203125, 64.375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 4.0, 3.0, 8.0, 15.0, 25.0, 33.0, 45.0, 86.0, 108.0, 202.0, 315.0, 501.0, 803.0, 1376.0, 2421.0, 3959.0, 6527.0, 11088.0, 17698.0, 27980.0, 42338.0, 61482.0, 82268.0, 101711.0, 115972.0, 120114.0, 113622.0, 97763.0, 77382.0, 57130.0, 39213.0, 25274.0, 16141.0, 10065.0, 5995.0, 3668.0, 2094.0, 1238.0, 688.0, 474.0, 291.0, 181.0, 89.0, 56.0, 47.0, 31.0, 16.0, 10.0, 8.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.15625, -44.53076171875, -42.9052734375, -41.27978515625, -39.654296875, -38.02880859375, -36.4033203125, -34.77783203125, -33.15234375, -31.52685546875, -29.9013671875, -28.27587890625, -26.650390625, -25.02490234375, -23.3994140625, -21.77392578125, -20.1484375, -18.52294921875, -16.8974609375, -15.27197265625, -13.646484375, -12.02099609375, -10.3955078125, -8.77001953125, -7.14453125, -5.51904296875, -3.8935546875, -2.26806640625, -0.642578125, 0.98291015625, 2.6083984375, 4.23388671875, 5.859375, 7.48486328125, 9.1103515625, 10.73583984375, 12.361328125, 13.98681640625, 15.6123046875, 17.23779296875, 18.86328125, 20.48876953125, 22.1142578125, 23.73974609375, 25.365234375, 26.99072265625, 28.6162109375, 30.24169921875, 31.8671875, 33.49267578125, 35.1181640625, 36.74365234375, 38.369140625, 39.99462890625, 41.6201171875, 43.24560546875, 44.87109375, 46.49658203125, 48.1220703125, 49.74755859375, 51.373046875, 52.99853515625, 54.6240234375, 56.24951171875, 57.875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 5.0, 3.0, 2.0, 2.0, 5.0, 7.0, 8.0, 7.0, 11.0, 14.0, 13.0, 21.0, 31.0, 29.0, 37.0, 26.0, 37.0, 40.0, 36.0, 43.0, 37.0, 28.0, 39.0, 51.0, 45.0, 40.0, 40.0, 36.0, 32.0, 36.0, 33.0, 31.0, 30.0, 27.0, 15.0, 19.0, 20.0, 20.0, 12.0, 12.0, 8.0, 4.0, 6.0, 3.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.15625, -32.86767578125, -31.5791015625, -30.29052734375, -29.001953125, -27.71337890625, -26.4248046875, -25.13623046875, -23.84765625, -22.55908203125, -21.2705078125, -19.98193359375, -18.693359375, -17.40478515625, -16.1162109375, -14.82763671875, -13.5390625, -12.25048828125, -10.9619140625, -9.67333984375, -8.384765625, -7.09619140625, -5.8076171875, -4.51904296875, -3.23046875, -1.94189453125, -0.6533203125, 0.63525390625, 1.923828125, 3.21240234375, 4.5009765625, 5.78955078125, 7.078125, 8.36669921875, 9.6552734375, 10.94384765625, 12.232421875, 13.52099609375, 14.8095703125, 16.09814453125, 17.38671875, 18.67529296875, 19.9638671875, 21.25244140625, 22.541015625, 23.82958984375, 25.1181640625, 26.40673828125, 27.6953125, 28.98388671875, 30.2724609375, 31.56103515625, 32.849609375, 34.13818359375, 35.4267578125, 36.71533203125, 38.00390625, 39.29248046875, 40.5810546875, 41.86962890625, 43.158203125, 44.44677734375, 45.7353515625, 47.02392578125, 48.3125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 9.0, 7.0, 10.0, 23.0, 31.0, 36.0, 53.0, 91.0, 138.0, 215.0, 360.0, 545.0, 916.0, 1409.0, 2376.0, 3823.0, 6161.0, 9968.0, 15187.0, 23878.0, 35368.0, 50707.0, 67891.0, 85850.0, 101250.0, 110390.0, 111513.0, 102757.0, 88230.0, 70202.0, 52010.0, 37024.0, 25529.0, 16590.0, 10630.0, 6556.0, 4089.0, 2689.0, 1480.0, 975.0, 551.0, 337.0, 256.0, 148.0, 119.0, 61.0, 47.0, 18.0, 20.0, 14.0, 3.0, 10.0, 8.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-18.265625, -17.696044921875, -17.12646484375, -16.556884765625, -15.9873046875, -15.417724609375, -14.84814453125, -14.278564453125, -13.708984375, -13.139404296875, -12.56982421875, -12.000244140625, -11.4306640625, -10.861083984375, -10.29150390625, -9.721923828125, -9.15234375, -8.582763671875, -8.01318359375, -7.443603515625, -6.8740234375, -6.304443359375, -5.73486328125, -5.165283203125, -4.595703125, -4.026123046875, -3.45654296875, -2.886962890625, -2.3173828125, -1.747802734375, -1.17822265625, -0.608642578125, -0.0390625, 0.530517578125, 1.10009765625, 1.669677734375, 2.2392578125, 2.808837890625, 3.37841796875, 3.947998046875, 4.517578125, 5.087158203125, 5.65673828125, 6.226318359375, 6.7958984375, 7.365478515625, 7.93505859375, 8.504638671875, 9.07421875, 9.643798828125, 10.21337890625, 10.782958984375, 11.3525390625, 11.922119140625, 12.49169921875, 13.061279296875, 13.630859375, 14.200439453125, 14.77001953125, 15.339599609375, 15.9091796875, 16.478759765625, 17.04833984375, 17.617919921875, 18.1875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 5.0, 4.0, 5.0, 7.0, 8.0, 13.0, 14.0, 16.0, 18.0, 14.0, 26.0, 20.0, 25.0, 37.0, 28.0, 41.0, 33.0, 50.0, 47.0, 45.0, 44.0, 39.0, 58.0, 54.0, 50.0, 39.0, 40.0, 33.0, 36.0, 27.0, 25.0, 15.0, 14.0, 16.0, 14.0, 10.0, 10.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00238800048828125, -0.002317070960998535, -0.0022461414337158203, -0.0021752119064331055, -0.0021042823791503906, -0.0020333528518676758, -0.001962423324584961, -0.001891493797302246, -0.0018205642700195312, -0.0017496347427368164, -0.0016787052154541016, -0.0016077756881713867, -0.0015368461608886719, -0.001465916633605957, -0.0013949871063232422, -0.0013240575790405273, -0.0012531280517578125, -0.0011821985244750977, -0.0011112689971923828, -0.001040339469909668, -0.0009694099426269531, -0.0008984804153442383, -0.0008275508880615234, -0.0007566213607788086, -0.0006856918334960938, -0.0006147623062133789, -0.0005438327789306641, -0.0004729032516479492, -0.0004019737243652344, -0.00033104419708251953, -0.0002601146697998047, -0.00018918514251708984, -0.000118255615234375, -4.7326087951660156e-05, 2.3603439331054688e-05, 9.453296661376953e-05, 0.00016546249389648438, 0.00023639202117919922, 0.00030732154846191406, 0.0003782510757446289, 0.00044918060302734375, 0.0005201101303100586, 0.0005910396575927734, 0.0006619691848754883, 0.0007328987121582031, 0.000803828239440918, 0.0008747577667236328, 0.0009456872940063477, 0.0010166168212890625, 0.0010875463485717773, 0.0011584758758544922, 0.001229405403137207, 0.0013003349304199219, 0.0013712644577026367, 0.0014421939849853516, 0.0015131235122680664, 0.0015840530395507812, 0.001654982566833496, 0.001725912094116211, 0.0017968416213989258, 0.0018677711486816406, 0.0019387006759643555, 0.0020096302032470703, 0.002080559730529785, 0.0021514892578125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 2.0, 12.0, 22.0, 30.0, 45.0, 87.0, 159.0, 255.0, 447.0, 679.0, 1110.0, 1978.0, 3196.0, 5091.0, 8198.0, 13258.0, 20228.0, 30394.0, 42872.0, 58987.0, 76685.0, 91665.0, 103249.0, 108270.0, 105375.0, 95255.0, 79664.0, 62116.0, 46232.0, 32804.0, 22122.0, 14443.0, 9004.0, 5630.0, 3506.0, 2157.0, 1320.0, 801.0, 485.0, 253.0, 177.0, 120.0, 62.0, 42.0, 25.0, 24.0, 11.0, 7.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.125, -17.551513671875, -16.97802734375, -16.404541015625, -15.8310546875, -15.257568359375, -14.68408203125, -14.110595703125, -13.537109375, -12.963623046875, -12.39013671875, -11.816650390625, -11.2431640625, -10.669677734375, -10.09619140625, -9.522705078125, -8.94921875, -8.375732421875, -7.80224609375, -7.228759765625, -6.6552734375, -6.081787109375, -5.50830078125, -4.934814453125, -4.361328125, -3.787841796875, -3.21435546875, -2.640869140625, -2.0673828125, -1.493896484375, -0.92041015625, -0.346923828125, 0.2265625, 0.800048828125, 1.37353515625, 1.947021484375, 2.5205078125, 3.093994140625, 3.66748046875, 4.240966796875, 4.814453125, 5.387939453125, 5.96142578125, 6.534912109375, 7.1083984375, 7.681884765625, 8.25537109375, 8.828857421875, 9.40234375, 9.975830078125, 10.54931640625, 11.122802734375, 11.6962890625, 12.269775390625, 12.84326171875, 13.416748046875, 13.990234375, 14.563720703125, 15.13720703125, 15.710693359375, 16.2841796875, 16.857666015625, 17.43115234375, 18.004638671875, 18.578125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 6.0, 3.0, 10.0, 11.0, 13.0, 20.0, 18.0, 23.0, 21.0, 33.0, 28.0, 40.0, 38.0, 57.0, 43.0, 35.0, 48.0, 55.0, 43.0, 46.0, 43.0, 40.0, 45.0, 45.0, 37.0, 41.0, 23.0, 22.0, 18.0, 23.0, 9.0, 13.0, 5.0, 8.0, 7.0, 5.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-9.5234375, -9.2333984375, -8.943359375, -8.6533203125, -8.36328125, -8.0732421875, -7.783203125, -7.4931640625, -7.203125, -6.9130859375, -6.623046875, -6.3330078125, -6.04296875, -5.7529296875, -5.462890625, -5.1728515625, -4.8828125, -4.5927734375, -4.302734375, -4.0126953125, -3.72265625, -3.4326171875, -3.142578125, -2.8525390625, -2.5625, -2.2724609375, -1.982421875, -1.6923828125, -1.40234375, -1.1123046875, -0.822265625, -0.5322265625, -0.2421875, 0.0478515625, 0.337890625, 0.6279296875, 0.91796875, 1.2080078125, 1.498046875, 1.7880859375, 2.078125, 2.3681640625, 2.658203125, 2.9482421875, 3.23828125, 3.5283203125, 3.818359375, 4.1083984375, 4.3984375, 4.6884765625, 4.978515625, 5.2685546875, 5.55859375, 5.8486328125, 6.138671875, 6.4287109375, 6.71875, 7.0087890625, 7.298828125, 7.5888671875, 7.87890625, 8.1689453125, 8.458984375, 8.7490234375, 9.0390625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 4.0, 6.0, 6.0, 10.0, 21.0, 19.0, 25.0, 23.0, 31.0, 20.0, 24.0, 32.0, 45.0, 36.0, 47.0, 51.0, 36.0, 44.0, 35.0, 45.0, 40.0, 40.0, 46.0, 39.0, 38.0, 30.0, 29.0, 24.0, 23.0, 22.0, 22.0, 12.0, 15.0, 13.0, 10.0, 10.0, 7.0, 1.0, 3.0, 4.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-51.689064025878906, -49.94804382324219, -48.207027435302734, -46.466007232666016, -44.72499084472656, -42.983970642089844, -41.242950439453125, -39.50193405151367, -37.76091766357422, -36.0198974609375, -34.27888107299805, -32.53786087036133, -30.796844482421875, -29.055824279785156, -27.31480598449707, -25.573787689208984, -23.832767486572266, -22.09174919128418, -20.350730895996094, -18.609710693359375, -16.868694305419922, -15.12767505645752, -13.386655807495117, -11.645637512207031, -9.904619216918945, -8.16360092163086, -6.422582149505615, -4.681563377380371, -2.940545082092285, -1.1995267868041992, 0.5414924621582031, 2.282510757446289, 4.023529052734375, 5.764547348022461, 7.505566120147705, 9.24658489227295, 10.987603187561035, 12.728621482849121, 14.469640731811523, 16.21065902709961, 17.951677322387695, 19.69269561767578, 21.433713912963867, 23.174732208251953, 24.915752410888672, 26.656768798828125, 28.397789001464844, 30.13880729675293, 31.879825592041016, 33.620845794677734, 35.36186218261719, 37.102882385253906, 38.84389877319336, 40.58491897583008, 42.32593536376953, 44.06695556640625, 45.80797576904297, 47.54899597167969, 49.29001235961914, 51.03103256225586, 52.77204895019531, 54.51306915283203, 56.25408935546875, 57.9951057434082, 59.736122131347656]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 9.0, 3.0, 7.0, 7.0, 9.0, 21.0, 12.0, 21.0, 24.0, 19.0, 32.0, 30.0, 41.0, 32.0, 37.0, 40.0, 45.0, 41.0, 44.0, 50.0, 37.0, 45.0, 49.0, 56.0, 48.0, 27.0, 29.0, 30.0, 35.0, 24.0, 16.0, 13.0, 12.0, 12.0, 12.0, 10.0, 8.0, 3.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.05008697509766, -67.79537200927734, -65.54065704345703, -63.28593826293945, -61.03122329711914, -58.77650833129883, -56.52178955078125, -54.26707458496094, -52.012359619140625, -49.75764465332031, -47.5029296875, -45.24821090698242, -42.99349594116211, -40.7387809753418, -38.48406219482422, -36.229347229003906, -33.974632263183594, -31.71991729736328, -29.465200424194336, -27.21048355102539, -24.955768585205078, -22.701053619384766, -20.44633674621582, -18.191619873046875, -15.936904907226562, -13.682188987731934, -11.427473068237305, -9.172757148742676, -6.918041229248047, -4.663325309753418, -2.408609390258789, -0.15389347076416016, 2.100830078125, 4.355545997619629, 6.610261917114258, 8.864977836608887, 11.119693756103516, 13.374409675598145, 15.629125595092773, 17.88384246826172, 20.13855743408203, 22.393272399902344, 24.64798927307129, 26.902706146240234, 29.157421112060547, 31.41213607788086, 33.66685485839844, 35.92156982421875, 38.17628479003906, 40.430999755859375, 42.68571472167969, 44.940433502197266, 47.19514846801758, 49.44986343383789, 51.70458221435547, 53.95929718017578, 56.214012145996094, 58.468727111816406, 60.72344207763672, 62.9781608581543, 65.23287963867188, 67.48759460449219, 69.7423095703125, 71.99702453613281, 74.25173950195312]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 7.0, 2.0, 6.0, 10.0, 9.0, 19.0, 26.0, 43.0, 59.0, 64.0, 120.0, 149.0, 241.0, 343.0, 481.0, 728.0, 983.0, 1471.0, 1886.0, 2503.0, 2994.0, 1023910.0, 3864.0, 2768.0, 2174.0, 1684.0, 1191.0, 867.0, 628.0, 438.0, 298.0, 213.0, 129.0, 73.0, 62.0, 42.0, 28.0, 27.0, 17.0, 20.0, 9.0, 7.0, 3.0, 2.0, 1.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-687.7626953125, -664.6614990234375, -641.560302734375, -618.4591064453125, -595.35791015625, -572.2567138671875, -549.155517578125, -526.0543212890625, -502.9530944824219, -479.8518981933594, -456.7507019042969, -433.64947509765625, -410.54827880859375, -387.44708251953125, -364.34588623046875, -341.24468994140625, -318.14349365234375, -295.04229736328125, -271.94110107421875, -248.8398895263672, -225.7386932373047, -202.6374969482422, -179.53628540039062, -156.43508911132812, -133.33389282226562, -110.23269653320312, -87.1314926147461, -64.03028869628906, -40.92909240722656, -17.827896118164062, 5.2733154296875, 28.37451171875, 51.47564697265625, 74.57684326171875, 97.67804718017578, 120.77925109863281, 143.8804473876953, 166.9816436767578, 190.08285522460938, 213.18405151367188, 236.28524780273438, 259.3864440917969, 282.4876403808594, 305.5888671875, 328.6900634765625, 351.791259765625, 374.8924560546875, 397.99365234375, 421.0948486328125, 444.196044921875, 467.2972412109375, 490.3984375, 513.4996337890625, 536.600830078125, 559.7020263671875, 582.80322265625, 605.9044189453125, 629.005615234375, 652.1068115234375, 675.2080078125, 698.3092041015625, 721.410400390625, 744.5115966796875, 767.61279296875, 790.7140502929688]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 3.0, 2.0, 7.0, 17.0, 8.0, 15.0, 32.0, 40.0, 48.0, 81.0, 107.0, 142.0, 231.0, 313.0, 488.0, 643.0, 950.0, 1227.0, 1703.0, 2289.0, 3300.0, 4833.0, 7550.0, 12566.0, 21487.0, 51323312.0, 41807.0, 17170.0, 10269.0, 6317.0, 4165.0, 2900.0, 2066.0, 1530.0, 1113.0, 805.0, 521.0, 414.0, 290.0, 173.0, 121.0, 89.0, 71.0, 39.0, 29.0, 17.0, 19.0, 18.0, 7.0, 7.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-453.78790283203125, -438.561767578125, -423.33563232421875, -408.1095275878906, -392.8833923339844, -377.6572570800781, -362.4311218261719, -347.20501708984375, -331.9788818359375, -316.75274658203125, -301.526611328125, -286.3005065917969, -271.0743713378906, -255.84823608398438, -240.62210083007812, -225.39598083496094, -210.1698455810547, -194.94371032714844, -179.71759033203125, -164.491455078125, -149.2653350830078, -134.03919982910156, -118.81307220458984, -103.58694458007812, -88.3608169555664, -73.13468933105469, -57.90856170654297, -42.682430267333984, -27.456302642822266, -12.230171203613281, 2.9959564208984375, 18.222084045410156, 33.448211669921875, 48.674339294433594, 63.90046691894531, 79.12660217285156, 94.35272216796875, 109.578857421875, 124.80498504638672, 140.03111267089844, 155.25723266601562, 170.48336791992188, 185.70948791503906, 200.9356231689453, 216.1617431640625, 231.38787841796875, 246.614013671875, 261.84014892578125, 277.0662841796875, 292.29241943359375, 307.5185546875, 322.7446594238281, 337.9707946777344, 353.1969299316406, 368.4230651855469, 383.649169921875, 398.87530517578125, 414.1014404296875, 429.32757568359375, 444.5536804199219, 459.7798156738281, 475.0059509277344, 490.2320861816406, 505.45819091796875, 520.684326171875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 10.0, 6.0, 14.0, 9.0, 19.0, 38.0, 45.0, 72.0, 126.0, 177.0, 261.0, 403.0, 632.0, 947.0, 1552.0, 2404.0, 3790.0, 6372.0, 10733.0, 18858.0, 34463.0, 66873.0, 136630.0, 300552.0, 719828.0, 1969634.0, 1811970.0, 659050.0, 278935.0, 128233.0, 61776.0, 32570.0, 18083.0, 10246.0, 6083.0, 3726.0, 2302.0, 1416.0, 902.0, 568.0, 366.0, 248.0, 161.0, 121.0, 77.0, 60.0, 38.0, 19.0, 22.0, 11.0, 8.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0], "bins": [-42.6875, -41.39208984375, -40.0966796875, -38.80126953125, -37.505859375, -36.21044921875, -34.9150390625, -33.61962890625, -32.32421875, -31.02880859375, -29.7333984375, -28.43798828125, -27.142578125, -25.84716796875, -24.5517578125, -23.25634765625, -21.9609375, -20.66552734375, -19.3701171875, -18.07470703125, -16.779296875, -15.48388671875, -14.1884765625, -12.89306640625, -11.59765625, -10.30224609375, -9.0068359375, -7.71142578125, -6.416015625, -5.12060546875, -3.8251953125, -2.52978515625, -1.234375, 0.06103515625, 1.3564453125, 2.65185546875, 3.947265625, 5.24267578125, 6.5380859375, 7.83349609375, 9.12890625, 10.42431640625, 11.7197265625, 13.01513671875, 14.310546875, 15.60595703125, 16.9013671875, 18.19677734375, 19.4921875, 20.78759765625, 22.0830078125, 23.37841796875, 24.673828125, 25.96923828125, 27.2646484375, 28.56005859375, 29.85546875, 31.15087890625, 32.4462890625, 33.74169921875, 35.037109375, 36.33251953125, 37.6279296875, 38.92333984375, 40.21875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 7.0, 7.0, 11.0, 10.0, 8.0, 17.0, 14.0, 22.0, 23.0, 19.0, 26.0, 30.0, 39.0, 41.0, 41.0, 60.0, 75.0, 102.0, 188.0, 286.0, 277.0, 190.0, 115.0, 84.0, 46.0, 49.0, 32.0, 24.0, 25.0, 20.0, 25.0, 22.0, 18.0, 14.0, 19.0, 13.0, 6.0, 3.0, 6.0, 6.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-36.71875, -35.60888671875, -34.4990234375, -33.38916015625, -32.279296875, -31.16943359375, -30.0595703125, -28.94970703125, -27.83984375, -26.72998046875, -25.6201171875, -24.51025390625, -23.400390625, -22.29052734375, -21.1806640625, -20.07080078125, -18.9609375, -17.85107421875, -16.7412109375, -15.63134765625, -14.521484375, -13.41162109375, -12.3017578125, -11.19189453125, -10.08203125, -8.97216796875, -7.8623046875, -6.75244140625, -5.642578125, -4.53271484375, -3.4228515625, -2.31298828125, -1.203125, -0.09326171875, 1.0166015625, 2.12646484375, 3.236328125, 4.34619140625, 5.4560546875, 6.56591796875, 7.67578125, 8.78564453125, 9.8955078125, 11.00537109375, 12.115234375, 13.22509765625, 14.3349609375, 15.44482421875, 16.5546875, 17.66455078125, 18.7744140625, 19.88427734375, 20.994140625, 22.10400390625, 23.2138671875, 24.32373046875, 25.43359375, 26.54345703125, 27.6533203125, 28.76318359375, 29.873046875, 30.98291015625, 32.0927734375, 33.20263671875, 34.3125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 8.0, 10.0, 11.0, 16.0, 12.0, 34.0, 54.0, 70.0, 123.0, 156.0, 265.0, 479.0, 851.0, 1544.0, 2791.0, 5680.0, 10656.0, 20448.0, 39334.0, 75703.0, 144835.0, 274111.0, 557595.0, 1748728.0, 2107509.0, 658797.0, 305248.0, 159955.0, 84355.0, 44042.0, 22536.0, 11790.0, 6136.0, 3390.0, 1827.0, 974.0, 545.0, 299.0, 198.0, 122.0, 71.0, 43.0, 32.0, 19.0, 13.0, 5.0, 9.0, 6.0, 3.0, 1.0, 0.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.578125, -15.966064453125, -15.35400390625, -14.741943359375, -14.1298828125, -13.517822265625, -12.90576171875, -12.293701171875, -11.681640625, -11.069580078125, -10.45751953125, -9.845458984375, -9.2333984375, -8.621337890625, -8.00927734375, -7.397216796875, -6.78515625, -6.173095703125, -5.56103515625, -4.948974609375, -4.3369140625, -3.724853515625, -3.11279296875, -2.500732421875, -1.888671875, -1.276611328125, -0.66455078125, -0.052490234375, 0.5595703125, 1.171630859375, 1.78369140625, 2.395751953125, 3.0078125, 3.619873046875, 4.23193359375, 4.843994140625, 5.4560546875, 6.068115234375, 6.68017578125, 7.292236328125, 7.904296875, 8.516357421875, 9.12841796875, 9.740478515625, 10.3525390625, 10.964599609375, 11.57666015625, 12.188720703125, 12.80078125, 13.412841796875, 14.02490234375, 14.636962890625, 15.2490234375, 15.861083984375, 16.47314453125, 17.085205078125, 17.697265625, 18.309326171875, 18.92138671875, 19.533447265625, 20.1455078125, 20.757568359375, 21.36962890625, 21.981689453125, 22.59375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 6.0, 8.0, 7.0, 10.0, 12.0, 11.0, 10.0, 21.0, 16.0, 18.0, 24.0, 26.0, 17.0, 32.0, 37.0, 40.0, 40.0, 73.0, 109.0, 163.0, 270.0, 298.0, 224.0, 119.0, 56.0, 51.0, 45.0, 44.0, 27.0, 28.0, 20.0, 19.0, 26.0, 21.0, 11.0, 16.0, 13.0, 12.0, 7.0, 10.0, 4.0, 5.0, 7.0, 1.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-25.515625, -24.673583984375, -23.83154296875, -22.989501953125, -22.1474609375, -21.305419921875, -20.46337890625, -19.621337890625, -18.779296875, -17.937255859375, -17.09521484375, -16.253173828125, -15.4111328125, -14.569091796875, -13.72705078125, -12.885009765625, -12.04296875, -11.200927734375, -10.35888671875, -9.516845703125, -8.6748046875, -7.832763671875, -6.99072265625, -6.148681640625, -5.306640625, -4.464599609375, -3.62255859375, -2.780517578125, -1.9384765625, -1.096435546875, -0.25439453125, 0.587646484375, 1.4296875, 2.271728515625, 3.11376953125, 3.955810546875, 4.7978515625, 5.639892578125, 6.48193359375, 7.323974609375, 8.166015625, 9.008056640625, 9.85009765625, 10.692138671875, 11.5341796875, 12.376220703125, 13.21826171875, 14.060302734375, 14.90234375, 15.744384765625, 16.58642578125, 17.428466796875, 18.2705078125, 19.112548828125, 19.95458984375, 20.796630859375, 21.638671875, 22.480712890625, 23.32275390625, 24.164794921875, 25.0068359375, 25.848876953125, 26.69091796875, 27.532958984375, 28.375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 1.0, 3.0, 8.0, 11.0, 16.0, 14.0, 16.0, 31.0, 50.0, 50.0, 78.0, 88.0, 136.0, 167.0, 251.0, 338.0, 517.0, 733.0, 1157.0, 1858.0, 3291.0, 6365.0, 13353.0, 29844.0, 73962.0, 409704.0, 5582277.0, 96354.0, 36870.0, 16283.0, 7746.0, 3833.0, 2041.0, 1247.0, 833.0, 559.0, 363.0, 244.0, 198.0, 144.0, 98.0, 81.0, 57.0, 64.0, 35.0, 29.0, 13.0, 7.0, 9.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-57.78125, -55.982421875, -54.18359375, -52.384765625, -50.5859375, -48.787109375, -46.98828125, -45.189453125, -43.390625, -41.591796875, -39.79296875, -37.994140625, -36.1953125, -34.396484375, -32.59765625, -30.798828125, -29.0, -27.201171875, -25.40234375, -23.603515625, -21.8046875, -20.005859375, -18.20703125, -16.408203125, -14.609375, -12.810546875, -11.01171875, -9.212890625, -7.4140625, -5.615234375, -3.81640625, -2.017578125, -0.21875, 1.580078125, 3.37890625, 5.177734375, 6.9765625, 8.775390625, 10.57421875, 12.373046875, 14.171875, 15.970703125, 17.76953125, 19.568359375, 21.3671875, 23.166015625, 24.96484375, 26.763671875, 28.5625, 30.361328125, 32.16015625, 33.958984375, 35.7578125, 37.556640625, 39.35546875, 41.154296875, 42.953125, 44.751953125, 46.55078125, 48.349609375, 50.1484375, 51.947265625, 53.74609375, 55.544921875, 57.34375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 3.0, 4.0, 7.0, 5.0, 7.0, 7.0, 11.0, 8.0, 10.0, 11.0, 17.0, 18.0, 20.0, 16.0, 25.0, 29.0, 30.0, 30.0, 33.0, 35.0, 41.0, 59.0, 88.0, 196.0, 346.0, 346.0, 148.0, 73.0, 37.0, 33.0, 44.0, 32.0, 34.0, 26.0, 33.0, 23.0, 15.0, 24.0, 20.0, 12.0, 16.0, 11.0, 11.0, 8.0, 4.0, 7.0, 3.0, 4.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-25.265625, -24.359130859375, -23.45263671875, -22.546142578125, -21.6396484375, -20.733154296875, -19.82666015625, -18.920166015625, -18.013671875, -17.107177734375, -16.20068359375, -15.294189453125, -14.3876953125, -13.481201171875, -12.57470703125, -11.668212890625, -10.76171875, -9.855224609375, -8.94873046875, -8.042236328125, -7.1357421875, -6.229248046875, -5.32275390625, -4.416259765625, -3.509765625, -2.603271484375, -1.69677734375, -0.790283203125, 0.1162109375, 1.022705078125, 1.92919921875, 2.835693359375, 3.7421875, 4.648681640625, 5.55517578125, 6.461669921875, 7.3681640625, 8.274658203125, 9.18115234375, 10.087646484375, 10.994140625, 11.900634765625, 12.80712890625, 13.713623046875, 14.6201171875, 15.526611328125, 16.43310546875, 17.339599609375, 18.24609375, 19.152587890625, 20.05908203125, 20.965576171875, 21.8720703125, 22.778564453125, 23.68505859375, 24.591552734375, 25.498046875, 26.404541015625, 27.31103515625, 28.217529296875, 29.1240234375, 30.030517578125, 30.93701171875, 31.843505859375, 32.75]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 13.0, 21.0, 33.0, 110.0, 562.0, 161.0, 50.0, 23.0, 12.0, 2.0, 5.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1604.7135009765625, -1558.310546875, -1511.907470703125, -1465.5045166015625, -1419.1014404296875, -1372.698486328125, -1326.29541015625, -1279.8924560546875, -1233.489501953125, -1187.0865478515625, -1140.6834716796875, -1094.280517578125, -1047.87744140625, -1001.4744873046875, -955.0714721679688, -908.66845703125, -862.265380859375, -815.8623657226562, -769.4593505859375, -723.056396484375, -676.6533203125, -630.2503662109375, -583.8473510742188, -537.4443359375, -491.04132080078125, -444.6383056640625, -398.23529052734375, -351.8323059082031, -305.4292907714844, -259.0262756347656, -212.623291015625, -166.22027587890625, -119.8172607421875, -73.41425323486328, -27.011245727539062, 19.391754150390625, 65.79476928710938, 112.19778442382812, 158.60076904296875, 205.0037841796875, 251.40679931640625, 297.809814453125, 344.21282958984375, 390.6158142089844, 437.0188293457031, 483.4218444824219, 529.8248291015625, 576.2278442382812, 622.630859375, 669.0338745117188, 715.4368896484375, 761.83984375, 808.242919921875, 854.6458740234375, 901.0488891601562, 947.451904296875, 993.8549194335938, 1040.2579345703125, 1086.660888671875, 1133.06396484375, 1179.4669189453125, 1225.8699951171875, 1272.27294921875, 1318.676025390625, 1365.0789794921875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 3.0, 7.0, 11.0, 10.0, 9.0, 22.0, 30.0, 52.0, 145.0, 395.0, 149.0, 55.0, 22.0, 22.0, 19.0, 13.0, 5.0, 9.0, 7.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1452.1236572265625, -1404.576904296875, -1357.0301513671875, -1309.4833984375, -1261.936767578125, -1214.3900146484375, -1166.84326171875, -1119.2965087890625, -1071.749755859375, -1024.2030029296875, -976.65625, -929.1095581054688, -881.5628051757812, -834.0160522460938, -786.4693603515625, -738.922607421875, -691.3758544921875, -643.8291015625, -596.2823486328125, -548.7356567382812, -501.18890380859375, -453.64215087890625, -406.0954284667969, -358.5487060546875, -311.001953125, -263.4552001953125, -215.90847778320312, -168.3617401123047, -120.81500244140625, -73.26826477050781, -25.721527099609375, 21.8251953125, 69.3720703125, 116.91880798339844, 164.46554565429688, 212.0122833251953, 259.55902099609375, 307.10577392578125, 354.6524963378906, 402.19921875, 449.7459716796875, 497.292724609375, 544.8394775390625, 592.3861694335938, 639.9329223632812, 687.4796752929688, 735.0263671875, 782.5731201171875, 830.119873046875, 877.6666259765625, 925.21337890625, 972.7600708007812, 1020.3068237304688, 1067.853515625, 1115.4002685546875, 1162.947021484375, 1210.4937744140625, 1258.04052734375, 1305.5872802734375, 1353.134033203125, 1400.6806640625, 1448.2274169921875, 1495.774169921875, 1543.3209228515625, 1590.86767578125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 1.0, 4.0, 4.0, 13.0, 10.0, 8.0, 28.0, 23.0, 31.0, 50.0, 64.0, 74.0, 108.0, 145.0, 154.0, 216.0, 324.0, 425.0, 554.0, 780.0, 1132.0, 1800.0, 2908.0, 4879.0, 9032.0, 18413.0, 41730.0, 116273.0, 712764.0, 2966705.0, 209657.0, 60061.0, 23338.0, 10619.0, 5243.0, 2814.0, 1560.0, 807.0, 560.0, 352.0, 232.0, 133.0, 81.0, 63.0, 49.0, 30.0, 10.0, 9.0, 3.0, 9.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.62109375, -4.48980712890625, -4.3585205078125, -4.22723388671875, -4.095947265625, -3.96466064453125, -3.8333740234375, -3.70208740234375, -3.57080078125, -3.43951416015625, -3.3082275390625, -3.17694091796875, -3.045654296875, -2.91436767578125, -2.7830810546875, -2.65179443359375, -2.5205078125, -2.38922119140625, -2.2579345703125, -2.12664794921875, -1.995361328125, -1.86407470703125, -1.7327880859375, -1.60150146484375, -1.47021484375, -1.33892822265625, -1.2076416015625, -1.07635498046875, -0.945068359375, -0.81378173828125, -0.6824951171875, -0.55120849609375, -0.419921875, -0.28863525390625, -0.1573486328125, -0.02606201171875, 0.105224609375, 0.23651123046875, 0.3677978515625, 0.49908447265625, 0.63037109375, 0.76165771484375, 0.8929443359375, 1.02423095703125, 1.155517578125, 1.28680419921875, 1.4180908203125, 1.54937744140625, 1.6806640625, 1.81195068359375, 1.9432373046875, 2.07452392578125, 2.205810546875, 2.33709716796875, 2.4683837890625, 2.59967041015625, 2.73095703125, 2.86224365234375, 2.9935302734375, 3.12481689453125, 3.256103515625, 3.38739013671875, 3.5186767578125, 3.64996337890625, 3.78125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 4.0, 7.0, 7.0, 17.0, 11.0, 16.0, 25.0, 26.0, 36.0, 49.0, 171.0, 284.0, 138.0, 70.0, 35.0, 28.0, 11.0, 14.0, 17.0, 6.0, 1.0, 7.0, 3.0, 5.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.72119140625, -0.7040748596191406, -0.6869583129882812, -0.6698417663574219, -0.6527252197265625, -0.6356086730957031, -0.6184921264648438, -0.6013755798339844, -0.584259033203125, -0.5671424865722656, -0.5500259399414062, -0.5329093933105469, -0.5157928466796875, -0.4986763000488281, -0.48155975341796875, -0.4644432067871094, -0.44732666015625, -0.4302101135253906, -0.41309356689453125, -0.3959770202636719, -0.3788604736328125, -0.3617439270019531, -0.34462738037109375, -0.3275108337402344, -0.310394287109375, -0.2932777404785156, -0.27616119384765625, -0.2590446472167969, -0.2419281005859375, -0.22481155395507812, -0.20769500732421875, -0.19057846069335938, -0.1734619140625, -0.15634536743164062, -0.13922882080078125, -0.12211227416992188, -0.1049957275390625, -0.08787918090820312, -0.07076263427734375, -0.053646087646484375, -0.036529541015625, -0.019412994384765625, -0.00229644775390625, 0.014820098876953125, 0.0319366455078125, 0.049053192138671875, 0.06616973876953125, 0.08328628540039062, 0.10040283203125, 0.11751937866210938, 0.13463592529296875, 0.15175247192382812, 0.1688690185546875, 0.18598556518554688, 0.20310211181640625, 0.22021865844726562, 0.237335205078125, 0.2544517517089844, 0.27156829833984375, 0.2886848449707031, 0.3058013916015625, 0.3229179382324219, 0.34003448486328125, 0.3571510314941406, 0.374267578125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 5.0, 9.0, 6.0, 16.0, 17.0, 28.0, 39.0, 74.0, 108.0, 279.0, 547.0, 1220.0, 3093.0, 10052.0, 44012.0, 354689.0, 3083116.0, 614770.0, 62787.0, 12871.0, 3803.0, 1395.0, 615.0, 286.0, 160.0, 83.0, 62.0, 33.0, 29.0, 17.0, 16.0, 11.0, 6.0, 7.0, 4.0, 2.0, 4.0, 4.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8984375, -6.68017578125, -6.4619140625, -6.24365234375, -6.025390625, -5.80712890625, -5.5888671875, -5.37060546875, -5.15234375, -4.93408203125, -4.7158203125, -4.49755859375, -4.279296875, -4.06103515625, -3.8427734375, -3.62451171875, -3.40625, -3.18798828125, -2.9697265625, -2.75146484375, -2.533203125, -2.31494140625, -2.0966796875, -1.87841796875, -1.66015625, -1.44189453125, -1.2236328125, -1.00537109375, -0.787109375, -0.56884765625, -0.3505859375, -0.13232421875, 0.0859375, 0.30419921875, 0.5224609375, 0.74072265625, 0.958984375, 1.17724609375, 1.3955078125, 1.61376953125, 1.83203125, 2.05029296875, 2.2685546875, 2.48681640625, 2.705078125, 2.92333984375, 3.1416015625, 3.35986328125, 3.578125, 3.79638671875, 4.0146484375, 4.23291015625, 4.451171875, 4.66943359375, 4.8876953125, 5.10595703125, 5.32421875, 5.54248046875, 5.7607421875, 5.97900390625, 6.197265625, 6.41552734375, 6.6337890625, 6.85205078125, 7.0703125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 7.0, 4.0, 6.0, 12.0, 17.0, 35.0, 19.0, 34.0, 34.0, 59.0, 56.0, 96.0, 118.0, 168.0, 203.0, 256.0, 336.0, 389.0, 443.0, 384.0, 333.0, 235.0, 212.0, 144.0, 111.0, 84.0, 64.0, 54.0, 48.0, 28.0, 20.0, 14.0, 12.0, 15.0, 9.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.80810546875, -0.7789077758789062, -0.7497100830078125, -0.7205123901367188, -0.691314697265625, -0.6621170043945312, -0.6329193115234375, -0.6037216186523438, -0.57452392578125, -0.5453262329101562, -0.5161285400390625, -0.48693084716796875, -0.457733154296875, -0.42853546142578125, -0.3993377685546875, -0.37014007568359375, -0.3409423828125, -0.31174468994140625, -0.2825469970703125, -0.25334930419921875, -0.224151611328125, -0.19495391845703125, -0.1657562255859375, -0.13655853271484375, -0.10736083984375, -0.07816314697265625, -0.0489654541015625, -0.01976776123046875, 0.009429931640625, 0.03862762451171875, 0.0678253173828125, 0.09702301025390625, 0.126220703125, 0.15541839599609375, 0.1846160888671875, 0.21381378173828125, 0.243011474609375, 0.27220916748046875, 0.3014068603515625, 0.33060455322265625, 0.35980224609375, 0.38899993896484375, 0.4181976318359375, 0.44739532470703125, 0.476593017578125, 0.5057907104492188, 0.5349884033203125, 0.5641860961914062, 0.5933837890625, 0.6225814819335938, 0.6517791748046875, 0.6809768676757812, 0.710174560546875, 0.7393722534179688, 0.7685699462890625, 0.7977676391601562, 0.82696533203125, 0.8561630249023438, 0.8853607177734375, 0.9145584106445312, 0.943756103515625, 0.9729537963867188, 1.0021514892578125, 1.0313491821289062, 1.060546875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 5.0, 4.0, 11.0, 19.0, 39.0, 37.0, 59.0, 96.0, 146.0, 152.0, 125.0, 102.0, 60.0, 50.0, 31.0, 15.0, 9.0, 10.0, 9.0, 1.0, 4.0, 6.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.963120460510254, -15.550540924072266, -15.137961387634277, -14.725381851196289, -14.312803268432617, -13.900222778320312, -13.48764419555664, -13.075064659118652, -12.662485122680664, -12.249905586242676, -11.837326049804688, -11.4247465133667, -11.012166976928711, -10.599588394165039, -10.18700885772705, -9.774429321289062, -9.361849784851074, -8.949270248413086, -8.536690711975098, -8.12411117553711, -7.711532115936279, -7.298952579498291, -6.886373519897461, -6.473793983459473, -6.061214447021484, -5.648634910583496, -5.236055374145508, -4.823476314544678, -4.4108967781066895, -3.998317241668701, -3.585737943649292, -3.173158645629883, -2.760578155517578, -2.34799861907959, -1.9354193210601807, -1.522839903831482, -1.1102604866027832, -0.6976809501647949, -0.28510165214538574, 0.12747764587402344, 0.5400571823120117, 0.9526365995407104, 1.3652160167694092, 1.777795433998108, 2.1903748512268066, 2.602954387664795, 3.015533685684204, 3.4281129837036133, 3.8406925201416016, 4.25327205657959, 4.665851593017578, 5.078430652618408, 5.4910101890563965, 5.903589725494385, 6.316168785095215, 6.728748321533203, 7.141327857971191, 7.55390739440918, 7.966486930847168, 8.379066467285156, 8.791645050048828, 9.204225540161133, 9.616804122924805, 10.029383659362793, 10.441963195800781]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 12.0, 15.0, 29.0, 26.0, 39.0, 46.0, 48.0, 58.0, 108.0, 92.0, 93.0, 93.0, 68.0, 79.0, 62.0, 39.0, 25.0, 24.0, 14.0, 14.0, 11.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.812475204467773, -7.484566688537598, -7.156658172607422, -6.828749656677246, -6.50084114074707, -6.1729326248168945, -5.845024108886719, -5.517115592956543, -5.189207077026367, -4.861298561096191, -4.533390045166016, -4.20548152923584, -3.877573013305664, -3.5496644973754883, -3.2217557430267334, -2.8938472270965576, -2.5659384727478027, -2.238029956817627, -1.9101214408874512, -1.5822128057479858, -1.25430428981781, -0.9263957738876343, -0.598487138748169, -0.27057862281799316, 0.05732989311218262, 0.3852384388446808, 0.713146984577179, 1.0410555601119995, 1.3689640760421753, 1.696872591972351, 2.0247812271118164, 2.352689743041992, 2.680598258972168, 3.0085067749023438, 3.3364152908325195, 3.6643238067626953, 3.992232322692871, 4.320140838623047, 4.648049354553223, 4.975957870483398, 5.303866386413574, 5.63177490234375, 5.959683418273926, 6.287591934204102, 6.615500450134277, 6.943408966064453, 7.271317481994629, 7.599225997924805, 7.927134990692139, 8.255043983459473, 8.582952499389648, 8.910861015319824, 9.23876953125, 9.566678047180176, 9.894586563110352, 10.222495079040527, 10.550403594970703, 10.878312110900879, 11.206220626831055, 11.53412914276123, 11.862037658691406, 12.189946174621582, 12.517854690551758, 12.845763206481934, 13.17367172241211]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 8.0, 10.0, 11.0, 25.0, 34.0, 47.0, 47.0, 38.0, 71.0, 103.0, 144.0, 252.0, 418.0, 783.0, 1456.0, 2971.0, 6893.0, 19834.0, 86907.0, 687453.0, 191608.0, 31276.0, 9921.0, 3996.0, 1812.0, 939.0, 540.0, 350.0, 195.0, 113.0, 75.0, 58.0, 47.0, 40.0, 29.0, 16.0, 14.0, 5.0, 8.0, 4.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-6.49609375, -6.30877685546875, -6.1214599609375, -5.93414306640625, -5.746826171875, -5.55950927734375, -5.3721923828125, -5.18487548828125, -4.99755859375, -4.81024169921875, -4.6229248046875, -4.43560791015625, -4.248291015625, -4.06097412109375, -3.8736572265625, -3.68634033203125, -3.4990234375, -3.31170654296875, -3.1243896484375, -2.93707275390625, -2.749755859375, -2.56243896484375, -2.3751220703125, -2.18780517578125, -2.00048828125, -1.81317138671875, -1.6258544921875, -1.43853759765625, -1.251220703125, -1.06390380859375, -0.8765869140625, -0.68927001953125, -0.501953125, -0.31463623046875, -0.1273193359375, 0.05999755859375, 0.247314453125, 0.43463134765625, 0.6219482421875, 0.80926513671875, 0.99658203125, 1.18389892578125, 1.3712158203125, 1.55853271484375, 1.745849609375, 1.93316650390625, 2.1204833984375, 2.30780029296875, 2.4951171875, 2.68243408203125, 2.8697509765625, 3.05706787109375, 3.244384765625, 3.43170166015625, 3.6190185546875, 3.80633544921875, 3.99365234375, 4.18096923828125, 4.3682861328125, 4.55560302734375, 4.742919921875, 4.93023681640625, 5.1175537109375, 5.30487060546875, 5.4921875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 4.0, 8.0, 6.0, 8.0, 3.0, 10.0, 13.0, 20.0, 24.0, 34.0, 40.0, 73.0, 119.0, 168.0, 131.0, 117.0, 77.0, 43.0, 25.0, 26.0, 11.0, 12.0, 8.0, 5.0, 2.0, 7.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.68896484375, -0.6720085144042969, -0.6550521850585938, -0.6380958557128906, -0.6211395263671875, -0.6041831970214844, -0.5872268676757812, -0.5702705383300781, -0.553314208984375, -0.5363578796386719, -0.5194015502929688, -0.5024452209472656, -0.4854888916015625, -0.4685325622558594, -0.45157623291015625, -0.4346199035644531, -0.41766357421875, -0.4007072448730469, -0.38375091552734375, -0.3667945861816406, -0.3498382568359375, -0.3328819274902344, -0.31592559814453125, -0.2989692687988281, -0.282012939453125, -0.2650566101074219, -0.24810028076171875, -0.23114395141601562, -0.2141876220703125, -0.19723129272460938, -0.18027496337890625, -0.16331863403320312, -0.1463623046875, -0.12940597534179688, -0.11244964599609375, -0.09549331665039062, -0.0785369873046875, -0.061580657958984375, -0.04462432861328125, -0.027667999267578125, -0.010711669921875, 0.006244659423828125, 0.02320098876953125, 0.040157318115234375, 0.0571136474609375, 0.07406997680664062, 0.09102630615234375, 0.10798263549804688, 0.12493896484375, 0.14189529418945312, 0.15885162353515625, 0.17580795288085938, 0.1927642822265625, 0.20972061157226562, 0.22667694091796875, 0.24363327026367188, 0.260589599609375, 0.2775459289550781, 0.29450225830078125, 0.3114585876464844, 0.3284149169921875, 0.3453712463378906, 0.36232757568359375, 0.3792839050292969, 0.396240234375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 6.0, 7.0, 12.0, 17.0, 9.0, 14.0, 20.0, 31.0, 33.0, 39.0, 51.0, 97.0, 140.0, 249.0, 378.0, 858.0, 2079.0, 5466.0, 18668.0, 172214.0, 775387.0, 55346.0, 10821.0, 3695.0, 1415.0, 596.0, 319.0, 181.0, 108.0, 76.0, 60.0, 36.0, 27.0, 34.0, 18.0, 14.0, 11.0, 7.0, 7.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0], "bins": [-8.296875, -8.06829833984375, -7.8397216796875, -7.61114501953125, -7.382568359375, -7.15399169921875, -6.9254150390625, -6.69683837890625, -6.46826171875, -6.23968505859375, -6.0111083984375, -5.78253173828125, -5.553955078125, -5.32537841796875, -5.0968017578125, -4.86822509765625, -4.6396484375, -4.41107177734375, -4.1824951171875, -3.95391845703125, -3.725341796875, -3.49676513671875, -3.2681884765625, -3.03961181640625, -2.81103515625, -2.58245849609375, -2.3538818359375, -2.12530517578125, -1.896728515625, -1.66815185546875, -1.4395751953125, -1.21099853515625, -0.982421875, -0.75384521484375, -0.5252685546875, -0.29669189453125, -0.068115234375, 0.16046142578125, 0.3890380859375, 0.61761474609375, 0.84619140625, 1.07476806640625, 1.3033447265625, 1.53192138671875, 1.760498046875, 1.98907470703125, 2.2176513671875, 2.44622802734375, 2.6748046875, 2.90338134765625, 3.1319580078125, 3.36053466796875, 3.589111328125, 3.81768798828125, 4.0462646484375, 4.27484130859375, 4.50341796875, 4.73199462890625, 4.9605712890625, 5.18914794921875, 5.417724609375, 5.64630126953125, 5.8748779296875, 6.10345458984375, 6.33203125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 1.0, 7.0, 2.0, 10.0, 9.0, 11.0, 15.0, 15.0, 17.0, 17.0, 21.0, 31.0, 31.0, 26.0, 34.0, 31.0, 36.0, 33.0, 30.0, 32.0, 47.0, 27.0, 40.0, 37.0, 51.0, 34.0, 28.0, 33.0, 29.0, 35.0, 20.0, 21.0, 29.0, 13.0, 21.0, 20.0, 20.0, 16.0, 19.0, 9.0, 3.0, 8.0, 7.0, 10.0, 4.0, 1.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.8173828125, -1.762298583984375, -1.70721435546875, -1.652130126953125, -1.5970458984375, -1.541961669921875, -1.48687744140625, -1.431793212890625, -1.376708984375, -1.321624755859375, -1.26654052734375, -1.211456298828125, -1.1563720703125, -1.101287841796875, -1.04620361328125, -0.991119384765625, -0.93603515625, -0.880950927734375, -0.82586669921875, -0.770782470703125, -0.7156982421875, -0.660614013671875, -0.60552978515625, -0.550445556640625, -0.495361328125, -0.440277099609375, -0.38519287109375, -0.330108642578125, -0.2750244140625, -0.219940185546875, -0.16485595703125, -0.109771728515625, -0.0546875, 0.000396728515625, 0.05548095703125, 0.110565185546875, 0.1656494140625, 0.220733642578125, 0.27581787109375, 0.330902099609375, 0.385986328125, 0.441070556640625, 0.49615478515625, 0.551239013671875, 0.6063232421875, 0.661407470703125, 0.71649169921875, 0.771575927734375, 0.82666015625, 0.881744384765625, 0.93682861328125, 0.991912841796875, 1.0469970703125, 1.102081298828125, 1.15716552734375, 1.212249755859375, 1.267333984375, 1.322418212890625, 1.37750244140625, 1.432586669921875, 1.4876708984375, 1.542755126953125, 1.59783935546875, 1.652923583984375, 1.7080078125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 9.0, 7.0, 10.0, 5.0, 10.0, 20.0, 27.0, 33.0, 53.0, 64.0, 75.0, 151.0, 219.0, 332.0, 678.0, 1214.0, 2810.0, 7293.0, 30560.0, 711277.0, 264251.0, 19371.0, 5321.0, 2247.0, 1041.0, 571.0, 327.0, 187.0, 112.0, 79.0, 56.0, 30.0, 32.0, 24.0, 22.0, 12.0, 8.0, 6.0, 2.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.53125, -10.1663818359375, -9.801513671875, -9.4366455078125, -9.07177734375, -8.7069091796875, -8.342041015625, -7.9771728515625, -7.6123046875, -7.2474365234375, -6.882568359375, -6.5177001953125, -6.15283203125, -5.7879638671875, -5.423095703125, -5.0582275390625, -4.693359375, -4.3284912109375, -3.963623046875, -3.5987548828125, -3.23388671875, -2.8690185546875, -2.504150390625, -2.1392822265625, -1.7744140625, -1.4095458984375, -1.044677734375, -0.6798095703125, -0.31494140625, 0.0499267578125, 0.414794921875, 0.7796630859375, 1.14453125, 1.5093994140625, 1.874267578125, 2.2391357421875, 2.60400390625, 2.9688720703125, 3.333740234375, 3.6986083984375, 4.0634765625, 4.4283447265625, 4.793212890625, 5.1580810546875, 5.52294921875, 5.8878173828125, 6.252685546875, 6.6175537109375, 6.982421875, 7.3472900390625, 7.712158203125, 8.0770263671875, 8.44189453125, 8.8067626953125, 9.171630859375, 9.5364990234375, 9.9013671875, 10.2662353515625, 10.631103515625, 10.9959716796875, 11.36083984375, 11.7257080078125, 12.090576171875, 12.4554443359375, 12.8203125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 13.0, 5.0, 6.0, 12.0, 17.0, 19.0, 17.0, 22.0, 32.0, 38.0, 31.0, 35.0, 44.0, 75.0, 65.0, 65.0, 60.0, 53.0, 45.0, 56.0, 43.0, 32.0, 42.0, 33.0, 36.0, 21.0, 12.0, 15.0, 14.0, 10.0, 10.0, 3.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.00022113323211669922, -0.00021559931337833405, -0.00021006539463996887, -0.0002045314759016037, -0.00019899755716323853, -0.00019346363842487335, -0.00018792971968650818, -0.000182395800948143, -0.00017686188220977783, -0.00017132796347141266, -0.00016579404473304749, -0.0001602601259946823, -0.00015472620725631714, -0.00014919228851795197, -0.0001436583697795868, -0.00013812445104122162, -0.00013259053230285645, -0.00012705661356449127, -0.0001215226948261261, -0.00011598877608776093, -0.00011045485734939575, -0.00010492093861103058, -9.93870198726654e-05, -9.385310113430023e-05, -8.831918239593506e-05, -8.278526365756989e-05, -7.725134491920471e-05, -7.171742618083954e-05, -6.618350744247437e-05, -6.064958870410919e-05, -5.511566996574402e-05, -4.9581751227378845e-05, -4.404783248901367e-05, -3.85139137506485e-05, -3.2979995012283325e-05, -2.7446076273918152e-05, -2.191215753555298e-05, -1.6378238797187805e-05, -1.0844320058822632e-05, -5.3104013204574585e-06, 2.2351741790771484e-07, 5.757436156272888e-06, 1.1291354894638062e-05, 1.6825273633003235e-05, 2.2359192371368408e-05, 2.789311110973358e-05, 3.3427029848098755e-05, 3.896094858646393e-05, 4.44948673248291e-05, 5.0028786063194275e-05, 5.556270480155945e-05, 6.109662353992462e-05, 6.66305422782898e-05, 7.216446101665497e-05, 7.769837975502014e-05, 8.323229849338531e-05, 8.876621723175049e-05, 9.430013597011566e-05, 9.983405470848083e-05, 0.00010536797344684601, 0.00011090189218521118, 0.00011643581092357635, 0.00012196972966194153, 0.0001275036484003067, 0.00013303756713867188]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 8.0, 10.0, 9.0, 19.0, 23.0, 47.0, 63.0, 113.0, 138.0, 210.0, 355.0, 617.0, 1056.0, 1906.0, 3954.0, 9254.0, 31616.0, 290679.0, 631915.0, 53141.0, 12858.0, 5012.0, 2390.0, 1292.0, 714.0, 420.0, 258.0, 148.0, 104.0, 72.0, 36.0, 36.0, 17.0, 12.0, 11.0, 7.0, 8.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.7265625, -7.4703369140625, -7.214111328125, -6.9578857421875, -6.70166015625, -6.4454345703125, -6.189208984375, -5.9329833984375, -5.6767578125, -5.4205322265625, -5.164306640625, -4.9080810546875, -4.65185546875, -4.3956298828125, -4.139404296875, -3.8831787109375, -3.626953125, -3.3707275390625, -3.114501953125, -2.8582763671875, -2.60205078125, -2.3458251953125, -2.089599609375, -1.8333740234375, -1.5771484375, -1.3209228515625, -1.064697265625, -0.8084716796875, -0.55224609375, -0.2960205078125, -0.039794921875, 0.2164306640625, 0.47265625, 0.7288818359375, 0.985107421875, 1.2413330078125, 1.49755859375, 1.7537841796875, 2.010009765625, 2.2662353515625, 2.5224609375, 2.7786865234375, 3.034912109375, 3.2911376953125, 3.54736328125, 3.8035888671875, 4.059814453125, 4.3160400390625, 4.572265625, 4.8284912109375, 5.084716796875, 5.3409423828125, 5.59716796875, 5.8533935546875, 6.109619140625, 6.3658447265625, 6.6220703125, 6.8782958984375, 7.134521484375, 7.3907470703125, 7.64697265625, 7.9031982421875, 8.159423828125, 8.4156494140625, 8.671875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 9.0, 7.0, 19.0, 16.0, 20.0, 34.0, 51.0, 62.0, 75.0, 94.0, 95.0, 112.0, 94.0, 87.0, 57.0, 54.0, 37.0, 24.0, 24.0, 8.0, 9.0, 8.0, 5.0, 1.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2578125, -4.12158203125, -3.9853515625, -3.84912109375, -3.712890625, -3.57666015625, -3.4404296875, -3.30419921875, -3.16796875, -3.03173828125, -2.8955078125, -2.75927734375, -2.623046875, -2.48681640625, -2.3505859375, -2.21435546875, -2.078125, -1.94189453125, -1.8056640625, -1.66943359375, -1.533203125, -1.39697265625, -1.2607421875, -1.12451171875, -0.98828125, -0.85205078125, -0.7158203125, -0.57958984375, -0.443359375, -0.30712890625, -0.1708984375, -0.03466796875, 0.1015625, 0.23779296875, 0.3740234375, 0.51025390625, 0.646484375, 0.78271484375, 0.9189453125, 1.05517578125, 1.19140625, 1.32763671875, 1.4638671875, 1.60009765625, 1.736328125, 1.87255859375, 2.0087890625, 2.14501953125, 2.28125, 2.41748046875, 2.5537109375, 2.68994140625, 2.826171875, 2.96240234375, 3.0986328125, 3.23486328125, 3.37109375, 3.50732421875, 3.6435546875, 3.77978515625, 3.916015625, 4.05224609375, 4.1884765625, 4.32470703125, 4.4609375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 8.0, 3.0, 11.0, 20.0, 47.0, 146.0, 403.0, 270.0, 52.0, 19.0, 8.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0], "bins": [-129.99583435058594, -127.3298568725586, -124.66388702392578, -121.99790954589844, -119.33193969726562, -116.66596221923828, -113.99998474121094, -111.33401489257812, -108.66803741455078, -106.00205993652344, -103.33609008789062, -100.67011260986328, -98.00414276123047, -95.33816528320312, -92.67219543457031, -90.00621795654297, -87.34024047851562, -84.67426300048828, -82.00829315185547, -79.34231567382812, -76.67634582519531, -74.01036834716797, -71.34439086914062, -68.67842102050781, -66.012451171875, -63.34647750854492, -60.680503845214844, -58.0145263671875, -55.34855270385742, -52.682579040527344, -50.016605377197266, -47.35063171386719, -44.684654235839844, -42.018680572509766, -39.35270690917969, -36.686729431152344, -34.020755767822266, -31.354782104492188, -28.68880844116211, -26.0228328704834, -23.35685920715332, -20.690885543823242, -18.02490997314453, -15.358936309814453, -12.692961692810059, -10.026987075805664, -7.361013412475586, -4.695037841796875, -2.029064178466797, 0.6369102001190186, 3.302884578704834, 5.96885871887207, 8.634833335876465, 11.30080795288086, 13.966781616210938, 16.63275718688965, 19.298730850219727, 21.964704513549805, 24.630680084228516, 27.296653747558594, 29.962627410888672, 32.62860107421875, 35.294578552246094, 37.96055221557617, 40.62652587890625]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 4.0, 3.0, 2.0, 3.0, 10.0, 3.0, 4.0, 6.0, 13.0, 15.0, 19.0, 36.0, 79.0, 98.0, 133.0, 139.0, 120.0, 107.0, 74.0, 47.0, 28.0, 4.0, 14.0, 8.0, 10.0, 3.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.31155776977539, -26.101890563964844, -24.892221450805664, -23.682552337646484, -22.472885131835938, -21.26321792602539, -20.05354881286621, -18.84387969970703, -17.634212493896484, -16.424545288085938, -15.214876174926758, -14.005208015441895, -12.795539855957031, -11.585871696472168, -10.376203536987305, -9.166535377502441, -7.956867218017578, -6.747199058532715, -5.537530899047852, -4.327862739562988, -3.118194580078125, -1.9085264205932617, -0.6988582611083984, 0.5108098983764648, 1.7204780578613281, 2.9301462173461914, 4.139814376831055, 5.349482536315918, 6.559150695800781, 7.7688188552856445, 8.978487014770508, 10.188155174255371, 11.397819519042969, 12.607487678527832, 13.817155838012695, 15.026823997497559, 16.236492156982422, 17.44615936279297, 18.65582847595215, 19.865497589111328, 21.075164794921875, 22.284832000732422, 23.4945011138916, 24.70417022705078, 25.913837432861328, 27.123504638671875, 28.333173751831055, 29.542842864990234, 30.75251007080078, 31.962177276611328, 33.171844482421875, 34.38151550292969, 35.591182708740234, 36.80084991455078, 38.010520935058594, 39.22018814086914, 40.42985534667969, 41.639522552490234, 42.84918975830078, 44.058860778808594, 45.26852798461914, 46.47819519042969, 47.6878662109375, 48.89753341674805, 50.107200622558594]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 10.0, 8.0, 7.0, 20.0, 47.0, 76.0, 128.0, 209.0, 455.0, 1059.0, 3923.0, 22104.0, 644424.0, 3487566.0, 29857.0, 3392.0, 668.0, 168.0, 79.0, 29.0, 21.0, 11.0, 8.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.125, -35.266845703125, -34.40869140625, -33.550537109375, -32.6923828125, -31.834228515625, -30.97607421875, -30.117919921875, -29.259765625, -28.401611328125, -27.54345703125, -26.685302734375, -25.8271484375, -24.968994140625, -24.11083984375, -23.252685546875, -22.39453125, -21.536376953125, -20.67822265625, -19.820068359375, -18.9619140625, -18.103759765625, -17.24560546875, -16.387451171875, -15.529296875, -14.671142578125, -13.81298828125, -12.954833984375, -12.0966796875, -11.238525390625, -10.38037109375, -9.522216796875, -8.6640625, -7.805908203125, -6.94775390625, -6.089599609375, -5.2314453125, -4.373291015625, -3.51513671875, -2.656982421875, -1.798828125, -0.940673828125, -0.08251953125, 0.775634765625, 1.6337890625, 2.491943359375, 3.35009765625, 4.208251953125, 5.06640625, 5.924560546875, 6.78271484375, 7.640869140625, 8.4990234375, 9.357177734375, 10.21533203125, 11.073486328125, 11.931640625, 12.789794921875, 13.64794921875, 14.506103515625, 15.3642578125, 16.222412109375, 17.08056640625, 17.938720703125, 18.796875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 7.0, 7.0, 7.0, 5.0, 13.0, 18.0, 23.0, 19.0, 36.0, 59.0, 71.0, 96.0, 126.0, 126.0, 119.0, 86.0, 55.0, 33.0, 29.0, 19.0, 7.0, 15.0, 8.0, 3.0, 6.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.689453125, -0.6740188598632812, -0.6585845947265625, -0.6431503295898438, -0.627716064453125, -0.6122817993164062, -0.5968475341796875, -0.5814132690429688, -0.56597900390625, -0.5505447387695312, -0.5351104736328125, -0.5196762084960938, -0.504241943359375, -0.48880767822265625, -0.4733734130859375, -0.45793914794921875, -0.4425048828125, -0.42707061767578125, -0.4116363525390625, -0.39620208740234375, -0.380767822265625, -0.36533355712890625, -0.3498992919921875, -0.33446502685546875, -0.31903076171875, -0.30359649658203125, -0.2881622314453125, -0.27272796630859375, -0.257293701171875, -0.24185943603515625, -0.2264251708984375, -0.21099090576171875, -0.195556640625, -0.18012237548828125, -0.1646881103515625, -0.14925384521484375, -0.133819580078125, -0.11838531494140625, -0.1029510498046875, -0.08751678466796875, -0.07208251953125, -0.05664825439453125, -0.0412139892578125, -0.02577972412109375, -0.010345458984375, 0.00508880615234375, 0.0205230712890625, 0.03595733642578125, 0.0513916015625, 0.06682586669921875, 0.0822601318359375, 0.09769439697265625, 0.113128662109375, 0.12856292724609375, 0.1439971923828125, 0.15943145751953125, 0.17486572265625, 0.19029998779296875, 0.2057342529296875, 0.22116851806640625, 0.236602783203125, 0.25203704833984375, 0.2674713134765625, 0.28290557861328125, 0.29833984375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 5.0, 3.0, 5.0, 8.0, 8.0, 16.0, 17.0, 20.0, 26.0, 48.0, 58.0, 87.0, 192.0, 364.0, 1036.0, 3165.0, 13708.0, 85845.0, 1257348.0, 2691500.0, 117296.0, 17528.0, 3870.0, 1129.0, 450.0, 193.0, 117.0, 63.0, 42.0, 33.0, 17.0, 15.0, 19.0, 8.0, 6.0, 9.0, 9.0, 7.0, 5.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.296875, -12.786865234375, -12.27685546875, -11.766845703125, -11.2568359375, -10.746826171875, -10.23681640625, -9.726806640625, -9.216796875, -8.706787109375, -8.19677734375, -7.686767578125, -7.1767578125, -6.666748046875, -6.15673828125, -5.646728515625, -5.13671875, -4.626708984375, -4.11669921875, -3.606689453125, -3.0966796875, -2.586669921875, -2.07666015625, -1.566650390625, -1.056640625, -0.546630859375, -0.03662109375, 0.473388671875, 0.9833984375, 1.493408203125, 2.00341796875, 2.513427734375, 3.0234375, 3.533447265625, 4.04345703125, 4.553466796875, 5.0634765625, 5.573486328125, 6.08349609375, 6.593505859375, 7.103515625, 7.613525390625, 8.12353515625, 8.633544921875, 9.1435546875, 9.653564453125, 10.16357421875, 10.673583984375, 11.18359375, 11.693603515625, 12.20361328125, 12.713623046875, 13.2236328125, 13.733642578125, 14.24365234375, 14.753662109375, 15.263671875, 15.773681640625, 16.28369140625, 16.793701171875, 17.3037109375, 17.813720703125, 18.32373046875, 18.833740234375, 19.34375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 6.0, 6.0, 7.0, 12.0, 20.0, 10.0, 15.0, 16.0, 29.0, 37.0, 47.0, 54.0, 76.0, 88.0, 110.0, 136.0, 167.0, 222.0, 396.0, 807.0, 535.0, 289.0, 199.0, 134.0, 132.0, 109.0, 80.0, 67.0, 43.0, 54.0, 31.0, 34.0, 23.0, 19.0, 10.0, 11.0, 4.0, 4.0, 7.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.79443359375, -0.76849365234375, -0.7425537109375, -0.71661376953125, -0.690673828125, -0.66473388671875, -0.6387939453125, -0.61285400390625, -0.5869140625, -0.56097412109375, -0.5350341796875, -0.50909423828125, -0.483154296875, -0.45721435546875, -0.4312744140625, -0.40533447265625, -0.37939453125, -0.35345458984375, -0.3275146484375, -0.30157470703125, -0.275634765625, -0.24969482421875, -0.2237548828125, -0.19781494140625, -0.171875, -0.14593505859375, -0.1199951171875, -0.09405517578125, -0.068115234375, -0.04217529296875, -0.0162353515625, 0.00970458984375, 0.03564453125, 0.06158447265625, 0.0875244140625, 0.11346435546875, 0.139404296875, 0.16534423828125, 0.1912841796875, 0.21722412109375, 0.2431640625, 0.26910400390625, 0.2950439453125, 0.32098388671875, 0.346923828125, 0.37286376953125, 0.3988037109375, 0.42474365234375, 0.45068359375, 0.47662353515625, 0.5025634765625, 0.52850341796875, 0.554443359375, 0.58038330078125, 0.6063232421875, 0.63226318359375, 0.658203125, 0.68414306640625, 0.7100830078125, 0.73602294921875, 0.761962890625, 0.78790283203125, 0.8138427734375, 0.83978271484375, 0.86572265625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 34.0, 97.0, 330.0, 373.0, 127.0, 26.0, 8.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.757938385009766, -19.539562225341797, -18.321186065673828, -17.10280990600586, -15.884435653686523, -14.666059494018555, -13.447683334350586, -12.229308128356934, -11.010931968688965, -9.792555809020996, -8.574180603027344, -7.355804443359375, -6.1374287605285645, -4.919053077697754, -3.700676918029785, -2.482301712036133, -1.263925552368164, -0.045549750328063965, 1.1728260517120361, 2.391201972961426, 3.6095776557922363, 4.827953338623047, 6.046329498291016, 7.264704704284668, 8.483080863952637, 9.701457023620605, 10.919832229614258, 12.138208389282227, 13.356584548950195, 14.574959754943848, 15.793335914611816, 17.01171112060547, 18.230087280273438, 19.448463439941406, 20.666839599609375, 21.885215759277344, 23.10359001159668, 24.32196617126465, 25.540342330932617, 26.758716583251953, 27.977092742919922, 29.19546890258789, 30.41384506225586, 31.632221221923828, 32.8505973815918, 34.0689697265625, 35.28734588623047, 36.50572204589844, 37.724098205566406, 38.942474365234375, 40.160850524902344, 41.37922668457031, 42.59760284423828, 43.81597900390625, 45.03435516357422, 46.25272750854492, 47.471107482910156, 48.689483642578125, 49.907859802246094, 51.12623596191406, 52.34461212158203, 53.56298828125, 54.78136444091797, 55.99973678588867, 57.21811294555664]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 4.0, 6.0, 7.0, 15.0, 14.0, 24.0, 39.0, 45.0, 44.0, 65.0, 66.0, 73.0, 66.0, 75.0, 79.0, 73.0, 72.0, 52.0, 35.0, 36.0, 32.0, 22.0, 21.0, 12.0, 6.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4342851638793945, -5.20179557800293, -4.969306468963623, -4.736816883087158, -4.504327774047852, -4.271838188171387, -4.039348602294922, -3.8068594932556152, -3.5743699073791504, -3.3418805599212646, -3.109391212463379, -2.876901626586914, -2.6444122791290283, -2.4119229316711426, -2.179433584213257, -1.9469441175460815, -1.7144548892974854, -1.4819655418395996, -1.2494760751724243, -1.0169867277145386, -0.7844973206520081, -0.5520079135894775, -0.3195185661315918, -0.0870290994644165, 0.14546024799346924, 0.37794965505599976, 0.6104390621185303, 0.842928409576416, 1.0754177570343018, 1.307907223701477, 1.5403965711593628, 1.772886037826538, 2.005375385284424, 2.2378647327423096, 2.4703540802001953, 2.70284366607666, 2.935333013534546, 3.1678223609924316, 3.4003117084503174, 3.632801055908203, 3.865290641784668, 4.097780227661133, 4.3302693367004395, 4.562758922576904, 4.795248031616211, 5.027737617492676, 5.260227203369141, 5.492716312408447, 5.725205421447754, 5.957695007324219, 6.190184116363525, 6.42267370223999, 6.655162811279297, 6.887652397155762, 7.120141983032227, 7.352631092071533, 7.585120677947998, 7.817610263824463, 8.05009937286377, 8.282588958740234, 8.5150785446167, 8.747568130493164, 8.980056762695312, 9.212546348571777, 9.445035934448242]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 4.0, 5.0, 7.0, 12.0, 9.0, 10.0, 20.0, 22.0, 44.0, 47.0, 78.0, 135.0, 291.0, 549.0, 1414.0, 4149.0, 14665.0, 88143.0, 730997.0, 175447.0, 23350.0, 5660.0, 1910.0, 751.0, 352.0, 144.0, 109.0, 62.0, 40.0, 25.0, 22.0, 16.0, 16.0, 8.0, 8.0, 8.0, 4.0, 6.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-14.2421875, -13.805908203125, -13.36962890625, -12.933349609375, -12.4970703125, -12.060791015625, -11.62451171875, -11.188232421875, -10.751953125, -10.315673828125, -9.87939453125, -9.443115234375, -9.0068359375, -8.570556640625, -8.13427734375, -7.697998046875, -7.26171875, -6.825439453125, -6.38916015625, -5.952880859375, -5.5166015625, -5.080322265625, -4.64404296875, -4.207763671875, -3.771484375, -3.335205078125, -2.89892578125, -2.462646484375, -2.0263671875, -1.590087890625, -1.15380859375, -0.717529296875, -0.28125, 0.155029296875, 0.59130859375, 1.027587890625, 1.4638671875, 1.900146484375, 2.33642578125, 2.772705078125, 3.208984375, 3.645263671875, 4.08154296875, 4.517822265625, 4.9541015625, 5.390380859375, 5.82666015625, 6.262939453125, 6.69921875, 7.135498046875, 7.57177734375, 8.008056640625, 8.4443359375, 8.880615234375, 9.31689453125, 9.753173828125, 10.189453125, 10.625732421875, 11.06201171875, 11.498291015625, 11.9345703125, 12.370849609375, 12.80712890625, 13.243408203125, 13.6796875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 9.0, 8.0, 13.0, 19.0, 24.0, 31.0, 64.0, 71.0, 90.0, 107.0, 108.0, 125.0, 96.0, 83.0, 52.0, 35.0, 22.0, 18.0, 10.0, 8.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69970703125, -0.67816162109375, -0.6566162109375, -0.63507080078125, -0.613525390625, -0.59197998046875, -0.5704345703125, -0.54888916015625, -0.52734375, -0.50579833984375, -0.4842529296875, -0.46270751953125, -0.441162109375, -0.41961669921875, -0.3980712890625, -0.37652587890625, -0.35498046875, -0.33343505859375, -0.3118896484375, -0.29034423828125, -0.268798828125, -0.24725341796875, -0.2257080078125, -0.20416259765625, -0.1826171875, -0.16107177734375, -0.1395263671875, -0.11798095703125, -0.096435546875, -0.07489013671875, -0.0533447265625, -0.03179931640625, -0.01025390625, 0.01129150390625, 0.0328369140625, 0.05438232421875, 0.075927734375, 0.09747314453125, 0.1190185546875, 0.14056396484375, 0.162109375, 0.18365478515625, 0.2052001953125, 0.22674560546875, 0.248291015625, 0.26983642578125, 0.2913818359375, 0.31292724609375, 0.33447265625, 0.35601806640625, 0.3775634765625, 0.39910888671875, 0.420654296875, 0.44219970703125, 0.4637451171875, 0.48529052734375, 0.5068359375, 0.52838134765625, 0.5499267578125, 0.57147216796875, 0.593017578125, 0.61456298828125, 0.6361083984375, 0.65765380859375, 0.67919921875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 2.0, 6.0, 8.0, 9.0, 9.0, 9.0, 15.0, 18.0, 17.0, 21.0, 30.0, 45.0, 72.0, 308.0, 2292.0, 104240.0, 933147.0, 7307.0, 631.0, 129.0, 47.0, 31.0, 17.0, 33.0, 21.0, 10.0, 12.0, 10.0, 6.0, 6.0, 4.0, 7.0, 4.0, 5.0, 2.0, 4.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.59375, -22.7861328125, -21.978515625, -21.1708984375, -20.36328125, -19.5556640625, -18.748046875, -17.9404296875, -17.1328125, -16.3251953125, -15.517578125, -14.7099609375, -13.90234375, -13.0947265625, -12.287109375, -11.4794921875, -10.671875, -9.8642578125, -9.056640625, -8.2490234375, -7.44140625, -6.6337890625, -5.826171875, -5.0185546875, -4.2109375, -3.4033203125, -2.595703125, -1.7880859375, -0.98046875, -0.1728515625, 0.634765625, 1.4423828125, 2.25, 3.0576171875, 3.865234375, 4.6728515625, 5.48046875, 6.2880859375, 7.095703125, 7.9033203125, 8.7109375, 9.5185546875, 10.326171875, 11.1337890625, 11.94140625, 12.7490234375, 13.556640625, 14.3642578125, 15.171875, 15.9794921875, 16.787109375, 17.5947265625, 18.40234375, 19.2099609375, 20.017578125, 20.8251953125, 21.6328125, 22.4404296875, 23.248046875, 24.0556640625, 24.86328125, 25.6708984375, 26.478515625, 27.2861328125, 28.09375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 6.0, 7.0, 7.0, 7.0, 14.0, 6.0, 14.0, 13.0, 28.0, 12.0, 31.0, 31.0, 33.0, 29.0, 37.0, 40.0, 48.0, 35.0, 49.0, 55.0, 34.0, 48.0, 45.0, 44.0, 42.0, 35.0, 38.0, 33.0, 33.0, 21.0, 23.0, 22.0, 13.0, 16.0, 12.0, 8.0, 9.0, 5.0, 6.0, 5.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.990234375, -1.9333953857421875, -1.876556396484375, -1.8197174072265625, -1.76287841796875, -1.7060394287109375, -1.649200439453125, -1.5923614501953125, -1.5355224609375, -1.4786834716796875, -1.421844482421875, -1.3650054931640625, -1.30816650390625, -1.2513275146484375, -1.194488525390625, -1.1376495361328125, -1.080810546875, -1.0239715576171875, -0.967132568359375, -0.9102935791015625, -0.85345458984375, -0.7966156005859375, -0.739776611328125, -0.6829376220703125, -0.6260986328125, -0.5692596435546875, -0.512420654296875, -0.4555816650390625, -0.39874267578125, -0.3419036865234375, -0.285064697265625, -0.2282257080078125, -0.17138671875, -0.1145477294921875, -0.057708740234375, -0.0008697509765625, 0.05596923828125, 0.1128082275390625, 0.169647216796875, 0.2264862060546875, 0.2833251953125, 0.3401641845703125, 0.397003173828125, 0.4538421630859375, 0.51068115234375, 0.5675201416015625, 0.624359130859375, 0.6811981201171875, 0.738037109375, 0.7948760986328125, 0.851715087890625, 0.9085540771484375, 0.96539306640625, 1.0222320556640625, 1.079071044921875, 1.1359100341796875, 1.1927490234375, 1.2495880126953125, 1.306427001953125, 1.3632659912109375, 1.42010498046875, 1.4769439697265625, 1.533782958984375, 1.5906219482421875, 1.6474609375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 0.0, 2.0, 7.0, 4.0, 7.0, 6.0, 7.0, 19.0, 24.0, 32.0, 87.0, 348.0, 4012.0, 1038599.0, 4845.0, 347.0, 87.0, 59.0, 18.0, 12.0, 5.0, 7.0, 2.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-112.3125, -108.5087890625, -104.705078125, -100.9013671875, -97.09765625, -93.2939453125, -89.490234375, -85.6865234375, -81.8828125, -78.0791015625, -74.275390625, -70.4716796875, -66.66796875, -62.8642578125, -59.060546875, -55.2568359375, -51.453125, -47.6494140625, -43.845703125, -40.0419921875, -36.23828125, -32.4345703125, -28.630859375, -24.8271484375, -21.0234375, -17.2197265625, -13.416015625, -9.6123046875, -5.80859375, -2.0048828125, 1.798828125, 5.6025390625, 9.40625, 13.2099609375, 17.013671875, 20.8173828125, 24.62109375, 28.4248046875, 32.228515625, 36.0322265625, 39.8359375, 43.6396484375, 47.443359375, 51.2470703125, 55.05078125, 58.8544921875, 62.658203125, 66.4619140625, 70.265625, 74.0693359375, 77.873046875, 81.6767578125, 85.48046875, 89.2841796875, 93.087890625, 96.8916015625, 100.6953125, 104.4990234375, 108.302734375, 112.1064453125, 115.91015625, 119.7138671875, 123.517578125, 127.3212890625, 131.125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 6.0, 8.0, 8.0, 17.0, 10.0, 27.0, 26.0, 49.0, 84.0, 102.0, 142.0, 141.0, 121.0, 82.0, 56.0, 35.0, 33.0, 12.0, 13.0, 11.0, 8.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003628730773925781, -0.0003479421138763428, -0.0003330111503601074, -0.00031808018684387207, -0.0003031492233276367, -0.00028821825981140137, -0.000273287296295166, -0.00025835633277893066, -0.0002434253692626953, -0.00022849440574645996, -0.0002135634422302246, -0.00019863247871398926, -0.0001837015151977539, -0.00016877055168151855, -0.0001538395881652832, -0.00013890862464904785, -0.0001239776611328125, -0.00010904669761657715, -9.41157341003418e-05, -7.918477058410645e-05, -6.42538070678711e-05, -4.932284355163574e-05, -3.439188003540039e-05, -1.946091651916504e-05, -4.5299530029296875e-06, 1.0401010513305664e-05, 2.5331974029541016e-05, 4.026293754577637e-05, 5.519390106201172e-05, 7.012486457824707e-05, 8.505582809448242e-05, 9.998679161071777e-05, 0.00011491775512695312, 0.00012984871864318848, 0.00014477968215942383, 0.00015971064567565918, 0.00017464160919189453, 0.00018957257270812988, 0.00020450353622436523, 0.00021943449974060059, 0.00023436546325683594, 0.0002492964267730713, 0.00026422739028930664, 0.000279158353805542, 0.00029408931732177734, 0.0003090202808380127, 0.00032395124435424805, 0.0003388822078704834, 0.00035381317138671875, 0.0003687441349029541, 0.00038367509841918945, 0.0003986060619354248, 0.00041353702545166016, 0.0004284679889678955, 0.00044339895248413086, 0.0004583299160003662, 0.00047326087951660156, 0.0004881918430328369, 0.0005031228065490723, 0.0005180537700653076, 0.000532984733581543, 0.0005479156970977783, 0.0005628466606140137, 0.000577777624130249, 0.0005927085876464844]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 5.0, 7.0, 13.0, 26.0, 26.0, 27.0, 37.0, 56.0, 80.0, 133.0, 176.0, 250.0, 389.0, 670.0, 1022.0, 1777.0, 3443.0, 6323.0, 13899.0, 35562.0, 166711.0, 689075.0, 82956.0, 24250.0, 10206.0, 4839.0, 2582.0, 1451.0, 865.0, 555.0, 359.0, 252.0, 181.0, 109.0, 55.0, 52.0, 36.0, 26.0, 14.0, 14.0, 9.0, 2.0, 3.0, 9.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-20.5625, -19.96337890625, -19.3642578125, -18.76513671875, -18.166015625, -17.56689453125, -16.9677734375, -16.36865234375, -15.76953125, -15.17041015625, -14.5712890625, -13.97216796875, -13.373046875, -12.77392578125, -12.1748046875, -11.57568359375, -10.9765625, -10.37744140625, -9.7783203125, -9.17919921875, -8.580078125, -7.98095703125, -7.3818359375, -6.78271484375, -6.18359375, -5.58447265625, -4.9853515625, -4.38623046875, -3.787109375, -3.18798828125, -2.5888671875, -1.98974609375, -1.390625, -0.79150390625, -0.1923828125, 0.40673828125, 1.005859375, 1.60498046875, 2.2041015625, 2.80322265625, 3.40234375, 4.00146484375, 4.6005859375, 5.19970703125, 5.798828125, 6.39794921875, 6.9970703125, 7.59619140625, 8.1953125, 8.79443359375, 9.3935546875, 9.99267578125, 10.591796875, 11.19091796875, 11.7900390625, 12.38916015625, 12.98828125, 13.58740234375, 14.1865234375, 14.78564453125, 15.384765625, 15.98388671875, 16.5830078125, 17.18212890625, 17.78125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 0.0, 4.0, 5.0, 2.0, 11.0, 9.0, 8.0, 7.0, 26.0, 20.0, 38.0, 75.0, 155.0, 256.0, 160.0, 76.0, 50.0, 21.0, 24.0, 6.0, 7.0, 6.0, 7.0, 4.0, 0.0, 0.0, 5.0, 6.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.1875, -10.820068359375, -10.45263671875, -10.085205078125, -9.7177734375, -9.350341796875, -8.98291015625, -8.615478515625, -8.248046875, -7.880615234375, -7.51318359375, -7.145751953125, -6.7783203125, -6.410888671875, -6.04345703125, -5.676025390625, -5.30859375, -4.941162109375, -4.57373046875, -4.206298828125, -3.8388671875, -3.471435546875, -3.10400390625, -2.736572265625, -2.369140625, -2.001708984375, -1.63427734375, -1.266845703125, -0.8994140625, -0.531982421875, -0.16455078125, 0.202880859375, 0.5703125, 0.937744140625, 1.30517578125, 1.672607421875, 2.0400390625, 2.407470703125, 2.77490234375, 3.142333984375, 3.509765625, 3.877197265625, 4.24462890625, 4.612060546875, 4.9794921875, 5.346923828125, 5.71435546875, 6.081787109375, 6.44921875, 6.816650390625, 7.18408203125, 7.551513671875, 7.9189453125, 8.286376953125, 8.65380859375, 9.021240234375, 9.388671875, 9.756103515625, 10.12353515625, 10.490966796875, 10.8583984375, 11.225830078125, 11.59326171875, 11.960693359375, 12.328125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 9.0, 12.0, 32.0, 101.0, 217.0, 264.0, 195.0, 87.0, 46.0, 18.0, 10.0, 7.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.495487213134766, -32.06806564331055, -29.64064598083496, -27.213226318359375, -24.785804748535156, -22.358383178710938, -19.93096351623535, -17.503543853759766, -15.076122283935547, -12.648701667785645, -10.221281051635742, -7.79386043548584, -5.3664398193359375, -2.939019203186035, -0.5115985870361328, 1.9158210754394531, 4.343242645263672, 6.770663261413574, 9.198083877563477, 11.625504493713379, 14.052925109863281, 16.4803466796875, 18.907766342163086, 21.335186004638672, 23.76260757446289, 26.19002914428711, 28.617448806762695, 31.04486846923828, 33.4722900390625, 35.89971160888672, 38.32713317871094, 40.75455093383789, 43.181976318359375, 45.609397888183594, 48.03681945800781, 50.464237213134766, 52.891658782958984, 55.3190803527832, 57.746498107910156, 60.173919677734375, 62.601341247558594, 65.02876281738281, 67.45618438720703, 69.88360595703125, 72.31101989746094, 74.73844146728516, 77.16586303710938, 79.5932846069336, 82.02070617675781, 84.44812774658203, 86.87554931640625, 89.30297088623047, 91.73039245605469, 94.15780639648438, 96.5852279663086, 99.01264953613281, 101.44007110595703, 103.86749267578125, 106.29491424560547, 108.72233581542969, 111.14974975585938, 113.5771713256836, 116.00459289550781, 118.43201446533203, 120.85943603515625]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 16.0, 17.0, 28.0, 38.0, 43.0, 67.0, 65.0, 78.0, 102.0, 100.0, 95.0, 74.0, 82.0, 53.0, 48.0, 27.0, 19.0, 13.0, 13.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.052967071533203, -24.968441009521484, -23.883913040161133, -22.799386978149414, -21.714859008789062, -20.630332946777344, -19.545806884765625, -18.461280822753906, -17.376752853393555, -16.292226791381836, -15.207698822021484, -14.123172760009766, -13.03864574432373, -11.954118728637695, -10.869592666625977, -9.785065650939941, -8.700538635253906, -7.616011619567871, -6.531485080718994, -5.446958541870117, -4.362431526184082, -3.277904510498047, -2.19337797164917, -1.108851432800293, -0.024324417114257812, 1.0602023601531982, 2.1447291374206543, 3.2292559146881104, 4.313782691955566, 5.398309707641602, 6.4828362464904785, 7.5673627853393555, 8.651885986328125, 9.73641300201416, 10.820940017700195, 11.905466079711914, 12.98999309539795, 14.074520111083984, 15.159046173095703, 16.243572235107422, 17.328100204467773, 18.412626266479492, 19.497154235839844, 20.581680297851562, 21.66620635986328, 22.750734329223633, 23.83526039123535, 24.919788360595703, 26.004314422607422, 27.08884048461914, 28.173368453979492, 29.25789451599121, 30.342422485351562, 31.42694854736328, 32.511474609375, 33.59600067138672, 34.68052673339844, 35.765052795410156, 36.849578857421875, 37.93410873413086, 39.01863479614258, 40.1031608581543, 41.187686920166016, 42.272212982177734, 43.35674285888672]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 24.0, 20.0, 29.0, 51.0, 95.0, 233.0, 564.0, 1752.0, 6796.0, 43490.0, 1548598.0, 2535868.0, 47016.0, 6603.0, 1642.0, 550.0, 249.0, 139.0, 118.0, 76.0, 46.0, 61.0, 45.0, 42.0, 24.0, 19.0, 14.0, 17.0, 21.0, 14.0, 9.0, 10.0, 6.0, 9.0, 8.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.5625, -15.7353515625, -14.908203125, -14.0810546875, -13.25390625, -12.4267578125, -11.599609375, -10.7724609375, -9.9453125, -9.1181640625, -8.291015625, -7.4638671875, -6.63671875, -5.8095703125, -4.982421875, -4.1552734375, -3.328125, -2.5009765625, -1.673828125, -0.8466796875, -0.01953125, 0.8076171875, 1.634765625, 2.4619140625, 3.2890625, 4.1162109375, 4.943359375, 5.7705078125, 6.59765625, 7.4248046875, 8.251953125, 9.0791015625, 9.90625, 10.7333984375, 11.560546875, 12.3876953125, 13.21484375, 14.0419921875, 14.869140625, 15.6962890625, 16.5234375, 17.3505859375, 18.177734375, 19.0048828125, 19.83203125, 20.6591796875, 21.486328125, 22.3134765625, 23.140625, 23.9677734375, 24.794921875, 25.6220703125, 26.44921875, 27.2763671875, 28.103515625, 28.9306640625, 29.7578125, 30.5849609375, 31.412109375, 32.2392578125, 33.06640625, 33.8935546875, 34.720703125, 35.5478515625, 36.375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 8.0, 7.0, 19.0, 45.0, 80.0, 150.0, 199.0, 197.0, 160.0, 68.0, 46.0, 18.0, 12.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73291015625, -0.6870956420898438, -0.6412811279296875, -0.5954666137695312, -0.549652099609375, -0.5038375854492188, -0.4580230712890625, -0.41220855712890625, -0.36639404296875, -0.32057952880859375, -0.2747650146484375, -0.22895050048828125, -0.183135986328125, -0.13732147216796875, -0.0915069580078125, -0.04569244384765625, 0.0001220703125, 0.04593658447265625, 0.0917510986328125, 0.13756561279296875, 0.183380126953125, 0.22919464111328125, 0.2750091552734375, 0.32082366943359375, 0.36663818359375, 0.41245269775390625, 0.4582672119140625, 0.5040817260742188, 0.549896240234375, 0.5957107543945312, 0.6415252685546875, 0.6873397827148438, 0.733154296875, 0.7789688110351562, 0.8247833251953125, 0.8705978393554688, 0.916412353515625, 0.9622268676757812, 1.0080413818359375, 1.0538558959960938, 1.09967041015625, 1.1454849243164062, 1.1912994384765625, 1.2371139526367188, 1.282928466796875, 1.3287429809570312, 1.3745574951171875, 1.4203720092773438, 1.4661865234375, 1.5120010375976562, 1.5578155517578125, 1.6036300659179688, 1.649444580078125, 1.6952590942382812, 1.7410736083984375, 1.7868881225585938, 1.83270263671875, 1.8785171508789062, 1.9243316650390625, 1.9701461791992188, 2.015960693359375, 2.0617752075195312, 2.1075897216796875, 2.1534042358398438, 2.19921875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 4.0, 7.0, 2.0, 6.0, 9.0, 15.0, 19.0, 14.0, 26.0, 41.0, 52.0, 60.0, 83.0, 126.0, 216.0, 567.0, 1975.0, 12204.0, 226199.0, 3823337.0, 118590.0, 8247.0, 1499.0, 441.0, 184.0, 98.0, 73.0, 40.0, 27.0, 31.0, 23.0, 17.0, 11.0, 12.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-41.0625, -39.934814453125, -38.80712890625, -37.679443359375, -36.5517578125, -35.424072265625, -34.29638671875, -33.168701171875, -32.041015625, -30.913330078125, -29.78564453125, -28.657958984375, -27.5302734375, -26.402587890625, -25.27490234375, -24.147216796875, -23.01953125, -21.891845703125, -20.76416015625, -19.636474609375, -18.5087890625, -17.381103515625, -16.25341796875, -15.125732421875, -13.998046875, -12.870361328125, -11.74267578125, -10.614990234375, -9.4873046875, -8.359619140625, -7.23193359375, -6.104248046875, -4.9765625, -3.848876953125, -2.72119140625, -1.593505859375, -0.4658203125, 0.661865234375, 1.78955078125, 2.917236328125, 4.044921875, 5.172607421875, 6.30029296875, 7.427978515625, 8.5556640625, 9.683349609375, 10.81103515625, 11.938720703125, 13.06640625, 14.194091796875, 15.32177734375, 16.449462890625, 17.5771484375, 18.704833984375, 19.83251953125, 20.960205078125, 22.087890625, 23.215576171875, 24.34326171875, 25.470947265625, 26.5986328125, 27.726318359375, 28.85400390625, 29.981689453125, 31.109375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 2.0, 8.0, 9.0, 14.0, 20.0, 23.0, 43.0, 44.0, 65.0, 94.0, 138.0, 178.0, 272.0, 451.0, 852.0, 608.0, 385.0, 238.0, 169.0, 133.0, 85.0, 54.0, 48.0, 33.0, 22.0, 18.0, 13.0, 18.0, 5.0, 5.0, 4.0, 3.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.69140625, -1.634735107421875, -1.57806396484375, -1.521392822265625, -1.4647216796875, -1.408050537109375, -1.35137939453125, -1.294708251953125, -1.238037109375, -1.181365966796875, -1.12469482421875, -1.068023681640625, -1.0113525390625, -0.954681396484375, -0.89801025390625, -0.841339111328125, -0.78466796875, -0.727996826171875, -0.67132568359375, -0.614654541015625, -0.5579833984375, -0.501312255859375, -0.44464111328125, -0.387969970703125, -0.331298828125, -0.274627685546875, -0.21795654296875, -0.161285400390625, -0.1046142578125, -0.047943115234375, 0.00872802734375, 0.065399169921875, 0.1220703125, 0.178741455078125, 0.23541259765625, 0.292083740234375, 0.3487548828125, 0.405426025390625, 0.46209716796875, 0.518768310546875, 0.575439453125, 0.632110595703125, 0.68878173828125, 0.745452880859375, 0.8021240234375, 0.858795166015625, 0.91546630859375, 0.972137451171875, 1.02880859375, 1.085479736328125, 1.14215087890625, 1.198822021484375, 1.2554931640625, 1.312164306640625, 1.36883544921875, 1.425506591796875, 1.482177734375, 1.538848876953125, 1.59552001953125, 1.652191162109375, 1.7088623046875, 1.765533447265625, 1.82220458984375, 1.878875732421875, 1.935546875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 8.0, 10.0, 58.0, 188.0, 439.0, 230.0, 55.0, 16.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-101.82221984863281, -99.84638977050781, -97.87055969238281, -95.89472961425781, -93.91889953613281, -91.94306945800781, -89.96723175048828, -87.99140167236328, -86.01557159423828, -84.03974151611328, -82.06391143798828, -80.08808135986328, -78.11225128173828, -76.13641357421875, -74.16058349609375, -72.18475341796875, -70.20892333984375, -68.23309326171875, -66.25726318359375, -64.28143310546875, -62.305599212646484, -60.329769134521484, -58.353939056396484, -56.37810516357422, -54.402278900146484, -52.426448822021484, -50.450618743896484, -48.47478485107422, -46.49895477294922, -44.52312469482422, -42.54729461669922, -40.57146453857422, -38.59562683105469, -36.61979675292969, -34.64396667480469, -32.66813278198242, -30.692302703857422, -28.716472625732422, -26.740642547607422, -24.76481056213379, -22.788982391357422, -20.813152313232422, -18.83732032775879, -16.86149024963379, -14.885658264160156, -12.909828186035156, -10.93399715423584, -8.958166122436523, -6.982334136962891, -5.006503105163574, -3.030672311782837, -1.0548415184020996, 0.9209895133972168, 2.896820068359375, 4.872651100158691, 6.848482131958008, 8.824313163757324, 10.80014419555664, 12.775975227355957, 14.751806259155273, 16.727636337280273, 18.703468322753906, 20.679298400878906, 22.655128479003906, 24.63096046447754]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 12.0, 11.0, 24.0, 23.0, 46.0, 39.0, 72.0, 98.0, 92.0, 117.0, 108.0, 98.0, 88.0, 64.0, 47.0, 24.0, 15.0, 14.0, 10.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.66547393798828, -28.049875259399414, -27.434274673461914, -26.818675994873047, -26.203075408935547, -25.58747673034668, -24.971878051757812, -24.356277465820312, -23.740678787231445, -23.125080108642578, -22.509479522705078, -21.89388084411621, -21.278282165527344, -20.662681579589844, -20.047082901000977, -19.43148422241211, -18.81588363647461, -18.200284957885742, -17.584684371948242, -16.969085693359375, -16.353485107421875, -15.737886428833008, -15.12228775024414, -14.506688117980957, -13.891088485717773, -13.27548885345459, -12.659889221191406, -12.044290542602539, -11.428690910339355, -10.813091278076172, -10.197492599487305, -9.581892967224121, -8.966294288635254, -8.35069465637207, -7.735095500946045, -7.1194963455200195, -6.503896713256836, -5.888297080993652, -5.272697925567627, -4.657098770141602, -4.041499137878418, -3.4258997440338135, -2.810300350189209, -2.1947009563446045, -1.5791015625, -0.9635021686553955, -0.347902774810791, 0.2676963806152344, 0.883296012878418, 1.4988954067230225, 2.114494800567627, 2.7300941944122314, 3.345693588256836, 3.9612929821014404, 4.576892375946045, 5.19249153137207, 5.808091163635254, 6.4236907958984375, 7.039289951324463, 7.654889106750488, 8.270488739013672, 8.886088371276855, 9.501688003540039, 10.117286682128906, 10.73288631439209]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 9.0, 8.0, 5.0, 9.0, 16.0, 15.0, 28.0, 25.0, 34.0, 46.0, 40.0, 81.0, 295.0, 2033.0, 28294.0, 485931.0, 499471.0, 29538.0, 2043.0, 324.0, 69.0, 42.0, 30.0, 31.0, 22.0, 26.0, 14.0, 17.0, 17.0, 10.0, 8.0, 10.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.21875, -20.534423828125, -19.85009765625, -19.165771484375, -18.4814453125, -17.797119140625, -17.11279296875, -16.428466796875, -15.744140625, -15.059814453125, -14.37548828125, -13.691162109375, -13.0068359375, -12.322509765625, -11.63818359375, -10.953857421875, -10.26953125, -9.585205078125, -8.90087890625, -8.216552734375, -7.5322265625, -6.847900390625, -6.16357421875, -5.479248046875, -4.794921875, -4.110595703125, -3.42626953125, -2.741943359375, -2.0576171875, -1.373291015625, -0.68896484375, -0.004638671875, 0.6796875, 1.364013671875, 2.04833984375, 2.732666015625, 3.4169921875, 4.101318359375, 4.78564453125, 5.469970703125, 6.154296875, 6.838623046875, 7.52294921875, 8.207275390625, 8.8916015625, 9.575927734375, 10.26025390625, 10.944580078125, 11.62890625, 12.313232421875, 12.99755859375, 13.681884765625, 14.3662109375, 15.050537109375, 15.73486328125, 16.419189453125, 17.103515625, 17.787841796875, 18.47216796875, 19.156494140625, 19.8408203125, 20.525146484375, 21.20947265625, 21.893798828125, 22.578125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 11.0, 14.0, 28.0, 60.0, 88.0, 108.0, 156.0, 142.0, 125.0, 117.0, 67.0, 54.0, 14.0, 13.0, 7.0, 4.0, 4.0, 2.0, 1.0], "bins": [-2.49609375, -2.448333740234375, -2.40057373046875, -2.352813720703125, -2.3050537109375, -2.257293701171875, -2.20953369140625, -2.161773681640625, -2.114013671875, -2.066253662109375, -2.01849365234375, -1.970733642578125, -1.9229736328125, -1.875213623046875, -1.82745361328125, -1.779693603515625, -1.73193359375, -1.684173583984375, -1.63641357421875, -1.588653564453125, -1.5408935546875, -1.493133544921875, -1.44537353515625, -1.397613525390625, -1.349853515625, -1.302093505859375, -1.25433349609375, -1.206573486328125, -1.1588134765625, -1.111053466796875, -1.06329345703125, -1.015533447265625, -0.9677734375, -0.920013427734375, -0.87225341796875, -0.824493408203125, -0.7767333984375, -0.728973388671875, -0.68121337890625, -0.633453369140625, -0.585693359375, -0.537933349609375, -0.49017333984375, -0.442413330078125, -0.3946533203125, -0.346893310546875, -0.29913330078125, -0.251373291015625, -0.20361328125, -0.155853271484375, -0.10809326171875, -0.060333251953125, -0.0125732421875, 0.035186767578125, 0.08294677734375, 0.130706787109375, 0.178466796875, 0.226226806640625, 0.27398681640625, 0.321746826171875, 0.3695068359375, 0.417266845703125, 0.46502685546875, 0.512786865234375, 0.560546875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 6.0, 5.0, 5.0, 4.0, 12.0, 5.0, 13.0, 16.0, 22.0, 26.0, 51.0, 80.0, 110.0, 141.0, 227.0, 376.0, 560.0, 1083.0, 2076.0, 4867.0, 13397.0, 38356.0, 117435.0, 294153.0, 339086.0, 154893.0, 52539.0, 17129.0, 6191.0, 2589.0, 1223.0, 660.0, 449.0, 267.0, 169.0, 81.0, 77.0, 57.0, 23.0, 27.0, 18.0, 16.0, 14.0, 8.0, 8.0, 1.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.2421875, -7.9774169921875, -7.712646484375, -7.4478759765625, -7.18310546875, -6.9183349609375, -6.653564453125, -6.3887939453125, -6.1240234375, -5.8592529296875, -5.594482421875, -5.3297119140625, -5.06494140625, -4.8001708984375, -4.535400390625, -4.2706298828125, -4.005859375, -3.7410888671875, -3.476318359375, -3.2115478515625, -2.94677734375, -2.6820068359375, -2.417236328125, -2.1524658203125, -1.8876953125, -1.6229248046875, -1.358154296875, -1.0933837890625, -0.82861328125, -0.5638427734375, -0.299072265625, -0.0343017578125, 0.23046875, 0.4952392578125, 0.760009765625, 1.0247802734375, 1.28955078125, 1.5543212890625, 1.819091796875, 2.0838623046875, 2.3486328125, 2.6134033203125, 2.878173828125, 3.1429443359375, 3.40771484375, 3.6724853515625, 3.937255859375, 4.2020263671875, 4.466796875, 4.7315673828125, 4.996337890625, 5.2611083984375, 5.52587890625, 5.7906494140625, 6.055419921875, 6.3201904296875, 6.5849609375, 6.8497314453125, 7.114501953125, 7.3792724609375, 7.64404296875, 7.9088134765625, 8.173583984375, 8.4383544921875, 8.703125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 7.0, 8.0, 12.0, 1.0, 12.0, 7.0, 6.0, 13.0, 13.0, 26.0, 16.0, 26.0, 27.0, 30.0, 33.0, 33.0, 36.0, 30.0, 44.0, 42.0, 35.0, 53.0, 35.0, 42.0, 48.0, 55.0, 32.0, 34.0, 34.0, 27.0, 28.0, 30.0, 22.0, 17.0, 21.0, 21.0, 9.0, 8.0, 6.0, 4.0, 6.0, 2.0, 7.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.4453125, -3.342681884765625, -3.24005126953125, -3.137420654296875, -3.0347900390625, -2.932159423828125, -2.82952880859375, -2.726898193359375, -2.624267578125, -2.521636962890625, -2.41900634765625, -2.316375732421875, -2.2137451171875, -2.111114501953125, -2.00848388671875, -1.905853271484375, -1.80322265625, -1.700592041015625, -1.59796142578125, -1.495330810546875, -1.3927001953125, -1.290069580078125, -1.18743896484375, -1.084808349609375, -0.982177734375, -0.879547119140625, -0.77691650390625, -0.674285888671875, -0.5716552734375, -0.469024658203125, -0.36639404296875, -0.263763427734375, -0.1611328125, -0.058502197265625, 0.04412841796875, 0.146759033203125, 0.2493896484375, 0.352020263671875, 0.45465087890625, 0.557281494140625, 0.659912109375, 0.762542724609375, 0.86517333984375, 0.967803955078125, 1.0704345703125, 1.173065185546875, 1.27569580078125, 1.378326416015625, 1.48095703125, 1.583587646484375, 1.68621826171875, 1.788848876953125, 1.8914794921875, 1.994110107421875, 2.09674072265625, 2.199371337890625, 2.302001953125, 2.404632568359375, 2.50726318359375, 2.609893798828125, 2.7125244140625, 2.815155029296875, 2.91778564453125, 3.020416259765625, 3.123046875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 6.0, 13.0, 31.0, 42.0, 89.0, 151.0, 289.0, 651.0, 1735.0, 4940.0, 17234.0, 79315.0, 371274.0, 439349.0, 102892.0, 21178.0, 5846.0, 2002.0, 786.0, 320.0, 152.0, 105.0, 63.0, 33.0, 20.0, 14.0, 8.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1171875, -12.763427734375, -12.40966796875, -12.055908203125, -11.7021484375, -11.348388671875, -10.99462890625, -10.640869140625, -10.287109375, -9.933349609375, -9.57958984375, -9.225830078125, -8.8720703125, -8.518310546875, -8.16455078125, -7.810791015625, -7.45703125, -7.103271484375, -6.74951171875, -6.395751953125, -6.0419921875, -5.688232421875, -5.33447265625, -4.980712890625, -4.626953125, -4.273193359375, -3.91943359375, -3.565673828125, -3.2119140625, -2.858154296875, -2.50439453125, -2.150634765625, -1.796875, -1.443115234375, -1.08935546875, -0.735595703125, -0.3818359375, -0.028076171875, 0.32568359375, 0.679443359375, 1.033203125, 1.386962890625, 1.74072265625, 2.094482421875, 2.4482421875, 2.802001953125, 3.15576171875, 3.509521484375, 3.86328125, 4.217041015625, 4.57080078125, 4.924560546875, 5.2783203125, 5.632080078125, 5.98583984375, 6.339599609375, 6.693359375, 7.047119140625, 7.40087890625, 7.754638671875, 8.1083984375, 8.462158203125, 8.81591796875, 9.169677734375, 9.5234375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 8.0, 5.0, 4.0, 6.0, 12.0, 11.0, 16.0, 18.0, 22.0, 25.0, 29.0, 34.0, 51.0, 54.0, 73.0, 57.0, 70.0, 67.0, 81.0, 61.0, 50.0, 40.0, 43.0, 27.0, 18.0, 22.0, 21.0, 19.0, 14.0, 9.0, 7.0, 5.0, 5.0, 8.0, 4.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0009074211120605469, -0.0008795484900474548, -0.0008516758680343628, -0.0008238032460212708, -0.0007959306240081787, -0.0007680580019950867, -0.0007401853799819946, -0.0007123127579689026, -0.0006844401359558105, -0.0006565675139427185, -0.0006286948919296265, -0.0006008222699165344, -0.0005729496479034424, -0.0005450770258903503, -0.0005172044038772583, -0.0004893317818641663, -0.0004614591598510742, -0.0004335865378379822, -0.00040571391582489014, -0.0003778412938117981, -0.00034996867179870605, -0.000322096049785614, -0.00029422342777252197, -0.00026635080575942993, -0.0002384781837463379, -0.00021060556173324585, -0.0001827329397201538, -0.00015486031770706177, -0.00012698769569396973, -9.911507368087769e-05, -7.124245166778564e-05, -4.3369829654693604e-05, -1.5497207641601562e-05, 1.2375414371490479e-05, 4.024803638458252e-05, 6.812065839767456e-05, 9.59932804107666e-05, 0.00012386590242385864, 0.00015173852443695068, 0.00017961114645004272, 0.00020748376846313477, 0.0002353563904762268, 0.00026322901248931885, 0.0002911016345024109, 0.00031897425651550293, 0.00034684687852859497, 0.000374719500541687, 0.00040259212255477905, 0.0004304647445678711, 0.00045833736658096313, 0.0004862099885940552, 0.0005140826106071472, 0.0005419552326202393, 0.0005698278546333313, 0.0005977004766464233, 0.0006255730986595154, 0.0006534457206726074, 0.0006813183426856995, 0.0007091909646987915, 0.0007370635867118835, 0.0007649362087249756, 0.0007928088307380676, 0.0008206814527511597, 0.0008485540747642517, 0.0008764266967773438]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 11.0, 9.0, 16.0, 36.0, 41.0, 91.0, 152.0, 265.0, 579.0, 1754.0, 5615.0, 28630.0, 249955.0, 637819.0, 104114.0, 14168.0, 3299.0, 1079.0, 433.0, 215.0, 92.0, 77.0, 32.0, 26.0, 17.0, 11.0, 9.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5546875, -14.08984375, -13.625, -13.16015625, -12.6953125, -12.23046875, -11.765625, -11.30078125, -10.8359375, -10.37109375, -9.90625, -9.44140625, -8.9765625, -8.51171875, -8.046875, -7.58203125, -7.1171875, -6.65234375, -6.1875, -5.72265625, -5.2578125, -4.79296875, -4.328125, -3.86328125, -3.3984375, -2.93359375, -2.46875, -2.00390625, -1.5390625, -1.07421875, -0.609375, -0.14453125, 0.3203125, 0.78515625, 1.25, 1.71484375, 2.1796875, 2.64453125, 3.109375, 3.57421875, 4.0390625, 4.50390625, 4.96875, 5.43359375, 5.8984375, 6.36328125, 6.828125, 7.29296875, 7.7578125, 8.22265625, 8.6875, 9.15234375, 9.6171875, 10.08203125, 10.546875, 11.01171875, 11.4765625, 11.94140625, 12.40625, 12.87109375, 13.3359375, 13.80078125, 14.265625, 14.73046875, 15.1953125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 5.0, 4.0, 1.0, 6.0, 12.0, 10.0, 14.0, 19.0, 21.0, 42.0, 35.0, 56.0, 67.0, 74.0, 96.0, 103.0, 90.0, 80.0, 73.0, 59.0, 42.0, 36.0, 18.0, 8.0, 12.0, 7.0, 10.0, 7.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.72265625, -3.55877685546875, -3.3948974609375, -3.23101806640625, -3.067138671875, -2.90325927734375, -2.7393798828125, -2.57550048828125, -2.41162109375, -2.24774169921875, -2.0838623046875, -1.91998291015625, -1.756103515625, -1.59222412109375, -1.4283447265625, -1.26446533203125, -1.1005859375, -0.93670654296875, -0.7728271484375, -0.60894775390625, -0.445068359375, -0.28118896484375, -0.1173095703125, 0.04656982421875, 0.21044921875, 0.37432861328125, 0.5382080078125, 0.70208740234375, 0.865966796875, 1.02984619140625, 1.1937255859375, 1.35760498046875, 1.521484375, 1.68536376953125, 1.8492431640625, 2.01312255859375, 2.177001953125, 2.34088134765625, 2.5047607421875, 2.66864013671875, 2.83251953125, 2.99639892578125, 3.1602783203125, 3.32415771484375, 3.488037109375, 3.65191650390625, 3.8157958984375, 3.97967529296875, 4.1435546875, 4.30743408203125, 4.4713134765625, 4.63519287109375, 4.799072265625, 4.96295166015625, 5.1268310546875, 5.29071044921875, 5.45458984375, 5.61846923828125, 5.7823486328125, 5.94622802734375, 6.110107421875, 6.27398681640625, 6.4378662109375, 6.60174560546875, 6.765625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 3.0, 5.0, 6.0, 7.0, 10.0, 19.0, 34.0, 64.0, 76.0, 114.0, 134.0, 140.0, 137.0, 98.0, 75.0, 23.0, 28.0, 14.0, 8.0, 4.0, 1.0, 2.0, 0.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-77.63613891601562, -75.70919799804688, -73.78225708007812, -71.85531616210938, -69.92838287353516, -68.0014419555664, -66.07450103759766, -64.1475601196289, -62.220619201660156, -60.293678283691406, -58.36674118041992, -56.43980026245117, -54.51285934448242, -52.58592224121094, -50.65898132324219, -48.73204040527344, -46.80509948730469, -44.87815856933594, -42.95122146606445, -41.0242805480957, -39.09733963012695, -37.17040252685547, -35.24346160888672, -33.31652069091797, -31.389583587646484, -29.462644577026367, -27.535703659057617, -25.6087646484375, -23.68182373046875, -21.754884719848633, -19.827945709228516, -17.901004791259766, -15.974063873291016, -14.047123908996582, -12.120183944702148, -10.193244934082031, -8.266304016113281, -6.339365005493164, -4.4124250411987305, -2.485485076904297, -0.5585451126098633, 1.3683947324752808, 3.295334577560425, 5.222274303436279, 7.149214267730713, 9.076153755187988, 11.003093719482422, 12.930033683776855, 14.856973648071289, 16.783912658691406, 18.710853576660156, 20.637792587280273, 22.564733505249023, 24.49167251586914, 26.41861343383789, 28.345552444458008, 30.272491455078125, 32.199432373046875, 34.12636947631836, 36.05331039428711, 37.98025131225586, 39.907188415527344, 41.834129333496094, 43.761070251464844, 45.688011169433594]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 1.0, 7.0, 3.0, 14.0, 10.0, 11.0, 21.0, 19.0, 17.0, 30.0, 39.0, 39.0, 46.0, 46.0, 36.0, 48.0, 56.0, 56.0, 48.0, 47.0, 39.0, 48.0, 47.0, 37.0, 42.0, 29.0, 25.0, 26.0, 21.0, 21.0, 12.0, 14.0, 11.0, 9.0, 5.0, 4.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0], "bins": [-25.92521858215332, -25.13916778564453, -24.35311508178711, -23.56706428527832, -22.78101348876953, -21.99496078491211, -21.20890998840332, -20.42285919189453, -19.63680648803711, -18.85075569152832, -18.0647029876709, -17.27865219116211, -16.492599487304688, -15.706548690795898, -14.92049789428711, -14.134446144104004, -13.348394393920898, -12.562342643737793, -11.776290893554688, -10.990240097045898, -10.204188346862793, -9.418136596679688, -8.632085800170898, -7.846034049987793, -7.0599822998046875, -6.273930549621582, -5.487879276275635, -4.7018280029296875, -3.915776252746582, -3.1297247409820557, -2.3436732292175293, -1.557621955871582, -0.7715721130371094, 0.014479398727416992, 0.8005309104919434, 1.5865824222564697, 2.372633934020996, 3.1586854457855225, 3.944736957550049, 4.730788230895996, 5.516839981079102, 6.302891731262207, 7.088943004608154, 7.874994277954102, 8.661046028137207, 9.447097778320312, 10.233148574829102, 11.019200325012207, 11.805252075195312, 12.591303825378418, 13.377355575561523, 14.163406372070312, 14.949458122253418, 15.735509872436523, 16.521560668945312, 17.307613372802734, 18.093664169311523, 18.879714965820312, 19.665767669677734, 20.451818466186523, 21.237869262695312, 22.023921966552734, 22.809972763061523, 23.596023559570312, 24.382076263427734]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 6.0, 5.0, 4.0, 8.0, 9.0, 15.0, 12.0, 11.0, 24.0, 27.0, 36.0, 53.0, 78.0, 139.0, 304.0, 1047.0, 6634.0, 123080.0, 4004493.0, 53686.0, 3719.0, 587.0, 151.0, 70.0, 29.0, 29.0, 24.0, 7.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-66.5625, -65.062744140625, -63.56298828125, -62.063232421875, -60.5634765625, -59.063720703125, -57.56396484375, -56.064208984375, -54.564453125, -53.064697265625, -51.56494140625, -50.065185546875, -48.5654296875, -47.065673828125, -45.56591796875, -44.066162109375, -42.56640625, -41.066650390625, -39.56689453125, -38.067138671875, -36.5673828125, -35.067626953125, -33.56787109375, -32.068115234375, -30.568359375, -29.068603515625, -27.56884765625, -26.069091796875, -24.5693359375, -23.069580078125, -21.56982421875, -20.070068359375, -18.5703125, -17.070556640625, -15.57080078125, -14.071044921875, -12.5712890625, -11.071533203125, -9.57177734375, -8.072021484375, -6.572265625, -5.072509765625, -3.57275390625, -2.072998046875, -0.5732421875, 0.926513671875, 2.42626953125, 3.926025390625, 5.42578125, 6.925537109375, 8.42529296875, 9.925048828125, 11.4248046875, 12.924560546875, 14.42431640625, 15.924072265625, 17.423828125, 18.923583984375, 20.42333984375, 21.923095703125, 23.4228515625, 24.922607421875, 26.42236328125, 27.922119140625, 29.421875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 7.0, 7.0, 17.0, 21.0, 45.0, 66.0, 95.0, 133.0, 132.0, 120.0, 107.0, 88.0, 63.0, 37.0, 24.0, 24.0, 10.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.505859375, -2.45465087890625, -2.4034423828125, -2.35223388671875, -2.301025390625, -2.24981689453125, -2.1986083984375, -2.14739990234375, -2.09619140625, -2.04498291015625, -1.9937744140625, -1.94256591796875, -1.891357421875, -1.84014892578125, -1.7889404296875, -1.73773193359375, -1.6865234375, -1.63531494140625, -1.5841064453125, -1.53289794921875, -1.481689453125, -1.43048095703125, -1.3792724609375, -1.32806396484375, -1.27685546875, -1.22564697265625, -1.1744384765625, -1.12322998046875, -1.072021484375, -1.02081298828125, -0.9696044921875, -0.91839599609375, -0.8671875, -0.81597900390625, -0.7647705078125, -0.71356201171875, -0.662353515625, -0.61114501953125, -0.5599365234375, -0.50872802734375, -0.45751953125, -0.40631103515625, -0.3551025390625, -0.30389404296875, -0.252685546875, -0.20147705078125, -0.1502685546875, -0.09906005859375, -0.0478515625, 0.00335693359375, 0.0545654296875, 0.10577392578125, 0.156982421875, 0.20819091796875, 0.2593994140625, 0.31060791015625, 0.36181640625, 0.41302490234375, 0.4642333984375, 0.51544189453125, 0.566650390625, 0.61785888671875, 0.6690673828125, 0.72027587890625, 0.771484375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 5.0, 27.0, 27.0, 48.0, 65.0, 107.0, 188.0, 357.0, 1225.0, 9085.0, 263762.0, 3864433.0, 50366.0, 3365.0, 656.0, 239.0, 134.0, 74.0, 56.0, 22.0, 20.0, 11.0, 6.0, 7.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-61.5625, -60.140380859375, -58.71826171875, -57.296142578125, -55.8740234375, -54.451904296875, -53.02978515625, -51.607666015625, -50.185546875, -48.763427734375, -47.34130859375, -45.919189453125, -44.4970703125, -43.074951171875, -41.65283203125, -40.230712890625, -38.80859375, -37.386474609375, -35.96435546875, -34.542236328125, -33.1201171875, -31.697998046875, -30.27587890625, -28.853759765625, -27.431640625, -26.009521484375, -24.58740234375, -23.165283203125, -21.7431640625, -20.321044921875, -18.89892578125, -17.476806640625, -16.0546875, -14.632568359375, -13.21044921875, -11.788330078125, -10.3662109375, -8.944091796875, -7.52197265625, -6.099853515625, -4.677734375, -3.255615234375, -1.83349609375, -0.411376953125, 1.0107421875, 2.432861328125, 3.85498046875, 5.277099609375, 6.69921875, 8.121337890625, 9.54345703125, 10.965576171875, 12.3876953125, 13.809814453125, 15.23193359375, 16.654052734375, 18.076171875, 19.498291015625, 20.92041015625, 22.342529296875, 23.7646484375, 25.186767578125, 26.60888671875, 28.031005859375, 29.453125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 6.0, 10.0, 7.0, 7.0, 10.0, 28.0, 50.0, 62.0, 109.0, 191.0, 393.0, 1091.0, 1139.0, 425.0, 221.0, 125.0, 77.0, 50.0, 30.0, 16.0, 9.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.20703125, -5.088714599609375, -4.97039794921875, -4.852081298828125, -4.7337646484375, -4.615447998046875, -4.49713134765625, -4.378814697265625, -4.260498046875, -4.142181396484375, -4.02386474609375, -3.905548095703125, -3.7872314453125, -3.668914794921875, -3.55059814453125, -3.432281494140625, -3.31396484375, -3.195648193359375, -3.07733154296875, -2.959014892578125, -2.8406982421875, -2.722381591796875, -2.60406494140625, -2.485748291015625, -2.367431640625, -2.249114990234375, -2.13079833984375, -2.012481689453125, -1.8941650390625, -1.775848388671875, -1.65753173828125, -1.539215087890625, -1.4208984375, -1.302581787109375, -1.18426513671875, -1.065948486328125, -0.9476318359375, -0.829315185546875, -0.71099853515625, -0.592681884765625, -0.474365234375, -0.356048583984375, -0.23773193359375, -0.119415283203125, -0.0010986328125, 0.117218017578125, 0.23553466796875, 0.353851318359375, 0.47216796875, 0.590484619140625, 0.70880126953125, 0.827117919921875, 0.9454345703125, 1.063751220703125, 1.18206787109375, 1.300384521484375, 1.418701171875, 1.537017822265625, 1.65533447265625, 1.773651123046875, 1.8919677734375, 2.010284423828125, 2.12860107421875, 2.246917724609375, 2.365234375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 11.0, 27.0, 71.0, 162.0, 317.0, 259.0, 108.0, 33.0, 7.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.55364990234375, -71.60183715820312, -69.65001678466797, -67.69820404052734, -65.74638366699219, -63.7945671081543, -61.842750549316406, -59.89093780517578, -57.939117431640625, -55.987300872802734, -54.035484313964844, -52.08366775512695, -50.13185119628906, -48.18003463745117, -46.22821807861328, -44.276405334472656, -42.324588775634766, -40.372772216796875, -38.420955657958984, -36.469139099121094, -34.5173225402832, -32.56550598144531, -30.613691329956055, -28.661874771118164, -26.710058212280273, -24.758241653442383, -22.806425094604492, -20.854610443115234, -18.902793884277344, -16.950977325439453, -14.999160766601562, -13.047344207763672, -11.095527648925781, -9.14371109008789, -7.191895008087158, -5.240078926086426, -3.288262367248535, -1.3364458084106445, 0.6153697967529297, 2.5671863555908203, 4.519002914428711, 6.470819473266602, 8.422636032104492, 10.374451637268066, 12.326268196105957, 14.278084754943848, 16.229900360107422, 18.181716918945312, 20.133533477783203, 22.085350036621094, 24.037166595458984, 25.988983154296875, 27.940799713134766, 29.892616271972656, 31.844430923461914, 33.79624938964844, 35.74806213378906, 37.69987869262695, 39.651695251464844, 41.603511810302734, 43.555328369140625, 45.507144927978516, 47.458961486816406, 49.41077423095703, 51.36259460449219]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 5.0, 8.0, 12.0, 20.0, 24.0, 35.0, 50.0, 44.0, 50.0, 62.0, 59.0, 65.0, 82.0, 70.0, 69.0, 57.0, 62.0, 51.0, 38.0, 43.0, 17.0, 23.0, 20.0, 13.0, 4.0, 10.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.330360412597656, -15.811052322387695, -15.291744232177734, -14.772436141967773, -14.253128051757812, -13.733819961547852, -13.214512825012207, -12.695204734802246, -12.175896644592285, -11.656588554382324, -11.137280464172363, -10.617972373962402, -10.098665237426758, -9.579357147216797, -9.060049057006836, -8.540740966796875, -8.021432876586914, -7.502124786376953, -6.982816696166992, -6.4635090827941895, -5.9442009925842285, -5.424892902374268, -4.905585289001465, -4.386277198791504, -3.866969108581543, -3.347661018371582, -2.8283531665802, -2.3090453147888184, -1.7897372245788574, -1.2704291343688965, -0.7511212825775146, -0.2318134307861328, 0.2874927520751953, 0.8068007230758667, 1.326108694076538, 1.8454166650772095, 2.364724636077881, 2.884032726287842, 3.4033405780792236, 3.9226484298706055, 4.441956520080566, 4.961264610290527, 5.480572700500488, 5.999880313873291, 6.519188404083252, 7.038496494293213, 7.557804107666016, 8.077112197875977, 8.596420288085938, 9.115728378295898, 9.63503646850586, 10.15434455871582, 10.673652648925781, 11.192960739135742, 11.712267875671387, 12.231575965881348, 12.750884056091309, 13.27019214630127, 13.78950023651123, 14.308808326721191, 14.828115463256836, 15.347423553466797, 15.866731643676758, 16.38603973388672, 16.90534782409668]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 5.0, 3.0, 3.0, 6.0, 5.0, 6.0, 9.0, 7.0, 17.0, 13.0, 19.0, 23.0, 26.0, 24.0, 39.0, 71.0, 104.0, 260.0, 685.0, 2676.0, 14428.0, 100676.0, 491640.0, 365950.0, 59924.0, 9004.0, 1844.0, 501.0, 225.0, 117.0, 48.0, 39.0, 26.0, 23.0, 21.0, 23.0, 8.0, 11.0, 9.0, 11.0, 4.0, 6.0, 5.0, 7.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-15.984375, -15.498046875, -15.01171875, -14.525390625, -14.0390625, -13.552734375, -13.06640625, -12.580078125, -12.09375, -11.607421875, -11.12109375, -10.634765625, -10.1484375, -9.662109375, -9.17578125, -8.689453125, -8.203125, -7.716796875, -7.23046875, -6.744140625, -6.2578125, -5.771484375, -5.28515625, -4.798828125, -4.3125, -3.826171875, -3.33984375, -2.853515625, -2.3671875, -1.880859375, -1.39453125, -0.908203125, -0.421875, 0.064453125, 0.55078125, 1.037109375, 1.5234375, 2.009765625, 2.49609375, 2.982421875, 3.46875, 3.955078125, 4.44140625, 4.927734375, 5.4140625, 5.900390625, 6.38671875, 6.873046875, 7.359375, 7.845703125, 8.33203125, 8.818359375, 9.3046875, 9.791015625, 10.27734375, 10.763671875, 11.25, 11.736328125, 12.22265625, 12.708984375, 13.1953125, 13.681640625, 14.16796875, 14.654296875, 15.140625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 7.0, 7.0, 19.0, 35.0, 50.0, 72.0, 100.0, 125.0, 134.0, 112.0, 110.0, 79.0, 66.0, 42.0, 28.0, 13.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.833984375, -2.771820068359375, -2.70965576171875, -2.647491455078125, -2.5853271484375, -2.523162841796875, -2.46099853515625, -2.398834228515625, -2.336669921875, -2.274505615234375, -2.21234130859375, -2.150177001953125, -2.0880126953125, -2.025848388671875, -1.96368408203125, -1.901519775390625, -1.83935546875, -1.777191162109375, -1.71502685546875, -1.652862548828125, -1.5906982421875, -1.528533935546875, -1.46636962890625, -1.404205322265625, -1.342041015625, -1.279876708984375, -1.21771240234375, -1.155548095703125, -1.0933837890625, -1.031219482421875, -0.96905517578125, -0.906890869140625, -0.8447265625, -0.782562255859375, -0.72039794921875, -0.658233642578125, -0.5960693359375, -0.533905029296875, -0.47174072265625, -0.409576416015625, -0.347412109375, -0.285247802734375, -0.22308349609375, -0.160919189453125, -0.0987548828125, -0.036590576171875, 0.02557373046875, 0.087738037109375, 0.14990234375, 0.212066650390625, 0.27423095703125, 0.336395263671875, 0.3985595703125, 0.460723876953125, 0.52288818359375, 0.585052490234375, 0.647216796875, 0.709381103515625, 0.77154541015625, 0.833709716796875, 0.8958740234375, 0.958038330078125, 1.02020263671875, 1.082366943359375, 1.14453125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 8.0, 15.0, 13.0, 29.0, 47.0, 42.0, 92.0, 115.0, 165.0, 287.0, 407.0, 627.0, 1032.0, 1796.0, 3998.0, 11073.0, 35409.0, 116498.0, 301217.0, 346749.0, 154808.0, 48479.0, 14930.0, 5221.0, 2215.0, 1147.0, 689.0, 454.0, 315.0, 203.0, 147.0, 115.0, 74.0, 39.0, 32.0, 24.0, 8.0, 11.0, 9.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.6015625, -8.3419189453125, -8.082275390625, -7.8226318359375, -7.56298828125, -7.3033447265625, -7.043701171875, -6.7840576171875, -6.5244140625, -6.2647705078125, -6.005126953125, -5.7454833984375, -5.48583984375, -5.2261962890625, -4.966552734375, -4.7069091796875, -4.447265625, -4.1876220703125, -3.927978515625, -3.6683349609375, -3.40869140625, -3.1490478515625, -2.889404296875, -2.6297607421875, -2.3701171875, -2.1104736328125, -1.850830078125, -1.5911865234375, -1.33154296875, -1.0718994140625, -0.812255859375, -0.5526123046875, -0.29296875, -0.0333251953125, 0.226318359375, 0.4859619140625, 0.74560546875, 1.0052490234375, 1.264892578125, 1.5245361328125, 1.7841796875, 2.0438232421875, 2.303466796875, 2.5631103515625, 2.82275390625, 3.0823974609375, 3.342041015625, 3.6016845703125, 3.861328125, 4.1209716796875, 4.380615234375, 4.6402587890625, 4.89990234375, 5.1595458984375, 5.419189453125, 5.6788330078125, 5.9384765625, 6.1981201171875, 6.457763671875, 6.7174072265625, 6.97705078125, 7.2366943359375, 7.496337890625, 7.7559814453125, 8.015625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 10.0, 7.0, 8.0, 9.0, 10.0, 23.0, 16.0, 20.0, 32.0, 28.0, 28.0, 38.0, 34.0, 69.0, 40.0, 37.0, 54.0, 50.0, 59.0, 44.0, 43.0, 50.0, 39.0, 38.0, 35.0, 34.0, 29.0, 19.0, 17.0, 13.0, 9.0, 11.0, 10.0, 10.0, 4.0, 6.0, 9.0, 2.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.3515625, -5.20086669921875, -5.0501708984375, -4.89947509765625, -4.748779296875, -4.59808349609375, -4.4473876953125, -4.29669189453125, -4.14599609375, -3.99530029296875, -3.8446044921875, -3.69390869140625, -3.543212890625, -3.39251708984375, -3.2418212890625, -3.09112548828125, -2.9404296875, -2.78973388671875, -2.6390380859375, -2.48834228515625, -2.337646484375, -2.18695068359375, -2.0362548828125, -1.88555908203125, -1.73486328125, -1.58416748046875, -1.4334716796875, -1.28277587890625, -1.132080078125, -0.98138427734375, -0.8306884765625, -0.67999267578125, -0.529296875, -0.37860107421875, -0.2279052734375, -0.07720947265625, 0.073486328125, 0.22418212890625, 0.3748779296875, 0.52557373046875, 0.67626953125, 0.82696533203125, 0.9776611328125, 1.12835693359375, 1.279052734375, 1.42974853515625, 1.5804443359375, 1.73114013671875, 1.8818359375, 2.03253173828125, 2.1832275390625, 2.33392333984375, 2.484619140625, 2.63531494140625, 2.7860107421875, 2.93670654296875, 3.08740234375, 3.23809814453125, 3.3887939453125, 3.53948974609375, 3.690185546875, 3.84088134765625, 3.9915771484375, 4.14227294921875, 4.29296875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 5.0, 3.0, 1.0, 2.0, 5.0, 1.0, 4.0, 6.0, 10.0, 13.0, 18.0, 24.0, 34.0, 46.0, 60.0, 103.0, 143.0, 266.0, 367.0, 664.0, 1198.0, 2404.0, 5328.0, 14941.0, 48445.0, 175291.0, 402394.0, 275141.0, 82739.0, 23824.0, 8133.0, 3279.0, 1566.0, 822.0, 480.0, 278.0, 151.0, 106.0, 89.0, 51.0, 31.0, 25.0, 19.0, 15.0, 10.0, 6.0, 8.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.65234375, -6.42840576171875, -6.2044677734375, -5.98052978515625, -5.756591796875, -5.53265380859375, -5.3087158203125, -5.08477783203125, -4.86083984375, -4.63690185546875, -4.4129638671875, -4.18902587890625, -3.965087890625, -3.74114990234375, -3.5172119140625, -3.29327392578125, -3.0693359375, -2.84539794921875, -2.6214599609375, -2.39752197265625, -2.173583984375, -1.94964599609375, -1.7257080078125, -1.50177001953125, -1.27783203125, -1.05389404296875, -0.8299560546875, -0.60601806640625, -0.382080078125, -0.15814208984375, 0.0657958984375, 0.28973388671875, 0.513671875, 0.73760986328125, 0.9615478515625, 1.18548583984375, 1.409423828125, 1.63336181640625, 1.8572998046875, 2.08123779296875, 2.30517578125, 2.52911376953125, 2.7530517578125, 2.97698974609375, 3.200927734375, 3.42486572265625, 3.6488037109375, 3.87274169921875, 4.0966796875, 4.32061767578125, 4.5445556640625, 4.76849365234375, 4.992431640625, 5.21636962890625, 5.4403076171875, 5.66424560546875, 5.88818359375, 6.11212158203125, 6.3360595703125, 6.55999755859375, 6.783935546875, 7.00787353515625, 7.2318115234375, 7.45574951171875, 7.6796875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 5.0, 6.0, 11.0, 9.0, 18.0, 21.0, 23.0, 22.0, 51.0, 68.0, 76.0, 110.0, 108.0, 97.0, 79.0, 74.0, 63.0, 42.0, 25.0, 29.0, 19.0, 13.0, 6.0, 8.0, 4.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00153350830078125, -0.0014949813485145569, -0.0014564543962478638, -0.0014179274439811707, -0.0013794004917144775, -0.0013408735394477844, -0.0013023465871810913, -0.0012638196349143982, -0.001225292682647705, -0.001186765730381012, -0.0011482387781143188, -0.0011097118258476257, -0.0010711848735809326, -0.0010326579213142395, -0.0009941309690475464, -0.0009556040167808533, -0.0009170770645141602, -0.000878550112247467, -0.0008400231599807739, -0.0008014962077140808, -0.0007629692554473877, -0.0007244423031806946, -0.0006859153509140015, -0.0006473883986473083, -0.0006088614463806152, -0.0005703344941139221, -0.000531807541847229, -0.0004932805895805359, -0.0004547536373138428, -0.00041622668504714966, -0.00037769973278045654, -0.00033917278051376343, -0.0003006458282470703, -0.0002621188759803772, -0.00022359192371368408, -0.00018506497144699097, -0.00014653801918029785, -0.00010801106691360474, -6.948411464691162e-05, -3.0957162380218506e-05, 7.569789886474609e-06, 4.6096742153167725e-05, 8.462369441986084e-05, 0.00012315064668655396, 0.00016167759895324707, 0.00020020455121994019, 0.0002387315034866333, 0.0002772584557533264, 0.00031578540802001953, 0.00035431236028671265, 0.00039283931255340576, 0.0004313662648200989, 0.000469893217086792, 0.0005084201693534851, 0.0005469471216201782, 0.0005854740738868713, 0.0006240010261535645, 0.0006625279784202576, 0.0007010549306869507, 0.0007395818829536438, 0.0007781088352203369, 0.00081663578748703, 0.0008551627397537231, 0.0008936896920204163, 0.0009322166442871094]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 2.0, 4.0, 7.0, 5.0, 7.0, 19.0, 16.0, 29.0, 84.0, 114.0, 178.0, 344.0, 625.0, 1319.0, 3296.0, 11193.0, 61354.0, 390927.0, 473062.0, 84512.0, 14402.0, 4020.0, 1554.0, 667.0, 332.0, 196.0, 114.0, 49.0, 34.0, 34.0, 10.0, 10.0, 9.0, 8.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.8828125, -10.5435791015625, -10.204345703125, -9.8651123046875, -9.52587890625, -9.1866455078125, -8.847412109375, -8.5081787109375, -8.1689453125, -7.8297119140625, -7.490478515625, -7.1512451171875, -6.81201171875, -6.4727783203125, -6.133544921875, -5.7943115234375, -5.455078125, -5.1158447265625, -4.776611328125, -4.4373779296875, -4.09814453125, -3.7589111328125, -3.419677734375, -3.0804443359375, -2.7412109375, -2.4019775390625, -2.062744140625, -1.7235107421875, -1.38427734375, -1.0450439453125, -0.705810546875, -0.3665771484375, -0.02734375, 0.3118896484375, 0.651123046875, 0.9903564453125, 1.32958984375, 1.6688232421875, 2.008056640625, 2.3472900390625, 2.6865234375, 3.0257568359375, 3.364990234375, 3.7042236328125, 4.04345703125, 4.3826904296875, 4.721923828125, 5.0611572265625, 5.400390625, 5.7396240234375, 6.078857421875, 6.4180908203125, 6.75732421875, 7.0965576171875, 7.435791015625, 7.7750244140625, 8.1142578125, 8.4534912109375, 8.792724609375, 9.1319580078125, 9.47119140625, 9.8104248046875, 10.149658203125, 10.4888916015625, 10.828125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 5.0, 3.0, 7.0, 5.0, 13.0, 14.0, 14.0, 26.0, 46.0, 43.0, 61.0, 68.0, 88.0, 73.0, 81.0, 91.0, 77.0, 66.0, 45.0, 44.0, 43.0, 24.0, 19.0, 16.0, 10.0, 8.0, 2.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.203125, -4.0499267578125, -3.896728515625, -3.7435302734375, -3.59033203125, -3.4371337890625, -3.283935546875, -3.1307373046875, -2.9775390625, -2.8243408203125, -2.671142578125, -2.5179443359375, -2.36474609375, -2.2115478515625, -2.058349609375, -1.9051513671875, -1.751953125, -1.5987548828125, -1.445556640625, -1.2923583984375, -1.13916015625, -0.9859619140625, -0.832763671875, -0.6795654296875, -0.5263671875, -0.3731689453125, -0.219970703125, -0.0667724609375, 0.08642578125, 0.2396240234375, 0.392822265625, 0.5460205078125, 0.69921875, 0.8524169921875, 1.005615234375, 1.1588134765625, 1.31201171875, 1.4652099609375, 1.618408203125, 1.7716064453125, 1.9248046875, 2.0780029296875, 2.231201171875, 2.3843994140625, 2.53759765625, 2.6907958984375, 2.843994140625, 2.9971923828125, 3.150390625, 3.3035888671875, 3.456787109375, 3.6099853515625, 3.76318359375, 3.9163818359375, 4.069580078125, 4.2227783203125, 4.3759765625, 4.5291748046875, 4.682373046875, 4.8355712890625, 4.98876953125, 5.1419677734375, 5.295166015625, 5.4483642578125, 5.6015625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 12.0, 34.0, 73.0, 136.0, 230.0, 242.0, 135.0, 82.0, 25.0, 13.0, 9.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.122108459472656, -38.83321762084961, -35.54432678222656, -32.25543975830078, -28.966548919677734, -25.677658081054688, -22.388769149780273, -19.09988021850586, -15.810989379882812, -12.522099494934082, -9.233209609985352, -5.944319725036621, -2.6554298400878906, 0.6334609985351562, 3.9223499298095703, 7.211238861083984, 10.500129699707031, 13.789019584655762, 17.077909469604492, 20.366798400878906, 23.655689239501953, 26.944580078125, 30.233469009399414, 33.52235794067383, 36.811248779296875, 40.10013961791992, 43.38903045654297, 46.67791748046875, 49.9668083190918, 53.255699157714844, 56.544586181640625, 59.83347702026367, 63.12237548828125, 66.41126251220703, 69.70015716552734, 72.98904418945312, 76.27793884277344, 79.56682586669922, 82.855712890625, 86.14460754394531, 89.4334945678711, 92.72238159179688, 96.01127624511719, 99.30016326904297, 102.58905029296875, 105.87794494628906, 109.16683197021484, 112.45571899414062, 115.74461364746094, 119.03350067138672, 122.32239532470703, 125.61128234863281, 128.90017700195312, 132.18905639648438, 135.4779510498047, 138.766845703125, 142.05572509765625, 145.34461975097656, 148.6334991455078, 151.92239379882812, 155.21128845214844, 158.50018310546875, 161.7890625, 165.0779571533203, 168.36685180664062]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 7.0, 10.0, 11.0, 15.0, 18.0, 17.0, 14.0, 27.0, 38.0, 29.0, 32.0, 49.0, 44.0, 46.0, 38.0, 48.0, 50.0, 46.0, 46.0, 39.0, 49.0, 45.0, 44.0, 33.0, 32.0, 30.0, 25.0, 22.0, 22.0, 16.0, 9.0, 12.0, 8.0, 5.0, 2.0, 5.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-33.23662567138672, -32.14679718017578, -31.056968688964844, -29.967140197753906, -28.87731170654297, -27.78748321533203, -26.697654724121094, -25.607826232910156, -24.51799774169922, -23.42816925048828, -22.338340759277344, -21.248512268066406, -20.15868377685547, -19.06885528564453, -17.979026794433594, -16.889198303222656, -15.799367904663086, -14.709539413452148, -13.619710922241211, -12.529882431030273, -11.440053939819336, -10.350225448608398, -9.260396003723145, -8.170567512512207, -7.0807390213012695, -5.990910530090332, -4.9010820388793945, -3.811253070831299, -2.7214245796203613, -1.6315960884094238, -0.5417671203613281, 0.5480613708496094, 1.6378898620605469, 2.7277183532714844, 3.817547082901001, 4.907375812530518, 5.997204303741455, 7.087032794952393, 8.176861763000488, 9.266690254211426, 10.356518745422363, 11.4463472366333, 12.536175727844238, 13.626005172729492, 14.71583366394043, 15.805662155151367, 16.895490646362305, 17.985319137573242, 19.07514762878418, 20.164976119995117, 21.254804611206055, 22.344633102416992, 23.43446159362793, 24.524290084838867, 25.614120483398438, 26.703948974609375, 27.793777465820312, 28.88360595703125, 29.973434448242188, 31.063262939453125, 32.15309143066406, 33.242919921875, 34.33274841308594, 35.422576904296875, 36.51240539550781]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 4.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 4.0, 9.0, 11.0, 16.0, 22.0, 28.0, 25.0, 48.0, 55.0, 78.0, 132.0, 207.0, 451.0, 1203.0, 4306.0, 21919.0, 228801.0, 3773978.0, 142644.0, 16097.0, 2995.0, 734.0, 233.0, 95.0, 60.0, 43.0, 28.0, 17.0, 20.0, 5.0, 7.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.71875, -25.96435546875, -25.2099609375, -24.45556640625, -23.701171875, -22.94677734375, -22.1923828125, -21.43798828125, -20.68359375, -19.92919921875, -19.1748046875, -18.42041015625, -17.666015625, -16.91162109375, -16.1572265625, -15.40283203125, -14.6484375, -13.89404296875, -13.1396484375, -12.38525390625, -11.630859375, -10.87646484375, -10.1220703125, -9.36767578125, -8.61328125, -7.85888671875, -7.1044921875, -6.35009765625, -5.595703125, -4.84130859375, -4.0869140625, -3.33251953125, -2.578125, -1.82373046875, -1.0693359375, -0.31494140625, 0.439453125, 1.19384765625, 1.9482421875, 2.70263671875, 3.45703125, 4.21142578125, 4.9658203125, 5.72021484375, 6.474609375, 7.22900390625, 7.9833984375, 8.73779296875, 9.4921875, 10.24658203125, 11.0009765625, 11.75537109375, 12.509765625, 13.26416015625, 14.0185546875, 14.77294921875, 15.52734375, 16.28173828125, 17.0361328125, 17.79052734375, 18.544921875, 19.29931640625, 20.0537109375, 20.80810546875, 21.5625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 9.0, 9.0, 15.0, 26.0, 23.0, 51.0, 64.0, 72.0, 90.0, 108.0, 83.0, 88.0, 98.0, 82.0, 53.0, 44.0, 30.0, 26.0, 16.0, 11.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-2.689453125, -2.6338348388671875, -2.578216552734375, -2.5225982666015625, -2.46697998046875, -2.4113616943359375, -2.355743408203125, -2.3001251220703125, -2.2445068359375, -2.1888885498046875, -2.133270263671875, -2.0776519775390625, -2.02203369140625, -1.9664154052734375, -1.910797119140625, -1.8551788330078125, -1.799560546875, -1.7439422607421875, -1.688323974609375, -1.6327056884765625, -1.57708740234375, -1.5214691162109375, -1.465850830078125, -1.4102325439453125, -1.3546142578125, -1.2989959716796875, -1.243377685546875, -1.1877593994140625, -1.13214111328125, -1.0765228271484375, -1.020904541015625, -0.9652862548828125, -0.90966796875, -0.8540496826171875, -0.798431396484375, -0.7428131103515625, -0.68719482421875, -0.6315765380859375, -0.575958251953125, -0.5203399658203125, -0.4647216796875, -0.4091033935546875, -0.353485107421875, -0.2978668212890625, -0.24224853515625, -0.1866302490234375, -0.131011962890625, -0.0753936767578125, -0.019775390625, 0.0358428955078125, 0.091461181640625, 0.1470794677734375, 0.20269775390625, 0.2583160400390625, 0.313934326171875, 0.3695526123046875, 0.4251708984375, 0.4807891845703125, 0.536407470703125, 0.5920257568359375, 0.64764404296875, 0.7032623291015625, 0.758880615234375, 0.8144989013671875, 0.8701171875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 12.0, 10.0, 12.0, 24.0, 49.0, 87.0, 139.0, 260.0, 584.0, 1509.0, 6107.0, 43500.0, 996433.0, 3058689.0, 74936.0, 8811.0, 1900.0, 624.0, 281.0, 146.0, 68.0, 41.0, 28.0, 17.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-33.21875, -32.4482421875, -31.677734375, -30.9072265625, -30.13671875, -29.3662109375, -28.595703125, -27.8251953125, -27.0546875, -26.2841796875, -25.513671875, -24.7431640625, -23.97265625, -23.2021484375, -22.431640625, -21.6611328125, -20.890625, -20.1201171875, -19.349609375, -18.5791015625, -17.80859375, -17.0380859375, -16.267578125, -15.4970703125, -14.7265625, -13.9560546875, -13.185546875, -12.4150390625, -11.64453125, -10.8740234375, -10.103515625, -9.3330078125, -8.5625, -7.7919921875, -7.021484375, -6.2509765625, -5.48046875, -4.7099609375, -3.939453125, -3.1689453125, -2.3984375, -1.6279296875, -0.857421875, -0.0869140625, 0.68359375, 1.4541015625, 2.224609375, 2.9951171875, 3.765625, 4.5361328125, 5.306640625, 6.0771484375, 6.84765625, 7.6181640625, 8.388671875, 9.1591796875, 9.9296875, 10.7001953125, 11.470703125, 12.2412109375, 13.01171875, 13.7822265625, 14.552734375, 15.3232421875, 16.09375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 0.0, 1.0, 13.0, 12.0, 15.0, 15.0, 33.0, 49.0, 57.0, 84.0, 155.0, 244.0, 431.0, 1004.0, 919.0, 414.0, 208.0, 124.0, 86.0, 59.0, 42.0, 39.0, 29.0, 12.0, 12.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.873046875, -3.7711181640625, -3.669189453125, -3.5672607421875, -3.46533203125, -3.3634033203125, -3.261474609375, -3.1595458984375, -3.0576171875, -2.9556884765625, -2.853759765625, -2.7518310546875, -2.64990234375, -2.5479736328125, -2.446044921875, -2.3441162109375, -2.2421875, -2.1402587890625, -2.038330078125, -1.9364013671875, -1.83447265625, -1.7325439453125, -1.630615234375, -1.5286865234375, -1.4267578125, -1.3248291015625, -1.222900390625, -1.1209716796875, -1.01904296875, -0.9171142578125, -0.815185546875, -0.7132568359375, -0.611328125, -0.5093994140625, -0.407470703125, -0.3055419921875, -0.20361328125, -0.1016845703125, 0.000244140625, 0.1021728515625, 0.2041015625, 0.3060302734375, 0.407958984375, 0.5098876953125, 0.61181640625, 0.7137451171875, 0.815673828125, 0.9176025390625, 1.01953125, 1.1214599609375, 1.223388671875, 1.3253173828125, 1.42724609375, 1.5291748046875, 1.631103515625, 1.7330322265625, 1.8349609375, 1.9368896484375, 2.038818359375, 2.1407470703125, 2.24267578125, 2.3446044921875, 2.446533203125, 2.5484619140625, 2.650390625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 6.0, 6.0, 8.0, 21.0, 15.0, 22.0, 45.0, 75.0, 106.0, 121.0, 134.0, 129.0, 96.0, 74.0, 52.0, 36.0, 23.0, 14.0, 6.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.101402282714844, -22.324092864990234, -21.546783447265625, -20.76947593688965, -19.99216651916504, -19.21485710144043, -18.43754768371582, -17.660240173339844, -16.882930755615234, -16.105621337890625, -15.328312873840332, -14.551003456115723, -13.77369499206543, -12.99638557434082, -12.219076156616211, -11.441767692565918, -10.664458274841309, -9.8871488571167, -9.109840393066406, -8.332530975341797, -7.555222511291504, -6.7779130935668945, -6.000604152679443, -5.223295211791992, -4.445986270904541, -3.66867733001709, -2.8913683891296387, -2.1140592098236084, -1.3367502689361572, -0.559441328048706, 0.21786785125732422, 0.9951767921447754, 1.7724857330322266, 2.5497946739196777, 3.327103614807129, 4.104413032531738, 4.881721496582031, 5.659030914306641, 6.436339855194092, 7.213648796081543, 7.990957736968994, 8.768266677856445, 9.545576095581055, 10.322884559631348, 11.100193977355957, 11.87750244140625, 12.65481185913086, 13.432121276855469, 14.209429740905762, 14.986739158630371, 15.764047622680664, 16.541357040405273, 17.318666458129883, 18.09597396850586, 18.87328338623047, 19.650592803955078, 20.427902221679688, 21.205211639404297, 21.982521057128906, 22.759828567504883, 23.537137985229492, 24.3144474029541, 25.09175682067871, 25.869064331054688, 26.646373748779297]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 7.0, 7.0, 10.0, 7.0, 16.0, 20.0, 30.0, 27.0, 36.0, 46.0, 49.0, 51.0, 63.0, 52.0, 56.0, 73.0, 67.0, 61.0, 53.0, 50.0, 35.0, 40.0, 37.0, 40.0, 21.0, 12.0, 11.0, 10.0, 4.0, 6.0, 2.0, 1.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.743078231811523, -17.250381469726562, -16.757686614990234, -16.264989852905273, -15.772293090820312, -15.279597282409668, -14.786901473999023, -14.294204711914062, -13.801507949829102, -13.308812141418457, -12.816115379333496, -12.323419570922852, -11.83072280883789, -11.338027000427246, -10.845331192016602, -10.35263442993164, -9.859938621520996, -9.367242813110352, -8.87454605102539, -8.381850242614746, -7.889153480529785, -7.396457672119141, -6.903761386871338, -6.411065101623535, -5.918368816375732, -5.42567253112793, -4.932976245880127, -4.440279960632324, -3.9475839138031006, -3.454887628555298, -2.962191581726074, -2.4694952964782715, -1.9767999649047852, -1.4841036796569824, -0.9914075136184692, -0.49871134757995605, -0.00601506233215332, 0.4866812229156494, 0.979377269744873, 1.4720735549926758, 1.9647698402404785, 2.4574661254882812, 2.950162410736084, 3.4428584575653076, 3.9355547428131104, 4.428251266479492, 4.920947074890137, 5.4136433601379395, 5.906339645385742, 6.399035930633545, 6.891732215881348, 7.384428024291992, 7.877124786376953, 8.369820594787598, 8.862516403198242, 9.355213165283203, 9.847909927368164, 10.340605735778809, 10.83330249786377, 11.325998306274414, 11.818695068359375, 12.31139087677002, 12.804086685180664, 13.296783447265625, 13.78947925567627]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 8.0, 7.0, 12.0, 17.0, 22.0, 29.0, 43.0, 81.0, 180.0, 571.0, 2318.0, 12945.0, 108005.0, 553980.0, 320829.0, 41871.0, 5722.0, 1198.0, 347.0, 139.0, 76.0, 41.0, 32.0, 17.0, 13.0, 12.0, 11.0, 5.0, 11.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4453125, -12.9781494140625, -12.510986328125, -12.0438232421875, -11.57666015625, -11.1094970703125, -10.642333984375, -10.1751708984375, -9.7080078125, -9.2408447265625, -8.773681640625, -8.3065185546875, -7.83935546875, -7.3721923828125, -6.905029296875, -6.4378662109375, -5.970703125, -5.5035400390625, -5.036376953125, -4.5692138671875, -4.10205078125, -3.6348876953125, -3.167724609375, -2.7005615234375, -2.2333984375, -1.7662353515625, -1.299072265625, -0.8319091796875, -0.36474609375, 0.1024169921875, 0.569580078125, 1.0367431640625, 1.50390625, 1.9710693359375, 2.438232421875, 2.9053955078125, 3.37255859375, 3.8397216796875, 4.306884765625, 4.7740478515625, 5.2412109375, 5.7083740234375, 6.175537109375, 6.6427001953125, 7.10986328125, 7.5770263671875, 8.044189453125, 8.5113525390625, 8.978515625, 9.4456787109375, 9.912841796875, 10.3800048828125, 10.84716796875, 11.3143310546875, 11.781494140625, 12.2486572265625, 12.7158203125, 13.1829833984375, 13.650146484375, 14.1173095703125, 14.58447265625, 15.0516357421875, 15.518798828125, 15.9859619140625, 16.453125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 10.0, 7.0, 16.0, 24.0, 28.0, 38.0, 54.0, 60.0, 85.0, 101.0, 96.0, 97.0, 87.0, 81.0, 57.0, 47.0, 38.0, 27.0, 20.0, 11.0, 11.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.66796875, -2.60968017578125, -2.5513916015625, -2.49310302734375, -2.434814453125, -2.37652587890625, -2.3182373046875, -2.25994873046875, -2.20166015625, -2.14337158203125, -2.0850830078125, -2.02679443359375, -1.968505859375, -1.91021728515625, -1.8519287109375, -1.79364013671875, -1.7353515625, -1.67706298828125, -1.6187744140625, -1.56048583984375, -1.502197265625, -1.44390869140625, -1.3856201171875, -1.32733154296875, -1.26904296875, -1.21075439453125, -1.1524658203125, -1.09417724609375, -1.035888671875, -0.97760009765625, -0.9193115234375, -0.86102294921875, -0.802734375, -0.74444580078125, -0.6861572265625, -0.62786865234375, -0.569580078125, -0.51129150390625, -0.4530029296875, -0.39471435546875, -0.33642578125, -0.27813720703125, -0.2198486328125, -0.16156005859375, -0.103271484375, -0.04498291015625, 0.0133056640625, 0.07159423828125, 0.1298828125, 0.18817138671875, 0.2464599609375, 0.30474853515625, 0.363037109375, 0.42132568359375, 0.4796142578125, 0.53790283203125, 0.59619140625, 0.65447998046875, 0.7127685546875, 0.77105712890625, 0.829345703125, 0.88763427734375, 0.9459228515625, 1.00421142578125, 1.0625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 4.0, 7.0, 10.0, 18.0, 26.0, 31.0, 70.0, 105.0, 203.0, 307.0, 558.0, 944.0, 1916.0, 5007.0, 17167.0, 67795.0, 241204.0, 421359.0, 211307.0, 57681.0, 14640.0, 4315.0, 1737.0, 816.0, 490.0, 309.0, 207.0, 118.0, 73.0, 56.0, 33.0, 15.0, 15.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.328125, -8.063232421875, -7.79833984375, -7.533447265625, -7.2685546875, -7.003662109375, -6.73876953125, -6.473876953125, -6.208984375, -5.944091796875, -5.67919921875, -5.414306640625, -5.1494140625, -4.884521484375, -4.61962890625, -4.354736328125, -4.08984375, -3.824951171875, -3.56005859375, -3.295166015625, -3.0302734375, -2.765380859375, -2.50048828125, -2.235595703125, -1.970703125, -1.705810546875, -1.44091796875, -1.176025390625, -0.9111328125, -0.646240234375, -0.38134765625, -0.116455078125, 0.1484375, 0.413330078125, 0.67822265625, 0.943115234375, 1.2080078125, 1.472900390625, 1.73779296875, 2.002685546875, 2.267578125, 2.532470703125, 2.79736328125, 3.062255859375, 3.3271484375, 3.592041015625, 3.85693359375, 4.121826171875, 4.38671875, 4.651611328125, 4.91650390625, 5.181396484375, 5.4462890625, 5.711181640625, 5.97607421875, 6.240966796875, 6.505859375, 6.770751953125, 7.03564453125, 7.300537109375, 7.5654296875, 7.830322265625, 8.09521484375, 8.360107421875, 8.625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 6.0, 1.0, 7.0, 7.0, 8.0, 8.0, 8.0, 11.0, 9.0, 22.0, 18.0, 19.0, 26.0, 28.0, 28.0, 29.0, 33.0, 41.0, 47.0, 50.0, 48.0, 53.0, 31.0, 40.0, 34.0, 38.0, 38.0, 49.0, 30.0, 32.0, 33.0, 33.0, 20.0, 21.0, 22.0, 14.0, 14.0, 5.0, 7.0, 9.0, 3.0, 8.0, 5.0, 8.0, 4.0, 1.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.736328125, -3.587066650390625, -3.43780517578125, -3.288543701171875, -3.1392822265625, -2.990020751953125, -2.84075927734375, -2.691497802734375, -2.542236328125, -2.392974853515625, -2.24371337890625, -2.094451904296875, -1.9451904296875, -1.795928955078125, -1.64666748046875, -1.497406005859375, -1.34814453125, -1.198883056640625, -1.04962158203125, -0.900360107421875, -0.7510986328125, -0.601837158203125, -0.45257568359375, -0.303314208984375, -0.154052734375, -0.004791259765625, 0.14447021484375, 0.293731689453125, 0.4429931640625, 0.592254638671875, 0.74151611328125, 0.890777587890625, 1.0400390625, 1.189300537109375, 1.33856201171875, 1.487823486328125, 1.6370849609375, 1.786346435546875, 1.93560791015625, 2.084869384765625, 2.234130859375, 2.383392333984375, 2.53265380859375, 2.681915283203125, 2.8311767578125, 2.980438232421875, 3.12969970703125, 3.278961181640625, 3.42822265625, 3.577484130859375, 3.72674560546875, 3.876007080078125, 4.0252685546875, 4.174530029296875, 4.32379150390625, 4.473052978515625, 4.622314453125, 4.771575927734375, 4.92083740234375, 5.070098876953125, 5.2193603515625, 5.368621826171875, 5.51788330078125, 5.667144775390625, 5.81640625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 6.0, 5.0, 14.0, 14.0, 22.0, 28.0, 48.0, 78.0, 147.0, 187.0, 316.0, 502.0, 946.0, 1862.0, 4354.0, 11193.0, 34592.0, 123170.0, 355039.0, 346154.0, 117592.0, 32970.0, 10901.0, 4275.0, 1934.0, 953.0, 479.0, 280.0, 165.0, 109.0, 68.0, 40.0, 27.0, 22.0, 10.0, 9.0, 14.0, 10.0, 3.0, 7.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.41015625, -4.2630615234375, -4.115966796875, -3.9688720703125, -3.82177734375, -3.6746826171875, -3.527587890625, -3.3804931640625, -3.2333984375, -3.0863037109375, -2.939208984375, -2.7921142578125, -2.64501953125, -2.4979248046875, -2.350830078125, -2.2037353515625, -2.056640625, -1.9095458984375, -1.762451171875, -1.6153564453125, -1.46826171875, -1.3211669921875, -1.174072265625, -1.0269775390625, -0.8798828125, -0.7327880859375, -0.585693359375, -0.4385986328125, -0.29150390625, -0.1444091796875, 0.002685546875, 0.1497802734375, 0.296875, 0.4439697265625, 0.591064453125, 0.7381591796875, 0.88525390625, 1.0323486328125, 1.179443359375, 1.3265380859375, 1.4736328125, 1.6207275390625, 1.767822265625, 1.9149169921875, 2.06201171875, 2.2091064453125, 2.356201171875, 2.5032958984375, 2.650390625, 2.7974853515625, 2.944580078125, 3.0916748046875, 3.23876953125, 3.3858642578125, 3.532958984375, 3.6800537109375, 3.8271484375, 3.9742431640625, 4.121337890625, 4.2684326171875, 4.41552734375, 4.5626220703125, 4.709716796875, 4.8568115234375, 5.00390625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 0.0, 2.0, 6.0, 10.0, 7.0, 8.0, 6.0, 12.0, 25.0, 26.0, 28.0, 36.0, 21.0, 45.0, 52.0, 54.0, 74.0, 88.0, 73.0, 74.0, 64.0, 50.0, 35.0, 39.0, 27.0, 19.0, 28.0, 17.0, 19.0, 13.0, 4.0, 9.0, 6.0, 4.0, 6.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005822181701660156, -0.000563405454158783, -0.0005445927381515503, -0.0005257800221443176, -0.000506967306137085, -0.0004881545901298523, -0.00046934187412261963, -0.00045052915811538696, -0.0004317164421081543, -0.00041290372610092163, -0.00039409101009368896, -0.0003752782940864563, -0.00035646557807922363, -0.00033765286207199097, -0.0003188401460647583, -0.00030002743005752563, -0.00028121471405029297, -0.0002624019980430603, -0.00024358928203582764, -0.00022477656602859497, -0.0002059638500213623, -0.00018715113401412964, -0.00016833841800689697, -0.0001495257019996643, -0.00013071298599243164, -0.00011190026998519897, -9.308755397796631e-05, -7.427483797073364e-05, -5.5462121963500977e-05, -3.664940595626831e-05, -1.7836689949035645e-05, 9.760260581970215e-07, 1.9788742065429688e-05, 3.8601458072662354e-05, 5.741417407989502e-05, 7.622689008712769e-05, 9.503960609436035e-05, 0.00011385232210159302, 0.00013266503810882568, 0.00015147775411605835, 0.00017029047012329102, 0.00018910318613052368, 0.00020791590213775635, 0.00022672861814498901, 0.0002455413341522217, 0.00026435405015945435, 0.000283166766166687, 0.0003019794821739197, 0.00032079219818115234, 0.000339604914188385, 0.0003584176301956177, 0.00037723034620285034, 0.000396043062210083, 0.0004148557782173157, 0.00043366849422454834, 0.000452481210231781, 0.00047129392623901367, 0.0004901066422462463, 0.000508919358253479, 0.0005277320742607117, 0.0005465447902679443, 0.000565357506275177, 0.0005841702222824097, 0.0006029829382896423, 0.000621795654296875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 5.0, 3.0, 3.0, 12.0, 11.0, 14.0, 12.0, 33.0, 59.0, 63.0, 98.0, 156.0, 239.0, 370.0, 695.0, 1311.0, 2829.0, 6973.0, 20232.0, 68859.0, 265531.0, 440823.0, 172168.0, 44516.0, 13726.0, 5115.0, 2128.0, 1067.0, 536.0, 324.0, 238.0, 137.0, 106.0, 47.0, 37.0, 24.0, 14.0, 17.0, 8.0, 9.0, 5.0, 7.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4296875, -5.26678466796875, -5.1038818359375, -4.94097900390625, -4.778076171875, -4.61517333984375, -4.4522705078125, -4.28936767578125, -4.12646484375, -3.96356201171875, -3.8006591796875, -3.63775634765625, -3.474853515625, -3.31195068359375, -3.1490478515625, -2.98614501953125, -2.8232421875, -2.66033935546875, -2.4974365234375, -2.33453369140625, -2.171630859375, -2.00872802734375, -1.8458251953125, -1.68292236328125, -1.52001953125, -1.35711669921875, -1.1942138671875, -1.03131103515625, -0.868408203125, -0.70550537109375, -0.5426025390625, -0.37969970703125, -0.216796875, -0.05389404296875, 0.1090087890625, 0.27191162109375, 0.434814453125, 0.59771728515625, 0.7606201171875, 0.92352294921875, 1.08642578125, 1.24932861328125, 1.4122314453125, 1.57513427734375, 1.738037109375, 1.90093994140625, 2.0638427734375, 2.22674560546875, 2.3896484375, 2.55255126953125, 2.7154541015625, 2.87835693359375, 3.041259765625, 3.20416259765625, 3.3670654296875, 3.52996826171875, 3.69287109375, 3.85577392578125, 4.0186767578125, 4.18157958984375, 4.344482421875, 4.50738525390625, 4.6702880859375, 4.83319091796875, 4.99609375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 1.0, 1.0, 5.0, 0.0, 6.0, 4.0, 12.0, 9.0, 15.0, 11.0, 15.0, 13.0, 22.0, 31.0, 38.0, 44.0, 51.0, 49.0, 51.0, 62.0, 64.0, 55.0, 52.0, 54.0, 57.0, 39.0, 38.0, 40.0, 27.0, 25.0, 34.0, 13.0, 13.0, 17.0, 8.0, 5.0, 8.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.9765625, -2.89385986328125, -2.8111572265625, -2.72845458984375, -2.645751953125, -2.56304931640625, -2.4803466796875, -2.39764404296875, -2.31494140625, -2.23223876953125, -2.1495361328125, -2.06683349609375, -1.984130859375, -1.90142822265625, -1.8187255859375, -1.73602294921875, -1.6533203125, -1.57061767578125, -1.4879150390625, -1.40521240234375, -1.322509765625, -1.23980712890625, -1.1571044921875, -1.07440185546875, -0.99169921875, -0.90899658203125, -0.8262939453125, -0.74359130859375, -0.660888671875, -0.57818603515625, -0.4954833984375, -0.41278076171875, -0.330078125, -0.24737548828125, -0.1646728515625, -0.08197021484375, 0.000732421875, 0.08343505859375, 0.1661376953125, 0.24884033203125, 0.33154296875, 0.41424560546875, 0.4969482421875, 0.57965087890625, 0.662353515625, 0.74505615234375, 0.8277587890625, 0.91046142578125, 0.9931640625, 1.07586669921875, 1.1585693359375, 1.24127197265625, 1.323974609375, 1.40667724609375, 1.4893798828125, 1.57208251953125, 1.65478515625, 1.73748779296875, 1.8201904296875, 1.90289306640625, 1.985595703125, 2.06829833984375, 2.1510009765625, 2.23370361328125, 2.31640625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 14.0, 60.0, 169.0, 283.0, 274.0, 134.0, 52.0, 8.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-90.43489074707031, -86.2886962890625, -82.14250946044922, -77.99632263183594, -73.85012817382812, -69.70393371582031, -65.55774688720703, -61.411556243896484, -57.26536560058594, -53.11917495727539, -48.972984313964844, -44.8267936706543, -40.68060302734375, -36.5344123840332, -32.388221740722656, -28.24203109741211, -24.095840454101562, -19.949649810791016, -15.803459167480469, -11.657268524169922, -7.511077880859375, -3.364887237548828, 0.7813034057617188, 4.927494049072266, 9.073684692382812, 13.21987533569336, 17.366065979003906, 21.512256622314453, 25.658447265625, 29.804637908935547, 33.950828552246094, 38.09701919555664, 42.243194580078125, 46.38938522338867, 50.53557586669922, 54.681766510009766, 58.82795715332031, 62.97414779663086, 67.1203384399414, 71.26652526855469, 75.4127197265625, 79.55891418457031, 83.7051010131836, 87.85128784179688, 91.99748229980469, 96.1436767578125, 100.28986358642578, 104.43605041503906, 108.58224487304688, 112.72843933105469, 116.87462615966797, 121.02081298828125, 125.16700744628906, 129.31320190429688, 133.45938110351562, 137.60557556152344, 141.75177001953125, 145.89796447753906, 150.04415893554688, 154.19033813476562, 158.33653259277344, 162.48272705078125, 166.62890625, 170.7751007080078, 174.92129516601562]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 6.0, 8.0, 9.0, 8.0, 14.0, 5.0, 8.0, 24.0, 25.0, 28.0, 32.0, 46.0, 36.0, 51.0, 50.0, 61.0, 55.0, 53.0, 42.0, 56.0, 53.0, 38.0, 48.0, 50.0, 34.0, 27.0, 22.0, 21.0, 19.0, 24.0, 9.0, 12.0, 8.0, 4.0, 7.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.51953887939453, -31.402442932128906, -30.28534698486328, -29.168251037597656, -28.05115509033203, -26.934059143066406, -25.81696128845215, -24.699865341186523, -23.5827693939209, -22.465673446655273, -21.34857749938965, -20.231481552124023, -19.114383697509766, -17.99728775024414, -16.880191802978516, -15.76309585571289, -14.645999908447266, -13.52890396118164, -12.411808013916016, -11.294711112976074, -10.17761516571045, -9.060519218444824, -7.943422794342041, -6.826326370239258, -5.709230422973633, -4.592134475708008, -3.4750380516052246, -2.3579418659210205, -1.2408456802368164, -0.1237497329711914, 0.9933466911315918, 2.110443115234375, 3.2275352478027344, 4.344631195068359, 5.461727619171143, 6.578824043273926, 7.695919990539551, 8.813015937805176, 9.930112838745117, 11.047208786010742, 12.164304733276367, 13.281400680541992, 14.398496627807617, 15.515593528747559, 16.6326904296875, 17.749786376953125, 18.86688232421875, 19.983978271484375, 21.10107421875, 22.218170166015625, 23.33526611328125, 24.452362060546875, 25.5694580078125, 26.686553955078125, 27.803651809692383, 28.920747756958008, 30.037843704223633, 31.154939651489258, 32.272037506103516, 33.38913345336914, 34.506229400634766, 35.62332534790039, 36.740421295166016, 37.85751724243164, 38.974613189697266]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 9.0, 7.0, 5.0, 4.0, 8.0, 11.0, 15.0, 11.0, 23.0, 38.0, 55.0, 94.0, 97.0, 205.0, 313.0, 729.0, 1502.0, 3974.0, 12734.0, 61505.0, 1020451.0, 2978733.0, 89822.0, 16358.0, 4549.0, 1706.0, 691.0, 313.0, 151.0, 71.0, 41.0, 25.0, 15.0, 8.0, 4.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.171875, -16.763916015625, -16.35595703125, -15.947998046875, -15.5400390625, -15.132080078125, -14.72412109375, -14.316162109375, -13.908203125, -13.500244140625, -13.09228515625, -12.684326171875, -12.2763671875, -11.868408203125, -11.46044921875, -11.052490234375, -10.64453125, -10.236572265625, -9.82861328125, -9.420654296875, -9.0126953125, -8.604736328125, -8.19677734375, -7.788818359375, -7.380859375, -6.972900390625, -6.56494140625, -6.156982421875, -5.7490234375, -5.341064453125, -4.93310546875, -4.525146484375, -4.1171875, -3.709228515625, -3.30126953125, -2.893310546875, -2.4853515625, -2.077392578125, -1.66943359375, -1.261474609375, -0.853515625, -0.445556640625, -0.03759765625, 0.370361328125, 0.7783203125, 1.186279296875, 1.59423828125, 2.002197265625, 2.41015625, 2.818115234375, 3.22607421875, 3.634033203125, 4.0419921875, 4.449951171875, 4.85791015625, 5.265869140625, 5.673828125, 6.081787109375, 6.48974609375, 6.897705078125, 7.3056640625, 7.713623046875, 8.12158203125, 8.529541015625, 8.9375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 7.0, 11.0, 18.0, 37.0, 26.0, 60.0, 63.0, 75.0, 87.0, 76.0, 89.0, 84.0, 78.0, 76.0, 62.0, 37.0, 37.0, 27.0, 14.0, 12.0, 8.0, 8.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.41015625, -2.3556671142578125, -2.301177978515625, -2.2466888427734375, -2.19219970703125, -2.1377105712890625, -2.083221435546875, -2.0287322998046875, -1.9742431640625, -1.9197540283203125, -1.865264892578125, -1.8107757568359375, -1.75628662109375, -1.7017974853515625, -1.647308349609375, -1.5928192138671875, -1.538330078125, -1.4838409423828125, -1.429351806640625, -1.3748626708984375, -1.32037353515625, -1.2658843994140625, -1.211395263671875, -1.1569061279296875, -1.1024169921875, -1.0479278564453125, -0.993438720703125, -0.9389495849609375, -0.88446044921875, -0.8299713134765625, -0.775482177734375, -0.7209930419921875, -0.66650390625, -0.6120147705078125, -0.557525634765625, -0.5030364990234375, -0.44854736328125, -0.3940582275390625, -0.339569091796875, -0.2850799560546875, -0.2305908203125, -0.1761016845703125, -0.121612548828125, -0.0671234130859375, -0.01263427734375, 0.0418548583984375, 0.096343994140625, 0.1508331298828125, 0.205322265625, 0.2598114013671875, 0.314300537109375, 0.3687896728515625, 0.42327880859375, 0.4777679443359375, 0.532257080078125, 0.5867462158203125, 0.6412353515625, 0.6957244873046875, 0.750213623046875, 0.8047027587890625, 0.85919189453125, 0.9136810302734375, 0.968170166015625, 1.0226593017578125, 1.0771484375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 7.0, 14.0, 8.0, 13.0, 14.0, 24.0, 39.0, 54.0, 110.0, 292.0, 1521.0, 20286.0, 3648866.0, 514046.0, 7579.0, 875.0, 212.0, 92.0, 70.0, 46.0, 39.0, 23.0, 16.0, 22.0, 10.0, 4.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.28125, -14.251953125, -13.22265625, -12.193359375, -11.1640625, -10.134765625, -9.10546875, -8.076171875, -7.046875, -6.017578125, -4.98828125, -3.958984375, -2.9296875, -1.900390625, -0.87109375, 0.158203125, 1.1875, 2.216796875, 3.24609375, 4.275390625, 5.3046875, 6.333984375, 7.36328125, 8.392578125, 9.421875, 10.451171875, 11.48046875, 12.509765625, 13.5390625, 14.568359375, 15.59765625, 16.626953125, 17.65625, 18.685546875, 19.71484375, 20.744140625, 21.7734375, 22.802734375, 23.83203125, 24.861328125, 25.890625, 26.919921875, 27.94921875, 28.978515625, 30.0078125, 31.037109375, 32.06640625, 33.095703125, 34.125, 35.154296875, 36.18359375, 37.212890625, 38.2421875, 39.271484375, 40.30078125, 41.330078125, 42.359375, 43.388671875, 44.41796875, 45.447265625, 46.4765625, 47.505859375, 48.53515625, 49.564453125, 50.59375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 14.0, 26.0, 55.0, 158.0, 415.0, 1871.0, 1056.0, 286.0, 119.0, 51.0, 17.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3984375, -2.196044921875, -1.99365234375, -1.791259765625, -1.5888671875, -1.386474609375, -1.18408203125, -0.981689453125, -0.779296875, -0.576904296875, -0.37451171875, -0.172119140625, 0.0302734375, 0.232666015625, 0.43505859375, 0.637451171875, 0.83984375, 1.042236328125, 1.24462890625, 1.447021484375, 1.6494140625, 1.851806640625, 2.05419921875, 2.256591796875, 2.458984375, 2.661376953125, 2.86376953125, 3.066162109375, 3.2685546875, 3.470947265625, 3.67333984375, 3.875732421875, 4.078125, 4.280517578125, 4.48291015625, 4.685302734375, 4.8876953125, 5.090087890625, 5.29248046875, 5.494873046875, 5.697265625, 5.899658203125, 6.10205078125, 6.304443359375, 6.5068359375, 6.709228515625, 6.91162109375, 7.114013671875, 7.31640625, 7.518798828125, 7.72119140625, 7.923583984375, 8.1259765625, 8.328369140625, 8.53076171875, 8.733154296875, 8.935546875, 9.137939453125, 9.34033203125, 9.542724609375, 9.7451171875, 9.947509765625, 10.14990234375, 10.352294921875, 10.5546875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 33.0, 126.0, 326.0, 324.0, 137.0, 37.0, 13.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.69554901123047, -78.90499877929688, -77.11444854736328, -75.32389831542969, -73.5333480834961, -71.7427978515625, -69.9522476196289, -68.16169738769531, -66.37114715576172, -64.58059692382812, -62.79004669189453, -60.99949645996094, -59.208946228027344, -57.41839599609375, -55.627845764160156, -53.83729553222656, -52.0467414855957, -50.25619125366211, -48.465641021728516, -46.67509078979492, -44.88454055786133, -43.093990325927734, -41.303436279296875, -39.51288604736328, -37.72233581542969, -35.931785583496094, -34.1412353515625, -32.350685119628906, -30.560134887695312, -28.76958465576172, -26.979032516479492, -25.1884822845459, -23.397933959960938, -21.607383728027344, -19.81683349609375, -18.026283264160156, -16.235733032226562, -14.445181846618652, -12.654630661010742, -10.864080429077148, -9.073530197143555, -7.282979965209961, -5.492429256439209, -3.701878547668457, -1.9113283157348633, -0.12077808380126953, 1.6697731018066406, 3.4603233337402344, 5.250873565673828, 7.041423797607422, 8.831974029541016, 10.622525215148926, 12.41307544708252, 14.203625679016113, 15.994176864624023, 17.784727096557617, 19.57527732849121, 21.365827560424805, 23.1563777923584, 24.946929931640625, 26.73748016357422, 28.528030395507812, 30.318580627441406, 32.109130859375, 33.899681091308594]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 0.0, 7.0, 9.0, 17.0, 22.0, 31.0, 26.0, 37.0, 44.0, 67.0, 70.0, 81.0, 75.0, 81.0, 78.0, 77.0, 70.0, 55.0, 41.0, 25.0, 21.0, 26.0, 12.0, 13.0, 5.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.844722747802734, -20.35968017578125, -19.874637603759766, -19.38959503173828, -18.904552459716797, -18.419509887695312, -17.934467315673828, -17.449424743652344, -16.96438217163086, -16.479339599609375, -15.99429702758789, -15.509254455566406, -15.024211883544922, -14.539169311523438, -14.054125785827637, -13.569083213806152, -13.084039688110352, -12.598997116088867, -12.113954544067383, -11.628911972045898, -11.143869400024414, -10.65882682800293, -10.173783302307129, -9.688740730285645, -9.20369815826416, -8.718655586242676, -8.233613014221191, -7.748569965362549, -7.2635273933410645, -6.77848482131958, -6.2934417724609375, -5.808399200439453, -5.323356628417969, -4.838314056396484, -4.353271484375, -3.8682284355163574, -3.383185863494873, -2.8981432914733887, -2.413100481033325, -1.9280576705932617, -1.4430150985717773, -0.9579724073410034, -0.4729297161102295, 0.012112975120544434, 0.49715566635131836, 0.9821982383728027, 1.4672410488128662, 1.9522838592529297, 2.437326431274414, 2.9223690032958984, 3.407411813735962, 3.8924546241760254, 4.37749719619751, 4.862539768218994, 5.347582817077637, 5.832625389099121, 6.3176679611206055, 6.80271053314209, 7.287753105163574, 7.772796154022217, 8.25783920288086, 8.742881774902344, 9.227924346923828, 9.712966918945312, 10.198009490966797]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 4.0, 5.0, 6.0, 9.0, 13.0, 11.0, 14.0, 11.0, 31.0, 22.0, 55.0, 71.0, 140.0, 270.0, 440.0, 978.0, 2512.0, 7451.0, 26396.0, 98866.0, 304075.0, 390569.0, 155712.0, 43036.0, 11680.0, 3585.0, 1308.0, 591.0, 279.0, 148.0, 92.0, 45.0, 33.0, 29.0, 14.0, 8.0, 4.0, 9.0, 5.0, 9.0, 1.0, 3.0, 1.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-8.7890625, -8.5072021484375, -8.225341796875, -7.9434814453125, -7.66162109375, -7.3797607421875, -7.097900390625, -6.8160400390625, -6.5341796875, -6.2523193359375, -5.970458984375, -5.6885986328125, -5.40673828125, -5.1248779296875, -4.843017578125, -4.5611572265625, -4.279296875, -3.9974365234375, -3.715576171875, -3.4337158203125, -3.15185546875, -2.8699951171875, -2.588134765625, -2.3062744140625, -2.0244140625, -1.7425537109375, -1.460693359375, -1.1788330078125, -0.89697265625, -0.6151123046875, -0.333251953125, -0.0513916015625, 0.23046875, 0.5123291015625, 0.794189453125, 1.0760498046875, 1.35791015625, 1.6397705078125, 1.921630859375, 2.2034912109375, 2.4853515625, 2.7672119140625, 3.049072265625, 3.3309326171875, 3.61279296875, 3.8946533203125, 4.176513671875, 4.4583740234375, 4.740234375, 5.0220947265625, 5.303955078125, 5.5858154296875, 5.86767578125, 6.1495361328125, 6.431396484375, 6.7132568359375, 6.9951171875, 7.2769775390625, 7.558837890625, 7.8406982421875, 8.12255859375, 8.4044189453125, 8.686279296875, 8.9681396484375, 9.25]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 6.0, 11.0, 12.0, 19.0, 22.0, 33.0, 32.0, 43.0, 57.0, 69.0, 63.0, 66.0, 58.0, 74.0, 64.0, 72.0, 50.0, 41.0, 56.0, 37.0, 34.0, 16.0, 15.0, 20.0, 9.0, 2.0, 9.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9208984375, -1.8760147094726562, -1.8311309814453125, -1.7862472534179688, -1.741363525390625, -1.6964797973632812, -1.6515960693359375, -1.6067123413085938, -1.56182861328125, -1.5169448852539062, -1.4720611572265625, -1.4271774291992188, -1.382293701171875, -1.3374099731445312, -1.2925262451171875, -1.2476425170898438, -1.2027587890625, -1.1578750610351562, -1.1129913330078125, -1.0681076049804688, -1.023223876953125, -0.9783401489257812, -0.9334564208984375, -0.8885726928710938, -0.84368896484375, -0.7988052368164062, -0.7539215087890625, -0.7090377807617188, -0.664154052734375, -0.6192703247070312, -0.5743865966796875, -0.5295028686523438, -0.484619140625, -0.43973541259765625, -0.3948516845703125, -0.34996795654296875, -0.305084228515625, -0.26020050048828125, -0.2153167724609375, -0.17043304443359375, -0.12554931640625, -0.08066558837890625, -0.0357818603515625, 0.00910186767578125, 0.053985595703125, 0.09886932373046875, 0.1437530517578125, 0.18863677978515625, 0.2335205078125, 0.27840423583984375, 0.3232879638671875, 0.36817169189453125, 0.413055419921875, 0.45793914794921875, 0.5028228759765625, 0.5477066040039062, 0.59259033203125, 0.6374740600585938, 0.6823577880859375, 0.7272415161132812, 0.772125244140625, 0.8170089721679688, 0.8618927001953125, 0.9067764282226562, 0.95166015625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 5.0, 3.0, 9.0, 9.0, 15.0, 12.0, 22.0, 35.0, 42.0, 74.0, 74.0, 109.0, 152.0, 192.0, 301.0, 411.0, 599.0, 976.0, 1608.0, 3024.0, 6294.0, 14880.0, 36271.0, 88433.0, 189623.0, 288859.0, 223581.0, 110955.0, 46424.0, 18743.0, 7779.0, 3725.0, 1911.0, 1076.0, 701.0, 443.0, 338.0, 220.0, 162.0, 131.0, 83.0, 69.0, 50.0, 32.0, 24.0, 24.0, 20.0, 5.0, 10.0, 8.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-5.3203125, -5.15728759765625, -4.9942626953125, -4.83123779296875, -4.668212890625, -4.50518798828125, -4.3421630859375, -4.17913818359375, -4.01611328125, -3.85308837890625, -3.6900634765625, -3.52703857421875, -3.364013671875, -3.20098876953125, -3.0379638671875, -2.87493896484375, -2.7119140625, -2.54888916015625, -2.3858642578125, -2.22283935546875, -2.059814453125, -1.89678955078125, -1.7337646484375, -1.57073974609375, -1.40771484375, -1.24468994140625, -1.0816650390625, -0.91864013671875, -0.755615234375, -0.59259033203125, -0.4295654296875, -0.26654052734375, -0.103515625, 0.05950927734375, 0.2225341796875, 0.38555908203125, 0.548583984375, 0.71160888671875, 0.8746337890625, 1.03765869140625, 1.20068359375, 1.36370849609375, 1.5267333984375, 1.68975830078125, 1.852783203125, 2.01580810546875, 2.1788330078125, 2.34185791015625, 2.5048828125, 2.66790771484375, 2.8309326171875, 2.99395751953125, 3.156982421875, 3.32000732421875, 3.4830322265625, 3.64605712890625, 3.80908203125, 3.97210693359375, 4.1351318359375, 4.29815673828125, 4.461181640625, 4.62420654296875, 4.7872314453125, 4.95025634765625, 5.11328125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 5.0, 5.0, 9.0, 7.0, 10.0, 14.0, 14.0, 13.0, 28.0, 21.0, 28.0, 32.0, 27.0, 33.0, 48.0, 52.0, 47.0, 49.0, 55.0, 36.0, 52.0, 43.0, 47.0, 44.0, 31.0, 32.0, 42.0, 13.0, 22.0, 21.0, 26.0, 19.0, 14.0, 12.0, 12.0, 9.0, 6.0, 5.0, 4.0, 3.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.17578125, -5.02777099609375, -4.8797607421875, -4.73175048828125, -4.583740234375, -4.43572998046875, -4.2877197265625, -4.13970947265625, -3.99169921875, -3.84368896484375, -3.6956787109375, -3.54766845703125, -3.399658203125, -3.25164794921875, -3.1036376953125, -2.95562744140625, -2.8076171875, -2.65960693359375, -2.5115966796875, -2.36358642578125, -2.215576171875, -2.06756591796875, -1.9195556640625, -1.77154541015625, -1.62353515625, -1.47552490234375, -1.3275146484375, -1.17950439453125, -1.031494140625, -0.88348388671875, -0.7354736328125, -0.58746337890625, -0.439453125, -0.29144287109375, -0.1434326171875, 0.00457763671875, 0.152587890625, 0.30059814453125, 0.4486083984375, 0.59661865234375, 0.74462890625, 0.89263916015625, 1.0406494140625, 1.18865966796875, 1.336669921875, 1.48468017578125, 1.6326904296875, 1.78070068359375, 1.9287109375, 2.07672119140625, 2.2247314453125, 2.37274169921875, 2.520751953125, 2.66876220703125, 2.8167724609375, 2.96478271484375, 3.11279296875, 3.26080322265625, 3.4088134765625, 3.55682373046875, 3.704833984375, 3.85284423828125, 4.0008544921875, 4.14886474609375, 4.296875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 7.0, 6.0, 9.0, 6.0, 12.0, 17.0, 24.0, 30.0, 48.0, 82.0, 122.0, 198.0, 334.0, 568.0, 989.0, 2036.0, 4177.0, 9476.0, 23936.0, 67013.0, 187016.0, 354606.0, 247188.0, 94163.0, 32857.0, 12755.0, 5386.0, 2502.0, 1256.0, 722.0, 380.0, 245.0, 137.0, 72.0, 63.0, 38.0, 16.0, 27.0, 12.0, 9.0, 5.0, 9.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.4375, -3.332244873046875, -3.22698974609375, -3.121734619140625, -3.0164794921875, -2.911224365234375, -2.80596923828125, -2.700714111328125, -2.595458984375, -2.490203857421875, -2.38494873046875, -2.279693603515625, -2.1744384765625, -2.069183349609375, -1.96392822265625, -1.858673095703125, -1.75341796875, -1.648162841796875, -1.54290771484375, -1.437652587890625, -1.3323974609375, -1.227142333984375, -1.12188720703125, -1.016632080078125, -0.911376953125, -0.806121826171875, -0.70086669921875, -0.595611572265625, -0.4903564453125, -0.385101318359375, -0.27984619140625, -0.174591064453125, -0.0693359375, 0.035919189453125, 0.14117431640625, 0.246429443359375, 0.3516845703125, 0.456939697265625, 0.56219482421875, 0.667449951171875, 0.772705078125, 0.877960205078125, 0.98321533203125, 1.088470458984375, 1.1937255859375, 1.298980712890625, 1.40423583984375, 1.509490966796875, 1.61474609375, 1.720001220703125, 1.82525634765625, 1.930511474609375, 2.0357666015625, 2.141021728515625, 2.24627685546875, 2.351531982421875, 2.456787109375, 2.562042236328125, 2.66729736328125, 2.772552490234375, 2.8778076171875, 2.983062744140625, 3.08831787109375, 3.193572998046875, 3.298828125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 6.0, 5.0, 6.0, 12.0, 8.0, 10.0, 26.0, 17.0, 20.0, 34.0, 63.0, 76.0, 90.0, 84.0, 100.0, 98.0, 77.0, 69.0, 60.0, 37.0, 26.0, 20.0, 19.0, 13.0, 9.0, 11.0, 4.0, 5.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.001026153564453125, -0.0010019093751907349, -0.0009776651859283447, -0.0009534209966659546, -0.0009291768074035645, -0.0009049326181411743, -0.0008806884288787842, -0.000856444239616394, -0.0008322000503540039, -0.0008079558610916138, -0.0007837116718292236, -0.0007594674825668335, -0.0007352232933044434, -0.0007109791040420532, -0.0006867349147796631, -0.000662490725517273, -0.0006382465362548828, -0.0006140023469924927, -0.0005897581577301025, -0.0005655139684677124, -0.0005412697792053223, -0.0005170255899429321, -0.000492781400680542, -0.00046853721141815186, -0.0004442930221557617, -0.0004200488328933716, -0.00039580464363098145, -0.0003715604543685913, -0.00034731626510620117, -0.00032307207584381104, -0.0002988278865814209, -0.00027458369731903076, -0.0002503395080566406, -0.0002260953187942505, -0.00020185112953186035, -0.00017760694026947021, -0.00015336275100708008, -0.00012911856174468994, -0.0001048743724822998, -8.063018321990967e-05, -5.638599395751953e-05, -3.2141804695129395e-05, -7.897615432739258e-06, 1.634657382965088e-05, 4.0590763092041016e-05, 6.483495235443115e-05, 8.907914161682129e-05, 0.00011332333087921143, 0.00013756752014160156, 0.0001618117094039917, 0.00018605589866638184, 0.00021030008792877197, 0.0002345442771911621, 0.00025878846645355225, 0.0002830326557159424, 0.0003072768449783325, 0.00033152103424072266, 0.0003557652235031128, 0.00038000941276550293, 0.00040425360202789307, 0.0004284977912902832, 0.00045274198055267334, 0.0004769861698150635, 0.0005012303590774536, 0.0005254745483398438]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 8.0, 6.0, 5.0, 13.0, 27.0, 29.0, 53.0, 69.0, 95.0, 137.0, 226.0, 318.0, 590.0, 996.0, 1955.0, 4520.0, 11186.0, 33241.0, 110289.0, 325986.0, 362921.0, 132800.0, 39456.0, 13310.0, 5149.0, 2314.0, 1157.0, 641.0, 387.0, 203.0, 164.0, 92.0, 51.0, 44.0, 38.0, 25.0, 14.0, 13.0, 3.0, 9.0, 4.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.283203125, -3.1702880859375, -3.057373046875, -2.9444580078125, -2.83154296875, -2.7186279296875, -2.605712890625, -2.4927978515625, -2.3798828125, -2.2669677734375, -2.154052734375, -2.0411376953125, -1.92822265625, -1.8153076171875, -1.702392578125, -1.5894775390625, -1.4765625, -1.3636474609375, -1.250732421875, -1.1378173828125, -1.02490234375, -0.9119873046875, -0.799072265625, -0.6861572265625, -0.5732421875, -0.4603271484375, -0.347412109375, -0.2344970703125, -0.12158203125, -0.0086669921875, 0.104248046875, 0.2171630859375, 0.330078125, 0.4429931640625, 0.555908203125, 0.6688232421875, 0.78173828125, 0.8946533203125, 1.007568359375, 1.1204833984375, 1.2333984375, 1.3463134765625, 1.459228515625, 1.5721435546875, 1.68505859375, 1.7979736328125, 1.910888671875, 2.0238037109375, 2.13671875, 2.2496337890625, 2.362548828125, 2.4754638671875, 2.58837890625, 2.7012939453125, 2.814208984375, 2.9271240234375, 3.0400390625, 3.1529541015625, 3.265869140625, 3.3787841796875, 3.49169921875, 3.6046142578125, 3.717529296875, 3.8304443359375, 3.943359375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 7.0, 4.0, 6.0, 9.0, 12.0, 10.0, 11.0, 14.0, 18.0, 24.0, 26.0, 29.0, 34.0, 45.0, 58.0, 80.0, 82.0, 71.0, 82.0, 59.0, 65.0, 49.0, 45.0, 37.0, 23.0, 15.0, 21.0, 13.0, 17.0, 7.0, 6.0, 8.0, 2.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.103515625, -2.022552490234375, -1.94158935546875, -1.860626220703125, -1.7796630859375, -1.698699951171875, -1.61773681640625, -1.536773681640625, -1.455810546875, -1.374847412109375, -1.29388427734375, -1.212921142578125, -1.1319580078125, -1.050994873046875, -0.97003173828125, -0.889068603515625, -0.80810546875, -0.727142333984375, -0.64617919921875, -0.565216064453125, -0.4842529296875, -0.403289794921875, -0.32232666015625, -0.241363525390625, -0.160400390625, -0.079437255859375, 0.00152587890625, 0.082489013671875, 0.1634521484375, 0.244415283203125, 0.32537841796875, 0.406341552734375, 0.4873046875, 0.568267822265625, 0.64923095703125, 0.730194091796875, 0.8111572265625, 0.892120361328125, 0.97308349609375, 1.054046630859375, 1.135009765625, 1.215972900390625, 1.29693603515625, 1.377899169921875, 1.4588623046875, 1.539825439453125, 1.62078857421875, 1.701751708984375, 1.78271484375, 1.863677978515625, 1.94464111328125, 2.025604248046875, 2.1065673828125, 2.187530517578125, 2.26849365234375, 2.349456787109375, 2.430419921875, 2.511383056640625, 2.59234619140625, 2.673309326171875, 2.7542724609375, 2.835235595703125, 2.91619873046875, 2.997161865234375, 3.078125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 10.0, 24.0, 30.0, 52.0, 86.0, 89.0, 120.0, 120.0, 138.0, 87.0, 74.0, 58.0, 40.0, 26.0, 14.0, 14.0, 5.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.928070068359375, -45.283477783203125, -43.638885498046875, -41.994293212890625, -40.349700927734375, -38.705108642578125, -37.060516357421875, -35.415924072265625, -33.771331787109375, -32.126739501953125, -30.482147216796875, -28.837554931640625, -27.192962646484375, -25.548370361328125, -23.903779983520508, -22.259187698364258, -20.61459732055664, -18.97000503540039, -17.32541275024414, -15.680821418762207, -14.036229133605957, -12.391636848449707, -10.747045516967773, -9.102453231811523, -7.457860946655273, -5.813268661499023, -4.168676853179932, -2.52408504486084, -0.8794927597045898, 0.7650995254516602, 2.4096908569335938, 4.054283142089844, 5.698875427246094, 7.343467712402344, 8.988059997558594, 10.632651329040527, 12.277243614196777, 13.921835899353027, 15.566427230834961, 17.21101951599121, 18.85561180114746, 20.50020408630371, 22.14479637145996, 23.789386749267578, 25.433979034423828, 27.078571319580078, 28.723163604736328, 30.367755889892578, 32.01234817504883, 33.65694046020508, 35.30153274536133, 36.94612503051758, 38.59071731567383, 40.23530960083008, 41.87989807128906, 43.52449035644531, 45.16908264160156, 46.81367492675781, 48.45826721191406, 50.10285949707031, 51.74745178222656, 53.39204406738281, 55.03663635253906, 56.68122863769531, 58.32582092285156]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 5.0, 3.0, 9.0, 3.0, 8.0, 11.0, 9.0, 12.0, 17.0, 11.0, 27.0, 32.0, 30.0, 27.0, 33.0, 47.0, 53.0, 48.0, 47.0, 60.0, 62.0, 38.0, 50.0, 43.0, 42.0, 45.0, 40.0, 33.0, 24.0, 30.0, 17.0, 23.0, 6.0, 11.0, 12.0, 13.0, 8.0, 6.0, 3.0, 1.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.11848449707031, -33.14888381958008, -32.17927932739258, -31.20967674255371, -30.240074157714844, -29.27047348022461, -28.300870895385742, -27.331268310546875, -26.361665725708008, -25.39206314086914, -24.422460556030273, -23.452857971191406, -22.483257293701172, -21.513652801513672, -20.544052124023438, -19.57444953918457, -18.604846954345703, -17.635244369506836, -16.66564178466797, -15.696040153503418, -14.72643756866455, -13.756834983825684, -12.787233352661133, -11.817630767822266, -10.848028182983398, -9.878425598144531, -8.908823013305664, -7.939221382141113, -6.969618797302246, -6.000016212463379, -5.03041410446167, -4.060811996459961, -3.0912113189697266, -2.1216089725494385, -1.1520066261291504, -0.1824042797088623, 0.7871980667114258, 1.756800651550293, 2.726402759552002, 3.696004867553711, 4.665607452392578, 5.635210037231445, 6.604812145233154, 7.574414253234863, 8.54401683807373, 9.513619422912598, 10.483221054077148, 11.452823638916016, 12.422426223754883, 13.39202880859375, 14.361631393432617, 15.331233024597168, 16.30083465576172, 17.27043914794922, 18.240039825439453, 19.20964241027832, 20.179244995117188, 21.148847579956055, 22.118450164794922, 23.08805274963379, 24.057655334472656, 25.02725601196289, 25.996858596801758, 26.966461181640625, 27.936063766479492]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 7.0, 1.0, 2.0, 3.0, 8.0, 7.0, 5.0, 8.0, 15.0, 11.0, 21.0, 23.0, 44.0, 56.0, 53.0, 98.0, 132.0, 216.0, 330.0, 625.0, 1093.0, 2175.0, 4752.0, 11805.0, 36706.0, 157258.0, 1912899.0, 1849842.0, 159311.0, 36617.0, 11614.0, 4555.0, 1893.0, 1033.0, 486.0, 266.0, 150.0, 76.0, 39.0, 22.0, 14.0, 6.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.015625, -11.7152099609375, -11.414794921875, -11.1143798828125, -10.81396484375, -10.5135498046875, -10.213134765625, -9.9127197265625, -9.6123046875, -9.3118896484375, -9.011474609375, -8.7110595703125, -8.41064453125, -8.1102294921875, -7.809814453125, -7.5093994140625, -7.208984375, -6.9085693359375, -6.608154296875, -6.3077392578125, -6.00732421875, -5.7069091796875, -5.406494140625, -5.1060791015625, -4.8056640625, -4.5052490234375, -4.204833984375, -3.9044189453125, -3.60400390625, -3.3035888671875, -3.003173828125, -2.7027587890625, -2.40234375, -2.1019287109375, -1.801513671875, -1.5010986328125, -1.20068359375, -0.9002685546875, -0.599853515625, -0.2994384765625, 0.0009765625, 0.3013916015625, 0.601806640625, 0.9022216796875, 1.20263671875, 1.5030517578125, 1.803466796875, 2.1038818359375, 2.404296875, 2.7047119140625, 3.005126953125, 3.3055419921875, 3.60595703125, 3.9063720703125, 4.206787109375, 4.5072021484375, 4.8076171875, 5.1080322265625, 5.408447265625, 5.7088623046875, 6.00927734375, 6.3096923828125, 6.610107421875, 6.9105224609375, 7.2109375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 1.0, 4.0, 15.0, 11.0, 13.0, 28.0, 37.0, 36.0, 53.0, 47.0, 55.0, 80.0, 66.0, 64.0, 75.0, 70.0, 61.0, 43.0, 54.0, 47.0, 36.0, 23.0, 27.0, 15.0, 19.0, 12.0, 6.0, 0.0, 2.0, 0.0, 3.0, 3.0], "bins": [-2.017578125, -1.9733963012695312, -1.9292144775390625, -1.8850326538085938, -1.840850830078125, -1.7966690063476562, -1.7524871826171875, -1.7083053588867188, -1.66412353515625, -1.6199417114257812, -1.5757598876953125, -1.5315780639648438, -1.487396240234375, -1.4432144165039062, -1.3990325927734375, -1.3548507690429688, -1.3106689453125, -1.2664871215820312, -1.2223052978515625, -1.1781234741210938, -1.133941650390625, -1.0897598266601562, -1.0455780029296875, -1.0013961791992188, -0.95721435546875, -0.9130325317382812, -0.8688507080078125, -0.8246688842773438, -0.780487060546875, -0.7363052368164062, -0.6921234130859375, -0.6479415893554688, -0.603759765625, -0.5595779418945312, -0.5153961181640625, -0.47121429443359375, -0.427032470703125, -0.38285064697265625, -0.3386688232421875, -0.29448699951171875, -0.25030517578125, -0.20612335205078125, -0.1619415283203125, -0.11775970458984375, -0.073577880859375, -0.02939605712890625, 0.0147857666015625, 0.05896759033203125, 0.1031494140625, 0.14733123779296875, 0.1915130615234375, 0.23569488525390625, 0.279876708984375, 0.32405853271484375, 0.3682403564453125, 0.41242218017578125, 0.45660400390625, 0.5007858276367188, 0.5449676513671875, 0.5891494750976562, 0.633331298828125, 0.6775131225585938, 0.7216949462890625, 0.7658767700195312, 0.81005859375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 8.0, 9.0, 7.0, 12.0, 15.0, 12.0, 27.0, 39.0, 37.0, 73.0, 78.0, 97.0, 175.0, 269.0, 500.0, 886.0, 1960.0, 4910.0, 16899.0, 114749.0, 2803249.0, 1163870.0, 67273.0, 11851.0, 3801.0, 1560.0, 712.0, 383.0, 239.0, 164.0, 101.0, 77.0, 59.0, 45.0, 27.0, 28.0, 35.0, 14.0, 6.0, 6.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-17.328125, -16.8582763671875, -16.388427734375, -15.9185791015625, -15.44873046875, -14.9788818359375, -14.509033203125, -14.0391845703125, -13.5693359375, -13.0994873046875, -12.629638671875, -12.1597900390625, -11.68994140625, -11.2200927734375, -10.750244140625, -10.2803955078125, -9.810546875, -9.3406982421875, -8.870849609375, -8.4010009765625, -7.93115234375, -7.4613037109375, -6.991455078125, -6.5216064453125, -6.0517578125, -5.5819091796875, -5.112060546875, -4.6422119140625, -4.17236328125, -3.7025146484375, -3.232666015625, -2.7628173828125, -2.29296875, -1.8231201171875, -1.353271484375, -0.8834228515625, -0.41357421875, 0.0562744140625, 0.526123046875, 0.9959716796875, 1.4658203125, 1.9356689453125, 2.405517578125, 2.8753662109375, 3.34521484375, 3.8150634765625, 4.284912109375, 4.7547607421875, 5.224609375, 5.6944580078125, 6.164306640625, 6.6341552734375, 7.10400390625, 7.5738525390625, 8.043701171875, 8.5135498046875, 8.9833984375, 9.4532470703125, 9.923095703125, 10.3929443359375, 10.86279296875, 11.3326416015625, 11.802490234375, 12.2723388671875, 12.7421875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 9.0, 22.0, 24.0, 57.0, 100.0, 173.0, 426.0, 969.0, 1194.0, 508.0, 275.0, 134.0, 87.0, 39.0, 15.0, 13.0, 9.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.125, -4.94317626953125, -4.7613525390625, -4.57952880859375, -4.397705078125, -4.21588134765625, -4.0340576171875, -3.85223388671875, -3.67041015625, -3.48858642578125, -3.3067626953125, -3.12493896484375, -2.943115234375, -2.76129150390625, -2.5794677734375, -2.39764404296875, -2.2158203125, -2.03399658203125, -1.8521728515625, -1.67034912109375, -1.488525390625, -1.30670166015625, -1.1248779296875, -0.94305419921875, -0.76123046875, -0.57940673828125, -0.3975830078125, -0.21575927734375, -0.033935546875, 0.14788818359375, 0.3297119140625, 0.51153564453125, 0.693359375, 0.87518310546875, 1.0570068359375, 1.23883056640625, 1.420654296875, 1.60247802734375, 1.7843017578125, 1.96612548828125, 2.14794921875, 2.32977294921875, 2.5115966796875, 2.69342041015625, 2.875244140625, 3.05706787109375, 3.2388916015625, 3.42071533203125, 3.6025390625, 3.78436279296875, 3.9661865234375, 4.14801025390625, 4.329833984375, 4.51165771484375, 4.6934814453125, 4.87530517578125, 5.05712890625, 5.23895263671875, 5.4207763671875, 5.60260009765625, 5.784423828125, 5.96624755859375, 6.1480712890625, 6.32989501953125, 6.51171875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 7.0, 5.0, 5.0, 17.0, 21.0, 40.0, 73.0, 118.0, 136.0, 158.0, 157.0, 108.0, 73.0, 37.0, 22.0, 10.0, 5.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.394588470458984, -34.097415924072266, -32.80023956298828, -31.50306510925293, -30.205890655517578, -28.90871810913086, -27.611543655395508, -26.314369201660156, -25.017194747924805, -23.720020294189453, -22.4228458404541, -21.12567138671875, -19.82849884033203, -18.531322479248047, -17.234149932861328, -15.936975479125977, -14.639801025390625, -13.342626571655273, -12.045452117919922, -10.748278617858887, -9.451104164123535, -8.153929710388184, -6.85675573348999, -5.559581756591797, -4.262407302856445, -2.965233087539673, -1.6680588722229004, -0.37088465690612793, 0.9262895584106445, 2.223464012145996, 3.5206379890441895, 4.817811965942383, 6.114990234375, 7.412164688110352, 8.709339141845703, 10.006512641906738, 11.30368709564209, 12.600861549377441, 13.898035049438477, 15.195209503173828, 16.49238395690918, 17.78955841064453, 19.086732864379883, 20.383907318115234, 21.681079864501953, 22.978256225585938, 24.275428771972656, 25.572603225708008, 26.86977767944336, 28.16695213317871, 29.464126586914062, 30.761301040649414, 32.058475494384766, 33.355648040771484, 34.65282440185547, 35.94999694824219, 37.247169494628906, 38.544342041015625, 39.84151840209961, 41.13869094848633, 42.43586730957031, 43.73303985595703, 45.030216217041016, 46.327388763427734, 47.62456512451172]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 3.0, 7.0, 7.0, 1.0, 4.0, 10.0, 20.0, 16.0, 16.0, 18.0, 21.0, 27.0, 26.0, 30.0, 37.0, 50.0, 36.0, 45.0, 33.0, 38.0, 51.0, 47.0, 36.0, 42.0, 52.0, 43.0, 39.0, 38.0, 32.0, 29.0, 27.0, 23.0, 25.0, 13.0, 15.0, 9.0, 7.0, 8.0, 8.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-15.188618659973145, -14.744828224182129, -14.301036834716797, -13.857246398925781, -13.41345500946045, -12.969664573669434, -12.525873184204102, -12.082082748413086, -11.63829231262207, -11.194501876831055, -10.750710487365723, -10.306920051574707, -9.863128662109375, -9.41933822631836, -8.975547790527344, -8.531756401062012, -8.08796501159668, -7.644174098968506, -7.200383186340332, -6.756592750549316, -6.312801361083984, -5.869010925292969, -5.425220012664795, -4.981429100036621, -4.537638187408447, -4.093847274780273, -3.6500563621520996, -3.206265687942505, -2.762474775314331, -2.3186838626861572, -1.8748931884765625, -1.4311022758483887, -0.9873104095458984, -0.5435195565223694, -0.09972870349884033, 0.34406208992004395, 0.7878530025482178, 1.2316439151763916, 1.6754345893859863, 2.11922550201416, 2.563016414642334, 3.006807327270508, 3.4505982398986816, 3.8943889141082764, 4.338179588317871, 4.781970977783203, 5.225761413574219, 5.669552326202393, 6.113343238830566, 6.55713415145874, 7.000925064086914, 7.44471549987793, 7.888506889343262, 8.332297325134277, 8.77608871459961, 9.219879150390625, 9.66366958618164, 10.107460021972656, 10.551251411437988, 10.995041847229004, 11.438833236694336, 11.882623672485352, 12.326414108276367, 12.7702054977417, 13.213996887207031]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 9.0, 11.0, 16.0, 20.0, 28.0, 43.0, 47.0, 91.0, 114.0, 186.0, 272.0, 447.0, 809.0, 1676.0, 3752.0, 9798.0, 31871.0, 109459.0, 354452.0, 368228.0, 115835.0, 33652.0, 10135.0, 3666.0, 1690.0, 903.0, 503.0, 292.0, 152.0, 105.0, 91.0, 71.0, 38.0, 22.0, 15.0, 11.0, 13.0, 8.0, 5.0, 1.0, 6.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-10.109375, -9.80322265625, -9.4970703125, -9.19091796875, -8.884765625, -8.57861328125, -8.2724609375, -7.96630859375, -7.66015625, -7.35400390625, -7.0478515625, -6.74169921875, -6.435546875, -6.12939453125, -5.8232421875, -5.51708984375, -5.2109375, -4.90478515625, -4.5986328125, -4.29248046875, -3.986328125, -3.68017578125, -3.3740234375, -3.06787109375, -2.76171875, -2.45556640625, -2.1494140625, -1.84326171875, -1.537109375, -1.23095703125, -0.9248046875, -0.61865234375, -0.3125, -0.00634765625, 0.2998046875, 0.60595703125, 0.912109375, 1.21826171875, 1.5244140625, 1.83056640625, 2.13671875, 2.44287109375, 2.7490234375, 3.05517578125, 3.361328125, 3.66748046875, 3.9736328125, 4.27978515625, 4.5859375, 4.89208984375, 5.1982421875, 5.50439453125, 5.810546875, 6.11669921875, 6.4228515625, 6.72900390625, 7.03515625, 7.34130859375, 7.6474609375, 7.95361328125, 8.259765625, 8.56591796875, 8.8720703125, 9.17822265625, 9.484375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 1.0, 3.0, 4.0, 6.0, 10.0, 10.0, 13.0, 5.0, 21.0, 21.0, 29.0, 25.0, 34.0, 59.0, 49.0, 54.0, 57.0, 61.0, 52.0, 62.0, 47.0, 47.0, 58.0, 37.0, 37.0, 45.0, 22.0, 31.0, 26.0, 15.0, 11.0, 10.0, 12.0, 8.0, 4.0, 5.0, 6.0, 4.0, 1.0, 1.0], "bins": [-1.587890625, -1.5505447387695312, -1.5131988525390625, -1.4758529663085938, -1.438507080078125, -1.4011611938476562, -1.3638153076171875, -1.3264694213867188, -1.28912353515625, -1.2517776489257812, -1.2144317626953125, -1.1770858764648438, -1.139739990234375, -1.1023941040039062, -1.0650482177734375, -1.0277023315429688, -0.9903564453125, -0.9530105590820312, -0.9156646728515625, -0.8783187866210938, -0.840972900390625, -0.8036270141601562, -0.7662811279296875, -0.7289352416992188, -0.69158935546875, -0.6542434692382812, -0.6168975830078125, -0.5795516967773438, -0.542205810546875, -0.5048599243164062, -0.4675140380859375, -0.43016815185546875, -0.392822265625, -0.35547637939453125, -0.3181304931640625, -0.28078460693359375, -0.243438720703125, -0.20609283447265625, -0.1687469482421875, -0.13140106201171875, -0.09405517578125, -0.05670928955078125, -0.0193634033203125, 0.01798248291015625, 0.055328369140625, 0.09267425537109375, 0.1300201416015625, 0.16736602783203125, 0.2047119140625, 0.24205780029296875, 0.2794036865234375, 0.31674957275390625, 0.354095458984375, 0.39144134521484375, 0.4287872314453125, 0.46613311767578125, 0.50347900390625, 0.5408248901367188, 0.5781707763671875, 0.6155166625976562, 0.652862548828125, 0.6902084350585938, 0.7275543212890625, 0.7649002075195312, 0.80224609375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 5.0, 2.0, 6.0, 11.0, 19.0, 19.0, 31.0, 35.0, 52.0, 66.0, 119.0, 157.0, 209.0, 338.0, 502.0, 911.0, 1515.0, 3054.0, 6275.0, 14009.0, 32090.0, 71915.0, 155347.0, 274732.0, 248876.0, 130362.0, 58938.0, 26068.0, 11598.0, 5352.0, 2523.0, 1290.0, 726.0, 398.0, 263.0, 203.0, 154.0, 97.0, 92.0, 47.0, 39.0, 27.0, 22.0, 18.0, 10.0, 15.0, 6.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0], "bins": [-4.76171875, -4.61688232421875, -4.4720458984375, -4.32720947265625, -4.182373046875, -4.03753662109375, -3.8927001953125, -3.74786376953125, -3.60302734375, -3.45819091796875, -3.3133544921875, -3.16851806640625, -3.023681640625, -2.87884521484375, -2.7340087890625, -2.58917236328125, -2.4443359375, -2.29949951171875, -2.1546630859375, -2.00982666015625, -1.864990234375, -1.72015380859375, -1.5753173828125, -1.43048095703125, -1.28564453125, -1.14080810546875, -0.9959716796875, -0.85113525390625, -0.706298828125, -0.56146240234375, -0.4166259765625, -0.27178955078125, -0.126953125, 0.01788330078125, 0.1627197265625, 0.30755615234375, 0.452392578125, 0.59722900390625, 0.7420654296875, 0.88690185546875, 1.03173828125, 1.17657470703125, 1.3214111328125, 1.46624755859375, 1.611083984375, 1.75592041015625, 1.9007568359375, 2.04559326171875, 2.1904296875, 2.33526611328125, 2.4801025390625, 2.62493896484375, 2.769775390625, 2.91461181640625, 3.0594482421875, 3.20428466796875, 3.34912109375, 3.49395751953125, 3.6387939453125, 3.78363037109375, 3.928466796875, 4.07330322265625, 4.2181396484375, 4.36297607421875, 4.5078125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 7.0, 5.0, 11.0, 6.0, 8.0, 9.0, 13.0, 14.0, 14.0, 19.0, 28.0, 23.0, 21.0, 37.0, 29.0, 36.0, 40.0, 37.0, 32.0, 32.0, 42.0, 36.0, 41.0, 42.0, 39.0, 37.0, 33.0, 32.0, 35.0, 29.0, 29.0, 25.0, 20.0, 19.0, 13.0, 18.0, 10.0, 16.0, 11.0, 9.0, 6.0, 5.0, 4.0, 8.0, 4.0, 5.0, 1.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.703125, -3.5791015625, -3.455078125, -3.3310546875, -3.20703125, -3.0830078125, -2.958984375, -2.8349609375, -2.7109375, -2.5869140625, -2.462890625, -2.3388671875, -2.21484375, -2.0908203125, -1.966796875, -1.8427734375, -1.71875, -1.5947265625, -1.470703125, -1.3466796875, -1.22265625, -1.0986328125, -0.974609375, -0.8505859375, -0.7265625, -0.6025390625, -0.478515625, -0.3544921875, -0.23046875, -0.1064453125, 0.017578125, 0.1416015625, 0.265625, 0.3896484375, 0.513671875, 0.6376953125, 0.76171875, 0.8857421875, 1.009765625, 1.1337890625, 1.2578125, 1.3818359375, 1.505859375, 1.6298828125, 1.75390625, 1.8779296875, 2.001953125, 2.1259765625, 2.25, 2.3740234375, 2.498046875, 2.6220703125, 2.74609375, 2.8701171875, 2.994140625, 3.1181640625, 3.2421875, 3.3662109375, 3.490234375, 3.6142578125, 3.73828125, 3.8623046875, 3.986328125, 4.1103515625, 4.234375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 10.0, 17.0, 25.0, 23.0, 56.0, 99.0, 193.0, 395.0, 937.0, 2531.0, 8335.0, 37902.0, 208307.0, 539186.0, 201631.0, 36488.0, 8225.0, 2465.0, 918.0, 379.0, 180.0, 111.0, 48.0, 28.0, 19.0, 14.0, 8.0, 7.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.74609375, -6.56121826171875, -6.3763427734375, -6.19146728515625, -6.006591796875, -5.82171630859375, -5.6368408203125, -5.45196533203125, -5.26708984375, -5.08221435546875, -4.8973388671875, -4.71246337890625, -4.527587890625, -4.34271240234375, -4.1578369140625, -3.97296142578125, -3.7880859375, -3.60321044921875, -3.4183349609375, -3.23345947265625, -3.048583984375, -2.86370849609375, -2.6788330078125, -2.49395751953125, -2.30908203125, -2.12420654296875, -1.9393310546875, -1.75445556640625, -1.569580078125, -1.38470458984375, -1.1998291015625, -1.01495361328125, -0.830078125, -0.64520263671875, -0.4603271484375, -0.27545166015625, -0.090576171875, 0.09429931640625, 0.2791748046875, 0.46405029296875, 0.64892578125, 0.83380126953125, 1.0186767578125, 1.20355224609375, 1.388427734375, 1.57330322265625, 1.7581787109375, 1.94305419921875, 2.1279296875, 2.31280517578125, 2.4976806640625, 2.68255615234375, 2.867431640625, 3.05230712890625, 3.2371826171875, 3.42205810546875, 3.60693359375, 3.79180908203125, 3.9766845703125, 4.16156005859375, 4.346435546875, 4.53131103515625, 4.7161865234375, 4.90106201171875, 5.0859375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 5.0, 7.0, 3.0, 4.0, 9.0, 16.0, 19.0, 20.0, 23.0, 25.0, 32.0, 47.0, 38.0, 67.0, 73.0, 66.0, 84.0, 78.0, 78.0, 55.0, 49.0, 35.0, 24.0, 28.0, 22.0, 14.0, 16.0, 11.0, 9.0, 7.0, 9.0, 8.0, 4.0, 0.0, 3.0, 3.0, 5.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004982948303222656, -0.00048135966062545776, -0.0004644244909286499, -0.00044748932123184204, -0.0004305541515350342, -0.0004136189818382263, -0.00039668381214141846, -0.0003797486424446106, -0.00036281347274780273, -0.0003458783030509949, -0.000328943133354187, -0.00031200796365737915, -0.0002950727939605713, -0.00027813762426376343, -0.00026120245456695557, -0.0002442672848701477, -0.00022733211517333984, -0.00021039694547653198, -0.00019346177577972412, -0.00017652660608291626, -0.0001595914363861084, -0.00014265626668930054, -0.00012572109699249268, -0.00010878592729568481, -9.185075759887695e-05, -7.491558790206909e-05, -5.798041820526123e-05, -4.104524850845337e-05, -2.4110078811645508e-05, -7.1749091148376465e-06, 9.760260581970215e-06, 2.6695430278778076e-05, 4.363059997558594e-05, 6.05657696723938e-05, 7.750093936920166e-05, 9.443610906600952e-05, 0.00011137127876281738, 0.00012830644845962524, 0.0001452416181564331, 0.00016217678785324097, 0.00017911195755004883, 0.0001960471272468567, 0.00021298229694366455, 0.0002299174666404724, 0.0002468526363372803, 0.00026378780603408813, 0.000280722975730896, 0.00029765814542770386, 0.0003145933151245117, 0.0003315284848213196, 0.00034846365451812744, 0.0003653988242149353, 0.00038233399391174316, 0.000399269163608551, 0.0004162043333053589, 0.00043313950300216675, 0.0004500746726989746, 0.00046700984239578247, 0.00048394501209259033, 0.0005008801817893982, 0.0005178153514862061, 0.0005347505211830139, 0.0005516856908798218, 0.0005686208605766296, 0.0005855560302734375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 7.0, 5.0, 14.0, 17.0, 18.0, 37.0, 51.0, 124.0, 170.0, 356.0, 747.0, 1820.0, 5400.0, 22991.0, 141977.0, 570135.0, 252802.0, 39234.0, 8336.0, 2445.0, 959.0, 381.0, 242.0, 109.0, 63.0, 40.0, 24.0, 18.0, 12.0, 9.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.109375, -5.91009521484375, -5.7108154296875, -5.51153564453125, -5.312255859375, -5.11297607421875, -4.9136962890625, -4.71441650390625, -4.51513671875, -4.31585693359375, -4.1165771484375, -3.91729736328125, -3.718017578125, -3.51873779296875, -3.3194580078125, -3.12017822265625, -2.9208984375, -2.72161865234375, -2.5223388671875, -2.32305908203125, -2.123779296875, -1.92449951171875, -1.7252197265625, -1.52593994140625, -1.32666015625, -1.12738037109375, -0.9281005859375, -0.72882080078125, -0.529541015625, -0.33026123046875, -0.1309814453125, 0.06829833984375, 0.267578125, 0.46685791015625, 0.6661376953125, 0.86541748046875, 1.064697265625, 1.26397705078125, 1.4632568359375, 1.66253662109375, 1.86181640625, 2.06109619140625, 2.2603759765625, 2.45965576171875, 2.658935546875, 2.85821533203125, 3.0574951171875, 3.25677490234375, 3.4560546875, 3.65533447265625, 3.8546142578125, 4.05389404296875, 4.253173828125, 4.45245361328125, 4.6517333984375, 4.85101318359375, 5.05029296875, 5.24957275390625, 5.4488525390625, 5.64813232421875, 5.847412109375, 6.04669189453125, 6.2459716796875, 6.44525146484375, 6.64453125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 11.0, 9.0, 7.0, 10.0, 11.0, 23.0, 25.0, 23.0, 32.0, 38.0, 52.0, 44.0, 41.0, 63.0, 60.0, 53.0, 62.0, 70.0, 45.0, 50.0, 47.0, 45.0, 28.0, 34.0, 20.0, 21.0, 14.0, 13.0, 12.0, 13.0, 7.0, 3.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.3046875, -2.23004150390625, -2.1553955078125, -2.08074951171875, -2.006103515625, -1.93145751953125, -1.8568115234375, -1.78216552734375, -1.70751953125, -1.63287353515625, -1.5582275390625, -1.48358154296875, -1.408935546875, -1.33428955078125, -1.2596435546875, -1.18499755859375, -1.1103515625, -1.03570556640625, -0.9610595703125, -0.88641357421875, -0.811767578125, -0.73712158203125, -0.6624755859375, -0.58782958984375, -0.51318359375, -0.43853759765625, -0.3638916015625, -0.28924560546875, -0.214599609375, -0.13995361328125, -0.0653076171875, 0.00933837890625, 0.083984375, 0.15863037109375, 0.2332763671875, 0.30792236328125, 0.382568359375, 0.45721435546875, 0.5318603515625, 0.60650634765625, 0.68115234375, 0.75579833984375, 0.8304443359375, 0.90509033203125, 0.979736328125, 1.05438232421875, 1.1290283203125, 1.20367431640625, 1.2783203125, 1.35296630859375, 1.4276123046875, 1.50225830078125, 1.576904296875, 1.65155029296875, 1.7261962890625, 1.80084228515625, 1.87548828125, 1.95013427734375, 2.0247802734375, 2.09942626953125, 2.174072265625, 2.24871826171875, 2.3233642578125, 2.39801025390625, 2.47265625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 10.0, 15.0, 21.0, 29.0, 32.0, 61.0, 74.0, 71.0, 103.0, 92.0, 93.0, 90.0, 89.0, 46.0, 52.0, 38.0, 24.0, 21.0, 12.0, 6.0, 3.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.173664093017578, -26.980215072631836, -25.78676414489746, -24.59331512451172, -23.399864196777344, -22.2064151763916, -21.01296615600586, -19.819515228271484, -18.626066207885742, -17.4326171875, -16.239166259765625, -15.045717239379883, -13.852267265319824, -12.658817291259766, -11.465368270874023, -10.271918296813965, -9.078468322753906, -7.885018348693848, -6.691568851470947, -5.498119354248047, -4.304669380187988, -3.1112194061279297, -1.9177699089050293, -0.7243204116821289, 0.4691295623779297, 1.6625792980194092, 2.8560290336608887, 4.049478530883789, 5.242928504943848, 6.436378479003906, 7.629827976226807, 8.823277473449707, 10.016731262207031, 11.21018123626709, 12.403631210327148, 13.59708023071289, 14.79053020477295, 15.983980178833008, 17.17742919921875, 18.370880126953125, 19.564329147338867, 20.75777816772461, 21.951229095458984, 23.144678115844727, 24.33812713623047, 25.531578063964844, 26.725027084350586, 27.918476104736328, 29.111927032470703, 30.305376052856445, 31.49882698059082, 32.69227600097656, 33.88572692871094, 35.07917785644531, 36.27262496948242, 37.4660758972168, 38.659523010253906, 39.85297393798828, 41.04642105102539, 42.239871978759766, 43.43332290649414, 44.62677001953125, 45.820220947265625, 47.013671875, 48.207122802734375]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 6.0, 3.0, 9.0, 10.0, 7.0, 11.0, 13.0, 9.0, 23.0, 27.0, 25.0, 35.0, 33.0, 40.0, 42.0, 53.0, 58.0, 46.0, 43.0, 61.0, 52.0, 69.0, 43.0, 42.0, 34.0, 39.0, 39.0, 31.0, 18.0, 19.0, 14.0, 13.0, 6.0, 10.0, 6.0, 6.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.967247009277344, -31.94890022277832, -30.930551528930664, -29.91220474243164, -28.893856048583984, -27.87550926208496, -26.857162475585938, -25.83881378173828, -24.820466995239258, -23.802120208740234, -22.783771514892578, -21.765424728393555, -20.74707794189453, -19.728729248046875, -18.71038246154785, -17.692035675048828, -16.673686981201172, -15.655339241027832, -14.636991500854492, -13.618644714355469, -12.600296974182129, -11.581949234008789, -10.563602447509766, -9.545254707336426, -8.526906967163086, -7.508559226989746, -6.4902119636535645, -5.471864700317383, -4.453516960144043, -3.435169219970703, -2.4168219566345215, -1.3984746932983398, -0.380126953125, 0.6382205486297607, 1.6565680503845215, 2.6749155521392822, 3.693263053894043, 4.711610794067383, 5.7299580574035645, 6.748305320739746, 7.766653060913086, 8.785000801086426, 9.803348541259766, 10.821695327758789, 11.840043067932129, 12.858390808105469, 13.876737594604492, 14.895085334777832, 15.913433074951172, 16.931779861450195, 17.95012855529785, 18.968475341796875, 19.98682403564453, 21.005170822143555, 22.023517608642578, 23.041866302490234, 24.060213088989258, 25.07855987548828, 26.096908569335938, 27.11525535583496, 28.133602142333984, 29.15195083618164, 30.170297622680664, 31.188644409179688, 32.206993103027344]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 0.0, 4.0, 3.0, 9.0, 10.0, 16.0, 20.0, 27.0, 34.0, 46.0, 61.0, 77.0, 135.0, 187.0, 327.0, 503.0, 888.0, 1609.0, 3380.0, 7884.0, 22869.0, 91387.0, 1272652.0, 2633730.0, 115277.0, 26730.0, 8900.0, 3677.0, 1721.0, 880.0, 518.0, 293.0, 158.0, 87.0, 60.0, 48.0, 13.0, 14.0, 10.0, 13.0, 8.0, 10.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.9296875, -9.6099853515625, -9.290283203125, -8.9705810546875, -8.65087890625, -8.3311767578125, -8.011474609375, -7.6917724609375, -7.3720703125, -7.0523681640625, -6.732666015625, -6.4129638671875, -6.09326171875, -5.7735595703125, -5.453857421875, -5.1341552734375, -4.814453125, -4.4947509765625, -4.175048828125, -3.8553466796875, -3.53564453125, -3.2159423828125, -2.896240234375, -2.5765380859375, -2.2568359375, -1.9371337890625, -1.617431640625, -1.2977294921875, -0.97802734375, -0.6583251953125, -0.338623046875, -0.0189208984375, 0.30078125, 0.6204833984375, 0.940185546875, 1.2598876953125, 1.57958984375, 1.8992919921875, 2.218994140625, 2.5386962890625, 2.8583984375, 3.1781005859375, 3.497802734375, 3.8175048828125, 4.13720703125, 4.4569091796875, 4.776611328125, 5.0963134765625, 5.416015625, 5.7357177734375, 6.055419921875, 6.3751220703125, 6.69482421875, 7.0145263671875, 7.334228515625, 7.6539306640625, 7.9736328125, 8.2933349609375, 8.613037109375, 8.9327392578125, 9.25244140625, 9.5721435546875, 9.891845703125, 10.2115478515625, 10.53125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 1.0, 7.0, 0.0, 3.0, 8.0, 13.0, 11.0, 28.0, 25.0, 33.0, 47.0, 57.0, 61.0, 86.0, 87.0, 83.0, 80.0, 82.0, 64.0, 47.0, 45.0, 51.0, 27.0, 26.0, 13.0, 13.0, 7.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5556640625, -1.4988555908203125, -1.442047119140625, -1.3852386474609375, -1.32843017578125, -1.2716217041015625, -1.214813232421875, -1.1580047607421875, -1.1011962890625, -1.0443878173828125, -0.987579345703125, -0.9307708740234375, -0.87396240234375, -0.8171539306640625, -0.760345458984375, -0.7035369873046875, -0.646728515625, -0.5899200439453125, -0.533111572265625, -0.4763031005859375, -0.41949462890625, -0.3626861572265625, -0.305877685546875, -0.2490692138671875, -0.1922607421875, -0.1354522705078125, -0.078643798828125, -0.0218353271484375, 0.03497314453125, 0.0917816162109375, 0.148590087890625, 0.2053985595703125, 0.26220703125, 0.3190155029296875, 0.375823974609375, 0.4326324462890625, 0.48944091796875, 0.5462493896484375, 0.603057861328125, 0.6598663330078125, 0.7166748046875, 0.7734832763671875, 0.830291748046875, 0.8871002197265625, 0.94390869140625, 1.0007171630859375, 1.057525634765625, 1.1143341064453125, 1.171142578125, 1.2279510498046875, 1.284759521484375, 1.3415679931640625, 1.39837646484375, 1.4551849365234375, 1.511993408203125, 1.5688018798828125, 1.6256103515625, 1.6824188232421875, 1.739227294921875, 1.7960357666015625, 1.85284423828125, 1.9096527099609375, 1.966461181640625, 2.0232696533203125, 2.080078125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 2.0, 6.0, 3.0, 5.0, 11.0, 15.0, 21.0, 30.0, 31.0, 40.0, 43.0, 78.0, 103.0, 144.0, 215.0, 475.0, 1100.0, 3310.0, 13272.0, 80211.0, 1422881.0, 2543226.0, 105781.0, 16684.0, 3953.0, 1253.0, 581.0, 265.0, 154.0, 96.0, 68.0, 48.0, 43.0, 24.0, 23.0, 19.0, 18.0, 15.0, 5.0, 7.0, 2.0, 8.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-13.7421875, -13.3502197265625, -12.958251953125, -12.5662841796875, -12.17431640625, -11.7823486328125, -11.390380859375, -10.9984130859375, -10.6064453125, -10.2144775390625, -9.822509765625, -9.4305419921875, -9.03857421875, -8.6466064453125, -8.254638671875, -7.8626708984375, -7.470703125, -7.0787353515625, -6.686767578125, -6.2947998046875, -5.90283203125, -5.5108642578125, -5.118896484375, -4.7269287109375, -4.3349609375, -3.9429931640625, -3.551025390625, -3.1590576171875, -2.76708984375, -2.3751220703125, -1.983154296875, -1.5911865234375, -1.19921875, -0.8072509765625, -0.415283203125, -0.0233154296875, 0.36865234375, 0.7606201171875, 1.152587890625, 1.5445556640625, 1.9365234375, 2.3284912109375, 2.720458984375, 3.1124267578125, 3.50439453125, 3.8963623046875, 4.288330078125, 4.6802978515625, 5.072265625, 5.4642333984375, 5.856201171875, 6.2481689453125, 6.64013671875, 7.0321044921875, 7.424072265625, 7.8160400390625, 8.2080078125, 8.5999755859375, 8.991943359375, 9.3839111328125, 9.77587890625, 10.1678466796875, 10.559814453125, 10.9517822265625, 11.34375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 8.0, 16.0, 14.0, 39.0, 69.0, 103.0, 247.0, 622.0, 1496.0, 762.0, 306.0, 173.0, 83.0, 53.0, 32.0, 16.0, 9.0, 12.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.44921875, -3.30316162109375, -3.1571044921875, -3.01104736328125, -2.864990234375, -2.71893310546875, -2.5728759765625, -2.42681884765625, -2.28076171875, -2.13470458984375, -1.9886474609375, -1.84259033203125, -1.696533203125, -1.55047607421875, -1.4044189453125, -1.25836181640625, -1.1123046875, -0.96624755859375, -0.8201904296875, -0.67413330078125, -0.528076171875, -0.38201904296875, -0.2359619140625, -0.08990478515625, 0.05615234375, 0.20220947265625, 0.3482666015625, 0.49432373046875, 0.640380859375, 0.78643798828125, 0.9324951171875, 1.07855224609375, 1.224609375, 1.37066650390625, 1.5167236328125, 1.66278076171875, 1.808837890625, 1.95489501953125, 2.1009521484375, 2.24700927734375, 2.39306640625, 2.53912353515625, 2.6851806640625, 2.83123779296875, 2.977294921875, 3.12335205078125, 3.2694091796875, 3.41546630859375, 3.5615234375, 3.70758056640625, 3.8536376953125, 3.99969482421875, 4.145751953125, 4.29180908203125, 4.4378662109375, 4.58392333984375, 4.72998046875, 4.87603759765625, 5.0220947265625, 5.16815185546875, 5.314208984375, 5.46026611328125, 5.6063232421875, 5.75238037109375, 5.8984375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 13.0, 13.0, 26.0, 45.0, 67.0, 108.0, 88.0, 132.0, 123.0, 87.0, 92.0, 66.0, 46.0, 30.0, 18.0, 15.0, 12.0, 8.0, 4.0, 2.0, 2.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.99906063079834, -12.26679801940918, -11.534534454345703, -10.802271842956543, -10.070009231567383, -9.337745666503906, -8.605483055114746, -7.873220443725586, -7.140957355499268, -6.408694267272949, -5.676431655883789, -4.944168567657471, -4.211905479431152, -3.479642868041992, -2.747379779815674, -2.0151171684265137, -1.2828540802001953, -0.5505911707878113, 0.18167173862457275, 0.9139347076416016, 1.6461975574493408, 2.37846040725708, 3.1107234954833984, 3.8429861068725586, 4.575249195098877, 5.307512283325195, 6.0397748947143555, 6.772037982940674, 7.504301071166992, 8.236563682556152, 8.968826293945312, 9.701089859008789, 10.433351516723633, 11.165614128112793, 11.89787769317627, 12.63014030456543, 13.36240291595459, 14.09466552734375, 14.826929092407227, 15.559191703796387, 16.291454315185547, 17.023717880249023, 17.755979537963867, 18.488243103027344, 19.22050666809082, 19.952768325805664, 20.68503189086914, 21.417293548583984, 22.149559020996094, 22.88182258605957, 23.614084243774414, 24.34634780883789, 25.078611373901367, 25.81087303161621, 26.543136596679688, 27.27539825439453, 28.007661819458008, 28.739925384521484, 29.472187042236328, 30.204450607299805, 30.93671417236328, 31.668975830078125, 32.40123748779297, 33.13350296020508, 33.86576461791992]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 3.0, 6.0, 7.0, 15.0, 13.0, 27.0, 28.0, 25.0, 28.0, 47.0, 45.0, 54.0, 43.0, 51.0, 44.0, 63.0, 59.0, 56.0, 73.0, 53.0, 36.0, 40.0, 34.0, 37.0, 24.0, 26.0, 18.0, 11.0, 10.0, 8.0, 9.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-17.916501998901367, -17.45857810974121, -17.000656127929688, -16.54273223876953, -16.084810256958008, -15.626886367797852, -15.168963432312012, -14.711040496826172, -14.253117561340332, -13.795194625854492, -13.337271690368652, -12.879348754882812, -12.421424865722656, -11.963501930236816, -11.505578994750977, -11.047656059265137, -10.589733123779297, -10.131810188293457, -9.673887252807617, -9.215963363647461, -8.758040428161621, -8.300117492675781, -7.842194557189941, -7.384271621704102, -6.926347732543945, -6.4684247970581055, -6.010501384735107, -5.552578449249268, -5.094655513763428, -4.63673210144043, -4.17880916595459, -3.72088623046875, -3.26296329498291, -2.805040121078491, -2.3471171855926514, -1.8891940116882324, -1.431270956993103, -0.9733479022979736, -0.5154247283935547, -0.057501792907714844, 0.4004213809967041, 0.8583444356918335, 1.316267490386963, 1.7741906642913818, 2.232113838195801, 2.6900367736816406, 3.1479599475860596, 3.6058828830718994, 4.063806056976318, 4.521728992462158, 4.979652404785156, 5.437575340270996, 5.895498275756836, 6.353421211242676, 6.811344623565674, 7.269267559051514, 7.727190971374512, 8.185113906860352, 8.643036842346191, 9.100959777832031, 9.558883666992188, 10.016806602478027, 10.474729537963867, 10.932652473449707, 11.390575408935547]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 8.0, 9.0, 12.0, 14.0, 25.0, 28.0, 45.0, 76.0, 97.0, 149.0, 236.0, 364.0, 618.0, 1108.0, 2151.0, 4381.0, 10583.0, 27953.0, 79363.0, 213663.0, 370906.0, 211180.0, 77954.0, 27580.0, 10581.0, 4466.0, 2187.0, 1110.0, 675.0, 335.0, 230.0, 154.0, 94.0, 52.0, 53.0, 32.0, 23.0, 22.0, 11.0, 10.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.625, -8.36749267578125, -8.1099853515625, -7.85247802734375, -7.594970703125, -7.33746337890625, -7.0799560546875, -6.82244873046875, -6.56494140625, -6.30743408203125, -6.0499267578125, -5.79241943359375, -5.534912109375, -5.27740478515625, -5.0198974609375, -4.76239013671875, -4.5048828125, -4.24737548828125, -3.9898681640625, -3.73236083984375, -3.474853515625, -3.21734619140625, -2.9598388671875, -2.70233154296875, -2.44482421875, -2.18731689453125, -1.9298095703125, -1.67230224609375, -1.414794921875, -1.15728759765625, -0.8997802734375, -0.64227294921875, -0.384765625, -0.12725830078125, 0.1302490234375, 0.38775634765625, 0.645263671875, 0.90277099609375, 1.1602783203125, 1.41778564453125, 1.67529296875, 1.93280029296875, 2.1903076171875, 2.44781494140625, 2.705322265625, 2.96282958984375, 3.2203369140625, 3.47784423828125, 3.7353515625, 3.99285888671875, 4.2503662109375, 4.50787353515625, 4.765380859375, 5.02288818359375, 5.2803955078125, 5.53790283203125, 5.79541015625, 6.05291748046875, 6.3104248046875, 6.56793212890625, 6.825439453125, 7.08294677734375, 7.3404541015625, 7.59796142578125, 7.85546875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 10.0, 5.0, 8.0, 8.0, 10.0, 10.0, 22.0, 21.0, 21.0, 23.0, 31.0, 29.0, 32.0, 49.0, 44.0, 29.0, 53.0, 47.0, 49.0, 45.0, 51.0, 39.0, 46.0, 44.0, 38.0, 39.0, 33.0, 25.0, 26.0, 26.0, 16.0, 16.0, 12.0, 6.0, 12.0, 6.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-1.2900390625, -1.2555923461914062, -1.2211456298828125, -1.1866989135742188, -1.152252197265625, -1.1178054809570312, -1.0833587646484375, -1.0489120483398438, -1.01446533203125, -0.9800186157226562, -0.9455718994140625, -0.9111251831054688, -0.876678466796875, -0.8422317504882812, -0.8077850341796875, -0.7733383178710938, -0.7388916015625, -0.7044448852539062, -0.6699981689453125, -0.6355514526367188, -0.601104736328125, -0.5666580200195312, -0.5322113037109375, -0.49776458740234375, -0.46331787109375, -0.42887115478515625, -0.3944244384765625, -0.35997772216796875, -0.325531005859375, -0.29108428955078125, -0.2566375732421875, -0.22219085693359375, -0.187744140625, -0.15329742431640625, -0.1188507080078125, -0.08440399169921875, -0.049957275390625, -0.01551055908203125, 0.0189361572265625, 0.05338287353515625, 0.08782958984375, 0.12227630615234375, 0.1567230224609375, 0.19116973876953125, 0.225616455078125, 0.26006317138671875, 0.2945098876953125, 0.32895660400390625, 0.3634033203125, 0.39785003662109375, 0.4322967529296875, 0.46674346923828125, 0.501190185546875, 0.5356369018554688, 0.5700836181640625, 0.6045303344726562, 0.63897705078125, 0.6734237670898438, 0.7078704833984375, 0.7423171997070312, 0.776763916015625, 0.8112106323242188, 0.8456573486328125, 0.8801040649414062, 0.91455078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 5.0, 9.0, 13.0, 20.0, 37.0, 36.0, 68.0, 78.0, 110.0, 157.0, 241.0, 381.0, 580.0, 1089.0, 2361.0, 6272.0, 18804.0, 59332.0, 181413.0, 382351.0, 259384.0, 91578.0, 28439.0, 9133.0, 3192.0, 1370.0, 734.0, 424.0, 291.0, 199.0, 152.0, 88.0, 57.0, 34.0, 32.0, 17.0, 16.0, 12.0, 14.0, 8.0, 6.0, 7.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.828125, -5.62493896484375, -5.4217529296875, -5.21856689453125, -5.015380859375, -4.81219482421875, -4.6090087890625, -4.40582275390625, -4.20263671875, -3.99945068359375, -3.7962646484375, -3.59307861328125, -3.389892578125, -3.18670654296875, -2.9835205078125, -2.78033447265625, -2.5771484375, -2.37396240234375, -2.1707763671875, -1.96759033203125, -1.764404296875, -1.56121826171875, -1.3580322265625, -1.15484619140625, -0.95166015625, -0.74847412109375, -0.5452880859375, -0.34210205078125, -0.138916015625, 0.06427001953125, 0.2674560546875, 0.47064208984375, 0.673828125, 0.87701416015625, 1.0802001953125, 1.28338623046875, 1.486572265625, 1.68975830078125, 1.8929443359375, 2.09613037109375, 2.29931640625, 2.50250244140625, 2.7056884765625, 2.90887451171875, 3.112060546875, 3.31524658203125, 3.5184326171875, 3.72161865234375, 3.9248046875, 4.12799072265625, 4.3311767578125, 4.53436279296875, 4.737548828125, 4.94073486328125, 5.1439208984375, 5.34710693359375, 5.55029296875, 5.75347900390625, 5.9566650390625, 6.15985107421875, 6.363037109375, 6.56622314453125, 6.7694091796875, 6.97259521484375, 7.17578125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 8.0, 7.0, 9.0, 9.0, 13.0, 20.0, 21.0, 26.0, 17.0, 29.0, 26.0, 26.0, 34.0, 40.0, 46.0, 58.0, 48.0, 53.0, 42.0, 52.0, 40.0, 32.0, 50.0, 38.0, 34.0, 41.0, 25.0, 26.0, 22.0, 18.0, 16.0, 10.0, 15.0, 8.0, 12.0, 10.0, 4.0, 2.0, 1.0, 4.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.28125, -4.136474609375, -3.99169921875, -3.846923828125, -3.7021484375, -3.557373046875, -3.41259765625, -3.267822265625, -3.123046875, -2.978271484375, -2.83349609375, -2.688720703125, -2.5439453125, -2.399169921875, -2.25439453125, -2.109619140625, -1.96484375, -1.820068359375, -1.67529296875, -1.530517578125, -1.3857421875, -1.240966796875, -1.09619140625, -0.951416015625, -0.806640625, -0.661865234375, -0.51708984375, -0.372314453125, -0.2275390625, -0.082763671875, 0.06201171875, 0.206787109375, 0.3515625, 0.496337890625, 0.64111328125, 0.785888671875, 0.9306640625, 1.075439453125, 1.22021484375, 1.364990234375, 1.509765625, 1.654541015625, 1.79931640625, 1.944091796875, 2.0888671875, 2.233642578125, 2.37841796875, 2.523193359375, 2.66796875, 2.812744140625, 2.95751953125, 3.102294921875, 3.2470703125, 3.391845703125, 3.53662109375, 3.681396484375, 3.826171875, 3.970947265625, 4.11572265625, 4.260498046875, 4.4052734375, 4.550048828125, 4.69482421875, 4.839599609375, 4.984375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 11.0, 4.0, 14.0, 17.0, 24.0, 45.0, 65.0, 132.0, 227.0, 553.0, 1490.0, 4939.0, 23612.0, 210153.0, 685556.0, 102261.0, 14120.0, 3305.0, 1119.0, 434.0, 189.0, 95.0, 70.0, 45.0, 27.0, 16.0, 11.0, 5.0, 6.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-9.8359375, -9.56536865234375, -9.2947998046875, -9.02423095703125, -8.753662109375, -8.48309326171875, -8.2125244140625, -7.94195556640625, -7.67138671875, -7.40081787109375, -7.1302490234375, -6.85968017578125, -6.589111328125, -6.31854248046875, -6.0479736328125, -5.77740478515625, -5.5068359375, -5.23626708984375, -4.9656982421875, -4.69512939453125, -4.424560546875, -4.15399169921875, -3.8834228515625, -3.61285400390625, -3.34228515625, -3.07171630859375, -2.8011474609375, -2.53057861328125, -2.260009765625, -1.98944091796875, -1.7188720703125, -1.44830322265625, -1.177734375, -0.90716552734375, -0.6365966796875, -0.36602783203125, -0.095458984375, 0.17510986328125, 0.4456787109375, 0.71624755859375, 0.98681640625, 1.25738525390625, 1.5279541015625, 1.79852294921875, 2.069091796875, 2.33966064453125, 2.6102294921875, 2.88079833984375, 3.1513671875, 3.42193603515625, 3.6925048828125, 3.96307373046875, 4.233642578125, 4.50421142578125, 4.7747802734375, 5.04534912109375, 5.31591796875, 5.58648681640625, 5.8570556640625, 6.12762451171875, 6.398193359375, 6.66876220703125, 6.9393310546875, 7.20989990234375, 7.48046875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 7.0, 8.0, 12.0, 22.0, 34.0, 59.0, 58.0, 89.0, 125.0, 156.0, 125.0, 95.0, 75.0, 31.0, 31.0, 18.0, 21.0, 11.0, 9.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006847381591796875, -0.0006494522094726562, -0.000614166259765625, -0.0005788803100585938, -0.0005435943603515625, -0.0005083084106445312, -0.0004730224609375, -0.00043773651123046875, -0.0004024505615234375, -0.00036716461181640625, -0.000331878662109375, -0.00029659271240234375, -0.0002613067626953125, -0.00022602081298828125, -0.00019073486328125, -0.00015544891357421875, -0.0001201629638671875, -8.487701416015625e-05, -4.9591064453125e-05, -1.430511474609375e-05, 2.09808349609375e-05, 5.626678466796875e-05, 9.1552734375e-05, 0.00012683868408203125, 0.0001621246337890625, 0.00019741058349609375, 0.000232696533203125, 0.00026798248291015625, 0.0003032684326171875, 0.00033855438232421875, 0.00037384033203125, 0.00040912628173828125, 0.0004444122314453125, 0.00047969818115234375, 0.000514984130859375, 0.0005502700805664062, 0.0005855560302734375, 0.0006208419799804688, 0.0006561279296875, 0.0006914138793945312, 0.0007266998291015625, 0.0007619857788085938, 0.000797271728515625, 0.0008325576782226562, 0.0008678436279296875, 0.0009031295776367188, 0.00093841552734375, 0.0009737014770507812, 0.0010089874267578125, 0.0010442733764648438, 0.001079559326171875, 0.0011148452758789062, 0.0011501312255859375, 0.0011854171752929688, 0.001220703125, 0.0012559890747070312, 0.0012912750244140625, 0.0013265609741210938, 0.001361846923828125, 0.0013971328735351562, 0.0014324188232421875, 0.0014677047729492188, 0.00150299072265625, 0.0015382766723632812, 0.0015735626220703125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 8.0, 5.0, 4.0, 7.0, 9.0, 6.0, 17.0, 12.0, 23.0, 25.0, 27.0, 35.0, 49.0, 70.0, 80.0, 147.0, 217.0, 380.0, 677.0, 1284.0, 2612.0, 5962.0, 15590.0, 47698.0, 186386.0, 493010.0, 211206.0, 53302.0, 17068.0, 6555.0, 2880.0, 1385.0, 669.0, 374.0, 255.0, 149.0, 99.0, 63.0, 31.0, 31.0, 36.0, 18.0, 26.0, 13.0, 14.0, 10.0, 9.0, 7.0, 8.0, 3.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0], "bins": [-4.96484375, -4.81683349609375, -4.6688232421875, -4.52081298828125, -4.372802734375, -4.22479248046875, -4.0767822265625, -3.92877197265625, -3.78076171875, -3.63275146484375, -3.4847412109375, -3.33673095703125, -3.188720703125, -3.04071044921875, -2.8927001953125, -2.74468994140625, -2.5966796875, -2.44866943359375, -2.3006591796875, -2.15264892578125, -2.004638671875, -1.85662841796875, -1.7086181640625, -1.56060791015625, -1.41259765625, -1.26458740234375, -1.1165771484375, -0.96856689453125, -0.820556640625, -0.67254638671875, -0.5245361328125, -0.37652587890625, -0.228515625, -0.08050537109375, 0.0675048828125, 0.21551513671875, 0.363525390625, 0.51153564453125, 0.6595458984375, 0.80755615234375, 0.95556640625, 1.10357666015625, 1.2515869140625, 1.39959716796875, 1.547607421875, 1.69561767578125, 1.8436279296875, 1.99163818359375, 2.1396484375, 2.28765869140625, 2.4356689453125, 2.58367919921875, 2.731689453125, 2.87969970703125, 3.0277099609375, 3.17572021484375, 3.32373046875, 3.47174072265625, 3.6197509765625, 3.76776123046875, 3.915771484375, 4.06378173828125, 4.2117919921875, 4.35980224609375, 4.5078125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 7.0, 4.0, 4.0, 5.0, 16.0, 12.0, 8.0, 20.0, 20.0, 21.0, 29.0, 45.0, 51.0, 50.0, 60.0, 74.0, 72.0, 71.0, 62.0, 78.0, 61.0, 40.0, 34.0, 26.0, 15.0, 17.0, 14.0, 10.0, 22.0, 7.0, 6.0, 8.0, 5.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.255859375, -3.15966796875, -3.0634765625, -2.96728515625, -2.87109375, -2.77490234375, -2.6787109375, -2.58251953125, -2.486328125, -2.39013671875, -2.2939453125, -2.19775390625, -2.1015625, -2.00537109375, -1.9091796875, -1.81298828125, -1.716796875, -1.62060546875, -1.5244140625, -1.42822265625, -1.33203125, -1.23583984375, -1.1396484375, -1.04345703125, -0.947265625, -0.85107421875, -0.7548828125, -0.65869140625, -0.5625, -0.46630859375, -0.3701171875, -0.27392578125, -0.177734375, -0.08154296875, 0.0146484375, 0.11083984375, 0.20703125, 0.30322265625, 0.3994140625, 0.49560546875, 0.591796875, 0.68798828125, 0.7841796875, 0.88037109375, 0.9765625, 1.07275390625, 1.1689453125, 1.26513671875, 1.361328125, 1.45751953125, 1.5537109375, 1.64990234375, 1.74609375, 1.84228515625, 1.9384765625, 2.03466796875, 2.130859375, 2.22705078125, 2.3232421875, 2.41943359375, 2.515625, 2.61181640625, 2.7080078125, 2.80419921875, 2.900390625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 9.0, 14.0, 46.0, 105.0, 162.0, 222.0, 187.0, 125.0, 77.0, 36.0, 13.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.70285034179688, -111.8202896118164, -108.93772888183594, -106.05516815185547, -103.172607421875, -100.29004669189453, -97.40748596191406, -94.52493286132812, -91.64236450195312, -88.75980377197266, -85.87724304199219, -82.99468231201172, -80.11212158203125, -77.22956085205078, -74.34700012207031, -71.46444702148438, -68.5818862915039, -65.69932556152344, -62.81676483154297, -59.9342041015625, -57.05164337158203, -54.16908264160156, -51.28652572631836, -48.40396499633789, -45.52140426635742, -42.63884353637695, -39.756282806396484, -36.87372589111328, -33.99116516113281, -31.10860252380371, -28.226043701171875, -25.343482971191406, -22.46092987060547, -19.578369140625, -16.69580841064453, -13.813249588012695, -10.930688858032227, -8.048128128051758, -5.165569305419922, -2.283008575439453, 0.5995521545410156, 3.482112407684326, 6.364672660827637, 9.247232437133789, 12.129793167114258, 15.012353897094727, 17.894912719726562, 20.77747344970703, 23.6600341796875, 26.54259490966797, 29.425155639648438, 32.307716369628906, 35.190277099609375, 38.072837829589844, 40.95539474487305, 43.837955474853516, 46.720516204833984, 49.60307693481445, 52.48563766479492, 55.368194580078125, 58.250755310058594, 61.13331604003906, 64.01587677001953, 66.8984375, 69.78099822998047]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 9.0, 3.0, 4.0, 4.0, 7.0, 8.0, 13.0, 14.0, 14.0, 18.0, 30.0, 29.0, 29.0, 38.0, 34.0, 36.0, 34.0, 43.0, 38.0, 40.0, 42.0, 44.0, 46.0, 51.0, 32.0, 50.0, 36.0, 31.0, 47.0, 29.0, 24.0, 21.0, 21.0, 24.0, 15.0, 11.0, 13.0, 5.0, 5.0, 1.0, 4.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.53211212158203, -31.670875549316406, -30.80963706970215, -29.948400497436523, -29.087162017822266, -28.22592544555664, -27.364688873291016, -26.503450393676758, -25.642213821411133, -24.780977249145508, -23.91973876953125, -23.058502197265625, -22.197263717651367, -21.336027145385742, -20.474788665771484, -19.61355209350586, -18.752315521240234, -17.89107894897461, -17.02984046936035, -16.168603897094727, -15.307366371154785, -14.446128845214844, -13.584891319274902, -12.723653793334961, -11.862415313720703, -11.001177787780762, -10.13994026184082, -9.278703689575195, -8.417466163635254, -7.5562286376953125, -6.694991111755371, -5.833754062652588, -4.972517013549805, -4.111279487609863, -3.25004243850708, -2.3888049125671387, -1.5275676250457764, -0.6663303375244141, 0.19490718841552734, 1.0561442375183105, 1.917381763458252, 2.7786190509796143, 3.6398563385009766, 4.501093864440918, 5.362331390380859, 6.223568439483643, 7.084805965423584, 7.946043014526367, 8.807280540466309, 9.66851806640625, 10.529755592346191, 11.390993118286133, 12.252229690551758, 13.1134672164917, 13.97470474243164, 14.835941314697266, 15.697179794311523, 16.55841636657715, 17.419654846191406, 18.28089141845703, 19.14212989807129, 20.003366470336914, 20.864604949951172, 21.725841522216797, 22.587078094482422]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 2.0, 3.0, 7.0, 4.0, 6.0, 13.0, 15.0, 14.0, 19.0, 28.0, 39.0, 52.0, 69.0, 89.0, 123.0, 162.0, 259.0, 362.0, 564.0, 874.0, 1408.0, 2485.0, 4966.0, 10673.0, 27183.0, 87228.0, 422447.0, 3064024.0, 430899.0, 89022.0, 28857.0, 11317.0, 5105.0, 2622.0, 1339.0, 736.0, 432.0, 281.0, 184.0, 136.0, 77.0, 51.0, 31.0, 27.0, 15.0, 9.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-9.3125, -9.0426025390625, -8.772705078125, -8.5028076171875, -8.23291015625, -7.9630126953125, -7.693115234375, -7.4232177734375, -7.1533203125, -6.8834228515625, -6.613525390625, -6.3436279296875, -6.07373046875, -5.8038330078125, -5.533935546875, -5.2640380859375, -4.994140625, -4.7242431640625, -4.454345703125, -4.1844482421875, -3.91455078125, -3.6446533203125, -3.374755859375, -3.1048583984375, -2.8349609375, -2.5650634765625, -2.295166015625, -2.0252685546875, -1.75537109375, -1.4854736328125, -1.215576171875, -0.9456787109375, -0.67578125, -0.4058837890625, -0.135986328125, 0.1339111328125, 0.40380859375, 0.6737060546875, 0.943603515625, 1.2135009765625, 1.4833984375, 1.7532958984375, 2.023193359375, 2.2930908203125, 2.56298828125, 2.8328857421875, 3.102783203125, 3.3726806640625, 3.642578125, 3.9124755859375, 4.182373046875, 4.4522705078125, 4.72216796875, 4.9920654296875, 5.261962890625, 5.5318603515625, 5.8017578125, 6.0716552734375, 6.341552734375, 6.6114501953125, 6.88134765625, 7.1512451171875, 7.421142578125, 7.6910400390625, 7.9609375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 11.0, 7.0, 10.0, 16.0, 16.0, 19.0, 17.0, 36.0, 30.0, 33.0, 45.0, 47.0, 46.0, 44.0, 50.0, 48.0, 54.0, 35.0, 45.0, 44.0, 58.0, 39.0, 34.0, 34.0, 25.0, 26.0, 25.0, 20.0, 18.0, 10.0, 14.0, 13.0, 3.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2333984375, -1.197052001953125, -1.16070556640625, -1.124359130859375, -1.0880126953125, -1.051666259765625, -1.01531982421875, -0.978973388671875, -0.942626953125, -0.906280517578125, -0.86993408203125, -0.833587646484375, -0.7972412109375, -0.760894775390625, -0.72454833984375, -0.688201904296875, -0.65185546875, -0.615509033203125, -0.57916259765625, -0.542816162109375, -0.5064697265625, -0.470123291015625, -0.43377685546875, -0.397430419921875, -0.361083984375, -0.324737548828125, -0.28839111328125, -0.252044677734375, -0.2156982421875, -0.179351806640625, -0.14300537109375, -0.106658935546875, -0.0703125, -0.033966064453125, 0.00238037109375, 0.038726806640625, 0.0750732421875, 0.111419677734375, 0.14776611328125, 0.184112548828125, 0.220458984375, 0.256805419921875, 0.29315185546875, 0.329498291015625, 0.3658447265625, 0.402191162109375, 0.43853759765625, 0.474884033203125, 0.51123046875, 0.547576904296875, 0.58392333984375, 0.620269775390625, 0.6566162109375, 0.692962646484375, 0.72930908203125, 0.765655517578125, 0.802001953125, 0.838348388671875, 0.87469482421875, 0.911041259765625, 0.9473876953125, 0.983734130859375, 1.02008056640625, 1.056427001953125, 1.0927734375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 5.0, 7.0, 11.0, 14.0, 29.0, 37.0, 57.0, 62.0, 130.0, 226.0, 435.0, 976.0, 2449.0, 7742.0, 32159.0, 190355.0, 2643830.0, 1170850.0, 114039.0, 21565.0, 5790.0, 1886.0, 783.0, 334.0, 169.0, 122.0, 56.0, 44.0, 37.0, 32.0, 16.0, 5.0, 9.0, 4.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.9921875, -10.6676025390625, -10.343017578125, -10.0184326171875, -9.69384765625, -9.3692626953125, -9.044677734375, -8.7200927734375, -8.3955078125, -8.0709228515625, -7.746337890625, -7.4217529296875, -7.09716796875, -6.7725830078125, -6.447998046875, -6.1234130859375, -5.798828125, -5.4742431640625, -5.149658203125, -4.8250732421875, -4.50048828125, -4.1759033203125, -3.851318359375, -3.5267333984375, -3.2021484375, -2.8775634765625, -2.552978515625, -2.2283935546875, -1.90380859375, -1.5792236328125, -1.254638671875, -0.9300537109375, -0.60546875, -0.2808837890625, 0.043701171875, 0.3682861328125, 0.69287109375, 1.0174560546875, 1.342041015625, 1.6666259765625, 1.9912109375, 2.3157958984375, 2.640380859375, 2.9649658203125, 3.28955078125, 3.6141357421875, 3.938720703125, 4.2633056640625, 4.587890625, 4.9124755859375, 5.237060546875, 5.5616455078125, 5.88623046875, 6.2108154296875, 6.535400390625, 6.8599853515625, 7.1845703125, 7.5091552734375, 7.833740234375, 8.1583251953125, 8.48291015625, 8.8074951171875, 9.132080078125, 9.4566650390625, 9.78125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 7.0, 8.0, 13.0, 7.0, 19.0, 21.0, 29.0, 51.0, 75.0, 89.0, 120.0, 166.0, 295.0, 470.0, 794.0, 637.0, 400.0, 243.0, 170.0, 123.0, 91.0, 53.0, 57.0, 31.0, 24.0, 18.0, 13.0, 10.0, 10.0, 6.0, 2.0, 7.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.658203125, -2.565887451171875, -2.47357177734375, -2.381256103515625, -2.2889404296875, -2.196624755859375, -2.10430908203125, -2.011993408203125, -1.919677734375, -1.827362060546875, -1.73504638671875, -1.642730712890625, -1.5504150390625, -1.458099365234375, -1.36578369140625, -1.273468017578125, -1.18115234375, -1.088836669921875, -0.99652099609375, -0.904205322265625, -0.8118896484375, -0.719573974609375, -0.62725830078125, -0.534942626953125, -0.442626953125, -0.350311279296875, -0.25799560546875, -0.165679931640625, -0.0733642578125, 0.018951416015625, 0.11126708984375, 0.203582763671875, 0.2958984375, 0.388214111328125, 0.48052978515625, 0.572845458984375, 0.6651611328125, 0.757476806640625, 0.84979248046875, 0.942108154296875, 1.034423828125, 1.126739501953125, 1.21905517578125, 1.311370849609375, 1.4036865234375, 1.496002197265625, 1.58831787109375, 1.680633544921875, 1.77294921875, 1.865264892578125, 1.95758056640625, 2.049896240234375, 2.1422119140625, 2.234527587890625, 2.32684326171875, 2.419158935546875, 2.511474609375, 2.603790283203125, 2.69610595703125, 2.788421630859375, 2.8807373046875, 2.973052978515625, 3.06536865234375, 3.157684326171875, 3.25]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 13.0, 19.0, 47.0, 77.0, 126.0, 217.0, 196.0, 130.0, 76.0, 58.0, 28.0, 9.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-58.36238098144531, -56.890621185302734, -55.41885757446289, -53.94709777832031, -52.47533416748047, -51.00357437133789, -49.53181457519531, -48.06005096435547, -46.58829116821289, -45.11653137207031, -43.64476776123047, -42.17300796508789, -40.70124816894531, -39.22948455810547, -37.75772476196289, -36.28596496582031, -34.81420135498047, -33.34244155883789, -31.870677947998047, -30.39891815185547, -28.927156448364258, -27.455394744873047, -25.98363494873047, -24.511873245239258, -23.040111541748047, -21.568349838256836, -20.096588134765625, -18.624828338623047, -17.153066635131836, -15.681304931640625, -14.20954418182373, -12.737783432006836, -11.26602554321289, -9.79426383972168, -8.322503089904785, -6.850741863250732, -5.37898063659668, -3.907219409942627, -2.435458183288574, -0.9636974334716797, 0.5080642700195312, 1.979825496673584, 3.4515867233276367, 4.9233479499816895, 6.395109176635742, 7.866870403289795, 9.338631629943848, 10.810392379760742, 12.282154083251953, 13.753915786743164, 15.225676536560059, 16.697437286376953, 18.169198989868164, 19.640960693359375, 21.112720489501953, 22.584482192993164, 24.056243896484375, 25.528005599975586, 26.999767303466797, 28.471527099609375, 29.943288803100586, 31.415050506591797, 32.886810302734375, 34.35857391357422, 35.8303337097168]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0, 7.0, 7.0, 12.0, 6.0, 10.0, 15.0, 22.0, 25.0, 23.0, 25.0, 24.0, 39.0, 26.0, 35.0, 47.0, 43.0, 34.0, 51.0, 57.0, 46.0, 40.0, 47.0, 39.0, 46.0, 41.0, 38.0, 35.0, 29.0, 25.0, 17.0, 19.0, 14.0, 12.0, 12.0, 14.0, 6.0, 6.0, 5.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.49124526977539, -13.044209480285645, -12.597173690795898, -12.150137901306152, -11.703102111816406, -11.25606632232666, -10.809030532836914, -10.361994743347168, -9.914958953857422, -9.467923164367676, -9.02088737487793, -8.573851585388184, -8.126815795898438, -7.679780006408691, -7.232744216918945, -6.785708427429199, -6.338672637939453, -5.891636848449707, -5.444601058959961, -4.997565269470215, -4.550529479980469, -4.103493690490723, -3.6564579010009766, -3.2094221115112305, -2.7623863220214844, -2.3153505325317383, -1.8683147430419922, -1.421278953552246, -0.9742431640625, -0.5272073745727539, -0.08017158508300781, 0.3668642044067383, 0.8139009475708008, 1.2609367370605469, 1.707972526550293, 2.155008316040039, 2.602044105529785, 3.0490798950195312, 3.4961156845092773, 3.9431514739990234, 4.3901872634887695, 4.837223052978516, 5.284258842468262, 5.731294631958008, 6.178330421447754, 6.6253662109375, 7.072402000427246, 7.519437789916992, 7.966473579406738, 8.413509368896484, 8.86054515838623, 9.307580947875977, 9.754616737365723, 10.201652526855469, 10.648688316345215, 11.095724105834961, 11.542759895324707, 11.989795684814453, 12.4368314743042, 12.883867263793945, 13.330903053283691, 13.777938842773438, 14.224974632263184, 14.67201042175293, 15.119046211242676]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 9.0, 16.0, 10.0, 17.0, 42.0, 59.0, 114.0, 198.0, 403.0, 713.0, 1595.0, 4167.0, 12762.0, 45436.0, 226567.0, 600444.0, 115274.0, 27502.0, 7954.0, 2873.0, 1148.0, 599.0, 266.0, 161.0, 78.0, 52.0, 33.0, 26.0, 16.0, 7.0, 13.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4921875, -13.110107421875, -12.72802734375, -12.345947265625, -11.9638671875, -11.581787109375, -11.19970703125, -10.817626953125, -10.435546875, -10.053466796875, -9.67138671875, -9.289306640625, -8.9072265625, -8.525146484375, -8.14306640625, -7.760986328125, -7.37890625, -6.996826171875, -6.61474609375, -6.232666015625, -5.8505859375, -5.468505859375, -5.08642578125, -4.704345703125, -4.322265625, -3.940185546875, -3.55810546875, -3.176025390625, -2.7939453125, -2.411865234375, -2.02978515625, -1.647705078125, -1.265625, -0.883544921875, -0.50146484375, -0.119384765625, 0.2626953125, 0.644775390625, 1.02685546875, 1.408935546875, 1.791015625, 2.173095703125, 2.55517578125, 2.937255859375, 3.3193359375, 3.701416015625, 4.08349609375, 4.465576171875, 4.84765625, 5.229736328125, 5.61181640625, 5.993896484375, 6.3759765625, 6.758056640625, 7.14013671875, 7.522216796875, 7.904296875, 8.286376953125, 8.66845703125, 9.050537109375, 9.4326171875, 9.814697265625, 10.19677734375, 10.578857421875, 10.9609375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 2.0, 7.0, 6.0, 5.0, 9.0, 9.0, 11.0, 14.0, 22.0, 18.0, 26.0, 26.0, 38.0, 31.0, 48.0, 28.0, 43.0, 41.0, 42.0, 41.0, 51.0, 40.0, 36.0, 54.0, 42.0, 28.0, 32.0, 33.0, 38.0, 26.0, 34.0, 24.0, 15.0, 16.0, 16.0, 8.0, 6.0, 8.0, 3.0, 2.0, 5.0, 7.0, 2.0, 2.0, 3.0, 1.0, 2.0], "bins": [-1.2880859375, -1.2535171508789062, -1.2189483642578125, -1.1843795776367188, -1.149810791015625, -1.1152420043945312, -1.0806732177734375, -1.0461044311523438, -1.01153564453125, -0.9769668579101562, -0.9423980712890625, -0.9078292846679688, -0.873260498046875, -0.8386917114257812, -0.8041229248046875, -0.7695541381835938, -0.7349853515625, -0.7004165649414062, -0.6658477783203125, -0.6312789916992188, -0.596710205078125, -0.5621414184570312, -0.5275726318359375, -0.49300384521484375, -0.45843505859375, -0.42386627197265625, -0.3892974853515625, -0.35472869873046875, -0.320159912109375, -0.28559112548828125, -0.2510223388671875, -0.21645355224609375, -0.181884765625, -0.14731597900390625, -0.1127471923828125, -0.07817840576171875, -0.043609619140625, -0.00904083251953125, 0.0255279541015625, 0.06009674072265625, 0.09466552734375, 0.12923431396484375, 0.1638031005859375, 0.19837188720703125, 0.232940673828125, 0.26750946044921875, 0.3020782470703125, 0.33664703369140625, 0.3712158203125, 0.40578460693359375, 0.4403533935546875, 0.47492218017578125, 0.509490966796875, 0.5440597534179688, 0.5786285400390625, 0.6131973266601562, 0.64776611328125, 0.6823348999023438, 0.7169036865234375, 0.7514724731445312, 0.786041259765625, 0.8206100463867188, 0.8551788330078125, 0.8897476196289062, 0.92431640625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 8.0, 6.0, 11.0, 5.0, 13.0, 23.0, 29.0, 36.0, 69.0, 104.0, 134.0, 233.0, 359.0, 680.0, 1346.0, 2965.0, 8669.0, 27938.0, 99771.0, 458718.0, 340194.0, 73901.0, 21388.0, 6858.0, 2503.0, 1061.0, 582.0, 309.0, 190.0, 147.0, 92.0, 72.0, 49.0, 35.0, 27.0, 15.0, 9.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.546875, -8.2869873046875, -8.027099609375, -7.7672119140625, -7.50732421875, -7.2474365234375, -6.987548828125, -6.7276611328125, -6.4677734375, -6.2078857421875, -5.947998046875, -5.6881103515625, -5.42822265625, -5.1683349609375, -4.908447265625, -4.6485595703125, -4.388671875, -4.1287841796875, -3.868896484375, -3.6090087890625, -3.34912109375, -3.0892333984375, -2.829345703125, -2.5694580078125, -2.3095703125, -2.0496826171875, -1.789794921875, -1.5299072265625, -1.27001953125, -1.0101318359375, -0.750244140625, -0.4903564453125, -0.23046875, 0.0294189453125, 0.289306640625, 0.5491943359375, 0.80908203125, 1.0689697265625, 1.328857421875, 1.5887451171875, 1.8486328125, 2.1085205078125, 2.368408203125, 2.6282958984375, 2.88818359375, 3.1480712890625, 3.407958984375, 3.6678466796875, 3.927734375, 4.1876220703125, 4.447509765625, 4.7073974609375, 4.96728515625, 5.2271728515625, 5.487060546875, 5.7469482421875, 6.0068359375, 6.2667236328125, 6.526611328125, 6.7864990234375, 7.04638671875, 7.3062744140625, 7.566162109375, 7.8260498046875, 8.0859375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 0.0, 7.0, 10.0, 13.0, 17.0, 26.0, 29.0, 23.0, 43.0, 31.0, 38.0, 45.0, 44.0, 54.0, 60.0, 43.0, 50.0, 55.0, 54.0, 48.0, 37.0, 41.0, 37.0, 43.0, 34.0, 29.0, 23.0, 16.0, 12.0, 10.0, 11.0, 5.0, 5.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.71875, -4.53594970703125, -4.3531494140625, -4.17034912109375, -3.987548828125, -3.80474853515625, -3.6219482421875, -3.43914794921875, -3.25634765625, -3.07354736328125, -2.8907470703125, -2.70794677734375, -2.525146484375, -2.34234619140625, -2.1595458984375, -1.97674560546875, -1.7939453125, -1.61114501953125, -1.4283447265625, -1.24554443359375, -1.062744140625, -0.87994384765625, -0.6971435546875, -0.51434326171875, -0.33154296875, -0.14874267578125, 0.0340576171875, 0.21685791015625, 0.399658203125, 0.58245849609375, 0.7652587890625, 0.94805908203125, 1.130859375, 1.31365966796875, 1.4964599609375, 1.67926025390625, 1.862060546875, 2.04486083984375, 2.2276611328125, 2.41046142578125, 2.59326171875, 2.77606201171875, 2.9588623046875, 3.14166259765625, 3.324462890625, 3.50726318359375, 3.6900634765625, 3.87286376953125, 4.0556640625, 4.23846435546875, 4.4212646484375, 4.60406494140625, 4.786865234375, 4.96966552734375, 5.1524658203125, 5.33526611328125, 5.51806640625, 5.70086669921875, 5.8836669921875, 6.06646728515625, 6.249267578125, 6.43206787109375, 6.6148681640625, 6.79766845703125, 6.98046875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 1.0, 4.0, 8.0, 8.0, 11.0, 17.0, 14.0, 37.0, 48.0, 77.0, 117.0, 270.0, 516.0, 1346.0, 4037.0, 15717.0, 86447.0, 675784.0, 224987.0, 28824.0, 6754.0, 2022.0, 739.0, 341.0, 170.0, 108.0, 48.0, 47.0, 15.0, 12.0, 12.0, 3.0, 9.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.91796875, -7.6961669921875, -7.474365234375, -7.2525634765625, -7.03076171875, -6.8089599609375, -6.587158203125, -6.3653564453125, -6.1435546875, -5.9217529296875, -5.699951171875, -5.4781494140625, -5.25634765625, -5.0345458984375, -4.812744140625, -4.5909423828125, -4.369140625, -4.1473388671875, -3.925537109375, -3.7037353515625, -3.48193359375, -3.2601318359375, -3.038330078125, -2.8165283203125, -2.5947265625, -2.3729248046875, -2.151123046875, -1.9293212890625, -1.70751953125, -1.4857177734375, -1.263916015625, -1.0421142578125, -0.8203125, -0.5985107421875, -0.376708984375, -0.1549072265625, 0.06689453125, 0.2886962890625, 0.510498046875, 0.7322998046875, 0.9541015625, 1.1759033203125, 1.397705078125, 1.6195068359375, 1.84130859375, 2.0631103515625, 2.284912109375, 2.5067138671875, 2.728515625, 2.9503173828125, 3.172119140625, 3.3939208984375, 3.61572265625, 3.8375244140625, 4.059326171875, 4.2811279296875, 4.5029296875, 4.7247314453125, 4.946533203125, 5.1683349609375, 5.39013671875, 5.6119384765625, 5.833740234375, 6.0555419921875, 6.27734375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 5.0, 7.0, 10.0, 9.0, 12.0, 15.0, 22.0, 29.0, 48.0, 58.0, 152.0, 206.0, 140.0, 86.0, 58.0, 35.0, 33.0, 12.0, 12.0, 13.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0014190673828125, -0.0013832300901412964, -0.0013473927974700928, -0.0013115555047988892, -0.0012757182121276855, -0.001239880919456482, -0.0012040436267852783, -0.0011682063341140747, -0.001132369041442871, -0.0010965317487716675, -0.0010606944561004639, -0.0010248571634292603, -0.0009890198707580566, -0.000953182578086853, -0.0009173452854156494, -0.0008815079927444458, -0.0008456707000732422, -0.0008098334074020386, -0.000773996114730835, -0.0007381588220596313, -0.0007023215293884277, -0.0006664842367172241, -0.0006306469440460205, -0.0005948096513748169, -0.0005589723587036133, -0.0005231350660324097, -0.00048729777336120605, -0.00045146048069000244, -0.00041562318801879883, -0.0003797858953475952, -0.0003439486026763916, -0.000308111310005188, -0.0002722740173339844, -0.00023643672466278076, -0.00020059943199157715, -0.00016476213932037354, -0.00012892484664916992, -9.308755397796631e-05, -5.7250261306762695e-05, -2.1412968635559082e-05, 1.4424324035644531e-05, 5.0261616706848145e-05, 8.609890937805176e-05, 0.00012193620204925537, 0.00015777349472045898, 0.0001936107873916626, 0.0002294480800628662, 0.0002652853727340698, 0.00030112266540527344, 0.00033695995807647705, 0.00037279725074768066, 0.0004086345434188843, 0.0004444718360900879, 0.0004803091287612915, 0.0005161464214324951, 0.0005519837141036987, 0.0005878210067749023, 0.000623658299446106, 0.0006594955921173096, 0.0006953328847885132, 0.0007311701774597168, 0.0007670074701309204, 0.000802844762802124, 0.0008386820554733276, 0.0008745193481445312]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 6.0, 7.0, 7.0, 11.0, 14.0, 39.0, 47.0, 60.0, 132.0, 173.0, 363.0, 734.0, 2038.0, 7546.0, 42600.0, 652118.0, 309635.0, 25006.0, 5135.0, 1524.0, 655.0, 276.0, 161.0, 100.0, 59.0, 35.0, 31.0, 21.0, 12.0, 7.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2109375, -7.9532470703125, -7.695556640625, -7.4378662109375, -7.18017578125, -6.9224853515625, -6.664794921875, -6.4071044921875, -6.1494140625, -5.8917236328125, -5.634033203125, -5.3763427734375, -5.11865234375, -4.8609619140625, -4.603271484375, -4.3455810546875, -4.087890625, -3.8302001953125, -3.572509765625, -3.3148193359375, -3.05712890625, -2.7994384765625, -2.541748046875, -2.2840576171875, -2.0263671875, -1.7686767578125, -1.510986328125, -1.2532958984375, -0.99560546875, -0.7379150390625, -0.480224609375, -0.2225341796875, 0.03515625, 0.2928466796875, 0.550537109375, 0.8082275390625, 1.06591796875, 1.3236083984375, 1.581298828125, 1.8389892578125, 2.0966796875, 2.3543701171875, 2.612060546875, 2.8697509765625, 3.12744140625, 3.3851318359375, 3.642822265625, 3.9005126953125, 4.158203125, 4.4158935546875, 4.673583984375, 4.9312744140625, 5.18896484375, 5.4466552734375, 5.704345703125, 5.9620361328125, 6.2197265625, 6.4774169921875, 6.735107421875, 6.9927978515625, 7.25048828125, 7.5081787109375, 7.765869140625, 8.0235595703125, 8.28125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 7.0, 1.0, 2.0, 7.0, 12.0, 9.0, 23.0, 31.0, 34.0, 63.0, 99.0, 146.0, 165.0, 143.0, 94.0, 46.0, 41.0, 22.0, 16.0, 10.0, 5.0, 13.0, 3.0, 3.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.82421875, -4.6806640625, -4.537109375, -4.3935546875, -4.25, -4.1064453125, -3.962890625, -3.8193359375, -3.67578125, -3.5322265625, -3.388671875, -3.2451171875, -3.1015625, -2.9580078125, -2.814453125, -2.6708984375, -2.52734375, -2.3837890625, -2.240234375, -2.0966796875, -1.953125, -1.8095703125, -1.666015625, -1.5224609375, -1.37890625, -1.2353515625, -1.091796875, -0.9482421875, -0.8046875, -0.6611328125, -0.517578125, -0.3740234375, -0.23046875, -0.0869140625, 0.056640625, 0.2001953125, 0.34375, 0.4873046875, 0.630859375, 0.7744140625, 0.91796875, 1.0615234375, 1.205078125, 1.3486328125, 1.4921875, 1.6357421875, 1.779296875, 1.9228515625, 2.06640625, 2.2099609375, 2.353515625, 2.4970703125, 2.640625, 2.7841796875, 2.927734375, 3.0712890625, 3.21484375, 3.3583984375, 3.501953125, 3.6455078125, 3.7890625, 3.9326171875, 4.076171875, 4.2197265625, 4.36328125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 13.0, 61.0, 192.0, 359.0, 258.0, 101.0, 22.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.695068359375, -89.60940551757812, -84.52374267578125, -79.43807220458984, -74.35240936279297, -69.2667465209961, -64.18107604980469, -59.09541320800781, -54.00975036621094, -48.92408752441406, -43.83842086791992, -38.75275421142578, -33.667091369628906, -28.5814266204834, -23.49576187133789, -18.41009521484375, -13.324432373046875, -8.238767623901367, -3.1531028747558594, 1.9325618743896484, 7.018226623535156, 12.103891372680664, 17.189556121826172, 22.275222778320312, 27.360885620117188, 32.44654846191406, 37.5322151184082, 42.617881774902344, 47.70354461669922, 52.789207458496094, 57.874874114990234, 62.960540771484375, 68.04620361328125, 73.13186645507812, 78.217529296875, 83.3031997680664, 88.38886260986328, 93.47452545166016, 98.56019592285156, 103.64585876464844, 108.73152160644531, 113.81718444824219, 118.90284729003906, 123.98851776123047, 129.07418823242188, 134.15985107421875, 139.24551391601562, 144.3311767578125, 149.41683959960938, 154.50250244140625, 159.58816528320312, 164.673828125, 169.75949096679688, 174.8451690673828, 179.9308319091797, 185.01649475097656, 190.10215759277344, 195.1878204345703, 200.2734832763672, 205.35914611816406, 210.44482421875, 215.53048706054688, 220.61614990234375, 225.70181274414062, 230.7874755859375]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 7.0, 3.0, 4.0, 4.0, 7.0, 9.0, 13.0, 10.0, 20.0, 22.0, 23.0, 27.0, 33.0, 20.0, 25.0, 32.0, 26.0, 34.0, 39.0, 43.0, 39.0, 39.0, 29.0, 39.0, 33.0, 36.0, 36.0, 44.0, 33.0, 40.0, 32.0, 32.0, 26.0, 20.0, 23.0, 15.0, 16.0, 7.0, 10.0, 16.0, 10.0, 11.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-25.35485076904297, -24.618051528930664, -23.88125228881836, -23.144454956054688, -22.407655715942383, -21.670856475830078, -20.934057235717773, -20.19725799560547, -19.460460662841797, -18.723661422729492, -17.986862182617188, -17.250064849853516, -16.51326560974121, -15.776466369628906, -15.039667129516602, -14.302868843078613, -13.566069602966309, -12.829270362854004, -12.092472076416016, -11.355672836303711, -10.618874549865723, -9.882075309753418, -9.14527702331543, -8.408477783203125, -7.6716790199279785, -6.934880256652832, -6.1980814933776855, -5.461282730102539, -4.724483489990234, -3.987684965133667, -3.2508859634399414, -2.514087200164795, -1.7772884368896484, -1.040489673614502, -0.3036907911300659, 0.4331080913543701, 1.1699068546295166, 1.906705617904663, 2.6435046195983887, 3.380303382873535, 4.117102146148682, 4.853900909423828, 5.590699672698975, 6.327498435974121, 7.064297676086426, 7.801095962524414, 8.537895202636719, 9.274694442749023, 10.011492729187012, 10.748291969299316, 11.485090255737305, 12.22188949584961, 12.958687782287598, 13.695487022399902, 14.43228530883789, 15.169084548950195, 15.9058837890625, 16.642683029174805, 17.37948226928711, 18.11627960205078, 18.853078842163086, 19.58987808227539, 20.326677322387695, 21.0634765625, 21.800273895263672]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 6.0, 5.0, 8.0, 12.0, 14.0, 15.0, 25.0, 29.0, 29.0, 50.0, 67.0, 100.0, 97.0, 152.0, 201.0, 296.0, 414.0, 649.0, 998.0, 1775.0, 3239.0, 6326.0, 13184.0, 31541.0, 94242.0, 502842.0, 3121538.0, 297771.0, 70147.0, 25229.0, 11084.0, 5451.0, 2841.0, 1517.0, 861.0, 508.0, 337.0, 206.0, 129.0, 103.0, 73.0, 49.0, 36.0, 22.0, 20.0, 19.0, 10.0, 10.0, 3.0, 5.0, 6.0, 1.0, 0.0, 0.0, 3.0], "bins": [-10.1171875, -9.8311767578125, -9.545166015625, -9.2591552734375, -8.97314453125, -8.6871337890625, -8.401123046875, -8.1151123046875, -7.8291015625, -7.5430908203125, -7.257080078125, -6.9710693359375, -6.68505859375, -6.3990478515625, -6.113037109375, -5.8270263671875, -5.541015625, -5.2550048828125, -4.968994140625, -4.6829833984375, -4.39697265625, -4.1109619140625, -3.824951171875, -3.5389404296875, -3.2529296875, -2.9669189453125, -2.680908203125, -2.3948974609375, -2.10888671875, -1.8228759765625, -1.536865234375, -1.2508544921875, -0.96484375, -0.6788330078125, -0.392822265625, -0.1068115234375, 0.17919921875, 0.4652099609375, 0.751220703125, 1.0372314453125, 1.3232421875, 1.6092529296875, 1.895263671875, 2.1812744140625, 2.46728515625, 2.7532958984375, 3.039306640625, 3.3253173828125, 3.611328125, 3.8973388671875, 4.183349609375, 4.4693603515625, 4.75537109375, 5.0413818359375, 5.327392578125, 5.6134033203125, 5.8994140625, 6.1854248046875, 6.471435546875, 6.7574462890625, 7.04345703125, 7.3294677734375, 7.615478515625, 7.9014892578125, 8.1875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 6.0, 3.0, 6.0, 5.0, 4.0, 4.0, 7.0, 11.0, 17.0, 21.0, 20.0, 25.0, 21.0, 35.0, 30.0, 29.0, 34.0, 50.0, 52.0, 43.0, 46.0, 48.0, 37.0, 43.0, 34.0, 40.0, 40.0, 32.0, 37.0, 27.0, 21.0, 28.0, 29.0, 31.0, 19.0, 16.0, 12.0, 15.0, 6.0, 7.0, 3.0, 7.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-1.35546875, -1.3195037841796875, -1.283538818359375, -1.2475738525390625, -1.21160888671875, -1.1756439208984375, -1.139678955078125, -1.1037139892578125, -1.0677490234375, -1.0317840576171875, -0.995819091796875, -0.9598541259765625, -0.92388916015625, -0.8879241943359375, -0.851959228515625, -0.8159942626953125, -0.780029296875, -0.7440643310546875, -0.708099365234375, -0.6721343994140625, -0.63616943359375, -0.6002044677734375, -0.564239501953125, -0.5282745361328125, -0.4923095703125, -0.4563446044921875, -0.420379638671875, -0.3844146728515625, -0.34844970703125, -0.3124847412109375, -0.276519775390625, -0.2405548095703125, -0.20458984375, -0.1686248779296875, -0.132659912109375, -0.0966949462890625, -0.06072998046875, -0.0247650146484375, 0.011199951171875, 0.0471649169921875, 0.0831298828125, 0.1190948486328125, 0.155059814453125, 0.1910247802734375, 0.22698974609375, 0.2629547119140625, 0.298919677734375, 0.3348846435546875, 0.370849609375, 0.4068145751953125, 0.442779541015625, 0.4787445068359375, 0.51470947265625, 0.5506744384765625, 0.586639404296875, 0.6226043701171875, 0.6585693359375, 0.6945343017578125, 0.730499267578125, 0.7664642333984375, 0.80242919921875, 0.8383941650390625, 0.874359130859375, 0.9103240966796875, 0.9462890625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 6.0, 5.0, 6.0, 12.0, 11.0, 17.0, 14.0, 19.0, 24.0, 53.0, 43.0, 96.0, 164.0, 345.0, 931.0, 4518.0, 45564.0, 3390311.0, 725841.0, 22093.0, 2808.0, 691.0, 244.0, 136.0, 81.0, 43.0, 38.0, 31.0, 26.0, 17.0, 19.0, 21.0, 20.0, 5.0, 6.0, 7.0, 6.0, 5.0, 2.0, 1.0, 3.0, 3.0], "bins": [-27.25, -26.56640625, -25.8828125, -25.19921875, -24.515625, -23.83203125, -23.1484375, -22.46484375, -21.78125, -21.09765625, -20.4140625, -19.73046875, -19.046875, -18.36328125, -17.6796875, -16.99609375, -16.3125, -15.62890625, -14.9453125, -14.26171875, -13.578125, -12.89453125, -12.2109375, -11.52734375, -10.84375, -10.16015625, -9.4765625, -8.79296875, -8.109375, -7.42578125, -6.7421875, -6.05859375, -5.375, -4.69140625, -4.0078125, -3.32421875, -2.640625, -1.95703125, -1.2734375, -0.58984375, 0.09375, 0.77734375, 1.4609375, 2.14453125, 2.828125, 3.51171875, 4.1953125, 4.87890625, 5.5625, 6.24609375, 6.9296875, 7.61328125, 8.296875, 8.98046875, 9.6640625, 10.34765625, 11.03125, 11.71484375, 12.3984375, 13.08203125, 13.765625, 14.44921875, 15.1328125, 15.81640625, 16.5]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 4.0, 1.0, 4.0, 7.0, 29.0, 45.0, 100.0, 296.0, 774.0, 1941.0, 508.0, 196.0, 100.0, 31.0, 28.0, 11.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.099609375, -2.867095947265625, -2.63458251953125, -2.402069091796875, -2.1695556640625, -1.937042236328125, -1.70452880859375, -1.472015380859375, -1.239501953125, -1.006988525390625, -0.77447509765625, -0.541961669921875, -0.3094482421875, -0.076934814453125, 0.15557861328125, 0.388092041015625, 0.62060546875, 0.853118896484375, 1.08563232421875, 1.318145751953125, 1.5506591796875, 1.783172607421875, 2.01568603515625, 2.248199462890625, 2.480712890625, 2.713226318359375, 2.94573974609375, 3.178253173828125, 3.4107666015625, 3.643280029296875, 3.87579345703125, 4.108306884765625, 4.3408203125, 4.573333740234375, 4.80584716796875, 5.038360595703125, 5.2708740234375, 5.503387451171875, 5.73590087890625, 5.968414306640625, 6.200927734375, 6.433441162109375, 6.66595458984375, 6.898468017578125, 7.1309814453125, 7.363494873046875, 7.59600830078125, 7.828521728515625, 8.06103515625, 8.293548583984375, 8.52606201171875, 8.758575439453125, 8.9910888671875, 9.223602294921875, 9.45611572265625, 9.688629150390625, 9.921142578125, 10.153656005859375, 10.38616943359375, 10.618682861328125, 10.8511962890625, 11.083709716796875, 11.31622314453125, 11.548736572265625, 11.78125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 6.0, 9.0, 10.0, 21.0, 31.0, 49.0, 63.0, 67.0, 93.0, 83.0, 113.0, 99.0, 83.0, 78.0, 50.0, 43.0, 29.0, 30.0, 16.0, 6.0, 5.0, 3.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.44961166381836, -18.736265182495117, -18.022916793823242, -17.3095703125, -16.596223831176758, -15.8828763961792, -15.16952896118164, -14.456182479858398, -13.742835998535156, -13.029488563537598, -12.316142082214355, -11.602794647216797, -10.889448165893555, -10.176100730895996, -9.462753295898438, -8.749406814575195, -8.036059379577637, -7.322712421417236, -6.609365463256836, -5.896018028259277, -5.182671546936035, -4.469324111938477, -3.755977153778076, -3.042630195617676, -2.3292832374572754, -1.615936279296875, -0.9025892019271851, -0.18924212455749512, 0.5241048336029053, 1.2374517917633057, 1.9507989883422852, 2.6641459465026855, 3.377492904663086, 4.090839862823486, 4.804186820983887, 5.517534255981445, 6.2308807373046875, 6.944228172302246, 7.6575751304626465, 8.370922088623047, 9.084268569946289, 9.797616004943848, 10.51096248626709, 11.224309921264648, 11.93765640258789, 12.65100383758545, 13.364351272583008, 14.07769775390625, 14.791045188903809, 15.504392623901367, 16.21773910522461, 16.93108558654785, 17.644433975219727, 18.35778045654297, 19.07112693786621, 19.784473419189453, 20.497821807861328, 21.21116828918457, 21.924516677856445, 22.637863159179688, 23.35120964050293, 24.064556121826172, 24.777904510498047, 25.49125099182129, 26.20459747314453]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 8.0, 9.0, 16.0, 15.0, 17.0, 24.0, 39.0, 46.0, 52.0, 58.0, 72.0, 79.0, 90.0, 70.0, 73.0, 57.0, 54.0, 58.0, 43.0, 44.0, 25.0, 26.0, 12.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.966829299926758, -22.34467124938965, -21.722515106201172, -21.100357055664062, -20.478199005126953, -19.856040954589844, -19.233882904052734, -18.611726760864258, -17.98956871032715, -17.36741065979004, -16.745254516601562, -16.123096466064453, -15.500938415527344, -14.878780364990234, -14.256623268127441, -13.634466171264648, -13.012308120727539, -12.39015007019043, -11.767992973327637, -11.145835876464844, -10.523677825927734, -9.901519775390625, -9.279362678527832, -8.657205581665039, -8.03504753112793, -7.4128899574279785, -6.790732383728027, -6.168574810028076, -5.546417236328125, -4.924259662628174, -4.302102088928223, -3.6799445152282715, -3.057788848876953, -2.435631275177002, -1.8134737014770508, -1.1913161277770996, -0.5691585540771484, 0.052999019622802734, 0.6751565933227539, 1.297314167022705, 1.9194717407226562, 2.5416293144226074, 3.1637868881225586, 3.7859444618225098, 4.408102035522461, 5.030259609222412, 5.652417182922363, 6.2745747566223145, 6.896732330322266, 7.518889904022217, 8.141047477722168, 8.763204574584961, 9.38536262512207, 10.00752067565918, 10.629677772521973, 11.251834869384766, 11.873992919921875, 12.496150970458984, 13.118308067321777, 13.74046516418457, 14.36262321472168, 14.984781265258789, 15.606938362121582, 16.229095458984375, 16.851253509521484]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 8.0, 9.0, 12.0, 20.0, 28.0, 43.0, 50.0, 77.0, 125.0, 192.0, 315.0, 487.0, 919.0, 1800.0, 3990.0, 9847.0, 26050.0, 78387.0, 394100.0, 406339.0, 80994.0, 26564.0, 9984.0, 3971.0, 1888.0, 890.0, 544.0, 298.0, 195.0, 138.0, 84.0, 70.0, 33.0, 20.0, 23.0, 16.0, 6.0, 8.0, 7.0, 2.0, 8.0, 2.0, 1.0, 1.0], "bins": [-11.890625, -11.5858154296875, -11.281005859375, -10.9761962890625, -10.67138671875, -10.3665771484375, -10.061767578125, -9.7569580078125, -9.4521484375, -9.1473388671875, -8.842529296875, -8.5377197265625, -8.23291015625, -7.9281005859375, -7.623291015625, -7.3184814453125, -7.013671875, -6.7088623046875, -6.404052734375, -6.0992431640625, -5.79443359375, -5.4896240234375, -5.184814453125, -4.8800048828125, -4.5751953125, -4.2703857421875, -3.965576171875, -3.6607666015625, -3.35595703125, -3.0511474609375, -2.746337890625, -2.4415283203125, -2.13671875, -1.8319091796875, -1.527099609375, -1.2222900390625, -0.91748046875, -0.6126708984375, -0.307861328125, -0.0030517578125, 0.3017578125, 0.6065673828125, 0.911376953125, 1.2161865234375, 1.52099609375, 1.8258056640625, 2.130615234375, 2.4354248046875, 2.740234375, 3.0450439453125, 3.349853515625, 3.6546630859375, 3.95947265625, 4.2642822265625, 4.569091796875, 4.8739013671875, 5.1787109375, 5.4835205078125, 5.788330078125, 6.0931396484375, 6.39794921875, 6.7027587890625, 7.007568359375, 7.3123779296875, 7.6171875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 8.0, 7.0, 8.0, 11.0, 9.0, 14.0, 13.0, 20.0, 15.0, 26.0, 34.0, 36.0, 35.0, 37.0, 39.0, 37.0, 51.0, 55.0, 66.0, 46.0, 40.0, 30.0, 44.0, 39.0, 38.0, 38.0, 33.0, 37.0, 22.0, 18.0, 17.0, 17.0, 12.0, 11.0, 14.0, 3.0, 8.0, 2.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.5322265625, -1.4914398193359375, -1.450653076171875, -1.4098663330078125, -1.36907958984375, -1.3282928466796875, -1.287506103515625, -1.2467193603515625, -1.2059326171875, -1.1651458740234375, -1.124359130859375, -1.0835723876953125, -1.04278564453125, -1.0019989013671875, -0.961212158203125, -0.9204254150390625, -0.879638671875, -0.8388519287109375, -0.798065185546875, -0.7572784423828125, -0.71649169921875, -0.6757049560546875, -0.634918212890625, -0.5941314697265625, -0.5533447265625, -0.5125579833984375, -0.471771240234375, -0.4309844970703125, -0.39019775390625, -0.3494110107421875, -0.308624267578125, -0.2678375244140625, -0.22705078125, -0.1862640380859375, -0.145477294921875, -0.1046905517578125, -0.06390380859375, -0.0231170654296875, 0.017669677734375, 0.0584564208984375, 0.0992431640625, 0.1400299072265625, 0.180816650390625, 0.2216033935546875, 0.26239013671875, 0.3031768798828125, 0.343963623046875, 0.3847503662109375, 0.425537109375, 0.4663238525390625, 0.507110595703125, 0.5478973388671875, 0.58868408203125, 0.6294708251953125, 0.670257568359375, 0.7110443115234375, 0.7518310546875, 0.7926177978515625, 0.833404541015625, 0.8741912841796875, 0.91497802734375, 0.9557647705078125, 0.996551513671875, 1.0373382568359375, 1.078125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 1.0, 5.0, 9.0, 7.0, 7.0, 11.0, 11.0, 18.0, 28.0, 27.0, 56.0, 70.0, 92.0, 182.0, 251.0, 463.0, 777.0, 1555.0, 3176.0, 6984.0, 15716.0, 37038.0, 107360.0, 419547.0, 319011.0, 81299.0, 30395.0, 12586.0, 5865.0, 2845.0, 1338.0, 742.0, 379.0, 222.0, 143.0, 107.0, 56.0, 35.0, 31.0, 26.0, 21.0, 16.0, 14.0, 9.0, 6.0, 8.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.953125, -5.76641845703125, -5.5797119140625, -5.39300537109375, -5.206298828125, -5.01959228515625, -4.8328857421875, -4.64617919921875, -4.45947265625, -4.27276611328125, -4.0860595703125, -3.89935302734375, -3.712646484375, -3.52593994140625, -3.3392333984375, -3.15252685546875, -2.9658203125, -2.77911376953125, -2.5924072265625, -2.40570068359375, -2.218994140625, -2.03228759765625, -1.8455810546875, -1.65887451171875, -1.47216796875, -1.28546142578125, -1.0987548828125, -0.91204833984375, -0.725341796875, -0.53863525390625, -0.3519287109375, -0.16522216796875, 0.021484375, 0.20819091796875, 0.3948974609375, 0.58160400390625, 0.768310546875, 0.95501708984375, 1.1417236328125, 1.32843017578125, 1.51513671875, 1.70184326171875, 1.8885498046875, 2.07525634765625, 2.261962890625, 2.44866943359375, 2.6353759765625, 2.82208251953125, 3.0087890625, 3.19549560546875, 3.3822021484375, 3.56890869140625, 3.755615234375, 3.94232177734375, 4.1290283203125, 4.31573486328125, 4.50244140625, 4.68914794921875, 4.8758544921875, 5.06256103515625, 5.249267578125, 5.43597412109375, 5.6226806640625, 5.80938720703125, 5.99609375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 0.0, 1.0, 4.0, 7.0, 8.0, 6.0, 7.0, 14.0, 24.0, 21.0, 26.0, 28.0, 27.0, 36.0, 42.0, 53.0, 53.0, 61.0, 60.0, 48.0, 70.0, 50.0, 53.0, 48.0, 49.0, 47.0, 24.0, 26.0, 35.0, 20.0, 17.0, 7.0, 6.0, 6.0, 5.0, 7.0, 3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.390625, -6.18975830078125, -5.9888916015625, -5.78802490234375, -5.587158203125, -5.38629150390625, -5.1854248046875, -4.98455810546875, -4.78369140625, -4.58282470703125, -4.3819580078125, -4.18109130859375, -3.980224609375, -3.77935791015625, -3.5784912109375, -3.37762451171875, -3.1767578125, -2.97589111328125, -2.7750244140625, -2.57415771484375, -2.373291015625, -2.17242431640625, -1.9715576171875, -1.77069091796875, -1.56982421875, -1.36895751953125, -1.1680908203125, -0.96722412109375, -0.766357421875, -0.56549072265625, -0.3646240234375, -0.16375732421875, 0.037109375, 0.23797607421875, 0.4388427734375, 0.63970947265625, 0.840576171875, 1.04144287109375, 1.2423095703125, 1.44317626953125, 1.64404296875, 1.84490966796875, 2.0457763671875, 2.24664306640625, 2.447509765625, 2.64837646484375, 2.8492431640625, 3.05010986328125, 3.2509765625, 3.45184326171875, 3.6527099609375, 3.85357666015625, 4.054443359375, 4.25531005859375, 4.4561767578125, 4.65704345703125, 4.85791015625, 5.05877685546875, 5.2596435546875, 5.46051025390625, 5.661376953125, 5.86224365234375, 6.0631103515625, 6.26397705078125, 6.46484375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 6.0, 12.0, 11.0, 18.0, 28.0, 25.0, 35.0, 48.0, 73.0, 131.0, 365.0, 894.0, 2568.0, 9479.0, 96289.0, 878110.0, 50079.0, 6909.0, 2061.0, 756.0, 285.0, 137.0, 72.0, 38.0, 31.0, 23.0, 17.0, 15.0, 11.0, 5.0, 10.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8359375, -9.5123291015625, -9.188720703125, -8.8651123046875, -8.54150390625, -8.2178955078125, -7.894287109375, -7.5706787109375, -7.2470703125, -6.9234619140625, -6.599853515625, -6.2762451171875, -5.95263671875, -5.6290283203125, -5.305419921875, -4.9818115234375, -4.658203125, -4.3345947265625, -4.010986328125, -3.6873779296875, -3.36376953125, -3.0401611328125, -2.716552734375, -2.3929443359375, -2.0693359375, -1.7457275390625, -1.422119140625, -1.0985107421875, -0.77490234375, -0.4512939453125, -0.127685546875, 0.1959228515625, 0.51953125, 0.8431396484375, 1.166748046875, 1.4903564453125, 1.81396484375, 2.1375732421875, 2.461181640625, 2.7847900390625, 3.1083984375, 3.4320068359375, 3.755615234375, 4.0792236328125, 4.40283203125, 4.7264404296875, 5.050048828125, 5.3736572265625, 5.697265625, 6.0208740234375, 6.344482421875, 6.6680908203125, 6.99169921875, 7.3153076171875, 7.638916015625, 7.9625244140625, 8.2861328125, 8.6097412109375, 8.933349609375, 9.2569580078125, 9.58056640625, 9.9041748046875, 10.227783203125, 10.5513916015625, 10.875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 8.0, 4.0, 5.0, 7.0, 13.0, 9.0, 17.0, 24.0, 49.0, 107.0, 162.0, 247.0, 161.0, 60.0, 36.0, 20.0, 21.0, 8.0, 12.0, 9.0, 11.0, 2.0, 1.0, 6.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009527206420898438, -0.0009165108203887939, -0.0008803009986877441, -0.0008440911769866943, -0.0008078813552856445, -0.0007716715335845947, -0.0007354617118835449, -0.0006992518901824951, -0.0006630420684814453, -0.0006268322467803955, -0.0005906224250793457, -0.0005544126033782959, -0.0005182027816772461, -0.0004819929599761963, -0.0004457831382751465, -0.0004095733165740967, -0.0003733634948730469, -0.00033715367317199707, -0.00030094385147094727, -0.00026473402976989746, -0.00022852420806884766, -0.00019231438636779785, -0.00015610456466674805, -0.00011989474296569824, -8.368492126464844e-05, -4.747509956359863e-05, -1.1265277862548828e-05, 2.4944543838500977e-05, 6.115436553955078e-05, 9.736418724060059e-05, 0.0001335740089416504, 0.0001697838306427002, 0.00020599365234375, 0.0002422034740447998, 0.0002784132957458496, 0.0003146231174468994, 0.0003508329391479492, 0.000387042760848999, 0.00042325258255004883, 0.00045946240425109863, 0.0004956722259521484, 0.0005318820476531982, 0.000568091869354248, 0.0006043016910552979, 0.0006405115127563477, 0.0006767213344573975, 0.0007129311561584473, 0.0007491409778594971, 0.0007853507995605469, 0.0008215606212615967, 0.0008577704429626465, 0.0008939802646636963, 0.0009301900863647461, 0.0009663999080657959, 0.0010026097297668457, 0.0010388195514678955, 0.0010750293731689453, 0.0011112391948699951, 0.001147449016571045, 0.0011836588382720947, 0.0012198686599731445, 0.0012560784816741943, 0.0012922883033752441, 0.001328498125076294, 0.0013647079467773438]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 2.0, 5.0, 8.0, 6.0, 10.0, 15.0, 21.0, 20.0, 20.0, 35.0, 29.0, 51.0, 71.0, 153.0, 338.0, 861.0, 2195.0, 7438.0, 44819.0, 827639.0, 144670.0, 14437.0, 3476.0, 1200.0, 449.0, 228.0, 84.0, 72.0, 43.0, 24.0, 24.0, 16.0, 24.0, 15.0, 13.0, 9.0, 7.0, 10.0, 5.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-8.2421875, -7.955078125, -7.66796875, -7.380859375, -7.09375, -6.806640625, -6.51953125, -6.232421875, -5.9453125, -5.658203125, -5.37109375, -5.083984375, -4.796875, -4.509765625, -4.22265625, -3.935546875, -3.6484375, -3.361328125, -3.07421875, -2.787109375, -2.5, -2.212890625, -1.92578125, -1.638671875, -1.3515625, -1.064453125, -0.77734375, -0.490234375, -0.203125, 0.083984375, 0.37109375, 0.658203125, 0.9453125, 1.232421875, 1.51953125, 1.806640625, 2.09375, 2.380859375, 2.66796875, 2.955078125, 3.2421875, 3.529296875, 3.81640625, 4.103515625, 4.390625, 4.677734375, 4.96484375, 5.251953125, 5.5390625, 5.826171875, 6.11328125, 6.400390625, 6.6875, 6.974609375, 7.26171875, 7.548828125, 7.8359375, 8.123046875, 8.41015625, 8.697265625, 8.984375, 9.271484375, 9.55859375, 9.845703125, 10.1328125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 6.0, 15.0, 21.0, 34.0, 36.0, 110.0, 262.0, 277.0, 105.0, 56.0, 36.0, 13.0, 13.0, 12.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.77734375, -5.52655029296875, -5.2757568359375, -5.02496337890625, -4.774169921875, -4.52337646484375, -4.2725830078125, -4.02178955078125, -3.77099609375, -3.52020263671875, -3.2694091796875, -3.01861572265625, -2.767822265625, -2.51702880859375, -2.2662353515625, -2.01544189453125, -1.7646484375, -1.51385498046875, -1.2630615234375, -1.01226806640625, -0.761474609375, -0.51068115234375, -0.2598876953125, -0.00909423828125, 0.24169921875, 0.49249267578125, 0.7432861328125, 0.99407958984375, 1.244873046875, 1.49566650390625, 1.7464599609375, 1.99725341796875, 2.248046875, 2.49884033203125, 2.7496337890625, 3.00042724609375, 3.251220703125, 3.50201416015625, 3.7528076171875, 4.00360107421875, 4.25439453125, 4.50518798828125, 4.7559814453125, 5.00677490234375, 5.257568359375, 5.50836181640625, 5.7591552734375, 6.00994873046875, 6.2607421875, 6.51153564453125, 6.7623291015625, 7.01312255859375, 7.263916015625, 7.51470947265625, 7.7655029296875, 8.01629638671875, 8.26708984375, 8.51788330078125, 8.7686767578125, 9.01947021484375, 9.270263671875, 9.52105712890625, 9.7718505859375, 10.02264404296875, 10.2734375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 11.0, 22.0, 29.0, 39.0, 74.0, 100.0, 85.0, 126.0, 127.0, 105.0, 86.0, 57.0, 43.0, 42.0, 15.0, 17.0, 11.0, 2.0, 2.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-76.4738998413086, -74.8022689819336, -73.1306381225586, -71.4590072631836, -69.7873764038086, -68.11575317382812, -66.44412231445312, -64.77249145507812, -63.100860595703125, -61.429229736328125, -59.757598876953125, -58.085968017578125, -56.41434097290039, -54.74271011352539, -53.07107925415039, -51.39944839477539, -49.72781753540039, -48.05618667602539, -46.38455581665039, -44.712928771972656, -43.041297912597656, -41.369667053222656, -39.698036193847656, -38.026405334472656, -36.354774475097656, -34.683143615722656, -33.011512756347656, -31.33988380432129, -29.668254852294922, -27.996623992919922, -26.324993133544922, -24.653362274169922, -22.981733322143555, -21.310102462768555, -19.638473510742188, -17.966842651367188, -16.295211791992188, -14.62358283996582, -12.95195198059082, -11.280322074890137, -9.608692169189453, -7.9370622634887695, -6.265431880950928, -4.593801498413086, -2.9221715927124023, -1.2505416870117188, 0.42108917236328125, 2.092719078063965, 3.7643489837646484, 5.435978889465332, 7.107609272003174, 8.779239654541016, 10.4508695602417, 12.122499465942383, 13.794130325317383, 15.465760231018066, 17.13739013671875, 18.80902099609375, 20.480649948120117, 22.152280807495117, 23.823909759521484, 25.495540618896484, 27.167171478271484, 28.838802337646484, 30.51043128967285]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 8.0, 7.0, 5.0, 12.0, 9.0, 8.0, 17.0, 13.0, 16.0, 17.0, 17.0, 21.0, 31.0, 26.0, 26.0, 38.0, 33.0, 38.0, 35.0, 35.0, 43.0, 33.0, 36.0, 42.0, 35.0, 42.0, 44.0, 36.0, 40.0, 31.0, 23.0, 26.0, 26.0, 21.0, 16.0, 23.0, 11.0, 5.0, 8.0, 12.0, 10.0, 8.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-21.107223510742188, -20.39971923828125, -19.69221305847168, -18.984708786010742, -18.277204513549805, -17.569700241088867, -16.862194061279297, -16.15468978881836, -15.447185516357422, -14.739680290222168, -14.03217601776123, -13.324670791625977, -12.617166519165039, -11.909661293029785, -11.202156066894531, -10.494651794433594, -9.78714656829834, -9.079641342163086, -8.372137069702148, -7.6646318435668945, -6.957127571105957, -6.249622344970703, -5.542117595672607, -4.834612846374512, -4.127108097076416, -3.4196033477783203, -2.7120985984802246, -2.00459361076355, -1.297088861465454, -0.5895841121673584, 0.1179208755493164, 0.8254256248474121, 1.5329303741455078, 2.2404351234436035, 2.947939872741699, 3.655444860458374, 4.362949371337891, 5.0704545974731445, 5.77795934677124, 6.485464096069336, 7.192968845367432, 7.900473594665527, 8.607978820800781, 9.315483093261719, 10.022988319396973, 10.73049259185791, 11.437997817993164, 12.145502090454102, 12.853007316589355, 13.56051254272461, 14.268016815185547, 14.9755220413208, 15.683026313781738, 16.390531539916992, 17.09803581237793, 17.8055419921875, 18.513046264648438, 19.220550537109375, 19.928056716918945, 20.635560989379883, 21.34306526184082, 22.050569534301758, 22.758075714111328, 23.465579986572266, 24.173084259033203]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 8.0, 9.0, 13.0, 16.0, 20.0, 37.0, 57.0, 92.0, 159.0, 274.0, 410.0, 727.0, 1486.0, 3699.0, 10051.0, 34874.0, 192257.0, 3596030.0, 289029.0, 44902.0, 12386.0, 4251.0, 1761.0, 799.0, 402.0, 216.0, 136.0, 56.0, 45.0, 30.0, 12.0, 14.0, 8.0, 7.0, 1.0, 5.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.4921875, -15.0167236328125, -14.541259765625, -14.0657958984375, -13.59033203125, -13.1148681640625, -12.639404296875, -12.1639404296875, -11.6884765625, -11.2130126953125, -10.737548828125, -10.2620849609375, -9.78662109375, -9.3111572265625, -8.835693359375, -8.3602294921875, -7.884765625, -7.4093017578125, -6.933837890625, -6.4583740234375, -5.98291015625, -5.5074462890625, -5.031982421875, -4.5565185546875, -4.0810546875, -3.6055908203125, -3.130126953125, -2.6546630859375, -2.17919921875, -1.7037353515625, -1.228271484375, -0.7528076171875, -0.27734375, 0.1981201171875, 0.673583984375, 1.1490478515625, 1.62451171875, 2.0999755859375, 2.575439453125, 3.0509033203125, 3.5263671875, 4.0018310546875, 4.477294921875, 4.9527587890625, 5.42822265625, 5.9036865234375, 6.379150390625, 6.8546142578125, 7.330078125, 7.8055419921875, 8.281005859375, 8.7564697265625, 9.23193359375, 9.7073974609375, 10.182861328125, 10.6583251953125, 11.1337890625, 11.6092529296875, 12.084716796875, 12.5601806640625, 13.03564453125, 13.5111083984375, 13.986572265625, 14.4620361328125, 14.9375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 1.0, 3.0, 2.0, 3.0, 0.0, 3.0, 7.0, 6.0, 8.0, 14.0, 16.0, 14.0, 16.0, 18.0, 24.0, 28.0, 24.0, 32.0, 32.0, 42.0, 38.0, 47.0, 40.0, 43.0, 57.0, 47.0, 41.0, 40.0, 42.0, 31.0, 37.0, 32.0, 35.0, 32.0, 25.0, 28.0, 19.0, 8.0, 16.0, 13.0, 12.0, 8.0, 13.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0], "bins": [-1.4755859375, -1.4363555908203125, -1.397125244140625, -1.3578948974609375, -1.31866455078125, -1.2794342041015625, -1.240203857421875, -1.2009735107421875, -1.1617431640625, -1.1225128173828125, -1.083282470703125, -1.0440521240234375, -1.00482177734375, -0.9655914306640625, -0.926361083984375, -0.8871307373046875, -0.847900390625, -0.8086700439453125, -0.769439697265625, -0.7302093505859375, -0.69097900390625, -0.6517486572265625, -0.612518310546875, -0.5732879638671875, -0.5340576171875, -0.4948272705078125, -0.455596923828125, -0.4163665771484375, -0.37713623046875, -0.3379058837890625, -0.298675537109375, -0.2594451904296875, -0.22021484375, -0.1809844970703125, -0.141754150390625, -0.1025238037109375, -0.06329345703125, -0.0240631103515625, 0.015167236328125, 0.0543975830078125, 0.0936279296875, 0.1328582763671875, 0.172088623046875, 0.2113189697265625, 0.25054931640625, 0.2897796630859375, 0.329010009765625, 0.3682403564453125, 0.407470703125, 0.4467010498046875, 0.485931396484375, 0.5251617431640625, 0.56439208984375, 0.6036224365234375, 0.642852783203125, 0.6820831298828125, 0.7213134765625, 0.7605438232421875, 0.799774169921875, 0.8390045166015625, 0.87823486328125, 0.9174652099609375, 0.956695556640625, 0.9959259033203125, 1.03515625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 5.0, 3.0, 3.0, 9.0, 10.0, 10.0, 20.0, 17.0, 25.0, 31.0, 48.0, 57.0, 83.0, 89.0, 152.0, 220.0, 449.0, 875.0, 1939.0, 4606.0, 12538.0, 39834.0, 169914.0, 2953870.0, 860391.0, 105110.0, 27757.0, 9193.0, 3614.0, 1610.0, 749.0, 399.0, 211.0, 124.0, 85.0, 50.0, 38.0, 34.0, 25.0, 27.0, 20.0, 11.0, 8.0, 10.0, 13.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2109375, -7.893310546875, -7.57568359375, -7.258056640625, -6.9404296875, -6.622802734375, -6.30517578125, -5.987548828125, -5.669921875, -5.352294921875, -5.03466796875, -4.717041015625, -4.3994140625, -4.081787109375, -3.76416015625, -3.446533203125, -3.12890625, -2.811279296875, -2.49365234375, -2.176025390625, -1.8583984375, -1.540771484375, -1.22314453125, -0.905517578125, -0.587890625, -0.270263671875, 0.04736328125, 0.364990234375, 0.6826171875, 1.000244140625, 1.31787109375, 1.635498046875, 1.953125, 2.270751953125, 2.58837890625, 2.906005859375, 3.2236328125, 3.541259765625, 3.85888671875, 4.176513671875, 4.494140625, 4.811767578125, 5.12939453125, 5.447021484375, 5.7646484375, 6.082275390625, 6.39990234375, 6.717529296875, 7.03515625, 7.352783203125, 7.67041015625, 7.988037109375, 8.3056640625, 8.623291015625, 8.94091796875, 9.258544921875, 9.576171875, 9.893798828125, 10.21142578125, 10.529052734375, 10.8466796875, 11.164306640625, 11.48193359375, 11.799560546875, 12.1171875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 8.0, 11.0, 14.0, 21.0, 31.0, 47.0, 58.0, 123.0, 206.0, 463.0, 1672.0, 706.0, 258.0, 147.0, 108.0, 67.0, 30.0, 29.0, 23.0, 13.0, 15.0, 7.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0], "bins": [-5.67578125, -5.542938232421875, -5.41009521484375, -5.277252197265625, -5.1444091796875, -5.011566162109375, -4.87872314453125, -4.745880126953125, -4.613037109375, -4.480194091796875, -4.34735107421875, -4.214508056640625, -4.0816650390625, -3.948822021484375, -3.81597900390625, -3.683135986328125, -3.55029296875, -3.417449951171875, -3.28460693359375, -3.151763916015625, -3.0189208984375, -2.886077880859375, -2.75323486328125, -2.620391845703125, -2.487548828125, -2.354705810546875, -2.22186279296875, -2.089019775390625, -1.9561767578125, -1.823333740234375, -1.69049072265625, -1.557647705078125, -1.4248046875, -1.291961669921875, -1.15911865234375, -1.026275634765625, -0.8934326171875, -0.760589599609375, -0.62774658203125, -0.494903564453125, -0.362060546875, -0.229217529296875, -0.09637451171875, 0.036468505859375, 0.1693115234375, 0.302154541015625, 0.43499755859375, 0.567840576171875, 0.70068359375, 0.833526611328125, 0.96636962890625, 1.099212646484375, 1.2320556640625, 1.364898681640625, 1.49774169921875, 1.630584716796875, 1.763427734375, 1.896270751953125, 2.02911376953125, 2.161956787109375, 2.2947998046875, 2.427642822265625, 2.56048583984375, 2.693328857421875, 2.826171875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 7.0, 11.0, 9.0, 19.0, 28.0, 56.0, 56.0, 73.0, 104.0, 129.0, 123.0, 100.0, 75.0, 63.0, 50.0, 37.0, 19.0, 8.0, 14.0, 7.0, 7.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.434711456298828, -20.738893508911133, -20.043075561523438, -19.347257614135742, -18.651439666748047, -17.95562171936035, -17.259803771972656, -16.56398582458496, -15.868167877197266, -15.17234992980957, -14.476531982421875, -13.78071403503418, -13.084896087646484, -12.389078140258789, -11.693260192871094, -10.997442245483398, -10.301623344421387, -9.605805397033691, -8.909987449645996, -8.2141695022583, -7.5183515548706055, -6.82253360748291, -6.126715183258057, -5.430897235870361, -4.735079288482666, -4.039261341094971, -3.3434433937072754, -2.647625207901001, -1.9518072605133057, -1.2559893131256104, -0.5601711273193359, 0.13564682006835938, 0.8314647674560547, 1.52728271484375, 2.2231006622314453, 2.9189188480377197, 3.614736795425415, 4.310554504394531, 5.006372928619385, 5.70219087600708, 6.398008823394775, 7.093826770782471, 7.789644718170166, 8.48546314239502, 9.181281089782715, 9.87709903717041, 10.572916984558105, 11.2687349319458, 11.964552879333496, 12.660370826721191, 13.356188774108887, 14.052006721496582, 14.747824668884277, 15.443642616271973, 16.139461517333984, 16.83527946472168, 17.531097412109375, 18.22691535949707, 18.922733306884766, 19.61855125427246, 20.314369201660156, 21.01018714904785, 21.706005096435547, 22.401823043823242, 23.097640991210938]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 6.0, 10.0, 19.0, 15.0, 6.0, 17.0, 19.0, 27.0, 32.0, 36.0, 37.0, 36.0, 54.0, 50.0, 43.0, 67.0, 44.0, 46.0, 62.0, 48.0, 53.0, 56.0, 37.0, 29.0, 23.0, 28.0, 19.0, 16.0, 16.0, 10.0, 12.0, 13.0, 7.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.550453186035156, -13.124029159545898, -12.69760513305664, -12.2711820602417, -11.844758033752441, -11.418334007263184, -10.991910934448242, -10.565486907958984, -10.139062881469727, -9.712638854980469, -9.286214828491211, -8.85979175567627, -8.433367729187012, -8.006943702697754, -7.580520153045654, -7.154096603393555, -6.727672576904297, -6.301248550415039, -5.8748250007629395, -5.44840145111084, -5.021977424621582, -4.595553398132324, -4.169129848480225, -3.742706060409546, -3.316282272338867, -2.8898584842681885, -2.4634346961975098, -2.037010908126831, -1.6105871200561523, -1.1841633319854736, -0.7577395439147949, -0.3313157558441162, 0.0951080322265625, 0.5215318202972412, 0.9479556083679199, 1.3743793964385986, 1.8008031845092773, 2.227226972579956, 2.6536507606506348, 3.0800745487213135, 3.506498336791992, 3.932922124862671, 4.35934591293335, 4.785769462585449, 5.212193489074707, 5.638617515563965, 6.0650410652160645, 6.491464614868164, 6.917888641357422, 7.34431266784668, 7.770736217498779, 8.197159767150879, 8.623583793640137, 9.050007820129395, 9.476430892944336, 9.902854919433594, 10.329278945922852, 10.75570297241211, 11.182126998901367, 11.608550071716309, 12.034974098205566, 12.461398124694824, 12.887821197509766, 13.314245223999023, 13.740669250488281]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 5.0, 5.0, 12.0, 8.0, 12.0, 23.0, 30.0, 48.0, 79.0, 104.0, 174.0, 263.0, 452.0, 766.0, 1448.0, 2839.0, 6367.0, 14530.0, 35971.0, 90977.0, 250789.0, 396697.0, 147966.0, 57504.0, 23087.0, 9499.0, 4191.0, 2022.0, 1095.0, 597.0, 343.0, 222.0, 112.0, 99.0, 70.0, 57.0, 30.0, 21.0, 9.0, 7.0, 5.0, 10.0, 6.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1796875, -6.916259765625, -6.65283203125, -6.389404296875, -6.1259765625, -5.862548828125, -5.59912109375, -5.335693359375, -5.072265625, -4.808837890625, -4.54541015625, -4.281982421875, -4.0185546875, -3.755126953125, -3.49169921875, -3.228271484375, -2.96484375, -2.701416015625, -2.43798828125, -2.174560546875, -1.9111328125, -1.647705078125, -1.38427734375, -1.120849609375, -0.857421875, -0.593994140625, -0.33056640625, -0.067138671875, 0.1962890625, 0.459716796875, 0.72314453125, 0.986572265625, 1.25, 1.513427734375, 1.77685546875, 2.040283203125, 2.3037109375, 2.567138671875, 2.83056640625, 3.093994140625, 3.357421875, 3.620849609375, 3.88427734375, 4.147705078125, 4.4111328125, 4.674560546875, 4.93798828125, 5.201416015625, 5.46484375, 5.728271484375, 5.99169921875, 6.255126953125, 6.5185546875, 6.781982421875, 7.04541015625, 7.308837890625, 7.572265625, 7.835693359375, 8.09912109375, 8.362548828125, 8.6259765625, 8.889404296875, 9.15283203125, 9.416259765625, 9.6796875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 5.0, 7.0, 11.0, 7.0, 9.0, 13.0, 12.0, 11.0, 16.0, 12.0, 33.0, 35.0, 34.0, 33.0, 39.0, 39.0, 44.0, 54.0, 55.0, 53.0, 54.0, 45.0, 28.0, 50.0, 47.0, 32.0, 33.0, 32.0, 27.0, 14.0, 24.0, 14.0, 15.0, 12.0, 14.0, 15.0, 5.0, 8.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5771484375, -1.531494140625, -1.48583984375, -1.440185546875, -1.39453125, -1.348876953125, -1.30322265625, -1.257568359375, -1.2119140625, -1.166259765625, -1.12060546875, -1.074951171875, -1.029296875, -0.983642578125, -0.93798828125, -0.892333984375, -0.8466796875, -0.801025390625, -0.75537109375, -0.709716796875, -0.6640625, -0.618408203125, -0.57275390625, -0.527099609375, -0.4814453125, -0.435791015625, -0.39013671875, -0.344482421875, -0.298828125, -0.253173828125, -0.20751953125, -0.161865234375, -0.1162109375, -0.070556640625, -0.02490234375, 0.020751953125, 0.06640625, 0.112060546875, 0.15771484375, 0.203369140625, 0.2490234375, 0.294677734375, 0.34033203125, 0.385986328125, 0.431640625, 0.477294921875, 0.52294921875, 0.568603515625, 0.6142578125, 0.659912109375, 0.70556640625, 0.751220703125, 0.796875, 0.842529296875, 0.88818359375, 0.933837890625, 0.9794921875, 1.025146484375, 1.07080078125, 1.116455078125, 1.162109375, 1.207763671875, 1.25341796875, 1.299072265625, 1.3447265625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 8.0, 6.0, 5.0, 6.0, 12.0, 14.0, 21.0, 27.0, 37.0, 65.0, 81.0, 123.0, 186.0, 267.0, 416.0, 788.0, 1670.0, 5304.0, 20932.0, 91404.0, 447253.0, 377218.0, 76953.0, 17771.0, 4573.0, 1530.0, 728.0, 412.0, 228.0, 156.0, 106.0, 83.0, 61.0, 27.0, 29.0, 25.0, 11.0, 9.0, 9.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.2421875, -9.9404296875, -9.638671875, -9.3369140625, -9.03515625, -8.7333984375, -8.431640625, -8.1298828125, -7.828125, -7.5263671875, -7.224609375, -6.9228515625, -6.62109375, -6.3193359375, -6.017578125, -5.7158203125, -5.4140625, -5.1123046875, -4.810546875, -4.5087890625, -4.20703125, -3.9052734375, -3.603515625, -3.3017578125, -3.0, -2.6982421875, -2.396484375, -2.0947265625, -1.79296875, -1.4912109375, -1.189453125, -0.8876953125, -0.5859375, -0.2841796875, 0.017578125, 0.3193359375, 0.62109375, 0.9228515625, 1.224609375, 1.5263671875, 1.828125, 2.1298828125, 2.431640625, 2.7333984375, 3.03515625, 3.3369140625, 3.638671875, 3.9404296875, 4.2421875, 4.5439453125, 4.845703125, 5.1474609375, 5.44921875, 5.7509765625, 6.052734375, 6.3544921875, 6.65625, 6.9580078125, 7.259765625, 7.5615234375, 7.86328125, 8.1650390625, 8.466796875, 8.7685546875, 9.0703125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 3.0, 9.0, 5.0, 7.0, 8.0, 13.0, 20.0, 22.0, 15.0, 23.0, 32.0, 31.0, 35.0, 25.0, 35.0, 45.0, 47.0, 45.0, 50.0, 50.0, 40.0, 54.0, 41.0, 47.0, 49.0, 32.0, 37.0, 16.0, 30.0, 28.0, 18.0, 9.0, 16.0, 14.0, 11.0, 8.0, 8.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.09375, -5.8922119140625, -5.690673828125, -5.4891357421875, -5.28759765625, -5.0860595703125, -4.884521484375, -4.6829833984375, -4.4814453125, -4.2799072265625, -4.078369140625, -3.8768310546875, -3.67529296875, -3.4737548828125, -3.272216796875, -3.0706787109375, -2.869140625, -2.6676025390625, -2.466064453125, -2.2645263671875, -2.06298828125, -1.8614501953125, -1.659912109375, -1.4583740234375, -1.2568359375, -1.0552978515625, -0.853759765625, -0.6522216796875, -0.45068359375, -0.2491455078125, -0.047607421875, 0.1539306640625, 0.35546875, 0.5570068359375, 0.758544921875, 0.9600830078125, 1.16162109375, 1.3631591796875, 1.564697265625, 1.7662353515625, 1.9677734375, 2.1693115234375, 2.370849609375, 2.5723876953125, 2.77392578125, 2.9754638671875, 3.177001953125, 3.3785400390625, 3.580078125, 3.7816162109375, 3.983154296875, 4.1846923828125, 4.38623046875, 4.5877685546875, 4.789306640625, 4.9908447265625, 5.1923828125, 5.3939208984375, 5.595458984375, 5.7969970703125, 5.99853515625, 6.2000732421875, 6.401611328125, 6.6031494140625, 6.8046875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 13.0, 12.0, 27.0, 51.0, 113.0, 207.0, 510.0, 1514.0, 5573.0, 29754.0, 258248.0, 656570.0, 80028.0, 11747.0, 2672.0, 883.0, 334.0, 147.0, 68.0, 39.0, 14.0, 10.0, 6.0, 8.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8984375, -7.7021484375, -7.505859375, -7.3095703125, -7.11328125, -6.9169921875, -6.720703125, -6.5244140625, -6.328125, -6.1318359375, -5.935546875, -5.7392578125, -5.54296875, -5.3466796875, -5.150390625, -4.9541015625, -4.7578125, -4.5615234375, -4.365234375, -4.1689453125, -3.97265625, -3.7763671875, -3.580078125, -3.3837890625, -3.1875, -2.9912109375, -2.794921875, -2.5986328125, -2.40234375, -2.2060546875, -2.009765625, -1.8134765625, -1.6171875, -1.4208984375, -1.224609375, -1.0283203125, -0.83203125, -0.6357421875, -0.439453125, -0.2431640625, -0.046875, 0.1494140625, 0.345703125, 0.5419921875, 0.73828125, 0.9345703125, 1.130859375, 1.3271484375, 1.5234375, 1.7197265625, 1.916015625, 2.1123046875, 2.30859375, 2.5048828125, 2.701171875, 2.8974609375, 3.09375, 3.2900390625, 3.486328125, 3.6826171875, 3.87890625, 4.0751953125, 4.271484375, 4.4677734375, 4.6640625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 10.0, 8.0, 20.0, 16.0, 19.0, 24.0, 26.0, 41.0, 51.0, 61.0, 95.0, 116.0, 113.0, 92.0, 71.0, 47.0, 30.0, 28.0, 29.0, 24.0, 14.0, 15.0, 11.0, 9.0, 7.0, 4.0, 1.0, 7.0, 0.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0007457733154296875, -0.0007266029715538025, -0.0007074326276779175, -0.0006882622838020325, -0.0006690919399261475, -0.0006499215960502625, -0.0006307512521743774, -0.0006115809082984924, -0.0005924105644226074, -0.0005732402205467224, -0.0005540698766708374, -0.0005348995327949524, -0.0005157291889190674, -0.0004965588450431824, -0.00047738850116729736, -0.00045821815729141235, -0.00043904781341552734, -0.00041987746953964233, -0.0004007071256637573, -0.0003815367817878723, -0.0003623664379119873, -0.0003431960940361023, -0.0003240257501602173, -0.0003048554062843323, -0.00028568506240844727, -0.00026651471853256226, -0.00024734437465667725, -0.00022817403078079224, -0.00020900368690490723, -0.00018983334302902222, -0.0001706629991531372, -0.0001514926552772522, -0.0001323223114013672, -0.00011315196752548218, -9.398162364959717e-05, -7.481127977371216e-05, -5.564093589782715e-05, -3.647059202194214e-05, -1.730024814605713e-05, 1.8700957298278809e-06, 2.104043960571289e-05, 4.02107834815979e-05, 5.938112735748291e-05, 7.855147123336792e-05, 9.772181510925293e-05, 0.00011689215898513794, 0.00013606250286102295, 0.00015523284673690796, 0.00017440319061279297, 0.00019357353448867798, 0.000212743878364563, 0.000231914222240448, 0.000251084566116333, 0.000270254909992218, 0.00028942525386810303, 0.00030859559774398804, 0.00032776594161987305, 0.00034693628549575806, 0.00036610662937164307, 0.0003852769732475281, 0.0004044473171234131, 0.0004236176609992981, 0.0004427880048751831, 0.0004619583487510681, 0.0004811286926269531]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 6.0, 7.0, 9.0, 49.0, 82.0, 193.0, 501.0, 2342.0, 49419.0, 938054.0, 54575.0, 2494.0, 523.0, 163.0, 78.0, 31.0, 18.0, 6.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9375, -6.517333984375, -6.09716796875, -5.677001953125, -5.2568359375, -4.836669921875, -4.41650390625, -3.996337890625, -3.576171875, -3.156005859375, -2.73583984375, -2.315673828125, -1.8955078125, -1.475341796875, -1.05517578125, -0.635009765625, -0.21484375, 0.205322265625, 0.62548828125, 1.045654296875, 1.4658203125, 1.885986328125, 2.30615234375, 2.726318359375, 3.146484375, 3.566650390625, 3.98681640625, 4.406982421875, 4.8271484375, 5.247314453125, 5.66748046875, 6.087646484375, 6.5078125, 6.927978515625, 7.34814453125, 7.768310546875, 8.1884765625, 8.608642578125, 9.02880859375, 9.448974609375, 9.869140625, 10.289306640625, 10.70947265625, 11.129638671875, 11.5498046875, 11.969970703125, 12.39013671875, 12.810302734375, 13.23046875, 13.650634765625, 14.07080078125, 14.490966796875, 14.9111328125, 15.331298828125, 15.75146484375, 16.171630859375, 16.591796875, 17.011962890625, 17.43212890625, 17.852294921875, 18.2724609375, 18.692626953125, 19.11279296875, 19.532958984375, 19.953125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 12.0, 10.0, 15.0, 26.0, 33.0, 46.0, 77.0, 107.0, 132.0, 150.0, 109.0, 97.0, 69.0, 46.0, 25.0, 14.0, 9.0, 12.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.283203125, -3.092987060546875, -2.90277099609375, -2.712554931640625, -2.5223388671875, -2.332122802734375, -2.14190673828125, -1.951690673828125, -1.761474609375, -1.571258544921875, -1.38104248046875, -1.190826416015625, -1.0006103515625, -0.810394287109375, -0.62017822265625, -0.429962158203125, -0.23974609375, -0.049530029296875, 0.14068603515625, 0.330902099609375, 0.5211181640625, 0.711334228515625, 0.90155029296875, 1.091766357421875, 1.281982421875, 1.472198486328125, 1.66241455078125, 1.852630615234375, 2.0428466796875, 2.233062744140625, 2.42327880859375, 2.613494873046875, 2.8037109375, 2.993927001953125, 3.18414306640625, 3.374359130859375, 3.5645751953125, 3.754791259765625, 3.94500732421875, 4.135223388671875, 4.325439453125, 4.515655517578125, 4.70587158203125, 4.896087646484375, 5.0863037109375, 5.276519775390625, 5.46673583984375, 5.656951904296875, 5.84716796875, 6.037384033203125, 6.22760009765625, 6.417816162109375, 6.6080322265625, 6.798248291015625, 6.98846435546875, 7.178680419921875, 7.368896484375, 7.559112548828125, 7.74932861328125, 7.939544677734375, 8.1297607421875, 8.319976806640625, 8.51019287109375, 8.700408935546875, 8.890625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 10.0, 10.0, 14.0, 26.0, 37.0, 51.0, 58.0, 82.0, 114.0, 110.0, 117.0, 92.0, 81.0, 60.0, 50.0, 33.0, 22.0, 11.0, 13.0, 8.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.5157470703125, -42.79899597167969, -41.08224868774414, -39.36549758911133, -37.64875030517578, -35.93199920654297, -34.215248107910156, -32.49850082397461, -30.78175163269043, -29.06500244140625, -27.34825325012207, -25.63150405883789, -23.914752960205078, -22.19800567626953, -20.48125457763672, -18.76450538635254, -17.04775619506836, -15.33100700378418, -13.6142578125, -11.897507667541504, -10.180758476257324, -8.464009284973145, -6.747259140014648, -5.030509948730469, -3.313760757446289, -1.5970113277435303, 0.11973810195922852, 1.8364877700805664, 3.553236961364746, 5.269986152648926, 6.986736297607422, 8.703485488891602, 10.420234680175781, 12.136983871459961, 13.85373306274414, 15.570483207702637, 17.2872314453125, 19.003982543945312, 20.720731735229492, 22.437480926513672, 24.15423011779785, 25.87097930908203, 27.58772850036621, 29.30447769165039, 31.021228790283203, 32.73797607421875, 34.45472717285156, 36.171478271484375, 37.88822555541992, 39.604976654052734, 41.32172393798828, 43.038475036621094, 44.75522232055664, 46.47197341918945, 48.188720703125, 49.90547180175781, 51.622222900390625, 53.33897399902344, 55.055721282958984, 56.7724723815918, 58.489219665527344, 60.205970764160156, 61.92272186279297, 63.639469146728516, 65.35621643066406]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 7.0, 6.0, 6.0, 14.0, 13.0, 5.0, 23.0, 21.0, 24.0, 32.0, 21.0, 27.0, 47.0, 34.0, 33.0, 23.0, 45.0, 44.0, 49.0, 36.0, 40.0, 48.0, 35.0, 38.0, 48.0, 28.0, 38.0, 41.0, 26.0, 26.0, 17.0, 16.0, 14.0, 14.0, 11.0, 11.0, 8.0, 5.0, 10.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-42.68281555175781, -41.5468864440918, -40.41095733642578, -39.27503204345703, -38.139102935791016, -37.003173828125, -35.867244720458984, -34.73131561279297, -33.59539031982422, -32.4594612121582, -31.32353401184082, -30.187604904174805, -29.051677703857422, -27.915748596191406, -26.77981948852539, -25.643890380859375, -24.50796127319336, -23.372032165527344, -22.23610496520996, -21.100175857543945, -19.964248657226562, -18.828319549560547, -17.69239044189453, -16.556461334228516, -15.420534133911133, -14.284605979919434, -13.148677825927734, -12.012748718261719, -10.87682056427002, -9.74089241027832, -8.604963302612305, -7.4690351486206055, -6.333110809326172, -5.197182655334473, -4.061254024505615, -2.925325632095337, -1.7893972396850586, -0.6534690856933594, 0.48245954513549805, 1.6183881759643555, 2.7543163299560547, 3.890244722366333, 5.026173114776611, 6.162101745605469, 7.298029899597168, 8.433958053588867, 9.569887161254883, 10.705815315246582, 11.841743469238281, 12.97767162322998, 14.11359977722168, 15.249528884887695, 16.385456085205078, 17.521385192871094, 18.65731430053711, 19.793243408203125, 20.929170608520508, 22.065099716186523, 23.201026916503906, 24.336956024169922, 25.472885131835938, 26.60881233215332, 27.744741439819336, 28.88066864013672, 30.016597747802734]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 6.0, 12.0, 7.0, 16.0, 18.0, 21.0, 37.0, 80.0, 81.0, 165.0, 247.0, 482.0, 854.0, 1706.0, 4379.0, 12456.0, 50249.0, 373499.0, 3490387.0, 207487.0, 35851.0, 9882.0, 3476.0, 1454.0, 647.0, 340.0, 176.0, 92.0, 57.0, 48.0, 29.0, 12.0, 6.0, 4.0, 4.0, 3.0, 4.0, 0.0, 4.0, 4.0, 2.0, 2.0, 1.0], "bins": [-16.671875, -16.24853515625, -15.8251953125, -15.40185546875, -14.978515625, -14.55517578125, -14.1318359375, -13.70849609375, -13.28515625, -12.86181640625, -12.4384765625, -12.01513671875, -11.591796875, -11.16845703125, -10.7451171875, -10.32177734375, -9.8984375, -9.47509765625, -9.0517578125, -8.62841796875, -8.205078125, -7.78173828125, -7.3583984375, -6.93505859375, -6.51171875, -6.08837890625, -5.6650390625, -5.24169921875, -4.818359375, -4.39501953125, -3.9716796875, -3.54833984375, -3.125, -2.70166015625, -2.2783203125, -1.85498046875, -1.431640625, -1.00830078125, -0.5849609375, -0.16162109375, 0.26171875, 0.68505859375, 1.1083984375, 1.53173828125, 1.955078125, 2.37841796875, 2.8017578125, 3.22509765625, 3.6484375, 4.07177734375, 4.4951171875, 4.91845703125, 5.341796875, 5.76513671875, 6.1884765625, 6.61181640625, 7.03515625, 7.45849609375, 7.8818359375, 8.30517578125, 8.728515625, 9.15185546875, 9.5751953125, 9.99853515625, 10.421875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 6.0, 5.0, 11.0, 11.0, 14.0, 11.0, 19.0, 25.0, 32.0, 27.0, 23.0, 34.0, 41.0, 45.0, 40.0, 45.0, 44.0, 60.0, 48.0, 38.0, 42.0, 47.0, 28.0, 47.0, 39.0, 34.0, 37.0, 21.0, 23.0, 21.0, 17.0, 10.0, 13.0, 10.0, 8.0, 6.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6142578125, -1.56805419921875, -1.5218505859375, -1.47564697265625, -1.429443359375, -1.38323974609375, -1.3370361328125, -1.29083251953125, -1.24462890625, -1.19842529296875, -1.1522216796875, -1.10601806640625, -1.059814453125, -1.01361083984375, -0.9674072265625, -0.92120361328125, -0.875, -0.82879638671875, -0.7825927734375, -0.73638916015625, -0.690185546875, -0.64398193359375, -0.5977783203125, -0.55157470703125, -0.50537109375, -0.45916748046875, -0.4129638671875, -0.36676025390625, -0.320556640625, -0.27435302734375, -0.2281494140625, -0.18194580078125, -0.1357421875, -0.08953857421875, -0.0433349609375, 0.00286865234375, 0.049072265625, 0.09527587890625, 0.1414794921875, 0.18768310546875, 0.23388671875, 0.28009033203125, 0.3262939453125, 0.37249755859375, 0.418701171875, 0.46490478515625, 0.5111083984375, 0.55731201171875, 0.603515625, 0.64971923828125, 0.6959228515625, 0.74212646484375, 0.788330078125, 0.83453369140625, 0.8807373046875, 0.92694091796875, 0.97314453125, 1.01934814453125, 1.0655517578125, 1.11175537109375, 1.157958984375, 1.20416259765625, 1.2503662109375, 1.29656982421875, 1.3427734375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 2.0, 2.0, 5.0, 3.0, 17.0, 27.0, 24.0, 69.0, 79.0, 166.0, 330.0, 741.0, 1504.0, 3991.0, 12390.0, 50962.0, 331476.0, 3295595.0, 416308.0, 59155.0, 13937.0, 4262.0, 1705.0, 721.0, 376.0, 181.0, 112.0, 68.0, 27.0, 25.0, 17.0, 9.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.66796875, -6.34344482421875, -6.0189208984375, -5.69439697265625, -5.369873046875, -5.04534912109375, -4.7208251953125, -4.39630126953125, -4.07177734375, -3.74725341796875, -3.4227294921875, -3.09820556640625, -2.773681640625, -2.44915771484375, -2.1246337890625, -1.80010986328125, -1.4755859375, -1.15106201171875, -0.8265380859375, -0.50201416015625, -0.177490234375, 0.14703369140625, 0.4715576171875, 0.79608154296875, 1.12060546875, 1.44512939453125, 1.7696533203125, 2.09417724609375, 2.418701171875, 2.74322509765625, 3.0677490234375, 3.39227294921875, 3.716796875, 4.04132080078125, 4.3658447265625, 4.69036865234375, 5.014892578125, 5.33941650390625, 5.6639404296875, 5.98846435546875, 6.31298828125, 6.63751220703125, 6.9620361328125, 7.28656005859375, 7.611083984375, 7.93560791015625, 8.2601318359375, 8.58465576171875, 8.9091796875, 9.23370361328125, 9.5582275390625, 9.88275146484375, 10.207275390625, 10.53179931640625, 10.8563232421875, 11.18084716796875, 11.50537109375, 11.82989501953125, 12.1544189453125, 12.47894287109375, 12.803466796875, 13.12799072265625, 13.4525146484375, 13.77703857421875, 14.1015625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 3.0, 8.0, 7.0, 12.0, 22.0, 9.0, 25.0, 25.0, 42.0, 60.0, 74.0, 113.0, 189.0, 265.0, 442.0, 1049.0, 690.0, 355.0, 218.0, 132.0, 101.0, 67.0, 43.0, 30.0, 21.0, 23.0, 16.0, 5.0, 6.0, 8.0, 2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.197265625, -3.08612060546875, -2.9749755859375, -2.86383056640625, -2.752685546875, -2.64154052734375, -2.5303955078125, -2.41925048828125, -2.30810546875, -2.19696044921875, -2.0858154296875, -1.97467041015625, -1.863525390625, -1.75238037109375, -1.6412353515625, -1.53009033203125, -1.4189453125, -1.30780029296875, -1.1966552734375, -1.08551025390625, -0.974365234375, -0.86322021484375, -0.7520751953125, -0.64093017578125, -0.52978515625, -0.41864013671875, -0.3074951171875, -0.19635009765625, -0.085205078125, 0.02593994140625, 0.1370849609375, 0.24822998046875, 0.359375, 0.47052001953125, 0.5816650390625, 0.69281005859375, 0.803955078125, 0.91510009765625, 1.0262451171875, 1.13739013671875, 1.24853515625, 1.35968017578125, 1.4708251953125, 1.58197021484375, 1.693115234375, 1.80426025390625, 1.9154052734375, 2.02655029296875, 2.1376953125, 2.24884033203125, 2.3599853515625, 2.47113037109375, 2.582275390625, 2.69342041015625, 2.8045654296875, 2.91571044921875, 3.02685546875, 3.13800048828125, 3.2491455078125, 3.36029052734375, 3.471435546875, 3.58258056640625, 3.6937255859375, 3.80487060546875, 3.916015625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 11.0, 20.0, 38.0, 76.0, 139.0, 207.0, 210.0, 160.0, 82.0, 33.0, 22.0, 4.0, 1.0, 5.0, 0.0, 1.0, 2.0], "bins": [-87.8337173461914, -86.1816177368164, -84.5295181274414, -82.8774185180664, -81.2253189086914, -79.57321166992188, -77.92111206054688, -76.26901245117188, -74.61691284179688, -72.96481323242188, -71.31271362304688, -69.66061401367188, -68.00851440429688, -66.35641479492188, -64.70430755615234, -63.052207946777344, -61.400108337402344, -59.748008728027344, -58.095909118652344, -56.44380569458008, -54.79170608520508, -53.13960647583008, -51.48750686645508, -49.83540344238281, -48.18330764770508, -46.53120803833008, -44.87910842895508, -43.22700500488281, -41.57490539550781, -39.92280578613281, -38.27070617675781, -36.61860656738281, -34.96650695800781, -33.31440734863281, -31.66230583190918, -30.01020622253418, -28.358104705810547, -26.706005096435547, -25.053905487060547, -23.401803970336914, -21.74970245361328, -20.09760284423828, -18.44550132751465, -16.79340171813965, -15.141300201416016, -13.489200592041016, -11.8371000289917, -10.184999465942383, -8.53289794921875, -6.880797386169434, -5.228696823120117, -3.576596736907959, -1.9244961738586426, -0.2723960876464844, 1.379704475402832, 3.0318050384521484, 4.683905601501465, 6.336006164550781, 7.988106727600098, 9.640207290649414, 11.292306900024414, 12.94440746307373, 14.596508026123047, 16.248607635498047, 17.90070915222168]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 10.0, 6.0, 7.0, 7.0, 13.0, 14.0, 12.0, 15.0, 20.0, 29.0, 25.0, 29.0, 32.0, 30.0, 37.0, 26.0, 35.0, 41.0, 43.0, 32.0, 46.0, 35.0, 46.0, 50.0, 41.0, 31.0, 32.0, 25.0, 38.0, 23.0, 31.0, 21.0, 16.0, 12.0, 11.0, 18.0, 14.0, 13.0, 7.0, 10.0, 5.0, 2.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.038463592529297, -13.638751029968262, -13.239038467407227, -12.839326858520508, -12.439614295959473, -12.039901733398438, -11.640189170837402, -11.240476608276367, -10.840764999389648, -10.441052436828613, -10.041339874267578, -9.64162826538086, -9.241915702819824, -8.842203140258789, -8.442490577697754, -8.042778015136719, -7.643065452575684, -7.243352890014648, -6.8436408042907715, -6.443928241729736, -6.044216156005859, -5.644503593444824, -5.244791030883789, -4.845078468322754, -4.445366382598877, -4.045653820037842, -3.645941734313965, -3.2462291717529297, -2.8465168476104736, -2.4468045234680176, -2.0470919609069824, -1.6473796367645264, -1.2476673126220703, -0.8479549288749695, -0.44824254512786865, -0.04853010177612305, 0.351182222366333, 0.7508945465087891, 1.1506071090698242, 1.5503194332122803, 1.9500317573547363, 2.3497440814971924, 2.7494564056396484, 3.1491689682006836, 3.5488812923431396, 3.9485936164855957, 4.348306179046631, 4.748018264770508, 5.147730827331543, 5.547443389892578, 5.947155475616455, 6.34686803817749, 6.746580123901367, 7.146292686462402, 7.5460052490234375, 7.945717811584473, 8.345430374145508, 8.745142936706543, 9.144855499267578, 9.544567108154297, 9.944279670715332, 10.343992233276367, 10.743704795837402, 11.143417358398438, 11.543128967285156]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 6.0, 8.0, 11.0, 12.0, 30.0, 30.0, 51.0, 65.0, 116.0, 153.0, 253.0, 419.0, 711.0, 1415.0, 2674.0, 5949.0, 14676.0, 40940.0, 126907.0, 314780.0, 328723.0, 137671.0, 44757.0, 15942.0, 6259.0, 2847.0, 1348.0, 711.0, 393.0, 273.0, 135.0, 79.0, 65.0, 46.0, 30.0, 21.0, 16.0, 12.0, 6.0, 6.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.47265625, -6.22406005859375, -5.9754638671875, -5.72686767578125, -5.478271484375, -5.22967529296875, -4.9810791015625, -4.73248291015625, -4.48388671875, -4.23529052734375, -3.9866943359375, -3.73809814453125, -3.489501953125, -3.24090576171875, -2.9923095703125, -2.74371337890625, -2.4951171875, -2.24652099609375, -1.9979248046875, -1.74932861328125, -1.500732421875, -1.25213623046875, -1.0035400390625, -0.75494384765625, -0.50634765625, -0.25775146484375, -0.0091552734375, 0.23944091796875, 0.488037109375, 0.73663330078125, 0.9852294921875, 1.23382568359375, 1.482421875, 1.73101806640625, 1.9796142578125, 2.22821044921875, 2.476806640625, 2.72540283203125, 2.9739990234375, 3.22259521484375, 3.47119140625, 3.71978759765625, 3.9683837890625, 4.21697998046875, 4.465576171875, 4.71417236328125, 4.9627685546875, 5.21136474609375, 5.4599609375, 5.70855712890625, 5.9571533203125, 6.20574951171875, 6.454345703125, 6.70294189453125, 6.9515380859375, 7.20013427734375, 7.44873046875, 7.69732666015625, 7.9459228515625, 8.19451904296875, 8.443115234375, 8.69171142578125, 8.9403076171875, 9.18890380859375, 9.4375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 8.0, 7.0, 10.0, 5.0, 10.0, 12.0, 15.0, 21.0, 23.0, 29.0, 35.0, 40.0, 28.0, 38.0, 38.0, 34.0, 54.0, 61.0, 45.0, 51.0, 49.0, 52.0, 48.0, 39.0, 43.0, 32.0, 29.0, 28.0, 26.0, 20.0, 18.0, 7.0, 12.0, 7.0, 10.0, 9.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.021484375, -1.9703369140625, -1.919189453125, -1.8680419921875, -1.81689453125, -1.7657470703125, -1.714599609375, -1.6634521484375, -1.6123046875, -1.5611572265625, -1.510009765625, -1.4588623046875, -1.40771484375, -1.3565673828125, -1.305419921875, -1.2542724609375, -1.203125, -1.1519775390625, -1.100830078125, -1.0496826171875, -0.99853515625, -0.9473876953125, -0.896240234375, -0.8450927734375, -0.7939453125, -0.7427978515625, -0.691650390625, -0.6405029296875, -0.58935546875, -0.5382080078125, -0.487060546875, -0.4359130859375, -0.384765625, -0.3336181640625, -0.282470703125, -0.2313232421875, -0.18017578125, -0.1290283203125, -0.077880859375, -0.0267333984375, 0.0244140625, 0.0755615234375, 0.126708984375, 0.1778564453125, 0.22900390625, 0.2801513671875, 0.331298828125, 0.3824462890625, 0.43359375, 0.4847412109375, 0.535888671875, 0.5870361328125, 0.63818359375, 0.6893310546875, 0.740478515625, 0.7916259765625, 0.8427734375, 0.8939208984375, 0.945068359375, 0.9962158203125, 1.04736328125, 1.0985107421875, 1.149658203125, 1.2008056640625, 1.251953125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 8.0, 6.0, 9.0, 9.0, 14.0, 20.0, 18.0, 28.0, 39.0, 55.0, 69.0, 106.0, 144.0, 195.0, 316.0, 462.0, 821.0, 1603.0, 3569.0, 10018.0, 32570.0, 120278.0, 390919.0, 345223.0, 99688.0, 27112.0, 8450.0, 3055.0, 1370.0, 781.0, 479.0, 341.0, 225.0, 152.0, 106.0, 79.0, 61.0, 39.0, 33.0, 25.0, 16.0, 14.0, 9.0, 7.0, 4.0, 2.0, 3.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-8.078125, -7.84002685546875, -7.6019287109375, -7.36383056640625, -7.125732421875, -6.88763427734375, -6.6495361328125, -6.41143798828125, -6.17333984375, -5.93524169921875, -5.6971435546875, -5.45904541015625, -5.220947265625, -4.98284912109375, -4.7447509765625, -4.50665283203125, -4.2685546875, -4.03045654296875, -3.7923583984375, -3.55426025390625, -3.316162109375, -3.07806396484375, -2.8399658203125, -2.60186767578125, -2.36376953125, -2.12567138671875, -1.8875732421875, -1.64947509765625, -1.411376953125, -1.17327880859375, -0.9351806640625, -0.69708251953125, -0.458984375, -0.22088623046875, 0.0172119140625, 0.25531005859375, 0.493408203125, 0.73150634765625, 0.9696044921875, 1.20770263671875, 1.44580078125, 1.68389892578125, 1.9219970703125, 2.16009521484375, 2.398193359375, 2.63629150390625, 2.8743896484375, 3.11248779296875, 3.3505859375, 3.58868408203125, 3.8267822265625, 4.06488037109375, 4.302978515625, 4.54107666015625, 4.7791748046875, 5.01727294921875, 5.25537109375, 5.49346923828125, 5.7315673828125, 5.96966552734375, 6.207763671875, 6.44586181640625, 6.6839599609375, 6.92205810546875, 7.16015625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 1.0, 4.0, 6.0, 3.0, 3.0, 3.0, 5.0, 10.0, 9.0, 10.0, 12.0, 7.0, 22.0, 13.0, 21.0, 19.0, 22.0, 19.0, 33.0, 25.0, 29.0, 34.0, 48.0, 47.0, 37.0, 46.0, 38.0, 46.0, 34.0, 36.0, 32.0, 35.0, 36.0, 37.0, 26.0, 27.0, 30.0, 19.0, 11.0, 23.0, 18.0, 12.0, 10.0, 7.0, 13.0, 7.0, 6.0, 6.0, 5.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.58203125, -5.388916015625, -5.19580078125, -5.002685546875, -4.8095703125, -4.616455078125, -4.42333984375, -4.230224609375, -4.037109375, -3.843994140625, -3.65087890625, -3.457763671875, -3.2646484375, -3.071533203125, -2.87841796875, -2.685302734375, -2.4921875, -2.299072265625, -2.10595703125, -1.912841796875, -1.7197265625, -1.526611328125, -1.33349609375, -1.140380859375, -0.947265625, -0.754150390625, -0.56103515625, -0.367919921875, -0.1748046875, 0.018310546875, 0.21142578125, 0.404541015625, 0.59765625, 0.790771484375, 0.98388671875, 1.177001953125, 1.3701171875, 1.563232421875, 1.75634765625, 1.949462890625, 2.142578125, 2.335693359375, 2.52880859375, 2.721923828125, 2.9150390625, 3.108154296875, 3.30126953125, 3.494384765625, 3.6875, 3.880615234375, 4.07373046875, 4.266845703125, 4.4599609375, 4.653076171875, 4.84619140625, 5.039306640625, 5.232421875, 5.425537109375, 5.61865234375, 5.811767578125, 6.0048828125, 6.197998046875, 6.39111328125, 6.584228515625, 6.77734375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 0.0, 1.0, 3.0, 2.0, 8.0, 12.0, 9.0, 16.0, 22.0, 29.0, 58.0, 91.0, 143.0, 283.0, 562.0, 1079.0, 2503.0, 6513.0, 19088.0, 63857.0, 208752.0, 417616.0, 225048.0, 69848.0, 21100.0, 6888.0, 2619.0, 1171.0, 523.0, 295.0, 149.0, 70.0, 72.0, 48.0, 29.0, 12.0, 8.0, 13.0, 5.0, 7.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.18359375, -3.0758056640625, -2.968017578125, -2.8602294921875, -2.75244140625, -2.6446533203125, -2.536865234375, -2.4290771484375, -2.3212890625, -2.2135009765625, -2.105712890625, -1.9979248046875, -1.89013671875, -1.7823486328125, -1.674560546875, -1.5667724609375, -1.458984375, -1.3511962890625, -1.243408203125, -1.1356201171875, -1.02783203125, -0.9200439453125, -0.812255859375, -0.7044677734375, -0.5966796875, -0.4888916015625, -0.381103515625, -0.2733154296875, -0.16552734375, -0.0577392578125, 0.050048828125, 0.1578369140625, 0.265625, 0.3734130859375, 0.481201171875, 0.5889892578125, 0.69677734375, 0.8045654296875, 0.912353515625, 1.0201416015625, 1.1279296875, 1.2357177734375, 1.343505859375, 1.4512939453125, 1.55908203125, 1.6668701171875, 1.774658203125, 1.8824462890625, 1.990234375, 2.0980224609375, 2.205810546875, 2.3135986328125, 2.42138671875, 2.5291748046875, 2.636962890625, 2.7447509765625, 2.8525390625, 2.9603271484375, 3.068115234375, 3.1759033203125, 3.28369140625, 3.3914794921875, 3.499267578125, 3.6070556640625, 3.71484375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 5.0, 3.0, 5.0, 7.0, 12.0, 20.0, 17.0, 22.0, 24.0, 33.0, 43.0, 56.0, 58.0, 60.0, 75.0, 65.0, 74.0, 64.0, 69.0, 52.0, 42.0, 33.0, 32.0, 27.0, 32.0, 20.0, 14.0, 8.0, 8.0, 7.0, 3.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0006260871887207031, -0.0006093829870223999, -0.0005926787853240967, -0.0005759745836257935, -0.0005592703819274902, -0.000542566180229187, -0.0005258619785308838, -0.0005091577768325806, -0.0004924535751342773, -0.0004757493734359741, -0.0004590451717376709, -0.0004423409700393677, -0.00042563676834106445, -0.00040893256664276123, -0.000392228364944458, -0.0003755241632461548, -0.00035881996154785156, -0.00034211575984954834, -0.0003254115581512451, -0.0003087073564529419, -0.00029200315475463867, -0.00027529895305633545, -0.0002585947513580322, -0.000241890549659729, -0.00022518634796142578, -0.00020848214626312256, -0.00019177794456481934, -0.0001750737428665161, -0.0001583695411682129, -0.00014166533946990967, -0.00012496113777160645, -0.00010825693607330322, -9.1552734375e-05, -7.484853267669678e-05, -5.8144330978393555e-05, -4.144012928009033e-05, -2.473592758178711e-05, -8.031725883483887e-06, 8.672475814819336e-06, 2.537667751312256e-05, 4.208087921142578e-05, 5.8785080909729004e-05, 7.548928260803223e-05, 9.219348430633545e-05, 0.00010889768600463867, 0.0001256018877029419, 0.00014230608940124512, 0.00015901029109954834, 0.00017571449279785156, 0.00019241869449615479, 0.000209122896194458, 0.00022582709789276123, 0.00024253129959106445, 0.0002592355012893677, 0.0002759397029876709, 0.0002926439046859741, 0.00030934810638427734, 0.00032605230808258057, 0.0003427565097808838, 0.000359460711479187, 0.00037616491317749023, 0.00039286911487579346, 0.0004095733165740967, 0.0004262775182723999, 0.0004429817199707031]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 7.0, 8.0, 18.0, 28.0, 36.0, 41.0, 71.0, 110.0, 198.0, 322.0, 672.0, 1523.0, 4144.0, 15797.0, 81553.0, 407795.0, 424163.0, 87721.0, 16737.0, 4395.0, 1638.0, 652.0, 357.0, 208.0, 126.0, 79.0, 40.0, 33.0, 24.0, 16.0, 11.0, 11.0, 4.0, 1.0, 4.0, 4.0, 2.0, 5.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.75, -3.5938720703125, -3.437744140625, -3.2816162109375, -3.12548828125, -2.9693603515625, -2.813232421875, -2.6571044921875, -2.5009765625, -2.3448486328125, -2.188720703125, -2.0325927734375, -1.87646484375, -1.7203369140625, -1.564208984375, -1.4080810546875, -1.251953125, -1.0958251953125, -0.939697265625, -0.7835693359375, -0.62744140625, -0.4713134765625, -0.315185546875, -0.1590576171875, -0.0029296875, 0.1531982421875, 0.309326171875, 0.4654541015625, 0.62158203125, 0.7777099609375, 0.933837890625, 1.0899658203125, 1.24609375, 1.4022216796875, 1.558349609375, 1.7144775390625, 1.87060546875, 2.0267333984375, 2.182861328125, 2.3389892578125, 2.4951171875, 2.6512451171875, 2.807373046875, 2.9635009765625, 3.11962890625, 3.2757568359375, 3.431884765625, 3.5880126953125, 3.744140625, 3.9002685546875, 4.056396484375, 4.2125244140625, 4.36865234375, 4.5247802734375, 4.680908203125, 4.8370361328125, 4.9931640625, 5.1492919921875, 5.305419921875, 5.4615478515625, 5.61767578125, 5.7738037109375, 5.929931640625, 6.0860595703125, 6.2421875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 7.0, 6.0, 10.0, 16.0, 15.0, 19.0, 17.0, 33.0, 26.0, 59.0, 64.0, 86.0, 80.0, 68.0, 68.0, 64.0, 57.0, 58.0, 63.0, 47.0, 30.0, 19.0, 10.0, 15.0, 21.0, 7.0, 9.0, 5.0, 7.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.572265625, -2.454010009765625, -2.33575439453125, -2.217498779296875, -2.0992431640625, -1.980987548828125, -1.86273193359375, -1.744476318359375, -1.626220703125, -1.507965087890625, -1.38970947265625, -1.271453857421875, -1.1531982421875, -1.034942626953125, -0.91668701171875, -0.798431396484375, -0.68017578125, -0.561920166015625, -0.44366455078125, -0.325408935546875, -0.2071533203125, -0.088897705078125, 0.02935791015625, 0.147613525390625, 0.265869140625, 0.384124755859375, 0.50238037109375, 0.620635986328125, 0.7388916015625, 0.857147216796875, 0.97540283203125, 1.093658447265625, 1.2119140625, 1.330169677734375, 1.44842529296875, 1.566680908203125, 1.6849365234375, 1.803192138671875, 1.92144775390625, 2.039703369140625, 2.157958984375, 2.276214599609375, 2.39447021484375, 2.512725830078125, 2.6309814453125, 2.749237060546875, 2.86749267578125, 2.985748291015625, 3.10400390625, 3.222259521484375, 3.34051513671875, 3.458770751953125, 3.5770263671875, 3.695281982421875, 3.81353759765625, 3.931793212890625, 4.050048828125, 4.168304443359375, 4.28656005859375, 4.404815673828125, 4.5230712890625, 4.641326904296875, 4.75958251953125, 4.877838134765625, 4.99609375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 11.0, 82.0, 234.0, 331.0, 241.0, 85.0, 15.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.2195816040039, -62.7902717590332, -57.3609619140625, -51.93165588378906, -46.502342224121094, -41.073036193847656, -35.64372634887695, -30.21441650390625, -24.785106658935547, -19.355796813964844, -13.926487922668457, -8.49717903137207, -3.067869186401367, 2.361440658569336, 7.790748596191406, 13.22005844116211, 18.649368286132812, 24.078678131103516, 29.50798797607422, 34.937294006347656, 40.366607666015625, 45.79591369628906, 51.225223541259766, 56.65453338623047, 62.08384323120117, 67.51315307617188, 72.94245910644531, 78.37177276611328, 83.80107879638672, 89.23039245605469, 94.65969848632812, 100.08900451660156, 105.51832580566406, 110.9476318359375, 116.37694549560547, 121.8062515258789, 127.23556518554688, 132.6648712158203, 138.09417724609375, 143.52349853515625, 148.9528045654297, 154.38211059570312, 159.81141662597656, 165.24073791503906, 170.6700439453125, 176.09934997558594, 181.52865600585938, 186.95797729492188, 192.38726806640625, 197.8165740966797, 203.24588012695312, 208.67520141601562, 214.10450744628906, 219.5338134765625, 224.96311950683594, 230.39242553710938, 235.82174682617188, 241.2510528564453, 246.68035888671875, 252.10968017578125, 257.5389709472656, 262.9682922363281, 268.3976135253906, 273.826904296875, 279.2562255859375]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 9.0, 5.0, 9.0, 13.0, 10.0, 21.0, 15.0, 18.0, 21.0, 30.0, 24.0, 35.0, 48.0, 43.0, 49.0, 36.0, 53.0, 49.0, 46.0, 38.0, 51.0, 47.0, 40.0, 35.0, 32.0, 31.0, 18.0, 24.0, 27.0, 21.0, 29.0, 12.0, 12.0, 14.0, 12.0, 4.0, 2.0, 6.0, 2.0, 1.0, 8.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.62859344482422, -32.525753021240234, -31.422914505004883, -30.32007598876953, -29.217235565185547, -28.114395141601562, -27.01155662536621, -25.90871810913086, -24.805877685546875, -23.70303726196289, -22.60019874572754, -21.497360229492188, -20.394519805908203, -19.29167938232422, -18.188840866088867, -17.086002349853516, -15.983161926269531, -14.880322456359863, -13.777482986450195, -12.674643516540527, -11.57180404663086, -10.468964576721191, -9.366125106811523, -8.263285636901855, -7.1604461669921875, -6.0576066970825195, -4.954767227172852, -3.8519277572631836, -2.7490882873535156, -1.6462488174438477, -0.5434093475341797, 0.5594301223754883, 1.6622734069824219, 2.76511287689209, 3.867952346801758, 4.970791816711426, 6.073631286621094, 7.176470756530762, 8.27931022644043, 9.382149696350098, 10.484989166259766, 11.587828636169434, 12.690668106079102, 13.79350757598877, 14.896347045898438, 15.999186515808105, 17.102025985717773, 18.204864501953125, 19.30770492553711, 20.410545349121094, 21.513383865356445, 22.616222381591797, 23.71906280517578, 24.821903228759766, 25.924741744995117, 27.02758026123047, 28.130420684814453, 29.233261108398438, 30.33609962463379, 31.43893814086914, 32.541778564453125, 33.64461898803711, 34.747459411621094, 35.85029602050781, 36.9531364440918]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 5.0, 3.0, 13.0, 8.0, 13.0, 14.0, 27.0, 37.0, 45.0, 64.0, 109.0, 183.0, 298.0, 582.0, 1078.0, 2192.0, 5746.0, 22614.0, 372529.0, 3747951.0, 28778.0, 6780.0, 2606.0, 1173.0, 550.0, 331.0, 201.0, 108.0, 80.0, 51.0, 43.0, 22.0, 18.0, 7.0, 6.0, 5.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0], "bins": [-21.265625, -20.7213134765625, -20.177001953125, -19.6326904296875, -19.08837890625, -18.5440673828125, -17.999755859375, -17.4554443359375, -16.9111328125, -16.3668212890625, -15.822509765625, -15.2781982421875, -14.73388671875, -14.1895751953125, -13.645263671875, -13.1009521484375, -12.556640625, -12.0123291015625, -11.468017578125, -10.9237060546875, -10.37939453125, -9.8350830078125, -9.290771484375, -8.7464599609375, -8.2021484375, -7.6578369140625, -7.113525390625, -6.5692138671875, -6.02490234375, -5.4805908203125, -4.936279296875, -4.3919677734375, -3.84765625, -3.3033447265625, -2.759033203125, -2.2147216796875, -1.67041015625, -1.1260986328125, -0.581787109375, -0.0374755859375, 0.5068359375, 1.0511474609375, 1.595458984375, 2.1397705078125, 2.68408203125, 3.2283935546875, 3.772705078125, 4.3170166015625, 4.861328125, 5.4056396484375, 5.949951171875, 6.4942626953125, 7.03857421875, 7.5828857421875, 8.127197265625, 8.6715087890625, 9.2158203125, 9.7601318359375, 10.304443359375, 10.8487548828125, 11.39306640625, 11.9373779296875, 12.481689453125, 13.0260009765625, 13.5703125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 8.0, 6.0, 11.0, 6.0, 11.0, 12.0, 16.0, 17.0, 19.0, 28.0, 43.0, 33.0, 35.0, 47.0, 52.0, 33.0, 58.0, 52.0, 46.0, 54.0, 38.0, 46.0, 44.0, 34.0, 39.0, 31.0, 34.0, 28.0, 33.0, 19.0, 9.0, 8.0, 9.0, 16.0, 8.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9599609375, -1.9056243896484375, -1.851287841796875, -1.7969512939453125, -1.74261474609375, -1.6882781982421875, -1.633941650390625, -1.5796051025390625, -1.5252685546875, -1.4709320068359375, -1.416595458984375, -1.3622589111328125, -1.30792236328125, -1.2535858154296875, -1.199249267578125, -1.1449127197265625, -1.090576171875, -1.0362396240234375, -0.981903076171875, -0.9275665283203125, -0.87322998046875, -0.8188934326171875, -0.764556884765625, -0.7102203369140625, -0.6558837890625, -0.6015472412109375, -0.547210693359375, -0.4928741455078125, -0.43853759765625, -0.3842010498046875, -0.329864501953125, -0.2755279541015625, -0.22119140625, -0.1668548583984375, -0.112518310546875, -0.0581817626953125, -0.00384521484375, 0.0504913330078125, 0.104827880859375, 0.1591644287109375, 0.2135009765625, 0.2678375244140625, 0.322174072265625, 0.3765106201171875, 0.43084716796875, 0.4851837158203125, 0.539520263671875, 0.5938568115234375, 0.648193359375, 0.7025299072265625, 0.756866455078125, 0.8112030029296875, 0.86553955078125, 0.9198760986328125, 0.974212646484375, 1.0285491943359375, 1.0828857421875, 1.1372222900390625, 1.191558837890625, 1.2458953857421875, 1.30023193359375, 1.3545684814453125, 1.408905029296875, 1.4632415771484375, 1.517578125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 6.0, 13.0, 16.0, 29.0, 54.0, 77.0, 121.0, 176.0, 272.0, 420.0, 717.0, 1204.0, 2129.0, 4225.0, 9679.0, 27818.0, 138990.0, 3802488.0, 156289.0, 29841.0, 10108.0, 4309.0, 2128.0, 1204.0, 735.0, 452.0, 248.0, 197.0, 121.0, 80.0, 53.0, 27.0, 21.0, 11.0, 13.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.93359375, -7.68194580078125, -7.4302978515625, -7.17864990234375, -6.927001953125, -6.67535400390625, -6.4237060546875, -6.17205810546875, -5.92041015625, -5.66876220703125, -5.4171142578125, -5.16546630859375, -4.913818359375, -4.66217041015625, -4.4105224609375, -4.15887451171875, -3.9072265625, -3.65557861328125, -3.4039306640625, -3.15228271484375, -2.900634765625, -2.64898681640625, -2.3973388671875, -2.14569091796875, -1.89404296875, -1.64239501953125, -1.3907470703125, -1.13909912109375, -0.887451171875, -0.63580322265625, -0.3841552734375, -0.13250732421875, 0.119140625, 0.37078857421875, 0.6224365234375, 0.87408447265625, 1.125732421875, 1.37738037109375, 1.6290283203125, 1.88067626953125, 2.13232421875, 2.38397216796875, 2.6356201171875, 2.88726806640625, 3.138916015625, 3.39056396484375, 3.6422119140625, 3.89385986328125, 4.1455078125, 4.39715576171875, 4.6488037109375, 4.90045166015625, 5.152099609375, 5.40374755859375, 5.6553955078125, 5.90704345703125, 6.15869140625, 6.41033935546875, 6.6619873046875, 6.91363525390625, 7.165283203125, 7.41693115234375, 7.6685791015625, 7.92022705078125, 8.171875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 2.0, 8.0, 6.0, 13.0, 19.0, 18.0, 31.0, 79.0, 186.0, 2651.0, 745.0, 147.0, 59.0, 46.0, 20.0, 10.0, 13.0, 9.0, 4.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.146484375, -2.079315185546875, -2.01214599609375, -1.944976806640625, -1.8778076171875, -1.810638427734375, -1.74346923828125, -1.676300048828125, -1.609130859375, -1.541961669921875, -1.47479248046875, -1.407623291015625, -1.3404541015625, -1.273284912109375, -1.20611572265625, -1.138946533203125, -1.07177734375, -1.004608154296875, -0.93743896484375, -0.870269775390625, -0.8031005859375, -0.735931396484375, -0.66876220703125, -0.601593017578125, -0.534423828125, -0.467254638671875, -0.40008544921875, -0.332916259765625, -0.2657470703125, -0.198577880859375, -0.13140869140625, -0.064239501953125, 0.0029296875, 0.070098876953125, 0.13726806640625, 0.204437255859375, 0.2716064453125, 0.338775634765625, 0.40594482421875, 0.473114013671875, 0.540283203125, 0.607452392578125, 0.67462158203125, 0.741790771484375, 0.8089599609375, 0.876129150390625, 0.94329833984375, 1.010467529296875, 1.07763671875, 1.144805908203125, 1.21197509765625, 1.279144287109375, 1.3463134765625, 1.413482666015625, 1.48065185546875, 1.547821044921875, 1.614990234375, 1.682159423828125, 1.74932861328125, 1.816497802734375, 1.8836669921875, 1.950836181640625, 2.01800537109375, 2.085174560546875, 2.15234375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 8.0, 21.0, 31.0, 78.0, 132.0, 202.0, 224.0, 161.0, 88.0, 37.0, 16.0, 6.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0], "bins": [-25.31694221496582, -24.835744857788086, -24.35454750061035, -23.873350143432617, -23.392152786254883, -22.91095733642578, -22.429759979248047, -21.948562622070312, -21.467365264892578, -20.986167907714844, -20.50497055053711, -20.023773193359375, -19.54257583618164, -19.061378479003906, -18.580183029174805, -18.09898567199707, -17.617788314819336, -17.1365909576416, -16.655393600463867, -16.174196243286133, -15.692999839782715, -15.21180248260498, -14.730605125427246, -14.249408721923828, -13.768210411071777, -13.287013053894043, -12.805815696716309, -12.32461929321289, -11.843421936035156, -11.362224578857422, -10.881027221679688, -10.399829864501953, -9.918634414672852, -9.437437057495117, -8.956239700317383, -8.475043296813965, -7.9938459396362305, -7.512648582458496, -7.031451225280762, -6.5502543449401855, -6.069056510925293, -5.587859153747559, -5.106662273406982, -4.625464916229248, -4.144268035888672, -3.6630706787109375, -3.1818735599517822, -2.700676441192627, -2.219479560852051, -1.7382824420928955, -1.2570853233337402, -0.7758880853652954, -0.29469096660614014, 0.1865062713623047, 0.66770339012146, 1.1489005088806152, 1.6300976276397705, 2.111294746398926, 2.592491865158081, 3.0736889839172363, 3.5548863410949707, 4.036083221435547, 4.517280578613281, 4.998477935791016, 5.479674816131592]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 4.0, 8.0, 6.0, 10.0, 6.0, 14.0, 20.0, 20.0, 24.0, 14.0, 22.0, 26.0, 44.0, 34.0, 34.0, 33.0, 32.0, 54.0, 39.0, 43.0, 43.0, 48.0, 37.0, 32.0, 41.0, 47.0, 41.0, 29.0, 23.0, 19.0, 29.0, 20.0, 22.0, 15.0, 16.0, 6.0, 8.0, 5.0, 10.0, 6.0, 4.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-4.32232141494751, -4.18694543838501, -4.05156946182251, -3.916193723678589, -3.780817747116089, -3.645441770553589, -3.510066032409668, -3.374690055847168, -3.239314079284668, -3.103938102722168, -2.968562126159668, -2.833186388015747, -2.697810411453247, -2.562434434890747, -2.427058696746826, -2.291682720184326, -2.156306743621826, -2.020930767059326, -1.8855549097061157, -1.7501790523529053, -1.6148030757904053, -1.4794270992279053, -1.3440512418746948, -1.2086753845214844, -1.0732994079589844, -0.9379234910011292, -0.8025475740432739, -0.6671716570854187, -0.5317957401275635, -0.39641982316970825, -0.261043906211853, -0.1256679892539978, 0.009707450866699219, 0.14508336782455444, 0.28045928478240967, 0.4158352017402649, 0.5512111186981201, 0.6865870356559753, 0.8219629526138306, 0.9573388695716858, 1.092714786529541, 1.228090763092041, 1.3634666204452515, 1.498842477798462, 1.634218454360962, 1.769594430923462, 1.9049702882766724, 2.040346145629883, 2.175722122192383, 2.311098098754883, 2.446474075317383, 2.5818498134613037, 2.7172257900238037, 2.8526017665863037, 2.9879775047302246, 3.1233534812927246, 3.2587294578552246, 3.3941054344177246, 3.5294814109802246, 3.6648571491241455, 3.8002331256866455, 3.9356091022491455, 4.070984840393066, 4.206360816955566, 4.341736793518066]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 2.0, 4.0, 8.0, 11.0, 15.0, 19.0, 20.0, 46.0, 64.0, 102.0, 155.0, 243.0, 358.0, 731.0, 1309.0, 2828.0, 6280.0, 15787.0, 40641.0, 105492.0, 246409.0, 323648.0, 183195.0, 72897.0, 28291.0, 10997.0, 4456.0, 2075.0, 1038.0, 541.0, 322.0, 190.0, 129.0, 78.0, 66.0, 35.0, 23.0, 18.0, 6.0, 10.0, 3.0, 8.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7265625, -5.53759765625, -5.3486328125, -5.15966796875, -4.970703125, -4.78173828125, -4.5927734375, -4.40380859375, -4.21484375, -4.02587890625, -3.8369140625, -3.64794921875, -3.458984375, -3.27001953125, -3.0810546875, -2.89208984375, -2.703125, -2.51416015625, -2.3251953125, -2.13623046875, -1.947265625, -1.75830078125, -1.5693359375, -1.38037109375, -1.19140625, -1.00244140625, -0.8134765625, -0.62451171875, -0.435546875, -0.24658203125, -0.0576171875, 0.13134765625, 0.3203125, 0.50927734375, 0.6982421875, 0.88720703125, 1.076171875, 1.26513671875, 1.4541015625, 1.64306640625, 1.83203125, 2.02099609375, 2.2099609375, 2.39892578125, 2.587890625, 2.77685546875, 2.9658203125, 3.15478515625, 3.34375, 3.53271484375, 3.7216796875, 3.91064453125, 4.099609375, 4.28857421875, 4.4775390625, 4.66650390625, 4.85546875, 5.04443359375, 5.2333984375, 5.42236328125, 5.611328125, 5.80029296875, 5.9892578125, 6.17822265625, 6.3671875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 7.0, 5.0, 4.0, 9.0, 5.0, 10.0, 18.0, 17.0, 17.0, 26.0, 23.0, 43.0, 32.0, 42.0, 41.0, 39.0, 44.0, 55.0, 57.0, 51.0, 43.0, 47.0, 45.0, 54.0, 46.0, 37.0, 24.0, 20.0, 37.0, 31.0, 18.0, 10.0, 14.0, 11.0, 5.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.974609375, -1.912872314453125, -1.85113525390625, -1.789398193359375, -1.7276611328125, -1.665924072265625, -1.60418701171875, -1.542449951171875, -1.480712890625, -1.418975830078125, -1.35723876953125, -1.295501708984375, -1.2337646484375, -1.172027587890625, -1.11029052734375, -1.048553466796875, -0.98681640625, -0.925079345703125, -0.86334228515625, -0.801605224609375, -0.7398681640625, -0.678131103515625, -0.61639404296875, -0.554656982421875, -0.492919921875, -0.431182861328125, -0.36944580078125, -0.307708740234375, -0.2459716796875, -0.184234619140625, -0.12249755859375, -0.060760498046875, 0.0009765625, 0.062713623046875, 0.12445068359375, 0.186187744140625, 0.2479248046875, 0.309661865234375, 0.37139892578125, 0.433135986328125, 0.494873046875, 0.556610107421875, 0.61834716796875, 0.680084228515625, 0.7418212890625, 0.803558349609375, 0.86529541015625, 0.927032470703125, 0.98876953125, 1.050506591796875, 1.11224365234375, 1.173980712890625, 1.2357177734375, 1.297454833984375, 1.35919189453125, 1.420928955078125, 1.482666015625, 1.544403076171875, 1.60614013671875, 1.667877197265625, 1.7296142578125, 1.791351318359375, 1.85308837890625, 1.914825439453125, 1.9765625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 6.0, 2.0, 4.0, 2.0, 15.0, 10.0, 18.0, 19.0, 33.0, 33.0, 58.0, 75.0, 116.0, 138.0, 199.0, 272.0, 441.0, 647.0, 1364.0, 3490.0, 13005.0, 65082.0, 378044.0, 475111.0, 85696.0, 16781.0, 4084.0, 1516.0, 789.0, 445.0, 314.0, 223.0, 153.0, 99.0, 77.0, 52.0, 44.0, 31.0, 22.0, 10.0, 12.0, 12.0, 6.0, 5.0, 2.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.109375, -8.833984375, -8.55859375, -8.283203125, -8.0078125, -7.732421875, -7.45703125, -7.181640625, -6.90625, -6.630859375, -6.35546875, -6.080078125, -5.8046875, -5.529296875, -5.25390625, -4.978515625, -4.703125, -4.427734375, -4.15234375, -3.876953125, -3.6015625, -3.326171875, -3.05078125, -2.775390625, -2.5, -2.224609375, -1.94921875, -1.673828125, -1.3984375, -1.123046875, -0.84765625, -0.572265625, -0.296875, -0.021484375, 0.25390625, 0.529296875, 0.8046875, 1.080078125, 1.35546875, 1.630859375, 1.90625, 2.181640625, 2.45703125, 2.732421875, 3.0078125, 3.283203125, 3.55859375, 3.833984375, 4.109375, 4.384765625, 4.66015625, 4.935546875, 5.2109375, 5.486328125, 5.76171875, 6.037109375, 6.3125, 6.587890625, 6.86328125, 7.138671875, 7.4140625, 7.689453125, 7.96484375, 8.240234375, 8.515625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 3.0, 5.0, 3.0, 1.0, 5.0, 2.0, 6.0, 7.0, 10.0, 11.0, 12.0, 17.0, 19.0, 28.0, 21.0, 25.0, 28.0, 29.0, 41.0, 27.0, 46.0, 49.0, 49.0, 41.0, 55.0, 50.0, 41.0, 47.0, 36.0, 44.0, 36.0, 41.0, 28.0, 25.0, 17.0, 21.0, 24.0, 17.0, 12.0, 9.0, 6.0, 6.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.84375, -9.57611083984375, -9.3084716796875, -9.04083251953125, -8.773193359375, -8.50555419921875, -8.2379150390625, -7.97027587890625, -7.70263671875, -7.43499755859375, -7.1673583984375, -6.89971923828125, -6.632080078125, -6.36444091796875, -6.0968017578125, -5.82916259765625, -5.5615234375, -5.29388427734375, -5.0262451171875, -4.75860595703125, -4.490966796875, -4.22332763671875, -3.9556884765625, -3.68804931640625, -3.42041015625, -3.15277099609375, -2.8851318359375, -2.61749267578125, -2.349853515625, -2.08221435546875, -1.8145751953125, -1.54693603515625, -1.279296875, -1.01165771484375, -0.7440185546875, -0.47637939453125, -0.208740234375, 0.05889892578125, 0.3265380859375, 0.59417724609375, 0.86181640625, 1.12945556640625, 1.3970947265625, 1.66473388671875, 1.932373046875, 2.20001220703125, 2.4676513671875, 2.73529052734375, 3.0029296875, 3.27056884765625, 3.5382080078125, 3.80584716796875, 4.073486328125, 4.34112548828125, 4.6087646484375, 4.87640380859375, 5.14404296875, 5.41168212890625, 5.6793212890625, 5.94696044921875, 6.214599609375, 6.48223876953125, 6.7498779296875, 7.01751708984375, 7.28515625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 8.0, 14.0, 14.0, 34.0, 39.0, 55.0, 103.0, 121.0, 205.0, 333.0, 575.0, 1126.0, 2154.0, 4463.0, 11348.0, 30791.0, 92675.0, 269688.0, 392506.0, 158906.0, 51851.0, 17899.0, 6984.0, 3107.0, 1528.0, 782.0, 455.0, 299.0, 185.0, 98.0, 75.0, 44.0, 36.0, 16.0, 15.0, 4.0, 6.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.744140625, -2.661590576171875, -2.57904052734375, -2.496490478515625, -2.4139404296875, -2.331390380859375, -2.24884033203125, -2.166290283203125, -2.083740234375, -2.001190185546875, -1.91864013671875, -1.836090087890625, -1.7535400390625, -1.670989990234375, -1.58843994140625, -1.505889892578125, -1.42333984375, -1.340789794921875, -1.25823974609375, -1.175689697265625, -1.0931396484375, -1.010589599609375, -0.92803955078125, -0.845489501953125, -0.762939453125, -0.680389404296875, -0.59783935546875, -0.515289306640625, -0.4327392578125, -0.350189208984375, -0.26763916015625, -0.185089111328125, -0.1025390625, -0.019989013671875, 0.06256103515625, 0.145111083984375, 0.2276611328125, 0.310211181640625, 0.39276123046875, 0.475311279296875, 0.557861328125, 0.640411376953125, 0.72296142578125, 0.805511474609375, 0.8880615234375, 0.970611572265625, 1.05316162109375, 1.135711669921875, 1.21826171875, 1.300811767578125, 1.38336181640625, 1.465911865234375, 1.5484619140625, 1.631011962890625, 1.71356201171875, 1.796112060546875, 1.878662109375, 1.961212158203125, 2.04376220703125, 2.126312255859375, 2.2088623046875, 2.291412353515625, 2.37396240234375, 2.456512451171875, 2.5390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 7.0, 5.0, 10.0, 22.0, 16.0, 30.0, 41.0, 59.0, 83.0, 77.0, 98.0, 94.0, 105.0, 90.0, 63.0, 63.0, 47.0, 32.0, 15.0, 16.0, 14.0, 7.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0008831024169921875, -0.0008622035384178162, -0.0008413046598434448, -0.0008204057812690735, -0.0007995069026947021, -0.0007786080241203308, -0.0007577091455459595, -0.0007368102669715881, -0.0007159113883972168, -0.0006950125098228455, -0.0006741136312484741, -0.0006532147526741028, -0.0006323158740997314, -0.0006114169955253601, -0.0005905181169509888, -0.0005696192383766174, -0.0005487203598022461, -0.0005278214812278748, -0.0005069226026535034, -0.0004860237240791321, -0.00046512484550476074, -0.0004442259669303894, -0.00042332708835601807, -0.00040242820978164673, -0.0003815293312072754, -0.00036063045263290405, -0.0003397315740585327, -0.0003188326954841614, -0.00029793381690979004, -0.0002770349383354187, -0.00025613605976104736, -0.00023523718118667603, -0.0002143383026123047, -0.00019343942403793335, -0.000172540545463562, -0.00015164166688919067, -0.00013074278831481934, -0.000109843909740448, -8.894503116607666e-05, -6.804615259170532e-05, -4.7147274017333984e-05, -2.6248395442962646e-05, -5.349516868591309e-06, 1.554936170578003e-05, 3.644824028015137e-05, 5.7347118854522705e-05, 7.824599742889404e-05, 9.914487600326538e-05, 0.00012004375457763672, 0.00014094263315200806, 0.0001618415117263794, 0.00018274039030075073, 0.00020363926887512207, 0.0002245381474494934, 0.00024543702602386475, 0.0002663359045982361, 0.0002872347831726074, 0.00030813366174697876, 0.0003290325403213501, 0.00034993141889572144, 0.0003708302974700928, 0.0003917291760444641, 0.00041262805461883545, 0.0004335269331932068, 0.0004544258117675781]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 10.0, 9.0, 8.0, 12.0, 20.0, 35.0, 57.0, 85.0, 155.0, 278.0, 541.0, 1064.0, 2245.0, 6390.0, 26552.0, 151635.0, 564980.0, 238788.0, 41011.0, 9139.0, 2900.0, 1226.0, 609.0, 314.0, 198.0, 103.0, 59.0, 37.0, 23.0, 21.0, 11.0, 16.0, 5.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.71875, -3.5888671875, -3.458984375, -3.3291015625, -3.19921875, -3.0693359375, -2.939453125, -2.8095703125, -2.6796875, -2.5498046875, -2.419921875, -2.2900390625, -2.16015625, -2.0302734375, -1.900390625, -1.7705078125, -1.640625, -1.5107421875, -1.380859375, -1.2509765625, -1.12109375, -0.9912109375, -0.861328125, -0.7314453125, -0.6015625, -0.4716796875, -0.341796875, -0.2119140625, -0.08203125, 0.0478515625, 0.177734375, 0.3076171875, 0.4375, 0.5673828125, 0.697265625, 0.8271484375, 0.95703125, 1.0869140625, 1.216796875, 1.3466796875, 1.4765625, 1.6064453125, 1.736328125, 1.8662109375, 1.99609375, 2.1259765625, 2.255859375, 2.3857421875, 2.515625, 2.6455078125, 2.775390625, 2.9052734375, 3.03515625, 3.1650390625, 3.294921875, 3.4248046875, 3.5546875, 3.6845703125, 3.814453125, 3.9443359375, 4.07421875, 4.2041015625, 4.333984375, 4.4638671875, 4.59375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 6.0, 9.0, 13.0, 12.0, 15.0, 35.0, 26.0, 35.0, 52.0, 63.0, 71.0, 79.0, 95.0, 84.0, 95.0, 70.0, 61.0, 48.0, 37.0, 25.0, 22.0, 12.0, 10.0, 12.0, 7.0, 1.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5, -4.377532958984375, -4.25506591796875, -4.132598876953125, -4.0101318359375, -3.887664794921875, -3.76519775390625, -3.642730712890625, -3.520263671875, -3.397796630859375, -3.27532958984375, -3.152862548828125, -3.0303955078125, -2.907928466796875, -2.78546142578125, -2.662994384765625, -2.54052734375, -2.418060302734375, -2.29559326171875, -2.173126220703125, -2.0506591796875, -1.928192138671875, -1.80572509765625, -1.683258056640625, -1.560791015625, -1.438323974609375, -1.31585693359375, -1.193389892578125, -1.0709228515625, -0.948455810546875, -0.82598876953125, -0.703521728515625, -0.5810546875, -0.458587646484375, -0.33612060546875, -0.213653564453125, -0.0911865234375, 0.031280517578125, 0.15374755859375, 0.276214599609375, 0.398681640625, 0.521148681640625, 0.64361572265625, 0.766082763671875, 0.8885498046875, 1.011016845703125, 1.13348388671875, 1.255950927734375, 1.37841796875, 1.500885009765625, 1.62335205078125, 1.745819091796875, 1.8682861328125, 1.990753173828125, 2.11322021484375, 2.235687255859375, 2.358154296875, 2.480621337890625, 2.60308837890625, 2.725555419921875, 2.8480224609375, 2.970489501953125, 3.09295654296875, 3.215423583984375, 3.337890625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 4.0, 1.0, 1.0, 9.0, 11.0, 20.0, 17.0, 25.0, 35.0, 43.0, 72.0, 91.0, 73.0, 84.0, 105.0, 98.0, 88.0, 76.0, 42.0, 34.0, 23.0, 14.0, 19.0, 12.0, 3.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.30792236328125, -41.81925964355469, -40.330596923828125, -38.84193420410156, -37.353275299072266, -35.8646125793457, -34.37594985961914, -32.88728713989258, -31.39862632751465, -29.909963607788086, -28.421302795410156, -26.932640075683594, -25.44397735595703, -23.9553165435791, -22.46665382385254, -20.97799301147461, -19.489330291748047, -18.000667572021484, -16.512006759643555, -15.023344039916992, -13.534682273864746, -12.0460205078125, -10.557357788085938, -9.068696022033691, -7.580034255981445, -6.091372489929199, -4.602710247039795, -3.1140480041503906, -1.6253862380981445, -0.13672447204589844, 1.351938247680664, 2.84060001373291, 4.329261779785156, 5.817923545837402, 7.306585788726807, 8.795248031616211, 10.283909797668457, 11.772571563720703, 13.261234283447266, 14.749896049499512, 16.238557815551758, 17.72722053527832, 19.21588134765625, 20.704544067382812, 22.193206787109375, 23.681867599487305, 25.170530319213867, 26.659191131591797, 28.14785385131836, 29.636516571044922, 31.12517738342285, 32.61383819580078, 34.102500915527344, 35.591163635253906, 37.07982635498047, 38.56848907470703, 40.057151794433594, 41.545814514160156, 43.03447723388672, 44.52313995361328, 46.01179885864258, 47.50046157836914, 48.9891242980957, 50.477787017822266, 51.96644592285156]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 8.0, 8.0, 6.0, 7.0, 9.0, 7.0, 23.0, 14.0, 23.0, 26.0, 47.0, 37.0, 36.0, 37.0, 43.0, 46.0, 53.0, 48.0, 58.0, 46.0, 53.0, 49.0, 46.0, 45.0, 34.0, 28.0, 20.0, 31.0, 20.0, 24.0, 18.0, 14.0, 8.0, 3.0, 10.0, 7.0, 2.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.10371398925781, -31.754697799682617, -30.405681610107422, -29.056663513183594, -27.70764923095703, -26.358631134033203, -25.009614944458008, -23.660598754882812, -22.311582565307617, -20.962566375732422, -19.613550186157227, -18.26453399658203, -16.915515899658203, -15.566500663757324, -14.217483520507812, -12.868467330932617, -11.519451141357422, -10.170434951782227, -8.821418762207031, -7.4724016189575195, -6.123385429382324, -4.774369239807129, -3.425352096557617, -2.076335906982422, -0.7273197174072266, 0.6216967105865479, 1.9707131385803223, 3.319729804992676, 4.668745994567871, 6.017762184143066, 7.366779327392578, 8.715795516967773, 10.064807891845703, 11.413824081420898, 12.762840270996094, 14.111857414245605, 15.4608736038208, 16.809890747070312, 18.158906936645508, 19.507923126220703, 20.8569393157959, 22.205955505371094, 23.55497169494629, 24.903987884521484, 26.253005981445312, 27.602020263671875, 28.951038360595703, 30.3000545501709, 31.649070739746094, 32.99808883666992, 34.347103118896484, 35.69612121582031, 37.045135498046875, 38.3941535949707, 39.74317169189453, 41.092185974121094, 42.441200256347656, 43.790218353271484, 45.13923263549805, 46.488250732421875, 47.83726501464844, 49.186283111572266, 50.535301208496094, 51.884315490722656, 53.233333587646484]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 3.0, 1.0, 5.0, 8.0, 4.0, 9.0, 11.0, 17.0, 31.0, 61.0, 67.0, 110.0, 202.0, 332.0, 693.0, 1543.0, 4015.0, 14958.0, 153429.0, 3966794.0, 39983.0, 7355.0, 2417.0, 1033.0, 543.0, 266.0, 144.0, 83.0, 44.0, 28.0, 27.0, 18.0, 12.0, 7.0, 14.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-18.671875, -18.1962890625, -17.720703125, -17.2451171875, -16.76953125, -16.2939453125, -15.818359375, -15.3427734375, -14.8671875, -14.3916015625, -13.916015625, -13.4404296875, -12.96484375, -12.4892578125, -12.013671875, -11.5380859375, -11.0625, -10.5869140625, -10.111328125, -9.6357421875, -9.16015625, -8.6845703125, -8.208984375, -7.7333984375, -7.2578125, -6.7822265625, -6.306640625, -5.8310546875, -5.35546875, -4.8798828125, -4.404296875, -3.9287109375, -3.453125, -2.9775390625, -2.501953125, -2.0263671875, -1.55078125, -1.0751953125, -0.599609375, -0.1240234375, 0.3515625, 0.8271484375, 1.302734375, 1.7783203125, 2.25390625, 2.7294921875, 3.205078125, 3.6806640625, 4.15625, 4.6318359375, 5.107421875, 5.5830078125, 6.05859375, 6.5341796875, 7.009765625, 7.4853515625, 7.9609375, 8.4365234375, 8.912109375, 9.3876953125, 9.86328125, 10.3388671875, 10.814453125, 11.2900390625, 11.765625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 5.0, 7.0, 5.0, 10.0, 11.0, 11.0, 23.0, 15.0, 17.0, 23.0, 25.0, 31.0, 34.0, 28.0, 44.0, 38.0, 46.0, 39.0, 40.0, 55.0, 44.0, 38.0, 47.0, 41.0, 49.0, 23.0, 27.0, 40.0, 25.0, 27.0, 27.0, 20.0, 12.0, 14.0, 12.0, 13.0, 8.0, 7.0, 6.0, 1.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.69140625, -1.6392822265625, -1.587158203125, -1.5350341796875, -1.48291015625, -1.4307861328125, -1.378662109375, -1.3265380859375, -1.2744140625, -1.2222900390625, -1.170166015625, -1.1180419921875, -1.06591796875, -1.0137939453125, -0.961669921875, -0.9095458984375, -0.857421875, -0.8052978515625, -0.753173828125, -0.7010498046875, -0.64892578125, -0.5968017578125, -0.544677734375, -0.4925537109375, -0.4404296875, -0.3883056640625, -0.336181640625, -0.2840576171875, -0.23193359375, -0.1798095703125, -0.127685546875, -0.0755615234375, -0.0234375, 0.0286865234375, 0.080810546875, 0.1329345703125, 0.18505859375, 0.2371826171875, 0.289306640625, 0.3414306640625, 0.3935546875, 0.4456787109375, 0.497802734375, 0.5499267578125, 0.60205078125, 0.6541748046875, 0.706298828125, 0.7584228515625, 0.810546875, 0.8626708984375, 0.914794921875, 0.9669189453125, 1.01904296875, 1.0711669921875, 1.123291015625, 1.1754150390625, 1.2275390625, 1.2796630859375, 1.331787109375, 1.3839111328125, 1.43603515625, 1.4881591796875, 1.540283203125, 1.5924072265625, 1.64453125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 5.0, 4.0, 12.0, 14.0, 10.0, 21.0, 34.0, 40.0, 66.0, 83.0, 139.0, 213.0, 287.0, 498.0, 756.0, 1152.0, 1911.0, 3107.0, 5595.0, 10795.0, 22584.0, 56720.0, 237480.0, 3590448.0, 171895.0, 48198.0, 19751.0, 9590.0, 5182.0, 2936.0, 1738.0, 1003.0, 705.0, 431.0, 251.0, 205.0, 132.0, 88.0, 65.0, 42.0, 27.0, 18.0, 15.0, 9.0, 11.0, 6.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.51953125, -4.38427734375, -4.2490234375, -4.11376953125, -3.978515625, -3.84326171875, -3.7080078125, -3.57275390625, -3.4375, -3.30224609375, -3.1669921875, -3.03173828125, -2.896484375, -2.76123046875, -2.6259765625, -2.49072265625, -2.35546875, -2.22021484375, -2.0849609375, -1.94970703125, -1.814453125, -1.67919921875, -1.5439453125, -1.40869140625, -1.2734375, -1.13818359375, -1.0029296875, -0.86767578125, -0.732421875, -0.59716796875, -0.4619140625, -0.32666015625, -0.19140625, -0.05615234375, 0.0791015625, 0.21435546875, 0.349609375, 0.48486328125, 0.6201171875, 0.75537109375, 0.890625, 1.02587890625, 1.1611328125, 1.29638671875, 1.431640625, 1.56689453125, 1.7021484375, 1.83740234375, 1.97265625, 2.10791015625, 2.2431640625, 2.37841796875, 2.513671875, 2.64892578125, 2.7841796875, 2.91943359375, 3.0546875, 3.18994140625, 3.3251953125, 3.46044921875, 3.595703125, 3.73095703125, 3.8662109375, 4.00146484375, 4.13671875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 0.0, 8.0, 10.0, 6.0, 9.0, 9.0, 17.0, 26.0, 23.0, 48.0, 76.0, 172.0, 631.0, 2561.0, 206.0, 90.0, 49.0, 31.0, 30.0, 17.0, 10.0, 8.0, 9.0, 6.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.640625, -1.592498779296875, -1.54437255859375, -1.496246337890625, -1.4481201171875, -1.399993896484375, -1.35186767578125, -1.303741455078125, -1.255615234375, -1.207489013671875, -1.15936279296875, -1.111236572265625, -1.0631103515625, -1.014984130859375, -0.96685791015625, -0.918731689453125, -0.87060546875, -0.822479248046875, -0.77435302734375, -0.726226806640625, -0.6781005859375, -0.629974365234375, -0.58184814453125, -0.533721923828125, -0.485595703125, -0.437469482421875, -0.38934326171875, -0.341217041015625, -0.2930908203125, -0.244964599609375, -0.19683837890625, -0.148712158203125, -0.1005859375, -0.052459716796875, -0.00433349609375, 0.043792724609375, 0.0919189453125, 0.140045166015625, 0.18817138671875, 0.236297607421875, 0.284423828125, 0.332550048828125, 0.38067626953125, 0.428802490234375, 0.4769287109375, 0.525054931640625, 0.57318115234375, 0.621307373046875, 0.66943359375, 0.717559814453125, 0.76568603515625, 0.813812255859375, 0.8619384765625, 0.910064697265625, 0.95819091796875, 1.006317138671875, 1.054443359375, 1.102569580078125, 1.15069580078125, 1.198822021484375, 1.2469482421875, 1.295074462890625, 1.34320068359375, 1.391326904296875, 1.439453125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 13.0, 17.0, 35.0, 68.0, 130.0, 200.0, 183.0, 164.0, 99.0, 54.0, 21.0, 16.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.377860069274902, -5.994187355041504, -5.610514163970947, -5.226841449737549, -4.843168258666992, -4.459495544433594, -4.075822830200195, -3.6921498775482178, -3.3084769248962402, -2.9248039722442627, -2.541131019592285, -2.1574583053588867, -1.7737853527069092, -1.3901124000549316, -1.0064396858215332, -0.6227667331695557, -0.23909378051757812, 0.14457911252975464, 0.5282520055770874, 0.9119248390197754, 1.295597791671753, 1.6792707443237305, 2.062943458557129, 2.4466164112091064, 2.830289363861084, 3.2139623165130615, 3.597635269165039, 3.9813079833984375, 4.364980697631836, 4.748653888702393, 5.132326602935791, 5.515999794006348, 5.8996734619140625, 6.283346176147461, 6.667019367218018, 7.050692081451416, 7.434365272521973, 7.818037986755371, 8.20171070098877, 8.585383415222168, 8.969057083129883, 9.352729797363281, 9.73640251159668, 10.120075225830078, 10.503748893737793, 10.887421607971191, 11.27109432220459, 11.654767036437988, 12.038439750671387, 12.422112464904785, 12.805785179138184, 13.189458847045898, 13.573131561279297, 13.956804275512695, 14.340476989746094, 14.724149703979492, 15.10782241821289, 15.491495132446289, 15.875167846679688, 16.258840560913086, 16.642513275146484, 17.026187896728516, 17.40985870361328, 17.793533325195312, 18.17720603942871]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 5.0, 7.0, 12.0, 10.0, 10.0, 11.0, 24.0, 17.0, 20.0, 22.0, 27.0, 25.0, 22.0, 36.0, 33.0, 42.0, 47.0, 40.0, 46.0, 50.0, 36.0, 51.0, 41.0, 37.0, 38.0, 33.0, 27.0, 19.0, 34.0, 23.0, 20.0, 21.0, 23.0, 22.0, 14.0, 12.0, 20.0, 9.0, 6.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.8132519721984863, -3.6944029331207275, -3.5755538940429688, -3.456704616546631, -3.337855577468872, -3.2190065383911133, -3.1001574993133545, -2.9813084602355957, -2.862459182739258, -2.743610143661499, -2.6247611045837402, -2.5059118270874023, -2.3870627880096436, -2.2682137489318848, -2.149364709854126, -2.030515670776367, -1.9116665124893188, -1.79281747341156, -1.6739683151245117, -1.555119276046753, -1.4362701177597046, -1.3174210786819458, -1.1985719203948975, -1.0797228813171387, -0.9608737826347351, -0.8420246839523315, -0.723175585269928, -0.6043264865875244, -0.48547741770744324, -0.36662834882736206, -0.2477792501449585, -0.12893015146255493, -0.010081052780151367, 0.1087680384516716, 0.22761712968349457, 0.34646621346473694, 0.4653153121471405, 0.5841643810272217, 0.7030134797096252, 0.8218625783920288, 0.9407116770744324, 1.059560775756836, 1.1784098148345947, 1.297258973121643, 1.4161080121994019, 1.5349571704864502, 1.653806209564209, 1.7726552486419678, 1.8915044069290161, 2.0103535652160645, 2.1292026042938232, 2.248051643371582, 2.366900682449341, 2.4857497215270996, 2.6045989990234375, 2.7234480381011963, 2.842297077178955, 2.961146116256714, 3.0799951553344727, 3.1988444328308105, 3.3176934719085693, 3.436542510986328, 3.555391550064087, 3.6742405891418457, 3.7930898666381836]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 1.0, 6.0, 9.0, 11.0, 14.0, 19.0, 34.0, 42.0, 63.0, 93.0, 133.0, 204.0, 350.0, 623.0, 1014.0, 1810.0, 3646.0, 7699.0, 17302.0, 40816.0, 94846.0, 197873.0, 281008.0, 212876.0, 105690.0, 45694.0, 19488.0, 8629.0, 4009.0, 1946.0, 1009.0, 563.0, 348.0, 231.0, 153.0, 98.0, 63.0, 49.0, 33.0, 16.0, 17.0, 7.0, 5.0, 7.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.9140625, -3.77703857421875, -3.6400146484375, -3.50299072265625, -3.365966796875, -3.22894287109375, -3.0919189453125, -2.95489501953125, -2.81787109375, -2.68084716796875, -2.5438232421875, -2.40679931640625, -2.269775390625, -2.13275146484375, -1.9957275390625, -1.85870361328125, -1.7216796875, -1.58465576171875, -1.4476318359375, -1.31060791015625, -1.173583984375, -1.03656005859375, -0.8995361328125, -0.76251220703125, -0.62548828125, -0.48846435546875, -0.3514404296875, -0.21441650390625, -0.077392578125, 0.05963134765625, 0.1966552734375, 0.33367919921875, 0.470703125, 0.60772705078125, 0.7447509765625, 0.88177490234375, 1.018798828125, 1.15582275390625, 1.2928466796875, 1.42987060546875, 1.56689453125, 1.70391845703125, 1.8409423828125, 1.97796630859375, 2.114990234375, 2.25201416015625, 2.3890380859375, 2.52606201171875, 2.6630859375, 2.80010986328125, 2.9371337890625, 3.07415771484375, 3.211181640625, 3.34820556640625, 3.4852294921875, 3.62225341796875, 3.75927734375, 3.89630126953125, 4.0333251953125, 4.17034912109375, 4.307373046875, 4.44439697265625, 4.5814208984375, 4.71844482421875, 4.85546875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 0.0, 4.0, 2.0, 8.0, 1.0, 5.0, 12.0, 9.0, 8.0, 18.0, 19.0, 13.0, 14.0, 18.0, 25.0, 24.0, 30.0, 32.0, 31.0, 47.0, 27.0, 49.0, 45.0, 38.0, 49.0, 43.0, 33.0, 42.0, 38.0, 39.0, 37.0, 29.0, 18.0, 30.0, 31.0, 17.0, 15.0, 14.0, 24.0, 11.0, 8.0, 7.0, 9.0, 9.0, 9.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.7861328125, -1.73419189453125, -1.6822509765625, -1.63031005859375, -1.578369140625, -1.52642822265625, -1.4744873046875, -1.42254638671875, -1.37060546875, -1.31866455078125, -1.2667236328125, -1.21478271484375, -1.162841796875, -1.11090087890625, -1.0589599609375, -1.00701904296875, -0.955078125, -0.90313720703125, -0.8511962890625, -0.79925537109375, -0.747314453125, -0.69537353515625, -0.6434326171875, -0.59149169921875, -0.53955078125, -0.48760986328125, -0.4356689453125, -0.38372802734375, -0.331787109375, -0.27984619140625, -0.2279052734375, -0.17596435546875, -0.1240234375, -0.07208251953125, -0.0201416015625, 0.03179931640625, 0.083740234375, 0.13568115234375, 0.1876220703125, 0.23956298828125, 0.29150390625, 0.34344482421875, 0.3953857421875, 0.44732666015625, 0.499267578125, 0.55120849609375, 0.6031494140625, 0.65509033203125, 0.70703125, 0.75897216796875, 0.8109130859375, 0.86285400390625, 0.914794921875, 0.96673583984375, 1.0186767578125, 1.07061767578125, 1.12255859375, 1.17449951171875, 1.2264404296875, 1.27838134765625, 1.330322265625, 1.38226318359375, 1.4342041015625, 1.48614501953125, 1.5380859375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 7.0, 3.0, 4.0, 13.0, 8.0, 17.0, 16.0, 36.0, 39.0, 68.0, 102.0, 139.0, 205.0, 336.0, 516.0, 850.0, 1673.0, 5033.0, 29932.0, 289221.0, 621058.0, 83179.0, 10505.0, 2621.0, 1114.0, 661.0, 424.0, 254.0, 164.0, 148.0, 79.0, 38.0, 43.0, 17.0, 5.0, 7.0, 10.0, 4.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.703125, -9.4111328125, -9.119140625, -8.8271484375, -8.53515625, -8.2431640625, -7.951171875, -7.6591796875, -7.3671875, -7.0751953125, -6.783203125, -6.4912109375, -6.19921875, -5.9072265625, -5.615234375, -5.3232421875, -5.03125, -4.7392578125, -4.447265625, -4.1552734375, -3.86328125, -3.5712890625, -3.279296875, -2.9873046875, -2.6953125, -2.4033203125, -2.111328125, -1.8193359375, -1.52734375, -1.2353515625, -0.943359375, -0.6513671875, -0.359375, -0.0673828125, 0.224609375, 0.5166015625, 0.80859375, 1.1005859375, 1.392578125, 1.6845703125, 1.9765625, 2.2685546875, 2.560546875, 2.8525390625, 3.14453125, 3.4365234375, 3.728515625, 4.0205078125, 4.3125, 4.6044921875, 4.896484375, 5.1884765625, 5.48046875, 5.7724609375, 6.064453125, 6.3564453125, 6.6484375, 6.9404296875, 7.232421875, 7.5244140625, 7.81640625, 8.1083984375, 8.400390625, 8.6923828125, 8.984375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 4.0, 3.0, 7.0, 6.0, 6.0, 7.0, 10.0, 10.0, 22.0, 16.0, 31.0, 35.0, 38.0, 46.0, 57.0, 56.0, 55.0, 60.0, 54.0, 66.0, 73.0, 59.0, 62.0, 44.0, 36.0, 38.0, 32.0, 25.0, 16.0, 12.0, 15.0, 5.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.203125, -6.8529052734375, -6.502685546875, -6.1524658203125, -5.80224609375, -5.4520263671875, -5.101806640625, -4.7515869140625, -4.4013671875, -4.0511474609375, -3.700927734375, -3.3507080078125, -3.00048828125, -2.6502685546875, -2.300048828125, -1.9498291015625, -1.599609375, -1.2493896484375, -0.899169921875, -0.5489501953125, -0.19873046875, 0.1514892578125, 0.501708984375, 0.8519287109375, 1.2021484375, 1.5523681640625, 1.902587890625, 2.2528076171875, 2.60302734375, 2.9532470703125, 3.303466796875, 3.6536865234375, 4.00390625, 4.3541259765625, 4.704345703125, 5.0545654296875, 5.40478515625, 5.7550048828125, 6.105224609375, 6.4554443359375, 6.8056640625, 7.1558837890625, 7.506103515625, 7.8563232421875, 8.20654296875, 8.5567626953125, 8.906982421875, 9.2572021484375, 9.607421875, 9.9576416015625, 10.307861328125, 10.6580810546875, 11.00830078125, 11.3585205078125, 11.708740234375, 12.0589599609375, 12.4091796875, 12.7593994140625, 13.109619140625, 13.4598388671875, 13.81005859375, 14.1602783203125, 14.510498046875, 14.8607177734375, 15.2109375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 0.0, 4.0, 2.0, 7.0, 13.0, 10.0, 15.0, 17.0, 41.0, 40.0, 60.0, 81.0, 134.0, 190.0, 332.0, 710.0, 1509.0, 4413.0, 17120.0, 100001.0, 580548.0, 288833.0, 41274.0, 8447.0, 2503.0, 999.0, 494.0, 275.0, 147.0, 97.0, 58.0, 48.0, 35.0, 20.0, 28.0, 12.0, 12.0, 9.0, 10.0, 6.0, 0.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.818359375, -3.698150634765625, -3.57794189453125, -3.457733154296875, -3.3375244140625, -3.217315673828125, -3.09710693359375, -2.976898193359375, -2.856689453125, -2.736480712890625, -2.61627197265625, -2.496063232421875, -2.3758544921875, -2.255645751953125, -2.13543701171875, -2.015228271484375, -1.89501953125, -1.774810791015625, -1.65460205078125, -1.534393310546875, -1.4141845703125, -1.293975830078125, -1.17376708984375, -1.053558349609375, -0.933349609375, -0.813140869140625, -0.69293212890625, -0.572723388671875, -0.4525146484375, -0.332305908203125, -0.21209716796875, -0.091888427734375, 0.0283203125, 0.148529052734375, 0.26873779296875, 0.388946533203125, 0.5091552734375, 0.629364013671875, 0.74957275390625, 0.869781494140625, 0.989990234375, 1.110198974609375, 1.23040771484375, 1.350616455078125, 1.4708251953125, 1.591033935546875, 1.71124267578125, 1.831451416015625, 1.95166015625, 2.071868896484375, 2.19207763671875, 2.312286376953125, 2.4324951171875, 2.552703857421875, 2.67291259765625, 2.793121337890625, 2.913330078125, 3.033538818359375, 3.15374755859375, 3.273956298828125, 3.3941650390625, 3.514373779296875, 3.63458251953125, 3.754791259765625, 3.875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 8.0, 11.0, 11.0, 17.0, 15.0, 14.0, 30.0, 36.0, 53.0, 62.0, 65.0, 98.0, 109.0, 106.0, 84.0, 64.0, 49.0, 36.0, 26.0, 27.0, 21.0, 20.0, 9.0, 7.0, 7.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0004267692565917969, -0.00040775537490844727, -0.00038874149322509766, -0.00036972761154174805, -0.00035071372985839844, -0.00033169984817504883, -0.0003126859664916992, -0.0002936720848083496, -0.000274658203125, -0.0002556443214416504, -0.00023663043975830078, -0.00021761655807495117, -0.00019860267639160156, -0.00017958879470825195, -0.00016057491302490234, -0.00014156103134155273, -0.00012254714965820312, -0.00010353326797485352, -8.45193862915039e-05, -6.55055046081543e-05, -4.649162292480469e-05, -2.7477741241455078e-05, -8.463859558105469e-06, 1.055002212524414e-05, 2.956390380859375e-05, 4.857778549194336e-05, 6.759166717529297e-05, 8.660554885864258e-05, 0.00010561943054199219, 0.0001246333122253418, 0.0001436471939086914, 0.00016266107559204102, 0.00018167495727539062, 0.00020068883895874023, 0.00021970272064208984, 0.00023871660232543945, 0.00025773048400878906, 0.00027674436569213867, 0.0002957582473754883, 0.0003147721290588379, 0.0003337860107421875, 0.0003527998924255371, 0.0003718137741088867, 0.00039082765579223633, 0.00040984153747558594, 0.00042885541915893555, 0.00044786930084228516, 0.00046688318252563477, 0.0004858970642089844, 0.000504910945892334, 0.0005239248275756836, 0.0005429387092590332, 0.0005619525909423828, 0.0005809664726257324, 0.000599980354309082, 0.0006189942359924316, 0.0006380081176757812, 0.0006570219993591309, 0.0006760358810424805, 0.0006950497627258301, 0.0007140636444091797, 0.0007330775260925293, 0.0007520914077758789, 0.0007711052894592285, 0.0007901191711425781]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 7.0, 9.0, 17.0, 17.0, 31.0, 45.0, 87.0, 125.0, 210.0, 382.0, 700.0, 1545.0, 4338.0, 18702.0, 160823.0, 701910.0, 136297.0, 16259.0, 3904.0, 1472.0, 715.0, 361.0, 194.0, 135.0, 83.0, 55.0, 40.0, 26.0, 19.0, 6.0, 4.0, 4.0, 6.0, 2.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.48828125, -4.34564208984375, -4.2030029296875, -4.06036376953125, -3.917724609375, -3.77508544921875, -3.6324462890625, -3.48980712890625, -3.34716796875, -3.20452880859375, -3.0618896484375, -2.91925048828125, -2.776611328125, -2.63397216796875, -2.4913330078125, -2.34869384765625, -2.2060546875, -2.06341552734375, -1.9207763671875, -1.77813720703125, -1.635498046875, -1.49285888671875, -1.3502197265625, -1.20758056640625, -1.06494140625, -0.92230224609375, -0.7796630859375, -0.63702392578125, -0.494384765625, -0.35174560546875, -0.2091064453125, -0.06646728515625, 0.076171875, 0.21881103515625, 0.3614501953125, 0.50408935546875, 0.646728515625, 0.78936767578125, 0.9320068359375, 1.07464599609375, 1.21728515625, 1.35992431640625, 1.5025634765625, 1.64520263671875, 1.787841796875, 1.93048095703125, 2.0731201171875, 2.21575927734375, 2.3583984375, 2.50103759765625, 2.6436767578125, 2.78631591796875, 2.928955078125, 3.07159423828125, 3.2142333984375, 3.35687255859375, 3.49951171875, 3.64215087890625, 3.7847900390625, 3.92742919921875, 4.070068359375, 4.21270751953125, 4.3553466796875, 4.49798583984375, 4.640625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 4.0, 4.0, 6.0, 9.0, 8.0, 13.0, 13.0, 29.0, 32.0, 35.0, 45.0, 47.0, 59.0, 61.0, 89.0, 67.0, 79.0, 92.0, 72.0, 48.0, 54.0, 35.0, 25.0, 20.0, 15.0, 8.0, 9.0, 8.0, 5.0, 10.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.07421875, -2.972747802734375, -2.87127685546875, -2.769805908203125, -2.6683349609375, -2.566864013671875, -2.46539306640625, -2.363922119140625, -2.262451171875, -2.160980224609375, -2.05950927734375, -1.958038330078125, -1.8565673828125, -1.755096435546875, -1.65362548828125, -1.552154541015625, -1.45068359375, -1.349212646484375, -1.24774169921875, -1.146270751953125, -1.0447998046875, -0.943328857421875, -0.84185791015625, -0.740386962890625, -0.638916015625, -0.537445068359375, -0.43597412109375, -0.334503173828125, -0.2330322265625, -0.131561279296875, -0.03009033203125, 0.071380615234375, 0.1728515625, 0.274322509765625, 0.37579345703125, 0.477264404296875, 0.5787353515625, 0.680206298828125, 0.78167724609375, 0.883148193359375, 0.984619140625, 1.086090087890625, 1.18756103515625, 1.289031982421875, 1.3905029296875, 1.491973876953125, 1.59344482421875, 1.694915771484375, 1.79638671875, 1.897857666015625, 1.99932861328125, 2.100799560546875, 2.2022705078125, 2.303741455078125, 2.40521240234375, 2.506683349609375, 2.608154296875, 2.709625244140625, 2.81109619140625, 2.912567138671875, 3.0140380859375, 3.115509033203125, 3.21697998046875, 3.318450927734375, 3.419921875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 2.0, 5.0, 11.0, 33.0, 97.0, 207.0, 233.0, 215.0, 124.0, 52.0, 16.0, 9.0, 2.0, 5.0, 2.0, 1.0], "bins": [-192.97793579101562, -189.45066833496094, -185.9234161376953, -182.39614868164062, -178.868896484375, -175.3416290283203, -171.81436157226562, -168.287109375, -164.7598419189453, -161.23257446289062, -157.705322265625, -154.1780548095703, -150.65078735351562, -147.12353515625, -143.5962677001953, -140.0690155029297, -136.541748046875, -133.0144805908203, -129.4872283935547, -125.9599609375, -122.43270111083984, -118.90544128417969, -115.378173828125, -111.85091400146484, -108.32365417480469, -104.79639434814453, -101.26913452148438, -97.74186706542969, -94.21460723876953, -90.68734741210938, -87.16007995605469, -83.63282012939453, -80.10556030273438, -76.57830047607422, -73.05104064941406, -69.52377319335938, -65.99651336669922, -62.46925354003906, -58.94198989868164, -55.41472625732422, -51.88747024536133, -48.360206604003906, -44.83294677734375, -41.305686950683594, -37.77842330932617, -34.25115966796875, -30.723899841308594, -27.196638107299805, -23.669376373291016, -20.142114639282227, -16.614852905273438, -13.087591171264648, -9.56032943725586, -6.03306770324707, -2.5058059692382812, 1.0214557647705078, 4.548717498779297, 8.075979232788086, 11.603240966796875, 15.130502700805664, 18.657764434814453, 22.185026168823242, 25.71228790283203, 29.23954963684082, 32.76681137084961]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 6.0, 8.0, 12.0, 8.0, 13.0, 19.0, 32.0, 23.0, 23.0, 35.0, 29.0, 55.0, 39.0, 56.0, 68.0, 59.0, 58.0, 58.0, 51.0, 46.0, 45.0, 46.0, 33.0, 31.0, 26.0, 16.0, 12.0, 20.0, 21.0, 6.0, 13.0, 9.0, 7.0, 6.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-46.29984664916992, -44.992916107177734, -43.68598175048828, -42.379051208496094, -41.07211685180664, -39.76518630981445, -38.458251953125, -37.15132141113281, -35.844390869140625, -34.53746032714844, -33.230525970458984, -31.923593521118164, -30.616661071777344, -29.309730529785156, -28.002798080444336, -26.695865631103516, -25.388931274414062, -24.081998825073242, -22.775066375732422, -21.4681339263916, -20.16120147705078, -18.854270935058594, -17.547338485717773, -16.240406036376953, -14.933473587036133, -13.626541137695312, -12.319608688354492, -11.012677192687988, -9.705744743347168, -8.398812294006348, -7.0918803215026855, -5.784948348999023, -4.4780120849609375, -3.1710798740386963, -1.864147663116455, -0.5572154521942139, 0.7497167587280273, 2.0566492080688477, 3.3635811805725098, 4.670513153076172, 5.977445602416992, 7.2843780517578125, 8.591310501098633, 9.898241996765137, 11.205174446105957, 12.512106895446777, 13.819038391113281, 15.125970840454102, 16.432903289794922, 17.739835739135742, 19.046768188476562, 20.353700637817383, 21.660633087158203, 22.96756362915039, 24.27449607849121, 25.58142852783203, 26.88836097717285, 28.195293426513672, 29.502225875854492, 30.809158325195312, 32.1160888671875, 33.42302322387695, 34.72995376586914, 36.036888122558594, 37.34381866455078]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 10.0, 12.0, 7.0, 27.0, 32.0, 38.0, 74.0, 121.0, 223.0, 449.0, 912.0, 1836.0, 4895.0, 18955.0, 3882754.0, 260128.0, 16018.0, 4336.0, 1714.0, 784.0, 397.0, 210.0, 135.0, 81.0, 46.0, 21.0, 19.0, 10.0, 3.0, 8.0, 3.0, 4.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-16.96875, -16.4967041015625, -16.024658203125, -15.5526123046875, -15.08056640625, -14.6085205078125, -14.136474609375, -13.6644287109375, -13.1923828125, -12.7203369140625, -12.248291015625, -11.7762451171875, -11.30419921875, -10.8321533203125, -10.360107421875, -9.8880615234375, -9.416015625, -8.9439697265625, -8.471923828125, -7.9998779296875, -7.52783203125, -7.0557861328125, -6.583740234375, -6.1116943359375, -5.6396484375, -5.1676025390625, -4.695556640625, -4.2235107421875, -3.75146484375, -3.2794189453125, -2.807373046875, -2.3353271484375, -1.86328125, -1.3912353515625, -0.919189453125, -0.4471435546875, 0.02490234375, 0.4969482421875, 0.968994140625, 1.4410400390625, 1.9130859375, 2.3851318359375, 2.857177734375, 3.3292236328125, 3.80126953125, 4.2733154296875, 4.745361328125, 5.2174072265625, 5.689453125, 6.1614990234375, 6.633544921875, 7.1055908203125, 7.57763671875, 8.0496826171875, 8.521728515625, 8.9937744140625, 9.4658203125, 9.9378662109375, 10.409912109375, 10.8819580078125, 11.35400390625, 11.8260498046875, 12.298095703125, 12.7701416015625, 13.2421875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 4.0, 6.0, 6.0, 16.0, 8.0, 9.0, 16.0, 18.0, 16.0, 15.0, 26.0, 34.0, 28.0, 35.0, 37.0, 45.0, 51.0, 47.0, 51.0, 45.0, 43.0, 44.0, 52.0, 41.0, 39.0, 32.0, 30.0, 22.0, 26.0, 29.0, 14.0, 19.0, 22.0, 15.0, 10.0, 10.0, 9.0, 9.0, 5.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.86328125, -1.805908203125, -1.74853515625, -1.691162109375, -1.6337890625, -1.576416015625, -1.51904296875, -1.461669921875, -1.404296875, -1.346923828125, -1.28955078125, -1.232177734375, -1.1748046875, -1.117431640625, -1.06005859375, -1.002685546875, -0.9453125, -0.887939453125, -0.83056640625, -0.773193359375, -0.7158203125, -0.658447265625, -0.60107421875, -0.543701171875, -0.486328125, -0.428955078125, -0.37158203125, -0.314208984375, -0.2568359375, -0.199462890625, -0.14208984375, -0.084716796875, -0.02734375, 0.030029296875, 0.08740234375, 0.144775390625, 0.2021484375, 0.259521484375, 0.31689453125, 0.374267578125, 0.431640625, 0.489013671875, 0.54638671875, 0.603759765625, 0.6611328125, 0.718505859375, 0.77587890625, 0.833251953125, 0.890625, 0.947998046875, 1.00537109375, 1.062744140625, 1.1201171875, 1.177490234375, 1.23486328125, 1.292236328125, 1.349609375, 1.406982421875, 1.46435546875, 1.521728515625, 1.5791015625, 1.636474609375, 1.69384765625, 1.751220703125, 1.80859375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 9.0, 4.0, 13.0, 18.0, 15.0, 23.0, 58.0, 46.0, 73.0, 104.0, 124.0, 172.0, 263.0, 387.0, 645.0, 973.0, 1815.0, 3794.0, 9315.0, 29852.0, 219862.0, 3845128.0, 55967.0, 14245.0, 5287.0, 2424.0, 1331.0, 742.0, 467.0, 313.0, 237.0, 158.0, 117.0, 88.0, 56.0, 35.0, 36.0, 21.0, 25.0, 14.0, 7.0, 5.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.6796875, -6.49517822265625, -6.3106689453125, -6.12615966796875, -5.941650390625, -5.75714111328125, -5.5726318359375, -5.38812255859375, -5.20361328125, -5.01910400390625, -4.8345947265625, -4.65008544921875, -4.465576171875, -4.28106689453125, -4.0965576171875, -3.91204833984375, -3.7275390625, -3.54302978515625, -3.3585205078125, -3.17401123046875, -2.989501953125, -2.80499267578125, -2.6204833984375, -2.43597412109375, -2.25146484375, -2.06695556640625, -1.8824462890625, -1.69793701171875, -1.513427734375, -1.32891845703125, -1.1444091796875, -0.95989990234375, -0.775390625, -0.59088134765625, -0.4063720703125, -0.22186279296875, -0.037353515625, 0.14715576171875, 0.3316650390625, 0.51617431640625, 0.70068359375, 0.88519287109375, 1.0697021484375, 1.25421142578125, 1.438720703125, 1.62322998046875, 1.8077392578125, 1.99224853515625, 2.1767578125, 2.36126708984375, 2.5457763671875, 2.73028564453125, 2.914794921875, 3.09930419921875, 3.2838134765625, 3.46832275390625, 3.65283203125, 3.83734130859375, 4.0218505859375, 4.20635986328125, 4.390869140625, 4.57537841796875, 4.7598876953125, 4.94439697265625, 5.12890625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 2.0, 4.0, 7.0, 10.0, 14.0, 19.0, 26.0, 50.0, 115.0, 2841.0, 709.0, 120.0, 54.0, 38.0, 14.0, 16.0, 9.0, 6.0, 2.0, 3.0, 6.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7607421875, -1.713134765625, -1.66552734375, -1.617919921875, -1.5703125, -1.522705078125, -1.47509765625, -1.427490234375, -1.3798828125, -1.332275390625, -1.28466796875, -1.237060546875, -1.189453125, -1.141845703125, -1.09423828125, -1.046630859375, -0.9990234375, -0.951416015625, -0.90380859375, -0.856201171875, -0.80859375, -0.760986328125, -0.71337890625, -0.665771484375, -0.6181640625, -0.570556640625, -0.52294921875, -0.475341796875, -0.427734375, -0.380126953125, -0.33251953125, -0.284912109375, -0.2373046875, -0.189697265625, -0.14208984375, -0.094482421875, -0.046875, 0.000732421875, 0.04833984375, 0.095947265625, 0.1435546875, 0.191162109375, 0.23876953125, 0.286376953125, 0.333984375, 0.381591796875, 0.42919921875, 0.476806640625, 0.5244140625, 0.572021484375, 0.61962890625, 0.667236328125, 0.71484375, 0.762451171875, 0.81005859375, 0.857666015625, 0.9052734375, 0.952880859375, 1.00048828125, 1.048095703125, 1.095703125, 1.143310546875, 1.19091796875, 1.238525390625, 1.2861328125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 21.0, 71.0, 235.0, 342.0, 222.0, 73.0, 22.0, 8.0, 7.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.13338279724121, -22.623214721679688, -22.113046646118164, -21.60287857055664, -21.09271240234375, -20.582544326782227, -20.072376251220703, -19.56220817565918, -19.052040100097656, -18.541872024536133, -18.03170394897461, -17.52153778076172, -17.011369705200195, -16.501201629638672, -15.991033554077148, -15.480865478515625, -14.970698356628418, -14.460530281066895, -13.950363159179688, -13.440195083618164, -12.93002700805664, -12.419858932495117, -11.90969181060791, -11.399523735046387, -10.88935661315918, -10.379188537597656, -9.86902141571045, -9.358853340148926, -8.848685264587402, -8.338518142700195, -7.828350067138672, -7.318181991577148, -6.808012962341309, -6.297845363616943, -5.78767728805542, -5.277509689331055, -4.767341613769531, -4.257174015045166, -3.747006416320801, -3.2368385791778564, -2.726670742034912, -2.2165029048919678, -1.706335186958313, -1.1961674690246582, -0.6859996318817139, -0.17583179473876953, 0.3343358039855957, 0.84450364112854, 1.3546714782714844, 1.8648393154144287, 2.375007152557373, 2.8851747512817383, 3.3953425884246826, 3.905510425567627, 4.415678024291992, 4.925846099853516, 5.436013698577881, 5.946181297302246, 6.4563493728637695, 6.966516971588135, 7.4766845703125, 7.986852645874023, 8.497020721435547, 9.007187843322754, 9.517355918884277]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 5.0, 9.0, 11.0, 14.0, 21.0, 20.0, 33.0, 33.0, 43.0, 46.0, 58.0, 59.0, 55.0, 59.0, 71.0, 69.0, 61.0, 50.0, 43.0, 42.0, 40.0, 33.0, 34.0, 21.0, 18.0, 9.0, 14.0, 7.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-5.2452592849731445, -5.111111164093018, -4.976963043212891, -4.842814922332764, -4.708666801452637, -4.574518203735352, -4.440370082855225, -4.306221961975098, -4.172073841094971, -4.037925720214844, -3.903777599334717, -3.7696292400360107, -3.635481119155884, -3.501332998275757, -3.367184638977051, -3.233036518096924, -3.098888397216797, -2.96474027633667, -2.830592155456543, -2.696443796157837, -2.56229567527771, -2.428147554397583, -2.293999195098877, -2.15985107421875, -2.025702953338623, -1.891554832458496, -1.7574065923690796, -1.623258352279663, -1.4891102313995361, -1.3549621105194092, -1.2208138704299927, -1.0866656303405762, -0.9525177478790283, -0.8183695673942566, -0.6842213869094849, -0.5500732064247131, -0.4159250259399414, -0.2817768454551697, -0.14762866497039795, -0.01348048448562622, 0.12066769599914551, 0.25481587648391724, 0.38896405696868896, 0.5231122374534607, 0.6572604179382324, 0.7914085984230042, 0.9255567789077759, 1.0597050189971924, 1.1938531398773193, 1.3280012607574463, 1.4621495008468628, 1.5962977409362793, 1.7304458618164062, 1.8645939826965332, 1.9987422227859497, 2.132890462875366, 2.267038583755493, 2.40118670463562, 2.535335063934326, 2.669483184814453, 2.80363130569458, 2.937779426574707, 3.071927547454834, 3.20607590675354, 3.340224027633667]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 6.0, 8.0, 5.0, 18.0, 15.0, 27.0, 39.0, 64.0, 83.0, 178.0, 309.0, 515.0, 996.0, 2073.0, 4604.0, 10830.0, 27946.0, 72838.0, 176118.0, 313919.0, 250413.0, 112802.0, 44310.0, 17355.0, 6905.0, 3120.0, 1348.0, 728.0, 383.0, 226.0, 142.0, 78.0, 48.0, 28.0, 30.0, 18.0, 7.0, 8.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.34765625, -4.20147705078125, -4.0552978515625, -3.90911865234375, -3.762939453125, -3.61676025390625, -3.4705810546875, -3.32440185546875, -3.17822265625, -3.03204345703125, -2.8858642578125, -2.73968505859375, -2.593505859375, -2.44732666015625, -2.3011474609375, -2.15496826171875, -2.0087890625, -1.86260986328125, -1.7164306640625, -1.57025146484375, -1.424072265625, -1.27789306640625, -1.1317138671875, -0.98553466796875, -0.83935546875, -0.69317626953125, -0.5469970703125, -0.40081787109375, -0.254638671875, -0.10845947265625, 0.0377197265625, 0.18389892578125, 0.330078125, 0.47625732421875, 0.6224365234375, 0.76861572265625, 0.914794921875, 1.06097412109375, 1.2071533203125, 1.35333251953125, 1.49951171875, 1.64569091796875, 1.7918701171875, 1.93804931640625, 2.084228515625, 2.23040771484375, 2.3765869140625, 2.52276611328125, 2.6689453125, 2.81512451171875, 2.9613037109375, 3.10748291015625, 3.253662109375, 3.39984130859375, 3.5460205078125, 3.69219970703125, 3.83837890625, 3.98455810546875, 4.1307373046875, 4.27691650390625, 4.423095703125, 4.56927490234375, 4.7154541015625, 4.86163330078125, 5.0078125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 7.0, 10.0, 6.0, 13.0, 10.0, 7.0, 12.0, 22.0, 11.0, 24.0, 25.0, 25.0, 33.0, 26.0, 36.0, 48.0, 32.0, 49.0, 48.0, 43.0, 53.0, 55.0, 43.0, 37.0, 34.0, 38.0, 34.0, 28.0, 37.0, 25.0, 20.0, 18.0, 16.0, 13.0, 12.0, 8.0, 9.0, 12.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8818359375, -1.8245697021484375, -1.767303466796875, -1.7100372314453125, -1.65277099609375, -1.5955047607421875, -1.538238525390625, -1.4809722900390625, -1.4237060546875, -1.3664398193359375, -1.309173583984375, -1.2519073486328125, -1.19464111328125, -1.1373748779296875, -1.080108642578125, -1.0228424072265625, -0.965576171875, -0.9083099365234375, -0.851043701171875, -0.7937774658203125, -0.73651123046875, -0.6792449951171875, -0.621978759765625, -0.5647125244140625, -0.5074462890625, -0.4501800537109375, -0.392913818359375, -0.3356475830078125, -0.27838134765625, -0.2211151123046875, -0.163848876953125, -0.1065826416015625, -0.04931640625, 0.0079498291015625, 0.065216064453125, 0.1224822998046875, 0.17974853515625, 0.2370147705078125, 0.294281005859375, 0.3515472412109375, 0.4088134765625, 0.4660797119140625, 0.523345947265625, 0.5806121826171875, 0.63787841796875, 0.6951446533203125, 0.752410888671875, 0.8096771240234375, 0.866943359375, 0.9242095947265625, 0.981475830078125, 1.0387420654296875, 1.09600830078125, 1.1532745361328125, 1.210540771484375, 1.2678070068359375, 1.3250732421875, 1.3823394775390625, 1.439605712890625, 1.4968719482421875, 1.55413818359375, 1.6114044189453125, 1.668670654296875, 1.7259368896484375, 1.783203125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 16.0, 20.0, 23.0, 54.0, 68.0, 159.0, 233.0, 386.0, 731.0, 1474.0, 5533.0, 61933.0, 767995.0, 193694.0, 11817.0, 2285.0, 969.0, 458.0, 295.0, 170.0, 94.0, 57.0, 33.0, 21.0, 12.0, 5.0, 7.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9296875, -12.5673828125, -12.205078125, -11.8427734375, -11.48046875, -11.1181640625, -10.755859375, -10.3935546875, -10.03125, -9.6689453125, -9.306640625, -8.9443359375, -8.58203125, -8.2197265625, -7.857421875, -7.4951171875, -7.1328125, -6.7705078125, -6.408203125, -6.0458984375, -5.68359375, -5.3212890625, -4.958984375, -4.5966796875, -4.234375, -3.8720703125, -3.509765625, -3.1474609375, -2.78515625, -2.4228515625, -2.060546875, -1.6982421875, -1.3359375, -0.9736328125, -0.611328125, -0.2490234375, 0.11328125, 0.4755859375, 0.837890625, 1.2001953125, 1.5625, 1.9248046875, 2.287109375, 2.6494140625, 3.01171875, 3.3740234375, 3.736328125, 4.0986328125, 4.4609375, 4.8232421875, 5.185546875, 5.5478515625, 5.91015625, 6.2724609375, 6.634765625, 6.9970703125, 7.359375, 7.7216796875, 8.083984375, 8.4462890625, 8.80859375, 9.1708984375, 9.533203125, 9.8955078125, 10.2578125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 6.0, 5.0, 7.0, 10.0, 9.0, 15.0, 26.0, 30.0, 37.0, 29.0, 48.0, 41.0, 49.0, 51.0, 49.0, 59.0, 71.0, 73.0, 59.0, 50.0, 47.0, 44.0, 37.0, 29.0, 27.0, 26.0, 18.0, 16.0, 19.0, 6.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-13.578125, -13.24072265625, -12.9033203125, -12.56591796875, -12.228515625, -11.89111328125, -11.5537109375, -11.21630859375, -10.87890625, -10.54150390625, -10.2041015625, -9.86669921875, -9.529296875, -9.19189453125, -8.8544921875, -8.51708984375, -8.1796875, -7.84228515625, -7.5048828125, -7.16748046875, -6.830078125, -6.49267578125, -6.1552734375, -5.81787109375, -5.48046875, -5.14306640625, -4.8056640625, -4.46826171875, -4.130859375, -3.79345703125, -3.4560546875, -3.11865234375, -2.78125, -2.44384765625, -2.1064453125, -1.76904296875, -1.431640625, -1.09423828125, -0.7568359375, -0.41943359375, -0.08203125, 0.25537109375, 0.5927734375, 0.93017578125, 1.267578125, 1.60498046875, 1.9423828125, 2.27978515625, 2.6171875, 2.95458984375, 3.2919921875, 3.62939453125, 3.966796875, 4.30419921875, 4.6416015625, 4.97900390625, 5.31640625, 5.65380859375, 5.9912109375, 6.32861328125, 6.666015625, 7.00341796875, 7.3408203125, 7.67822265625, 8.015625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 5.0, 1.0, 5.0, 4.0, 2.0, 3.0, 2.0, 8.0, 6.0, 15.0, 19.0, 28.0, 40.0, 64.0, 94.0, 123.0, 338.0, 1009.0, 7360.0, 321962.0, 702493.0, 12824.0, 1342.0, 390.0, 152.0, 84.0, 54.0, 29.0, 20.0, 19.0, 12.0, 11.0, 9.0, 6.0, 8.0, 5.0, 2.0, 3.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3046875, -9.0235595703125, -8.742431640625, -8.4613037109375, -8.18017578125, -7.8990478515625, -7.617919921875, -7.3367919921875, -7.0556640625, -6.7745361328125, -6.493408203125, -6.2122802734375, -5.93115234375, -5.6500244140625, -5.368896484375, -5.0877685546875, -4.806640625, -4.5255126953125, -4.244384765625, -3.9632568359375, -3.68212890625, -3.4010009765625, -3.119873046875, -2.8387451171875, -2.5576171875, -2.2764892578125, -1.995361328125, -1.7142333984375, -1.43310546875, -1.1519775390625, -0.870849609375, -0.5897216796875, -0.30859375, -0.0274658203125, 0.253662109375, 0.5347900390625, 0.81591796875, 1.0970458984375, 1.378173828125, 1.6593017578125, 1.9404296875, 2.2215576171875, 2.502685546875, 2.7838134765625, 3.06494140625, 3.3460693359375, 3.627197265625, 3.9083251953125, 4.189453125, 4.4705810546875, 4.751708984375, 5.0328369140625, 5.31396484375, 5.5950927734375, 5.876220703125, 6.1573486328125, 6.4384765625, 6.7196044921875, 7.000732421875, 7.2818603515625, 7.56298828125, 7.8441162109375, 8.125244140625, 8.4063720703125, 8.6875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 7.0, 3.0, 8.0, 7.0, 16.0, 16.0, 24.0, 33.0, 24.0, 52.0, 61.0, 93.0, 127.0, 124.0, 108.0, 75.0, 66.0, 43.0, 27.0, 16.0, 22.0, 16.0, 9.0, 8.0, 6.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006780624389648438, -0.0006556734442710876, -0.0006332844495773315, -0.0006108954548835754, -0.0005885064601898193, -0.0005661174654960632, -0.0005437284708023071, -0.000521339476108551, -0.0004989504814147949, -0.0004765614867210388, -0.0004541724920272827, -0.0004317834973335266, -0.0004093945026397705, -0.0003870055079460144, -0.0003646165132522583, -0.0003422275185585022, -0.0003198385238647461, -0.00029744952917099, -0.0002750605344772339, -0.0002526715397834778, -0.00023028254508972168, -0.00020789355039596558, -0.00018550455570220947, -0.00016311556100845337, -0.00014072656631469727, -0.00011833757162094116, -9.594857692718506e-05, -7.355958223342896e-05, -5.117058753967285e-05, -2.8781592845916748e-05, -6.3925981521606445e-06, 1.599639654159546e-05, 3.838539123535156e-05, 6.0774385929107666e-05, 8.316338062286377e-05, 0.00010555237531661987, 0.00012794137001037598, 0.00015033036470413208, 0.00017271935939788818, 0.0001951083540916443, 0.0002174973487854004, 0.0002398863434791565, 0.0002622753381729126, 0.0002846643328666687, 0.0003070533275604248, 0.0003294423222541809, 0.000351831316947937, 0.0003742203116416931, 0.0003966093063354492, 0.0004189983010292053, 0.0004413872957229614, 0.00046377629041671753, 0.00048616528511047363, 0.0005085542798042297, 0.0005309432744979858, 0.0005533322691917419, 0.000575721263885498, 0.0005981102585792542, 0.0006204992532730103, 0.0006428882479667664, 0.0006652772426605225, 0.0006876662373542786, 0.0007100552320480347, 0.0007324442267417908, 0.0007548332214355469]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 3.0, 10.0, 7.0, 14.0, 14.0, 18.0, 35.0, 50.0, 58.0, 72.0, 143.0, 251.0, 494.0, 1019.0, 2510.0, 8912.0, 67923.0, 724111.0, 217347.0, 18489.0, 4063.0, 1491.0, 679.0, 341.0, 165.0, 100.0, 59.0, 49.0, 30.0, 25.0, 11.0, 13.0, 14.0, 7.0, 7.0, 4.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-5.078125, -4.91278076171875, -4.7474365234375, -4.58209228515625, -4.416748046875, -4.25140380859375, -4.0860595703125, -3.92071533203125, -3.75537109375, -3.59002685546875, -3.4246826171875, -3.25933837890625, -3.093994140625, -2.92864990234375, -2.7633056640625, -2.59796142578125, -2.4326171875, -2.26727294921875, -2.1019287109375, -1.93658447265625, -1.771240234375, -1.60589599609375, -1.4405517578125, -1.27520751953125, -1.10986328125, -0.94451904296875, -0.7791748046875, -0.61383056640625, -0.448486328125, -0.28314208984375, -0.1177978515625, 0.04754638671875, 0.212890625, 0.37823486328125, 0.5435791015625, 0.70892333984375, 0.874267578125, 1.03961181640625, 1.2049560546875, 1.37030029296875, 1.53564453125, 1.70098876953125, 1.8663330078125, 2.03167724609375, 2.197021484375, 2.36236572265625, 2.5277099609375, 2.69305419921875, 2.8583984375, 3.02374267578125, 3.1890869140625, 3.35443115234375, 3.519775390625, 3.68511962890625, 3.8504638671875, 4.01580810546875, 4.18115234375, 4.34649658203125, 4.5118408203125, 4.67718505859375, 4.842529296875, 5.00787353515625, 5.1732177734375, 5.33856201171875, 5.50390625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 12.0, 5.0, 16.0, 16.0, 27.0, 36.0, 36.0, 49.0, 75.0, 70.0, 76.0, 95.0, 104.0, 97.0, 73.0, 46.0, 40.0, 33.0, 25.0, 14.0, 15.0, 8.0, 6.0, 5.0, 9.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.79296875, -3.673065185546875, -3.55316162109375, -3.433258056640625, -3.3133544921875, -3.193450927734375, -3.07354736328125, -2.953643798828125, -2.833740234375, -2.713836669921875, -2.59393310546875, -2.474029541015625, -2.3541259765625, -2.234222412109375, -2.11431884765625, -1.994415283203125, -1.87451171875, -1.754608154296875, -1.63470458984375, -1.514801025390625, -1.3948974609375, -1.274993896484375, -1.15509033203125, -1.035186767578125, -0.915283203125, -0.795379638671875, -0.67547607421875, -0.555572509765625, -0.4356689453125, -0.315765380859375, -0.19586181640625, -0.075958251953125, 0.0439453125, 0.163848876953125, 0.28375244140625, 0.403656005859375, 0.5235595703125, 0.643463134765625, 0.76336669921875, 0.883270263671875, 1.003173828125, 1.123077392578125, 1.24298095703125, 1.362884521484375, 1.4827880859375, 1.602691650390625, 1.72259521484375, 1.842498779296875, 1.96240234375, 2.082305908203125, 2.20220947265625, 2.322113037109375, 2.4420166015625, 2.561920166015625, 2.68182373046875, 2.801727294921875, 2.921630859375, 3.041534423828125, 3.16143798828125, 3.281341552734375, 3.4012451171875, 3.521148681640625, 3.64105224609375, 3.760955810546875, 3.880859375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 19.0, 47.0, 92.0, 212.0, 240.0, 179.0, 119.0, 55.0, 16.0, 9.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.25324249267578, -38.23593521118164, -35.2186279296875, -32.201324462890625, -29.184017181396484, -26.166709899902344, -23.149404525756836, -20.132099151611328, -17.114791870117188, -14.097485542297363, -11.080179214477539, -8.062872886657715, -5.045566558837891, -2.0282602310180664, 0.9890460968017578, 4.006351470947266, 7.023658752441406, 10.04096508026123, 13.058271408081055, 16.075576782226562, 19.092884063720703, 22.110191345214844, 25.12749671936035, 28.14480209350586, 31.162109375, 34.17941665649414, 37.19672393798828, 40.214027404785156, 43.2313346862793, 46.24864196777344, 49.26594543457031, 52.28325271606445, 55.300567626953125, 58.317874908447266, 61.335182189941406, 64.35248565673828, 67.36979675292969, 70.38710021972656, 73.40440368652344, 76.42170715332031, 79.43901824951172, 82.4563217163086, 85.4736328125, 88.49093627929688, 91.50823974609375, 94.52555084228516, 97.54285430908203, 100.56016540527344, 103.57746887207031, 106.59477233886719, 109.6120834350586, 112.62938690185547, 115.64669799804688, 118.66400146484375, 121.68130493164062, 124.6986083984375, 127.7159194946289, 130.7332305908203, 133.7505340576172, 136.76783752441406, 139.78514099121094, 142.8024444580078, 145.81976318359375, 148.83706665039062, 151.8543701171875]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 5.0, 4.0, 6.0, 14.0, 14.0, 15.0, 22.0, 20.0, 29.0, 25.0, 35.0, 35.0, 40.0, 46.0, 44.0, 52.0, 40.0, 45.0, 55.0, 56.0, 43.0, 40.0, 41.0, 34.0, 28.0, 38.0, 33.0, 27.0, 30.0, 18.0, 7.0, 13.0, 12.0, 9.0, 6.0, 3.0, 8.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.068565368652344, -36.761741638183594, -35.45492172241211, -34.14809799194336, -32.841278076171875, -31.534454345703125, -30.227632522583008, -28.92081069946289, -27.613988876342773, -26.307167053222656, -25.00034523010254, -23.693523406982422, -22.386699676513672, -21.079879760742188, -19.773056030273438, -18.46623420715332, -17.159412384033203, -15.852590560913086, -14.545768737792969, -13.238945960998535, -11.932124137878418, -10.6253023147583, -9.318479537963867, -8.01165771484375, -6.704835891723633, -5.398014068603516, -4.09119176864624, -2.784369707107544, -1.4775476455688477, -0.17072582244873047, 1.136096477508545, 2.4429187774658203, 3.749736785888672, 5.056558609008789, 6.3633809089660645, 7.67020320892334, 8.977025032043457, 10.283846855163574, 11.590669631958008, 12.897491455078125, 14.204313278198242, 15.51113510131836, 16.817956924438477, 18.124778747558594, 19.431602478027344, 20.738422393798828, 22.045246124267578, 23.352067947387695, 24.658889770507812, 25.96571159362793, 27.272533416748047, 28.579355239868164, 29.88617706298828, 31.19300079345703, 32.499820709228516, 33.806644439697266, 35.11346435546875, 36.4202880859375, 37.727108001708984, 39.033931732177734, 40.34075164794922, 41.64757537841797, 42.95439529418945, 44.2612190246582, 45.56804275512695]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 9.0, 15.0, 15.0, 26.0, 41.0, 80.0, 110.0, 187.0, 405.0, 750.0, 1619.0, 4091.0, 11596.0, 50995.0, 3847049.0, 238783.0, 25968.0, 7476.0, 2676.0, 1158.0, 526.0, 296.0, 158.0, 68.0, 64.0, 37.0, 22.0, 16.0, 11.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-12.4921875, -12.18597412109375, -11.8797607421875, -11.57354736328125, -11.267333984375, -10.96112060546875, -10.6549072265625, -10.34869384765625, -10.04248046875, -9.73626708984375, -9.4300537109375, -9.12384033203125, -8.817626953125, -8.51141357421875, -8.2052001953125, -7.89898681640625, -7.5927734375, -7.28656005859375, -6.9803466796875, -6.67413330078125, -6.367919921875, -6.06170654296875, -5.7554931640625, -5.44927978515625, -5.14306640625, -4.83685302734375, -4.5306396484375, -4.22442626953125, -3.918212890625, -3.61199951171875, -3.3057861328125, -2.99957275390625, -2.693359375, -2.38714599609375, -2.0809326171875, -1.77471923828125, -1.468505859375, -1.16229248046875, -0.8560791015625, -0.54986572265625, -0.24365234375, 0.06256103515625, 0.3687744140625, 0.67498779296875, 0.981201171875, 1.28741455078125, 1.5936279296875, 1.89984130859375, 2.2060546875, 2.51226806640625, 2.8184814453125, 3.12469482421875, 3.430908203125, 3.73712158203125, 4.0433349609375, 4.34954833984375, 4.65576171875, 4.96197509765625, 5.2681884765625, 5.57440185546875, 5.880615234375, 6.18682861328125, 6.4930419921875, 6.79925537109375, 7.10546875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 4.0, 5.0, 2.0, 5.0, 1.0, 1.0, 8.0, 14.0, 4.0, 7.0, 13.0, 17.0, 23.0, 26.0, 18.0, 36.0, 32.0, 35.0, 32.0, 48.0, 60.0, 48.0, 58.0, 55.0, 50.0, 40.0, 49.0, 44.0, 40.0, 38.0, 32.0, 31.0, 31.0, 24.0, 21.0, 12.0, 9.0, 11.0, 5.0, 8.0, 4.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8662109375, -1.806060791015625, -1.74591064453125, -1.685760498046875, -1.6256103515625, -1.565460205078125, -1.50531005859375, -1.445159912109375, -1.385009765625, -1.324859619140625, -1.26470947265625, -1.204559326171875, -1.1444091796875, -1.084259033203125, -1.02410888671875, -0.963958740234375, -0.90380859375, -0.843658447265625, -0.78350830078125, -0.723358154296875, -0.6632080078125, -0.603057861328125, -0.54290771484375, -0.482757568359375, -0.422607421875, -0.362457275390625, -0.30230712890625, -0.242156982421875, -0.1820068359375, -0.121856689453125, -0.06170654296875, -0.001556396484375, 0.05859375, 0.118743896484375, 0.17889404296875, 0.239044189453125, 0.2991943359375, 0.359344482421875, 0.41949462890625, 0.479644775390625, 0.539794921875, 0.599945068359375, 0.66009521484375, 0.720245361328125, 0.7803955078125, 0.840545654296875, 0.90069580078125, 0.960845947265625, 1.02099609375, 1.081146240234375, 1.14129638671875, 1.201446533203125, 1.2615966796875, 1.321746826171875, 1.38189697265625, 1.442047119140625, 1.502197265625, 1.562347412109375, 1.62249755859375, 1.682647705078125, 1.7427978515625, 1.802947998046875, 1.86309814453125, 1.923248291015625, 1.9833984375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 9.0, 1.0, 6.0, 12.0, 20.0, 19.0, 18.0, 27.0, 35.0, 39.0, 59.0, 61.0, 75.0, 107.0, 166.0, 340.0, 1536.0, 9398.0, 248762.0, 3910821.0, 19089.0, 2444.0, 556.0, 207.0, 112.0, 82.0, 48.0, 47.0, 43.0, 41.0, 26.0, 21.0, 16.0, 12.0, 3.0, 9.0, 6.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0546875, -14.58642578125, -14.1181640625, -13.64990234375, -13.181640625, -12.71337890625, -12.2451171875, -11.77685546875, -11.30859375, -10.84033203125, -10.3720703125, -9.90380859375, -9.435546875, -8.96728515625, -8.4990234375, -8.03076171875, -7.5625, -7.09423828125, -6.6259765625, -6.15771484375, -5.689453125, -5.22119140625, -4.7529296875, -4.28466796875, -3.81640625, -3.34814453125, -2.8798828125, -2.41162109375, -1.943359375, -1.47509765625, -1.0068359375, -0.53857421875, -0.0703125, 0.39794921875, 0.8662109375, 1.33447265625, 1.802734375, 2.27099609375, 2.7392578125, 3.20751953125, 3.67578125, 4.14404296875, 4.6123046875, 5.08056640625, 5.548828125, 6.01708984375, 6.4853515625, 6.95361328125, 7.421875, 7.89013671875, 8.3583984375, 8.82666015625, 9.294921875, 9.76318359375, 10.2314453125, 10.69970703125, 11.16796875, 11.63623046875, 12.1044921875, 12.57275390625, 13.041015625, 13.50927734375, 13.9775390625, 14.44580078125, 14.9140625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 14.0, 8.0, 14.0, 44.0, 79.0, 188.0, 2530.0, 902.0, 165.0, 64.0, 25.0, 16.0, 8.0, 11.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.09375, -5.96112060546875, -5.8284912109375, -5.69586181640625, -5.563232421875, -5.43060302734375, -5.2979736328125, -5.16534423828125, -5.03271484375, -4.90008544921875, -4.7674560546875, -4.63482666015625, -4.502197265625, -4.36956787109375, -4.2369384765625, -4.10430908203125, -3.9716796875, -3.83905029296875, -3.7064208984375, -3.57379150390625, -3.441162109375, -3.30853271484375, -3.1759033203125, -3.04327392578125, -2.91064453125, -2.77801513671875, -2.6453857421875, -2.51275634765625, -2.380126953125, -2.24749755859375, -2.1148681640625, -1.98223876953125, -1.849609375, -1.71697998046875, -1.5843505859375, -1.45172119140625, -1.319091796875, -1.18646240234375, -1.0538330078125, -0.92120361328125, -0.78857421875, -0.65594482421875, -0.5233154296875, -0.39068603515625, -0.258056640625, -0.12542724609375, 0.0072021484375, 0.13983154296875, 0.2724609375, 0.40509033203125, 0.5377197265625, 0.67034912109375, 0.802978515625, 0.93560791015625, 1.0682373046875, 1.20086669921875, 1.33349609375, 1.46612548828125, 1.5987548828125, 1.73138427734375, 1.864013671875, 1.99664306640625, 2.1292724609375, 2.26190185546875, 2.39453125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 18.0, 30.0, 75.0, 150.0, 238.0, 240.0, 150.0, 61.0, 17.0, 11.0, 5.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-43.9493522644043, -43.074520111083984, -42.199684143066406, -41.324851989746094, -40.45001983642578, -39.5751838684082, -38.70035171508789, -37.82551956176758, -36.95068359375, -36.07585144042969, -35.20101547241211, -34.3261833190918, -33.451351165771484, -32.576515197753906, -31.701683044433594, -30.82684898376465, -29.952016830444336, -29.07718276977539, -28.202350616455078, -27.327516555786133, -26.452682495117188, -25.577850341796875, -24.70301628112793, -23.828182220458984, -22.953350067138672, -22.078516006469727, -21.203683853149414, -20.32884979248047, -19.454015731811523, -18.579181671142578, -17.704349517822266, -16.82951545715332, -15.954680442810059, -15.07984733581543, -14.205013275146484, -13.330180168151855, -12.455347061157227, -11.580513000488281, -10.705679893493652, -9.830846786499023, -8.956012725830078, -8.08117961883545, -7.206345558166504, -6.331512451171875, -5.456678867340088, -4.581845283508301, -3.707012176513672, -2.8321785926818848, -1.9573450088500977, -1.0825115442276, -0.20767807960510254, 0.6671552658081055, 1.5419888496398926, 2.4168224334716797, 3.2916555404663086, 4.166489124298096, 5.041322708129883, 5.91615629196167, 6.790989875793457, 7.665822982788086, 8.540657043457031, 9.41549015045166, 10.290323257446289, 11.165157318115234, 12.039990425109863]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 7.0, 6.0, 8.0, 10.0, 13.0, 14.0, 22.0, 25.0, 33.0, 33.0, 39.0, 37.0, 37.0, 58.0, 60.0, 63.0, 47.0, 52.0, 58.0, 64.0, 34.0, 50.0, 39.0, 38.0, 25.0, 26.0, 16.0, 18.0, 19.0, 10.0, 7.0, 9.0, 6.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.9752960205078125, -7.696458339691162, -7.4176201820373535, -7.138782501220703, -6.8599443435668945, -6.581106662750244, -6.302268981933594, -6.023430824279785, -5.744593143463135, -5.465755462646484, -5.186917304992676, -4.908079624176025, -4.629241943359375, -4.350403785705566, -4.071566104888916, -3.7927281856536865, -3.513890266418457, -3.2350523471832275, -2.956214427947998, -2.6773767471313477, -2.398538827896118, -2.1197009086608887, -1.8408631086349487, -1.5620253086090088, -1.2831873893737793, -1.0043494701385498, -0.7255116701126099, -0.44667381048202515, -0.16783595085144043, 0.11100196838378906, 0.389839768409729, 0.668677568435669, 0.9475154876708984, 1.226353406906128, 1.5051912069320679, 1.7840290069580078, 2.0628669261932373, 2.341704845428467, 2.620542526245117, 2.8993804454803467, 3.178218364715576, 3.4570562839508057, 3.735894203186035, 4.0147318840026855, 4.293569564819336, 4.5724077224731445, 4.851245403289795, 5.130083084106445, 5.408921241760254, 5.687758922576904, 5.966597080230713, 6.245434761047363, 6.524272918701172, 6.803110599517822, 7.081948280334473, 7.360786437988281, 7.639624118804932, 7.918461799621582, 8.19729995727539, 8.4761381149292, 8.754975318908691, 9.0338134765625, 9.312651634216309, 9.5914888381958, 9.87032699584961]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 10.0, 8.0, 6.0, 11.0, 19.0, 29.0, 47.0, 70.0, 99.0, 182.0, 319.0, 519.0, 853.0, 1639.0, 3244.0, 7059.0, 15420.0, 35975.0, 85283.0, 195349.0, 322783.0, 213371.0, 94016.0, 39995.0, 16944.0, 7568.0, 3534.0, 1781.0, 1018.0, 537.0, 294.0, 218.0, 120.0, 79.0, 46.0, 35.0, 23.0, 19.0, 9.0, 5.0, 5.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4921875, -4.3402099609375, -4.188232421875, -4.0362548828125, -3.88427734375, -3.7322998046875, -3.580322265625, -3.4283447265625, -3.2763671875, -3.1243896484375, -2.972412109375, -2.8204345703125, -2.66845703125, -2.5164794921875, -2.364501953125, -2.2125244140625, -2.060546875, -1.9085693359375, -1.756591796875, -1.6046142578125, -1.45263671875, -1.3006591796875, -1.148681640625, -0.9967041015625, -0.8447265625, -0.6927490234375, -0.540771484375, -0.3887939453125, -0.23681640625, -0.0848388671875, 0.067138671875, 0.2191162109375, 0.37109375, 0.5230712890625, 0.675048828125, 0.8270263671875, 0.97900390625, 1.1309814453125, 1.282958984375, 1.4349365234375, 1.5869140625, 1.7388916015625, 1.890869140625, 2.0428466796875, 2.19482421875, 2.3468017578125, 2.498779296875, 2.6507568359375, 2.802734375, 2.9547119140625, 3.106689453125, 3.2586669921875, 3.41064453125, 3.5626220703125, 3.714599609375, 3.8665771484375, 4.0185546875, 4.1705322265625, 4.322509765625, 4.4744873046875, 4.62646484375, 4.7784423828125, 4.930419921875, 5.0823974609375, 5.234375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 10.0, 5.0, 12.0, 9.0, 18.0, 7.0, 18.0, 22.0, 23.0, 38.0, 35.0, 38.0, 31.0, 39.0, 65.0, 50.0, 58.0, 42.0, 53.0, 48.0, 57.0, 46.0, 36.0, 40.0, 40.0, 29.0, 26.0, 17.0, 13.0, 15.0, 14.0, 13.0, 7.0, 7.0, 6.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.103515625, -2.037933349609375, -1.97235107421875, -1.906768798828125, -1.8411865234375, -1.775604248046875, -1.71002197265625, -1.644439697265625, -1.578857421875, -1.513275146484375, -1.44769287109375, -1.382110595703125, -1.3165283203125, -1.250946044921875, -1.18536376953125, -1.119781494140625, -1.05419921875, -0.988616943359375, -0.92303466796875, -0.857452392578125, -0.7918701171875, -0.726287841796875, -0.66070556640625, -0.595123291015625, -0.529541015625, -0.463958740234375, -0.39837646484375, -0.332794189453125, -0.2672119140625, -0.201629638671875, -0.13604736328125, -0.070465087890625, -0.0048828125, 0.060699462890625, 0.12628173828125, 0.191864013671875, 0.2574462890625, 0.323028564453125, 0.38861083984375, 0.454193115234375, 0.519775390625, 0.585357666015625, 0.65093994140625, 0.716522216796875, 0.7821044921875, 0.847686767578125, 0.91326904296875, 0.978851318359375, 1.04443359375, 1.110015869140625, 1.17559814453125, 1.241180419921875, 1.3067626953125, 1.372344970703125, 1.43792724609375, 1.503509521484375, 1.569091796875, 1.634674072265625, 1.70025634765625, 1.765838623046875, 1.8314208984375, 1.897003173828125, 1.96258544921875, 2.028167724609375, 2.09375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 1.0, 2.0, 5.0, 3.0, 15.0, 26.0, 46.0, 63.0, 154.0, 284.0, 621.0, 1585.0, 5851.0, 106679.0, 891823.0, 35481.0, 3720.0, 1181.0, 490.0, 237.0, 122.0, 72.0, 32.0, 21.0, 14.0, 12.0, 5.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.75, -15.17431640625, -14.5986328125, -14.02294921875, -13.447265625, -12.87158203125, -12.2958984375, -11.72021484375, -11.14453125, -10.56884765625, -9.9931640625, -9.41748046875, -8.841796875, -8.26611328125, -7.6904296875, -7.11474609375, -6.5390625, -5.96337890625, -5.3876953125, -4.81201171875, -4.236328125, -3.66064453125, -3.0849609375, -2.50927734375, -1.93359375, -1.35791015625, -0.7822265625, -0.20654296875, 0.369140625, 0.94482421875, 1.5205078125, 2.09619140625, 2.671875, 3.24755859375, 3.8232421875, 4.39892578125, 4.974609375, 5.55029296875, 6.1259765625, 6.70166015625, 7.27734375, 7.85302734375, 8.4287109375, 9.00439453125, 9.580078125, 10.15576171875, 10.7314453125, 11.30712890625, 11.8828125, 12.45849609375, 13.0341796875, 13.60986328125, 14.185546875, 14.76123046875, 15.3369140625, 15.91259765625, 16.48828125, 17.06396484375, 17.6396484375, 18.21533203125, 18.791015625, 19.36669921875, 19.9423828125, 20.51806640625, 21.09375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 4.0, 5.0, 11.0, 11.0, 13.0, 22.0, 27.0, 33.0, 34.0, 39.0, 54.0, 62.0, 75.0, 81.0, 79.0, 62.0, 65.0, 71.0, 37.0, 36.0, 43.0, 30.0, 24.0, 28.0, 21.0, 9.0, 12.0, 8.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9609375, -8.592041015625, -8.22314453125, -7.854248046875, -7.4853515625, -7.116455078125, -6.74755859375, -6.378662109375, -6.009765625, -5.640869140625, -5.27197265625, -4.903076171875, -4.5341796875, -4.165283203125, -3.79638671875, -3.427490234375, -3.05859375, -2.689697265625, -2.32080078125, -1.951904296875, -1.5830078125, -1.214111328125, -0.84521484375, -0.476318359375, -0.107421875, 0.261474609375, 0.63037109375, 0.999267578125, 1.3681640625, 1.737060546875, 2.10595703125, 2.474853515625, 2.84375, 3.212646484375, 3.58154296875, 3.950439453125, 4.3193359375, 4.688232421875, 5.05712890625, 5.426025390625, 5.794921875, 6.163818359375, 6.53271484375, 6.901611328125, 7.2705078125, 7.639404296875, 8.00830078125, 8.377197265625, 8.74609375, 9.114990234375, 9.48388671875, 9.852783203125, 10.2216796875, 10.590576171875, 10.95947265625, 11.328369140625, 11.697265625, 12.066162109375, 12.43505859375, 12.803955078125, 13.1728515625, 13.541748046875, 13.91064453125, 14.279541015625, 14.6484375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 6.0, 2.0, 5.0, 9.0, 13.0, 18.0, 25.0, 19.0, 39.0, 54.0, 65.0, 112.0, 158.0, 271.0, 575.0, 1315.0, 3902.0, 16971.0, 126009.0, 704227.0, 166095.0, 21072.0, 4635.0, 1464.0, 615.0, 321.0, 196.0, 87.0, 74.0, 49.0, 35.0, 26.0, 19.0, 26.0, 14.0, 11.0, 5.0, 6.0, 3.0, 3.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.1328125, -4.019775390625, -3.90673828125, -3.793701171875, -3.6806640625, -3.567626953125, -3.45458984375, -3.341552734375, -3.228515625, -3.115478515625, -3.00244140625, -2.889404296875, -2.7763671875, -2.663330078125, -2.55029296875, -2.437255859375, -2.32421875, -2.211181640625, -2.09814453125, -1.985107421875, -1.8720703125, -1.759033203125, -1.64599609375, -1.532958984375, -1.419921875, -1.306884765625, -1.19384765625, -1.080810546875, -0.9677734375, -0.854736328125, -0.74169921875, -0.628662109375, -0.515625, -0.402587890625, -0.28955078125, -0.176513671875, -0.0634765625, 0.049560546875, 0.16259765625, 0.275634765625, 0.388671875, 0.501708984375, 0.61474609375, 0.727783203125, 0.8408203125, 0.953857421875, 1.06689453125, 1.179931640625, 1.29296875, 1.406005859375, 1.51904296875, 1.632080078125, 1.7451171875, 1.858154296875, 1.97119140625, 2.084228515625, 2.197265625, 2.310302734375, 2.42333984375, 2.536376953125, 2.6494140625, 2.762451171875, 2.87548828125, 2.988525390625, 3.1015625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 8.0, 10.0, 9.0, 10.0, 15.0, 17.0, 19.0, 28.0, 43.0, 43.0, 69.0, 79.0, 126.0, 144.0, 84.0, 59.0, 47.0, 42.0, 35.0, 28.0, 18.0, 19.0, 10.0, 6.0, 2.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0007829666137695312, -0.0007612928748130798, -0.0007396191358566284, -0.000717945396900177, -0.0006962716579437256, -0.0006745979189872742, -0.0006529241800308228, -0.0006312504410743713, -0.0006095767021179199, -0.0005879029631614685, -0.0005662292242050171, -0.0005445554852485657, -0.0005228817462921143, -0.0005012080073356628, -0.0004795342683792114, -0.00045786052942276, -0.0004361867904663086, -0.0004145130515098572, -0.00039283931255340576, -0.00037116557359695435, -0.00034949183464050293, -0.0003278180956840515, -0.0003061443567276001, -0.0002844706177711487, -0.00026279687881469727, -0.00024112313985824585, -0.00021944940090179443, -0.00019777566194534302, -0.0001761019229888916, -0.00015442818403244019, -0.00013275444507598877, -0.00011108070611953735, -8.940696716308594e-05, -6.773322820663452e-05, -4.6059489250183105e-05, -2.438575029373169e-05, -2.7120113372802734e-06, 1.8961727619171143e-05, 4.063546657562256e-05, 6.230920553207397e-05, 8.398294448852539e-05, 0.0001056566834449768, 0.00012733042240142822, 0.00014900416135787964, 0.00017067790031433105, 0.00019235163927078247, 0.0002140253782272339, 0.0002356991171836853, 0.0002573728561401367, 0.00027904659509658813, 0.00030072033405303955, 0.00032239407300949097, 0.0003440678119659424, 0.0003657415509223938, 0.0003874152898788452, 0.00040908902883529663, 0.00043076276779174805, 0.00045243650674819946, 0.0004741102457046509, 0.0004957839846611023, 0.0005174577236175537, 0.0005391314625740051, 0.0005608052015304565, 0.000582478940486908, 0.0006041526794433594]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 12.0, 17.0, 22.0, 21.0, 36.0, 59.0, 54.0, 101.0, 136.0, 175.0, 298.0, 441.0, 737.0, 1212.0, 2472.0, 6133.0, 18536.0, 77131.0, 363076.0, 445698.0, 96287.0, 22459.0, 6919.0, 2826.0, 1396.0, 798.0, 473.0, 310.0, 175.0, 148.0, 86.0, 68.0, 49.0, 47.0, 39.0, 24.0, 15.0, 15.0, 13.0, 9.0, 5.0, 3.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.318359375, -2.243743896484375, -2.16912841796875, -2.094512939453125, -2.0198974609375, -1.945281982421875, -1.87066650390625, -1.796051025390625, -1.721435546875, -1.646820068359375, -1.57220458984375, -1.497589111328125, -1.4229736328125, -1.348358154296875, -1.27374267578125, -1.199127197265625, -1.12451171875, -1.049896240234375, -0.97528076171875, -0.900665283203125, -0.8260498046875, -0.751434326171875, -0.67681884765625, -0.602203369140625, -0.527587890625, -0.452972412109375, -0.37835693359375, -0.303741455078125, -0.2291259765625, -0.154510498046875, -0.07989501953125, -0.005279541015625, 0.0693359375, 0.143951416015625, 0.21856689453125, 0.293182373046875, 0.3677978515625, 0.442413330078125, 0.51702880859375, 0.591644287109375, 0.666259765625, 0.740875244140625, 0.81549072265625, 0.890106201171875, 0.9647216796875, 1.039337158203125, 1.11395263671875, 1.188568115234375, 1.26318359375, 1.337799072265625, 1.41241455078125, 1.487030029296875, 1.5616455078125, 1.636260986328125, 1.71087646484375, 1.785491943359375, 1.860107421875, 1.934722900390625, 2.00933837890625, 2.083953857421875, 2.1585693359375, 2.233184814453125, 2.30780029296875, 2.382415771484375, 2.45703125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 5.0, 1.0, 7.0, 5.0, 12.0, 12.0, 17.0, 19.0, 26.0, 25.0, 43.0, 37.0, 50.0, 88.0, 73.0, 76.0, 59.0, 78.0, 59.0, 49.0, 56.0, 37.0, 35.0, 25.0, 21.0, 23.0, 16.0, 8.0, 7.0, 5.0, 8.0, 7.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.845703125, -2.759063720703125, -2.67242431640625, -2.585784912109375, -2.4991455078125, -2.412506103515625, -2.32586669921875, -2.239227294921875, -2.152587890625, -2.065948486328125, -1.97930908203125, -1.892669677734375, -1.8060302734375, -1.719390869140625, -1.63275146484375, -1.546112060546875, -1.45947265625, -1.372833251953125, -1.28619384765625, -1.199554443359375, -1.1129150390625, -1.026275634765625, -0.93963623046875, -0.852996826171875, -0.766357421875, -0.679718017578125, -0.59307861328125, -0.506439208984375, -0.4197998046875, -0.333160400390625, -0.24652099609375, -0.159881591796875, -0.0732421875, 0.013397216796875, 0.10003662109375, 0.186676025390625, 0.2733154296875, 0.359954833984375, 0.44659423828125, 0.533233642578125, 0.619873046875, 0.706512451171875, 0.79315185546875, 0.879791259765625, 0.9664306640625, 1.053070068359375, 1.13970947265625, 1.226348876953125, 1.31298828125, 1.399627685546875, 1.48626708984375, 1.572906494140625, 1.6595458984375, 1.746185302734375, 1.83282470703125, 1.919464111328125, 2.006103515625, 2.092742919921875, 2.17938232421875, 2.266021728515625, 2.3526611328125, 2.439300537109375, 2.52593994140625, 2.612579345703125, 2.69921875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 9.0, 13.0, 14.0, 18.0, 45.0, 68.0, 104.0, 148.0, 174.0, 146.0, 94.0, 74.0, 43.0, 28.0, 10.0, 2.0, 5.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-64.18310546875, -61.94818878173828, -59.7132682800293, -57.47835159301758, -55.243431091308594, -53.008514404296875, -50.773597717285156, -48.53868103027344, -46.30376052856445, -44.068843841552734, -41.83392333984375, -39.59900665283203, -37.36408996582031, -35.12916946411133, -32.89425277709961, -30.659334182739258, -28.424415588378906, -26.189496994018555, -23.954578399658203, -21.719661712646484, -19.484743118286133, -17.24982452392578, -15.014906883239746, -12.779989242553711, -10.54507064819336, -8.310152053833008, -6.075234413146973, -3.8403162956237793, -1.605398178100586, 0.6295204162597656, 2.864438056945801, 5.099355697631836, 7.3342742919921875, 9.569192886352539, 11.804110527038574, 14.03902816772461, 16.27394676208496, 18.508865356445312, 20.74378204345703, 22.978700637817383, 25.213619232177734, 27.448537826538086, 29.683456420898438, 31.918373107910156, 34.153289794921875, 36.38821029663086, 38.62312698364258, 40.85804748535156, 43.09296417236328, 45.327880859375, 47.562801361083984, 49.7977180480957, 52.03263854980469, 54.267555236816406, 56.502471923828125, 58.737388610839844, 60.97230911254883, 63.20722579956055, 65.44214630126953, 67.67706298828125, 69.91197967529297, 72.14689636230469, 74.38182067871094, 76.61673736572266, 78.85165405273438]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 5.0, 7.0, 5.0, 8.0, 13.0, 9.0, 16.0, 17.0, 23.0, 16.0, 24.0, 27.0, 36.0, 37.0, 33.0, 35.0, 54.0, 46.0, 58.0, 64.0, 54.0, 36.0, 46.0, 40.0, 30.0, 40.0, 30.0, 25.0, 13.0, 22.0, 29.0, 27.0, 16.0, 13.0, 13.0, 6.0, 10.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.08253860473633, -33.924659729003906, -32.766780853271484, -31.608901977539062, -30.451021194458008, -29.293142318725586, -28.135263442993164, -26.97738265991211, -25.819503784179688, -24.661624908447266, -23.503746032714844, -22.345867156982422, -21.187986373901367, -20.030107498168945, -18.872228622436523, -17.71434783935547, -16.55647087097168, -15.398591995239258, -14.24071216583252, -13.082833290100098, -11.92495346069336, -10.767074584960938, -9.609195709228516, -8.451315879821777, -7.2934370040893555, -6.135557651519775, -4.977678298950195, -3.8197994232177734, -2.6619200706481934, -1.5040407180786133, -0.3461618423461914, 0.8117179870605469, 1.9695968627929688, 3.127476215362549, 4.285355567932129, 5.443234443664551, 6.601113796234131, 7.758993148803711, 8.916872024536133, 10.074751853942871, 11.232630729675293, 12.390509605407715, 13.548389434814453, 14.706268310546875, 15.864147186279297, 17.02202606201172, 18.17990493774414, 19.337785720825195, 20.495664596557617, 21.65354347229004, 22.81142234802246, 23.969303131103516, 25.127182006835938, 26.28506088256836, 27.44293975830078, 28.600818634033203, 29.758697509765625, 30.916576385498047, 32.07445526123047, 33.23233413696289, 34.39021301269531, 35.548095703125, 36.705970764160156, 37.863853454589844, 39.021732330322266]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 7.0, 6.0, 8.0, 7.0, 14.0, 14.0, 22.0, 28.0, 38.0, 49.0, 60.0, 90.0, 117.0, 157.0, 248.0, 368.0, 622.0, 1044.0, 1689.0, 3175.0, 6068.0, 13201.0, 31884.0, 96093.0, 476727.0, 2763186.0, 618757.0, 114056.0, 36967.0, 14849.0, 6670.0, 3353.0, 1935.0, 1039.0, 633.0, 367.0, 245.0, 154.0, 93.0, 61.0, 54.0, 32.0, 26.0, 19.0, 14.0, 7.0, 8.0, 5.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 3.0], "bins": [-3.611328125, -3.50372314453125, -3.3961181640625, -3.28851318359375, -3.180908203125, -3.07330322265625, -2.9656982421875, -2.85809326171875, -2.75048828125, -2.64288330078125, -2.5352783203125, -2.42767333984375, -2.320068359375, -2.21246337890625, -2.1048583984375, -1.99725341796875, -1.8896484375, -1.78204345703125, -1.6744384765625, -1.56683349609375, -1.459228515625, -1.35162353515625, -1.2440185546875, -1.13641357421875, -1.02880859375, -0.92120361328125, -0.8135986328125, -0.70599365234375, -0.598388671875, -0.49078369140625, -0.3831787109375, -0.27557373046875, -0.16796875, -0.06036376953125, 0.0472412109375, 0.15484619140625, 0.262451171875, 0.37005615234375, 0.4776611328125, 0.58526611328125, 0.69287109375, 0.80047607421875, 0.9080810546875, 1.01568603515625, 1.123291015625, 1.23089599609375, 1.3385009765625, 1.44610595703125, 1.5537109375, 1.66131591796875, 1.7689208984375, 1.87652587890625, 1.984130859375, 2.09173583984375, 2.1993408203125, 2.30694580078125, 2.41455078125, 2.52215576171875, 2.6297607421875, 2.73736572265625, 2.844970703125, 2.95257568359375, 3.0601806640625, 3.16778564453125, 3.275390625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 6.0, 0.0, 2.0, 6.0, 6.0, 10.0, 11.0, 5.0, 15.0, 13.0, 15.0, 19.0, 18.0, 21.0, 25.0, 28.0, 39.0, 47.0, 37.0, 50.0, 45.0, 52.0, 52.0, 45.0, 52.0, 39.0, 44.0, 31.0, 43.0, 27.0, 33.0, 21.0, 38.0, 22.0, 16.0, 17.0, 16.0, 10.0, 6.0, 6.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.91015625, -1.85308837890625, -1.7960205078125, -1.73895263671875, -1.681884765625, -1.62481689453125, -1.5677490234375, -1.51068115234375, -1.45361328125, -1.39654541015625, -1.3394775390625, -1.28240966796875, -1.225341796875, -1.16827392578125, -1.1112060546875, -1.05413818359375, -0.9970703125, -0.94000244140625, -0.8829345703125, -0.82586669921875, -0.768798828125, -0.71173095703125, -0.6546630859375, -0.59759521484375, -0.54052734375, -0.48345947265625, -0.4263916015625, -0.36932373046875, -0.312255859375, -0.25518798828125, -0.1981201171875, -0.14105224609375, -0.083984375, -0.02691650390625, 0.0301513671875, 0.08721923828125, 0.144287109375, 0.20135498046875, 0.2584228515625, 0.31549072265625, 0.37255859375, 0.42962646484375, 0.4866943359375, 0.54376220703125, 0.600830078125, 0.65789794921875, 0.7149658203125, 0.77203369140625, 0.8291015625, 0.88616943359375, 0.9432373046875, 1.00030517578125, 1.057373046875, 1.11444091796875, 1.1715087890625, 1.22857666015625, 1.28564453125, 1.34271240234375, 1.3997802734375, 1.45684814453125, 1.513916015625, 1.57098388671875, 1.6280517578125, 1.68511962890625, 1.7421875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 4.0, 8.0, 10.0, 15.0, 19.0, 21.0, 46.0, 77.0, 110.0, 237.0, 587.0, 1686.0, 6421.0, 31731.0, 330897.0, 3591392.0, 200156.0, 23760.0, 4871.0, 1280.0, 449.0, 203.0, 94.0, 63.0, 39.0, 24.0, 16.0, 14.0, 9.0, 9.0, 8.0, 6.0, 4.0, 0.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.2421875, -7.01165771484375, -6.7811279296875, -6.55059814453125, -6.320068359375, -6.08953857421875, -5.8590087890625, -5.62847900390625, -5.39794921875, -5.16741943359375, -4.9368896484375, -4.70635986328125, -4.475830078125, -4.24530029296875, -4.0147705078125, -3.78424072265625, -3.5537109375, -3.32318115234375, -3.0926513671875, -2.86212158203125, -2.631591796875, -2.40106201171875, -2.1705322265625, -1.94000244140625, -1.70947265625, -1.47894287109375, -1.2484130859375, -1.01788330078125, -0.787353515625, -0.55682373046875, -0.3262939453125, -0.09576416015625, 0.134765625, 0.36529541015625, 0.5958251953125, 0.82635498046875, 1.056884765625, 1.28741455078125, 1.5179443359375, 1.74847412109375, 1.97900390625, 2.20953369140625, 2.4400634765625, 2.67059326171875, 2.901123046875, 3.13165283203125, 3.3621826171875, 3.59271240234375, 3.8232421875, 4.05377197265625, 4.2843017578125, 4.51483154296875, 4.745361328125, 4.97589111328125, 5.2064208984375, 5.43695068359375, 5.66748046875, 5.89801025390625, 6.1285400390625, 6.35906982421875, 6.589599609375, 6.82012939453125, 7.0506591796875, 7.28118896484375, 7.51171875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 14.0, 14.0, 19.0, 24.0, 40.0, 42.0, 50.0, 79.0, 117.0, 195.0, 341.0, 649.0, 845.0, 629.0, 338.0, 209.0, 139.0, 82.0, 63.0, 48.0, 30.0, 24.0, 16.0, 10.0, 4.0, 14.0, 5.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-5.6328125, -5.4786376953125, -5.324462890625, -5.1702880859375, -5.01611328125, -4.8619384765625, -4.707763671875, -4.5535888671875, -4.3994140625, -4.2452392578125, -4.091064453125, -3.9368896484375, -3.78271484375, -3.6285400390625, -3.474365234375, -3.3201904296875, -3.166015625, -3.0118408203125, -2.857666015625, -2.7034912109375, -2.54931640625, -2.3951416015625, -2.240966796875, -2.0867919921875, -1.9326171875, -1.7784423828125, -1.624267578125, -1.4700927734375, -1.31591796875, -1.1617431640625, -1.007568359375, -0.8533935546875, -0.69921875, -0.5450439453125, -0.390869140625, -0.2366943359375, -0.08251953125, 0.0716552734375, 0.225830078125, 0.3800048828125, 0.5341796875, 0.6883544921875, 0.842529296875, 0.9967041015625, 1.15087890625, 1.3050537109375, 1.459228515625, 1.6134033203125, 1.767578125, 1.9217529296875, 2.075927734375, 2.2301025390625, 2.38427734375, 2.5384521484375, 2.692626953125, 2.8468017578125, 3.0009765625, 3.1551513671875, 3.309326171875, 3.4635009765625, 3.61767578125, 3.7718505859375, 3.926025390625, 4.0802001953125, 4.234375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 11.0, 21.0, 35.0, 89.0, 117.0, 142.0, 176.0, 142.0, 103.0, 72.0, 30.0, 17.0, 10.0, 7.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.3725471496582, -57.680233001708984, -55.9879150390625, -54.29560089111328, -52.60328674316406, -50.91096878051758, -49.21865463256836, -47.526336669921875, -45.834022521972656, -44.14170837402344, -42.44939041137695, -40.757076263427734, -39.064762115478516, -37.37244415283203, -35.68013000488281, -33.987815856933594, -32.295501708984375, -30.603185653686523, -28.910871505737305, -27.218555450439453, -25.5262393951416, -23.83392333984375, -22.14160919189453, -20.44929313659668, -18.756977081298828, -17.064661026000977, -15.372345924377441, -13.680030822753906, -11.987714767456055, -10.29539966583252, -8.603084564208984, -6.910768508911133, -5.218452453613281, -3.526136875152588, -1.8338215351104736, -0.14150619506835938, 1.550809383392334, 3.2431249618530273, 4.9354400634765625, 6.627756118774414, 8.32007122039795, 10.012386322021484, 11.704702377319336, 13.397017478942871, 15.089332580566406, 16.781648635864258, 18.47396469116211, 20.166278839111328, 21.85859489440918, 23.55091094970703, 25.24322509765625, 26.9355411529541, 28.627857208251953, 30.320171356201172, 32.012489318847656, 33.704803466796875, 35.397117614746094, 37.08943176269531, 38.7817497253418, 40.474063873291016, 42.166378021240234, 43.85869598388672, 45.55101013183594, 47.243324279785156, 48.93564224243164]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 5.0, 10.0, 3.0, 5.0, 7.0, 17.0, 13.0, 10.0, 19.0, 19.0, 18.0, 8.0, 33.0, 29.0, 39.0, 34.0, 48.0, 40.0, 43.0, 45.0, 52.0, 47.0, 47.0, 48.0, 39.0, 34.0, 35.0, 37.0, 29.0, 33.0, 26.0, 29.0, 27.0, 12.0, 9.0, 9.0, 12.0, 11.0, 12.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.255016326904297, -19.577436447143555, -18.899856567382812, -18.22227668762207, -17.544696807861328, -16.86711883544922, -16.189538955688477, -15.511959075927734, -14.834379196166992, -14.15679931640625, -13.479219436645508, -12.801640510559082, -12.12406063079834, -11.446480751037598, -10.768901824951172, -10.09132194519043, -9.413742065429688, -8.736162185668945, -8.058582305908203, -7.381003379821777, -6.703423500061035, -6.025843620300293, -5.348264217376709, -4.670684814453125, -3.993104934692383, -3.3155252933502197, -2.6379456520080566, -1.9603660106658936, -1.2827863693237305, -0.6052067279815674, 0.0723729133605957, 0.7499523162841797, 1.4275321960449219, 2.105111837387085, 2.782691478729248, 3.460271120071411, 4.137850761413574, 4.815430641174316, 5.4930100440979, 6.170589447021484, 6.848169326782227, 7.525749206542969, 8.203329086303711, 8.880908012390137, 9.558487892150879, 10.236067771911621, 10.913646697998047, 11.591226577758789, 12.268806457519531, 12.946386337280273, 13.623966217041016, 14.301545143127441, 14.979125022888184, 15.656704902648926, 16.33428382873535, 17.011863708496094, 17.689443588256836, 18.367023468017578, 19.04460334777832, 19.722183227539062, 20.399761199951172, 21.077341079711914, 21.754920959472656, 22.4325008392334, 23.11008071899414]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 16.0, 16.0, 26.0, 48.0, 56.0, 102.0, 159.0, 296.0, 479.0, 943.0, 1869.0, 4338.0, 10780.0, 28496.0, 78913.0, 240787.0, 423242.0, 166250.0, 56715.0, 20524.0, 7824.0, 3377.0, 1520.0, 710.0, 401.0, 249.0, 158.0, 91.0, 50.0, 30.0, 25.0, 21.0, 13.0, 4.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.58984375, -5.4169921875, -5.244140625, -5.0712890625, -4.8984375, -4.7255859375, -4.552734375, -4.3798828125, -4.20703125, -4.0341796875, -3.861328125, -3.6884765625, -3.515625, -3.3427734375, -3.169921875, -2.9970703125, -2.82421875, -2.6513671875, -2.478515625, -2.3056640625, -2.1328125, -1.9599609375, -1.787109375, -1.6142578125, -1.44140625, -1.2685546875, -1.095703125, -0.9228515625, -0.75, -0.5771484375, -0.404296875, -0.2314453125, -0.05859375, 0.1142578125, 0.287109375, 0.4599609375, 0.6328125, 0.8056640625, 0.978515625, 1.1513671875, 1.32421875, 1.4970703125, 1.669921875, 1.8427734375, 2.015625, 2.1884765625, 2.361328125, 2.5341796875, 2.70703125, 2.8798828125, 3.052734375, 3.2255859375, 3.3984375, 3.5712890625, 3.744140625, 3.9169921875, 4.08984375, 4.2626953125, 4.435546875, 4.6083984375, 4.78125, 4.9541015625, 5.126953125, 5.2998046875, 5.47265625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 7.0, 6.0, 4.0, 5.0, 5.0, 10.0, 12.0, 15.0, 23.0, 18.0, 21.0, 18.0, 21.0, 37.0, 34.0, 43.0, 49.0, 43.0, 53.0, 49.0, 51.0, 44.0, 42.0, 45.0, 42.0, 40.0, 38.0, 28.0, 22.0, 38.0, 32.0, 23.0, 17.0, 15.0, 16.0, 12.0, 4.0, 5.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.962890625, -1.9058380126953125, -1.848785400390625, -1.7917327880859375, -1.73468017578125, -1.6776275634765625, -1.620574951171875, -1.5635223388671875, -1.5064697265625, -1.4494171142578125, -1.392364501953125, -1.3353118896484375, -1.27825927734375, -1.2212066650390625, -1.164154052734375, -1.1071014404296875, -1.050048828125, -0.9929962158203125, -0.935943603515625, -0.8788909912109375, -0.82183837890625, -0.7647857666015625, -0.707733154296875, -0.6506805419921875, -0.5936279296875, -0.5365753173828125, -0.479522705078125, -0.4224700927734375, -0.36541748046875, -0.3083648681640625, -0.251312255859375, -0.1942596435546875, -0.13720703125, -0.0801544189453125, -0.023101806640625, 0.0339508056640625, 0.09100341796875, 0.1480560302734375, 0.205108642578125, 0.2621612548828125, 0.3192138671875, 0.3762664794921875, 0.433319091796875, 0.4903717041015625, 0.54742431640625, 0.6044769287109375, 0.661529541015625, 0.7185821533203125, 0.775634765625, 0.8326873779296875, 0.889739990234375, 0.9467926025390625, 1.00384521484375, 1.0608978271484375, 1.117950439453125, 1.1750030517578125, 1.2320556640625, 1.2891082763671875, 1.346160888671875, 1.4032135009765625, 1.46026611328125, 1.5173187255859375, 1.574371337890625, 1.6314239501953125, 1.6884765625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 6.0, 12.0, 12.0, 19.0, 16.0, 22.0, 40.0, 61.0, 93.0, 123.0, 182.0, 287.0, 455.0, 848.0, 1692.0, 4366.0, 19471.0, 167177.0, 747477.0, 87684.0, 12060.0, 3173.0, 1325.0, 736.0, 430.0, 244.0, 162.0, 119.0, 81.0, 48.0, 35.0, 25.0, 20.0, 14.0, 10.0, 11.0, 5.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-11.0703125, -10.7740478515625, -10.477783203125, -10.1815185546875, -9.88525390625, -9.5889892578125, -9.292724609375, -8.9964599609375, -8.7001953125, -8.4039306640625, -8.107666015625, -7.8114013671875, -7.51513671875, -7.2188720703125, -6.922607421875, -6.6263427734375, -6.330078125, -6.0338134765625, -5.737548828125, -5.4412841796875, -5.14501953125, -4.8487548828125, -4.552490234375, -4.2562255859375, -3.9599609375, -3.6636962890625, -3.367431640625, -3.0711669921875, -2.77490234375, -2.4786376953125, -2.182373046875, -1.8861083984375, -1.58984375, -1.2935791015625, -0.997314453125, -0.7010498046875, -0.40478515625, -0.1085205078125, 0.187744140625, 0.4840087890625, 0.7802734375, 1.0765380859375, 1.372802734375, 1.6690673828125, 1.96533203125, 2.2615966796875, 2.557861328125, 2.8541259765625, 3.150390625, 3.4466552734375, 3.742919921875, 4.0391845703125, 4.33544921875, 4.6317138671875, 4.927978515625, 5.2242431640625, 5.5205078125, 5.8167724609375, 6.113037109375, 6.4093017578125, 6.70556640625, 7.0018310546875, 7.298095703125, 7.5943603515625, 7.890625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 4.0, 14.0, 10.0, 12.0, 21.0, 18.0, 17.0, 29.0, 29.0, 38.0, 47.0, 44.0, 31.0, 46.0, 44.0, 40.0, 47.0, 60.0, 42.0, 34.0, 49.0, 56.0, 42.0, 38.0, 38.0, 25.0, 27.0, 17.0, 16.0, 10.0, 12.0, 9.0, 6.0, 6.0, 4.0, 6.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.140625, -7.900146484375, -7.65966796875, -7.419189453125, -7.1787109375, -6.938232421875, -6.69775390625, -6.457275390625, -6.216796875, -5.976318359375, -5.73583984375, -5.495361328125, -5.2548828125, -5.014404296875, -4.77392578125, -4.533447265625, -4.29296875, -4.052490234375, -3.81201171875, -3.571533203125, -3.3310546875, -3.090576171875, -2.85009765625, -2.609619140625, -2.369140625, -2.128662109375, -1.88818359375, -1.647705078125, -1.4072265625, -1.166748046875, -0.92626953125, -0.685791015625, -0.4453125, -0.204833984375, 0.03564453125, 0.276123046875, 0.5166015625, 0.757080078125, 0.99755859375, 1.238037109375, 1.478515625, 1.718994140625, 1.95947265625, 2.199951171875, 2.4404296875, 2.680908203125, 2.92138671875, 3.161865234375, 3.40234375, 3.642822265625, 3.88330078125, 4.123779296875, 4.3642578125, 4.604736328125, 4.84521484375, 5.085693359375, 5.326171875, 5.566650390625, 5.80712890625, 6.047607421875, 6.2880859375, 6.528564453125, 6.76904296875, 7.009521484375, 7.25]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 8.0, 10.0, 14.0, 24.0, 35.0, 44.0, 105.0, 175.0, 335.0, 783.0, 2618.0, 20264.0, 745786.0, 264307.0, 10918.0, 1881.0, 578.0, 269.0, 149.0, 81.0, 52.0, 25.0, 31.0, 14.0, 16.0, 5.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9296875, -6.73651123046875, -6.5433349609375, -6.35015869140625, -6.156982421875, -5.96380615234375, -5.7706298828125, -5.57745361328125, -5.38427734375, -5.19110107421875, -4.9979248046875, -4.80474853515625, -4.611572265625, -4.41839599609375, -4.2252197265625, -4.03204345703125, -3.8388671875, -3.64569091796875, -3.4525146484375, -3.25933837890625, -3.066162109375, -2.87298583984375, -2.6798095703125, -2.48663330078125, -2.29345703125, -2.10028076171875, -1.9071044921875, -1.71392822265625, -1.520751953125, -1.32757568359375, -1.1343994140625, -0.94122314453125, -0.748046875, -0.55487060546875, -0.3616943359375, -0.16851806640625, 0.024658203125, 0.21783447265625, 0.4110107421875, 0.60418701171875, 0.79736328125, 0.99053955078125, 1.1837158203125, 1.37689208984375, 1.570068359375, 1.76324462890625, 1.9564208984375, 2.14959716796875, 2.3427734375, 2.53594970703125, 2.7291259765625, 2.92230224609375, 3.115478515625, 3.30865478515625, 3.5018310546875, 3.69500732421875, 3.88818359375, 4.08135986328125, 4.2745361328125, 4.46771240234375, 4.660888671875, 4.85406494140625, 5.0472412109375, 5.24041748046875, 5.43359375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 2.0, 6.0, 6.0, 2.0, 3.0, 4.0, 11.0, 10.0, 18.0, 27.0, 25.0, 36.0, 33.0, 70.0, 79.0, 116.0, 131.0, 92.0, 83.0, 55.0, 39.0, 33.0, 23.0, 23.0, 12.0, 6.0, 11.0, 12.0, 8.0, 11.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0007314682006835938, -0.0007108598947525024, -0.0006902515888214111, -0.0006696432828903198, -0.0006490349769592285, -0.0006284266710281372, -0.0006078183650970459, -0.0005872100591659546, -0.0005666017532348633, -0.000545993447303772, -0.0005253851413726807, -0.0005047768354415894, -0.00048416852951049805, -0.00046356022357940674, -0.00044295191764831543, -0.0004223436117172241, -0.0004017353057861328, -0.0003811269998550415, -0.0003605186939239502, -0.0003399103879928589, -0.0003193020820617676, -0.00029869377613067627, -0.00027808547019958496, -0.00025747716426849365, -0.00023686885833740234, -0.00021626055240631104, -0.00019565224647521973, -0.00017504394054412842, -0.0001544356346130371, -0.0001338273286819458, -0.00011321902275085449, -9.261071681976318e-05, -7.200241088867188e-05, -5.1394104957580566e-05, -3.078579902648926e-05, -1.017749309539795e-05, 1.043081283569336e-05, 3.103911876678467e-05, 5.1647424697875977e-05, 7.225573062896729e-05, 9.28640365600586e-05, 0.0001134723424911499, 0.0001340806484222412, 0.00015468895435333252, 0.00017529726028442383, 0.00019590556621551514, 0.00021651387214660645, 0.00023712217807769775, 0.00025773048400878906, 0.00027833878993988037, 0.0002989470958709717, 0.000319555401802063, 0.0003401637077331543, 0.0003607720136642456, 0.0003813803195953369, 0.0004019886255264282, 0.00042259693145751953, 0.00044320523738861084, 0.00046381354331970215, 0.00048442184925079346, 0.0005050301551818848, 0.0005256384611129761, 0.0005462467670440674, 0.0005668550729751587, 0.00058746337890625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 6.0, 7.0, 5.0, 8.0, 12.0, 13.0, 16.0, 23.0, 42.0, 59.0, 82.0, 118.0, 178.0, 300.0, 487.0, 947.0, 2190.0, 6260.0, 26658.0, 245654.0, 681435.0, 65913.0, 11522.0, 3460.0, 1427.0, 701.0, 342.0, 237.0, 123.0, 91.0, 54.0, 46.0, 39.0, 24.0, 13.0, 18.0, 11.0, 11.0, 9.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.576171875, -3.4652099609375, -3.354248046875, -3.2432861328125, -3.13232421875, -3.0213623046875, -2.910400390625, -2.7994384765625, -2.6884765625, -2.5775146484375, -2.466552734375, -2.3555908203125, -2.24462890625, -2.1336669921875, -2.022705078125, -1.9117431640625, -1.80078125, -1.6898193359375, -1.578857421875, -1.4678955078125, -1.35693359375, -1.2459716796875, -1.135009765625, -1.0240478515625, -0.9130859375, -0.8021240234375, -0.691162109375, -0.5802001953125, -0.46923828125, -0.3582763671875, -0.247314453125, -0.1363525390625, -0.025390625, 0.0855712890625, 0.196533203125, 0.3074951171875, 0.41845703125, 0.5294189453125, 0.640380859375, 0.7513427734375, 0.8623046875, 0.9732666015625, 1.084228515625, 1.1951904296875, 1.30615234375, 1.4171142578125, 1.528076171875, 1.6390380859375, 1.75, 1.8609619140625, 1.971923828125, 2.0828857421875, 2.19384765625, 2.3048095703125, 2.415771484375, 2.5267333984375, 2.6376953125, 2.7486572265625, 2.859619140625, 2.9705810546875, 3.08154296875, 3.1925048828125, 3.303466796875, 3.4144287109375, 3.525390625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 9.0, 8.0, 8.0, 12.0, 23.0, 15.0, 37.0, 34.0, 40.0, 66.0, 71.0, 71.0, 98.0, 98.0, 102.0, 57.0, 57.0, 41.0, 30.0, 20.0, 19.0, 15.0, 11.0, 14.0, 8.0, 4.0, 12.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.845703125, -1.76458740234375, -1.6834716796875, -1.60235595703125, -1.521240234375, -1.44012451171875, -1.3590087890625, -1.27789306640625, -1.19677734375, -1.11566162109375, -1.0345458984375, -0.95343017578125, -0.872314453125, -0.79119873046875, -0.7100830078125, -0.62896728515625, -0.5478515625, -0.46673583984375, -0.3856201171875, -0.30450439453125, -0.223388671875, -0.14227294921875, -0.0611572265625, 0.01995849609375, 0.10107421875, 0.18218994140625, 0.2633056640625, 0.34442138671875, 0.425537109375, 0.50665283203125, 0.5877685546875, 0.66888427734375, 0.75, 0.83111572265625, 0.9122314453125, 0.99334716796875, 1.074462890625, 1.15557861328125, 1.2366943359375, 1.31781005859375, 1.39892578125, 1.48004150390625, 1.5611572265625, 1.64227294921875, 1.723388671875, 1.80450439453125, 1.8856201171875, 1.96673583984375, 2.0478515625, 2.12896728515625, 2.2100830078125, 2.29119873046875, 2.372314453125, 2.45343017578125, 2.5345458984375, 2.61566162109375, 2.69677734375, 2.77789306640625, 2.8590087890625, 2.94012451171875, 3.021240234375, 3.10235595703125, 3.1834716796875, 3.26458740234375, 3.345703125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 10.0, 10.0, 47.0, 135.0, 268.0, 307.0, 135.0, 52.0, 23.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-134.19493103027344, -131.00579833984375, -127.81666564941406, -124.62753295898438, -121.43840026855469, -118.249267578125, -115.06013488769531, -111.87100219726562, -108.68186950683594, -105.49273681640625, -102.30360412597656, -99.11447143554688, -95.92533874511719, -92.7362060546875, -89.54707336425781, -86.35794067382812, -83.16880798339844, -79.97967529296875, -76.79054260253906, -73.60140991210938, -70.41227722167969, -67.22314453125, -64.03401184082031, -60.844879150390625, -57.65574645996094, -54.46661376953125, -51.27748107910156, -48.088348388671875, -44.89921569824219, -41.7100830078125, -38.52095031738281, -35.331817626953125, -32.14269256591797, -28.95355987548828, -25.764427185058594, -22.575294494628906, -19.38616180419922, -16.19702911376953, -13.007896423339844, -9.818763732910156, -6.629631042480469, -3.4404983520507812, -0.25136566162109375, 2.9377670288085938, 6.126899719238281, 9.316032409667969, 12.505165100097656, 15.694297790527344, 18.88343048095703, 22.07256317138672, 25.261695861816406, 28.450828552246094, 31.63996124267578, 34.82909393310547, 38.018226623535156, 41.207359313964844, 44.39649200439453, 47.58562469482422, 50.774757385253906, 53.963890075683594, 57.15302276611328, 60.34215545654297, 63.531288146972656, 66.72042083740234, 69.90955352783203]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 9.0, 9.0, 11.0, 25.0, 27.0, 14.0, 36.0, 38.0, 33.0, 29.0, 46.0, 50.0, 71.0, 71.0, 79.0, 61.0, 58.0, 50.0, 57.0, 34.0, 29.0, 32.0, 29.0, 15.0, 24.0, 20.0, 12.0, 13.0, 3.0, 4.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.616851806640625, -24.487924575805664, -23.358997344970703, -22.230070114135742, -21.10114288330078, -19.97221565246582, -18.84328842163086, -17.71436309814453, -16.585433959960938, -15.456506729125977, -14.327579498291016, -13.198652267456055, -12.069725036621094, -10.940797805786133, -9.811871528625488, -8.682944297790527, -7.554018020629883, -6.425090789794922, -5.296163558959961, -4.167236804962158, -3.0383095741271973, -1.9093823432922363, -0.7804555892944336, 0.34847164154052734, 1.4773988723754883, 2.606326103210449, 3.735253095626831, 4.864180088043213, 5.993107318878174, 7.122034549713135, 8.250961303710938, 9.379888534545898, 10.50881576538086, 11.63774299621582, 12.766670227050781, 13.895597457885742, 15.024524688720703, 16.153451919555664, 17.282379150390625, 18.411304473876953, 19.540233612060547, 20.669160842895508, 21.79808807373047, 22.92701530456543, 24.05594253540039, 25.18486976623535, 26.313796997070312, 27.44272232055664, 28.5716495513916, 29.700576782226562, 30.829504013061523, 31.958431243896484, 33.08735656738281, 34.216285705566406, 35.345211029052734, 36.47414016723633, 37.603065490722656, 38.731990814208984, 39.86091995239258, 40.989845275878906, 42.1187744140625, 43.24769973754883, 44.37662887573242, 45.50555419921875, 46.634483337402344]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 12.0, 7.0, 17.0, 22.0, 31.0, 43.0, 77.0, 97.0, 154.0, 285.0, 745.0, 3165.0, 25587.0, 2550589.0, 1587535.0, 21677.0, 2882.0, 677.0, 255.0, 141.0, 79.0, 46.0, 43.0, 32.0, 21.0, 16.0, 14.0, 8.0, 8.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.609375, -8.27783203125, -7.9462890625, -7.61474609375, -7.283203125, -6.95166015625, -6.6201171875, -6.28857421875, -5.95703125, -5.62548828125, -5.2939453125, -4.96240234375, -4.630859375, -4.29931640625, -3.9677734375, -3.63623046875, -3.3046875, -2.97314453125, -2.6416015625, -2.31005859375, -1.978515625, -1.64697265625, -1.3154296875, -0.98388671875, -0.65234375, -0.32080078125, 0.0107421875, 0.34228515625, 0.673828125, 1.00537109375, 1.3369140625, 1.66845703125, 2.0, 2.33154296875, 2.6630859375, 2.99462890625, 3.326171875, 3.65771484375, 3.9892578125, 4.32080078125, 4.65234375, 4.98388671875, 5.3154296875, 5.64697265625, 5.978515625, 6.31005859375, 6.6416015625, 6.97314453125, 7.3046875, 7.63623046875, 7.9677734375, 8.29931640625, 8.630859375, 8.96240234375, 9.2939453125, 9.62548828125, 9.95703125, 10.28857421875, 10.6201171875, 10.95166015625, 11.283203125, 11.61474609375, 11.9462890625, 12.27783203125, 12.609375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 3.0, 7.0, 14.0, 19.0, 24.0, 37.0, 48.0, 47.0, 53.0, 80.0, 96.0, 102.0, 87.0, 88.0, 55.0, 58.0, 49.0, 50.0, 25.0, 19.0, 11.0, 15.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.33203125, -2.23345947265625, -2.1348876953125, -2.03631591796875, -1.937744140625, -1.83917236328125, -1.7406005859375, -1.64202880859375, -1.54345703125, -1.44488525390625, -1.3463134765625, -1.24774169921875, -1.149169921875, -1.05059814453125, -0.9520263671875, -0.85345458984375, -0.7548828125, -0.65631103515625, -0.5577392578125, -0.45916748046875, -0.360595703125, -0.26202392578125, -0.1634521484375, -0.06488037109375, 0.03369140625, 0.13226318359375, 0.2308349609375, 0.32940673828125, 0.427978515625, 0.52655029296875, 0.6251220703125, 0.72369384765625, 0.822265625, 0.92083740234375, 1.0194091796875, 1.11798095703125, 1.216552734375, 1.31512451171875, 1.4136962890625, 1.51226806640625, 1.61083984375, 1.70941162109375, 1.8079833984375, 1.90655517578125, 2.005126953125, 2.10369873046875, 2.2022705078125, 2.30084228515625, 2.3994140625, 2.49798583984375, 2.5965576171875, 2.69512939453125, 2.793701171875, 2.89227294921875, 2.9908447265625, 3.08941650390625, 3.18798828125, 3.28656005859375, 3.3851318359375, 3.48370361328125, 3.582275390625, 3.68084716796875, 3.7794189453125, 3.87799072265625, 3.9765625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 13.0, 9.0, 15.0, 23.0, 32.0, 71.0, 86.0, 178.0, 289.0, 532.0, 961.0, 1864.0, 4022.0, 9011.0, 24135.0, 81905.0, 493380.0, 2954516.0, 501005.0, 81754.0, 24219.0, 9056.0, 3842.0, 1630.0, 816.0, 399.0, 197.0, 132.0, 65.0, 39.0, 21.0, 11.0, 14.0, 7.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.05078125, -3.92987060546875, -3.8089599609375, -3.68804931640625, -3.567138671875, -3.44622802734375, -3.3253173828125, -3.20440673828125, -3.08349609375, -2.96258544921875, -2.8416748046875, -2.72076416015625, -2.599853515625, -2.47894287109375, -2.3580322265625, -2.23712158203125, -2.1162109375, -1.99530029296875, -1.8743896484375, -1.75347900390625, -1.632568359375, -1.51165771484375, -1.3907470703125, -1.26983642578125, -1.14892578125, -1.02801513671875, -0.9071044921875, -0.78619384765625, -0.665283203125, -0.54437255859375, -0.4234619140625, -0.30255126953125, -0.181640625, -0.06072998046875, 0.0601806640625, 0.18109130859375, 0.302001953125, 0.42291259765625, 0.5438232421875, 0.66473388671875, 0.78564453125, 0.90655517578125, 1.0274658203125, 1.14837646484375, 1.269287109375, 1.39019775390625, 1.5111083984375, 1.63201904296875, 1.7529296875, 1.87384033203125, 1.9947509765625, 2.11566162109375, 2.236572265625, 2.35748291015625, 2.4783935546875, 2.59930419921875, 2.72021484375, 2.84112548828125, 2.9620361328125, 3.08294677734375, 3.203857421875, 3.32476806640625, 3.4456787109375, 3.56658935546875, 3.6875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 4.0, 4.0, 5.0, 8.0, 13.0, 10.0, 18.0, 23.0, 28.0, 44.0, 57.0, 117.0, 138.0, 198.0, 351.0, 571.0, 798.0, 572.0, 386.0, 250.0, 153.0, 96.0, 66.0, 42.0, 28.0, 25.0, 16.0, 6.0, 8.0, 10.0, 7.0, 8.0, 4.0, 3.0, 0.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.07421875, -4.94915771484375, -4.8240966796875, -4.69903564453125, -4.573974609375, -4.44891357421875, -4.3238525390625, -4.19879150390625, -4.07373046875, -3.94866943359375, -3.8236083984375, -3.69854736328125, -3.573486328125, -3.44842529296875, -3.3233642578125, -3.19830322265625, -3.0732421875, -2.94818115234375, -2.8231201171875, -2.69805908203125, -2.572998046875, -2.44793701171875, -2.3228759765625, -2.19781494140625, -2.07275390625, -1.94769287109375, -1.8226318359375, -1.69757080078125, -1.572509765625, -1.44744873046875, -1.3223876953125, -1.19732666015625, -1.072265625, -0.94720458984375, -0.8221435546875, -0.69708251953125, -0.572021484375, -0.44696044921875, -0.3218994140625, -0.19683837890625, -0.07177734375, 0.05328369140625, 0.1783447265625, 0.30340576171875, 0.428466796875, 0.55352783203125, 0.6785888671875, 0.80364990234375, 0.9287109375, 1.05377197265625, 1.1788330078125, 1.30389404296875, 1.428955078125, 1.55401611328125, 1.6790771484375, 1.80413818359375, 1.92919921875, 2.05426025390625, 2.1793212890625, 2.30438232421875, 2.429443359375, 2.55450439453125, 2.6795654296875, 2.80462646484375, 2.9296875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 5.0, 16.0, 55.0, 150.0, 289.0, 268.0, 135.0, 44.0, 18.0, 8.0, 0.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.48841857910156, -96.14328002929688, -93.79813385009766, -91.45299530029297, -89.10784912109375, -86.76271057128906, -84.41757202148438, -82.07243347167969, -79.72728729248047, -77.38214874267578, -75.03700256347656, -72.69186401367188, -70.34672546386719, -68.00157928466797, -65.65644073486328, -63.31129837036133, -60.966156005859375, -58.62101364135742, -56.27587127685547, -53.93073272705078, -51.58559036254883, -49.240447998046875, -46.89530944824219, -44.550167083740234, -42.20502471923828, -39.85988235473633, -37.514739990234375, -35.16960144042969, -32.824459075927734, -30.47931671142578, -28.13417625427246, -25.78903579711914, -23.443885803222656, -21.098743438720703, -18.753602981567383, -16.408462524414062, -14.06332015991211, -11.718178749084473, -9.373037338256836, -7.027896881103516, -4.6827545166015625, -2.337613105773926, 0.0075283050537109375, 2.3526697158813477, 4.697811126708984, 7.042952537536621, 9.388093948364258, 11.733234405517578, 14.078376770019531, 16.423519134521484, 18.768659591674805, 21.113800048828125, 23.458942413330078, 25.80408477783203, 28.14922523498535, 30.494365692138672, 32.839508056640625, 35.18465042114258, 37.52979278564453, 39.87493133544922, 42.22007369995117, 44.565216064453125, 46.91035461425781, 49.255496978759766, 51.60063934326172]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 5.0, 9.0, 7.0, 9.0, 7.0, 12.0, 15.0, 18.0, 20.0, 25.0, 24.0, 32.0, 34.0, 46.0, 40.0, 58.0, 46.0, 64.0, 52.0, 62.0, 48.0, 52.0, 46.0, 50.0, 30.0, 29.0, 22.0, 22.0, 35.0, 13.0, 22.0, 10.0, 8.0, 8.0, 7.0, 5.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.821266174316406, -16.20105743408203, -15.580848693847656, -14.960640907287598, -14.340432167053223, -13.720223426818848, -13.100015640258789, -12.479806900024414, -11.859598159790039, -11.239389419555664, -10.619180679321289, -9.99897289276123, -9.378764152526855, -8.75855541229248, -8.138347625732422, -7.518138885498047, -6.897930145263672, -6.277721405029297, -5.65751314163208, -5.037304878234863, -4.417096138000488, -3.7968876361846924, -3.1766791343688965, -2.5564708709716797, -1.9362621307373047, -1.3160536289215088, -0.6958451271057129, -0.07563662528991699, 0.5445718765258789, 1.1647803783416748, 1.7849888801574707, 2.4051971435546875, 3.0254039764404297, 3.6456124782562256, 4.2658209800720215, 4.886029243469238, 5.506237983703613, 6.126446723937988, 6.746654987335205, 7.366863250732422, 7.987071990966797, 8.607280731201172, 9.227489471435547, 9.847697257995605, 10.46790599822998, 11.088114738464355, 11.708322525024414, 12.328531265258789, 12.948740005493164, 13.568948745727539, 14.189157485961914, 14.809365272521973, 15.429574012756348, 16.049781799316406, 16.66999053955078, 17.290199279785156, 17.91040802001953, 18.530616760253906, 19.15082550048828, 19.771034240722656, 20.39124298095703, 21.011449813842773, 21.63165855407715, 22.251867294311523, 22.8720760345459]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 7.0, 5.0, 13.0, 17.0, 20.0, 32.0, 33.0, 54.0, 94.0, 131.0, 227.0, 395.0, 642.0, 1128.0, 2086.0, 3880.0, 7590.0, 15666.0, 33529.0, 75790.0, 188219.0, 357502.0, 207241.0, 83031.0, 36682.0, 17005.0, 8282.0, 4193.0, 2150.0, 1198.0, 640.0, 409.0, 224.0, 137.0, 97.0, 58.0, 45.0, 20.0, 28.0, 19.0, 11.0, 5.0, 4.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.65625, -3.53253173828125, -3.4088134765625, -3.28509521484375, -3.161376953125, -3.03765869140625, -2.9139404296875, -2.79022216796875, -2.66650390625, -2.54278564453125, -2.4190673828125, -2.29534912109375, -2.171630859375, -2.04791259765625, -1.9241943359375, -1.80047607421875, -1.6767578125, -1.55303955078125, -1.4293212890625, -1.30560302734375, -1.181884765625, -1.05816650390625, -0.9344482421875, -0.81072998046875, -0.68701171875, -0.56329345703125, -0.4395751953125, -0.31585693359375, -0.192138671875, -0.06842041015625, 0.0552978515625, 0.17901611328125, 0.302734375, 0.42645263671875, 0.5501708984375, 0.67388916015625, 0.797607421875, 0.92132568359375, 1.0450439453125, 1.16876220703125, 1.29248046875, 1.41619873046875, 1.5399169921875, 1.66363525390625, 1.787353515625, 1.91107177734375, 2.0347900390625, 2.15850830078125, 2.2822265625, 2.40594482421875, 2.5296630859375, 2.65338134765625, 2.777099609375, 2.90081787109375, 3.0245361328125, 3.14825439453125, 3.27197265625, 3.39569091796875, 3.5194091796875, 3.64312744140625, 3.766845703125, 3.89056396484375, 4.0142822265625, 4.13800048828125, 4.26171875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 7.0, 4.0, 8.0, 14.0, 16.0, 19.0, 25.0, 27.0, 42.0, 52.0, 52.0, 60.0, 52.0, 70.0, 73.0, 65.0, 77.0, 50.0, 52.0, 46.0, 49.0, 35.0, 31.0, 18.0, 19.0, 15.0, 8.0, 8.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.123046875, -2.043243408203125, -1.96343994140625, -1.883636474609375, -1.8038330078125, -1.724029541015625, -1.64422607421875, -1.564422607421875, -1.484619140625, -1.404815673828125, -1.32501220703125, -1.245208740234375, -1.1654052734375, -1.085601806640625, -1.00579833984375, -0.925994873046875, -0.84619140625, -0.766387939453125, -0.68658447265625, -0.606781005859375, -0.5269775390625, -0.447174072265625, -0.36737060546875, -0.287567138671875, -0.207763671875, -0.127960205078125, -0.04815673828125, 0.031646728515625, 0.1114501953125, 0.191253662109375, 0.27105712890625, 0.350860595703125, 0.4306640625, 0.510467529296875, 0.59027099609375, 0.670074462890625, 0.7498779296875, 0.829681396484375, 0.90948486328125, 0.989288330078125, 1.069091796875, 1.148895263671875, 1.22869873046875, 1.308502197265625, 1.3883056640625, 1.468109130859375, 1.54791259765625, 1.627716064453125, 1.70751953125, 1.787322998046875, 1.86712646484375, 1.946929931640625, 2.0267333984375, 2.106536865234375, 2.18634033203125, 2.266143798828125, 2.345947265625, 2.425750732421875, 2.50555419921875, 2.585357666015625, 2.6651611328125, 2.744964599609375, 2.82476806640625, 2.904571533203125, 2.984375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 9.0, 7.0, 12.0, 7.0, 29.0, 28.0, 46.0, 68.0, 117.0, 141.0, 220.0, 369.0, 608.0, 1247.0, 2720.0, 8114.0, 30259.0, 145733.0, 642696.0, 167535.0, 33790.0, 8659.0, 3044.0, 1298.0, 681.0, 402.0, 240.0, 159.0, 100.0, 57.0, 47.0, 39.0, 19.0, 16.0, 11.0, 9.0, 6.0, 10.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.38671875, -7.1728515625, -6.958984375, -6.7451171875, -6.53125, -6.3173828125, -6.103515625, -5.8896484375, -5.67578125, -5.4619140625, -5.248046875, -5.0341796875, -4.8203125, -4.6064453125, -4.392578125, -4.1787109375, -3.96484375, -3.7509765625, -3.537109375, -3.3232421875, -3.109375, -2.8955078125, -2.681640625, -2.4677734375, -2.25390625, -2.0400390625, -1.826171875, -1.6123046875, -1.3984375, -1.1845703125, -0.970703125, -0.7568359375, -0.54296875, -0.3291015625, -0.115234375, 0.0986328125, 0.3125, 0.5263671875, 0.740234375, 0.9541015625, 1.16796875, 1.3818359375, 1.595703125, 1.8095703125, 2.0234375, 2.2373046875, 2.451171875, 2.6650390625, 2.87890625, 3.0927734375, 3.306640625, 3.5205078125, 3.734375, 3.9482421875, 4.162109375, 4.3759765625, 4.58984375, 4.8037109375, 5.017578125, 5.2314453125, 5.4453125, 5.6591796875, 5.873046875, 6.0869140625, 6.30078125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 4.0, 2.0, 4.0, 7.0, 9.0, 6.0, 10.0, 7.0, 23.0, 12.0, 18.0, 24.0, 31.0, 24.0, 36.0, 29.0, 30.0, 37.0, 40.0, 47.0, 40.0, 42.0, 37.0, 47.0, 50.0, 36.0, 44.0, 39.0, 35.0, 37.0, 31.0, 34.0, 25.0, 14.0, 22.0, 11.0, 16.0, 11.0, 12.0, 6.0, 3.0, 5.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1484375, -5.9461669921875, -5.743896484375, -5.5416259765625, -5.33935546875, -5.1370849609375, -4.934814453125, -4.7325439453125, -4.5302734375, -4.3280029296875, -4.125732421875, -3.9234619140625, -3.72119140625, -3.5189208984375, -3.316650390625, -3.1143798828125, -2.912109375, -2.7098388671875, -2.507568359375, -2.3052978515625, -2.10302734375, -1.9007568359375, -1.698486328125, -1.4962158203125, -1.2939453125, -1.0916748046875, -0.889404296875, -0.6871337890625, -0.48486328125, -0.2825927734375, -0.080322265625, 0.1219482421875, 0.32421875, 0.5264892578125, 0.728759765625, 0.9310302734375, 1.13330078125, 1.3355712890625, 1.537841796875, 1.7401123046875, 1.9423828125, 2.1446533203125, 2.346923828125, 2.5491943359375, 2.75146484375, 2.9537353515625, 3.156005859375, 3.3582763671875, 3.560546875, 3.7628173828125, 3.965087890625, 4.1673583984375, 4.36962890625, 4.5718994140625, 4.774169921875, 4.9764404296875, 5.1787109375, 5.3809814453125, 5.583251953125, 5.7855224609375, 5.98779296875, 6.1900634765625, 6.392333984375, 6.5946044921875, 6.796875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 1.0, 1.0, 2.0, 10.0, 11.0, 12.0, 12.0, 26.0, 39.0, 70.0, 139.0, 268.0, 505.0, 1283.0, 4256.0, 22372.0, 245997.0, 701865.0, 59871.0, 8134.0, 2120.0, 754.0, 346.0, 161.0, 91.0, 68.0, 31.0, 30.0, 19.0, 14.0, 12.0, 8.0, 4.0, 2.0, 3.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.53515625, -3.4141845703125, -3.293212890625, -3.1722412109375, -3.05126953125, -2.9302978515625, -2.809326171875, -2.6883544921875, -2.5673828125, -2.4464111328125, -2.325439453125, -2.2044677734375, -2.08349609375, -1.9625244140625, -1.841552734375, -1.7205810546875, -1.599609375, -1.4786376953125, -1.357666015625, -1.2366943359375, -1.11572265625, -0.9947509765625, -0.873779296875, -0.7528076171875, -0.6318359375, -0.5108642578125, -0.389892578125, -0.2689208984375, -0.14794921875, -0.0269775390625, 0.093994140625, 0.2149658203125, 0.3359375, 0.4569091796875, 0.577880859375, 0.6988525390625, 0.81982421875, 0.9407958984375, 1.061767578125, 1.1827392578125, 1.3037109375, 1.4246826171875, 1.545654296875, 1.6666259765625, 1.78759765625, 1.9085693359375, 2.029541015625, 2.1505126953125, 2.271484375, 2.3924560546875, 2.513427734375, 2.6343994140625, 2.75537109375, 2.8763427734375, 2.997314453125, 3.1182861328125, 3.2392578125, 3.3602294921875, 3.481201171875, 3.6021728515625, 3.72314453125, 3.8441162109375, 3.965087890625, 4.0860595703125, 4.20703125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 2.0, 6.0, 1.0, 4.0, 6.0, 7.0, 6.0, 10.0, 12.0, 21.0, 18.0, 27.0, 30.0, 36.0, 66.0, 66.0, 92.0, 109.0, 88.0, 84.0, 70.0, 53.0, 34.0, 40.0, 23.0, 18.0, 16.0, 13.0, 10.0, 7.0, 3.0, 7.0, 5.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.000629425048828125, -0.0006122253835201263, -0.0005950257182121277, -0.000577826052904129, -0.0005606263875961304, -0.0005434267222881317, -0.0005262270569801331, -0.0005090273916721344, -0.0004918277263641357, -0.0004746280610561371, -0.00045742839574813843, -0.00044022873044013977, -0.0004230290651321411, -0.00040582939982414246, -0.0003886297345161438, -0.00037143006920814514, -0.0003542304039001465, -0.00033703073859214783, -0.00031983107328414917, -0.0003026314079761505, -0.00028543174266815186, -0.0002682320773601532, -0.00025103241205215454, -0.00023383274674415588, -0.00021663308143615723, -0.00019943341612815857, -0.0001822337508201599, -0.00016503408551216125, -0.0001478344202041626, -0.00013063475489616394, -0.00011343508958816528, -9.623542428016663e-05, -7.903575897216797e-05, -6.183609366416931e-05, -4.4636428356170654e-05, -2.7436763048171997e-05, -1.023709774017334e-05, 6.962567567825317e-06, 2.4162232875823975e-05, 4.136189818382263e-05, 5.856156349182129e-05, 7.576122879981995e-05, 9.29608941078186e-05, 0.00011016055941581726, 0.00012736022472381592, 0.00014455989003181458, 0.00016175955533981323, 0.0001789592206478119, 0.00019615888595581055, 0.0002133585512638092, 0.00023055821657180786, 0.0002477578818798065, 0.0002649575471878052, 0.00028215721249580383, 0.0002993568778038025, 0.00031655654311180115, 0.0003337562084197998, 0.00035095587372779846, 0.0003681555390357971, 0.0003853552043437958, 0.00040255486965179443, 0.0004197545349597931, 0.00043695420026779175, 0.0004541538655757904, 0.00047135353088378906]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 4.0, 9.0, 13.0, 16.0, 26.0, 33.0, 48.0, 75.0, 104.0, 187.0, 331.0, 607.0, 1243.0, 2712.0, 7404.0, 27409.0, 150548.0, 637009.0, 175612.0, 31248.0, 8131.0, 2962.0, 1286.0, 616.0, 351.0, 196.0, 116.0, 76.0, 44.0, 33.0, 28.0, 15.0, 15.0, 9.0, 4.0, 7.0, 7.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.6171875, -2.534210205078125, -2.45123291015625, -2.368255615234375, -2.2852783203125, -2.202301025390625, -2.11932373046875, -2.036346435546875, -1.953369140625, -1.870391845703125, -1.78741455078125, -1.704437255859375, -1.6214599609375, -1.538482666015625, -1.45550537109375, -1.372528076171875, -1.28955078125, -1.206573486328125, -1.12359619140625, -1.040618896484375, -0.9576416015625, -0.874664306640625, -0.79168701171875, -0.708709716796875, -0.625732421875, -0.542755126953125, -0.45977783203125, -0.376800537109375, -0.2938232421875, -0.210845947265625, -0.12786865234375, -0.044891357421875, 0.0380859375, 0.121063232421875, 0.20404052734375, 0.287017822265625, 0.3699951171875, 0.452972412109375, 0.53594970703125, 0.618927001953125, 0.701904296875, 0.784881591796875, 0.86785888671875, 0.950836181640625, 1.0338134765625, 1.116790771484375, 1.19976806640625, 1.282745361328125, 1.36572265625, 1.448699951171875, 1.53167724609375, 1.614654541015625, 1.6976318359375, 1.780609130859375, 1.86358642578125, 1.946563720703125, 2.029541015625, 2.112518310546875, 2.19549560546875, 2.278472900390625, 2.3614501953125, 2.444427490234375, 2.52740478515625, 2.610382080078125, 2.693359375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 4.0, 1.0, 5.0, 5.0, 6.0, 10.0, 11.0, 20.0, 16.0, 28.0, 28.0, 39.0, 62.0, 70.0, 75.0, 86.0, 103.0, 64.0, 84.0, 76.0, 41.0, 46.0, 29.0, 21.0, 18.0, 15.0, 14.0, 4.0, 8.0, 2.0, 5.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.58203125, -2.496856689453125, -2.41168212890625, -2.326507568359375, -2.2413330078125, -2.156158447265625, -2.07098388671875, -1.985809326171875, -1.900634765625, -1.815460205078125, -1.73028564453125, -1.645111083984375, -1.5599365234375, -1.474761962890625, -1.38958740234375, -1.304412841796875, -1.21923828125, -1.134063720703125, -1.04888916015625, -0.963714599609375, -0.8785400390625, -0.793365478515625, -0.70819091796875, -0.623016357421875, -0.537841796875, -0.452667236328125, -0.36749267578125, -0.282318115234375, -0.1971435546875, -0.111968994140625, -0.02679443359375, 0.058380126953125, 0.1435546875, 0.228729248046875, 0.31390380859375, 0.399078369140625, 0.4842529296875, 0.569427490234375, 0.65460205078125, 0.739776611328125, 0.824951171875, 0.910125732421875, 0.99530029296875, 1.080474853515625, 1.1656494140625, 1.250823974609375, 1.33599853515625, 1.421173095703125, 1.50634765625, 1.591522216796875, 1.67669677734375, 1.761871337890625, 1.8470458984375, 1.932220458984375, 2.01739501953125, 2.102569580078125, 2.187744140625, 2.272918701171875, 2.35809326171875, 2.443267822265625, 2.5284423828125, 2.613616943359375, 2.69879150390625, 2.783966064453125, 2.869140625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 31.0, 58.0, 90.0, 140.0, 194.0, 169.0, 124.0, 77.0, 34.0, 24.0, 22.0, 10.0, 5.0, 2.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-53.681007385253906, -51.9290657043457, -50.1771240234375, -48.4251823425293, -46.673240661621094, -44.921295166015625, -43.16935729980469, -41.41741180419922, -39.665470123291016, -37.91352844238281, -36.16158676147461, -34.409645080566406, -32.6577033996582, -30.905759811401367, -29.153818130493164, -27.401874542236328, -25.649934768676758, -23.897993087768555, -22.14605140686035, -20.394107818603516, -18.642166137695312, -16.89022445678711, -15.138282775878906, -13.386340141296387, -11.634398460388184, -9.88245677947998, -8.130514144897461, -6.378572463989258, -4.6266303062438965, -2.874688148498535, -1.122746467590332, 0.6291961669921875, 2.3811378479003906, 4.133080005645752, 5.885022163391113, 7.636963844299316, 9.388906478881836, 11.140848159790039, 12.892789840698242, 14.644732475280762, 16.39667510986328, 18.148616790771484, 19.900558471679688, 21.65250015258789, 23.404443740844727, 25.15638542175293, 26.908327102661133, 28.66027069091797, 30.41221046447754, 32.164154052734375, 33.91609573364258, 35.66803741455078, 37.419979095458984, 39.17192077636719, 40.92386245727539, 42.675804138183594, 44.4277458190918, 46.1796875, 47.9316291809082, 49.683570861816406, 51.43551254272461, 53.18745422363281, 54.93939971923828, 56.691341400146484, 58.44328308105469]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 5.0, 9.0, 8.0, 6.0, 15.0, 13.0, 25.0, 28.0, 34.0, 34.0, 36.0, 49.0, 41.0, 47.0, 59.0, 59.0, 80.0, 56.0, 44.0, 52.0, 40.0, 38.0, 34.0, 35.0, 29.0, 20.0, 22.0, 19.0, 23.0, 10.0, 8.0, 7.0, 3.0, 5.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-36.78886032104492, -35.74620056152344, -34.70354461669922, -33.660884857177734, -32.61822509765625, -31.575565338134766, -30.532907485961914, -29.490249633789062, -28.447589874267578, -27.404930114746094, -26.362272262573242, -25.31961441040039, -24.276954650878906, -23.234294891357422, -22.19163703918457, -21.14897918701172, -20.106319427490234, -19.06365966796875, -18.0210018157959, -16.978343963623047, -15.935684204101562, -14.893025398254395, -13.850366592407227, -12.807707786560059, -11.76504898071289, -10.722390174865723, -9.679731369018555, -8.637072563171387, -7.594413757324219, -6.551754951477051, -5.509096145629883, -4.466437339782715, -3.4237823486328125, -2.3811235427856445, -1.3384647369384766, -0.2958059310913086, 0.7468528747558594, 1.7895116806030273, 2.8321704864501953, 3.8748292922973633, 4.917488098144531, 5.960146903991699, 7.002805709838867, 8.045464515686035, 9.088123321533203, 10.130782127380371, 11.173440933227539, 12.216099739074707, 13.258758544921875, 14.301417350769043, 15.344076156616211, 16.386734008789062, 17.429393768310547, 18.47205352783203, 19.514711380004883, 20.557369232177734, 21.60002899169922, 22.642688751220703, 23.685346603393555, 24.728004455566406, 25.77066421508789, 26.813323974609375, 27.855981826782227, 28.898639678955078, 29.941299438476562]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 3.0, 9.0, 11.0, 23.0, 19.0, 33.0, 56.0, 92.0, 126.0, 206.0, 388.0, 581.0, 1176.0, 2541.0, 5689.0, 14513.0, 41282.0, 144985.0, 775448.0, 2441304.0, 587401.0, 119859.0, 35475.0, 12821.0, 5293.0, 2346.0, 1172.0, 598.0, 331.0, 177.0, 127.0, 59.0, 49.0, 30.0, 17.0, 13.0, 7.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.349609375, -3.25506591796875, -3.1605224609375, -3.06597900390625, -2.971435546875, -2.87689208984375, -2.7823486328125, -2.68780517578125, -2.59326171875, -2.49871826171875, -2.4041748046875, -2.30963134765625, -2.215087890625, -2.12054443359375, -2.0260009765625, -1.93145751953125, -1.8369140625, -1.74237060546875, -1.6478271484375, -1.55328369140625, -1.458740234375, -1.36419677734375, -1.2696533203125, -1.17510986328125, -1.08056640625, -0.98602294921875, -0.8914794921875, -0.79693603515625, -0.702392578125, -0.60784912109375, -0.5133056640625, -0.41876220703125, -0.32421875, -0.22967529296875, -0.1351318359375, -0.04058837890625, 0.053955078125, 0.14849853515625, 0.2430419921875, 0.33758544921875, 0.43212890625, 0.52667236328125, 0.6212158203125, 0.71575927734375, 0.810302734375, 0.90484619140625, 0.9993896484375, 1.09393310546875, 1.1884765625, 1.28302001953125, 1.3775634765625, 1.47210693359375, 1.566650390625, 1.66119384765625, 1.7557373046875, 1.85028076171875, 1.94482421875, 2.03936767578125, 2.1339111328125, 2.22845458984375, 2.322998046875, 2.41754150390625, 2.5120849609375, 2.60662841796875, 2.701171875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 13.0, 13.0, 16.0, 16.0, 19.0, 15.0, 27.0, 29.0, 37.0, 42.0, 52.0, 45.0, 46.0, 51.0, 66.0, 54.0, 47.0, 48.0, 51.0, 38.0, 46.0, 33.0, 34.0, 34.0, 22.0, 18.0, 15.0, 13.0, 12.0, 11.0, 10.0, 5.0, 5.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.88671875, -1.8296356201171875, -1.772552490234375, -1.7154693603515625, -1.65838623046875, -1.6013031005859375, -1.544219970703125, -1.4871368408203125, -1.4300537109375, -1.3729705810546875, -1.315887451171875, -1.2588043212890625, -1.20172119140625, -1.1446380615234375, -1.087554931640625, -1.0304718017578125, -0.973388671875, -0.9163055419921875, -0.859222412109375, -0.8021392822265625, -0.74505615234375, -0.6879730224609375, -0.630889892578125, -0.5738067626953125, -0.5167236328125, -0.4596405029296875, -0.402557373046875, -0.3454742431640625, -0.28839111328125, -0.2313079833984375, -0.174224853515625, -0.1171417236328125, -0.06005859375, -0.0029754638671875, 0.054107666015625, 0.1111907958984375, 0.16827392578125, 0.2253570556640625, 0.282440185546875, 0.3395233154296875, 0.3966064453125, 0.4536895751953125, 0.510772705078125, 0.5678558349609375, 0.62493896484375, 0.6820220947265625, 0.739105224609375, 0.7961883544921875, 0.853271484375, 0.9103546142578125, 0.967437744140625, 1.0245208740234375, 1.08160400390625, 1.1386871337890625, 1.195770263671875, 1.2528533935546875, 1.3099365234375, 1.3670196533203125, 1.424102783203125, 1.4811859130859375, 1.53826904296875, 1.5953521728515625, 1.652435302734375, 1.7095184326171875, 1.7666015625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 3.0, 2.0, 7.0, 21.0, 15.0, 29.0, 43.0, 70.0, 161.0, 294.0, 581.0, 1437.0, 4504.0, 16075.0, 74806.0, 565364.0, 3067149.0, 385240.0, 58888.0, 13451.0, 3816.0, 1276.0, 480.0, 227.0, 128.0, 71.0, 50.0, 25.0, 17.0, 19.0, 3.0, 7.0, 5.0, 1.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.05859375, -4.902587890625, -4.74658203125, -4.590576171875, -4.4345703125, -4.278564453125, -4.12255859375, -3.966552734375, -3.810546875, -3.654541015625, -3.49853515625, -3.342529296875, -3.1865234375, -3.030517578125, -2.87451171875, -2.718505859375, -2.5625, -2.406494140625, -2.25048828125, -2.094482421875, -1.9384765625, -1.782470703125, -1.62646484375, -1.470458984375, -1.314453125, -1.158447265625, -1.00244140625, -0.846435546875, -0.6904296875, -0.534423828125, -0.37841796875, -0.222412109375, -0.06640625, 0.089599609375, 0.24560546875, 0.401611328125, 0.5576171875, 0.713623046875, 0.86962890625, 1.025634765625, 1.181640625, 1.337646484375, 1.49365234375, 1.649658203125, 1.8056640625, 1.961669921875, 2.11767578125, 2.273681640625, 2.4296875, 2.585693359375, 2.74169921875, 2.897705078125, 3.0537109375, 3.209716796875, 3.36572265625, 3.521728515625, 3.677734375, 3.833740234375, 3.98974609375, 4.145751953125, 4.3017578125, 4.457763671875, 4.61376953125, 4.769775390625, 4.92578125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 5.0, 6.0, 7.0, 8.0, 8.0, 8.0, 16.0, 31.0, 33.0, 43.0, 51.0, 67.0, 71.0, 110.0, 159.0, 181.0, 286.0, 389.0, 468.0, 521.0, 402.0, 311.0, 200.0, 145.0, 125.0, 98.0, 76.0, 56.0, 34.0, 40.0, 22.0, 17.0, 18.0, 23.0, 11.0, 6.0, 8.0, 3.0, 4.0, 6.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.763671875, -3.64349365234375, -3.5233154296875, -3.40313720703125, -3.282958984375, -3.16278076171875, -3.0426025390625, -2.92242431640625, -2.80224609375, -2.68206787109375, -2.5618896484375, -2.44171142578125, -2.321533203125, -2.20135498046875, -2.0811767578125, -1.96099853515625, -1.8408203125, -1.72064208984375, -1.6004638671875, -1.48028564453125, -1.360107421875, -1.23992919921875, -1.1197509765625, -0.99957275390625, -0.87939453125, -0.75921630859375, -0.6390380859375, -0.51885986328125, -0.398681640625, -0.27850341796875, -0.1583251953125, -0.03814697265625, 0.08203125, 0.20220947265625, 0.3223876953125, 0.44256591796875, 0.562744140625, 0.68292236328125, 0.8031005859375, 0.92327880859375, 1.04345703125, 1.16363525390625, 1.2838134765625, 1.40399169921875, 1.524169921875, 1.64434814453125, 1.7645263671875, 1.88470458984375, 2.0048828125, 2.12506103515625, 2.2452392578125, 2.36541748046875, 2.485595703125, 2.60577392578125, 2.7259521484375, 2.84613037109375, 2.96630859375, 3.08648681640625, 3.2066650390625, 3.32684326171875, 3.447021484375, 3.56719970703125, 3.6873779296875, 3.80755615234375, 3.927734375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 9.0, 8.0, 28.0, 80.0, 195.0, 290.0, 201.0, 122.0, 41.0, 11.0, 11.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.01600646972656, -64.17169189453125, -61.32737350463867, -58.483055114746094, -55.638736724853516, -52.79441833496094, -49.950103759765625, -47.10578536987305, -44.26146697998047, -41.41714859008789, -38.57283401489258, -35.728515625, -32.88419723510742, -30.039880752563477, -27.19556427001953, -24.351245880126953, -21.50693130493164, -18.662614822387695, -15.818296432495117, -12.973979949951172, -10.12966251373291, -7.285345077514648, -4.441028594970703, -1.596710205078125, 1.2476062774658203, 4.091923713684082, 6.9362406730651855, 9.780557632446289, 12.62487506866455, 15.469192504882812, 18.313508987426758, 21.157827377319336, 24.00214385986328, 26.846460342407227, 29.690778732299805, 32.53509521484375, 35.37941360473633, 38.223731994628906, 41.06804656982422, 43.9123649597168, 46.756683349609375, 49.60100173950195, 52.445316314697266, 55.289634704589844, 58.13395309448242, 60.978271484375, 63.82258605957031, 66.66690063476562, 69.51121520996094, 72.35552978515625, 75.1998519897461, 78.0441665649414, 80.88848114013672, 83.73280334472656, 86.57711791992188, 89.42143249511719, 92.26575469970703, 95.11006927490234, 97.95439147949219, 100.7987060546875, 103.64302062988281, 106.48734283447266, 109.33165740966797, 112.17597961425781, 115.02029418945312]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 5.0, 3.0, 4.0, 13.0, 7.0, 14.0, 29.0, 23.0, 18.0, 32.0, 35.0, 40.0, 47.0, 44.0, 52.0, 50.0, 52.0, 58.0, 50.0, 48.0, 54.0, 53.0, 47.0, 33.0, 34.0, 29.0, 28.0, 22.0, 19.0, 15.0, 9.0, 9.0, 8.0, 4.0, 6.0, 1.0, 6.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.796733856201172, -19.902328491210938, -19.00792121887207, -18.113515853881836, -17.2191104888916, -16.324703216552734, -15.4302978515625, -14.535892486572266, -13.641486167907715, -12.747079849243164, -11.85267448425293, -10.958268165588379, -10.063861846923828, -9.169456481933594, -8.275050163269043, -7.38064432144165, -6.486238479614258, -5.591832637786865, -4.697426795959473, -3.803020477294922, -2.9086146354675293, -2.0142087936401367, -1.119802474975586, -0.22539663314819336, 0.6690092086791992, 1.5634151697158813, 2.4578211307525635, 3.352227210998535, 4.246633052825928, 5.14103889465332, 6.035445213317871, 6.929851055145264, 7.824256896972656, 8.718663215637207, 9.613068580627441, 10.507474899291992, 11.401880264282227, 12.296286582946777, 13.190692901611328, 14.085098266601562, 14.979504585266113, 15.873910903930664, 16.7683162689209, 17.662723541259766, 18.55712890625, 19.451534271240234, 20.34593963623047, 21.240346908569336, 22.13475227355957, 23.029157638549805, 23.923564910888672, 24.817970275878906, 25.71237564086914, 26.606781005859375, 27.501188278198242, 28.395593643188477, 29.290000915527344, 30.184406280517578, 31.078813552856445, 31.97321891784668, 32.86762619018555, 33.76203155517578, 34.656436920166016, 35.55084228515625, 36.445247650146484]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 1.0, 4.0, 2.0, 6.0, 3.0, 3.0, 9.0, 15.0, 27.0, 35.0, 38.0, 71.0, 110.0, 147.0, 216.0, 314.0, 546.0, 1009.0, 1700.0, 3013.0, 6028.0, 12345.0, 26149.0, 54919.0, 114895.0, 238075.0, 292168.0, 154186.0, 73846.0, 34804.0, 16511.0, 8177.0, 4011.0, 2139.0, 1151.0, 693.0, 405.0, 231.0, 176.0, 106.0, 86.0, 44.0, 37.0, 25.0, 32.0, 10.0, 12.0, 15.0, 3.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.455078125, -3.340667724609375, -3.22625732421875, -3.111846923828125, -2.9974365234375, -2.883026123046875, -2.76861572265625, -2.654205322265625, -2.539794921875, -2.425384521484375, -2.31097412109375, -2.196563720703125, -2.0821533203125, -1.967742919921875, -1.85333251953125, -1.738922119140625, -1.62451171875, -1.510101318359375, -1.39569091796875, -1.281280517578125, -1.1668701171875, -1.052459716796875, -0.93804931640625, -0.823638916015625, -0.709228515625, -0.594818115234375, -0.48040771484375, -0.365997314453125, -0.2515869140625, -0.137176513671875, -0.02276611328125, 0.091644287109375, 0.2060546875, 0.320465087890625, 0.43487548828125, 0.549285888671875, 0.6636962890625, 0.778106689453125, 0.89251708984375, 1.006927490234375, 1.121337890625, 1.235748291015625, 1.35015869140625, 1.464569091796875, 1.5789794921875, 1.693389892578125, 1.80780029296875, 1.922210693359375, 2.03662109375, 2.151031494140625, 2.26544189453125, 2.379852294921875, 2.4942626953125, 2.608673095703125, 2.72308349609375, 2.837493896484375, 2.951904296875, 3.066314697265625, 3.18072509765625, 3.295135498046875, 3.4095458984375, 3.523956298828125, 3.63836669921875, 3.752777099609375, 3.8671875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 7.0, 9.0, 5.0, 9.0, 7.0, 13.0, 10.0, 14.0, 20.0, 22.0, 19.0, 33.0, 26.0, 24.0, 36.0, 40.0, 41.0, 46.0, 37.0, 51.0, 45.0, 38.0, 55.0, 29.0, 29.0, 35.0, 38.0, 33.0, 23.0, 37.0, 25.0, 20.0, 19.0, 16.0, 14.0, 16.0, 13.0, 8.0, 7.0, 6.0, 3.0, 7.0, 3.0, 0.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.474609375, -1.4265289306640625, -1.378448486328125, -1.3303680419921875, -1.28228759765625, -1.2342071533203125, -1.186126708984375, -1.1380462646484375, -1.0899658203125, -1.0418853759765625, -0.993804931640625, -0.9457244873046875, -0.89764404296875, -0.8495635986328125, -0.801483154296875, -0.7534027099609375, -0.705322265625, -0.6572418212890625, -0.609161376953125, -0.5610809326171875, -0.51300048828125, -0.4649200439453125, -0.416839599609375, -0.3687591552734375, -0.3206787109375, -0.2725982666015625, -0.224517822265625, -0.1764373779296875, -0.12835693359375, -0.0802764892578125, -0.032196044921875, 0.0158843994140625, 0.06396484375, 0.1120452880859375, 0.160125732421875, 0.2082061767578125, 0.25628662109375, 0.3043670654296875, 0.352447509765625, 0.4005279541015625, 0.4486083984375, 0.4966888427734375, 0.544769287109375, 0.5928497314453125, 0.64093017578125, 0.6890106201171875, 0.737091064453125, 0.7851715087890625, 0.833251953125, 0.8813323974609375, 0.929412841796875, 0.9774932861328125, 1.02557373046875, 1.0736541748046875, 1.121734619140625, 1.1698150634765625, 1.2178955078125, 1.2659759521484375, 1.314056396484375, 1.3621368408203125, 1.41021728515625, 1.4582977294921875, 1.506378173828125, 1.5544586181640625, 1.6025390625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 8.0, 5.0, 17.0, 16.0, 24.0, 35.0, 71.0, 85.0, 127.0, 191.0, 279.0, 449.0, 738.0, 1266.0, 2429.0, 6122.0, 25747.0, 195463.0, 701937.0, 90027.0, 14522.0, 4119.0, 1948.0, 1080.0, 649.0, 346.0, 279.0, 188.0, 137.0, 84.0, 47.0, 41.0, 25.0, 23.0, 15.0, 7.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4609375, -8.181884765625, -7.90283203125, -7.623779296875, -7.3447265625, -7.065673828125, -6.78662109375, -6.507568359375, -6.228515625, -5.949462890625, -5.67041015625, -5.391357421875, -5.1123046875, -4.833251953125, -4.55419921875, -4.275146484375, -3.99609375, -3.717041015625, -3.43798828125, -3.158935546875, -2.8798828125, -2.600830078125, -2.32177734375, -2.042724609375, -1.763671875, -1.484619140625, -1.20556640625, -0.926513671875, -0.6474609375, -0.368408203125, -0.08935546875, 0.189697265625, 0.46875, 0.747802734375, 1.02685546875, 1.305908203125, 1.5849609375, 1.864013671875, 2.14306640625, 2.422119140625, 2.701171875, 2.980224609375, 3.25927734375, 3.538330078125, 3.8173828125, 4.096435546875, 4.37548828125, 4.654541015625, 4.93359375, 5.212646484375, 5.49169921875, 5.770751953125, 6.0498046875, 6.328857421875, 6.60791015625, 6.886962890625, 7.166015625, 7.445068359375, 7.72412109375, 8.003173828125, 8.2822265625, 8.561279296875, 8.84033203125, 9.119384765625, 9.3984375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 3.0, 6.0, 4.0, 6.0, 4.0, 10.0, 12.0, 11.0, 18.0, 19.0, 23.0, 36.0, 25.0, 26.0, 39.0, 45.0, 44.0, 49.0, 50.0, 51.0, 47.0, 33.0, 41.0, 44.0, 36.0, 40.0, 46.0, 32.0, 18.0, 27.0, 19.0, 17.0, 32.0, 16.0, 10.0, 9.0, 5.0, 10.0, 8.0, 9.0, 6.0, 5.0, 1.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.06640625, -6.8359375, -6.60546875, -6.375, -6.14453125, -5.9140625, -5.68359375, -5.453125, -5.22265625, -4.9921875, -4.76171875, -4.53125, -4.30078125, -4.0703125, -3.83984375, -3.609375, -3.37890625, -3.1484375, -2.91796875, -2.6875, -2.45703125, -2.2265625, -1.99609375, -1.765625, -1.53515625, -1.3046875, -1.07421875, -0.84375, -0.61328125, -0.3828125, -0.15234375, 0.078125, 0.30859375, 0.5390625, 0.76953125, 1.0, 1.23046875, 1.4609375, 1.69140625, 1.921875, 2.15234375, 2.3828125, 2.61328125, 2.84375, 3.07421875, 3.3046875, 3.53515625, 3.765625, 3.99609375, 4.2265625, 4.45703125, 4.6875, 4.91796875, 5.1484375, 5.37890625, 5.609375, 5.83984375, 6.0703125, 6.30078125, 6.53125, 6.76171875, 6.9921875, 7.22265625, 7.453125, 7.68359375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 2.0, 4.0, 9.0, 11.0, 17.0, 23.0, 32.0, 55.0, 111.0, 231.0, 643.0, 2551.0, 23112.0, 725510.0, 281181.0, 12363.0, 1732.0, 515.0, 205.0, 91.0, 55.0, 33.0, 20.0, 17.0, 12.0, 7.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.58984375, -5.43829345703125, -5.2867431640625, -5.13519287109375, -4.983642578125, -4.83209228515625, -4.6805419921875, -4.52899169921875, -4.37744140625, -4.22589111328125, -4.0743408203125, -3.92279052734375, -3.771240234375, -3.61968994140625, -3.4681396484375, -3.31658935546875, -3.1650390625, -3.01348876953125, -2.8619384765625, -2.71038818359375, -2.558837890625, -2.40728759765625, -2.2557373046875, -2.10418701171875, -1.95263671875, -1.80108642578125, -1.6495361328125, -1.49798583984375, -1.346435546875, -1.19488525390625, -1.0433349609375, -0.89178466796875, -0.740234375, -0.58868408203125, -0.4371337890625, -0.28558349609375, -0.134033203125, 0.01751708984375, 0.1690673828125, 0.32061767578125, 0.47216796875, 0.62371826171875, 0.7752685546875, 0.92681884765625, 1.078369140625, 1.22991943359375, 1.3814697265625, 1.53302001953125, 1.6845703125, 1.83612060546875, 1.9876708984375, 2.13922119140625, 2.290771484375, 2.44232177734375, 2.5938720703125, 2.74542236328125, 2.89697265625, 3.04852294921875, 3.2000732421875, 3.35162353515625, 3.503173828125, 3.65472412109375, 3.8062744140625, 3.95782470703125, 4.109375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 6.0, 8.0, 5.0, 9.0, 6.0, 6.0, 12.0, 13.0, 17.0, 13.0, 21.0, 15.0, 27.0, 12.0, 27.0, 37.0, 50.0, 66.0, 86.0, 91.0, 90.0, 52.0, 55.0, 34.0, 35.0, 32.0, 25.0, 22.0, 19.0, 18.0, 13.0, 15.0, 11.0, 11.0, 6.0, 8.0, 7.0, 4.0, 6.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.0005679130554199219, -0.0005521290004253387, -0.0005363449454307556, -0.0005205608904361725, -0.0005047768354415894, -0.0004889927804470062, -0.0004732087254524231, -0.00045742467045783997, -0.00044164061546325684, -0.0004258565604686737, -0.0004100725054740906, -0.00039428845047950745, -0.0003785043954849243, -0.0003627203404903412, -0.00034693628549575806, -0.0003311522305011749, -0.0003153681755065918, -0.00029958412051200867, -0.00028380006551742554, -0.0002680160105228424, -0.0002522319555282593, -0.00023644790053367615, -0.00022066384553909302, -0.0002048797905445099, -0.00018909573554992676, -0.00017331168055534363, -0.0001575276255607605, -0.00014174357056617737, -0.00012595951557159424, -0.00011017546057701111, -9.439140558242798e-05, -7.860735058784485e-05, -6.282329559326172e-05, -4.703924059867859e-05, -3.125518560409546e-05, -1.547113060951233e-05, 3.129243850708008e-07, 1.609697937965393e-05, 3.188103437423706e-05, 4.766508936882019e-05, 6.344914436340332e-05, 7.923319935798645e-05, 9.501725435256958e-05, 0.00011080130934715271, 0.00012658536434173584, 0.00014236941933631897, 0.0001581534743309021, 0.00017393752932548523, 0.00018972158432006836, 0.0002055056393146515, 0.00022128969430923462, 0.00023707374930381775, 0.0002528578042984009, 0.000268641859292984, 0.00028442591428756714, 0.00030020996928215027, 0.0003159940242767334, 0.00033177807927131653, 0.00034756213426589966, 0.0003633461892604828, 0.0003791302442550659, 0.00039491429924964905, 0.0004106983542442322, 0.0004264824092388153, 0.00044226646423339844]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 5.0, 14.0, 11.0, 19.0, 33.0, 45.0, 110.0, 161.0, 292.0, 683.0, 1611.0, 4548.0, 21678.0, 271721.0, 696889.0, 40394.0, 6690.0, 1927.0, 835.0, 402.0, 198.0, 99.0, 72.0, 41.0, 28.0, 16.0, 6.0, 8.0, 7.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.916015625, -3.80133056640625, -3.6866455078125, -3.57196044921875, -3.457275390625, -3.34259033203125, -3.2279052734375, -3.11322021484375, -2.99853515625, -2.88385009765625, -2.7691650390625, -2.65447998046875, -2.539794921875, -2.42510986328125, -2.3104248046875, -2.19573974609375, -2.0810546875, -1.96636962890625, -1.8516845703125, -1.73699951171875, -1.622314453125, -1.50762939453125, -1.3929443359375, -1.27825927734375, -1.16357421875, -1.04888916015625, -0.9342041015625, -0.81951904296875, -0.704833984375, -0.59014892578125, -0.4754638671875, -0.36077880859375, -0.24609375, -0.13140869140625, -0.0167236328125, 0.09796142578125, 0.212646484375, 0.32733154296875, 0.4420166015625, 0.55670166015625, 0.67138671875, 0.78607177734375, 0.9007568359375, 1.01544189453125, 1.130126953125, 1.24481201171875, 1.3594970703125, 1.47418212890625, 1.5888671875, 1.70355224609375, 1.8182373046875, 1.93292236328125, 2.047607421875, 2.16229248046875, 2.2769775390625, 2.39166259765625, 2.50634765625, 2.62103271484375, 2.7357177734375, 2.85040283203125, 2.965087890625, 3.07977294921875, 3.1944580078125, 3.30914306640625, 3.423828125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 6.0, 2.0, 7.0, 7.0, 10.0, 7.0, 4.0, 16.0, 18.0, 20.0, 19.0, 33.0, 29.0, 40.0, 51.0, 52.0, 65.0, 59.0, 72.0, 63.0, 68.0, 55.0, 42.0, 47.0, 33.0, 37.0, 24.0, 14.0, 15.0, 23.0, 16.0, 7.0, 9.0, 7.0, 6.0, 3.0, 1.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.048828125, -1.993743896484375, -1.93865966796875, -1.883575439453125, -1.8284912109375, -1.773406982421875, -1.71832275390625, -1.663238525390625, -1.608154296875, -1.553070068359375, -1.49798583984375, -1.442901611328125, -1.3878173828125, -1.332733154296875, -1.27764892578125, -1.222564697265625, -1.16748046875, -1.112396240234375, -1.05731201171875, -1.002227783203125, -0.9471435546875, -0.892059326171875, -0.83697509765625, -0.781890869140625, -0.726806640625, -0.671722412109375, -0.61663818359375, -0.561553955078125, -0.5064697265625, -0.451385498046875, -0.39630126953125, -0.341217041015625, -0.2861328125, -0.231048583984375, -0.17596435546875, -0.120880126953125, -0.0657958984375, -0.010711669921875, 0.04437255859375, 0.099456787109375, 0.154541015625, 0.209625244140625, 0.26470947265625, 0.319793701171875, 0.3748779296875, 0.429962158203125, 0.48504638671875, 0.540130615234375, 0.59521484375, 0.650299072265625, 0.70538330078125, 0.760467529296875, 0.8155517578125, 0.870635986328125, 0.92572021484375, 0.980804443359375, 1.035888671875, 1.090972900390625, 1.14605712890625, 1.201141357421875, 1.2562255859375, 1.311309814453125, 1.36639404296875, 1.421478271484375, 1.4765625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 10.0, 10.0, 29.0, 40.0, 91.0, 138.0, 233.0, 183.0, 123.0, 65.0, 42.0, 8.0, 7.0, 9.0, 1.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.40824890136719, -40.45799255371094, -38.50773620605469, -36.55747985839844, -34.60722351074219, -32.65696716308594, -30.706710815429688, -28.756454467773438, -26.806198120117188, -24.855941772460938, -22.905685424804688, -20.955429077148438, -19.005172729492188, -17.054916381835938, -15.104660034179688, -13.154403686523438, -11.204147338867188, -9.253890991210938, -7.3036346435546875, -5.3533782958984375, -3.4031219482421875, -1.4528656005859375, 0.4973907470703125, 2.4476470947265625, 4.3979034423828125, 6.3481597900390625, 8.298416137695312, 10.248672485351562, 12.198928833007812, 14.149185180664062, 16.099441528320312, 18.049697875976562, 19.999954223632812, 21.950210571289062, 23.900466918945312, 25.850723266601562, 27.800979614257812, 29.751235961914062, 31.701492309570312, 33.65174865722656, 35.60200500488281, 37.55226135253906, 39.50251770019531, 41.45277404785156, 43.40303039550781, 45.35328674316406, 47.30354309082031, 49.25379943847656, 51.20405578613281, 53.15431213378906, 55.10456848144531, 57.05482482910156, 59.00508117675781, 60.95533752441406, 62.90559387207031, 64.85585021972656, 66.80610656738281, 68.75636291503906, 70.70661926269531, 72.65687561035156, 74.60713195800781, 76.55738830566406, 78.50764465332031, 80.45790100097656, 82.40815734863281]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 5.0, 4.0, 6.0, 12.0, 17.0, 15.0, 21.0, 26.0, 24.0, 31.0, 35.0, 41.0, 41.0, 56.0, 82.0, 81.0, 82.0, 66.0, 43.0, 45.0, 39.0, 41.0, 28.0, 33.0, 22.0, 23.0, 17.0, 13.0, 9.0, 16.0, 8.0, 3.0, 5.0, 2.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-41.92070388793945, -40.75674057006836, -39.592777252197266, -38.42881393432617, -37.26485061645508, -36.10088348388672, -34.936920166015625, -33.77295684814453, -32.60899353027344, -31.445030212402344, -30.28106689453125, -29.117103576660156, -27.95313835144043, -26.789175033569336, -25.625211715698242, -24.461246490478516, -23.297285079956055, -22.13332176208496, -20.969358444213867, -19.80539321899414, -18.641429901123047, -17.477466583251953, -16.31350326538086, -15.14953899383545, -13.985575675964355, -12.821612358093262, -11.657648086547852, -10.493684768676758, -9.329721450805664, -8.165757179260254, -7.00179386138916, -5.83782958984375, -4.673866271972656, -3.5099024772644043, -2.3459389209747314, -1.1819753646850586, -0.01801156997680664, 1.1459522247314453, 2.309915542602539, 3.473879814147949, 4.637843132019043, 5.801806926727295, 6.965770721435547, 8.12973403930664, 9.293697357177734, 10.457661628723145, 11.621624946594238, 12.785589218139648, 13.949552536010742, 15.113515853881836, 16.27747917175293, 17.441444396972656, 18.60540771484375, 19.769371032714844, 20.933334350585938, 22.09729766845703, 23.261260986328125, 24.42522430419922, 25.589187622070312, 26.753150939941406, 27.917116165161133, 29.081079483032227, 30.24504280090332, 31.409008026123047, 32.57297134399414]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 5.0, 3.0, 5.0, 7.0, 7.0, 14.0, 18.0, 24.0, 56.0, 61.0, 133.0, 241.0, 485.0, 1089.0, 2572.0, 7455.0, 24437.0, 101632.0, 830850.0, 2793220.0, 349407.0, 58387.0, 15671.0, 5059.0, 1893.0, 749.0, 372.0, 203.0, 103.0, 53.0, 22.0, 15.0, 11.0, 14.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.61328125, -4.498870849609375, -4.38446044921875, -4.270050048828125, -4.1556396484375, -4.041229248046875, -3.92681884765625, -3.812408447265625, -3.697998046875, -3.583587646484375, -3.46917724609375, -3.354766845703125, -3.2403564453125, -3.125946044921875, -3.01153564453125, -2.897125244140625, -2.78271484375, -2.668304443359375, -2.55389404296875, -2.439483642578125, -2.3250732421875, -2.210662841796875, -2.09625244140625, -1.981842041015625, -1.867431640625, -1.753021240234375, -1.63861083984375, -1.524200439453125, -1.4097900390625, -1.295379638671875, -1.18096923828125, -1.066558837890625, -0.9521484375, -0.837738037109375, -0.72332763671875, -0.608917236328125, -0.4945068359375, -0.380096435546875, -0.26568603515625, -0.151275634765625, -0.036865234375, 0.077545166015625, 0.19195556640625, 0.306365966796875, 0.4207763671875, 0.535186767578125, 0.64959716796875, 0.764007568359375, 0.87841796875, 0.992828369140625, 1.10723876953125, 1.221649169921875, 1.3360595703125, 1.450469970703125, 1.56488037109375, 1.679290771484375, 1.793701171875, 1.908111572265625, 2.02252197265625, 2.136932373046875, 2.2513427734375, 2.365753173828125, 2.48016357421875, 2.594573974609375, 2.708984375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 6.0, 10.0, 6.0, 15.0, 13.0, 22.0, 28.0, 34.0, 45.0, 40.0, 60.0, 42.0, 63.0, 82.0, 69.0, 60.0, 57.0, 62.0, 61.0, 46.0, 34.0, 36.0, 36.0, 35.0, 24.0, 6.0, 8.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.50390625, -1.423492431640625, -1.34307861328125, -1.262664794921875, -1.1822509765625, -1.101837158203125, -1.02142333984375, -0.941009521484375, -0.860595703125, -0.780181884765625, -0.69976806640625, -0.619354248046875, -0.5389404296875, -0.458526611328125, -0.37811279296875, -0.297698974609375, -0.21728515625, -0.136871337890625, -0.05645751953125, 0.023956298828125, 0.1043701171875, 0.184783935546875, 0.26519775390625, 0.345611572265625, 0.426025390625, 0.506439208984375, 0.58685302734375, 0.667266845703125, 0.7476806640625, 0.828094482421875, 0.90850830078125, 0.988922119140625, 1.0693359375, 1.149749755859375, 1.23016357421875, 1.310577392578125, 1.3909912109375, 1.471405029296875, 1.55181884765625, 1.632232666015625, 1.712646484375, 1.793060302734375, 1.87347412109375, 1.953887939453125, 2.0343017578125, 2.114715576171875, 2.19512939453125, 2.275543212890625, 2.35595703125, 2.436370849609375, 2.51678466796875, 2.597198486328125, 2.6776123046875, 2.758026123046875, 2.83843994140625, 2.918853759765625, 2.999267578125, 3.079681396484375, 3.16009521484375, 3.240509033203125, 3.3209228515625, 3.401336669921875, 3.48175048828125, 3.562164306640625, 3.642578125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 4.0, 3.0, 5.0, 3.0, 8.0, 13.0, 19.0, 23.0, 32.0, 67.0, 100.0, 183.0, 378.0, 767.0, 1591.0, 3916.0, 10310.0, 32050.0, 132915.0, 1209863.0, 2513545.0, 225788.0, 43402.0, 12247.0, 4083.0, 1599.0, 707.0, 286.0, 139.0, 88.0, 55.0, 42.0, 17.0, 18.0, 7.0, 9.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.03125, -3.8975830078125, -3.763916015625, -3.6302490234375, -3.49658203125, -3.3629150390625, -3.229248046875, -3.0955810546875, -2.9619140625, -2.8282470703125, -2.694580078125, -2.5609130859375, -2.42724609375, -2.2935791015625, -2.159912109375, -2.0262451171875, -1.892578125, -1.7589111328125, -1.625244140625, -1.4915771484375, -1.35791015625, -1.2242431640625, -1.090576171875, -0.9569091796875, -0.8232421875, -0.6895751953125, -0.555908203125, -0.4222412109375, -0.28857421875, -0.1549072265625, -0.021240234375, 0.1124267578125, 0.24609375, 0.3797607421875, 0.513427734375, 0.6470947265625, 0.78076171875, 0.9144287109375, 1.048095703125, 1.1817626953125, 1.3154296875, 1.4490966796875, 1.582763671875, 1.7164306640625, 1.85009765625, 1.9837646484375, 2.117431640625, 2.2510986328125, 2.384765625, 2.5184326171875, 2.652099609375, 2.7857666015625, 2.91943359375, 3.0531005859375, 3.186767578125, 3.3204345703125, 3.4541015625, 3.5877685546875, 3.721435546875, 3.8551025390625, 3.98876953125, 4.1224365234375, 4.256103515625, 4.3897705078125, 4.5234375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 4.0, 9.0, 9.0, 18.0, 11.0, 8.0, 22.0, 35.0, 34.0, 57.0, 72.0, 112.0, 142.0, 250.0, 360.0, 518.0, 653.0, 603.0, 381.0, 274.0, 158.0, 105.0, 68.0, 44.0, 37.0, 25.0, 12.0, 10.0, 8.0, 4.0, 5.0, 6.0, 2.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.28515625, -5.13653564453125, -4.9879150390625, -4.83929443359375, -4.690673828125, -4.54205322265625, -4.3934326171875, -4.24481201171875, -4.09619140625, -3.94757080078125, -3.7989501953125, -3.65032958984375, -3.501708984375, -3.35308837890625, -3.2044677734375, -3.05584716796875, -2.9072265625, -2.75860595703125, -2.6099853515625, -2.46136474609375, -2.312744140625, -2.16412353515625, -2.0155029296875, -1.86688232421875, -1.71826171875, -1.56964111328125, -1.4210205078125, -1.27239990234375, -1.123779296875, -0.97515869140625, -0.8265380859375, -0.67791748046875, -0.529296875, -0.38067626953125, -0.2320556640625, -0.08343505859375, 0.065185546875, 0.21380615234375, 0.3624267578125, 0.51104736328125, 0.65966796875, 0.80828857421875, 0.9569091796875, 1.10552978515625, 1.254150390625, 1.40277099609375, 1.5513916015625, 1.70001220703125, 1.8486328125, 1.99725341796875, 2.1458740234375, 2.29449462890625, 2.443115234375, 2.59173583984375, 2.7403564453125, 2.88897705078125, 3.03759765625, 3.18621826171875, 3.3348388671875, 3.48345947265625, 3.632080078125, 3.78070068359375, 3.9293212890625, 4.07794189453125, 4.2265625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 5.0, 8.0, 10.0, 9.0, 26.0, 114.0, 266.0, 347.0, 162.0, 33.0, 19.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-164.81997680664062, -161.60415649414062, -158.38832092285156, -155.1724853515625, -151.9566650390625, -148.7408447265625, -145.52500915527344, -142.30917358398438, -139.09335327148438, -135.87753295898438, -132.6616973876953, -129.44586181640625, -126.23004150390625, -123.01421356201172, -119.79838562011719, -116.58255767822266, -113.36672973632812, -110.1509017944336, -106.93507385253906, -103.71924591064453, -100.50341796875, -97.28759002685547, -94.07176208496094, -90.8559341430664, -87.64010620117188, -84.42427825927734, -81.20845031738281, -77.99262237548828, -74.77679443359375, -71.56096649169922, -68.34513854980469, -65.12931060791016, -61.913490295410156, -58.697662353515625, -55.481834411621094, -52.26600646972656, -49.05017852783203, -45.8343505859375, -42.61852264404297, -39.40269470214844, -36.186866760253906, -32.971038818359375, -29.755210876464844, -26.539382934570312, -23.32355499267578, -20.10772705078125, -16.89189910888672, -13.676071166992188, -10.460243225097656, -7.244415283203125, -4.028587341308594, -0.8127593994140625, 2.4030685424804688, 5.618896484375, 8.834724426269531, 12.050552368164062, 15.266380310058594, 18.482208251953125, 21.698036193847656, 24.913864135742188, 28.12969207763672, 31.34552001953125, 34.56134796142578, 37.77717590332031, 40.993003845214844]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 2.0, 7.0, 4.0, 7.0, 7.0, 2.0, 5.0, 8.0, 17.0, 11.0, 10.0, 17.0, 18.0, 25.0, 28.0, 28.0, 29.0, 37.0, 35.0, 56.0, 50.0, 29.0, 44.0, 44.0, 42.0, 54.0, 37.0, 36.0, 42.0, 31.0, 30.0, 31.0, 24.0, 26.0, 26.0, 20.0, 12.0, 15.0, 15.0, 8.0, 9.0, 8.0, 5.0, 6.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.373092651367188, -20.643953323364258, -19.914812088012695, -19.185672760009766, -18.456533432006836, -17.727394104003906, -16.998252868652344, -16.269113540649414, -15.539973258972168, -14.810832977294922, -14.081693649291992, -13.352553367614746, -12.6234130859375, -11.89427375793457, -11.165133476257324, -10.435993194580078, -9.706853866577148, -8.977713584899902, -8.248574256896973, -7.519433975219727, -6.790294170379639, -6.061154365539551, -5.332014083862305, -4.602874279022217, -3.873734474182129, -3.144594669342041, -2.415454626083374, -1.686314582824707, -0.9571747779846191, -0.22803497314453125, 0.5011053085327148, 1.2302451133728027, 1.9593868255615234, 2.6885266304016113, 3.4176666736602783, 4.146806716918945, 4.875946521759033, 5.605086326599121, 6.334226608276367, 7.063366413116455, 7.792506217956543, 8.521646499633789, 9.250785827636719, 9.979926109313965, 10.709066390991211, 11.43820571899414, 12.167346000671387, 12.896486282348633, 13.625625610351562, 14.354765892028809, 15.083905220031738, 15.813045501708984, 16.542184829711914, 17.271324157714844, 18.000465393066406, 18.729604721069336, 19.458744049072266, 20.187883377075195, 20.917024612426758, 21.646163940429688, 22.375303268432617, 23.104442596435547, 23.83358383178711, 24.56272315979004, 25.2918643951416]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 13.0, 14.0, 20.0, 28.0, 26.0, 57.0, 56.0, 86.0, 142.0, 279.0, 465.0, 724.0, 1354.0, 2435.0, 4357.0, 8448.0, 17760.0, 40754.0, 99044.0, 259759.0, 347937.0, 153615.0, 60284.0, 26058.0, 11793.0, 5761.0, 3117.0, 1702.0, 911.0, 596.0, 376.0, 190.0, 119.0, 75.0, 60.0, 34.0, 29.0, 12.0, 21.0, 14.0, 8.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.892578125, -3.77178955078125, -3.6510009765625, -3.53021240234375, -3.409423828125, -3.28863525390625, -3.1678466796875, -3.04705810546875, -2.92626953125, -2.80548095703125, -2.6846923828125, -2.56390380859375, -2.443115234375, -2.32232666015625, -2.2015380859375, -2.08074951171875, -1.9599609375, -1.83917236328125, -1.7183837890625, -1.59759521484375, -1.476806640625, -1.35601806640625, -1.2352294921875, -1.11444091796875, -0.99365234375, -0.87286376953125, -0.7520751953125, -0.63128662109375, -0.510498046875, -0.38970947265625, -0.2689208984375, -0.14813232421875, -0.02734375, 0.09344482421875, 0.2142333984375, 0.33502197265625, 0.455810546875, 0.57659912109375, 0.6973876953125, 0.81817626953125, 0.93896484375, 1.05975341796875, 1.1805419921875, 1.30133056640625, 1.422119140625, 1.54290771484375, 1.6636962890625, 1.78448486328125, 1.9052734375, 2.02606201171875, 2.1468505859375, 2.26763916015625, 2.388427734375, 2.50921630859375, 2.6300048828125, 2.75079345703125, 2.87158203125, 2.99237060546875, 3.1131591796875, 3.23394775390625, 3.354736328125, 3.47552490234375, 3.5963134765625, 3.71710205078125, 3.837890625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 2.0, 2.0, 4.0, 7.0, 7.0, 12.0, 13.0, 11.0, 17.0, 25.0, 26.0, 31.0, 38.0, 38.0, 41.0, 46.0, 41.0, 35.0, 59.0, 52.0, 42.0, 47.0, 44.0, 43.0, 48.0, 40.0, 37.0, 36.0, 35.0, 22.0, 21.0, 15.0, 16.0, 11.0, 13.0, 12.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.865234375, -1.8049468994140625, -1.744659423828125, -1.6843719482421875, -1.62408447265625, -1.5637969970703125, -1.503509521484375, -1.4432220458984375, -1.3829345703125, -1.3226470947265625, -1.262359619140625, -1.2020721435546875, -1.14178466796875, -1.0814971923828125, -1.021209716796875, -0.9609222412109375, -0.900634765625, -0.8403472900390625, -0.780059814453125, -0.7197723388671875, -0.65948486328125, -0.5991973876953125, -0.538909912109375, -0.4786224365234375, -0.4183349609375, -0.3580474853515625, -0.297760009765625, -0.2374725341796875, -0.17718505859375, -0.1168975830078125, -0.056610107421875, 0.0036773681640625, 0.06396484375, 0.1242523193359375, 0.184539794921875, 0.2448272705078125, 0.30511474609375, 0.3654022216796875, 0.425689697265625, 0.4859771728515625, 0.5462646484375, 0.6065521240234375, 0.666839599609375, 0.7271270751953125, 0.78741455078125, 0.8477020263671875, 0.907989501953125, 0.9682769775390625, 1.028564453125, 1.0888519287109375, 1.149139404296875, 1.2094268798828125, 1.26971435546875, 1.3300018310546875, 1.390289306640625, 1.4505767822265625, 1.5108642578125, 1.5711517333984375, 1.631439208984375, 1.6917266845703125, 1.75201416015625, 1.8123016357421875, 1.872589111328125, 1.9328765869140625, 1.9931640625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 6.0, 6.0, 10.0, 14.0, 17.0, 31.0, 36.0, 43.0, 82.0, 105.0, 161.0, 242.0, 305.0, 531.0, 915.0, 1757.0, 4431.0, 16339.0, 103301.0, 746214.0, 143338.0, 20792.0, 5129.0, 2036.0, 983.0, 603.0, 354.0, 244.0, 145.0, 100.0, 85.0, 48.0, 53.0, 35.0, 20.0, 10.0, 9.0, 8.0, 6.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.171875, -8.898681640625, -8.62548828125, -8.352294921875, -8.0791015625, -7.805908203125, -7.53271484375, -7.259521484375, -6.986328125, -6.713134765625, -6.43994140625, -6.166748046875, -5.8935546875, -5.620361328125, -5.34716796875, -5.073974609375, -4.80078125, -4.527587890625, -4.25439453125, -3.981201171875, -3.7080078125, -3.434814453125, -3.16162109375, -2.888427734375, -2.615234375, -2.342041015625, -2.06884765625, -1.795654296875, -1.5224609375, -1.249267578125, -0.97607421875, -0.702880859375, -0.4296875, -0.156494140625, 0.11669921875, 0.389892578125, 0.6630859375, 0.936279296875, 1.20947265625, 1.482666015625, 1.755859375, 2.029052734375, 2.30224609375, 2.575439453125, 2.8486328125, 3.121826171875, 3.39501953125, 3.668212890625, 3.94140625, 4.214599609375, 4.48779296875, 4.760986328125, 5.0341796875, 5.307373046875, 5.58056640625, 5.853759765625, 6.126953125, 6.400146484375, 6.67333984375, 6.946533203125, 7.2197265625, 7.492919921875, 7.76611328125, 8.039306640625, 8.3125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 7.0, 7.0, 15.0, 13.0, 13.0, 18.0, 26.0, 30.0, 46.0, 57.0, 59.0, 70.0, 80.0, 82.0, 76.0, 78.0, 69.0, 59.0, 53.0, 20.0, 32.0, 21.0, 22.0, 21.0, 7.0, 11.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4609375, -10.10888671875, -9.7568359375, -9.40478515625, -9.052734375, -8.70068359375, -8.3486328125, -7.99658203125, -7.64453125, -7.29248046875, -6.9404296875, -6.58837890625, -6.236328125, -5.88427734375, -5.5322265625, -5.18017578125, -4.828125, -4.47607421875, -4.1240234375, -3.77197265625, -3.419921875, -3.06787109375, -2.7158203125, -2.36376953125, -2.01171875, -1.65966796875, -1.3076171875, -0.95556640625, -0.603515625, -0.25146484375, 0.1005859375, 0.45263671875, 0.8046875, 1.15673828125, 1.5087890625, 1.86083984375, 2.212890625, 2.56494140625, 2.9169921875, 3.26904296875, 3.62109375, 3.97314453125, 4.3251953125, 4.67724609375, 5.029296875, 5.38134765625, 5.7333984375, 6.08544921875, 6.4375, 6.78955078125, 7.1416015625, 7.49365234375, 7.845703125, 8.19775390625, 8.5498046875, 8.90185546875, 9.25390625, 9.60595703125, 9.9580078125, 10.31005859375, 10.662109375, 11.01416015625, 11.3662109375, 11.71826171875, 12.0703125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 9.0, 4.0, 9.0, 13.0, 19.0, 47.0, 55.0, 90.0, 185.0, 358.0, 1011.0, 3568.0, 22237.0, 280656.0, 692507.0, 39894.0, 5473.0, 1406.0, 492.0, 210.0, 114.0, 63.0, 33.0, 28.0, 17.0, 14.0, 7.0, 8.0, 5.0, 3.0, 5.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.87109375, -2.76123046875, -2.6513671875, -2.54150390625, -2.431640625, -2.32177734375, -2.2119140625, -2.10205078125, -1.9921875, -1.88232421875, -1.7724609375, -1.66259765625, -1.552734375, -1.44287109375, -1.3330078125, -1.22314453125, -1.11328125, -1.00341796875, -0.8935546875, -0.78369140625, -0.673828125, -0.56396484375, -0.4541015625, -0.34423828125, -0.234375, -0.12451171875, -0.0146484375, 0.09521484375, 0.205078125, 0.31494140625, 0.4248046875, 0.53466796875, 0.64453125, 0.75439453125, 0.8642578125, 0.97412109375, 1.083984375, 1.19384765625, 1.3037109375, 1.41357421875, 1.5234375, 1.63330078125, 1.7431640625, 1.85302734375, 1.962890625, 2.07275390625, 2.1826171875, 2.29248046875, 2.40234375, 2.51220703125, 2.6220703125, 2.73193359375, 2.841796875, 2.95166015625, 3.0615234375, 3.17138671875, 3.28125, 3.39111328125, 3.5009765625, 3.61083984375, 3.720703125, 3.83056640625, 3.9404296875, 4.05029296875, 4.16015625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 9.0, 3.0, 6.0, 6.0, 13.0, 22.0, 23.0, 24.0, 36.0, 84.0, 138.0, 184.0, 161.0, 92.0, 65.0, 48.0, 26.0, 16.0, 16.0, 10.0, 5.0, 3.0, 8.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009307861328125, -0.000903204083442688, -0.000875622034072876, -0.000848039984703064, -0.000820457935333252, -0.0007928758859634399, -0.0007652938365936279, -0.0007377117872238159, -0.0007101297378540039, -0.0006825476884841919, -0.0006549656391143799, -0.0006273835897445679, -0.0005998015403747559, -0.0005722194910049438, -0.0005446374416351318, -0.0005170553922653198, -0.0004894733428955078, -0.0004618912935256958, -0.0004343092441558838, -0.0004067271947860718, -0.00037914514541625977, -0.00035156309604644775, -0.00032398104667663574, -0.00029639899730682373, -0.0002688169479370117, -0.0002412348985671997, -0.0002136528491973877, -0.00018607079982757568, -0.00015848875045776367, -0.00013090670108795166, -0.00010332465171813965, -7.574260234832764e-05, -4.8160552978515625e-05, -2.0578503608703613e-05, 7.0035457611083984e-06, 3.458559513092041e-05, 6.216764450073242e-05, 8.974969387054443e-05, 0.00011733174324035645, 0.00014491379261016846, 0.00017249584197998047, 0.00020007789134979248, 0.0002276599407196045, 0.0002552419900894165, 0.0002828240394592285, 0.00031040608882904053, 0.00033798813819885254, 0.00036557018756866455, 0.00039315223693847656, 0.0004207342863082886, 0.0004483163356781006, 0.0004758983850479126, 0.0005034804344177246, 0.0005310624837875366, 0.0005586445331573486, 0.0005862265825271606, 0.0006138086318969727, 0.0006413906812667847, 0.0006689727306365967, 0.0006965547800064087, 0.0007241368293762207, 0.0007517188787460327, 0.0007793009281158447, 0.0008068829774856567, 0.0008344650268554688]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 10.0, 16.0, 20.0, 27.0, 37.0, 64.0, 99.0, 170.0, 357.0, 691.0, 1555.0, 4381.0, 18260.0, 163009.0, 759064.0, 83257.0, 11764.0, 3206.0, 1269.0, 586.0, 281.0, 163.0, 110.0, 52.0, 36.0, 28.0, 19.0, 9.0, 7.0, 5.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.767578125, -1.6807861328125, -1.593994140625, -1.5072021484375, -1.42041015625, -1.3336181640625, -1.246826171875, -1.1600341796875, -1.0732421875, -0.9864501953125, -0.899658203125, -0.8128662109375, -0.72607421875, -0.6392822265625, -0.552490234375, -0.4656982421875, -0.37890625, -0.2921142578125, -0.205322265625, -0.1185302734375, -0.03173828125, 0.0550537109375, 0.141845703125, 0.2286376953125, 0.3154296875, 0.4022216796875, 0.489013671875, 0.5758056640625, 0.66259765625, 0.7493896484375, 0.836181640625, 0.9229736328125, 1.009765625, 1.0965576171875, 1.183349609375, 1.2701416015625, 1.35693359375, 1.4437255859375, 1.530517578125, 1.6173095703125, 1.7041015625, 1.7908935546875, 1.877685546875, 1.9644775390625, 2.05126953125, 2.1380615234375, 2.224853515625, 2.3116455078125, 2.3984375, 2.4852294921875, 2.572021484375, 2.6588134765625, 2.74560546875, 2.8323974609375, 2.919189453125, 3.0059814453125, 3.0927734375, 3.1795654296875, 3.266357421875, 3.3531494140625, 3.43994140625, 3.5267333984375, 3.613525390625, 3.7003173828125, 3.787109375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 8.0, 4.0, 15.0, 11.0, 28.0, 26.0, 22.0, 34.0, 34.0, 56.0, 60.0, 76.0, 80.0, 72.0, 72.0, 65.0, 58.0, 50.0, 39.0, 39.0, 32.0, 27.0, 18.0, 11.0, 13.0, 12.0, 7.0, 10.0, 4.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7353515625, -1.6743927001953125, -1.613433837890625, -1.5524749755859375, -1.49151611328125, -1.4305572509765625, -1.369598388671875, -1.3086395263671875, -1.2476806640625, -1.1867218017578125, -1.125762939453125, -1.0648040771484375, -1.00384521484375, -0.9428863525390625, -0.881927490234375, -0.8209686279296875, -0.760009765625, -0.6990509033203125, -0.638092041015625, -0.5771331787109375, -0.51617431640625, -0.4552154541015625, -0.394256591796875, -0.3332977294921875, -0.2723388671875, -0.2113800048828125, -0.150421142578125, -0.0894622802734375, -0.02850341796875, 0.0324554443359375, 0.093414306640625, 0.1543731689453125, 0.21533203125, 0.2762908935546875, 0.337249755859375, 0.3982086181640625, 0.45916748046875, 0.5201263427734375, 0.581085205078125, 0.6420440673828125, 0.7030029296875, 0.7639617919921875, 0.824920654296875, 0.8858795166015625, 0.94683837890625, 1.0077972412109375, 1.068756103515625, 1.1297149658203125, 1.190673828125, 1.2516326904296875, 1.312591552734375, 1.3735504150390625, 1.43450927734375, 1.4954681396484375, 1.556427001953125, 1.6173858642578125, 1.6783447265625, 1.7393035888671875, 1.800262451171875, 1.8612213134765625, 1.92218017578125, 1.9831390380859375, 2.044097900390625, 2.1050567626953125, 2.166015625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 9.0, 10.0, 17.0, 23.0, 52.0, 96.0, 162.0, 252.0, 164.0, 91.0, 62.0, 22.0, 16.0, 8.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.84809112548828, -43.0869140625, -41.32573318481445, -39.56455612182617, -37.80337905883789, -36.042198181152344, -34.28102111816406, -32.51984405517578, -30.758663177490234, -28.99748420715332, -27.23630714416504, -25.475128173828125, -23.71394920349121, -21.952770233154297, -20.191593170166016, -18.4304141998291, -16.66923713684082, -14.908059120178223, -13.146880149841309, -11.385702133178711, -9.624523162841797, -7.863345146179199, -6.102167129516602, -4.3409881591796875, -2.57981014251709, -0.8186317682266235, 0.9425466060638428, 2.7037248611450195, 4.464903354644775, 6.226081848144531, 7.987259864807129, 9.748438835144043, 11.50961685180664, 13.270794868469238, 15.031973838806152, 16.79315185546875, 18.554330825805664, 20.315509796142578, 22.07668685913086, 23.837865829467773, 25.599044799804688, 27.3602237701416, 29.121400833129883, 30.882579803466797, 32.64375686645508, 34.404937744140625, 36.166114807128906, 37.92729187011719, 39.68846893310547, 41.44964599609375, 43.2108268737793, 44.97200393676758, 46.73318099975586, 48.494361877441406, 50.25553894042969, 52.01671600341797, 53.777896881103516, 55.5390739440918, 57.300254821777344, 59.061431884765625, 60.822608947753906, 62.58378982543945, 64.344970703125, 66.10614776611328, 67.86732482910156]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 2.0, 8.0, 11.0, 7.0, 15.0, 12.0, 22.0, 29.0, 23.0, 30.0, 28.0, 27.0, 30.0, 25.0, 37.0, 41.0, 67.0, 82.0, 74.0, 57.0, 56.0, 40.0, 27.0, 31.0, 31.0, 22.0, 28.0, 29.0, 21.0, 6.0, 12.0, 5.0, 13.0, 7.0, 8.0, 11.0, 8.0, 6.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.217880249023438, -28.275840759277344, -27.333803176879883, -26.39176368713379, -25.449726104736328, -24.507686614990234, -23.565649032592773, -22.62360954284668, -21.68157196044922, -20.739532470703125, -19.797494888305664, -18.85545539855957, -17.91341781616211, -16.971378326416016, -16.029340744018555, -15.087301254272461, -14.145262718200684, -13.203224182128906, -12.261185646057129, -11.319147109985352, -10.377108573913574, -9.435070037841797, -8.493030548095703, -7.550992488861084, -6.608953952789307, -5.666915416717529, -4.724876880645752, -3.7828381061553955, -2.840799570083618, -1.8987607955932617, -0.9567222595214844, -0.014683723449707031, 0.9273548126220703, 1.8693933486938477, 2.811431884765625, 3.7534706592559814, 4.69550895690918, 5.637547969818115, 6.579586505889893, 7.52162504196167, 8.463663101196289, 9.405701637268066, 10.347740173339844, 11.289778709411621, 12.231817245483398, 13.173856735229492, 14.115894317626953, 15.057933807373047, 15.999972343444824, 16.9420108795166, 17.884050369262695, 18.826087951660156, 19.76812744140625, 20.71016502380371, 21.652204513549805, 22.594242095947266, 23.53628158569336, 24.478321075439453, 25.420358657836914, 26.362398147583008, 27.30443572998047, 28.246475219726562, 29.188512802124023, 30.130552291870117, 31.072589874267578]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 5.0, 11.0, 16.0, 18.0, 21.0, 38.0, 59.0, 102.0, 210.0, 405.0, 886.0, 2156.0, 6657.0, 26000.0, 204817.0, 3103945.0, 776119.0, 55267.0, 11590.0, 3604.0, 1260.0, 565.0, 246.0, 116.0, 68.0, 38.0, 26.0, 14.0, 11.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2890625, -5.1558837890625, -5.022705078125, -4.8895263671875, -4.75634765625, -4.6231689453125, -4.489990234375, -4.3568115234375, -4.2236328125, -4.0904541015625, -3.957275390625, -3.8240966796875, -3.69091796875, -3.5577392578125, -3.424560546875, -3.2913818359375, -3.158203125, -3.0250244140625, -2.891845703125, -2.7586669921875, -2.62548828125, -2.4923095703125, -2.359130859375, -2.2259521484375, -2.0927734375, -1.9595947265625, -1.826416015625, -1.6932373046875, -1.56005859375, -1.4268798828125, -1.293701171875, -1.1605224609375, -1.02734375, -0.8941650390625, -0.760986328125, -0.6278076171875, -0.49462890625, -0.3614501953125, -0.228271484375, -0.0950927734375, 0.0380859375, 0.1712646484375, 0.304443359375, 0.4376220703125, 0.57080078125, 0.7039794921875, 0.837158203125, 0.9703369140625, 1.103515625, 1.2366943359375, 1.369873046875, 1.5030517578125, 1.63623046875, 1.7694091796875, 1.902587890625, 2.0357666015625, 2.1689453125, 2.3021240234375, 2.435302734375, 2.5684814453125, 2.70166015625, 2.8348388671875, 2.968017578125, 3.1011962890625, 3.234375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 9.0, 2.0, 0.0, 9.0, 6.0, 13.0, 6.0, 17.0, 15.0, 15.0, 18.0, 29.0, 29.0, 27.0, 38.0, 40.0, 35.0, 40.0, 54.0, 42.0, 33.0, 43.0, 50.0, 34.0, 46.0, 39.0, 34.0, 31.0, 23.0, 33.0, 26.0, 25.0, 27.0, 19.0, 13.0, 13.0, 10.0, 9.0, 9.0, 11.0, 4.0, 3.0, 9.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.666015625, -1.6162109375, -1.56640625, -1.5166015625, -1.466796875, -1.4169921875, -1.3671875, -1.3173828125, -1.267578125, -1.2177734375, -1.16796875, -1.1181640625, -1.068359375, -1.0185546875, -0.96875, -0.9189453125, -0.869140625, -0.8193359375, -0.76953125, -0.7197265625, -0.669921875, -0.6201171875, -0.5703125, -0.5205078125, -0.470703125, -0.4208984375, -0.37109375, -0.3212890625, -0.271484375, -0.2216796875, -0.171875, -0.1220703125, -0.072265625, -0.0224609375, 0.02734375, 0.0771484375, 0.126953125, 0.1767578125, 0.2265625, 0.2763671875, 0.326171875, 0.3759765625, 0.42578125, 0.4755859375, 0.525390625, 0.5751953125, 0.625, 0.6748046875, 0.724609375, 0.7744140625, 0.82421875, 0.8740234375, 0.923828125, 0.9736328125, 1.0234375, 1.0732421875, 1.123046875, 1.1728515625, 1.22265625, 1.2724609375, 1.322265625, 1.3720703125, 1.421875, 1.4716796875, 1.521484375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 4.0, 8.0, 10.0, 19.0, 30.0, 43.0, 77.0, 201.0, 430.0, 1092.0, 3394.0, 14491.0, 106885.0, 3133640.0, 873063.0, 48158.0, 8584.0, 2508.0, 867.0, 371.0, 181.0, 93.0, 47.0, 27.0, 19.0, 12.0, 8.0, 8.0, 2.0, 1.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.01953125, -5.830322265625, -5.64111328125, -5.451904296875, -5.2626953125, -5.073486328125, -4.88427734375, -4.695068359375, -4.505859375, -4.316650390625, -4.12744140625, -3.938232421875, -3.7490234375, -3.559814453125, -3.37060546875, -3.181396484375, -2.9921875, -2.802978515625, -2.61376953125, -2.424560546875, -2.2353515625, -2.046142578125, -1.85693359375, -1.667724609375, -1.478515625, -1.289306640625, -1.10009765625, -0.910888671875, -0.7216796875, -0.532470703125, -0.34326171875, -0.154052734375, 0.03515625, 0.224365234375, 0.41357421875, 0.602783203125, 0.7919921875, 0.981201171875, 1.17041015625, 1.359619140625, 1.548828125, 1.738037109375, 1.92724609375, 2.116455078125, 2.3056640625, 2.494873046875, 2.68408203125, 2.873291015625, 3.0625, 3.251708984375, 3.44091796875, 3.630126953125, 3.8193359375, 4.008544921875, 4.19775390625, 4.386962890625, 4.576171875, 4.765380859375, 4.95458984375, 5.143798828125, 5.3330078125, 5.522216796875, 5.71142578125, 5.900634765625, 6.08984375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 10.0, 16.0, 15.0, 18.0, 28.0, 36.0, 58.0, 48.0, 85.0, 142.0, 222.0, 331.0, 494.0, 660.0, 618.0, 450.0, 251.0, 170.0, 114.0, 86.0, 60.0, 42.0, 27.0, 18.0, 16.0, 6.0, 12.0, 10.0, 5.0, 5.0, 4.0, 6.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.77734375, -3.65008544921875, -3.5228271484375, -3.39556884765625, -3.268310546875, -3.14105224609375, -3.0137939453125, -2.88653564453125, -2.75927734375, -2.63201904296875, -2.5047607421875, -2.37750244140625, -2.250244140625, -2.12298583984375, -1.9957275390625, -1.86846923828125, -1.7412109375, -1.61395263671875, -1.4866943359375, -1.35943603515625, -1.232177734375, -1.10491943359375, -0.9776611328125, -0.85040283203125, -0.72314453125, -0.59588623046875, -0.4686279296875, -0.34136962890625, -0.214111328125, -0.08685302734375, 0.0404052734375, 0.16766357421875, 0.294921875, 0.42218017578125, 0.5494384765625, 0.67669677734375, 0.803955078125, 0.93121337890625, 1.0584716796875, 1.18572998046875, 1.31298828125, 1.44024658203125, 1.5675048828125, 1.69476318359375, 1.822021484375, 1.94927978515625, 2.0765380859375, 2.20379638671875, 2.3310546875, 2.45831298828125, 2.5855712890625, 2.71282958984375, 2.840087890625, 2.96734619140625, 3.0946044921875, 3.22186279296875, 3.34912109375, 3.47637939453125, 3.6036376953125, 3.73089599609375, 3.858154296875, 3.98541259765625, 4.1126708984375, 4.23992919921875, 4.3671875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 7.0, 7.0, 15.0, 45.0, 104.0, 170.0, 207.0, 230.0, 125.0, 42.0, 22.0, 6.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.884132385253906, -32.159244537353516, -30.43436050415039, -28.70947265625, -26.984586715698242, -25.259700775146484, -23.534814834594727, -21.80992889404297, -20.085041046142578, -18.36015510559082, -16.635269165039062, -14.910382270812988, -13.185495376586914, -11.460609436035156, -9.735723495483398, -8.010836601257324, -6.285951614379883, -4.561065196990967, -2.83617901802063, -1.111292839050293, 0.613593578338623, 2.338479995727539, 4.063365936279297, 5.788252830505371, 7.513138771057129, 9.238024711608887, 10.962911605834961, 12.687797546386719, 14.412683486938477, 16.137569427490234, 17.862457275390625, 19.587343215942383, 21.31222915649414, 23.0371150970459, 24.762001037597656, 26.486888885498047, 28.211774826049805, 29.936660766601562, 31.66154670715332, 33.38643264770508, 35.11132049560547, 36.83620834350586, 38.561092376708984, 40.285980224609375, 42.0108642578125, 43.73575210571289, 45.46063995361328, 47.185523986816406, 48.91040802001953, 50.63529586791992, 52.36017990112305, 54.08506774902344, 55.80995178222656, 57.53483963012695, 59.259727478027344, 60.98461151123047, 62.70949935913086, 64.43438720703125, 66.15927124023438, 67.8841552734375, 69.60904693603516, 71.33393096923828, 73.0588150024414, 74.78370666503906, 76.50859069824219]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 3.0, 8.0, 17.0, 15.0, 20.0, 15.0, 30.0, 19.0, 30.0, 38.0, 33.0, 46.0, 37.0, 41.0, 38.0, 44.0, 41.0, 56.0, 40.0, 48.0, 48.0, 31.0, 27.0, 48.0, 31.0, 23.0, 21.0, 28.0, 14.0, 14.0, 15.0, 12.0, 10.0, 5.0, 12.0, 7.0, 6.0, 4.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-19.829822540283203, -19.26103401184082, -18.692245483398438, -18.123458862304688, -17.554670333862305, -16.985881805419922, -16.417095184326172, -15.848306655883789, -15.279518127441406, -14.710729598999023, -14.141942024230957, -13.57315444946289, -13.004365921020508, -12.435577392578125, -11.866789817810059, -11.298002243041992, -10.72921371459961, -10.160425186157227, -9.59163761138916, -9.022850036621094, -8.454061508178711, -7.885273456573486, -7.316485404968262, -6.747697353363037, -6.1789093017578125, -5.610121250152588, -5.041333198547363, -4.472545146942139, -3.903757095336914, -3.3349690437316895, -2.766180992126465, -2.1973929405212402, -1.6286067962646484, -1.0598187446594238, -0.4910306930541992, 0.07775735855102539, 0.64654541015625, 1.2153334617614746, 1.7841215133666992, 2.352909564971924, 2.9216976165771484, 3.490485668182373, 4.059273719787598, 4.628061771392822, 5.196849822998047, 5.7656378746032715, 6.334425926208496, 6.903213977813721, 7.472002029418945, 8.040790557861328, 8.609578132629395, 9.178365707397461, 9.747154235839844, 10.315942764282227, 10.884730339050293, 11.45351791381836, 12.022306442260742, 12.591094970703125, 13.159882545471191, 13.728670120239258, 14.29745864868164, 14.866247177124023, 15.43503475189209, 16.003822326660156, 16.57261085510254]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 3.0, 5.0, 6.0, 14.0, 8.0, 27.0, 37.0, 55.0, 104.0, 166.0, 269.0, 465.0, 785.0, 1499.0, 3027.0, 6248.0, 14633.0, 36162.0, 97790.0, 245074.0, 341224.0, 183896.0, 69915.0, 26310.0, 10702.0, 4920.0, 2343.0, 1261.0, 687.0, 343.0, 200.0, 149.0, 78.0, 51.0, 31.0, 22.0, 17.0, 15.0, 6.0, 7.0, 3.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.39453125, -2.296112060546875, -2.19769287109375, -2.099273681640625, -2.0008544921875, -1.902435302734375, -1.80401611328125, -1.705596923828125, -1.607177734375, -1.508758544921875, -1.41033935546875, -1.311920166015625, -1.2135009765625, -1.115081787109375, -1.01666259765625, -0.918243408203125, -0.81982421875, -0.721405029296875, -0.62298583984375, -0.524566650390625, -0.4261474609375, -0.327728271484375, -0.22930908203125, -0.130889892578125, -0.032470703125, 0.065948486328125, 0.16436767578125, 0.262786865234375, 0.3612060546875, 0.459625244140625, 0.55804443359375, 0.656463623046875, 0.7548828125, 0.853302001953125, 0.95172119140625, 1.050140380859375, 1.1485595703125, 1.246978759765625, 1.34539794921875, 1.443817138671875, 1.542236328125, 1.640655517578125, 1.73907470703125, 1.837493896484375, 1.9359130859375, 2.034332275390625, 2.13275146484375, 2.231170654296875, 2.32958984375, 2.428009033203125, 2.52642822265625, 2.624847412109375, 2.7232666015625, 2.821685791015625, 2.92010498046875, 3.018524169921875, 3.116943359375, 3.215362548828125, 3.31378173828125, 3.412200927734375, 3.5106201171875, 3.609039306640625, 3.70745849609375, 3.805877685546875, 3.904296875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 5.0, 7.0, 5.0, 13.0, 14.0, 12.0, 18.0, 22.0, 18.0, 22.0, 38.0, 26.0, 32.0, 44.0, 56.0, 30.0, 48.0, 47.0, 39.0, 44.0, 53.0, 39.0, 48.0, 25.0, 38.0, 40.0, 32.0, 28.0, 33.0, 15.0, 13.0, 17.0, 8.0, 11.0, 17.0, 5.0, 3.0, 9.0, 3.0, 8.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.9287109375, -1.871856689453125, -1.81500244140625, -1.758148193359375, -1.7012939453125, -1.644439697265625, -1.58758544921875, -1.530731201171875, -1.473876953125, -1.417022705078125, -1.36016845703125, -1.303314208984375, -1.2464599609375, -1.189605712890625, -1.13275146484375, -1.075897216796875, -1.01904296875, -0.962188720703125, -0.90533447265625, -0.848480224609375, -0.7916259765625, -0.734771728515625, -0.67791748046875, -0.621063232421875, -0.564208984375, -0.507354736328125, -0.45050048828125, -0.393646240234375, -0.3367919921875, -0.279937744140625, -0.22308349609375, -0.166229248046875, -0.109375, -0.052520751953125, 0.00433349609375, 0.061187744140625, 0.1180419921875, 0.174896240234375, 0.23175048828125, 0.288604736328125, 0.345458984375, 0.402313232421875, 0.45916748046875, 0.516021728515625, 0.5728759765625, 0.629730224609375, 0.68658447265625, 0.743438720703125, 0.80029296875, 0.857147216796875, 0.91400146484375, 0.970855712890625, 1.0277099609375, 1.084564208984375, 1.14141845703125, 1.198272705078125, 1.255126953125, 1.311981201171875, 1.36883544921875, 1.425689697265625, 1.4825439453125, 1.539398193359375, 1.59625244140625, 1.653106689453125, 1.7099609375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 6.0, 5.0, 8.0, 9.0, 6.0, 14.0, 20.0, 22.0, 53.0, 72.0, 90.0, 182.0, 329.0, 677.0, 1752.0, 4929.0, 18647.0, 104810.0, 658622.0, 212674.0, 33370.0, 7691.0, 2540.0, 964.0, 452.0, 225.0, 137.0, 67.0, 49.0, 33.0, 22.0, 15.0, 14.0, 14.0, 7.0, 5.0, 3.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-6.41015625, -6.225341796875, -6.04052734375, -5.855712890625, -5.6708984375, -5.486083984375, -5.30126953125, -5.116455078125, -4.931640625, -4.746826171875, -4.56201171875, -4.377197265625, -4.1923828125, -4.007568359375, -3.82275390625, -3.637939453125, -3.453125, -3.268310546875, -3.08349609375, -2.898681640625, -2.7138671875, -2.529052734375, -2.34423828125, -2.159423828125, -1.974609375, -1.789794921875, -1.60498046875, -1.420166015625, -1.2353515625, -1.050537109375, -0.86572265625, -0.680908203125, -0.49609375, -0.311279296875, -0.12646484375, 0.058349609375, 0.2431640625, 0.427978515625, 0.61279296875, 0.797607421875, 0.982421875, 1.167236328125, 1.35205078125, 1.536865234375, 1.7216796875, 1.906494140625, 2.09130859375, 2.276123046875, 2.4609375, 2.645751953125, 2.83056640625, 3.015380859375, 3.2001953125, 3.385009765625, 3.56982421875, 3.754638671875, 3.939453125, 4.124267578125, 4.30908203125, 4.493896484375, 4.6787109375, 4.863525390625, 5.04833984375, 5.233154296875, 5.41796875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 8.0, 6.0, 3.0, 5.0, 7.0, 9.0, 14.0, 20.0, 26.0, 32.0, 32.0, 37.0, 56.0, 47.0, 54.0, 67.0, 63.0, 60.0, 62.0, 66.0, 65.0, 52.0, 54.0, 39.0, 25.0, 25.0, 20.0, 20.0, 4.0, 8.0, 4.0, 4.0, 2.0, 5.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.40625, -9.121337890625, -8.83642578125, -8.551513671875, -8.2666015625, -7.981689453125, -7.69677734375, -7.411865234375, -7.126953125, -6.842041015625, -6.55712890625, -6.272216796875, -5.9873046875, -5.702392578125, -5.41748046875, -5.132568359375, -4.84765625, -4.562744140625, -4.27783203125, -3.992919921875, -3.7080078125, -3.423095703125, -3.13818359375, -2.853271484375, -2.568359375, -2.283447265625, -1.99853515625, -1.713623046875, -1.4287109375, -1.143798828125, -0.85888671875, -0.573974609375, -0.2890625, -0.004150390625, 0.28076171875, 0.565673828125, 0.8505859375, 1.135498046875, 1.42041015625, 1.705322265625, 1.990234375, 2.275146484375, 2.56005859375, 2.844970703125, 3.1298828125, 3.414794921875, 3.69970703125, 3.984619140625, 4.26953125, 4.554443359375, 4.83935546875, 5.124267578125, 5.4091796875, 5.694091796875, 5.97900390625, 6.263916015625, 6.548828125, 6.833740234375, 7.11865234375, 7.403564453125, 7.6884765625, 7.973388671875, 8.25830078125, 8.543212890625, 8.828125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 6.0, 10.0, 6.0, 6.0, 13.0, 20.0, 28.0, 47.0, 65.0, 101.0, 220.0, 397.0, 925.0, 2366.0, 7448.0, 29280.0, 154068.0, 664739.0, 148091.0, 29315.0, 7263.0, 2331.0, 936.0, 381.0, 192.0, 108.0, 64.0, 40.0, 35.0, 17.0, 14.0, 9.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5390625, -1.48858642578125, -1.4381103515625, -1.38763427734375, -1.337158203125, -1.28668212890625, -1.2362060546875, -1.18572998046875, -1.13525390625, -1.08477783203125, -1.0343017578125, -0.98382568359375, -0.933349609375, -0.88287353515625, -0.8323974609375, -0.78192138671875, -0.7314453125, -0.68096923828125, -0.6304931640625, -0.58001708984375, -0.529541015625, -0.47906494140625, -0.4285888671875, -0.37811279296875, -0.32763671875, -0.27716064453125, -0.2266845703125, -0.17620849609375, -0.125732421875, -0.07525634765625, -0.0247802734375, 0.02569580078125, 0.076171875, 0.12664794921875, 0.1771240234375, 0.22760009765625, 0.278076171875, 0.32855224609375, 0.3790283203125, 0.42950439453125, 0.47998046875, 0.53045654296875, 0.5809326171875, 0.63140869140625, 0.681884765625, 0.73236083984375, 0.7828369140625, 0.83331298828125, 0.8837890625, 0.93426513671875, 0.9847412109375, 1.03521728515625, 1.085693359375, 1.13616943359375, 1.1866455078125, 1.23712158203125, 1.28759765625, 1.33807373046875, 1.3885498046875, 1.43902587890625, 1.489501953125, 1.53997802734375, 1.5904541015625, 1.64093017578125, 1.69140625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 5.0, 1.0, 2.0, 6.0, 9.0, 9.0, 14.0, 14.0, 25.0, 31.0, 54.0, 70.0, 92.0, 115.0, 107.0, 101.0, 88.0, 70.0, 43.0, 41.0, 24.0, 21.0, 11.0, 12.0, 11.0, 6.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003819465637207031, -0.00036891549825668335, -0.0003558844327926636, -0.0003428533673286438, -0.000329822301864624, -0.00031679123640060425, -0.00030376017093658447, -0.0002907291054725647, -0.0002776980400085449, -0.00026466697454452515, -0.00025163590908050537, -0.0002386048436164856, -0.00022557377815246582, -0.00021254271268844604, -0.00019951164722442627, -0.0001864805817604065, -0.00017344951629638672, -0.00016041845083236694, -0.00014738738536834717, -0.0001343563199043274, -0.00012132525444030762, -0.00010829418897628784, -9.526312351226807e-05, -8.223205804824829e-05, -6.920099258422852e-05, -5.616992712020874e-05, -4.3138861656188965e-05, -3.010779619216919e-05, -1.7076730728149414e-05, -4.045665264129639e-06, 8.985400199890137e-06, 2.2016465663909912e-05, 3.504753112792969e-05, 4.807859659194946e-05, 6.110966205596924e-05, 7.414072751998901e-05, 8.717179298400879e-05, 0.00010020285844802856, 0.00011323392391204834, 0.00012626498937606812, 0.0001392960548400879, 0.00015232712030410767, 0.00016535818576812744, 0.00017838925123214722, 0.000191420316696167, 0.00020445138216018677, 0.00021748244762420654, 0.00023051351308822632, 0.0002435445785522461, 0.00025657564401626587, 0.00026960670948028564, 0.0002826377749443054, 0.0002956688404083252, 0.00030869990587234497, 0.00032173097133636475, 0.0003347620368003845, 0.0003477931022644043, 0.00036082416772842407, 0.00037385523319244385, 0.0003868862986564636, 0.0003999173641204834, 0.0004129484295845032, 0.00042597949504852295, 0.0004390105605125427, 0.0004520416259765625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 7.0, 10.0, 18.0, 21.0, 21.0, 48.0, 86.0, 135.0, 220.0, 477.0, 1080.0, 2581.0, 7922.0, 33805.0, 189978.0, 652937.0, 125789.0, 23551.0, 6007.0, 2116.0, 867.0, 408.0, 199.0, 97.0, 53.0, 39.0, 28.0, 14.0, 15.0, 8.0, 8.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.888671875, -1.833740234375, -1.77880859375, -1.723876953125, -1.6689453125, -1.614013671875, -1.55908203125, -1.504150390625, -1.44921875, -1.394287109375, -1.33935546875, -1.284423828125, -1.2294921875, -1.174560546875, -1.11962890625, -1.064697265625, -1.009765625, -0.954833984375, -0.89990234375, -0.844970703125, -0.7900390625, -0.735107421875, -0.68017578125, -0.625244140625, -0.5703125, -0.515380859375, -0.46044921875, -0.405517578125, -0.3505859375, -0.295654296875, -0.24072265625, -0.185791015625, -0.130859375, -0.075927734375, -0.02099609375, 0.033935546875, 0.0888671875, 0.143798828125, 0.19873046875, 0.253662109375, 0.30859375, 0.363525390625, 0.41845703125, 0.473388671875, 0.5283203125, 0.583251953125, 0.63818359375, 0.693115234375, 0.748046875, 0.802978515625, 0.85791015625, 0.912841796875, 0.9677734375, 1.022705078125, 1.07763671875, 1.132568359375, 1.1875, 1.242431640625, 1.29736328125, 1.352294921875, 1.4072265625, 1.462158203125, 1.51708984375, 1.572021484375, 1.626953125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 7.0, 12.0, 11.0, 25.0, 39.0, 41.0, 62.0, 75.0, 100.0, 102.0, 119.0, 98.0, 71.0, 68.0, 50.0, 31.0, 20.0, 20.0, 16.0, 11.0, 6.0, 4.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6953125, -2.6277618408203125, -2.560211181640625, -2.4926605224609375, -2.42510986328125, -2.3575592041015625, -2.290008544921875, -2.2224578857421875, -2.1549072265625, -2.0873565673828125, -2.019805908203125, -1.9522552490234375, -1.88470458984375, -1.8171539306640625, -1.749603271484375, -1.6820526123046875, -1.614501953125, -1.5469512939453125, -1.479400634765625, -1.4118499755859375, -1.34429931640625, -1.2767486572265625, -1.209197998046875, -1.1416473388671875, -1.0740966796875, -1.0065460205078125, -0.938995361328125, -0.8714447021484375, -0.80389404296875, -0.7363433837890625, -0.668792724609375, -0.6012420654296875, -0.53369140625, -0.4661407470703125, -0.398590087890625, -0.3310394287109375, -0.26348876953125, -0.1959381103515625, -0.128387451171875, -0.0608367919921875, 0.0067138671875, 0.0742645263671875, 0.141815185546875, 0.2093658447265625, 0.27691650390625, 0.3444671630859375, 0.412017822265625, 0.4795684814453125, 0.547119140625, 0.6146697998046875, 0.682220458984375, 0.7497711181640625, 0.81732177734375, 0.8848724365234375, 0.952423095703125, 1.0199737548828125, 1.0875244140625, 1.1550750732421875, 1.222625732421875, 1.2901763916015625, 1.35772705078125, 1.4252777099609375, 1.492828369140625, 1.5603790283203125, 1.6279296875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 7.0, 14.0, 41.0, 71.0, 127.0, 217.0, 218.0, 109.0, 87.0, 55.0, 15.0, 16.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.301876068115234, -40.93848419189453, -39.57509231567383, -38.211700439453125, -36.84831237792969, -35.484920501708984, -34.12152862548828, -32.75813674926758, -31.394746780395508, -30.031354904174805, -28.667964935302734, -27.30457305908203, -25.941181182861328, -24.577791213989258, -23.214399337768555, -21.851009368896484, -20.48761749267578, -19.124225616455078, -17.760835647583008, -16.397443771362305, -15.034052848815918, -13.670661926269531, -12.307270050048828, -10.943879127502441, -9.580488204956055, -8.217097282409668, -6.853705883026123, -5.490314483642578, -4.126923561096191, -2.7635326385498047, -1.4001407623291016, -0.036749839782714844, 1.3266410827636719, 2.6900322437286377, 4.0534234046936035, 5.416814804077148, 6.780205726623535, 8.143596649169922, 9.506988525390625, 10.870379447937012, 12.233770370483398, 13.597161293029785, 14.960552215576172, 16.323944091796875, 17.687335968017578, 19.05072593688965, 20.41411781311035, 21.777507781982422, 23.140899658203125, 24.504291534423828, 25.8676815032959, 27.2310733795166, 28.594463348388672, 29.957855224609375, 31.321247100830078, 32.68463897705078, 34.04802703857422, 35.41141891479492, 36.774810791015625, 38.13819885253906, 39.501590728759766, 40.86498260498047, 42.22837448120117, 43.591766357421875, 44.95515823364258]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 10.0, 6.0, 11.0, 9.0, 13.0, 14.0, 16.0, 13.0, 32.0, 27.0, 24.0, 33.0, 33.0, 38.0, 33.0, 59.0, 61.0, 80.0, 83.0, 57.0, 46.0, 27.0, 32.0, 28.0, 34.0, 25.0, 19.0, 16.0, 17.0, 6.0, 16.0, 12.0, 9.0, 15.0, 9.0, 5.0, 8.0, 7.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.409381866455078, -26.561960220336914, -25.71453857421875, -24.86711883544922, -24.019697189331055, -23.17227554321289, -22.324853897094727, -21.477432250976562, -20.63001251220703, -19.782590866088867, -18.935169219970703, -18.087749481201172, -17.240327835083008, -16.392906188964844, -15.54548454284668, -14.698062896728516, -13.850641250610352, -13.003219604492188, -12.15579891204834, -11.308377265930176, -10.460956573486328, -9.613534927368164, -8.76611328125, -7.918692111968994, -7.071270942687988, -6.223849773406982, -5.376428604125977, -4.5290069580078125, -3.6815857887268066, -2.834164619445801, -1.9867429733276367, -1.1393218040466309, -0.291900634765625, 0.5555206537246704, 1.4029419422149658, 2.250363349914551, 3.0977845191955566, 3.9452056884765625, 4.792627334594727, 5.640048503875732, 6.487469673156738, 7.334890842437744, 8.18231201171875, 9.029733657836914, 9.877155303955078, 10.724575996398926, 11.57199764251709, 12.419418334960938, 13.266839981079102, 14.114261627197266, 14.961682319641113, 15.809103965759277, 16.656524658203125, 17.50394630432129, 18.351367950439453, 19.198789596557617, 20.04621124267578, 20.893632888793945, 21.74105453491211, 22.58847427368164, 23.435895919799805, 24.28331756591797, 25.130739212036133, 25.978160858154297, 26.825580596923828]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 8.0, 5.0, 6.0, 11.0, 15.0, 27.0, 40.0, 70.0, 103.0, 153.0, 284.0, 485.0, 945.0, 1755.0, 4165.0, 11362.0, 40953.0, 231397.0, 1810567.0, 1808416.0, 223708.0, 40202.0, 11390.0, 4236.0, 1840.0, 887.0, 508.0, 305.0, 168.0, 116.0, 53.0, 42.0, 31.0, 17.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.388671875, -3.3060150146484375, -3.223358154296875, -3.1407012939453125, -3.05804443359375, -2.9753875732421875, -2.892730712890625, -2.8100738525390625, -2.7274169921875, -2.6447601318359375, -2.562103271484375, -2.4794464111328125, -2.39678955078125, -2.3141326904296875, -2.231475830078125, -2.1488189697265625, -2.066162109375, -1.9835052490234375, -1.900848388671875, -1.8181915283203125, -1.73553466796875, -1.6528778076171875, -1.570220947265625, -1.4875640869140625, -1.4049072265625, -1.3222503662109375, -1.239593505859375, -1.1569366455078125, -1.07427978515625, -0.9916229248046875, -0.908966064453125, -0.8263092041015625, -0.74365234375, -0.6609954833984375, -0.578338623046875, -0.4956817626953125, -0.41302490234375, -0.3303680419921875, -0.247711181640625, -0.1650543212890625, -0.0823974609375, 0.0002593994140625, 0.082916259765625, 0.1655731201171875, 0.24822998046875, 0.3308868408203125, 0.413543701171875, 0.4962005615234375, 0.578857421875, 0.6615142822265625, 0.744171142578125, 0.8268280029296875, 0.90948486328125, 0.9921417236328125, 1.074798583984375, 1.1574554443359375, 1.2401123046875, 1.3227691650390625, 1.405426025390625, 1.4880828857421875, 1.57073974609375, 1.6533966064453125, 1.736053466796875, 1.8187103271484375, 1.9013671875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 4.0, 13.0, 19.0, 19.0, 21.0, 16.0, 17.0, 22.0, 33.0, 34.0, 39.0, 46.0, 35.0, 56.0, 48.0, 42.0, 50.0, 60.0, 39.0, 41.0, 41.0, 26.0, 30.0, 44.0, 27.0, 26.0, 26.0, 22.0, 21.0, 11.0, 8.0, 11.0, 7.0, 6.0, 5.0, 10.0, 8.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.966796875, -1.9099273681640625, -1.853057861328125, -1.7961883544921875, -1.73931884765625, -1.6824493408203125, -1.625579833984375, -1.5687103271484375, -1.5118408203125, -1.4549713134765625, -1.398101806640625, -1.3412322998046875, -1.28436279296875, -1.2274932861328125, -1.170623779296875, -1.1137542724609375, -1.056884765625, -1.0000152587890625, -0.943145751953125, -0.8862762451171875, -0.82940673828125, -0.7725372314453125, -0.715667724609375, -0.6587982177734375, -0.6019287109375, -0.5450592041015625, -0.488189697265625, -0.4313201904296875, -0.37445068359375, -0.3175811767578125, -0.260711669921875, -0.2038421630859375, -0.14697265625, -0.0901031494140625, -0.033233642578125, 0.0236358642578125, 0.08050537109375, 0.1373748779296875, 0.194244384765625, 0.2511138916015625, 0.3079833984375, 0.3648529052734375, 0.421722412109375, 0.4785919189453125, 0.53546142578125, 0.5923309326171875, 0.649200439453125, 0.7060699462890625, 0.762939453125, 0.8198089599609375, 0.876678466796875, 0.9335479736328125, 0.99041748046875, 1.0472869873046875, 1.104156494140625, 1.1610260009765625, 1.2178955078125, 1.2747650146484375, 1.331634521484375, 1.3885040283203125, 1.44537353515625, 1.5022430419921875, 1.559112548828125, 1.6159820556640625, 1.6728515625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 13.0, 11.0, 19.0, 25.0, 19.0, 27.0, 62.0, 88.0, 155.0, 275.0, 697.0, 2342.0, 9214.0, 52813.0, 1005519.0, 2992609.0, 109169.0, 15735.0, 3596.0, 997.0, 381.0, 204.0, 96.0, 64.0, 38.0, 15.0, 22.0, 22.0, 13.0, 12.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.41015625, -4.247802734375, -4.08544921875, -3.923095703125, -3.7607421875, -3.598388671875, -3.43603515625, -3.273681640625, -3.111328125, -2.948974609375, -2.78662109375, -2.624267578125, -2.4619140625, -2.299560546875, -2.13720703125, -1.974853515625, -1.8125, -1.650146484375, -1.48779296875, -1.325439453125, -1.1630859375, -1.000732421875, -0.83837890625, -0.676025390625, -0.513671875, -0.351318359375, -0.18896484375, -0.026611328125, 0.1357421875, 0.298095703125, 0.46044921875, 0.622802734375, 0.78515625, 0.947509765625, 1.10986328125, 1.272216796875, 1.4345703125, 1.596923828125, 1.75927734375, 1.921630859375, 2.083984375, 2.246337890625, 2.40869140625, 2.571044921875, 2.7333984375, 2.895751953125, 3.05810546875, 3.220458984375, 3.3828125, 3.545166015625, 3.70751953125, 3.869873046875, 4.0322265625, 4.194580078125, 4.35693359375, 4.519287109375, 4.681640625, 4.843994140625, 5.00634765625, 5.168701171875, 5.3310546875, 5.493408203125, 5.65576171875, 5.818115234375, 5.98046875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 13.0, 7.0, 6.0, 12.0, 8.0, 14.0, 24.0, 27.0, 31.0, 55.0, 67.0, 123.0, 178.0, 299.0, 471.0, 663.0, 707.0, 495.0, 321.0, 163.0, 100.0, 71.0, 57.0, 39.0, 29.0, 28.0, 14.0, 9.0, 11.0, 10.0, 5.0, 8.0, 3.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.947265625, -3.820220947265625, -3.69317626953125, -3.566131591796875, -3.4390869140625, -3.312042236328125, -3.18499755859375, -3.057952880859375, -2.930908203125, -2.803863525390625, -2.67681884765625, -2.549774169921875, -2.4227294921875, -2.295684814453125, -2.16864013671875, -2.041595458984375, -1.91455078125, -1.787506103515625, -1.66046142578125, -1.533416748046875, -1.4063720703125, -1.279327392578125, -1.15228271484375, -1.025238037109375, -0.898193359375, -0.771148681640625, -0.64410400390625, -0.517059326171875, -0.3900146484375, -0.262969970703125, -0.13592529296875, -0.008880615234375, 0.1181640625, 0.245208740234375, 0.37225341796875, 0.499298095703125, 0.6263427734375, 0.753387451171875, 0.88043212890625, 1.007476806640625, 1.134521484375, 1.261566162109375, 1.38861083984375, 1.515655517578125, 1.6427001953125, 1.769744873046875, 1.89678955078125, 2.023834228515625, 2.15087890625, 2.277923583984375, 2.40496826171875, 2.532012939453125, 2.6590576171875, 2.786102294921875, 2.91314697265625, 3.040191650390625, 3.167236328125, 3.294281005859375, 3.42132568359375, 3.548370361328125, 3.6754150390625, 3.802459716796875, 3.92950439453125, 4.056549072265625, 4.18359375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 12.0, 46.0, 93.0, 183.0, 284.0, 170.0, 123.0, 54.0, 13.0, 8.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.06366729736328, -33.44221115112305, -31.820756912231445, -30.19930076599121, -28.57784652709961, -26.956390380859375, -25.33493423461914, -23.71347999572754, -22.092025756835938, -20.470569610595703, -18.8491153717041, -17.227659225463867, -15.606204986572266, -13.984748840332031, -12.363293647766113, -10.741838455200195, -9.120382308959961, -7.498927116394043, -5.877471923828125, -4.256016254425049, -2.634561061859131, -1.0131053924560547, 0.6083498001098633, 2.2298049926757812, 3.851260185241699, 5.472715377807617, 7.094170570373535, 8.715625762939453, 10.337081909179688, 11.958537101745605, 13.579992294311523, 15.201447486877441, 16.82290267944336, 18.444358825683594, 20.065813064575195, 21.68726921081543, 23.30872344970703, 24.930179595947266, 26.5516357421875, 28.1730899810791, 29.794544219970703, 31.416000366210938, 33.03745651245117, 34.65890884399414, 36.280364990234375, 37.90182113647461, 39.523277282714844, 41.14472961425781, 42.76618957519531, 44.38764572143555, 46.00910186767578, 47.63055419921875, 49.252010345458984, 50.87346649169922, 52.49492263793945, 54.11637878417969, 55.737831115722656, 57.35928726196289, 58.980743408203125, 60.602195739746094, 62.22365188598633, 63.84510803222656, 65.46656036376953, 67.08802032470703, 68.70947265625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 4.0, 10.0, 11.0, 13.0, 22.0, 13.0, 15.0, 20.0, 24.0, 28.0, 23.0, 31.0, 28.0, 30.0, 46.0, 40.0, 49.0, 50.0, 55.0, 47.0, 53.0, 51.0, 41.0, 40.0, 31.0, 34.0, 30.0, 25.0, 21.0, 22.0, 21.0, 7.0, 6.0, 15.0, 14.0, 6.0, 6.0, 5.0, 2.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.416810989379883, -14.879827499389648, -14.342843055725098, -13.805858612060547, -13.268875122070312, -12.731891632080078, -12.194907188415527, -11.657922744750977, -11.120939254760742, -10.583955764770508, -10.046971321105957, -9.509986877441406, -8.973003387451172, -8.436019897460938, -7.899035453796387, -7.362051486968994, -6.825067520141602, -6.288083553314209, -5.751099586486816, -5.214115619659424, -4.677131652832031, -4.140147686004639, -3.603163719177246, -3.0661797523498535, -2.529195785522461, -1.9922118186950684, -1.4552278518676758, -0.9182438850402832, -0.3812599182128906, 0.15572404861450195, 0.6927080154418945, 1.229691982269287, 1.7666759490966797, 2.3036599159240723, 2.840643882751465, 3.3776278495788574, 3.91461181640625, 4.451595783233643, 4.988579750061035, 5.525563716888428, 6.06254768371582, 6.599531650543213, 7.1365156173706055, 7.673499584197998, 8.21048355102539, 8.747467041015625, 9.284451484680176, 9.821435928344727, 10.358419418334961, 10.895402908325195, 11.432387351989746, 11.969371795654297, 12.506355285644531, 13.043338775634766, 13.580323219299316, 14.117307662963867, 14.654291152954102, 15.191274642944336, 15.728259086608887, 16.265243530273438, 16.802227020263672, 17.339210510253906, 17.87619400024414, 18.413179397583008, 18.950162887573242]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 8.0, 11.0, 10.0, 17.0, 28.0, 42.0, 53.0, 80.0, 125.0, 205.0, 323.0, 594.0, 1032.0, 1776.0, 3798.0, 7953.0, 17773.0, 42859.0, 112246.0, 279118.0, 330296.0, 150916.0, 56551.0, 22931.0, 9916.0, 4604.0, 2338.0, 1231.0, 632.0, 405.0, 247.0, 155.0, 95.0, 62.0, 47.0, 31.0, 11.0, 11.0, 9.0, 8.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.705078125, -2.62347412109375, -2.5418701171875, -2.46026611328125, -2.378662109375, -2.29705810546875, -2.2154541015625, -2.13385009765625, -2.05224609375, -1.97064208984375, -1.8890380859375, -1.80743408203125, -1.725830078125, -1.64422607421875, -1.5626220703125, -1.48101806640625, -1.3994140625, -1.31781005859375, -1.2362060546875, -1.15460205078125, -1.072998046875, -0.99139404296875, -0.9097900390625, -0.82818603515625, -0.74658203125, -0.66497802734375, -0.5833740234375, -0.50177001953125, -0.420166015625, -0.33856201171875, -0.2569580078125, -0.17535400390625, -0.09375, -0.01214599609375, 0.0694580078125, 0.15106201171875, 0.232666015625, 0.31427001953125, 0.3958740234375, 0.47747802734375, 0.55908203125, 0.64068603515625, 0.7222900390625, 0.80389404296875, 0.885498046875, 0.96710205078125, 1.0487060546875, 1.13031005859375, 1.2119140625, 1.29351806640625, 1.3751220703125, 1.45672607421875, 1.538330078125, 1.61993408203125, 1.7015380859375, 1.78314208984375, 1.86474609375, 1.94635009765625, 2.0279541015625, 2.10955810546875, 2.191162109375, 2.27276611328125, 2.3543701171875, 2.43597412109375, 2.517578125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 4.0, 2.0, 4.0, 8.0, 9.0, 8.0, 15.0, 21.0, 14.0, 18.0, 19.0, 24.0, 21.0, 26.0, 35.0, 30.0, 31.0, 36.0, 50.0, 52.0, 37.0, 53.0, 56.0, 35.0, 46.0, 35.0, 33.0, 29.0, 44.0, 19.0, 32.0, 24.0, 20.0, 10.0, 27.0, 19.0, 3.0, 11.0, 6.0, 5.0, 5.0, 7.0, 5.0, 11.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.9052734375, -1.8516082763671875, -1.797943115234375, -1.7442779541015625, -1.69061279296875, -1.6369476318359375, -1.583282470703125, -1.5296173095703125, -1.4759521484375, -1.4222869873046875, -1.368621826171875, -1.3149566650390625, -1.26129150390625, -1.2076263427734375, -1.153961181640625, -1.1002960205078125, -1.046630859375, -0.9929656982421875, -0.939300537109375, -0.8856353759765625, -0.83197021484375, -0.7783050537109375, -0.724639892578125, -0.6709747314453125, -0.6173095703125, -0.5636444091796875, -0.509979248046875, -0.4563140869140625, -0.40264892578125, -0.3489837646484375, -0.295318603515625, -0.2416534423828125, -0.18798828125, -0.1343231201171875, -0.080657958984375, -0.0269927978515625, 0.02667236328125, 0.0803375244140625, 0.134002685546875, 0.1876678466796875, 0.2413330078125, 0.2949981689453125, 0.348663330078125, 0.4023284912109375, 0.45599365234375, 0.5096588134765625, 0.563323974609375, 0.6169891357421875, 0.670654296875, 0.7243194580078125, 0.777984619140625, 0.8316497802734375, 0.88531494140625, 0.9389801025390625, 0.992645263671875, 1.0463104248046875, 1.0999755859375, 1.1536407470703125, 1.207305908203125, 1.2609710693359375, 1.31463623046875, 1.3683013916015625, 1.421966552734375, 1.4756317138671875, 1.529296875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 7.0, 6.0, 6.0, 11.0, 11.0, 15.0, 19.0, 53.0, 62.0, 83.0, 156.0, 205.0, 410.0, 824.0, 1877.0, 7336.0, 52332.0, 734244.0, 223354.0, 20818.0, 3927.0, 1315.0, 641.0, 302.0, 192.0, 117.0, 64.0, 48.0, 36.0, 20.0, 20.0, 17.0, 11.0, 8.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.1640625, -6.945556640625, -6.72705078125, -6.508544921875, -6.2900390625, -6.071533203125, -5.85302734375, -5.634521484375, -5.416015625, -5.197509765625, -4.97900390625, -4.760498046875, -4.5419921875, -4.323486328125, -4.10498046875, -3.886474609375, -3.66796875, -3.449462890625, -3.23095703125, -3.012451171875, -2.7939453125, -2.575439453125, -2.35693359375, -2.138427734375, -1.919921875, -1.701416015625, -1.48291015625, -1.264404296875, -1.0458984375, -0.827392578125, -0.60888671875, -0.390380859375, -0.171875, 0.046630859375, 0.26513671875, 0.483642578125, 0.7021484375, 0.920654296875, 1.13916015625, 1.357666015625, 1.576171875, 1.794677734375, 2.01318359375, 2.231689453125, 2.4501953125, 2.668701171875, 2.88720703125, 3.105712890625, 3.32421875, 3.542724609375, 3.76123046875, 3.979736328125, 4.1982421875, 4.416748046875, 4.63525390625, 4.853759765625, 5.072265625, 5.290771484375, 5.50927734375, 5.727783203125, 5.9462890625, 6.164794921875, 6.38330078125, 6.601806640625, 6.8203125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 6.0, 9.0, 7.0, 14.0, 23.0, 17.0, 30.0, 14.0, 31.0, 37.0, 58.0, 44.0, 60.0, 66.0, 66.0, 55.0, 55.0, 68.0, 64.0, 53.0, 34.0, 42.0, 36.0, 24.0, 17.0, 17.0, 17.0, 15.0, 2.0, 6.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.93359375, -6.66741943359375, -6.4012451171875, -6.13507080078125, -5.868896484375, -5.60272216796875, -5.3365478515625, -5.07037353515625, -4.80419921875, -4.53802490234375, -4.2718505859375, -4.00567626953125, -3.739501953125, -3.47332763671875, -3.2071533203125, -2.94097900390625, -2.6748046875, -2.40863037109375, -2.1424560546875, -1.87628173828125, -1.610107421875, -1.34393310546875, -1.0777587890625, -0.81158447265625, -0.54541015625, -0.27923583984375, -0.0130615234375, 0.25311279296875, 0.519287109375, 0.78546142578125, 1.0516357421875, 1.31781005859375, 1.583984375, 1.85015869140625, 2.1163330078125, 2.38250732421875, 2.648681640625, 2.91485595703125, 3.1810302734375, 3.44720458984375, 3.71337890625, 3.97955322265625, 4.2457275390625, 4.51190185546875, 4.778076171875, 5.04425048828125, 5.3104248046875, 5.57659912109375, 5.8427734375, 6.10894775390625, 6.3751220703125, 6.64129638671875, 6.907470703125, 7.17364501953125, 7.4398193359375, 7.70599365234375, 7.97216796875, 8.23834228515625, 8.5045166015625, 8.77069091796875, 9.036865234375, 9.30303955078125, 9.5692138671875, 9.83538818359375, 10.1015625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 1.0, 7.0, 2.0, 7.0, 14.0, 23.0, 42.0, 74.0, 187.0, 428.0, 1261.0, 4806.0, 26389.0, 378900.0, 601168.0, 28153.0, 4904.0, 1362.0, 475.0, 155.0, 82.0, 45.0, 23.0, 14.0, 8.0, 6.0, 3.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.921875, -1.853271484375, -1.78466796875, -1.716064453125, -1.6474609375, -1.578857421875, -1.51025390625, -1.441650390625, -1.373046875, -1.304443359375, -1.23583984375, -1.167236328125, -1.0986328125, -1.030029296875, -0.96142578125, -0.892822265625, -0.82421875, -0.755615234375, -0.68701171875, -0.618408203125, -0.5498046875, -0.481201171875, -0.41259765625, -0.343994140625, -0.275390625, -0.206787109375, -0.13818359375, -0.069580078125, -0.0009765625, 0.067626953125, 0.13623046875, 0.204833984375, 0.2734375, 0.342041015625, 0.41064453125, 0.479248046875, 0.5478515625, 0.616455078125, 0.68505859375, 0.753662109375, 0.822265625, 0.890869140625, 0.95947265625, 1.028076171875, 1.0966796875, 1.165283203125, 1.23388671875, 1.302490234375, 1.37109375, 1.439697265625, 1.50830078125, 1.576904296875, 1.6455078125, 1.714111328125, 1.78271484375, 1.851318359375, 1.919921875, 1.988525390625, 2.05712890625, 2.125732421875, 2.1943359375, 2.262939453125, 2.33154296875, 2.400146484375, 2.46875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 8.0, 6.0, 5.0, 4.0, 12.0, 18.0, 15.0, 27.0, 45.0, 56.0, 66.0, 133.0, 147.0, 131.0, 99.0, 60.0, 43.0, 34.0, 15.0, 18.0, 16.0, 7.0, 17.0, 8.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00033211708068847656, -0.0003192536532878876, -0.0003063902258872986, -0.0002935267984867096, -0.0002806633710861206, -0.0002677999436855316, -0.0002549365162849426, -0.00024207308888435364, -0.00022920966148376465, -0.00021634623408317566, -0.00020348280668258667, -0.00019061937928199768, -0.0001777559518814087, -0.0001648925244808197, -0.0001520290970802307, -0.00013916566967964172, -0.00012630224227905273, -0.00011343881487846375, -0.00010057538747787476, -8.771196007728577e-05, -7.484853267669678e-05, -6.198510527610779e-05, -4.91216778755188e-05, -3.625825047492981e-05, -2.339482307434082e-05, -1.0531395673751831e-05, 2.332031726837158e-06, 1.5195459127426147e-05, 2.8058886528015137e-05, 4.0922313928604126e-05, 5.3785741329193115e-05, 6.66491687297821e-05, 7.95125961303711e-05, 9.237602353096008e-05, 0.00010523945093154907, 0.00011810287833213806, 0.00013096630573272705, 0.00014382973313331604, 0.00015669316053390503, 0.00016955658793449402, 0.000182420015335083, 0.000195283442735672, 0.00020814687013626099, 0.00022101029753684998, 0.00023387372493743896, 0.00024673715233802795, 0.00025960057973861694, 0.00027246400713920593, 0.0002853274345397949, 0.0002981908619403839, 0.0003110542893409729, 0.0003239177167415619, 0.0003367811441421509, 0.00034964457154273987, 0.00036250799894332886, 0.00037537142634391785, 0.00038823485374450684, 0.0004010982811450958, 0.0004139617085456848, 0.0004268251359462738, 0.0004396885633468628, 0.0004525519907474518, 0.00046541541814804077, 0.00047827884554862976, 0.0004911422729492188]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 12.0, 10.0, 14.0, 24.0, 28.0, 63.0, 99.0, 188.0, 342.0, 732.0, 1796.0, 5601.0, 24848.0, 183443.0, 748679.0, 65398.0, 11685.0, 3251.0, 1177.0, 536.0, 257.0, 138.0, 90.0, 50.0, 29.0, 21.0, 13.0, 5.0, 9.0, 7.0, 6.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.55859375, -1.501434326171875, -1.44427490234375, -1.387115478515625, -1.3299560546875, -1.272796630859375, -1.21563720703125, -1.158477783203125, -1.101318359375, -1.044158935546875, -0.98699951171875, -0.929840087890625, -0.8726806640625, -0.815521240234375, -0.75836181640625, -0.701202392578125, -0.64404296875, -0.586883544921875, -0.52972412109375, -0.472564697265625, -0.4154052734375, -0.358245849609375, -0.30108642578125, -0.243927001953125, -0.186767578125, -0.129608154296875, -0.07244873046875, -0.015289306640625, 0.0418701171875, 0.099029541015625, 0.15618896484375, 0.213348388671875, 0.2705078125, 0.327667236328125, 0.38482666015625, 0.441986083984375, 0.4991455078125, 0.556304931640625, 0.61346435546875, 0.670623779296875, 0.727783203125, 0.784942626953125, 0.84210205078125, 0.899261474609375, 0.9564208984375, 1.013580322265625, 1.07073974609375, 1.127899169921875, 1.18505859375, 1.242218017578125, 1.29937744140625, 1.356536865234375, 1.4136962890625, 1.470855712890625, 1.52801513671875, 1.585174560546875, 1.642333984375, 1.699493408203125, 1.75665283203125, 1.813812255859375, 1.8709716796875, 1.928131103515625, 1.98529052734375, 2.042449951171875, 2.099609375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 9.0, 7.0, 8.0, 14.0, 17.0, 9.0, 27.0, 35.0, 72.0, 80.0, 125.0, 138.0, 112.0, 96.0, 57.0, 48.0, 33.0, 18.0, 23.0, 10.0, 8.0, 9.0, 12.0, 7.0, 2.0, 6.0, 2.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5849609375, -1.53314208984375, -1.4813232421875, -1.42950439453125, -1.377685546875, -1.32586669921875, -1.2740478515625, -1.22222900390625, -1.17041015625, -1.11859130859375, -1.0667724609375, -1.01495361328125, -0.963134765625, -0.91131591796875, -0.8594970703125, -0.80767822265625, -0.755859375, -0.70404052734375, -0.6522216796875, -0.60040283203125, -0.548583984375, -0.49676513671875, -0.4449462890625, -0.39312744140625, -0.34130859375, -0.28948974609375, -0.2376708984375, -0.18585205078125, -0.134033203125, -0.08221435546875, -0.0303955078125, 0.02142333984375, 0.0732421875, 0.12506103515625, 0.1768798828125, 0.22869873046875, 0.280517578125, 0.33233642578125, 0.3841552734375, 0.43597412109375, 0.48779296875, 0.53961181640625, 0.5914306640625, 0.64324951171875, 0.695068359375, 0.74688720703125, 0.7987060546875, 0.85052490234375, 0.90234375, 0.95416259765625, 1.0059814453125, 1.05780029296875, 1.109619140625, 1.16143798828125, 1.2132568359375, 1.26507568359375, 1.31689453125, 1.36871337890625, 1.4205322265625, 1.47235107421875, 1.524169921875, 1.57598876953125, 1.6278076171875, 1.67962646484375, 1.7314453125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 9.0, 18.0, 36.0, 115.0, 330.0, 322.0, 110.0, 36.0, 12.0, 6.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.340572357177734, -49.28413391113281, -47.227699279785156, -45.171260833740234, -43.11482238769531, -41.05838394165039, -39.00194549560547, -36.94551086425781, -34.88907241821289, -32.83263397216797, -30.77619743347168, -28.71976089477539, -26.66332244873047, -24.606884002685547, -22.550447463989258, -20.49401092529297, -18.437572479248047, -16.381134033203125, -14.324697494506836, -12.26826000213623, -10.211822509765625, -8.15538501739502, -6.098947525024414, -4.042510032653809, -1.9860725402832031, 0.07036495208740234, 2.126802444458008, 4.183239936828613, 6.239677429199219, 8.296114921569824, 10.35255241394043, 12.408989906311035, 14.465423583984375, 16.521862030029297, 18.578298568725586, 20.634735107421875, 22.691173553466797, 24.74761199951172, 26.804048538208008, 28.860485076904297, 30.91692352294922, 32.97336196899414, 35.02980041503906, 37.08623504638672, 39.14267349243164, 41.19911193847656, 43.25554656982422, 45.31198501586914, 47.36842346191406, 49.424861907958984, 51.481300354003906, 53.53773498535156, 55.594173431396484, 57.650611877441406, 59.70704650878906, 61.763484954833984, 63.819923400878906, 65.87635803222656, 67.93280029296875, 69.9892349243164, 72.04566955566406, 74.10211181640625, 76.1585464477539, 78.2149887084961, 80.27142333984375]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 8.0, 4.0, 12.0, 9.0, 6.0, 14.0, 13.0, 11.0, 22.0, 21.0, 18.0, 23.0, 13.0, 23.0, 32.0, 31.0, 37.0, 56.0, 87.0, 98.0, 77.0, 63.0, 39.0, 29.0, 38.0, 26.0, 19.0, 23.0, 11.0, 23.0, 16.0, 14.0, 13.0, 10.0, 13.0, 7.0, 9.0, 3.0, 7.0, 4.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-25.095874786376953, -24.34669303894043, -23.59751319885254, -22.848331451416016, -22.099151611328125, -21.3499698638916, -20.600788116455078, -19.851608276367188, -19.102426528930664, -18.35324478149414, -17.60406494140625, -16.854883193969727, -16.105701446533203, -15.356521606445312, -14.607339859008789, -13.858159065246582, -13.108978271484375, -12.359797477722168, -11.610616683959961, -10.861434936523438, -10.11225414276123, -9.363073348999023, -8.6138916015625, -7.864710807800293, -7.115530014038086, -6.366349220275879, -5.617167949676514, -4.867986679077148, -4.118805885314941, -3.3696248531341553, -2.620443820953369, -1.871262550354004, -1.122079849243164, -0.37289881706237793, 0.3762822151184082, 1.1254632472991943, 1.8746442794799805, 2.6238253116607666, 3.3730063438415527, 4.122187614440918, 4.871368408203125, 5.620549201965332, 6.369730472564697, 7.1189117431640625, 7.8680925369262695, 8.617273330688477, 9.366455078125, 10.115635871887207, 10.864816665649414, 11.613997459411621, 12.363178253173828, 13.112360000610352, 13.861540794372559, 14.610721588134766, 15.359903335571289, 16.109085083007812, 16.858264923095703, 17.607446670532227, 18.356626510620117, 19.10580825805664, 19.85498809814453, 20.604169845581055, 21.353351593017578, 22.10253143310547, 22.851713180541992]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 9.0, 9.0, 15.0, 13.0, 21.0, 33.0, 44.0, 67.0, 101.0, 156.0, 222.0, 394.0, 615.0, 1036.0, 1960.0, 3853.0, 8406.0, 20974.0, 65070.0, 244608.0, 992593.0, 1916452.0, 690349.0, 168108.0, 47629.0, 16965.0, 6939.0, 3361.0, 1774.0, 960.0, 529.0, 352.0, 214.0, 151.0, 102.0, 59.0, 38.0, 27.0, 26.0, 15.0, 11.0, 9.0, 5.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.9638671875, -1.9083404541015625, -1.852813720703125, -1.7972869873046875, -1.74176025390625, -1.6862335205078125, -1.630706787109375, -1.5751800537109375, -1.5196533203125, -1.4641265869140625, -1.408599853515625, -1.3530731201171875, -1.29754638671875, -1.2420196533203125, -1.186492919921875, -1.1309661865234375, -1.075439453125, -1.0199127197265625, -0.964385986328125, -0.9088592529296875, -0.85333251953125, -0.7978057861328125, -0.742279052734375, -0.6867523193359375, -0.6312255859375, -0.5756988525390625, -0.520172119140625, -0.4646453857421875, -0.40911865234375, -0.3535919189453125, -0.298065185546875, -0.2425384521484375, -0.18701171875, -0.1314849853515625, -0.075958251953125, -0.0204315185546875, 0.03509521484375, 0.0906219482421875, 0.146148681640625, 0.2016754150390625, 0.2572021484375, 0.3127288818359375, 0.368255615234375, 0.4237823486328125, 0.47930908203125, 0.5348358154296875, 0.590362548828125, 0.6458892822265625, 0.701416015625, 0.7569427490234375, 0.812469482421875, 0.8679962158203125, 0.92352294921875, 0.9790496826171875, 1.034576416015625, 1.0901031494140625, 1.1456298828125, 1.2011566162109375, 1.256683349609375, 1.3122100830078125, 1.36773681640625, 1.4232635498046875, 1.478790283203125, 1.5343170166015625, 1.58984375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 5.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 7.0, 11.0, 11.0, 16.0, 9.0, 23.0, 21.0, 28.0, 24.0, 22.0, 26.0, 42.0, 30.0, 36.0, 37.0, 36.0, 38.0, 56.0, 50.0, 38.0, 36.0, 51.0, 38.0, 36.0, 34.0, 26.0, 22.0, 30.0, 25.0, 16.0, 19.0, 21.0, 14.0, 7.0, 9.0, 10.0, 8.0, 6.0, 4.0, 1.0, 4.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.7568359375, -1.7066497802734375, -1.656463623046875, -1.6062774658203125, -1.55609130859375, -1.5059051513671875, -1.455718994140625, -1.4055328369140625, -1.3553466796875, -1.3051605224609375, -1.254974365234375, -1.2047882080078125, -1.15460205078125, -1.1044158935546875, -1.054229736328125, -1.0040435791015625, -0.953857421875, -0.9036712646484375, -0.853485107421875, -0.8032989501953125, -0.75311279296875, -0.7029266357421875, -0.652740478515625, -0.6025543212890625, -0.5523681640625, -0.5021820068359375, -0.451995849609375, -0.4018096923828125, -0.35162353515625, -0.3014373779296875, -0.251251220703125, -0.2010650634765625, -0.15087890625, -0.1006927490234375, -0.050506591796875, -0.0003204345703125, 0.04986572265625, 0.1000518798828125, 0.150238037109375, 0.2004241943359375, 0.2506103515625, 0.3007965087890625, 0.350982666015625, 0.4011688232421875, 0.45135498046875, 0.5015411376953125, 0.551727294921875, 0.6019134521484375, 0.652099609375, 0.7022857666015625, 0.752471923828125, 0.8026580810546875, 0.85284423828125, 0.9030303955078125, 0.953216552734375, 1.0034027099609375, 1.0535888671875, 1.1037750244140625, 1.153961181640625, 1.2041473388671875, 1.25433349609375, 1.3045196533203125, 1.354705810546875, 1.4048919677734375, 1.455078125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 7.0, 9.0, 15.0, 31.0, 64.0, 116.0, 238.0, 620.0, 2622.0, 21287.0, 1851667.0, 2289488.0, 24108.0, 2863.0, 636.0, 247.0, 114.0, 61.0, 26.0, 19.0, 18.0, 10.0, 4.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.265625, -9.01531982421875, -8.7650146484375, -8.51470947265625, -8.264404296875, -8.01409912109375, -7.7637939453125, -7.51348876953125, -7.26318359375, -7.01287841796875, -6.7625732421875, -6.51226806640625, -6.261962890625, -6.01165771484375, -5.7613525390625, -5.51104736328125, -5.2607421875, -5.01043701171875, -4.7601318359375, -4.50982666015625, -4.259521484375, -4.00921630859375, -3.7589111328125, -3.50860595703125, -3.25830078125, -3.00799560546875, -2.7576904296875, -2.50738525390625, -2.257080078125, -2.00677490234375, -1.7564697265625, -1.50616455078125, -1.255859375, -1.00555419921875, -0.7552490234375, -0.50494384765625, -0.254638671875, -0.00433349609375, 0.2459716796875, 0.49627685546875, 0.74658203125, 0.99688720703125, 1.2471923828125, 1.49749755859375, 1.747802734375, 1.99810791015625, 2.2484130859375, 2.49871826171875, 2.7490234375, 2.99932861328125, 3.2496337890625, 3.49993896484375, 3.750244140625, 4.00054931640625, 4.2508544921875, 4.50115966796875, 4.75146484375, 5.00177001953125, 5.2520751953125, 5.50238037109375, 5.752685546875, 6.00299072265625, 6.2532958984375, 6.50360107421875, 6.75390625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 5.0, 8.0, 14.0, 27.0, 31.0, 75.0, 89.0, 177.0, 326.0, 603.0, 949.0, 737.0, 425.0, 240.0, 122.0, 76.0, 60.0, 34.0, 19.0, 16.0, 6.0, 10.0, 5.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7421875, -3.570068359375, -3.39794921875, -3.225830078125, -3.0537109375, -2.881591796875, -2.70947265625, -2.537353515625, -2.365234375, -2.193115234375, -2.02099609375, -1.848876953125, -1.6767578125, -1.504638671875, -1.33251953125, -1.160400390625, -0.98828125, -0.816162109375, -0.64404296875, -0.471923828125, -0.2998046875, -0.127685546875, 0.04443359375, 0.216552734375, 0.388671875, 0.560791015625, 0.73291015625, 0.905029296875, 1.0771484375, 1.249267578125, 1.42138671875, 1.593505859375, 1.765625, 1.937744140625, 2.10986328125, 2.281982421875, 2.4541015625, 2.626220703125, 2.79833984375, 2.970458984375, 3.142578125, 3.314697265625, 3.48681640625, 3.658935546875, 3.8310546875, 4.003173828125, 4.17529296875, 4.347412109375, 4.51953125, 4.691650390625, 4.86376953125, 5.035888671875, 5.2080078125, 5.380126953125, 5.55224609375, 5.724365234375, 5.896484375, 6.068603515625, 6.24072265625, 6.412841796875, 6.5849609375, 6.757080078125, 6.92919921875, 7.101318359375, 7.2734375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 17.0, 40.0, 163.0, 361.0, 282.0, 92.0, 25.0, 14.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.496604919433594, -39.15985107421875, -36.823097229003906, -34.4863395690918, -32.14958572387695, -29.81283187866211, -27.476076126098633, -25.139320373535156, -22.802566528320312, -20.46581268310547, -18.129056930541992, -15.792302131652832, -13.455547332763672, -11.118792533874512, -8.782037734985352, -6.445281982421875, -4.108528137207031, -1.771773338317871, 0.5649814605712891, 2.901736259460449, 5.238491058349609, 7.5752458572387695, 9.91200065612793, 12.248756408691406, 14.58551025390625, 16.922264099121094, 19.25901985168457, 21.595775604248047, 23.93252944946289, 26.269283294677734, 28.60603904724121, 30.942794799804688, 33.279541015625, 35.616294860839844, 37.95304870605469, 40.2898063659668, 42.62656021118164, 44.963314056396484, 47.300071716308594, 49.63682556152344, 51.97357940673828, 54.310333251953125, 56.64708709716797, 58.98384475708008, 61.32059860229492, 63.657352447509766, 65.99411010742188, 68.33086395263672, 70.66761779785156, 73.0043716430664, 75.34112548828125, 77.6778793334961, 80.01463317871094, 82.35139465332031, 84.68814849853516, 87.02490234375, 89.36165618896484, 91.69841003417969, 94.03516387939453, 96.37191772460938, 98.70867919921875, 101.0454330444336, 103.38218688964844, 105.71894073486328, 108.05569458007812]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 9.0, 6.0, 5.0, 5.0, 5.0, 5.0, 7.0, 13.0, 11.0, 8.0, 13.0, 23.0, 22.0, 19.0, 30.0, 29.0, 31.0, 41.0, 41.0, 50.0, 52.0, 60.0, 43.0, 46.0, 62.0, 40.0, 47.0, 31.0, 33.0, 35.0, 27.0, 23.0, 20.0, 17.0, 13.0, 14.0, 15.0, 17.0, 6.0, 7.0, 6.0, 3.0, 4.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0], "bins": [-18.312931060791016, -17.755704879760742, -17.198476791381836, -16.641250610351562, -16.08402442932129, -15.5267972946167, -14.96957015991211, -14.412343978881836, -13.855116844177246, -13.297889709472656, -12.740663528442383, -12.183436393737793, -11.626209259033203, -11.06898307800293, -10.51175594329834, -9.95452880859375, -9.397302627563477, -8.840075492858887, -8.282849311828613, -7.725622177124023, -7.168395519256592, -6.61116886138916, -6.05394172668457, -5.496715068817139, -4.939488410949707, -4.382261753082275, -3.8250348567962646, -3.267807960510254, -2.7105813026428223, -2.1533546447753906, -1.5961277484893799, -1.0389008522033691, -0.4816741943359375, 0.07555258274078369, 0.6327793598175049, 1.190006136894226, 1.7472329139709473, 2.304459571838379, 2.8616864681243896, 3.4189133644104004, 3.976140022277832, 4.533366680145264, 5.090593338012695, 5.647820472717285, 6.205047130584717, 6.762273788452148, 7.319500923156738, 7.87672758102417, 8.433954238891602, 8.991181373596191, 9.548407554626465, 10.105634689331055, 10.662860870361328, 11.220088005065918, 11.777315139770508, 12.334541320800781, 12.891768455505371, 13.448995590209961, 14.006221771240234, 14.563448905944824, 15.120676040649414, 15.677902221679688, 16.23512840270996, 16.792356491088867, 17.34958267211914]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 9.0, 8.0, 12.0, 19.0, 23.0, 43.0, 62.0, 130.0, 198.0, 369.0, 705.0, 1228.0, 2174.0, 4170.0, 8284.0, 17250.0, 37229.0, 86694.0, 211384.0, 341590.0, 192221.0, 78635.0, 34268.0, 15425.0, 7738.0, 3919.0, 2078.0, 1147.0, 620.0, 347.0, 225.0, 137.0, 84.0, 58.0, 28.0, 22.0, 9.0, 3.0, 2.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.283203125, -2.20001220703125, -2.1168212890625, -2.03363037109375, -1.950439453125, -1.86724853515625, -1.7840576171875, -1.70086669921875, -1.61767578125, -1.53448486328125, -1.4512939453125, -1.36810302734375, -1.284912109375, -1.20172119140625, -1.1185302734375, -1.03533935546875, -0.9521484375, -0.86895751953125, -0.7857666015625, -0.70257568359375, -0.619384765625, -0.53619384765625, -0.4530029296875, -0.36981201171875, -0.28662109375, -0.20343017578125, -0.1202392578125, -0.03704833984375, 0.046142578125, 0.12933349609375, 0.2125244140625, 0.29571533203125, 0.37890625, 0.46209716796875, 0.5452880859375, 0.62847900390625, 0.711669921875, 0.79486083984375, 0.8780517578125, 0.96124267578125, 1.04443359375, 1.12762451171875, 1.2108154296875, 1.29400634765625, 1.377197265625, 1.46038818359375, 1.5435791015625, 1.62677001953125, 1.7099609375, 1.79315185546875, 1.8763427734375, 1.95953369140625, 2.042724609375, 2.12591552734375, 2.2091064453125, 2.29229736328125, 2.37548828125, 2.45867919921875, 2.5418701171875, 2.62506103515625, 2.708251953125, 2.79144287109375, 2.8746337890625, 2.95782470703125, 3.041015625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 2.0, 6.0, 4.0, 7.0, 8.0, 9.0, 8.0, 16.0, 11.0, 9.0, 24.0, 23.0, 24.0, 31.0, 23.0, 30.0, 34.0, 23.0, 41.0, 28.0, 38.0, 33.0, 41.0, 40.0, 30.0, 41.0, 40.0, 41.0, 34.0, 29.0, 25.0, 31.0, 24.0, 35.0, 24.0, 23.0, 15.0, 18.0, 15.0, 11.0, 5.0, 8.0, 11.0, 6.0, 6.0, 6.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0], "bins": [-1.703125, -1.65484619140625, -1.6065673828125, -1.55828857421875, -1.510009765625, -1.46173095703125, -1.4134521484375, -1.36517333984375, -1.31689453125, -1.26861572265625, -1.2203369140625, -1.17205810546875, -1.123779296875, -1.07550048828125, -1.0272216796875, -0.97894287109375, -0.9306640625, -0.88238525390625, -0.8341064453125, -0.78582763671875, -0.737548828125, -0.68927001953125, -0.6409912109375, -0.59271240234375, -0.54443359375, -0.49615478515625, -0.4478759765625, -0.39959716796875, -0.351318359375, -0.30303955078125, -0.2547607421875, -0.20648193359375, -0.158203125, -0.10992431640625, -0.0616455078125, -0.01336669921875, 0.034912109375, 0.08319091796875, 0.1314697265625, 0.17974853515625, 0.22802734375, 0.27630615234375, 0.3245849609375, 0.37286376953125, 0.421142578125, 0.46942138671875, 0.5177001953125, 0.56597900390625, 0.6142578125, 0.66253662109375, 0.7108154296875, 0.75909423828125, 0.807373046875, 0.85565185546875, 0.9039306640625, 0.95220947265625, 1.00048828125, 1.04876708984375, 1.0970458984375, 1.14532470703125, 1.193603515625, 1.24188232421875, 1.2901611328125, 1.33843994140625, 1.38671875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 6.0, 3.0, 6.0, 13.0, 8.0, 11.0, 30.0, 37.0, 43.0, 65.0, 81.0, 138.0, 216.0, 338.0, 537.0, 943.0, 2083.0, 6050.0, 36327.0, 728335.0, 244675.0, 20501.0, 4400.0, 1613.0, 762.0, 472.0, 282.0, 194.0, 128.0, 76.0, 54.0, 42.0, 33.0, 18.0, 13.0, 13.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3359375, -7.11932373046875, -6.9027099609375, -6.68609619140625, -6.469482421875, -6.25286865234375, -6.0362548828125, -5.81964111328125, -5.60302734375, -5.38641357421875, -5.1697998046875, -4.95318603515625, -4.736572265625, -4.51995849609375, -4.3033447265625, -4.08673095703125, -3.8701171875, -3.65350341796875, -3.4368896484375, -3.22027587890625, -3.003662109375, -2.78704833984375, -2.5704345703125, -2.35382080078125, -2.13720703125, -1.92059326171875, -1.7039794921875, -1.48736572265625, -1.270751953125, -1.05413818359375, -0.8375244140625, -0.62091064453125, -0.404296875, -0.18768310546875, 0.0289306640625, 0.24554443359375, 0.462158203125, 0.67877197265625, 0.8953857421875, 1.11199951171875, 1.32861328125, 1.54522705078125, 1.7618408203125, 1.97845458984375, 2.195068359375, 2.41168212890625, 2.6282958984375, 2.84490966796875, 3.0615234375, 3.27813720703125, 3.4947509765625, 3.71136474609375, 3.927978515625, 4.14459228515625, 4.3612060546875, 4.57781982421875, 4.79443359375, 5.01104736328125, 5.2276611328125, 5.44427490234375, 5.660888671875, 5.87750244140625, 6.0941162109375, 6.31072998046875, 6.52734375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 6.0, 7.0, 4.0, 5.0, 7.0, 5.0, 9.0, 9.0, 8.0, 21.0, 22.0, 16.0, 18.0, 33.0, 35.0, 41.0, 46.0, 53.0, 55.0, 56.0, 58.0, 53.0, 59.0, 44.0, 63.0, 48.0, 30.0, 36.0, 31.0, 28.0, 19.0, 21.0, 15.0, 13.0, 10.0, 4.0, 9.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.50390625, -6.2884521484375, -6.072998046875, -5.8575439453125, -5.64208984375, -5.4266357421875, -5.211181640625, -4.9957275390625, -4.7802734375, -4.5648193359375, -4.349365234375, -4.1339111328125, -3.91845703125, -3.7030029296875, -3.487548828125, -3.2720947265625, -3.056640625, -2.8411865234375, -2.625732421875, -2.4102783203125, -2.19482421875, -1.9793701171875, -1.763916015625, -1.5484619140625, -1.3330078125, -1.1175537109375, -0.902099609375, -0.6866455078125, -0.47119140625, -0.2557373046875, -0.040283203125, 0.1751708984375, 0.390625, 0.6060791015625, 0.821533203125, 1.0369873046875, 1.25244140625, 1.4678955078125, 1.683349609375, 1.8988037109375, 2.1142578125, 2.3297119140625, 2.545166015625, 2.7606201171875, 2.97607421875, 3.1915283203125, 3.406982421875, 3.6224365234375, 3.837890625, 4.0533447265625, 4.268798828125, 4.4842529296875, 4.69970703125, 4.9151611328125, 5.130615234375, 5.3460693359375, 5.5615234375, 5.7769775390625, 5.992431640625, 6.2078857421875, 6.42333984375, 6.6387939453125, 6.854248046875, 7.0697021484375, 7.28515625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 13.0, 16.0, 15.0, 19.0, 19.0, 29.0, 44.0, 72.0, 95.0, 185.0, 333.0, 628.0, 1388.0, 3471.0, 10845.0, 41775.0, 267884.0, 645975.0, 54805.0, 13467.0, 4270.0, 1589.0, 711.0, 342.0, 187.0, 116.0, 70.0, 55.0, 29.0, 21.0, 22.0, 12.0, 6.0, 5.0, 11.0, 5.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.072265625, -1.035400390625, -0.99853515625, -0.961669921875, -0.9248046875, -0.887939453125, -0.85107421875, -0.814208984375, -0.77734375, -0.740478515625, -0.70361328125, -0.666748046875, -0.6298828125, -0.593017578125, -0.55615234375, -0.519287109375, -0.482421875, -0.445556640625, -0.40869140625, -0.371826171875, -0.3349609375, -0.298095703125, -0.26123046875, -0.224365234375, -0.1875, -0.150634765625, -0.11376953125, -0.076904296875, -0.0400390625, -0.003173828125, 0.03369140625, 0.070556640625, 0.107421875, 0.144287109375, 0.18115234375, 0.218017578125, 0.2548828125, 0.291748046875, 0.32861328125, 0.365478515625, 0.40234375, 0.439208984375, 0.47607421875, 0.512939453125, 0.5498046875, 0.586669921875, 0.62353515625, 0.660400390625, 0.697265625, 0.734130859375, 0.77099609375, 0.807861328125, 0.8447265625, 0.881591796875, 0.91845703125, 0.955322265625, 0.9921875, 1.029052734375, 1.06591796875, 1.102783203125, 1.1396484375, 1.176513671875, 1.21337890625, 1.250244140625, 1.287109375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 6.0, 6.0, 8.0, 8.0, 7.0, 16.0, 11.0, 20.0, 43.0, 76.0, 127.0, 181.0, 168.0, 109.0, 59.0, 41.0, 26.0, 20.0, 9.0, 11.0, 6.0, 12.0, 3.0, 6.0, 4.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0006098747253417969, -0.0005933791399002075, -0.0005768835544586182, -0.0005603879690170288, -0.0005438923835754395, -0.0005273967981338501, -0.0005109012126922607, -0.0004944056272506714, -0.00047791004180908203, -0.0004614144563674927, -0.0004449188709259033, -0.00042842328548431396, -0.0004119277000427246, -0.00039543211460113525, -0.0003789365291595459, -0.00036244094371795654, -0.0003459453582763672, -0.00032944977283477783, -0.0003129541873931885, -0.0002964586019515991, -0.00027996301651000977, -0.0002634674310684204, -0.00024697184562683105, -0.0002304762601852417, -0.00021398067474365234, -0.000197485089302063, -0.00018098950386047363, -0.00016449391841888428, -0.00014799833297729492, -0.00013150274753570557, -0.00011500716209411621, -9.851157665252686e-05, -8.20159912109375e-05, -6.552040576934814e-05, -4.902482032775879e-05, -3.2529234886169434e-05, -1.6033649444580078e-05, 4.6193599700927734e-07, 1.6957521438598633e-05, 3.345310688018799e-05, 4.9948692321777344e-05, 6.64442777633667e-05, 8.293986320495605e-05, 9.943544864654541e-05, 0.00011593103408813477, 0.00013242661952972412, 0.00014892220497131348, 0.00016541779041290283, 0.0001819133758544922, 0.00019840896129608154, 0.0002149045467376709, 0.00023140013217926025, 0.0002478957176208496, 0.00026439130306243896, 0.0002808868885040283, 0.0002973824739456177, 0.00031387805938720703, 0.0003303736448287964, 0.00034686923027038574, 0.0003633648157119751, 0.00037986040115356445, 0.0003963559865951538, 0.00041285157203674316, 0.0004293471574783325, 0.0004458427429199219]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 5.0, 11.0, 8.0, 17.0, 26.0, 36.0, 51.0, 84.0, 148.0, 229.0, 355.0, 651.0, 1299.0, 2966.0, 8113.0, 28884.0, 148130.0, 728276.0, 97139.0, 20991.0, 6157.0, 2424.0, 1060.0, 614.0, 287.0, 212.0, 129.0, 85.0, 53.0, 29.0, 26.0, 21.0, 11.0, 5.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2333984375, -1.1953125, -1.1572265625, -1.119140625, -1.0810546875, -1.04296875, -1.0048828125, -0.966796875, -0.9287109375, -0.890625, -0.8525390625, -0.814453125, -0.7763671875, -0.73828125, -0.7001953125, -0.662109375, -0.6240234375, -0.5859375, -0.5478515625, -0.509765625, -0.4716796875, -0.43359375, -0.3955078125, -0.357421875, -0.3193359375, -0.28125, -0.2431640625, -0.205078125, -0.1669921875, -0.12890625, -0.0908203125, -0.052734375, -0.0146484375, 0.0234375, 0.0615234375, 0.099609375, 0.1376953125, 0.17578125, 0.2138671875, 0.251953125, 0.2900390625, 0.328125, 0.3662109375, 0.404296875, 0.4423828125, 0.48046875, 0.5185546875, 0.556640625, 0.5947265625, 0.6328125, 0.6708984375, 0.708984375, 0.7470703125, 0.78515625, 0.8232421875, 0.861328125, 0.8994140625, 0.9375, 0.9755859375, 1.013671875, 1.0517578125, 1.08984375, 1.1279296875, 1.166015625, 1.2041015625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 7.0, 7.0, 1.0, 5.0, 4.0, 11.0, 13.0, 9.0, 10.0, 15.0, 16.0, 16.0, 22.0, 42.0, 43.0, 48.0, 68.0, 78.0, 71.0, 77.0, 78.0, 71.0, 53.0, 47.0, 36.0, 32.0, 26.0, 18.0, 8.0, 12.0, 8.0, 8.0, 11.0, 5.0, 5.0, 5.0, 3.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.138671875, -1.1082000732421875, -1.077728271484375, -1.0472564697265625, -1.01678466796875, -0.9863128662109375, -0.955841064453125, -0.9253692626953125, -0.8948974609375, -0.8644256591796875, -0.833953857421875, -0.8034820556640625, -0.77301025390625, -0.7425384521484375, -0.712066650390625, -0.6815948486328125, -0.651123046875, -0.6206512451171875, -0.590179443359375, -0.5597076416015625, -0.52923583984375, -0.4987640380859375, -0.468292236328125, -0.4378204345703125, -0.4073486328125, -0.3768768310546875, -0.346405029296875, -0.3159332275390625, -0.28546142578125, -0.2549896240234375, -0.224517822265625, -0.1940460205078125, -0.16357421875, -0.1331024169921875, -0.102630615234375, -0.0721588134765625, -0.04168701171875, -0.0112152099609375, 0.019256591796875, 0.0497283935546875, 0.0802001953125, 0.1106719970703125, 0.141143798828125, 0.1716156005859375, 0.20208740234375, 0.2325592041015625, 0.263031005859375, 0.2935028076171875, 0.323974609375, 0.3544464111328125, 0.384918212890625, 0.4153900146484375, 0.44586181640625, 0.4763336181640625, 0.506805419921875, 0.5372772216796875, 0.5677490234375, 0.5982208251953125, 0.628692626953125, 0.6591644287109375, 0.68963623046875, 0.7201080322265625, 0.750579833984375, 0.7810516357421875, 0.8115234375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 10.0, 17.0, 21.0, 43.0, 61.0, 93.0, 135.0, 357.0, 112.0, 59.0, 33.0, 20.0, 14.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.05677795410156, -35.95051193237305, -34.844242095947266, -33.73797607421875, -32.631710052490234, -31.525442123413086, -30.419174194335938, -29.312908172607422, -28.206640243530273, -27.100372314453125, -25.99410629272461, -24.88783836364746, -23.781570434570312, -22.675304412841797, -21.56903648376465, -20.4627685546875, -19.356502532958984, -18.250234603881836, -17.14396858215332, -16.037700653076172, -14.93143367767334, -13.825166702270508, -12.71889877319336, -11.612631797790527, -10.506364822387695, -9.400097846984863, -8.293830871582031, -7.187562942504883, -6.081295967102051, -4.975028991699219, -3.8687615394592285, -2.7624940872192383, -1.6562232971191406, -0.5499560832977295, 0.5563111305236816, 1.6625783443450928, 2.768845558166504, 3.875112533569336, 4.981379985809326, 6.087647438049316, 7.193914413452148, 8.30018138885498, 9.406448364257812, 10.512716293334961, 11.618983268737793, 12.725250244140625, 13.831518173217773, 14.937785148620605, 16.044052124023438, 17.150320053100586, 18.2565860748291, 19.36285400390625, 20.469120025634766, 21.575387954711914, 22.681655883789062, 23.787921905517578, 24.894189834594727, 26.000457763671875, 27.10672378540039, 28.21299171447754, 29.319259643554688, 30.425525665283203, 31.53179359436035, 32.6380615234375, 33.744327545166016]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 0.0, 7.0, 5.0, 15.0, 9.0, 22.0, 13.0, 14.0, 18.0, 18.0, 21.0, 27.0, 34.0, 38.0, 47.0, 49.0, 104.0, 155.0, 90.0, 47.0, 40.0, 37.0, 30.0, 16.0, 17.0, 23.0, 16.0, 18.0, 16.0, 13.0, 9.0, 10.0, 8.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.399587631225586, -30.562105178833008, -29.72462272644043, -28.88714027404785, -28.049659729003906, -27.212177276611328, -26.37469482421875, -25.537212371826172, -24.699729919433594, -23.862247467041016, -23.024765014648438, -22.18728256225586, -21.34980010986328, -20.512317657470703, -19.674837112426758, -18.83735466003418, -17.9998722076416, -17.162389755249023, -16.324907302856445, -15.487425804138184, -14.649943351745605, -13.812460899353027, -12.974979400634766, -12.137496948242188, -11.30001449584961, -10.462532043457031, -9.625049591064453, -8.787568092346191, -7.950085639953613, -7.112603187561035, -6.275121212005615, -5.437639236450195, -4.600154876708984, -3.7626726627349854, -2.9251904487609863, -2.0877082347869873, -1.2502260208129883, -0.41274356842041016, 0.42473840713500977, 1.2622203826904297, 2.099702835083008, 2.937185049057007, 3.774667263031006, 4.612149238586426, 5.449631690979004, 6.287114143371582, 7.124596118927002, 7.962078094482422, 8.799560546875, 9.637042999267578, 10.474525451660156, 11.312006950378418, 12.149489402770996, 12.986971855163574, 13.824453353881836, 14.661935806274414, 15.499418258666992, 16.33690071105957, 17.17438316345215, 18.011865615844727, 18.849346160888672, 19.68682861328125, 20.524311065673828, 21.361793518066406, 22.199275970458984]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 6.0, 7.0, 12.0, 14.0, 30.0, 46.0, 48.0, 76.0, 115.0, 175.0, 225.0, 392.0, 603.0, 1103.0, 1969.0, 3853.0, 8655.0, 23135.0, 75446.0, 315070.0, 1128095.0, 1699010.0, 687089.0, 174194.0, 45819.0, 16006.0, 6277.0, 2986.0, 1502.0, 839.0, 541.0, 330.0, 193.0, 135.0, 84.0, 73.0, 45.0, 30.0, 17.0, 8.0, 8.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.759765625, -2.6837158203125, -2.607666015625, -2.5316162109375, -2.45556640625, -2.3795166015625, -2.303466796875, -2.2274169921875, -2.1513671875, -2.0753173828125, -1.999267578125, -1.9232177734375, -1.84716796875, -1.7711181640625, -1.695068359375, -1.6190185546875, -1.54296875, -1.4669189453125, -1.390869140625, -1.3148193359375, -1.23876953125, -1.1627197265625, -1.086669921875, -1.0106201171875, -0.9345703125, -0.8585205078125, -0.782470703125, -0.7064208984375, -0.63037109375, -0.5543212890625, -0.478271484375, -0.4022216796875, -0.326171875, -0.2501220703125, -0.174072265625, -0.0980224609375, -0.02197265625, 0.0540771484375, 0.130126953125, 0.2061767578125, 0.2822265625, 0.3582763671875, 0.434326171875, 0.5103759765625, 0.58642578125, 0.6624755859375, 0.738525390625, 0.8145751953125, 0.890625, 0.9666748046875, 1.042724609375, 1.1187744140625, 1.19482421875, 1.2708740234375, 1.346923828125, 1.4229736328125, 1.4990234375, 1.5750732421875, 1.651123046875, 1.7271728515625, 1.80322265625, 1.8792724609375, 1.955322265625, 2.0313720703125, 2.107421875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 4.0, 5.0, 5.0, 8.0, 6.0, 16.0, 12.0, 10.0, 14.0, 24.0, 24.0, 30.0, 29.0, 34.0, 38.0, 43.0, 29.0, 47.0, 40.0, 35.0, 39.0, 41.0, 50.0, 50.0, 51.0, 35.0, 43.0, 37.0, 36.0, 31.0, 22.0, 27.0, 19.0, 11.0, 9.0, 12.0, 6.0, 14.0, 6.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.013671875, -1.96014404296875, -1.9066162109375, -1.85308837890625, -1.799560546875, -1.74603271484375, -1.6925048828125, -1.63897705078125, -1.58544921875, -1.53192138671875, -1.4783935546875, -1.42486572265625, -1.371337890625, -1.31781005859375, -1.2642822265625, -1.21075439453125, -1.1572265625, -1.10369873046875, -1.0501708984375, -0.99664306640625, -0.943115234375, -0.88958740234375, -0.8360595703125, -0.78253173828125, -0.72900390625, -0.67547607421875, -0.6219482421875, -0.56842041015625, -0.514892578125, -0.46136474609375, -0.4078369140625, -0.35430908203125, -0.30078125, -0.24725341796875, -0.1937255859375, -0.14019775390625, -0.086669921875, -0.03314208984375, 0.0203857421875, 0.07391357421875, 0.12744140625, 0.18096923828125, 0.2344970703125, 0.28802490234375, 0.341552734375, 0.39508056640625, 0.4486083984375, 0.50213623046875, 0.5556640625, 0.60919189453125, 0.6627197265625, 0.71624755859375, 0.769775390625, 0.82330322265625, 0.8768310546875, 0.93035888671875, 0.98388671875, 1.03741455078125, 1.0909423828125, 1.14447021484375, 1.197998046875, 1.25152587890625, 1.3050537109375, 1.35858154296875, 1.412109375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 2.0, 4.0, 4.0, 7.0, 12.0, 18.0, 21.0, 34.0, 40.0, 50.0, 91.0, 133.0, 177.0, 242.0, 444.0, 829.0, 1640.0, 4293.0, 17300.0, 230405.0, 3773990.0, 144426.0, 13413.0, 3486.0, 1365.0, 705.0, 384.0, 237.0, 170.0, 92.0, 82.0, 58.0, 31.0, 26.0, 17.0, 12.0, 14.0, 7.0, 6.0, 2.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.65234375, -7.40093994140625, -7.1495361328125, -6.89813232421875, -6.646728515625, -6.39532470703125, -6.1439208984375, -5.89251708984375, -5.64111328125, -5.38970947265625, -5.1383056640625, -4.88690185546875, -4.635498046875, -4.38409423828125, -4.1326904296875, -3.88128662109375, -3.6298828125, -3.37847900390625, -3.1270751953125, -2.87567138671875, -2.624267578125, -2.37286376953125, -2.1214599609375, -1.87005615234375, -1.61865234375, -1.36724853515625, -1.1158447265625, -0.86444091796875, -0.613037109375, -0.36163330078125, -0.1102294921875, 0.14117431640625, 0.392578125, 0.64398193359375, 0.8953857421875, 1.14678955078125, 1.398193359375, 1.64959716796875, 1.9010009765625, 2.15240478515625, 2.40380859375, 2.65521240234375, 2.9066162109375, 3.15802001953125, 3.409423828125, 3.66082763671875, 3.9122314453125, 4.16363525390625, 4.4150390625, 4.66644287109375, 4.9178466796875, 5.16925048828125, 5.420654296875, 5.67205810546875, 5.9234619140625, 6.17486572265625, 6.42626953125, 6.67767333984375, 6.9290771484375, 7.18048095703125, 7.431884765625, 7.68328857421875, 7.9346923828125, 8.18609619140625, 8.4375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 4.0, 3.0, 3.0, 6.0, 7.0, 16.0, 22.0, 17.0, 26.0, 40.0, 41.0, 67.0, 99.0, 102.0, 157.0, 206.0, 293.0, 389.0, 481.0, 507.0, 445.0, 318.0, 211.0, 158.0, 122.0, 89.0, 50.0, 45.0, 32.0, 35.0, 21.0, 19.0, 8.0, 6.0, 10.0, 8.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.47265625, -6.30792236328125, -6.1431884765625, -5.97845458984375, -5.813720703125, -5.64898681640625, -5.4842529296875, -5.31951904296875, -5.15478515625, -4.99005126953125, -4.8253173828125, -4.66058349609375, -4.495849609375, -4.33111572265625, -4.1663818359375, -4.00164794921875, -3.8369140625, -3.67218017578125, -3.5074462890625, -3.34271240234375, -3.177978515625, -3.01324462890625, -2.8485107421875, -2.68377685546875, -2.51904296875, -2.35430908203125, -2.1895751953125, -2.02484130859375, -1.860107421875, -1.69537353515625, -1.5306396484375, -1.36590576171875, -1.201171875, -1.03643798828125, -0.8717041015625, -0.70697021484375, -0.542236328125, -0.37750244140625, -0.2127685546875, -0.04803466796875, 0.11669921875, 0.28143310546875, 0.4461669921875, 0.61090087890625, 0.775634765625, 0.94036865234375, 1.1051025390625, 1.26983642578125, 1.4345703125, 1.59930419921875, 1.7640380859375, 1.92877197265625, 2.093505859375, 2.25823974609375, 2.4229736328125, 2.58770751953125, 2.75244140625, 2.91717529296875, 3.0819091796875, 3.24664306640625, 3.411376953125, 3.57611083984375, 3.7408447265625, 3.90557861328125, 4.0703125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 6.0, 7.0, 11.0, 29.0, 62.0, 153.0, 303.0, 267.0, 103.0, 28.0, 19.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-196.4784698486328, -192.5438995361328, -188.6093292236328, -184.67477416992188, -180.74020385742188, -176.80563354492188, -172.87106323242188, -168.93649291992188, -165.00192260742188, -161.06735229492188, -157.13278198242188, -153.19822692871094, -149.26365661621094, -145.32908630371094, -141.39451599121094, -137.45994567871094, -133.525390625, -129.5908203125, -125.65625762939453, -121.72168731689453, -117.78712463378906, -113.85255432128906, -109.91798400878906, -105.98341369628906, -102.0488510131836, -98.1142807006836, -94.17971801757812, -90.24514770507812, -86.31057739257812, -82.37601470947266, -78.44144439697266, -74.50688171386719, -70.57231903076172, -66.63774871826172, -62.70318603515625, -58.76861572265625, -54.834049224853516, -50.89948272705078, -46.96491241455078, -43.03034591674805, -39.09577941894531, -35.16121292114258, -31.22664451599121, -27.292076110839844, -23.35750961303711, -19.422943115234375, -15.488374710083008, -11.55380630493164, -7.619239807128906, -3.6846723556518555, 0.2498950958251953, 4.184462547302246, 8.119029998779297, 12.053596496582031, 15.988164901733398, 19.922733306884766, 23.8572998046875, 27.791866302490234, 31.7264347076416, 35.66100311279297, 39.5955696105957, 43.53013610839844, 47.46470642089844, 51.39927291870117, 55.333839416503906]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 2.0, 2.0, 7.0, 12.0, 10.0, 15.0, 23.0, 14.0, 24.0, 19.0, 37.0, 25.0, 38.0, 58.0, 53.0, 64.0, 61.0, 72.0, 55.0, 41.0, 47.0, 50.0, 26.0, 42.0, 30.0, 40.0, 31.0, 18.0, 15.0, 18.0, 6.0, 11.0, 9.0, 3.0, 4.0, 5.0, 2.0, 0.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-33.549720764160156, -32.41353988647461, -31.277359008789062, -30.141178131103516, -29.00499725341797, -27.868816375732422, -26.732637405395508, -25.59645652770996, -24.460275650024414, -23.324094772338867, -22.18791389465332, -21.051733016967773, -19.91555404663086, -18.779373168945312, -17.643192291259766, -16.50701141357422, -15.370830535888672, -14.234649658203125, -13.098468780517578, -11.962288856506348, -10.8261079788208, -9.689927101135254, -8.553747177124023, -7.417566299438477, -6.28138542175293, -5.145204544067383, -4.009024143218994, -2.8728435039520264, -1.7366628646850586, -0.6004819869995117, 0.535698413848877, 1.6718788146972656, 2.808063507080078, 3.944244146347046, 5.080424785614014, 6.216605186462402, 7.352786064147949, 8.488966941833496, 9.625146865844727, 10.761327743530273, 11.89750862121582, 13.033689498901367, 14.169870376586914, 15.306050300598145, 16.442230224609375, 17.578411102294922, 18.71459197998047, 19.850772857666016, 20.986953735351562, 22.12313461303711, 23.259315490722656, 24.395496368408203, 25.53167724609375, 26.667858123779297, 27.80403709411621, 28.940217971801758, 30.076398849487305, 31.21257972717285, 32.348758697509766, 33.48493957519531, 34.62112045288086, 35.757301330566406, 36.89348220825195, 38.0296630859375, 39.16584396362305]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 9.0, 15.0, 13.0, 22.0, 36.0, 57.0, 94.0, 154.0, 297.0, 596.0, 1276.0, 3082.0, 7819.0, 25236.0, 107579.0, 610304.0, 227626.0, 43888.0, 12467.0, 4382.0, 1804.0, 907.0, 390.0, 221.0, 108.0, 56.0, 49.0, 20.0, 22.0, 11.0, 4.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.646484375, -2.524566650390625, -2.40264892578125, -2.280731201171875, -2.1588134765625, -2.036895751953125, -1.91497802734375, -1.793060302734375, -1.671142578125, -1.549224853515625, -1.42730712890625, -1.305389404296875, -1.1834716796875, -1.061553955078125, -0.93963623046875, -0.817718505859375, -0.69580078125, -0.573883056640625, -0.45196533203125, -0.330047607421875, -0.2081298828125, -0.086212158203125, 0.03570556640625, 0.157623291015625, 0.279541015625, 0.401458740234375, 0.52337646484375, 0.645294189453125, 0.7672119140625, 0.889129638671875, 1.01104736328125, 1.132965087890625, 1.2548828125, 1.376800537109375, 1.49871826171875, 1.620635986328125, 1.7425537109375, 1.864471435546875, 1.98638916015625, 2.108306884765625, 2.230224609375, 2.352142333984375, 2.47406005859375, 2.595977783203125, 2.7178955078125, 2.839813232421875, 2.96173095703125, 3.083648681640625, 3.20556640625, 3.327484130859375, 3.44940185546875, 3.571319580078125, 3.6932373046875, 3.815155029296875, 3.93707275390625, 4.058990478515625, 4.180908203125, 4.302825927734375, 4.42474365234375, 4.546661376953125, 4.6685791015625, 4.790496826171875, 4.91241455078125, 5.034332275390625, 5.15625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 3.0, 4.0, 10.0, 10.0, 11.0, 15.0, 17.0, 24.0, 21.0, 25.0, 27.0, 43.0, 41.0, 53.0, 63.0, 60.0, 49.0, 57.0, 67.0, 49.0, 60.0, 50.0, 44.0, 36.0, 32.0, 37.0, 20.0, 9.0, 12.0, 16.0, 13.0, 9.0, 7.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9833984375, -1.9050750732421875, -1.826751708984375, -1.7484283447265625, -1.67010498046875, -1.5917816162109375, -1.513458251953125, -1.4351348876953125, -1.3568115234375, -1.2784881591796875, -1.200164794921875, -1.1218414306640625, -1.04351806640625, -0.9651947021484375, -0.886871337890625, -0.8085479736328125, -0.730224609375, -0.6519012451171875, -0.573577880859375, -0.4952545166015625, -0.41693115234375, -0.3386077880859375, -0.260284423828125, -0.1819610595703125, -0.1036376953125, -0.0253143310546875, 0.053009033203125, 0.1313323974609375, 0.20965576171875, 0.2879791259765625, 0.366302490234375, 0.4446258544921875, 0.52294921875, 0.6012725830078125, 0.679595947265625, 0.7579193115234375, 0.83624267578125, 0.9145660400390625, 0.992889404296875, 1.0712127685546875, 1.1495361328125, 1.2278594970703125, 1.306182861328125, 1.3845062255859375, 1.46282958984375, 1.5411529541015625, 1.619476318359375, 1.6977996826171875, 1.776123046875, 1.8544464111328125, 1.932769775390625, 2.0110931396484375, 2.08941650390625, 2.1677398681640625, 2.246063232421875, 2.3243865966796875, 2.4027099609375, 2.4810333251953125, 2.559356689453125, 2.6376800537109375, 2.71600341796875, 2.7943267822265625, 2.872650146484375, 2.9509735107421875, 3.029296875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 10.0, 6.0, 13.0, 25.0, 32.0, 48.0, 61.0, 93.0, 108.0, 225.0, 488.0, 1150.0, 4454.0, 41229.0, 931145.0, 61281.0, 5634.0, 1268.0, 522.0, 305.0, 165.0, 90.0, 68.0, 55.0, 35.0, 13.0, 16.0, 7.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6640625, -4.48162841796875, -4.2991943359375, -4.11676025390625, -3.934326171875, -3.75189208984375, -3.5694580078125, -3.38702392578125, -3.20458984375, -3.02215576171875, -2.8397216796875, -2.65728759765625, -2.474853515625, -2.29241943359375, -2.1099853515625, -1.92755126953125, -1.7451171875, -1.56268310546875, -1.3802490234375, -1.19781494140625, -1.015380859375, -0.83294677734375, -0.6505126953125, -0.46807861328125, -0.28564453125, -0.10321044921875, 0.0792236328125, 0.26165771484375, 0.444091796875, 0.62652587890625, 0.8089599609375, 0.99139404296875, 1.173828125, 1.35626220703125, 1.5386962890625, 1.72113037109375, 1.903564453125, 2.08599853515625, 2.2684326171875, 2.45086669921875, 2.63330078125, 2.81573486328125, 2.9981689453125, 3.18060302734375, 3.363037109375, 3.54547119140625, 3.7279052734375, 3.91033935546875, 4.0927734375, 4.27520751953125, 4.4576416015625, 4.64007568359375, 4.822509765625, 5.00494384765625, 5.1873779296875, 5.36981201171875, 5.55224609375, 5.73468017578125, 5.9171142578125, 6.09954833984375, 6.281982421875, 6.46441650390625, 6.6468505859375, 6.82928466796875, 7.01171875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 0.0, 4.0, 6.0, 9.0, 6.0, 5.0, 7.0, 4.0, 14.0, 8.0, 14.0, 14.0, 16.0, 23.0, 27.0, 28.0, 31.0, 41.0, 43.0, 59.0, 58.0, 52.0, 66.0, 68.0, 48.0, 50.0, 49.0, 32.0, 30.0, 21.0, 14.0, 23.0, 24.0, 11.0, 19.0, 17.0, 11.0, 9.0, 4.0, 6.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0], "bins": [-7.15234375, -6.935302734375, -6.71826171875, -6.501220703125, -6.2841796875, -6.067138671875, -5.85009765625, -5.633056640625, -5.416015625, -5.198974609375, -4.98193359375, -4.764892578125, -4.5478515625, -4.330810546875, -4.11376953125, -3.896728515625, -3.6796875, -3.462646484375, -3.24560546875, -3.028564453125, -2.8115234375, -2.594482421875, -2.37744140625, -2.160400390625, -1.943359375, -1.726318359375, -1.50927734375, -1.292236328125, -1.0751953125, -0.858154296875, -0.64111328125, -0.424072265625, -0.20703125, 0.010009765625, 0.22705078125, 0.444091796875, 0.6611328125, 0.878173828125, 1.09521484375, 1.312255859375, 1.529296875, 1.746337890625, 1.96337890625, 2.180419921875, 2.3974609375, 2.614501953125, 2.83154296875, 3.048583984375, 3.265625, 3.482666015625, 3.69970703125, 3.916748046875, 4.1337890625, 4.350830078125, 4.56787109375, 4.784912109375, 5.001953125, 5.218994140625, 5.43603515625, 5.653076171875, 5.8701171875, 6.087158203125, 6.30419921875, 6.521240234375, 6.73828125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 3.0, 5.0, 6.0, 12.0, 16.0, 20.0, 23.0, 37.0, 71.0, 126.0, 233.0, 530.0, 1544.0, 5241.0, 29151.0, 895084.0, 101309.0, 10829.0, 2623.0, 942.0, 330.0, 154.0, 88.0, 57.0, 36.0, 30.0, 15.0, 8.0, 4.0, 8.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0361328125, -1.004486083984375, -0.97283935546875, -0.941192626953125, -0.9095458984375, -0.877899169921875, -0.84625244140625, -0.814605712890625, -0.782958984375, -0.751312255859375, -0.71966552734375, -0.688018798828125, -0.6563720703125, -0.624725341796875, -0.59307861328125, -0.561431884765625, -0.52978515625, -0.498138427734375, -0.46649169921875, -0.434844970703125, -0.4031982421875, -0.371551513671875, -0.33990478515625, -0.308258056640625, -0.276611328125, -0.244964599609375, -0.21331787109375, -0.181671142578125, -0.1500244140625, -0.118377685546875, -0.08673095703125, -0.055084228515625, -0.0234375, 0.008209228515625, 0.03985595703125, 0.071502685546875, 0.1031494140625, 0.134796142578125, 0.16644287109375, 0.198089599609375, 0.229736328125, 0.261383056640625, 0.29302978515625, 0.324676513671875, 0.3563232421875, 0.387969970703125, 0.41961669921875, 0.451263427734375, 0.48291015625, 0.514556884765625, 0.54620361328125, 0.577850341796875, 0.6094970703125, 0.641143798828125, 0.67279052734375, 0.704437255859375, 0.736083984375, 0.767730712890625, 0.79937744140625, 0.831024169921875, 0.8626708984375, 0.894317626953125, 0.92596435546875, 0.957611083984375, 0.9892578125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 4.0, 8.0, 7.0, 5.0, 8.0, 12.0, 10.0, 17.0, 21.0, 43.0, 47.0, 93.0, 132.0, 156.0, 130.0, 96.0, 58.0, 38.0, 31.0, 24.0, 14.0, 9.0, 14.0, 10.0, 4.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00025844573974609375, -0.000250963494181633, -0.00024348124861717224, -0.0002359990030527115, -0.00022851675748825073, -0.00022103451192378998, -0.00021355226635932922, -0.00020607002079486847, -0.00019858777523040771, -0.00019110552966594696, -0.0001836232841014862, -0.00017614103853702545, -0.0001686587929725647, -0.00016117654740810394, -0.0001536943018436432, -0.00014621205627918243, -0.00013872981071472168, -0.00013124756515026093, -0.00012376531958580017, -0.00011628307402133942, -0.00010880082845687866, -0.00010131858289241791, -9.383633732795715e-05, -8.63540917634964e-05, -7.887184619903564e-05, -7.138960063457489e-05, -6.390735507011414e-05, -5.642510950565338e-05, -4.894286394119263e-05, -4.146061837673187e-05, -3.397837281227112e-05, -2.6496127247810364e-05, -1.901388168334961e-05, -1.1531636118888855e-05, -4.049390554428101e-06, 3.432855010032654e-06, 1.0915100574493408e-05, 1.8397346138954163e-05, 2.5879591703414917e-05, 3.336183726787567e-05, 4.0844082832336426e-05, 4.832632839679718e-05, 5.5808573961257935e-05, 6.329081952571869e-05, 7.077306509017944e-05, 7.82553106546402e-05, 8.573755621910095e-05, 9.32198017835617e-05, 0.00010070204734802246, 0.00010818429291248322, 0.00011566653847694397, 0.00012314878404140472, 0.00013063102960586548, 0.00013811327517032623, 0.000145595520734787, 0.00015307776629924774, 0.0001605600118637085, 0.00016804225742816925, 0.00017552450299263, 0.00018300674855709076, 0.00019048899412155151, 0.00019797123968601227, 0.00020545348525047302, 0.00021293573081493378, 0.00022041797637939453]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 6.0, 10.0, 19.0, 26.0, 36.0, 73.0, 101.0, 188.0, 335.0, 648.0, 1299.0, 3139.0, 8665.0, 29813.0, 194368.0, 745179.0, 44957.0, 12157.0, 4063.0, 1704.0, 799.0, 393.0, 233.0, 135.0, 72.0, 50.0, 34.0, 15.0, 10.0, 11.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.54345703125, -0.5241470336914062, -0.5048370361328125, -0.48552703857421875, -0.466217041015625, -0.44690704345703125, -0.4275970458984375, -0.40828704833984375, -0.38897705078125, -0.36966705322265625, -0.3503570556640625, -0.33104705810546875, -0.311737060546875, -0.29242706298828125, -0.2731170654296875, -0.25380706787109375, -0.2344970703125, -0.21518707275390625, -0.1958770751953125, -0.17656707763671875, -0.157257080078125, -0.13794708251953125, -0.1186370849609375, -0.09932708740234375, -0.08001708984375, -0.06070709228515625, -0.0413970947265625, -0.02208709716796875, -0.002777099609375, 0.01653289794921875, 0.0358428955078125, 0.05515289306640625, 0.074462890625, 0.09377288818359375, 0.1130828857421875, 0.13239288330078125, 0.151702880859375, 0.17101287841796875, 0.1903228759765625, 0.20963287353515625, 0.22894287109375, 0.24825286865234375, 0.2675628662109375, 0.28687286376953125, 0.306182861328125, 0.32549285888671875, 0.3448028564453125, 0.36411285400390625, 0.3834228515625, 0.40273284912109375, 0.4220428466796875, 0.44135284423828125, 0.460662841796875, 0.47997283935546875, 0.4992828369140625, 0.5185928344726562, 0.53790283203125, 0.5572128295898438, 0.5765228271484375, 0.5958328247070312, 0.615142822265625, 0.6344528198242188, 0.6537628173828125, 0.6730728149414062, 0.6923828125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 6.0, 2.0, 5.0, 8.0, 4.0, 3.0, 4.0, 10.0, 11.0, 5.0, 10.0, 14.0, 22.0, 29.0, 32.0, 57.0, 95.0, 110.0, 135.0, 136.0, 75.0, 63.0, 29.0, 29.0, 20.0, 16.0, 11.0, 11.0, 12.0, 11.0, 6.0, 9.0, 5.0, 1.0, 1.0, 5.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.87548828125, -0.8509063720703125, -0.826324462890625, -0.8017425537109375, -0.77716064453125, -0.7525787353515625, -0.727996826171875, -0.7034149169921875, -0.6788330078125, -0.6542510986328125, -0.629669189453125, -0.6050872802734375, -0.58050537109375, -0.5559234619140625, -0.531341552734375, -0.5067596435546875, -0.482177734375, -0.4575958251953125, -0.433013916015625, -0.4084320068359375, -0.38385009765625, -0.3592681884765625, -0.334686279296875, -0.3101043701171875, -0.2855224609375, -0.2609405517578125, -0.236358642578125, -0.2117767333984375, -0.18719482421875, -0.1626129150390625, -0.138031005859375, -0.1134490966796875, -0.0888671875, -0.0642852783203125, -0.039703369140625, -0.0151214599609375, 0.00946044921875, 0.0340423583984375, 0.058624267578125, 0.0832061767578125, 0.1077880859375, 0.1323699951171875, 0.156951904296875, 0.1815338134765625, 0.20611572265625, 0.2306976318359375, 0.255279541015625, 0.2798614501953125, 0.304443359375, 0.3290252685546875, 0.353607177734375, 0.3781890869140625, 0.40277099609375, 0.4273529052734375, 0.451934814453125, 0.4765167236328125, 0.5010986328125, 0.5256805419921875, 0.550262451171875, 0.5748443603515625, 0.59942626953125, 0.6240081787109375, 0.648590087890625, 0.6731719970703125, 0.69775390625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 9.0, 13.0, 86.0, 564.0, 250.0, 57.0, 19.0, 5.0, 6.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.64462661743164, -50.22813415527344, -47.81163787841797, -45.395145416259766, -42.9786491394043, -40.562156677246094, -38.145660400390625, -35.72916793823242, -33.31267547607422, -30.896181106567383, -28.479686737060547, -26.063194274902344, -23.646697998046875, -21.230205535888672, -18.813711166381836, -16.397216796875, -13.980720520019531, -11.564226150512695, -9.14773178100586, -6.73123836517334, -4.314743995666504, -1.898249626159668, 0.5182437896728516, 2.9347381591796875, 5.351232528686523, 7.767726898193359, 10.184221267700195, 12.600714683532715, 15.01720905303955, 17.433704376220703, 19.850196838378906, 22.266691207885742, 24.683181762695312, 27.09967613220215, 29.516170501708984, 31.932662963867188, 34.349159240722656, 36.76565170288086, 39.18214416503906, 41.59864044189453, 44.01513671875, 46.4316291809082, 48.84812545776367, 51.264617919921875, 53.681114196777344, 56.09760665893555, 58.51409912109375, 60.93059539794922, 63.34708786010742, 65.76358032226562, 68.1800765991211, 70.59657287597656, 73.0130615234375, 75.42955780029297, 77.84605407714844, 80.26254272460938, 82.67903900146484, 85.09553527832031, 87.51202392578125, 89.92852020263672, 92.34501647949219, 94.76151275634766, 97.1780014038086, 99.59449768066406, 102.01099395751953]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 8.0, 7.0, 12.0, 10.0, 10.0, 14.0, 21.0, 22.0, 23.0, 33.0, 45.0, 134.0, 146.0, 143.0, 134.0, 45.0, 29.0, 28.0, 33.0, 24.0, 18.0, 11.0, 15.0, 10.0, 14.0, 10.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.04194641113281, -36.11620330810547, -35.190460205078125, -34.26471710205078, -33.33897399902344, -32.413230895996094, -31.487489700317383, -30.56174659729004, -29.636005401611328, -28.710262298583984, -27.78451919555664, -26.858776092529297, -25.933034896850586, -25.007291793823242, -24.0815486907959, -23.155805587768555, -22.23006248474121, -21.304319381713867, -20.378576278686523, -19.452835083007812, -18.52709197998047, -17.601348876953125, -16.67560577392578, -15.749862670898438, -14.82412052154541, -13.898377418518066, -12.972635269165039, -12.046892166137695, -11.121149063110352, -10.195406913757324, -9.26966381072998, -8.343921661376953, -7.418178558349609, -6.492435932159424, -5.566693305969238, -4.6409502029418945, -3.715207576751709, -2.7894649505615234, -1.8637218475341797, -0.9379792213439941, -0.012236595153808594, 0.9135061502456665, 1.8392488956451416, 2.7649917602539062, 3.690734386444092, 4.616477012634277, 5.542220115661621, 6.467962741851807, 7.393705368041992, 8.319448471069336, 9.245190620422363, 10.170933723449707, 11.096675872802734, 12.022418975830078, 12.948162078857422, 13.873905181884766, 14.799647331237793, 15.725390434265137, 16.651132583618164, 17.576875686645508, 18.50261878967285, 19.428359985351562, 20.354103088378906, 21.27984619140625, 22.205589294433594]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 6.0, 5.0, 1.0, 6.0, 2.0, 7.0, 13.0, 12.0, 11.0, 14.0, 24.0, 11.0, 19.0, 25.0, 26.0, 25.0, 27.0, 35.0, 78.0, 239.0, 91.0, 48.0, 32.0, 31.0, 27.0, 30.0, 17.0, 20.0, 17.0, 10.0, 18.0, 9.0, 12.0, 15.0, 5.0, 12.0, 4.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.90234375, -1.845428466796875, -1.78851318359375, -1.731597900390625, -1.6746826171875, -1.617767333984375, -1.56085205078125, -1.503936767578125, -1.447021484375, -1.390106201171875, -1.33319091796875, -1.276275634765625, -1.2193603515625, -1.162445068359375, -1.10552978515625, -1.048614501953125, -0.99169921875, -0.934783935546875, -0.87786865234375, -0.820953369140625, -0.7640380859375, -0.707122802734375, -0.65020751953125, -0.593292236328125, -0.536376953125, -0.479461669921875, -0.42254638671875, -0.365631103515625, -0.3087158203125, -0.251800537109375, -0.19488525390625, -0.137969970703125, -0.0810546875, -0.024139404296875, 0.03277587890625, 0.089691162109375, 0.1466064453125, 0.203521728515625, 0.26043701171875, 0.317352294921875, 0.374267578125, 0.431182861328125, 0.48809814453125, 0.545013427734375, 0.6019287109375, 0.658843994140625, 0.71575927734375, 0.772674560546875, 0.82958984375, 0.886505126953125, 0.94342041015625, 1.000335693359375, 1.0572509765625, 1.114166259765625, 1.17108154296875, 1.227996826171875, 1.284912109375, 1.341827392578125, 1.39874267578125, 1.455657958984375, 1.5125732421875, 1.569488525390625, 1.62640380859375, 1.683319091796875, 1.740234375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 10.0, 12.0, 7.0, 6.0, 18.0, 22.0, 24.0, 45.0, 58.0, 77.0, 126.0, 272.0, 473.0, 1002.0, 2778.0, 9652.0, 8064118.0, 297660.0, 7868.0, 2416.0, 956.0, 375.0, 215.0, 130.0, 73.0, 49.0, 31.0, 24.0, 16.0, 9.0, 16.0, 6.0, 8.0, 4.0, 6.0, 2.0, 3.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-18.889272689819336, -18.33279037475586, -17.776309967041016, -17.21982765197754, -16.663345336914062, -16.10686492919922, -15.550382614135742, -14.993901252746582, -14.437419891357422, -13.880938529968262, -13.324457168579102, -12.767974853515625, -12.211493492126465, -11.655012130737305, -11.098529815673828, -10.542048454284668, -9.985567092895508, -9.429085731506348, -8.872604370117188, -8.316122055053711, -7.759640693664551, -7.203159332275391, -6.646677494049072, -6.090195655822754, -5.533714294433594, -4.977232933044434, -4.420751094818115, -3.864269495010376, -3.3077878952026367, -2.7513062953948975, -2.194824695587158, -1.638343095779419, -1.0818634033203125, -0.5253818035125732, 0.031099796295166016, 0.5875813961029053, 1.1440629959106445, 1.7005445957183838, 2.257026195526123, 2.8135077953338623, 3.3699893951416016, 3.926470994949341, 4.48295259475708, 5.039434432983398, 5.595915794372559, 6.152397155761719, 6.708878993988037, 7.2653608322143555, 7.821842193603516, 8.378323554992676, 8.934804916381836, 9.491287231445312, 10.047768592834473, 10.604249954223633, 11.16073226928711, 11.71721363067627, 12.27369499206543, 12.83017635345459, 13.38665771484375, 13.943140029907227, 14.499621391296387, 15.056102752685547, 15.612585067749023, 16.169065475463867, 16.725547790527344]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 6.0, 2.0, 3.0, 2.0, 7.0, 5.0, 5.0, 3.0, 6.0, 4.0, 4.0, 1.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.659130096435547, -24.68804931640625, -23.716968536376953, -22.745887756347656, -21.77480697631836, -20.803726196289062, -19.832643508911133, -18.861562728881836, -17.89048194885254, -16.919401168823242, -15.948320388793945, -14.977238655090332, -14.006157875061035, -13.035077095031738, -12.063995361328125, -11.092914581298828, -10.121833801269531, -9.150753021240234, -8.179672241210938, -7.208590507507324, -6.237509727478027, -5.2664289474487305, -4.295347690582275, -3.3242664337158203, -2.3531856536865234, -1.3821046352386475, -0.4110236167907715, 0.5600574016571045, 1.5311384201049805, 2.5022192001342773, 3.4733004570007324, 4.4443817138671875, 5.415462493896484, 6.386543273925781, 7.357624530792236, 8.328705787658691, 9.299786567687988, 10.270867347717285, 11.241949081420898, 12.213029861450195, 13.184110641479492, 14.155191421508789, 15.126272201538086, 16.097352981567383, 17.068435668945312, 18.03951644897461, 19.010597229003906, 19.981678009033203, 20.9527587890625, 21.923839569091797, 22.894920349121094, 23.86600112915039, 24.837081909179688, 25.808162689208984, 26.779245376586914, 27.75032615661621, 28.721406936645508, 29.692487716674805, 30.6635684967041, 31.6346492767334, 32.60573196411133, 33.576812744140625, 34.54789352416992, 35.51897430419922, 36.490055084228516]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 4.0, 5.0, 9.0, 9.0, 7.0, 16.0, 30.0, 40.0, 48.0, 63.0, 89.0, 149.0, 262.0, 574.0, 1293.0, 3606.0, 11143.0, 36760.0, 123499.0, 219263.0, 88731.0, 25687.0, 8114.0, 2705.0, 1021.0, 449.0, 228.0, 140.0, 89.0, 59.0, 49.0, 25.0, 33.0, 16.0, 15.0, 7.0, 5.0, 8.0, 4.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.3125, -20.673828125, -20.03515625, -19.396484375, -18.7578125, -18.119140625, -17.48046875, -16.841796875, -16.203125, -15.564453125, -14.92578125, -14.287109375, -13.6484375, -13.009765625, -12.37109375, -11.732421875, -11.09375, -10.455078125, -9.81640625, -9.177734375, -8.5390625, -7.900390625, -7.26171875, -6.623046875, -5.984375, -5.345703125, -4.70703125, -4.068359375, -3.4296875, -2.791015625, -2.15234375, -1.513671875, -0.875, -0.236328125, 0.40234375, 1.041015625, 1.6796875, 2.318359375, 2.95703125, 3.595703125, 4.234375, 4.873046875, 5.51171875, 6.150390625, 6.7890625, 7.427734375, 8.06640625, 8.705078125, 9.34375, 9.982421875, 10.62109375, 11.259765625, 11.8984375, 12.537109375, 13.17578125, 13.814453125, 14.453125, 15.091796875, 15.73046875, 16.369140625, 17.0078125, 17.646484375, 18.28515625, 18.923828125, 19.5625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 10.0, 2.0, 7.0, 9.0, 20.0, 15.0, 26.0, 39.0, 47.0, 39.0, 80.0, 89.0, 102.0, 81.0, 86.0, 85.0, 67.0, 61.0, 38.0, 32.0, 24.0, 17.0, 11.0, 8.0, 6.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.24609375, -3.13677978515625, -3.0274658203125, -2.91815185546875, -2.808837890625, -2.69952392578125, -2.5902099609375, -2.48089599609375, -2.37158203125, -2.26226806640625, -2.1529541015625, -2.04364013671875, -1.934326171875, -1.82501220703125, -1.7156982421875, -1.60638427734375, -1.4970703125, -1.38775634765625, -1.2784423828125, -1.16912841796875, -1.059814453125, -0.95050048828125, -0.8411865234375, -0.73187255859375, -0.62255859375, -0.51324462890625, -0.4039306640625, -0.29461669921875, -0.185302734375, -0.07598876953125, 0.0333251953125, 0.14263916015625, 0.251953125, 0.36126708984375, 0.4705810546875, 0.57989501953125, 0.689208984375, 0.79852294921875, 0.9078369140625, 1.01715087890625, 1.12646484375, 1.23577880859375, 1.3450927734375, 1.45440673828125, 1.563720703125, 1.67303466796875, 1.7823486328125, 1.89166259765625, 2.0009765625, 2.11029052734375, 2.2196044921875, 2.32891845703125, 2.438232421875, 2.54754638671875, 2.6568603515625, 2.76617431640625, 2.87548828125, 2.98480224609375, 3.0941162109375, 3.20343017578125, 3.312744140625, 3.42205810546875, 3.5313720703125, 3.64068603515625, 3.75]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 5.0, 4.0, 7.0, 11.0, 13.0, 17.0, 24.0, 41.0, 63.0, 79.0, 64.0, 54.0, 23.0, 16.0, 15.0, 9.0, 9.0, 8.0, 3.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.71794319152832, -19.17167854309082, -18.625411987304688, -18.079147338867188, -17.532880783081055, -16.986616134643555, -16.440349578857422, -15.894084930419922, -15.347819328308105, -14.801553726196289, -14.255288124084473, -13.709022521972656, -13.162757873535156, -12.616491317749023, -12.070226669311523, -11.523961067199707, -10.97769546508789, -10.431429862976074, -9.885164260864258, -9.338898658752441, -8.792633056640625, -8.246368408203125, -7.700102806091309, -7.153837203979492, -6.607571601867676, -6.061305999755859, -5.515040397644043, -4.968775272369385, -4.422509670257568, -3.876244068145752, -3.3299787044525146, -2.7837133407592773, -2.237445831298828, -1.6911803483963013, -1.1449148654937744, -0.5986493825912476, -0.0523838996887207, 0.4938817024230957, 1.040147066116333, 1.5864124298095703, 2.1326780319213867, 2.678943634033203, 3.2252089977264404, 3.7714743614196777, 4.317739963531494, 4.8640055656433105, 5.410270690917969, 5.956536293029785, 6.502801895141602, 7.049067497253418, 7.595333099365234, 8.14159870147705, 8.687864303588867, 9.234128952026367, 9.780394554138184, 10.32666015625, 10.872925758361816, 11.419191360473633, 11.96545696258545, 12.511722564697266, 13.057987213134766, 13.604253768920898, 14.150518417358398, 14.696784019470215, 15.243049621582031]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 0.0, 1.0, 7.0, 3.0, 5.0, 1.0, 5.0, 13.0, 24.0, 39.0, 80.0, 107.0, 66.0, 44.0, 28.0, 11.0, 8.0, 9.0, 3.0, 7.0, 5.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.374192237854004, -9.951359748840332, -9.52852725982666, -9.105693817138672, -8.682861328125, -8.260028839111328, -7.837196350097656, -7.414363861083984, -6.991530895233154, -6.568698406219482, -6.145865440368652, -5.7230329513549805, -5.300200462341309, -4.8773674964904785, -4.454535007476807, -4.031702041625977, -3.6088695526123047, -3.1860368251800537, -2.7632040977478027, -2.340371608734131, -1.9175388813018799, -1.494706153869629, -1.071873664855957, -0.649040937423706, -0.22620820999145508, 0.19662445783615112, 0.6194571256637573, 1.0422897338867188, 1.4651224613189697, 1.8879551887512207, 2.3107876777648926, 2.7336204051971436, 3.156454086303711, 3.579286813735962, 4.002119541168213, 4.424952030181885, 4.847784996032715, 5.270617485046387, 5.693449974060059, 6.1162824630737305, 6.5391154289245605, 6.961947917938232, 7.3847808837890625, 7.807613372802734, 8.230445861816406, 8.653278350830078, 9.07611083984375, 9.498944282531738, 9.92177677154541, 10.344609260559082, 10.767441749572754, 11.190275192260742, 11.613107681274414, 12.035940170288086, 12.458772659301758, 12.88160514831543, 13.304437637329102, 13.727270126342773, 14.150102615356445, 14.572935104370117, 14.995768547058105, 15.418601036071777, 15.84143352508545, 16.264266967773438, 16.68709945678711]}, "eval/loss": 4.626309871673584, "eval/wer": 0.8567830226100753, "eval/runtime": 668.3691, "eval/samples_per_second": 3.953, "eval/steps_per_second": 0.495} \ No newline at end of file +{"train/loss": 0.0634, "train/learning_rate": 1.0688836104513066e-08, "train/epoch": 20.0, "train/global_step": 17840, "_runtime": 105886, "_timestamp": 1647053125, "_step": 17851, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 9.0, 6.0, 17.0, 13.0, 19.0, 24.0, 12.0, 29.0, 25.0, 35.0, 32.0, 28.0, 40.0, 45.0, 50.0, 61.0, 41.0, 50.0, 47.0, 51.0, 44.0, 38.0, 39.0, 39.0, 29.0, 34.0, 31.0, 23.0, 17.0, 13.0, 12.0, 13.0, 8.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-129.83238220214844, -127.52375030517578, -125.2151107788086, -122.90647888183594, -120.59784698486328, -118.2892074584961, -115.98057556152344, -113.67193603515625, -111.3633041381836, -109.05467224121094, -106.74603271484375, -104.4374008178711, -102.12876892089844, -99.82012939453125, -97.5114974975586, -95.20286560058594, -92.89422607421875, -90.5855941772461, -88.2769546508789, -85.96832275390625, -83.6596908569336, -81.3510513305664, -79.04241943359375, -76.73377990722656, -74.42515563964844, -72.11652374267578, -69.8078842163086, -67.49925231933594, -65.19062042236328, -62.881980895996094, -60.57334899902344, -58.264713287353516, -55.956077575683594, -53.64744186401367, -51.338809967041016, -49.030174255371094, -46.72153854370117, -44.41290283203125, -42.104270935058594, -39.79563522338867, -37.48699951171875, -35.17836380004883, -32.86973190307617, -30.56109619140625, -28.252460479736328, -25.94382667541504, -23.63519287109375, -21.326557159423828, -19.017925262451172, -16.709291458129883, -14.400655746459961, -12.092021942138672, -9.783387184143066, -7.474752426147461, -5.166118621826172, -2.85748291015625, -0.5488491058349609, 1.7597854137420654, 4.068419933319092, 6.377054214477539, 8.685688972473145, 10.99432373046875, 13.302957534790039, 15.611593246459961, 17.92022705078125]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 2.0, 8.0, 4.0, 12.0, 10.0, 21.0, 14.0, 20.0, 29.0, 20.0, 35.0, 36.0, 28.0, 38.0, 36.0, 28.0, 41.0, 58.0, 47.0, 52.0, 44.0, 39.0, 36.0, 32.0, 40.0, 32.0, 29.0, 27.0, 24.0, 12.0, 17.0, 23.0, 22.0, 18.0, 12.0, 10.0, 8.0, 11.0, 9.0, 5.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.229087829589844, -57.20296859741211, -55.176849365234375, -53.150733947753906, -51.12461471557617, -49.09849548339844, -47.07238006591797, -45.046260833740234, -43.0201416015625, -40.994022369384766, -38.96790313720703, -36.94178771972656, -34.91566848754883, -32.889549255371094, -30.863431930541992, -28.83731460571289, -26.811195373535156, -24.785076141357422, -22.75895881652832, -20.73284149169922, -18.706722259521484, -16.68060302734375, -14.654485702514648, -12.62836742401123, -10.602249145507812, -8.576130867004395, -6.550012588500977, -4.523894309997559, -2.4977760314941406, -0.47165775299072266, 1.5544605255126953, 3.5805788040161133, 5.6067047119140625, 7.6328229904174805, 9.658941268920898, 11.685059547424316, 13.711177825927734, 15.737296104431152, 17.76341438293457, 19.789531707763672, 21.815650939941406, 23.84177017211914, 25.867887496948242, 27.894004821777344, 29.920124053955078, 31.946243286132812, 33.97235870361328, 35.998477935791016, 38.02459716796875, 40.050716400146484, 42.07683563232422, 44.10295104980469, 46.12907028198242, 48.155189514160156, 50.181304931640625, 52.20742416381836, 54.233543395996094, 56.25966262817383, 58.28578186035156, 60.31189727783203, 62.338016510009766, 64.3641357421875, 66.39025115966797, 68.41637420654297, 70.44248962402344]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 9.0, 17.0, 21.0, 22.0, 30.0, 67.0, 99.0, 177.0, 310.0, 528.0, 893.0, 1462.0, 2460.0, 4383.0, 7166.0, 12011.0, 20601.0, 34550.0, 58049.0, 94819.0, 152761.0, 235287.0, 342712.0, 460193.0, 547886.0, 566160.0, 503519.0, 392170.0, 277748.0, 183003.0, 116680.0, 70553.0, 43671.0, 25867.0, 15389.0, 9362.0, 5509.0, 3249.0, 1898.0, 1177.0, 694.0, 441.0, 258.0, 169.0, 97.0, 64.0, 35.0, 23.0, 9.0, 8.0, 6.0, 3.0, 1.0, 3.0, 1.0, 4.0], "bins": [-102.6875, -99.595703125, -96.50390625, -93.412109375, -90.3203125, -87.228515625, -84.13671875, -81.044921875, -77.953125, -74.861328125, -71.76953125, -68.677734375, -65.5859375, -62.494140625, -59.40234375, -56.310546875, -53.21875, -50.126953125, -47.03515625, -43.943359375, -40.8515625, -37.759765625, -34.66796875, -31.576171875, -28.484375, -25.392578125, -22.30078125, -19.208984375, -16.1171875, -13.025390625, -9.93359375, -6.841796875, -3.75, -0.658203125, 2.43359375, 5.525390625, 8.6171875, 11.708984375, 14.80078125, 17.892578125, 20.984375, 24.076171875, 27.16796875, 30.259765625, 33.3515625, 36.443359375, 39.53515625, 42.626953125, 45.71875, 48.810546875, 51.90234375, 54.994140625, 58.0859375, 61.177734375, 64.26953125, 67.361328125, 70.453125, 73.544921875, 76.63671875, 79.728515625, 82.8203125, 85.912109375, 89.00390625, 92.095703125, 95.1875]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 5.0, 2.0, 3.0, 17.0, 12.0, 16.0, 17.0, 29.0, 18.0, 29.0, 39.0, 38.0, 41.0, 39.0, 38.0, 45.0, 46.0, 50.0, 43.0, 35.0, 52.0, 43.0, 43.0, 31.0, 30.0, 34.0, 25.0, 34.0, 23.0, 25.0, 12.0, 18.0, 11.0, 9.0, 11.0, 9.0, 8.0, 6.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.6875, -72.3857421875, -70.083984375, -67.7822265625, -65.48046875, -63.1787109375, -60.876953125, -58.5751953125, -56.2734375, -53.9716796875, -51.669921875, -49.3681640625, -47.06640625, -44.7646484375, -42.462890625, -40.1611328125, -37.859375, -35.5576171875, -33.255859375, -30.9541015625, -28.65234375, -26.3505859375, -24.048828125, -21.7470703125, -19.4453125, -17.1435546875, -14.841796875, -12.5400390625, -10.23828125, -7.9365234375, -5.634765625, -3.3330078125, -1.03125, 1.2705078125, 3.572265625, 5.8740234375, 8.17578125, 10.4775390625, 12.779296875, 15.0810546875, 17.3828125, 19.6845703125, 21.986328125, 24.2880859375, 26.58984375, 28.8916015625, 31.193359375, 33.4951171875, 35.796875, 38.0986328125, 40.400390625, 42.7021484375, 45.00390625, 47.3056640625, 49.607421875, 51.9091796875, 54.2109375, 56.5126953125, 58.814453125, 61.1162109375, 63.41796875, 65.7197265625, 68.021484375, 70.3232421875, 72.625]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 15.0, 21.0, 37.0, 61.0, 115.0, 190.0, 364.0, 601.0, 1021.0, 1712.0, 3182.0, 5573.0, 9674.0, 16836.0, 28094.0, 45228.0, 72481.0, 111979.0, 165923.0, 236504.0, 313165.0, 388419.0, 447140.0, 470743.0, 449780.0, 392738.0, 318418.0, 239093.0, 169178.0, 114731.0, 74827.0, 46929.0, 28909.0, 16938.0, 10119.0, 5735.0, 3488.0, 1819.0, 1130.0, 615.0, 328.0, 178.0, 117.0, 53.0, 42.0, 21.0, 9.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-81.5625, -79.1298828125, -76.697265625, -74.2646484375, -71.83203125, -69.3994140625, -66.966796875, -64.5341796875, -62.1015625, -59.6689453125, -57.236328125, -54.8037109375, -52.37109375, -49.9384765625, -47.505859375, -45.0732421875, -42.640625, -40.2080078125, -37.775390625, -35.3427734375, -32.91015625, -30.4775390625, -28.044921875, -25.6123046875, -23.1796875, -20.7470703125, -18.314453125, -15.8818359375, -13.44921875, -11.0166015625, -8.583984375, -6.1513671875, -3.71875, -1.2861328125, 1.146484375, 3.5791015625, 6.01171875, 8.4443359375, 10.876953125, 13.3095703125, 15.7421875, 18.1748046875, 20.607421875, 23.0400390625, 25.47265625, 27.9052734375, 30.337890625, 32.7705078125, 35.203125, 37.6357421875, 40.068359375, 42.5009765625, 44.93359375, 47.3662109375, 49.798828125, 52.2314453125, 54.6640625, 57.0966796875, 59.529296875, 61.9619140625, 64.39453125, 66.8271484375, 69.259765625, 71.6923828125, 74.125]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 6.0, 6.0, 3.0, 7.0, 8.0, 14.0, 12.0, 22.0, 25.0, 25.0, 39.0, 65.0, 72.0, 68.0, 102.0, 118.0, 108.0, 131.0, 163.0, 157.0, 173.0, 188.0, 192.0, 187.0, 219.0, 212.0, 187.0, 220.0, 184.0, 154.0, 145.0, 146.0, 134.0, 101.0, 96.0, 78.0, 65.0, 49.0, 40.0, 42.0, 27.0, 19.0, 18.0, 17.0, 8.0, 8.0, 7.0, 6.0, 4.0, 5.0, 1.0, 2.0, 3.0], "bins": [-40.9375, -39.77734375, -38.6171875, -37.45703125, -36.296875, -35.13671875, -33.9765625, -32.81640625, -31.65625, -30.49609375, -29.3359375, -28.17578125, -27.015625, -25.85546875, -24.6953125, -23.53515625, -22.375, -21.21484375, -20.0546875, -18.89453125, -17.734375, -16.57421875, -15.4140625, -14.25390625, -13.09375, -11.93359375, -10.7734375, -9.61328125, -8.453125, -7.29296875, -6.1328125, -4.97265625, -3.8125, -2.65234375, -1.4921875, -0.33203125, 0.828125, 1.98828125, 3.1484375, 4.30859375, 5.46875, 6.62890625, 7.7890625, 8.94921875, 10.109375, 11.26953125, 12.4296875, 13.58984375, 14.75, 15.91015625, 17.0703125, 18.23046875, 19.390625, 20.55078125, 21.7109375, 22.87109375, 24.03125, 25.19140625, 26.3515625, 27.51171875, 28.671875, 29.83203125, 30.9921875, 32.15234375, 33.3125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 8.0, 7.0, 9.0, 7.0, 8.0, 14.0, 14.0, 23.0, 21.0, 13.0, 31.0, 29.0, 19.0, 32.0, 27.0, 27.0, 30.0, 43.0, 34.0, 38.0, 40.0, 42.0, 39.0, 50.0, 39.0, 48.0, 40.0, 40.0, 31.0, 28.0, 18.0, 32.0, 22.0, 17.0, 12.0, 15.0, 13.0, 10.0, 7.0, 5.0, 1.0, 7.0, 3.0, 5.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0], "bins": [-88.5003433227539, -85.922119140625, -83.34390258789062, -80.76567840576172, -78.18746185302734, -75.60923767089844, -73.03102111816406, -70.45279693603516, -67.87457275390625, -65.29634857177734, -62.71813201904297, -60.13991165161133, -57.56169128417969, -54.98346710205078, -52.40524673461914, -49.8270263671875, -47.248809814453125, -44.670589447021484, -42.092369079589844, -39.5141487121582, -36.93592834472656, -34.357704162597656, -31.779483795166016, -29.201263427734375, -26.623043060302734, -24.044822692871094, -21.466602325439453, -18.88838005065918, -16.31015968322754, -13.731939315795898, -11.153717994689941, -8.575496673583984, -5.997276306152344, -3.419055461883545, -0.8408346176147461, 1.7373862266540527, 4.315607070922852, 6.893827438354492, 9.47204875946045, 12.050270080566406, 14.628490447998047, 17.206710815429688, 19.784931182861328, 22.3631534576416, 24.941373825073242, 27.519594192504883, 30.097816467285156, 32.6760368347168, 35.25425720214844, 37.83247756958008, 40.41069793701172, 42.98891830444336, 45.567138671875, 48.145362854003906, 50.72358322143555, 53.30180358886719, 55.88002395629883, 58.45824432373047, 61.03646469116211, 63.61468505859375, 66.19290924072266, 68.77112579345703, 71.34934997558594, 73.92756652832031, 76.50579071044922]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 5.0, 4.0, 7.0, 11.0, 9.0, 13.0, 15.0, 21.0, 17.0, 26.0, 26.0, 36.0, 38.0, 29.0, 34.0, 31.0, 41.0, 46.0, 38.0, 42.0, 56.0, 41.0, 33.0, 39.0, 35.0, 42.0, 33.0, 30.0, 32.0, 22.0, 25.0, 22.0, 17.0, 18.0, 14.0, 6.0, 10.0, 11.0, 6.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-90.4842529296875, -87.76840209960938, -85.05255126953125, -82.33670043945312, -79.620849609375, -76.90499877929688, -74.18914794921875, -71.47329711914062, -68.7574462890625, -66.04159545898438, -63.32574462890625, -60.609893798828125, -57.89404296875, -55.178192138671875, -52.46234130859375, -49.746490478515625, -47.0306396484375, -44.314788818359375, -41.59893798828125, -38.883087158203125, -36.167236328125, -33.451385498046875, -30.73553466796875, -28.019683837890625, -25.3038330078125, -22.587982177734375, -19.87213134765625, -17.156280517578125, -14.4404296875, -11.724578857421875, -9.00872802734375, -6.292877197265625, -3.5770187377929688, -0.8611679077148438, 1.8546829223632812, 4.570533752441406, 7.286384582519531, 10.002235412597656, 12.718086242675781, 15.433937072753906, 18.14978790283203, 20.865638732910156, 23.58148956298828, 26.297340393066406, 29.01319122314453, 31.729042053222656, 34.44489288330078, 37.160743713378906, 39.87659454345703, 42.592445373535156, 45.30829620361328, 48.024147033691406, 50.73999786376953, 53.455848693847656, 56.17169952392578, 58.887550354003906, 61.60340118408203, 64.31925201416016, 67.03510284423828, 69.7509536743164, 72.46680450439453, 75.18265533447266, 77.89850616455078, 80.6143569946289, 83.33020782470703]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 8.0, 8.0, 13.0, 24.0, 26.0, 38.0, 53.0, 78.0, 105.0, 147.0, 211.0, 323.0, 440.0, 732.0, 1124.0, 1738.0, 2772.0, 4462.0, 7533.0, 12551.0, 21402.0, 36458.0, 61211.0, 98818.0, 144502.0, 176116.0, 164798.0, 120337.0, 76825.0, 46588.0, 27307.0, 16492.0, 9617.0, 5908.0, 3505.0, 2263.0, 1388.0, 929.0, 537.0, 352.0, 238.0, 172.0, 122.0, 92.0, 55.0, 44.0, 31.0, 24.0, 20.0, 10.0, 9.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-68.375, -66.220703125, -64.06640625, -61.912109375, -59.7578125, -57.603515625, -55.44921875, -53.294921875, -51.140625, -48.986328125, -46.83203125, -44.677734375, -42.5234375, -40.369140625, -38.21484375, -36.060546875, -33.90625, -31.751953125, -29.59765625, -27.443359375, -25.2890625, -23.134765625, -20.98046875, -18.826171875, -16.671875, -14.517578125, -12.36328125, -10.208984375, -8.0546875, -5.900390625, -3.74609375, -1.591796875, 0.5625, 2.716796875, 4.87109375, 7.025390625, 9.1796875, 11.333984375, 13.48828125, 15.642578125, 17.796875, 19.951171875, 22.10546875, 24.259765625, 26.4140625, 28.568359375, 30.72265625, 32.876953125, 35.03125, 37.185546875, 39.33984375, 41.494140625, 43.6484375, 45.802734375, 47.95703125, 50.111328125, 52.265625, 54.419921875, 56.57421875, 58.728515625, 60.8828125, 63.037109375, 65.19140625, 67.345703125, 69.5]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 4.0, 4.0, 8.0, 9.0, 7.0, 16.0, 13.0, 21.0, 18.0, 21.0, 28.0, 31.0, 35.0, 34.0, 35.0, 33.0, 37.0, 44.0, 43.0, 28.0, 65.0, 42.0, 33.0, 43.0, 36.0, 35.0, 36.0, 34.0, 26.0, 30.0, 20.0, 26.0, 14.0, 20.0, 12.0, 11.0, 11.0, 10.0, 6.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-92.0625, -89.3095703125, -86.556640625, -83.8037109375, -81.05078125, -78.2978515625, -75.544921875, -72.7919921875, -70.0390625, -67.2861328125, -64.533203125, -61.7802734375, -59.02734375, -56.2744140625, -53.521484375, -50.7685546875, -48.015625, -45.2626953125, -42.509765625, -39.7568359375, -37.00390625, -34.2509765625, -31.498046875, -28.7451171875, -25.9921875, -23.2392578125, -20.486328125, -17.7333984375, -14.98046875, -12.2275390625, -9.474609375, -6.7216796875, -3.96875, -1.2158203125, 1.537109375, 4.2900390625, 7.04296875, 9.7958984375, 12.548828125, 15.3017578125, 18.0546875, 20.8076171875, 23.560546875, 26.3134765625, 29.06640625, 31.8193359375, 34.572265625, 37.3251953125, 40.078125, 42.8310546875, 45.583984375, 48.3369140625, 51.08984375, 53.8427734375, 56.595703125, 59.3486328125, 62.1015625, 64.8544921875, 67.607421875, 70.3603515625, 73.11328125, 75.8662109375, 78.619140625, 81.3720703125, 84.125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 4.0, 2.0, 7.0, 7.0, 16.0, 9.0, 18.0, 28.0, 33.0, 29.0, 65.0, 67.0, 105.0, 114.0, 176.0, 224.0, 343.0, 453.0, 661.0, 1116.0, 1786.0, 2983.0, 5566.0, 11022.0, 25135.0, 65743.0, 183017.0, 351161.0, 243591.0, 91431.0, 33200.0, 14045.0, 6749.0, 3512.0, 2081.0, 1274.0, 838.0, 552.0, 402.0, 266.0, 191.0, 134.0, 100.0, 76.0, 53.0, 51.0, 24.0, 24.0, 13.0, 11.0, 15.0, 17.0, 4.0, 10.0, 6.0, 2.0, 2.0, 2.0], "bins": [-93.9375, -91.146484375, -88.35546875, -85.564453125, -82.7734375, -79.982421875, -77.19140625, -74.400390625, -71.609375, -68.818359375, -66.02734375, -63.236328125, -60.4453125, -57.654296875, -54.86328125, -52.072265625, -49.28125, -46.490234375, -43.69921875, -40.908203125, -38.1171875, -35.326171875, -32.53515625, -29.744140625, -26.953125, -24.162109375, -21.37109375, -18.580078125, -15.7890625, -12.998046875, -10.20703125, -7.416015625, -4.625, -1.833984375, 0.95703125, 3.748046875, 6.5390625, 9.330078125, 12.12109375, 14.912109375, 17.703125, 20.494140625, 23.28515625, 26.076171875, 28.8671875, 31.658203125, 34.44921875, 37.240234375, 40.03125, 42.822265625, 45.61328125, 48.404296875, 51.1953125, 53.986328125, 56.77734375, 59.568359375, 62.359375, 65.150390625, 67.94140625, 70.732421875, 73.5234375, 76.314453125, 79.10546875, 81.896484375, 84.6875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 4.0, 4.0, 2.0, 2.0, 4.0, 4.0, 11.0, 6.0, 9.0, 18.0, 12.0, 16.0, 16.0, 22.0, 27.0, 33.0, 35.0, 31.0, 38.0, 43.0, 37.0, 38.0, 42.0, 42.0, 44.0, 38.0, 30.0, 40.0, 28.0, 27.0, 25.0, 33.0, 29.0, 33.0, 31.0, 22.0, 18.0, 29.0, 15.0, 16.0, 12.0, 5.0, 10.0, 5.0, 9.0, 5.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-55.78125, -54.0712890625, -52.361328125, -50.6513671875, -48.94140625, -47.2314453125, -45.521484375, -43.8115234375, -42.1015625, -40.3916015625, -38.681640625, -36.9716796875, -35.26171875, -33.5517578125, -31.841796875, -30.1318359375, -28.421875, -26.7119140625, -25.001953125, -23.2919921875, -21.58203125, -19.8720703125, -18.162109375, -16.4521484375, -14.7421875, -13.0322265625, -11.322265625, -9.6123046875, -7.90234375, -6.1923828125, -4.482421875, -2.7724609375, -1.0625, 0.6474609375, 2.357421875, 4.0673828125, 5.77734375, 7.4873046875, 9.197265625, 10.9072265625, 12.6171875, 14.3271484375, 16.037109375, 17.7470703125, 19.45703125, 21.1669921875, 22.876953125, 24.5869140625, 26.296875, 28.0068359375, 29.716796875, 31.4267578125, 33.13671875, 34.8466796875, 36.556640625, 38.2666015625, 39.9765625, 41.6865234375, 43.396484375, 45.1064453125, 46.81640625, 48.5263671875, 50.236328125, 51.9462890625, 53.65625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 5.0, 2.0, 4.0, 4.0, 7.0, 9.0, 7.0, 15.0, 26.0, 32.0, 29.0, 48.0, 54.0, 79.0, 129.0, 177.0, 253.0, 333.0, 479.0, 729.0, 1179.0, 2020.0, 3555.0, 6453.0, 12970.0, 27027.0, 62394.0, 149466.0, 300062.0, 264239.0, 120076.0, 50248.0, 22239.0, 10607.0, 5457.0, 3125.0, 1822.0, 1032.0, 660.0, 447.0, 299.0, 204.0, 162.0, 99.0, 72.0, 69.0, 32.0, 27.0, 28.0, 18.0, 12.0, 13.0, 8.0, 5.0, 7.0, 0.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0], "bins": [-38.125, -36.89013671875, -35.6552734375, -34.42041015625, -33.185546875, -31.95068359375, -30.7158203125, -29.48095703125, -28.24609375, -27.01123046875, -25.7763671875, -24.54150390625, -23.306640625, -22.07177734375, -20.8369140625, -19.60205078125, -18.3671875, -17.13232421875, -15.8974609375, -14.66259765625, -13.427734375, -12.19287109375, -10.9580078125, -9.72314453125, -8.48828125, -7.25341796875, -6.0185546875, -4.78369140625, -3.548828125, -2.31396484375, -1.0791015625, 0.15576171875, 1.390625, 2.62548828125, 3.8603515625, 5.09521484375, 6.330078125, 7.56494140625, 8.7998046875, 10.03466796875, 11.26953125, 12.50439453125, 13.7392578125, 14.97412109375, 16.208984375, 17.44384765625, 18.6787109375, 19.91357421875, 21.1484375, 22.38330078125, 23.6181640625, 24.85302734375, 26.087890625, 27.32275390625, 28.5576171875, 29.79248046875, 31.02734375, 32.26220703125, 33.4970703125, 34.73193359375, 35.966796875, 37.20166015625, 38.4365234375, 39.67138671875, 40.90625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 4.0, 1.0, 6.0, 5.0, 7.0, 9.0, 21.0, 26.0, 21.0, 36.0, 52.0, 59.0, 85.0, 75.0, 80.0, 94.0, 96.0, 64.0, 61.0, 49.0, 45.0, 32.0, 15.0, 22.0, 11.0, 14.0, 8.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002880096435546875, -0.0027959048748016357, -0.0027117133140563965, -0.0026275217533111572, -0.002543330192565918, -0.0024591386318206787, -0.0023749470710754395, -0.0022907555103302, -0.002206563949584961, -0.0021223723888397217, -0.0020381808280944824, -0.001953989267349243, -0.001869797706604004, -0.0017856061458587646, -0.0017014145851135254, -0.0016172230243682861, -0.0015330314636230469, -0.0014488399028778076, -0.0013646483421325684, -0.001280456781387329, -0.0011962652206420898, -0.0011120736598968506, -0.0010278820991516113, -0.0009436905384063721, -0.0008594989776611328, -0.0007753074169158936, -0.0006911158561706543, -0.000606924295425415, -0.0005227327346801758, -0.0004385411739349365, -0.00035434961318969727, -0.000270158052444458, -0.00018596649169921875, -0.00010177493095397949, -1.7583370208740234e-05, 6.660819053649902e-05, 0.00015079975128173828, 0.00023499131202697754, 0.0003191828727722168, 0.00040337443351745605, 0.0004875659942626953, 0.0005717575550079346, 0.0006559491157531738, 0.0007401406764984131, 0.0008243322372436523, 0.0009085237979888916, 0.0009927153587341309, 0.0010769069194793701, 0.0011610984802246094, 0.0012452900409698486, 0.0013294816017150879, 0.0014136731624603271, 0.0014978647232055664, 0.0015820562839508057, 0.001666247844696045, 0.0017504394054412842, 0.0018346309661865234, 0.0019188225269317627, 0.002003014087677002, 0.002087205648422241, 0.0021713972091674805, 0.0022555887699127197, 0.002339780330657959, 0.0024239718914031982, 0.0025081634521484375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 11.0, 15.0, 21.0, 34.0, 41.0, 68.0, 91.0, 118.0, 176.0, 310.0, 425.0, 677.0, 1059.0, 1745.0, 2965.0, 4934.0, 8904.0, 16591.0, 30829.0, 57024.0, 102455.0, 164490.0, 204356.0, 180350.0, 120355.0, 68054.0, 37165.0, 19694.0, 10715.0, 5978.0, 3306.0, 2016.0, 1271.0, 781.0, 497.0, 347.0, 231.0, 142.0, 96.0, 78.0, 44.0, 29.0, 22.0, 18.0, 11.0, 8.0, 7.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-59.5, -57.78271484375, -56.0654296875, -54.34814453125, -52.630859375, -50.91357421875, -49.1962890625, -47.47900390625, -45.76171875, -44.04443359375, -42.3271484375, -40.60986328125, -38.892578125, -37.17529296875, -35.4580078125, -33.74072265625, -32.0234375, -30.30615234375, -28.5888671875, -26.87158203125, -25.154296875, -23.43701171875, -21.7197265625, -20.00244140625, -18.28515625, -16.56787109375, -14.8505859375, -13.13330078125, -11.416015625, -9.69873046875, -7.9814453125, -6.26416015625, -4.546875, -2.82958984375, -1.1123046875, 0.60498046875, 2.322265625, 4.03955078125, 5.7568359375, 7.47412109375, 9.19140625, 10.90869140625, 12.6259765625, 14.34326171875, 16.060546875, 17.77783203125, 19.4951171875, 21.21240234375, 22.9296875, 24.64697265625, 26.3642578125, 28.08154296875, 29.798828125, 31.51611328125, 33.2333984375, 34.95068359375, 36.66796875, 38.38525390625, 40.1025390625, 41.81982421875, 43.537109375, 45.25439453125, 46.9716796875, 48.68896484375, 50.40625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 5.0, 3.0, 8.0, 8.0, 12.0, 20.0, 20.0, 27.0, 28.0, 35.0, 31.0, 45.0, 43.0, 46.0, 51.0, 66.0, 55.0, 58.0, 57.0, 47.0, 48.0, 35.0, 38.0, 50.0, 25.0, 25.0, 28.0, 12.0, 25.0, 16.0, 7.0, 8.0, 8.0, 1.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.9921875, -11.5133056640625, -11.034423828125, -10.5555419921875, -10.07666015625, -9.5977783203125, -9.118896484375, -8.6400146484375, -8.1611328125, -7.6822509765625, -7.203369140625, -6.7244873046875, -6.24560546875, -5.7667236328125, -5.287841796875, -4.8089599609375, -4.330078125, -3.8511962890625, -3.372314453125, -2.8934326171875, -2.41455078125, -1.9356689453125, -1.456787109375, -0.9779052734375, -0.4990234375, -0.0201416015625, 0.458740234375, 0.9376220703125, 1.41650390625, 1.8953857421875, 2.374267578125, 2.8531494140625, 3.33203125, 3.8109130859375, 4.289794921875, 4.7686767578125, 5.24755859375, 5.7264404296875, 6.205322265625, 6.6842041015625, 7.1630859375, 7.6419677734375, 8.120849609375, 8.5997314453125, 9.07861328125, 9.5574951171875, 10.036376953125, 10.5152587890625, 10.994140625, 11.4730224609375, 11.951904296875, 12.4307861328125, 12.90966796875, 13.3885498046875, 13.867431640625, 14.3463134765625, 14.8251953125, 15.3040771484375, 15.782958984375, 16.2618408203125, 16.74072265625, 17.2196044921875, 17.698486328125, 18.1773681640625, 18.65625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 8.0, 5.0, 5.0, 11.0, 10.0, 11.0, 17.0, 10.0, 13.0, 22.0, 34.0, 32.0, 28.0, 28.0, 28.0, 34.0, 41.0, 41.0, 45.0, 37.0, 54.0, 32.0, 38.0, 47.0, 47.0, 55.0, 40.0, 26.0, 40.0, 24.0, 24.0, 18.0, 21.0, 19.0, 10.0, 12.0, 5.0, 12.0, 6.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0], "bins": [-100.13265228271484, -97.32498168945312, -94.51731872558594, -91.70964813232422, -88.90198516845703, -86.09431457519531, -83.28665161132812, -80.4789810180664, -77.67131042480469, -74.86363983154297, -72.05597686767578, -69.24830627441406, -66.44064331054688, -63.632972717285156, -60.8253059387207, -58.01763916015625, -55.20997619628906, -52.40230941772461, -49.594642639160156, -46.78697204589844, -43.97930908203125, -41.17163848876953, -38.36397171020508, -35.556304931640625, -32.74863815307617, -29.94097137451172, -27.133304595947266, -24.32563591003418, -21.517969131469727, -18.710302352905273, -15.902633666992188, -13.094966888427734, -10.28729248046875, -7.479625225067139, -4.671957969665527, -1.8642902374267578, 0.9433765411376953, 3.7510433197021484, 6.558712005615234, 9.366378784179688, 12.17404556274414, 14.981712341308594, 17.789379119873047, 20.597047805786133, 23.404714584350586, 26.21238136291504, 29.020050048828125, 31.827716827392578, 34.63538360595703, 37.443050384521484, 40.25071716308594, 43.058387756347656, 45.866050720214844, 48.67372131347656, 51.481388092041016, 54.28905487060547, 57.09672164916992, 59.904388427734375, 62.71205520629883, 65.51972198486328, 68.327392578125, 71.13505554199219, 73.9427261352539, 76.75039672851562, 79.55805969238281]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 10.0, 4.0, 7.0, 5.0, 18.0, 10.0, 15.0, 22.0, 25.0, 25.0, 35.0, 32.0, 27.0, 42.0, 38.0, 42.0, 37.0, 33.0, 48.0, 38.0, 50.0, 37.0, 46.0, 41.0, 31.0, 35.0, 38.0, 28.0, 24.0, 17.0, 22.0, 18.0, 18.0, 15.0, 18.0, 9.0, 8.0, 9.0, 6.0, 5.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0], "bins": [-92.81146240234375, -90.04576110839844, -87.28006744384766, -84.51436614990234, -81.74867248535156, -78.98297119140625, -76.21726989746094, -73.45156860351562, -70.68587493896484, -67.92017364501953, -65.15447998046875, -62.38877868652344, -59.62308120727539, -56.857383728027344, -54.09168243408203, -51.325984954833984, -48.56028747558594, -45.79458999633789, -43.028892517089844, -40.26319122314453, -37.497493743896484, -34.73179626464844, -31.966096878051758, -29.200397491455078, -26.43470001220703, -23.669002532958984, -20.903303146362305, -18.137603759765625, -15.371906280517578, -12.606207847595215, -9.840509414672852, -7.074810028076172, -4.309104919433594, -1.5434064865112305, 1.2222919464111328, 3.987990379333496, 6.753688812255859, 9.519387245178223, 12.285085678100586, 15.050785064697266, 17.816482543945312, 20.58218002319336, 23.34787940979004, 26.11357879638672, 28.879276275634766, 31.644973754882812, 34.410675048828125, 37.17637252807617, 39.94207000732422, 42.707767486572266, 45.47346496582031, 48.239166259765625, 51.00486373901367, 53.77056121826172, 56.53626251220703, 59.30195999145508, 62.067657470703125, 64.83335876464844, 67.59905242919922, 70.36475372314453, 73.13044738769531, 75.89614868164062, 78.66184997558594, 81.42755126953125, 84.19324493408203]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 6.0, 4.0, 5.0, 11.0, 10.0, 19.0, 33.0, 46.0, 69.0, 102.0, 166.0, 305.0, 446.0, 665.0, 1013.0, 1525.0, 2413.0, 3573.0, 5455.0, 8028.0, 11919.0, 16593.0, 23551.0, 31612.0, 41760.0, 52970.0, 64366.0, 75284.0, 83622.0, 88922.0, 89128.0, 84851.0, 77151.0, 66836.0, 55998.0, 44144.0, 33673.0, 24908.0, 18314.0, 12725.0, 8724.0, 6009.0, 4014.0, 2623.0, 1767.0, 1158.0, 726.0, 466.0, 307.0, 207.0, 128.0, 86.0, 51.0, 35.0, 12.0, 17.0, 7.0, 7.0, 4.0, 1.0, 0.0, 1.0], "bins": [-71.0625, -68.849609375, -66.63671875, -64.423828125, -62.2109375, -59.998046875, -57.78515625, -55.572265625, -53.359375, -51.146484375, -48.93359375, -46.720703125, -44.5078125, -42.294921875, -40.08203125, -37.869140625, -35.65625, -33.443359375, -31.23046875, -29.017578125, -26.8046875, -24.591796875, -22.37890625, -20.166015625, -17.953125, -15.740234375, -13.52734375, -11.314453125, -9.1015625, -6.888671875, -4.67578125, -2.462890625, -0.25, 1.962890625, 4.17578125, 6.388671875, 8.6015625, 10.814453125, 13.02734375, 15.240234375, 17.453125, 19.666015625, 21.87890625, 24.091796875, 26.3046875, 28.517578125, 30.73046875, 32.943359375, 35.15625, 37.369140625, 39.58203125, 41.794921875, 44.0078125, 46.220703125, 48.43359375, 50.646484375, 52.859375, 55.072265625, 57.28515625, 59.498046875, 61.7109375, 63.923828125, 66.13671875, 68.349609375, 70.5625]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 11.0, 6.0, 3.0, 7.0, 16.0, 12.0, 13.0, 22.0, 23.0, 29.0, 36.0, 30.0, 26.0, 44.0, 37.0, 42.0, 34.0, 33.0, 49.0, 38.0, 49.0, 41.0, 43.0, 43.0, 28.0, 38.0, 35.0, 31.0, 23.0, 19.0, 17.0, 19.0, 19.0, 16.0, 16.0, 9.0, 10.0, 9.0, 7.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0], "bins": [-92.3125, -89.5634765625, -86.814453125, -84.0654296875, -81.31640625, -78.5673828125, -75.818359375, -73.0693359375, -70.3203125, -67.5712890625, -64.822265625, -62.0732421875, -59.32421875, -56.5751953125, -53.826171875, -51.0771484375, -48.328125, -45.5791015625, -42.830078125, -40.0810546875, -37.33203125, -34.5830078125, -31.833984375, -29.0849609375, -26.3359375, -23.5869140625, -20.837890625, -18.0888671875, -15.33984375, -12.5908203125, -9.841796875, -7.0927734375, -4.34375, -1.5947265625, 1.154296875, 3.9033203125, 6.65234375, 9.4013671875, 12.150390625, 14.8994140625, 17.6484375, 20.3974609375, 23.146484375, 25.8955078125, 28.64453125, 31.3935546875, 34.142578125, 36.8916015625, 39.640625, 42.3896484375, 45.138671875, 47.8876953125, 50.63671875, 53.3857421875, 56.134765625, 58.8837890625, 61.6328125, 64.3818359375, 67.130859375, 69.8798828125, 72.62890625, 75.3779296875, 78.126953125, 80.8759765625, 83.625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 8.0, 13.0, 12.0, 17.0, 38.0, 49.0, 48.0, 129.0, 203.0, 342.0, 614.0, 1038.0, 1679.0, 2897.0, 5235.0, 9100.0, 15477.0, 26152.0, 41955.0, 64246.0, 90299.0, 116461.0, 134118.0, 134814.0, 120949.0, 96572.0, 69177.0, 46579.0, 29077.0, 16834.0, 10189.0, 5863.0, 3410.0, 1982.0, 1197.0, 707.0, 406.0, 233.0, 148.0, 104.0, 80.0, 36.0, 21.0, 13.0, 9.0, 7.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-120.75, -116.9892578125, -113.228515625, -109.4677734375, -105.70703125, -101.9462890625, -98.185546875, -94.4248046875, -90.6640625, -86.9033203125, -83.142578125, -79.3818359375, -75.62109375, -71.8603515625, -68.099609375, -64.3388671875, -60.578125, -56.8173828125, -53.056640625, -49.2958984375, -45.53515625, -41.7744140625, -38.013671875, -34.2529296875, -30.4921875, -26.7314453125, -22.970703125, -19.2099609375, -15.44921875, -11.6884765625, -7.927734375, -4.1669921875, -0.40625, 3.3544921875, 7.115234375, 10.8759765625, 14.63671875, 18.3974609375, 22.158203125, 25.9189453125, 29.6796875, 33.4404296875, 37.201171875, 40.9619140625, 44.72265625, 48.4833984375, 52.244140625, 56.0048828125, 59.765625, 63.5263671875, 67.287109375, 71.0478515625, 74.80859375, 78.5693359375, 82.330078125, 86.0908203125, 89.8515625, 93.6123046875, 97.373046875, 101.1337890625, 104.89453125, 108.6552734375, 112.416015625, 116.1767578125, 119.9375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 1.0, 8.0, 9.0, 17.0, 18.0, 10.0, 15.0, 25.0, 17.0, 33.0, 43.0, 42.0, 40.0, 42.0, 60.0, 58.0, 50.0, 48.0, 47.0, 52.0, 50.0, 46.0, 43.0, 29.0, 31.0, 23.0, 30.0, 23.0, 19.0, 14.0, 10.0, 6.0, 9.0, 7.0, 5.0, 3.0, 7.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.5625, -79.1943359375, -76.826171875, -74.4580078125, -72.08984375, -69.7216796875, -67.353515625, -64.9853515625, -62.6171875, -60.2490234375, -57.880859375, -55.5126953125, -53.14453125, -50.7763671875, -48.408203125, -46.0400390625, -43.671875, -41.3037109375, -38.935546875, -36.5673828125, -34.19921875, -31.8310546875, -29.462890625, -27.0947265625, -24.7265625, -22.3583984375, -19.990234375, -17.6220703125, -15.25390625, -12.8857421875, -10.517578125, -8.1494140625, -5.78125, -3.4130859375, -1.044921875, 1.3232421875, 3.69140625, 6.0595703125, 8.427734375, 10.7958984375, 13.1640625, 15.5322265625, 17.900390625, 20.2685546875, 22.63671875, 25.0048828125, 27.373046875, 29.7412109375, 32.109375, 34.4775390625, 36.845703125, 39.2138671875, 41.58203125, 43.9501953125, 46.318359375, 48.6865234375, 51.0546875, 53.4228515625, 55.791015625, 58.1591796875, 60.52734375, 62.8955078125, 65.263671875, 67.6318359375, 70.0]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 12.0, 14.0, 27.0, 30.0, 48.0, 62.0, 106.0, 148.0, 229.0, 314.0, 505.0, 779.0, 1242.0, 1935.0, 2884.0, 4645.0, 7339.0, 12377.0, 20202.0, 32991.0, 54058.0, 83629.0, 118285.0, 145849.0, 151944.0, 132594.0, 100256.0, 66902.0, 42025.0, 25745.0, 15572.0, 9539.0, 5967.0, 3714.0, 2338.0, 1483.0, 977.0, 593.0, 382.0, 279.0, 169.0, 115.0, 88.0, 55.0, 31.0, 32.0, 18.0, 5.0, 8.0, 2.0, 6.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-40.5, -39.20361328125, -37.9072265625, -36.61083984375, -35.314453125, -34.01806640625, -32.7216796875, -31.42529296875, -30.12890625, -28.83251953125, -27.5361328125, -26.23974609375, -24.943359375, -23.64697265625, -22.3505859375, -21.05419921875, -19.7578125, -18.46142578125, -17.1650390625, -15.86865234375, -14.572265625, -13.27587890625, -11.9794921875, -10.68310546875, -9.38671875, -8.09033203125, -6.7939453125, -5.49755859375, -4.201171875, -2.90478515625, -1.6083984375, -0.31201171875, 0.984375, 2.28076171875, 3.5771484375, 4.87353515625, 6.169921875, 7.46630859375, 8.7626953125, 10.05908203125, 11.35546875, 12.65185546875, 13.9482421875, 15.24462890625, 16.541015625, 17.83740234375, 19.1337890625, 20.43017578125, 21.7265625, 23.02294921875, 24.3193359375, 25.61572265625, 26.912109375, 28.20849609375, 29.5048828125, 30.80126953125, 32.09765625, 33.39404296875, 34.6904296875, 35.98681640625, 37.283203125, 38.57958984375, 39.8759765625, 41.17236328125, 42.46875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 9.0, 9.0, 17.0, 18.0, 27.0, 39.0, 46.0, 61.0, 63.0, 70.0, 95.0, 88.0, 104.0, 80.0, 75.0, 64.0, 33.0, 17.0, 23.0, 15.0, 14.0, 8.0, 6.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.01085662841796875, -0.01060110330581665, -0.01034557819366455, -0.010090053081512451, -0.009834527969360352, -0.009579002857208252, -0.009323477745056152, -0.009067952632904053, -0.008812427520751953, -0.008556902408599854, -0.008301377296447754, -0.008045852184295654, -0.007790327072143555, -0.007534801959991455, -0.0072792768478393555, -0.007023751735687256, -0.006768226623535156, -0.006512701511383057, -0.006257176399230957, -0.006001651287078857, -0.005746126174926758, -0.005490601062774658, -0.005235075950622559, -0.004979550838470459, -0.004724025726318359, -0.00446850061416626, -0.00421297550201416, -0.0039574503898620605, -0.003701925277709961, -0.0034464001655578613, -0.0031908750534057617, -0.002935349941253662, -0.0026798248291015625, -0.002424299716949463, -0.0021687746047973633, -0.0019132494926452637, -0.001657724380493164, -0.0014021992683410645, -0.0011466741561889648, -0.0008911490440368652, -0.0006356239318847656, -0.000380098819732666, -0.0001245737075805664, 0.0001309514045715332, 0.0003864765167236328, 0.0006420016288757324, 0.000897526741027832, 0.0011530518531799316, 0.0014085769653320312, 0.0016641020774841309, 0.0019196271896362305, 0.00217515230178833, 0.0024306774139404297, 0.0026862025260925293, 0.002941727638244629, 0.0031972527503967285, 0.003452777862548828, 0.0037083029747009277, 0.003963828086853027, 0.004219353199005127, 0.0044748783111572266, 0.004730403423309326, 0.004985928535461426, 0.005241453647613525, 0.005496978759765625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 6.0, 6.0, 8.0, 13.0, 35.0, 44.0, 58.0, 69.0, 139.0, 198.0, 332.0, 505.0, 845.0, 1259.0, 2007.0, 3169.0, 4746.0, 7399.0, 10878.0, 16080.0, 23559.0, 33022.0, 45232.0, 59260.0, 73192.0, 86181.0, 95831.0, 99660.0, 97221.0, 87940.0, 76451.0, 61801.0, 47803.0, 35652.0, 25451.0, 17524.0, 12035.0, 7950.0, 5341.0, 3520.0, 2245.0, 1385.0, 900.0, 573.0, 365.0, 223.0, 159.0, 92.0, 79.0, 43.0, 30.0, 21.0, 11.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-21.484375, -20.782470703125, -20.08056640625, -19.378662109375, -18.6767578125, -17.974853515625, -17.27294921875, -16.571044921875, -15.869140625, -15.167236328125, -14.46533203125, -13.763427734375, -13.0615234375, -12.359619140625, -11.65771484375, -10.955810546875, -10.25390625, -9.552001953125, -8.85009765625, -8.148193359375, -7.4462890625, -6.744384765625, -6.04248046875, -5.340576171875, -4.638671875, -3.936767578125, -3.23486328125, -2.532958984375, -1.8310546875, -1.129150390625, -0.42724609375, 0.274658203125, 0.9765625, 1.678466796875, 2.38037109375, 3.082275390625, 3.7841796875, 4.486083984375, 5.18798828125, 5.889892578125, 6.591796875, 7.293701171875, 7.99560546875, 8.697509765625, 9.3994140625, 10.101318359375, 10.80322265625, 11.505126953125, 12.20703125, 12.908935546875, 13.61083984375, 14.312744140625, 15.0146484375, 15.716552734375, 16.41845703125, 17.120361328125, 17.822265625, 18.524169921875, 19.22607421875, 19.927978515625, 20.6298828125, 21.331787109375, 22.03369140625, 22.735595703125, 23.4375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 5.0, 8.0, 5.0, 6.0, 19.0, 20.0, 23.0, 14.0, 24.0, 35.0, 38.0, 40.0, 45.0, 45.0, 36.0, 58.0, 48.0, 53.0, 45.0, 40.0, 41.0, 48.0, 35.0, 23.0, 33.0, 25.0, 29.0, 28.0, 23.0, 29.0, 24.0, 8.0, 9.0, 6.0, 9.0, 6.0, 5.0, 4.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.578125, -11.244384765625, -10.91064453125, -10.576904296875, -10.2431640625, -9.909423828125, -9.57568359375, -9.241943359375, -8.908203125, -8.574462890625, -8.24072265625, -7.906982421875, -7.5732421875, -7.239501953125, -6.90576171875, -6.572021484375, -6.23828125, -5.904541015625, -5.57080078125, -5.237060546875, -4.9033203125, -4.569580078125, -4.23583984375, -3.902099609375, -3.568359375, -3.234619140625, -2.90087890625, -2.567138671875, -2.2333984375, -1.899658203125, -1.56591796875, -1.232177734375, -0.8984375, -0.564697265625, -0.23095703125, 0.102783203125, 0.4365234375, 0.770263671875, 1.10400390625, 1.437744140625, 1.771484375, 2.105224609375, 2.43896484375, 2.772705078125, 3.1064453125, 3.440185546875, 3.77392578125, 4.107666015625, 4.44140625, 4.775146484375, 5.10888671875, 5.442626953125, 5.7763671875, 6.110107421875, 6.44384765625, 6.777587890625, 7.111328125, 7.445068359375, 7.77880859375, 8.112548828125, 8.4462890625, 8.780029296875, 9.11376953125, 9.447509765625, 9.78125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 8.0, 3.0, 12.0, 15.0, 13.0, 7.0, 18.0, 22.0, 20.0, 29.0, 31.0, 45.0, 40.0, 36.0, 40.0, 40.0, 40.0, 48.0, 58.0, 37.0, 39.0, 50.0, 44.0, 41.0, 36.0, 42.0, 39.0, 27.0, 22.0, 23.0, 20.0, 10.0, 11.0, 7.0, 9.0, 3.0, 7.0, 2.0, 3.0, 5.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.14584350585938, -90.01254272460938, -86.8792495727539, -83.7459487915039, -80.61265563964844, -77.47935485839844, -74.34605407714844, -71.21276092529297, -68.0794677734375, -64.9461669921875, -61.81287384033203, -58.67957305908203, -55.54627990722656, -52.41297912597656, -49.27968215942383, -46.146385192871094, -43.013084411621094, -39.87978744506836, -36.746490478515625, -33.613189697265625, -30.479894638061523, -27.34659767150879, -24.213298797607422, -21.080001831054688, -17.946704864501953, -14.813407897949219, -11.680109977722168, -8.546812057495117, -5.413515090942383, -2.2802181243896484, 0.8530807495117188, 3.986377716064453, 7.119682312011719, 10.252979278564453, 13.386277198791504, 16.519575119018555, 19.65287208557129, 22.786169052124023, 25.91946792602539, 29.052764892578125, 32.18606185913086, 35.319358825683594, 38.45265579223633, 41.58595275878906, 44.71925354003906, 47.85254669189453, 50.98584747314453, 54.119144439697266, 57.25244140625, 60.385738372802734, 63.51903533935547, 66.65233612060547, 69.78562927246094, 72.91893005371094, 76.05223083496094, 79.1855239868164, 82.31881713867188, 85.45211791992188, 88.58541107177734, 91.71871185302734, 94.85200500488281, 97.98530578613281, 101.11860656738281, 104.25189971923828, 107.38520050048828]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 8.0, 5.0, 4.0, 11.0, 8.0, 11.0, 18.0, 24.0, 25.0, 25.0, 30.0, 22.0, 45.0, 22.0, 44.0, 44.0, 31.0, 32.0, 31.0, 51.0, 45.0, 37.0, 43.0, 32.0, 24.0, 33.0, 31.0, 47.0, 25.0, 18.0, 29.0, 20.0, 25.0, 18.0, 13.0, 13.0, 14.0, 13.0, 1.0, 7.0, 2.0, 7.0, 7.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-86.0357437133789, -83.21099090576172, -80.38624572753906, -77.56149291992188, -74.73674774169922, -71.91199493408203, -69.08724975585938, -66.26249694824219, -63.437747955322266, -60.612998962402344, -57.78824996948242, -54.9635009765625, -52.13874816894531, -49.314002990722656, -46.48925018310547, -43.66450119018555, -40.839752197265625, -38.0150032043457, -35.19025421142578, -32.365501403808594, -29.540754318237305, -26.716005325317383, -23.891254425048828, -21.066505432128906, -18.241756439208984, -15.417007446289062, -12.592257499694824, -9.767507553100586, -6.942758560180664, -4.118009567260742, -1.2932586669921875, 1.5314903259277344, 4.356231689453125, 7.180981159210205, 10.005730628967285, 12.830480575561523, 15.655229568481445, 18.479978561401367, 21.304729461669922, 24.129478454589844, 26.954227447509766, 29.778976440429688, 32.60372543334961, 35.42847442626953, 38.25322723388672, 41.077972412109375, 43.90272521972656, 46.727474212646484, 49.552223205566406, 52.37697219848633, 55.20172119140625, 58.02647399902344, 60.851219177246094, 63.67597198486328, 66.50071716308594, 69.32546997070312, 72.15022277832031, 74.9749755859375, 77.79972076416016, 80.62447357177734, 83.44921875, 86.27397155761719, 89.09872436523438, 91.92346954345703, 94.74821472167969]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 7.0, 12.0, 17.0, 31.0, 39.0, 82.0, 139.0, 237.0, 416.0, 644.0, 1202.0, 2078.0, 3376.0, 5830.0, 9687.0, 16483.0, 26715.0, 42504.0, 68739.0, 105105.0, 158298.0, 226277.0, 306857.0, 387242.0, 451055.0, 478337.0, 458963.0, 399156.0, 320655.0, 238974.0, 169273.0, 113897.0, 74890.0, 48024.0, 30703.0, 18725.0, 11380.0, 7077.0, 4331.0, 2716.0, 1604.0, 1020.0, 590.0, 369.0, 204.0, 128.0, 82.0, 41.0, 35.0, 12.0, 15.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0], "bins": [-80.5625, -78.013671875, -75.46484375, -72.916015625, -70.3671875, -67.818359375, -65.26953125, -62.720703125, -60.171875, -57.623046875, -55.07421875, -52.525390625, -49.9765625, -47.427734375, -44.87890625, -42.330078125, -39.78125, -37.232421875, -34.68359375, -32.134765625, -29.5859375, -27.037109375, -24.48828125, -21.939453125, -19.390625, -16.841796875, -14.29296875, -11.744140625, -9.1953125, -6.646484375, -4.09765625, -1.548828125, 1.0, 3.548828125, 6.09765625, 8.646484375, 11.1953125, 13.744140625, 16.29296875, 18.841796875, 21.390625, 23.939453125, 26.48828125, 29.037109375, 31.5859375, 34.134765625, 36.68359375, 39.232421875, 41.78125, 44.330078125, 46.87890625, 49.427734375, 51.9765625, 54.525390625, 57.07421875, 59.623046875, 62.171875, 64.720703125, 67.26953125, 69.818359375, 72.3671875, 74.916015625, 77.46484375, 80.013671875, 82.5625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 6.0, 5.0, 9.0, 8.0, 11.0, 13.0, 14.0, 21.0, 30.0, 23.0, 33.0, 28.0, 32.0, 37.0, 39.0, 43.0, 32.0, 26.0, 32.0, 48.0, 44.0, 40.0, 36.0, 37.0, 31.0, 24.0, 38.0, 36.0, 30.0, 20.0, 25.0, 27.0, 22.0, 20.0, 10.0, 15.0, 14.0, 9.0, 8.0, 4.0, 3.0, 7.0, 6.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-74.375, -71.931640625, -69.48828125, -67.044921875, -64.6015625, -62.158203125, -59.71484375, -57.271484375, -54.828125, -52.384765625, -49.94140625, -47.498046875, -45.0546875, -42.611328125, -40.16796875, -37.724609375, -35.28125, -32.837890625, -30.39453125, -27.951171875, -25.5078125, -23.064453125, -20.62109375, -18.177734375, -15.734375, -13.291015625, -10.84765625, -8.404296875, -5.9609375, -3.517578125, -1.07421875, 1.369140625, 3.8125, 6.255859375, 8.69921875, 11.142578125, 13.5859375, 16.029296875, 18.47265625, 20.916015625, 23.359375, 25.802734375, 28.24609375, 30.689453125, 33.1328125, 35.576171875, 38.01953125, 40.462890625, 42.90625, 45.349609375, 47.79296875, 50.236328125, 52.6796875, 55.123046875, 57.56640625, 60.009765625, 62.453125, 64.896484375, 67.33984375, 69.783203125, 72.2265625, 74.669921875, 77.11328125, 79.556640625, 82.0]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 7.0, 6.0, 10.0, 11.0, 33.0, 36.0, 73.0, 115.0, 185.0, 286.0, 549.0, 876.0, 1491.0, 2605.0, 4459.0, 7599.0, 12419.0, 20681.0, 33642.0, 53365.0, 82825.0, 121687.0, 175354.0, 238508.0, 307839.0, 371542.0, 419747.0, 436896.0, 420789.0, 378991.0, 315162.0, 245704.0, 181794.0, 127390.0, 85934.0, 55878.0, 35450.0, 21572.0, 13107.0, 8058.0, 4808.0, 2757.0, 1664.0, 983.0, 568.0, 358.0, 186.0, 122.0, 72.0, 32.0, 27.0, 23.0, 6.0, 6.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-79.5, -76.98046875, -74.4609375, -71.94140625, -69.421875, -66.90234375, -64.3828125, -61.86328125, -59.34375, -56.82421875, -54.3046875, -51.78515625, -49.265625, -46.74609375, -44.2265625, -41.70703125, -39.1875, -36.66796875, -34.1484375, -31.62890625, -29.109375, -26.58984375, -24.0703125, -21.55078125, -19.03125, -16.51171875, -13.9921875, -11.47265625, -8.953125, -6.43359375, -3.9140625, -1.39453125, 1.125, 3.64453125, 6.1640625, 8.68359375, 11.203125, 13.72265625, 16.2421875, 18.76171875, 21.28125, 23.80078125, 26.3203125, 28.83984375, 31.359375, 33.87890625, 36.3984375, 38.91796875, 41.4375, 43.95703125, 46.4765625, 48.99609375, 51.515625, 54.03515625, 56.5546875, 59.07421875, 61.59375, 64.11328125, 66.6328125, 69.15234375, 71.671875, 74.19140625, 76.7109375, 79.23046875, 81.75]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 11.0, 10.0, 15.0, 26.0, 28.0, 37.0, 39.0, 49.0, 71.0, 84.0, 96.0, 115.0, 126.0, 152.0, 160.0, 190.0, 223.0, 220.0, 210.0, 219.0, 237.0, 230.0, 197.0, 215.0, 185.0, 166.0, 148.0, 122.0, 111.0, 89.0, 68.0, 46.0, 49.0, 30.0, 24.0, 13.0, 19.0, 11.0, 10.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-46.15625, -44.74267578125, -43.3291015625, -41.91552734375, -40.501953125, -39.08837890625, -37.6748046875, -36.26123046875, -34.84765625, -33.43408203125, -32.0205078125, -30.60693359375, -29.193359375, -27.77978515625, -26.3662109375, -24.95263671875, -23.5390625, -22.12548828125, -20.7119140625, -19.29833984375, -17.884765625, -16.47119140625, -15.0576171875, -13.64404296875, -12.23046875, -10.81689453125, -9.4033203125, -7.98974609375, -6.576171875, -5.16259765625, -3.7490234375, -2.33544921875, -0.921875, 0.49169921875, 1.9052734375, 3.31884765625, 4.732421875, 6.14599609375, 7.5595703125, 8.97314453125, 10.38671875, 11.80029296875, 13.2138671875, 14.62744140625, 16.041015625, 17.45458984375, 18.8681640625, 20.28173828125, 21.6953125, 23.10888671875, 24.5224609375, 25.93603515625, 27.349609375, 28.76318359375, 30.1767578125, 31.59033203125, 33.00390625, 34.41748046875, 35.8310546875, 37.24462890625, 38.658203125, 40.07177734375, 41.4853515625, 42.89892578125, 44.3125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 4.0, 9.0, 11.0, 13.0, 20.0, 22.0, 16.0, 26.0, 34.0, 38.0, 35.0, 38.0, 45.0, 44.0, 48.0, 49.0, 53.0, 45.0, 53.0, 39.0, 51.0, 47.0, 44.0, 36.0, 30.0, 26.0, 28.0, 18.0, 20.0, 14.0, 7.0, 11.0, 7.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.91854858398438, -106.35018920898438, -102.7818374633789, -99.21348571777344, -95.64512634277344, -92.07676696777344, -88.50841522216797, -84.9400634765625, -81.3717041015625, -77.8033447265625, -74.23499298095703, -70.66664123535156, -67.09828186035156, -63.52992630004883, -59.961570739746094, -56.39321517944336, -52.824859619140625, -49.25650405883789, -45.688148498535156, -42.11979293823242, -38.55143737792969, -34.98308181762695, -31.41472625732422, -27.846370697021484, -24.27801513671875, -20.709659576416016, -17.14130401611328, -13.572948455810547, -10.004592895507812, -6.436237335205078, -2.8678817749023438, 0.7004737854003906, 4.268829345703125, 7.837184906005859, 11.405540466308594, 14.973896026611328, 18.542251586914062, 22.110607147216797, 25.67896270751953, 29.247318267822266, 32.815673828125, 36.384029388427734, 39.95238494873047, 43.5207405090332, 47.08909606933594, 50.65745162963867, 54.225807189941406, 57.79416275024414, 61.362518310546875, 64.93087768554688, 68.49922943115234, 72.06758117675781, 75.63594055175781, 79.20429992675781, 82.77265167236328, 86.34100341796875, 89.90936279296875, 93.47772216796875, 97.04607391357422, 100.61442565917969, 104.18278503417969, 107.75114440917969, 111.31949615478516, 114.88784790039062, 118.45620727539062]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 7.0, 10.0, 11.0, 14.0, 16.0, 21.0, 22.0, 23.0, 25.0, 31.0, 30.0, 26.0, 41.0, 38.0, 36.0, 48.0, 51.0, 41.0, 53.0, 38.0, 44.0, 44.0, 33.0, 39.0, 24.0, 32.0, 36.0, 27.0, 16.0, 17.0, 17.0, 16.0, 13.0, 14.0, 7.0, 9.0, 6.0, 7.0, 6.0, 4.0, 2.0, 0.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-98.07047271728516, -94.94247436523438, -91.81448364257812, -88.68648529052734, -85.55848693847656, -82.43048858642578, -79.302490234375, -76.17449951171875, -73.04650115966797, -69.91850280761719, -66.79051208496094, -63.662513732910156, -60.534515380859375, -57.406517028808594, -54.27852249145508, -51.15052795410156, -48.02252960205078, -44.89453125, -41.766536712646484, -38.63854217529297, -35.51054382324219, -32.382545471191406, -29.25455093383789, -26.126554489135742, -22.998558044433594, -19.870561599731445, -16.742565155029297, -13.614568710327148, -10.486572265625, -7.358575820922852, -4.230579376220703, -1.1025829315185547, 2.0254058837890625, 5.153402328491211, 8.28139877319336, 11.409395217895508, 14.537391662597656, 17.665388107299805, 20.793384552001953, 23.9213809967041, 27.04937744140625, 30.1773738861084, 33.30537033081055, 36.43336486816406, 39.561363220214844, 42.689361572265625, 45.81735610961914, 48.945350646972656, 52.07334899902344, 55.20134735107422, 58.329341888427734, 61.45733642578125, 64.58533477783203, 67.71333312988281, 70.84132385253906, 73.96932220458984, 77.09732055664062, 80.2253189086914, 83.35331726074219, 86.48130798339844, 89.60930633544922, 92.7373046875, 95.86529541015625, 98.99329376220703, 102.12129211425781]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 8.0, 10.0, 12.0, 29.0, 51.0, 72.0, 104.0, 135.0, 260.0, 397.0, 626.0, 934.0, 1409.0, 2198.0, 3503.0, 5550.0, 8509.0, 13101.0, 20303.0, 30190.0, 45584.0, 64961.0, 89587.0, 114359.0, 130913.0, 129345.0, 111773.0, 86409.0, 61882.0, 43365.0, 29024.0, 19000.0, 12314.0, 7929.0, 5271.0, 3393.0, 2124.0, 1468.0, 847.0, 598.0, 327.0, 235.0, 164.0, 116.0, 63.0, 39.0, 22.0, 21.0, 12.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-54.15625, -52.40576171875, -50.6552734375, -48.90478515625, -47.154296875, -45.40380859375, -43.6533203125, -41.90283203125, -40.15234375, -38.40185546875, -36.6513671875, -34.90087890625, -33.150390625, -31.39990234375, -29.6494140625, -27.89892578125, -26.1484375, -24.39794921875, -22.6474609375, -20.89697265625, -19.146484375, -17.39599609375, -15.6455078125, -13.89501953125, -12.14453125, -10.39404296875, -8.6435546875, -6.89306640625, -5.142578125, -3.39208984375, -1.6416015625, 0.10888671875, 1.859375, 3.60986328125, 5.3603515625, 7.11083984375, 8.861328125, 10.61181640625, 12.3623046875, 14.11279296875, 15.86328125, 17.61376953125, 19.3642578125, 21.11474609375, 22.865234375, 24.61572265625, 26.3662109375, 28.11669921875, 29.8671875, 31.61767578125, 33.3681640625, 35.11865234375, 36.869140625, 38.61962890625, 40.3701171875, 42.12060546875, 43.87109375, 45.62158203125, 47.3720703125, 49.12255859375, 50.873046875, 52.62353515625, 54.3740234375, 56.12451171875, 57.875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 5.0, 8.0, 12.0, 13.0, 9.0, 20.0, 23.0, 25.0, 19.0, 23.0, 31.0, 34.0, 21.0, 48.0, 37.0, 44.0, 49.0, 42.0, 42.0, 50.0, 44.0, 40.0, 37.0, 41.0, 34.0, 25.0, 32.0, 31.0, 30.0, 14.0, 18.0, 15.0, 16.0, 14.0, 11.0, 8.0, 8.0, 7.0, 7.0, 5.0, 4.0, 2.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-97.625, -94.486328125, -91.34765625, -88.208984375, -85.0703125, -81.931640625, -78.79296875, -75.654296875, -72.515625, -69.376953125, -66.23828125, -63.099609375, -59.9609375, -56.822265625, -53.68359375, -50.544921875, -47.40625, -44.267578125, -41.12890625, -37.990234375, -34.8515625, -31.712890625, -28.57421875, -25.435546875, -22.296875, -19.158203125, -16.01953125, -12.880859375, -9.7421875, -6.603515625, -3.46484375, -0.326171875, 2.8125, 5.951171875, 9.08984375, 12.228515625, 15.3671875, 18.505859375, 21.64453125, 24.783203125, 27.921875, 31.060546875, 34.19921875, 37.337890625, 40.4765625, 43.615234375, 46.75390625, 49.892578125, 53.03125, 56.169921875, 59.30859375, 62.447265625, 65.5859375, 68.724609375, 71.86328125, 75.001953125, 78.140625, 81.279296875, 84.41796875, 87.556640625, 90.6953125, 93.833984375, 96.97265625, 100.111328125, 103.25]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 7.0, 9.0, 23.0, 27.0, 33.0, 38.0, 61.0, 88.0, 127.0, 184.0, 286.0, 410.0, 675.0, 1059.0, 1706.0, 3156.0, 5654.0, 10787.0, 21474.0, 44708.0, 95794.0, 190230.0, 264878.0, 203258.0, 104419.0, 49371.0, 23558.0, 11695.0, 6255.0, 3396.0, 1916.0, 1178.0, 723.0, 455.0, 276.0, 178.0, 145.0, 105.0, 73.0, 42.0, 27.0, 28.0, 7.0, 17.0, 8.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-94.9375, -92.1904296875, -89.443359375, -86.6962890625, -83.94921875, -81.2021484375, -78.455078125, -75.7080078125, -72.9609375, -70.2138671875, -67.466796875, -64.7197265625, -61.97265625, -59.2255859375, -56.478515625, -53.7314453125, -50.984375, -48.2373046875, -45.490234375, -42.7431640625, -39.99609375, -37.2490234375, -34.501953125, -31.7548828125, -29.0078125, -26.2607421875, -23.513671875, -20.7666015625, -18.01953125, -15.2724609375, -12.525390625, -9.7783203125, -7.03125, -4.2841796875, -1.537109375, 1.2099609375, 3.95703125, 6.7041015625, 9.451171875, 12.1982421875, 14.9453125, 17.6923828125, 20.439453125, 23.1865234375, 25.93359375, 28.6806640625, 31.427734375, 34.1748046875, 36.921875, 39.6689453125, 42.416015625, 45.1630859375, 47.91015625, 50.6572265625, 53.404296875, 56.1513671875, 58.8984375, 61.6455078125, 64.392578125, 67.1396484375, 69.88671875, 72.6337890625, 75.380859375, 78.1279296875, 80.875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 5.0, 9.0, 14.0, 16.0, 12.0, 15.0, 25.0, 18.0, 22.0, 23.0, 19.0, 25.0, 35.0, 22.0, 35.0, 36.0, 38.0, 32.0, 33.0, 34.0, 47.0, 51.0, 40.0, 45.0, 30.0, 36.0, 26.0, 31.0, 26.0, 26.0, 24.0, 23.0, 15.0, 14.0, 21.0, 9.0, 12.0, 8.0, 10.0, 5.0, 5.0, 7.0, 5.0, 0.0, 5.0, 2.0, 2.0, 3.0, 2.0, 3.0], "bins": [-64.375, -62.49169921875, -60.6083984375, -58.72509765625, -56.841796875, -54.95849609375, -53.0751953125, -51.19189453125, -49.30859375, -47.42529296875, -45.5419921875, -43.65869140625, -41.775390625, -39.89208984375, -38.0087890625, -36.12548828125, -34.2421875, -32.35888671875, -30.4755859375, -28.59228515625, -26.708984375, -24.82568359375, -22.9423828125, -21.05908203125, -19.17578125, -17.29248046875, -15.4091796875, -13.52587890625, -11.642578125, -9.75927734375, -7.8759765625, -5.99267578125, -4.109375, -2.22607421875, -0.3427734375, 1.54052734375, 3.423828125, 5.30712890625, 7.1904296875, 9.07373046875, 10.95703125, 12.84033203125, 14.7236328125, 16.60693359375, 18.490234375, 20.37353515625, 22.2568359375, 24.14013671875, 26.0234375, 27.90673828125, 29.7900390625, 31.67333984375, 33.556640625, 35.43994140625, 37.3232421875, 39.20654296875, 41.08984375, 42.97314453125, 44.8564453125, 46.73974609375, 48.623046875, 50.50634765625, 52.3896484375, 54.27294921875, 56.15625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 6.0, 10.0, 20.0, 36.0, 29.0, 43.0, 73.0, 95.0, 156.0, 246.0, 383.0, 612.0, 997.0, 1532.0, 2492.0, 3983.0, 6953.0, 12112.0, 21558.0, 39011.0, 71989.0, 133434.0, 216192.0, 221218.0, 141881.0, 77478.0, 41406.0, 22928.0, 12742.0, 7527.0, 4333.0, 2598.0, 1610.0, 959.0, 635.0, 423.0, 299.0, 169.0, 117.0, 84.0, 57.0, 44.0, 33.0, 14.0, 8.0, 11.0, 7.0, 1.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.34375, -29.397216796875, -28.45068359375, -27.504150390625, -26.5576171875, -25.611083984375, -24.66455078125, -23.718017578125, -22.771484375, -21.824951171875, -20.87841796875, -19.931884765625, -18.9853515625, -18.038818359375, -17.09228515625, -16.145751953125, -15.19921875, -14.252685546875, -13.30615234375, -12.359619140625, -11.4130859375, -10.466552734375, -9.52001953125, -8.573486328125, -7.626953125, -6.680419921875, -5.73388671875, -4.787353515625, -3.8408203125, -2.894287109375, -1.94775390625, -1.001220703125, -0.0546875, 0.891845703125, 1.83837890625, 2.784912109375, 3.7314453125, 4.677978515625, 5.62451171875, 6.571044921875, 7.517578125, 8.464111328125, 9.41064453125, 10.357177734375, 11.3037109375, 12.250244140625, 13.19677734375, 14.143310546875, 15.08984375, 16.036376953125, 16.98291015625, 17.929443359375, 18.8759765625, 19.822509765625, 20.76904296875, 21.715576171875, 22.662109375, 23.608642578125, 24.55517578125, 25.501708984375, 26.4482421875, 27.394775390625, 28.34130859375, 29.287841796875, 30.234375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 4.0, 6.0, 14.0, 22.0, 20.0, 45.0, 50.0, 57.0, 73.0, 95.0, 108.0, 101.0, 101.0, 75.0, 47.0, 49.0, 31.0, 20.0, 12.0, 21.0, 13.0, 6.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00501251220703125, -0.004893064498901367, -0.004773616790771484, -0.0046541690826416016, -0.004534721374511719, -0.004415273666381836, -0.004295825958251953, -0.00417637825012207, -0.0040569305419921875, -0.003937482833862305, -0.003818035125732422, -0.003698587417602539, -0.0035791397094726562, -0.0034596920013427734, -0.0033402442932128906, -0.003220796585083008, -0.003101348876953125, -0.002981901168823242, -0.0028624534606933594, -0.0027430057525634766, -0.0026235580444335938, -0.002504110336303711, -0.002384662628173828, -0.0022652149200439453, -0.0021457672119140625, -0.0020263195037841797, -0.0019068717956542969, -0.001787424087524414, -0.0016679763793945312, -0.0015485286712646484, -0.0014290809631347656, -0.0013096332550048828, -0.001190185546875, -0.0010707378387451172, -0.0009512901306152344, -0.0008318424224853516, -0.0007123947143554688, -0.0005929470062255859, -0.0004734992980957031, -0.0003540515899658203, -0.0002346038818359375, -0.00011515617370605469, 4.291534423828125e-06, 0.00012373924255371094, 0.00024318695068359375, 0.00036263465881347656, 0.0004820823669433594, 0.0006015300750732422, 0.000720977783203125, 0.0008404254913330078, 0.0009598731994628906, 0.0010793209075927734, 0.0011987686157226562, 0.001318216323852539, 0.0014376640319824219, 0.0015571117401123047, 0.0016765594482421875, 0.0017960071563720703, 0.0019154548645019531, 0.002034902572631836, 0.0021543502807617188, 0.0022737979888916016, 0.0023932456970214844, 0.002512693405151367, 0.00263214111328125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 5.0, 7.0, 16.0, 25.0, 26.0, 44.0, 51.0, 86.0, 124.0, 193.0, 256.0, 411.0, 571.0, 800.0, 1179.0, 1802.0, 2675.0, 4271.0, 6278.0, 9893.0, 15354.0, 23372.0, 35642.0, 52472.0, 75151.0, 100131.0, 122048.0, 130308.0, 123214.0, 102440.0, 77100.0, 54416.0, 37324.0, 24666.0, 15989.0, 10380.0, 6682.0, 4451.0, 2856.0, 1908.0, 1280.0, 851.0, 594.0, 404.0, 258.0, 210.0, 112.0, 69.0, 56.0, 43.0, 26.0, 15.0, 12.0, 13.0, 3.0, 4.0, 1.0, 0.0, 0.0, 4.0], "bins": [-30.75, -29.775390625, -28.80078125, -27.826171875, -26.8515625, -25.876953125, -24.90234375, -23.927734375, -22.953125, -21.978515625, -21.00390625, -20.029296875, -19.0546875, -18.080078125, -17.10546875, -16.130859375, -15.15625, -14.181640625, -13.20703125, -12.232421875, -11.2578125, -10.283203125, -9.30859375, -8.333984375, -7.359375, -6.384765625, -5.41015625, -4.435546875, -3.4609375, -2.486328125, -1.51171875, -0.537109375, 0.4375, 1.412109375, 2.38671875, 3.361328125, 4.3359375, 5.310546875, 6.28515625, 7.259765625, 8.234375, 9.208984375, 10.18359375, 11.158203125, 12.1328125, 13.107421875, 14.08203125, 15.056640625, 16.03125, 17.005859375, 17.98046875, 18.955078125, 19.9296875, 20.904296875, 21.87890625, 22.853515625, 23.828125, 24.802734375, 25.77734375, 26.751953125, 27.7265625, 28.701171875, 29.67578125, 30.650390625, 31.625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 1.0, 6.0, 9.0, 6.0, 17.0, 20.0, 17.0, 29.0, 28.0, 31.0, 43.0, 41.0, 40.0, 55.0, 51.0, 55.0, 49.0, 48.0, 55.0, 58.0, 39.0, 41.0, 49.0, 38.0, 28.0, 24.0, 21.0, 22.0, 15.0, 15.0, 13.0, 12.0, 9.0, 2.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-16.109375, -15.692626953125, -15.27587890625, -14.859130859375, -14.4423828125, -14.025634765625, -13.60888671875, -13.192138671875, -12.775390625, -12.358642578125, -11.94189453125, -11.525146484375, -11.1083984375, -10.691650390625, -10.27490234375, -9.858154296875, -9.44140625, -9.024658203125, -8.60791015625, -8.191162109375, -7.7744140625, -7.357666015625, -6.94091796875, -6.524169921875, -6.107421875, -5.690673828125, -5.27392578125, -4.857177734375, -4.4404296875, -4.023681640625, -3.60693359375, -3.190185546875, -2.7734375, -2.356689453125, -1.93994140625, -1.523193359375, -1.1064453125, -0.689697265625, -0.27294921875, 0.143798828125, 0.560546875, 0.977294921875, 1.39404296875, 1.810791015625, 2.2275390625, 2.644287109375, 3.06103515625, 3.477783203125, 3.89453125, 4.311279296875, 4.72802734375, 5.144775390625, 5.5615234375, 5.978271484375, 6.39501953125, 6.811767578125, 7.228515625, 7.645263671875, 8.06201171875, 8.478759765625, 8.8955078125, 9.312255859375, 9.72900390625, 10.145751953125, 10.5625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 8.0, 6.0, 12.0, 16.0, 19.0, 15.0, 29.0, 28.0, 32.0, 24.0, 45.0, 40.0, 47.0, 39.0, 54.0, 37.0, 44.0, 49.0, 40.0, 46.0, 61.0, 38.0, 43.0, 35.0, 34.0, 26.0, 18.0, 19.0, 22.0, 13.0, 13.0, 9.0, 6.0, 9.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-101.94319152832031, -98.51013946533203, -95.07708740234375, -91.64402770996094, -88.21097564697266, -84.77792358398438, -81.34486389160156, -77.91181182861328, -74.478759765625, -71.04570770263672, -67.61265563964844, -64.17959594726562, -60.746543884277344, -57.31349182128906, -53.880435943603516, -50.44738006591797, -47.01432800292969, -43.581275939941406, -40.14822006225586, -36.71516418457031, -33.28211212158203, -29.849058151245117, -26.416004180908203, -22.98295021057129, -19.549896240234375, -16.11684226989746, -12.683788299560547, -9.250734329223633, -5.817680358886719, -2.3846263885498047, 1.0484275817871094, 4.481481552124023, 7.9145355224609375, 11.347589492797852, 14.780643463134766, 18.21369743347168, 21.646751403808594, 25.079805374145508, 28.512859344482422, 31.945913314819336, 35.37896728515625, 38.81201934814453, 42.24507522583008, 45.678131103515625, 49.111183166503906, 52.54423522949219, 55.977291107177734, 59.41034698486328, 62.84339904785156, 66.27645111083984, 69.70950317382812, 73.14256286621094, 76.57561492919922, 80.0086669921875, 83.44172668457031, 86.8747787475586, 90.30783081054688, 93.74088287353516, 97.17393493652344, 100.60699462890625, 104.04004669189453, 107.47309875488281, 110.90615844726562, 114.3392105102539, 117.77226257324219]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 5.0, 7.0, 8.0, 9.0, 21.0, 14.0, 26.0, 14.0, 21.0, 30.0, 27.0, 28.0, 29.0, 28.0, 48.0, 43.0, 44.0, 44.0, 44.0, 49.0, 41.0, 61.0, 34.0, 38.0, 37.0, 20.0, 31.0, 33.0, 30.0, 22.0, 16.0, 17.0, 15.0, 8.0, 11.0, 16.0, 8.0, 5.0, 9.0, 3.0, 2.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-97.33415985107422, -94.13499450683594, -90.93582153320312, -87.73665618896484, -84.53749084472656, -81.33831787109375, -78.13915252685547, -74.93998718261719, -71.74081420898438, -68.5416488647461, -65.34247589111328, -62.143310546875, -58.94414138793945, -55.744972229003906, -52.545806884765625, -49.34663772583008, -46.14746856689453, -42.948299407958984, -39.74913024902344, -36.549964904785156, -33.35079574584961, -30.151626586914062, -26.95245933532715, -23.753292083740234, -20.554122924804688, -17.35495376586914, -14.155786514282227, -10.956618309020996, -7.757450103759766, -4.558281898498535, -1.3591136932373047, 1.8400535583496094, 5.0392303466796875, 8.238398551940918, 11.437566757202148, 14.636734962463379, 17.83590316772461, 21.035072326660156, 24.23423957824707, 27.433406829833984, 30.63257598876953, 33.83174514770508, 37.030914306640625, 40.230079650878906, 43.42924880981445, 46.62841796875, 49.82758331298828, 53.02675247192383, 56.225921630859375, 59.42509078979492, 62.62425994873047, 65.82342529296875, 69.02259826660156, 72.22176361083984, 75.42092895507812, 78.62010192871094, 81.81926727294922, 85.0184326171875, 88.21760559082031, 91.4167709350586, 94.61593627929688, 97.81510925292969, 101.01427459716797, 104.21343994140625, 107.41261291503906]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 8.0, 20.0, 26.0, 68.0, 89.0, 171.0, 301.0, 465.0, 936.0, 1408.0, 2418.0, 3844.0, 5971.0, 9584.0, 14464.0, 21422.0, 30378.0, 42082.0, 56134.0, 70031.0, 83672.0, 94950.0, 100124.0, 99100.0, 91790.0, 80110.0, 66446.0, 51628.0, 38581.0, 27851.0, 19368.0, 12786.0, 8539.0, 5291.0, 3468.0, 1993.0, 1303.0, 705.0, 410.0, 253.0, 150.0, 87.0, 48.0, 38.0, 20.0, 9.0, 6.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-83.5625, -81.01953125, -78.4765625, -75.93359375, -73.390625, -70.84765625, -68.3046875, -65.76171875, -63.21875, -60.67578125, -58.1328125, -55.58984375, -53.046875, -50.50390625, -47.9609375, -45.41796875, -42.875, -40.33203125, -37.7890625, -35.24609375, -32.703125, -30.16015625, -27.6171875, -25.07421875, -22.53125, -19.98828125, -17.4453125, -14.90234375, -12.359375, -9.81640625, -7.2734375, -4.73046875, -2.1875, 0.35546875, 2.8984375, 5.44140625, 7.984375, 10.52734375, 13.0703125, 15.61328125, 18.15625, 20.69921875, 23.2421875, 25.78515625, 28.328125, 30.87109375, 33.4140625, 35.95703125, 38.5, 41.04296875, 43.5859375, 46.12890625, 48.671875, 51.21484375, 53.7578125, 56.30078125, 58.84375, 61.38671875, 63.9296875, 66.47265625, 69.015625, 71.55859375, 74.1015625, 76.64453125, 79.1875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 4.0, 5.0, 8.0, 9.0, 17.0, 12.0, 29.0, 17.0, 17.0, 27.0, 32.0, 26.0, 30.0, 32.0, 41.0, 48.0, 37.0, 48.0, 42.0, 47.0, 49.0, 64.0, 29.0, 38.0, 36.0, 24.0, 29.0, 35.0, 28.0, 22.0, 18.0, 14.0, 17.0, 10.0, 10.0, 17.0, 7.0, 5.0, 10.0, 3.0, 1.0, 7.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-95.3125, -92.19140625, -89.0703125, -85.94921875, -82.828125, -79.70703125, -76.5859375, -73.46484375, -70.34375, -67.22265625, -64.1015625, -60.98046875, -57.859375, -54.73828125, -51.6171875, -48.49609375, -45.375, -42.25390625, -39.1328125, -36.01171875, -32.890625, -29.76953125, -26.6484375, -23.52734375, -20.40625, -17.28515625, -14.1640625, -11.04296875, -7.921875, -4.80078125, -1.6796875, 1.44140625, 4.5625, 7.68359375, 10.8046875, 13.92578125, 17.046875, 20.16796875, 23.2890625, 26.41015625, 29.53125, 32.65234375, 35.7734375, 38.89453125, 42.015625, 45.13671875, 48.2578125, 51.37890625, 54.5, 57.62109375, 60.7421875, 63.86328125, 66.984375, 70.10546875, 73.2265625, 76.34765625, 79.46875, 82.58984375, 85.7109375, 88.83203125, 91.953125, 95.07421875, 98.1953125, 101.31640625, 104.4375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 6.0, 8.0, 12.0, 23.0, 23.0, 41.0, 69.0, 88.0, 156.0, 228.0, 393.0, 625.0, 1066.0, 1730.0, 2802.0, 4442.0, 7160.0, 11090.0, 16818.0, 25245.0, 36023.0, 49999.0, 65603.0, 81792.0, 96006.0, 104778.0, 106133.0, 99588.0, 86842.0, 71302.0, 54851.0, 40487.0, 28544.0, 19379.0, 12895.0, 8304.0, 5278.0, 3252.0, 2146.0, 1295.0, 823.0, 479.0, 273.0, 180.0, 118.0, 54.0, 45.0, 20.0, 23.0, 5.0, 6.0, 9.0, 2.0, 2.0, 2.0, 2.0], "bins": [-99.375, -96.466796875, -93.55859375, -90.650390625, -87.7421875, -84.833984375, -81.92578125, -79.017578125, -76.109375, -73.201171875, -70.29296875, -67.384765625, -64.4765625, -61.568359375, -58.66015625, -55.751953125, -52.84375, -49.935546875, -47.02734375, -44.119140625, -41.2109375, -38.302734375, -35.39453125, -32.486328125, -29.578125, -26.669921875, -23.76171875, -20.853515625, -17.9453125, -15.037109375, -12.12890625, -9.220703125, -6.3125, -3.404296875, -0.49609375, 2.412109375, 5.3203125, 8.228515625, 11.13671875, 14.044921875, 16.953125, 19.861328125, 22.76953125, 25.677734375, 28.5859375, 31.494140625, 34.40234375, 37.310546875, 40.21875, 43.126953125, 46.03515625, 48.943359375, 51.8515625, 54.759765625, 57.66796875, 60.576171875, 63.484375, 66.392578125, 69.30078125, 72.208984375, 75.1171875, 78.025390625, 80.93359375, 83.841796875, 86.75]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 8.0, 2.0, 3.0, 4.0, 5.0, 6.0, 5.0, 11.0, 16.0, 13.0, 22.0, 27.0, 16.0, 27.0, 28.0, 29.0, 29.0, 39.0, 42.0, 44.0, 30.0, 43.0, 42.0, 53.0, 44.0, 40.0, 40.0, 41.0, 52.0, 30.0, 27.0, 28.0, 31.0, 21.0, 21.0, 18.0, 9.0, 16.0, 15.0, 6.0, 6.0, 1.0, 3.0, 7.0, 2.0, 6.0, 5.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.25, -55.0888671875, -52.927734375, -50.7666015625, -48.60546875, -46.4443359375, -44.283203125, -42.1220703125, -39.9609375, -37.7998046875, -35.638671875, -33.4775390625, -31.31640625, -29.1552734375, -26.994140625, -24.8330078125, -22.671875, -20.5107421875, -18.349609375, -16.1884765625, -14.02734375, -11.8662109375, -9.705078125, -7.5439453125, -5.3828125, -3.2216796875, -1.060546875, 1.1005859375, 3.26171875, 5.4228515625, 7.583984375, 9.7451171875, 11.90625, 14.0673828125, 16.228515625, 18.3896484375, 20.55078125, 22.7119140625, 24.873046875, 27.0341796875, 29.1953125, 31.3564453125, 33.517578125, 35.6787109375, 37.83984375, 40.0009765625, 42.162109375, 44.3232421875, 46.484375, 48.6455078125, 50.806640625, 52.9677734375, 55.12890625, 57.2900390625, 59.451171875, 61.6123046875, 63.7734375, 65.9345703125, 68.095703125, 70.2568359375, 72.41796875, 74.5791015625, 76.740234375, 78.9013671875, 81.0625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 11.0, 11.0, 27.0, 48.0, 78.0, 127.0, 189.0, 299.0, 456.0, 735.0, 1179.0, 1849.0, 2836.0, 4646.0, 7524.0, 11589.0, 18850.0, 29164.0, 44728.0, 65417.0, 89567.0, 112906.0, 127232.0, 128258.0, 113938.0, 91327.0, 67279.0, 45893.0, 30277.0, 19506.0, 12276.0, 7550.0, 4721.0, 3053.0, 1903.0, 1117.0, 724.0, 434.0, 289.0, 177.0, 140.0, 80.0, 61.0, 31.0, 21.0, 10.0, 10.0, 7.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0], "bins": [-40.40625, -39.18310546875, -37.9599609375, -36.73681640625, -35.513671875, -34.29052734375, -33.0673828125, -31.84423828125, -30.62109375, -29.39794921875, -28.1748046875, -26.95166015625, -25.728515625, -24.50537109375, -23.2822265625, -22.05908203125, -20.8359375, -19.61279296875, -18.3896484375, -17.16650390625, -15.943359375, -14.72021484375, -13.4970703125, -12.27392578125, -11.05078125, -9.82763671875, -8.6044921875, -7.38134765625, -6.158203125, -4.93505859375, -3.7119140625, -2.48876953125, -1.265625, -0.04248046875, 1.1806640625, 2.40380859375, 3.626953125, 4.85009765625, 6.0732421875, 7.29638671875, 8.51953125, 9.74267578125, 10.9658203125, 12.18896484375, 13.412109375, 14.63525390625, 15.8583984375, 17.08154296875, 18.3046875, 19.52783203125, 20.7509765625, 21.97412109375, 23.197265625, 24.42041015625, 25.6435546875, 26.86669921875, 28.08984375, 29.31298828125, 30.5361328125, 31.75927734375, 32.982421875, 34.20556640625, 35.4287109375, 36.65185546875, 37.875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 8.0, 7.0, 11.0, 10.0, 16.0, 9.0, 12.0, 13.0, 26.0, 16.0, 35.0, 31.0, 46.0, 47.0, 49.0, 48.0, 69.0, 42.0, 46.0, 60.0, 55.0, 52.0, 49.0, 32.0, 26.0, 41.0, 33.0, 16.0, 23.0, 11.0, 18.0, 9.0, 7.0, 6.0, 5.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 5.0, 5.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.005420684814453125, -0.005257546901702881, -0.005094408988952637, -0.004931271076202393, -0.0047681331634521484, -0.004604995250701904, -0.00444185733795166, -0.004278719425201416, -0.004115581512451172, -0.003952443599700928, -0.0037893056869506836, -0.0036261677742004395, -0.0034630298614501953, -0.003299891948699951, -0.003136754035949707, -0.002973616123199463, -0.0028104782104492188, -0.0026473402976989746, -0.0024842023849487305, -0.0023210644721984863, -0.002157926559448242, -0.001994788646697998, -0.001831650733947754, -0.0016685128211975098, -0.0015053749084472656, -0.0013422369956970215, -0.0011790990829467773, -0.0010159611701965332, -0.0008528232574462891, -0.0006896853446960449, -0.0005265474319458008, -0.00036340951919555664, -0.0002002716064453125, -3.713369369506836e-05, 0.00012600421905517578, 0.0002891421318054199, 0.00045228004455566406, 0.0006154179573059082, 0.0007785558700561523, 0.0009416937828063965, 0.0011048316955566406, 0.0012679696083068848, 0.001431107521057129, 0.001594245433807373, 0.0017573833465576172, 0.0019205212593078613, 0.0020836591720581055, 0.0022467970848083496, 0.0024099349975585938, 0.002573072910308838, 0.002736210823059082, 0.002899348735809326, 0.0030624866485595703, 0.0032256245613098145, 0.0033887624740600586, 0.0035519003868103027, 0.003715038299560547, 0.003878176212310791, 0.004041314125061035, 0.004204452037811279, 0.0043675899505615234, 0.004530727863311768, 0.004693865776062012, 0.004857003688812256, 0.0050201416015625]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 6.0, 4.0, 6.0, 10.0, 12.0, 20.0, 36.0, 42.0, 78.0, 120.0, 189.0, 253.0, 428.0, 699.0, 1082.0, 1654.0, 2742.0, 4370.0, 6798.0, 10698.0, 16049.0, 23939.0, 33911.0, 47183.0, 62357.0, 77982.0, 90967.0, 100171.0, 103391.0, 99260.0, 88597.0, 75284.0, 59240.0, 44398.0, 32199.0, 22219.0, 14958.0, 9843.0, 6266.0, 4016.0, 2544.0, 1690.0, 1036.0, 650.0, 398.0, 276.0, 162.0, 124.0, 81.0, 58.0, 30.0, 13.0, 12.0, 6.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0], "bins": [-28.859375, -27.968994140625, -27.07861328125, -26.188232421875, -25.2978515625, -24.407470703125, -23.51708984375, -22.626708984375, -21.736328125, -20.845947265625, -19.95556640625, -19.065185546875, -18.1748046875, -17.284423828125, -16.39404296875, -15.503662109375, -14.61328125, -13.722900390625, -12.83251953125, -11.942138671875, -11.0517578125, -10.161376953125, -9.27099609375, -8.380615234375, -7.490234375, -6.599853515625, -5.70947265625, -4.819091796875, -3.9287109375, -3.038330078125, -2.14794921875, -1.257568359375, -0.3671875, 0.523193359375, 1.41357421875, 2.303955078125, 3.1943359375, 4.084716796875, 4.97509765625, 5.865478515625, 6.755859375, 7.646240234375, 8.53662109375, 9.427001953125, 10.3173828125, 11.207763671875, 12.09814453125, 12.988525390625, 13.87890625, 14.769287109375, 15.65966796875, 16.550048828125, 17.4404296875, 18.330810546875, 19.22119140625, 20.111572265625, 21.001953125, 21.892333984375, 22.78271484375, 23.673095703125, 24.5634765625, 25.453857421875, 26.34423828125, 27.234619140625, 28.125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 4.0, 7.0, 7.0, 13.0, 14.0, 15.0, 20.0, 25.0, 32.0, 37.0, 39.0, 55.0, 48.0, 41.0, 63.0, 65.0, 61.0, 41.0, 56.0, 48.0, 42.0, 40.0, 41.0, 33.0, 22.0, 21.0, 20.0, 17.0, 16.0, 12.0, 15.0, 6.0, 5.0, 6.0, 5.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0390625, -13.5897216796875, -13.140380859375, -12.6910400390625, -12.24169921875, -11.7923583984375, -11.343017578125, -10.8936767578125, -10.4443359375, -9.9949951171875, -9.545654296875, -9.0963134765625, -8.64697265625, -8.1976318359375, -7.748291015625, -7.2989501953125, -6.849609375, -6.4002685546875, -5.950927734375, -5.5015869140625, -5.05224609375, -4.6029052734375, -4.153564453125, -3.7042236328125, -3.2548828125, -2.8055419921875, -2.356201171875, -1.9068603515625, -1.45751953125, -1.0081787109375, -0.558837890625, -0.1094970703125, 0.33984375, 0.7891845703125, 1.238525390625, 1.6878662109375, 2.13720703125, 2.5865478515625, 3.035888671875, 3.4852294921875, 3.9345703125, 4.3839111328125, 4.833251953125, 5.2825927734375, 5.73193359375, 6.1812744140625, 6.630615234375, 7.0799560546875, 7.529296875, 7.9786376953125, 8.427978515625, 8.8773193359375, 9.32666015625, 9.7760009765625, 10.225341796875, 10.6746826171875, 11.1240234375, 11.5733642578125, 12.022705078125, 12.4720458984375, 12.92138671875, 13.3707275390625, 13.820068359375, 14.2694091796875, 14.71875]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 9.0, 6.0, 5.0, 8.0, 13.0, 13.0, 16.0, 25.0, 24.0, 30.0, 20.0, 36.0, 36.0, 45.0, 44.0, 47.0, 47.0, 49.0, 58.0, 42.0, 47.0, 43.0, 43.0, 44.0, 29.0, 34.0, 36.0, 24.0, 24.0, 16.0, 15.0, 13.0, 12.0, 8.0, 15.0, 8.0, 4.0, 7.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-112.98036193847656, -109.52311706542969, -106.06587219238281, -102.60862731933594, -99.15138244628906, -95.69413757324219, -92.23689270019531, -88.77964782714844, -85.32240295410156, -81.86515808105469, -78.40791320800781, -74.95066833496094, -71.49342346191406, -68.03617858886719, -64.57893371582031, -61.12168884277344, -57.66444396972656, -54.20719909667969, -50.74995422363281, -47.29270935058594, -43.83546447753906, -40.37821960449219, -36.92097473144531, -33.46372985839844, -30.006484985351562, -26.549240112304688, -23.091995239257812, -19.634750366210938, -16.177505493164062, -12.720260620117188, -9.263015747070312, -5.8057708740234375, -2.3485336303710938, 1.1087112426757812, 4.565956115722656, 8.023200988769531, 11.480445861816406, 14.937690734863281, 18.394935607910156, 21.85218048095703, 25.309425354003906, 28.76667022705078, 32.223915100097656, 35.68115997314453, 39.138404846191406, 42.59564971923828, 46.052894592285156, 49.51013946533203, 52.967384338378906, 56.42462921142578, 59.881874084472656, 63.33911895751953, 66.7963638305664, 70.25360870361328, 73.71085357666016, 77.16809844970703, 80.6253433227539, 84.08258819580078, 87.53983306884766, 90.99707794189453, 94.4543228149414, 97.91156768798828, 101.36881256103516, 104.82605743408203, 108.2833023071289]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 4.0, 8.0, 5.0, 11.0, 7.0, 10.0, 15.0, 12.0, 22.0, 17.0, 17.0, 25.0, 26.0, 28.0, 37.0, 36.0, 32.0, 22.0, 34.0, 35.0, 48.0, 35.0, 34.0, 51.0, 52.0, 42.0, 34.0, 32.0, 29.0, 37.0, 19.0, 36.0, 20.0, 19.0, 15.0, 18.0, 11.0, 21.0, 11.0, 6.0, 7.0, 3.0, 2.0, 6.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-95.73394012451172, -92.62911224365234, -89.52428436279297, -86.41946411132812, -83.31463623046875, -80.20980834960938, -77.10498046875, -74.00015258789062, -70.89533233642578, -67.7905044555664, -64.68567657470703, -61.58085250854492, -58.47602844238281, -55.37120056152344, -52.26637268066406, -49.16154861450195, -46.05672073364258, -42.9518928527832, -39.847068786621094, -36.74224090576172, -33.63741683959961, -30.532588958740234, -27.427762985229492, -24.32293701171875, -21.218111038208008, -18.113285064697266, -15.008459091186523, -11.903632164001465, -8.798806190490723, -5.6939802169799805, -2.589153289794922, 0.5156726837158203, 3.6204986572265625, 6.725324630737305, 9.830150604248047, 12.934977531433105, 16.03980255126953, 19.144630432128906, 22.24945640563965, 25.35428237915039, 28.459108352661133, 31.563934326171875, 34.66876220703125, 37.77358627319336, 40.878414154052734, 43.983238220214844, 47.08806610107422, 50.192893981933594, 53.2977180480957, 56.40254592895508, 59.50736999511719, 62.61219787597656, 65.71702575683594, 68.82184600830078, 71.92667388916016, 75.03150177001953, 78.1363296508789, 81.24115753173828, 84.34598541259766, 87.4508056640625, 90.55563354492188, 93.66046142578125, 96.76528930664062, 99.8701171875, 102.97493743896484]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 6.0, 13.0, 13.0, 34.0, 63.0, 123.0, 190.0, 311.0, 481.0, 806.0, 1348.0, 2144.0, 3800.0, 6028.0, 9866.0, 15983.0, 25157.0, 39803.0, 61392.0, 91992.0, 135771.0, 193454.0, 261132.0, 334169.0, 398381.0, 439286.0, 446291.0, 415087.0, 357187.0, 285830.0, 214020.0, 152937.0, 105316.0, 70395.0, 46094.0, 29556.0, 18844.0, 11812.0, 7263.0, 4561.0, 2792.0, 1751.0, 1053.0, 616.0, 433.0, 261.0, 185.0, 106.0, 58.0, 37.0, 25.0, 16.0, 10.0, 3.0, 5.0, 0.0, 4.0], "bins": [-83.25, -80.740234375, -78.23046875, -75.720703125, -73.2109375, -70.701171875, -68.19140625, -65.681640625, -63.171875, -60.662109375, -58.15234375, -55.642578125, -53.1328125, -50.623046875, -48.11328125, -45.603515625, -43.09375, -40.583984375, -38.07421875, -35.564453125, -33.0546875, -30.544921875, -28.03515625, -25.525390625, -23.015625, -20.505859375, -17.99609375, -15.486328125, -12.9765625, -10.466796875, -7.95703125, -5.447265625, -2.9375, -0.427734375, 2.08203125, 4.591796875, 7.1015625, 9.611328125, 12.12109375, 14.630859375, 17.140625, 19.650390625, 22.16015625, 24.669921875, 27.1796875, 29.689453125, 32.19921875, 34.708984375, 37.21875, 39.728515625, 42.23828125, 44.748046875, 47.2578125, 49.767578125, 52.27734375, 54.787109375, 57.296875, 59.806640625, 62.31640625, 64.826171875, 67.3359375, 69.845703125, 72.35546875, 74.865234375, 77.375]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 8.0, 9.0, 10.0, 9.0, 13.0, 19.0, 15.0, 20.0, 19.0, 25.0, 27.0, 31.0, 36.0, 33.0, 32.0, 28.0, 27.0, 44.0, 41.0, 44.0, 38.0, 52.0, 39.0, 53.0, 31.0, 33.0, 33.0, 34.0, 32.0, 23.0, 15.0, 18.0, 16.0, 14.0, 24.0, 10.0, 8.0, 6.0, 5.0, 2.0, 5.0, 8.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.3125, -87.4619140625, -84.611328125, -81.7607421875, -78.91015625, -76.0595703125, -73.208984375, -70.3583984375, -67.5078125, -64.6572265625, -61.806640625, -58.9560546875, -56.10546875, -53.2548828125, -50.404296875, -47.5537109375, -44.703125, -41.8525390625, -39.001953125, -36.1513671875, -33.30078125, -30.4501953125, -27.599609375, -24.7490234375, -21.8984375, -19.0478515625, -16.197265625, -13.3466796875, -10.49609375, -7.6455078125, -4.794921875, -1.9443359375, 0.90625, 3.7568359375, 6.607421875, 9.4580078125, 12.30859375, 15.1591796875, 18.009765625, 20.8603515625, 23.7109375, 26.5615234375, 29.412109375, 32.2626953125, 35.11328125, 37.9638671875, 40.814453125, 43.6650390625, 46.515625, 49.3662109375, 52.216796875, 55.0673828125, 57.91796875, 60.7685546875, 63.619140625, 66.4697265625, 69.3203125, 72.1708984375, 75.021484375, 77.8720703125, 80.72265625, 83.5732421875, 86.423828125, 89.2744140625, 92.125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [3.0, 3.0, 8.0, 7.0, 14.0, 26.0, 27.0, 34.0, 68.0, 129.0, 195.0, 333.0, 544.0, 888.0, 1527.0, 2408.0, 4029.0, 6436.0, 10355.0, 16170.0, 24295.0, 37612.0, 55562.0, 79647.0, 112840.0, 152446.0, 200813.0, 252051.0, 301941.0, 342270.0, 370540.0, 377076.0, 362565.0, 330027.0, 284061.0, 234412.0, 183249.0, 138630.0, 100210.0, 71180.0, 49186.0, 32372.0, 21300.0, 13783.0, 8672.0, 5571.0, 3426.0, 2072.0, 1322.0, 754.0, 506.0, 287.0, 148.0, 103.0, 67.0, 44.0, 31.0, 10.0, 12.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-72.9375, -70.609375, -68.28125, -65.953125, -63.625, -61.296875, -58.96875, -56.640625, -54.3125, -51.984375, -49.65625, -47.328125, -45.0, -42.671875, -40.34375, -38.015625, -35.6875, -33.359375, -31.03125, -28.703125, -26.375, -24.046875, -21.71875, -19.390625, -17.0625, -14.734375, -12.40625, -10.078125, -7.75, -5.421875, -3.09375, -0.765625, 1.5625, 3.890625, 6.21875, 8.546875, 10.875, 13.203125, 15.53125, 17.859375, 20.1875, 22.515625, 24.84375, 27.171875, 29.5, 31.828125, 34.15625, 36.484375, 38.8125, 41.140625, 43.46875, 45.796875, 48.125, 50.453125, 52.78125, 55.109375, 57.4375, 59.765625, 62.09375, 64.421875, 66.75, 69.078125, 71.40625, 73.734375, 76.0625]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 2.0, 7.0, 6.0, 10.0, 14.0, 25.0, 35.0, 35.0, 53.0, 48.0, 66.0, 70.0, 96.0, 98.0, 110.0, 131.0, 139.0, 143.0, 200.0, 167.0, 193.0, 220.0, 205.0, 191.0, 202.0, 190.0, 195.0, 178.0, 165.0, 132.0, 131.0, 113.0, 78.0, 73.0, 71.0, 46.0, 52.0, 35.0, 40.0, 28.0, 19.0, 16.0, 15.0, 10.0, 4.0, 6.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-44.0625, -42.716796875, -41.37109375, -40.025390625, -38.6796875, -37.333984375, -35.98828125, -34.642578125, -33.296875, -31.951171875, -30.60546875, -29.259765625, -27.9140625, -26.568359375, -25.22265625, -23.876953125, -22.53125, -21.185546875, -19.83984375, -18.494140625, -17.1484375, -15.802734375, -14.45703125, -13.111328125, -11.765625, -10.419921875, -9.07421875, -7.728515625, -6.3828125, -5.037109375, -3.69140625, -2.345703125, -1.0, 0.345703125, 1.69140625, 3.037109375, 4.3828125, 5.728515625, 7.07421875, 8.419921875, 9.765625, 11.111328125, 12.45703125, 13.802734375, 15.1484375, 16.494140625, 17.83984375, 19.185546875, 20.53125, 21.876953125, 23.22265625, 24.568359375, 25.9140625, 27.259765625, 28.60546875, 29.951171875, 31.296875, 32.642578125, 33.98828125, 35.333984375, 36.6796875, 38.025390625, 39.37109375, 40.716796875, 42.0625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 8.0, 9.0, 6.0, 12.0, 15.0, 11.0, 16.0, 15.0, 28.0, 35.0, 27.0, 34.0, 31.0, 38.0, 48.0, 38.0, 46.0, 49.0, 47.0, 50.0, 44.0, 48.0, 33.0, 41.0, 31.0, 39.0, 30.0, 33.0, 24.0, 24.0, 17.0, 14.0, 6.0, 12.0, 6.0, 9.0, 6.0, 7.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.15003204345703, -114.64317321777344, -111.13630676269531, -107.62944793701172, -104.1225814819336, -100.61572265625, -97.10885620117188, -93.60199737548828, -90.09513854980469, -86.5882797241211, -83.08141326904297, -79.57455444335938, -76.06768798828125, -72.56082916259766, -69.05397033691406, -65.54710388183594, -62.04024124145508, -58.53337860107422, -55.02651596069336, -51.5196533203125, -48.012794494628906, -44.50593185424805, -40.99906921386719, -37.492210388183594, -33.98534393310547, -30.47848129272461, -26.971620559692383, -23.464757919311523, -19.957897186279297, -16.451034545898438, -12.944171905517578, -9.437311172485352, -5.930450439453125, -2.423588514328003, 1.0832734107971191, 4.59013557434082, 8.096997261047363, 11.603858947753906, 15.110721588134766, 18.617582321166992, 22.12444496154785, 25.63130760192871, 29.138168334960938, 32.6450309753418, 36.151893615722656, 39.65875244140625, 43.165618896484375, 46.67247772216797, 50.17934036254883, 53.68620300292969, 57.19306564331055, 60.699928283691406, 64.206787109375, 67.71365356445312, 71.22051239013672, 74.72737121582031, 78.23423767089844, 81.74109649658203, 85.24796295166016, 88.75482177734375, 92.26168823242188, 95.76854705810547, 99.27540588378906, 102.78227233886719, 106.28913116455078]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 7.0, 9.0, 8.0, 3.0, 7.0, 19.0, 16.0, 16.0, 28.0, 20.0, 38.0, 20.0, 25.0, 36.0, 36.0, 38.0, 35.0, 46.0, 41.0, 37.0, 47.0, 46.0, 40.0, 42.0, 42.0, 39.0, 31.0, 26.0, 32.0, 27.0, 17.0, 17.0, 19.0, 12.0, 26.0, 12.0, 9.0, 2.0, 3.0, 8.0, 7.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-112.1991958618164, -108.85623931884766, -105.5132827758789, -102.17032623291016, -98.8273696899414, -95.48441314697266, -92.14146423339844, -88.79850769042969, -85.45555114746094, -82.11259460449219, -78.76963806152344, -75.42668151855469, -72.08372497558594, -68.74076843261719, -65.39781188964844, -62.05485916137695, -58.71189880371094, -55.36894226074219, -52.02598571777344, -48.68302917480469, -45.34007263183594, -41.99711608886719, -38.6541633605957, -35.31120681762695, -31.968250274658203, -28.625293731689453, -25.282337188720703, -21.939382553100586, -18.596426010131836, -15.253469467163086, -11.910514831542969, -8.567558288574219, -5.2245941162109375, -1.8816380500793457, 1.461318016052246, 4.80427360534668, 8.14723014831543, 11.49018669128418, 14.833141326904297, 18.176097869873047, 21.519054412841797, 24.862010955810547, 28.204967498779297, 31.547922134399414, 34.89087677001953, 38.23383331298828, 41.57678985595703, 44.91974639892578, 48.26270294189453, 51.60565948486328, 54.94861602783203, 58.29157257080078, 61.63452911376953, 64.97748565673828, 68.3204345703125, 71.66339111328125, 75.00634765625, 78.34930419921875, 81.6922607421875, 85.03521728515625, 88.378173828125, 91.72113037109375, 95.0640869140625, 98.40704345703125, 101.75]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 4.0, 7.0, 12.0, 20.0, 30.0, 42.0, 53.0, 86.0, 124.0, 172.0, 241.0, 347.0, 420.0, 646.0, 912.0, 1228.0, 1659.0, 2416.0, 3736.0, 6012.0, 10649.0, 19863.0, 39247.0, 78254.0, 150601.0, 235549.0, 219813.0, 132182.0, 67563.0, 33435.0, 17275.0, 9269.0, 5479.0, 3311.0, 2337.0, 1553.0, 1068.0, 818.0, 635.0, 440.0, 317.0, 240.0, 138.0, 118.0, 74.0, 64.0, 43.0, 22.0, 15.0, 3.0, 6.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-109.375, -105.9453125, -102.515625, -99.0859375, -95.65625, -92.2265625, -88.796875, -85.3671875, -81.9375, -78.5078125, -75.078125, -71.6484375, -68.21875, -64.7890625, -61.359375, -57.9296875, -54.5, -51.0703125, -47.640625, -44.2109375, -40.78125, -37.3515625, -33.921875, -30.4921875, -27.0625, -23.6328125, -20.203125, -16.7734375, -13.34375, -9.9140625, -6.484375, -3.0546875, 0.375, 3.8046875, 7.234375, 10.6640625, 14.09375, 17.5234375, 20.953125, 24.3828125, 27.8125, 31.2421875, 34.671875, 38.1015625, 41.53125, 44.9609375, 48.390625, 51.8203125, 55.25, 58.6796875, 62.109375, 65.5390625, 68.96875, 72.3984375, 75.828125, 79.2578125, 82.6875, 86.1171875, 89.546875, 92.9765625, 96.40625, 99.8359375, 103.265625, 106.6953125, 110.125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 5.0, 10.0, 6.0, 9.0, 3.0, 7.0, 22.0, 17.0, 21.0, 20.0, 29.0, 35.0, 19.0, 33.0, 34.0, 28.0, 44.0, 40.0, 45.0, 36.0, 41.0, 49.0, 41.0, 38.0, 49.0, 37.0, 37.0, 31.0, 28.0, 32.0, 20.0, 20.0, 14.0, 17.0, 19.0, 20.0, 11.0, 6.0, 4.0, 5.0, 5.0, 9.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-111.4375, -108.115234375, -104.79296875, -101.470703125, -98.1484375, -94.826171875, -91.50390625, -88.181640625, -84.859375, -81.537109375, -78.21484375, -74.892578125, -71.5703125, -68.248046875, -64.92578125, -61.603515625, -58.28125, -54.958984375, -51.63671875, -48.314453125, -44.9921875, -41.669921875, -38.34765625, -35.025390625, -31.703125, -28.380859375, -25.05859375, -21.736328125, -18.4140625, -15.091796875, -11.76953125, -8.447265625, -5.125, -1.802734375, 1.51953125, 4.841796875, 8.1640625, 11.486328125, 14.80859375, 18.130859375, 21.453125, 24.775390625, 28.09765625, 31.419921875, 34.7421875, 38.064453125, 41.38671875, 44.708984375, 48.03125, 51.353515625, 54.67578125, 57.998046875, 61.3203125, 64.642578125, 67.96484375, 71.287109375, 74.609375, 77.931640625, 81.25390625, 84.576171875, 87.8984375, 91.220703125, 94.54296875, 97.865234375, 101.1875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 6.0, 7.0, 10.0, 11.0, 30.0, 32.0, 56.0, 74.0, 98.0, 161.0, 197.0, 331.0, 532.0, 763.0, 1214.0, 2141.0, 3789.0, 6788.0, 13540.0, 30462.0, 96452.0, 382866.0, 361570.0, 89486.0, 29207.0, 12953.0, 6565.0, 3496.0, 2075.0, 1292.0, 828.0, 493.0, 339.0, 220.0, 155.0, 82.0, 64.0, 43.0, 35.0, 22.0, 21.0, 9.0, 18.0, 3.0, 8.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-173.25, -167.65625, -162.0625, -156.46875, -150.875, -145.28125, -139.6875, -134.09375, -128.5, -122.90625, -117.3125, -111.71875, -106.125, -100.53125, -94.9375, -89.34375, -83.75, -78.15625, -72.5625, -66.96875, -61.375, -55.78125, -50.1875, -44.59375, -39.0, -33.40625, -27.8125, -22.21875, -16.625, -11.03125, -5.4375, 0.15625, 5.75, 11.34375, 16.9375, 22.53125, 28.125, 33.71875, 39.3125, 44.90625, 50.5, 56.09375, 61.6875, 67.28125, 72.875, 78.46875, 84.0625, 89.65625, 95.25, 100.84375, 106.4375, 112.03125, 117.625, 123.21875, 128.8125, 134.40625, 140.0, 145.59375, 151.1875, 156.78125, 162.375, 167.96875, 173.5625, 179.15625, 184.75]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 6.0, 6.0, 5.0, 7.0, 4.0, 7.0, 10.0, 7.0, 15.0, 25.0, 20.0, 32.0, 36.0, 36.0, 41.0, 39.0, 45.0, 53.0, 45.0, 58.0, 42.0, 58.0, 48.0, 57.0, 31.0, 44.0, 41.0, 39.0, 27.0, 28.0, 28.0, 20.0, 13.0, 14.0, 5.0, 3.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.125, -84.384765625, -81.64453125, -78.904296875, -76.1640625, -73.423828125, -70.68359375, -67.943359375, -65.203125, -62.462890625, -59.72265625, -56.982421875, -54.2421875, -51.501953125, -48.76171875, -46.021484375, -43.28125, -40.541015625, -37.80078125, -35.060546875, -32.3203125, -29.580078125, -26.83984375, -24.099609375, -21.359375, -18.619140625, -15.87890625, -13.138671875, -10.3984375, -7.658203125, -4.91796875, -2.177734375, 0.5625, 3.302734375, 6.04296875, 8.783203125, 11.5234375, 14.263671875, 17.00390625, 19.744140625, 22.484375, 25.224609375, 27.96484375, 30.705078125, 33.4453125, 36.185546875, 38.92578125, 41.666015625, 44.40625, 47.146484375, 49.88671875, 52.626953125, 55.3671875, 58.107421875, 60.84765625, 63.587890625, 66.328125, 69.068359375, 71.80859375, 74.548828125, 77.2890625, 80.029296875, 82.76953125, 85.509765625, 88.25]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 6.0, 13.0, 11.0, 23.0, 42.0, 48.0, 85.0, 95.0, 171.0, 210.0, 326.0, 467.0, 617.0, 990.0, 1449.0, 2198.0, 3344.0, 5316.0, 9443.0, 18036.0, 40208.0, 110052.0, 310507.0, 332159.0, 123107.0, 44229.0, 19273.0, 9925.0, 5801.0, 3441.0, 2267.0, 1439.0, 1016.0, 689.0, 499.0, 333.0, 214.0, 160.0, 102.0, 69.0, 44.0, 46.0, 28.0, 20.0, 14.0, 12.0, 5.0, 7.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-61.03125, -59.126953125, -57.22265625, -55.318359375, -53.4140625, -51.509765625, -49.60546875, -47.701171875, -45.796875, -43.892578125, -41.98828125, -40.083984375, -38.1796875, -36.275390625, -34.37109375, -32.466796875, -30.5625, -28.658203125, -26.75390625, -24.849609375, -22.9453125, -21.041015625, -19.13671875, -17.232421875, -15.328125, -13.423828125, -11.51953125, -9.615234375, -7.7109375, -5.806640625, -3.90234375, -1.998046875, -0.09375, 1.810546875, 3.71484375, 5.619140625, 7.5234375, 9.427734375, 11.33203125, 13.236328125, 15.140625, 17.044921875, 18.94921875, 20.853515625, 22.7578125, 24.662109375, 26.56640625, 28.470703125, 30.375, 32.279296875, 34.18359375, 36.087890625, 37.9921875, 39.896484375, 41.80078125, 43.705078125, 45.609375, 47.513671875, 49.41796875, 51.322265625, 53.2265625, 55.130859375, 57.03515625, 58.939453125, 60.84375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 7.0, 4.0, 13.0, 17.0, 41.0, 96.0, 190.0, 271.0, 196.0, 81.0, 32.0, 21.0, 13.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01165771484375, -0.011275529861450195, -0.01089334487915039, -0.010511159896850586, -0.010128974914550781, -0.009746789932250977, -0.009364604949951172, -0.008982419967651367, -0.008600234985351562, -0.008218050003051758, -0.007835865020751953, -0.0074536800384521484, -0.007071495056152344, -0.006689310073852539, -0.006307125091552734, -0.00592494010925293, -0.005542755126953125, -0.00516057014465332, -0.004778385162353516, -0.004396200180053711, -0.004014015197753906, -0.0036318302154541016, -0.003249645233154297, -0.002867460250854492, -0.0024852752685546875, -0.002103090286254883, -0.0017209053039550781, -0.0013387203216552734, -0.0009565353393554688, -0.0005743503570556641, -0.00019216537475585938, 0.0001900196075439453, 0.00057220458984375, 0.0009543895721435547, 0.0013365745544433594, 0.001718759536743164, 0.0021009445190429688, 0.0024831295013427734, 0.002865314483642578, 0.003247499465942383, 0.0036296844482421875, 0.004011869430541992, 0.004394054412841797, 0.0047762393951416016, 0.005158424377441406, 0.005540609359741211, 0.005922794342041016, 0.00630497932434082, 0.006687164306640625, 0.00706934928894043, 0.007451534271240234, 0.007833719253540039, 0.008215904235839844, 0.008598089218139648, 0.008980274200439453, 0.009362459182739258, 0.009744644165039062, 0.010126829147338867, 0.010509014129638672, 0.010891199111938477, 0.011273384094238281, 0.011655569076538086, 0.01203775405883789, 0.012419939041137695, 0.0128021240234375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 17.0, 13.0, 28.0, 29.0, 49.0, 67.0, 92.0, 130.0, 189.0, 250.0, 375.0, 559.0, 843.0, 1146.0, 1660.0, 2422.0, 3681.0, 5738.0, 9148.0, 16075.0, 27812.0, 51003.0, 92898.0, 154404.0, 204624.0, 186493.0, 123976.0, 70772.0, 38896.0, 21482.0, 12108.0, 7223.0, 4649.0, 2974.0, 2057.0, 1414.0, 980.0, 698.0, 477.0, 331.0, 217.0, 159.0, 125.0, 81.0, 58.0, 48.0, 38.0, 14.0, 12.0, 4.0, 4.0, 5.0, 6.0, 4.0, 3.0, 0.0, 1.0], "bins": [-53.65625, -51.96728515625, -50.2783203125, -48.58935546875, -46.900390625, -45.21142578125, -43.5224609375, -41.83349609375, -40.14453125, -38.45556640625, -36.7666015625, -35.07763671875, -33.388671875, -31.69970703125, -30.0107421875, -28.32177734375, -26.6328125, -24.94384765625, -23.2548828125, -21.56591796875, -19.876953125, -18.18798828125, -16.4990234375, -14.81005859375, -13.12109375, -11.43212890625, -9.7431640625, -8.05419921875, -6.365234375, -4.67626953125, -2.9873046875, -1.29833984375, 0.390625, 2.07958984375, 3.7685546875, 5.45751953125, 7.146484375, 8.83544921875, 10.5244140625, 12.21337890625, 13.90234375, 15.59130859375, 17.2802734375, 18.96923828125, 20.658203125, 22.34716796875, 24.0361328125, 25.72509765625, 27.4140625, 29.10302734375, 30.7919921875, 32.48095703125, 34.169921875, 35.85888671875, 37.5478515625, 39.23681640625, 40.92578125, 42.61474609375, 44.3037109375, 45.99267578125, 47.681640625, 49.37060546875, 51.0595703125, 52.74853515625, 54.4375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 4.0, 5.0, 4.0, 8.0, 23.0, 17.0, 22.0, 21.0, 24.0, 45.0, 51.0, 49.0, 74.0, 63.0, 95.0, 65.0, 61.0, 53.0, 51.0, 50.0, 34.0, 33.0, 32.0, 29.0, 25.0, 18.0, 8.0, 8.0, 10.0, 5.0, 7.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.984375, -15.345703125, -14.70703125, -14.068359375, -13.4296875, -12.791015625, -12.15234375, -11.513671875, -10.875, -10.236328125, -9.59765625, -8.958984375, -8.3203125, -7.681640625, -7.04296875, -6.404296875, -5.765625, -5.126953125, -4.48828125, -3.849609375, -3.2109375, -2.572265625, -1.93359375, -1.294921875, -0.65625, -0.017578125, 0.62109375, 1.259765625, 1.8984375, 2.537109375, 3.17578125, 3.814453125, 4.453125, 5.091796875, 5.73046875, 6.369140625, 7.0078125, 7.646484375, 8.28515625, 8.923828125, 9.5625, 10.201171875, 10.83984375, 11.478515625, 12.1171875, 12.755859375, 13.39453125, 14.033203125, 14.671875, 15.310546875, 15.94921875, 16.587890625, 17.2265625, 17.865234375, 18.50390625, 19.142578125, 19.78125, 20.419921875, 21.05859375, 21.697265625, 22.3359375, 22.974609375, 23.61328125, 24.251953125, 24.890625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 7.0, 8.0, 13.0, 10.0, 14.0, 17.0, 14.0, 20.0, 28.0, 21.0, 33.0, 35.0, 30.0, 40.0, 35.0, 50.0, 50.0, 42.0, 57.0, 53.0, 43.0, 33.0, 42.0, 34.0, 30.0, 43.0, 33.0, 37.0, 28.0, 19.0, 18.0, 10.0, 11.0, 3.0, 11.0, 6.0, 3.0, 6.0, 9.0, 2.0, 0.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.13176727294922, -109.57005310058594, -106.00834655761719, -102.4466323852539, -98.88491821289062, -95.32320404052734, -91.76148986816406, -88.19978332519531, -84.63806915283203, -81.07635498046875, -77.5146484375, -73.95293426513672, -70.39122009277344, -66.82950592041016, -63.26779556274414, -59.706085205078125, -56.144371032714844, -52.58265686035156, -49.02094650268555, -45.45923614501953, -41.89752197265625, -38.33580780029297, -34.77409744262695, -31.212385177612305, -27.650672912597656, -24.088960647583008, -20.52724838256836, -16.96553611755371, -13.403823852539062, -9.842111587524414, -6.280399322509766, -2.718687057495117, 0.8430328369140625, 4.404745101928711, 7.966457366943359, 11.528169631958008, 15.089881896972656, 18.651594161987305, 22.213306427001953, 25.7750186920166, 29.33673095703125, 32.89844512939453, 36.46015548706055, 40.02186584472656, 43.583580017089844, 47.145294189453125, 50.70700454711914, 54.268714904785156, 57.83042907714844, 61.39214324951172, 64.953857421875, 68.51556396484375, 72.07727813720703, 75.63899230957031, 79.20069885253906, 82.76241302490234, 86.32412719726562, 89.8858413696289, 93.44755554199219, 97.00926208496094, 100.57097625732422, 104.1326904296875, 107.69439697265625, 111.25611114501953, 114.81782531738281]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 8.0, 8.0, 6.0, 9.0, 5.0, 11.0, 17.0, 12.0, 21.0, 22.0, 32.0, 24.0, 23.0, 29.0, 49.0, 38.0, 32.0, 34.0, 41.0, 43.0, 38.0, 47.0, 47.0, 40.0, 34.0, 46.0, 42.0, 29.0, 34.0, 18.0, 26.0, 21.0, 17.0, 21.0, 15.0, 14.0, 10.0, 9.0, 6.0, 9.0, 4.0, 2.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-116.03997802734375, -112.6844711303711, -109.32896423339844, -105.97345733642578, -102.61795043945312, -99.26244354248047, -95.90693664550781, -92.55143737792969, -89.1959228515625, -85.84041595458984, -82.48490905761719, -79.12940216064453, -75.77389526367188, -72.41838836669922, -69.06288146972656, -65.70738220214844, -62.35187530517578, -58.996368408203125, -55.64086151123047, -52.28535461425781, -48.929847717285156, -45.5743408203125, -42.21883773803711, -38.86333084106445, -35.5078239440918, -32.15231704711914, -28.796810150146484, -25.44130516052246, -22.085798263549805, -18.73029136657715, -15.374786376953125, -12.019279479980469, -8.663780212402344, -5.308273792266846, -1.9527673721313477, 1.4027385711669922, 4.758245468139648, 8.113752365112305, 11.469257354736328, 14.824764251708984, 18.18027114868164, 21.535778045654297, 24.891284942626953, 28.246789932250977, 31.602296829223633, 34.957801818847656, 38.31330871582031, 41.66881561279297, 45.024322509765625, 48.37982940673828, 51.73533630371094, 55.090843200683594, 58.44635009765625, 61.801856994628906, 65.15736389160156, 68.51286315917969, 71.86837768554688, 75.22388458251953, 78.57939147949219, 81.93489837646484, 85.2904052734375, 88.64591217041016, 92.00141906738281, 95.35691833496094, 98.7124252319336]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 7.0, 6.0, 15.0, 23.0, 34.0, 58.0, 97.0, 183.0, 242.0, 409.0, 655.0, 1080.0, 1754.0, 2741.0, 4347.0, 6690.0, 10146.0, 14885.0, 21357.0, 29933.0, 39691.0, 51853.0, 63918.0, 75673.0, 85146.0, 90821.0, 92150.0, 88578.0, 80293.0, 70239.0, 57513.0, 45596.0, 34354.0, 25313.0, 17672.0, 12214.0, 8269.0, 5429.0, 3438.0, 2154.0, 1401.0, 859.0, 527.0, 308.0, 192.0, 124.0, 65.0, 54.0, 28.0, 15.0, 6.0, 5.0, 5.0, 4.0, 1.0], "bins": [-83.5625, -81.19140625, -78.8203125, -76.44921875, -74.078125, -71.70703125, -69.3359375, -66.96484375, -64.59375, -62.22265625, -59.8515625, -57.48046875, -55.109375, -52.73828125, -50.3671875, -47.99609375, -45.625, -43.25390625, -40.8828125, -38.51171875, -36.140625, -33.76953125, -31.3984375, -29.02734375, -26.65625, -24.28515625, -21.9140625, -19.54296875, -17.171875, -14.80078125, -12.4296875, -10.05859375, -7.6875, -5.31640625, -2.9453125, -0.57421875, 1.796875, 4.16796875, 6.5390625, 8.91015625, 11.28125, 13.65234375, 16.0234375, 18.39453125, 20.765625, 23.13671875, 25.5078125, 27.87890625, 30.25, 32.62109375, 34.9921875, 37.36328125, 39.734375, 42.10546875, 44.4765625, 46.84765625, 49.21875, 51.58984375, 53.9609375, 56.33203125, 58.703125, 61.07421875, 63.4453125, 65.81640625, 68.1875]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 3.0, 7.0, 7.0, 12.0, 8.0, 6.0, 7.0, 15.0, 16.0, 17.0, 25.0, 24.0, 33.0, 26.0, 30.0, 34.0, 49.0, 37.0, 30.0, 42.0, 36.0, 43.0, 46.0, 51.0, 43.0, 29.0, 41.0, 49.0, 32.0, 30.0, 25.0, 20.0, 20.0, 24.0, 15.0, 17.0, 10.0, 11.0, 7.0, 10.0, 6.0, 5.0, 1.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-112.9375, -109.6669921875, -106.396484375, -103.1259765625, -99.85546875, -96.5849609375, -93.314453125, -90.0439453125, -86.7734375, -83.5029296875, -80.232421875, -76.9619140625, -73.69140625, -70.4208984375, -67.150390625, -63.8798828125, -60.609375, -57.3388671875, -54.068359375, -50.7978515625, -47.52734375, -44.2568359375, -40.986328125, -37.7158203125, -34.4453125, -31.1748046875, -27.904296875, -24.6337890625, -21.36328125, -18.0927734375, -14.822265625, -11.5517578125, -8.28125, -5.0107421875, -1.740234375, 1.5302734375, 4.80078125, 8.0712890625, 11.341796875, 14.6123046875, 17.8828125, 21.1533203125, 24.423828125, 27.6943359375, 30.96484375, 34.2353515625, 37.505859375, 40.7763671875, 44.046875, 47.3173828125, 50.587890625, 53.8583984375, 57.12890625, 60.3994140625, 63.669921875, 66.9404296875, 70.2109375, 73.4814453125, 76.751953125, 80.0224609375, 83.29296875, 86.5634765625, 89.833984375, 93.1044921875, 96.375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 4.0, 5.0, 15.0, 32.0, 39.0, 64.0, 117.0, 167.0, 278.0, 419.0, 772.0, 1333.0, 1997.0, 3171.0, 5190.0, 7968.0, 12336.0, 18331.0, 26945.0, 37572.0, 50261.0, 64842.0, 79390.0, 90504.0, 98177.0, 99937.0, 95105.0, 85145.0, 71897.0, 57019.0, 43441.0, 31572.0, 22192.0, 15223.0, 10027.0, 6492.0, 3999.0, 2595.0, 1584.0, 914.0, 555.0, 330.0, 222.0, 138.0, 89.0, 61.0, 25.0, 21.0, 13.0, 10.0, 5.0, 2.0, 11.0, 1.0, 2.0, 1.0, 2.0], "bins": [-83.3125, -80.728515625, -78.14453125, -75.560546875, -72.9765625, -70.392578125, -67.80859375, -65.224609375, -62.640625, -60.056640625, -57.47265625, -54.888671875, -52.3046875, -49.720703125, -47.13671875, -44.552734375, -41.96875, -39.384765625, -36.80078125, -34.216796875, -31.6328125, -29.048828125, -26.46484375, -23.880859375, -21.296875, -18.712890625, -16.12890625, -13.544921875, -10.9609375, -8.376953125, -5.79296875, -3.208984375, -0.625, 1.958984375, 4.54296875, 7.126953125, 9.7109375, 12.294921875, 14.87890625, 17.462890625, 20.046875, 22.630859375, 25.21484375, 27.798828125, 30.3828125, 32.966796875, 35.55078125, 38.134765625, 40.71875, 43.302734375, 45.88671875, 48.470703125, 51.0546875, 53.638671875, 56.22265625, 58.806640625, 61.390625, 63.974609375, 66.55859375, 69.142578125, 71.7265625, 74.310546875, 76.89453125, 79.478515625, 82.0625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 6.0, 9.0, 4.0, 4.0, 8.0, 9.0, 17.0, 9.0, 17.0, 17.0, 17.0, 18.0, 24.0, 20.0, 31.0, 38.0, 34.0, 32.0, 40.0, 39.0, 34.0, 41.0, 31.0, 57.0, 27.0, 29.0, 45.0, 26.0, 32.0, 29.0, 31.0, 31.0, 23.0, 23.0, 19.0, 19.0, 16.0, 14.0, 17.0, 16.0, 6.0, 10.0, 8.0, 5.0, 5.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0], "bins": [-63.46875, -61.49267578125, -59.5166015625, -57.54052734375, -55.564453125, -53.58837890625, -51.6123046875, -49.63623046875, -47.66015625, -45.68408203125, -43.7080078125, -41.73193359375, -39.755859375, -37.77978515625, -35.8037109375, -33.82763671875, -31.8515625, -29.87548828125, -27.8994140625, -25.92333984375, -23.947265625, -21.97119140625, -19.9951171875, -18.01904296875, -16.04296875, -14.06689453125, -12.0908203125, -10.11474609375, -8.138671875, -6.16259765625, -4.1865234375, -2.21044921875, -0.234375, 1.74169921875, 3.7177734375, 5.69384765625, 7.669921875, 9.64599609375, 11.6220703125, 13.59814453125, 15.57421875, 17.55029296875, 19.5263671875, 21.50244140625, 23.478515625, 25.45458984375, 27.4306640625, 29.40673828125, 31.3828125, 33.35888671875, 35.3349609375, 37.31103515625, 39.287109375, 41.26318359375, 43.2392578125, 45.21533203125, 47.19140625, 49.16748046875, 51.1435546875, 53.11962890625, 55.095703125, 57.07177734375, 59.0478515625, 61.02392578125, 63.0]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 6.0, 5.0, 3.0, 9.0, 15.0, 33.0, 40.0, 43.0, 89.0, 128.0, 197.0, 327.0, 567.0, 846.0, 1279.0, 2234.0, 3755.0, 6273.0, 10410.0, 17343.0, 28612.0, 44641.0, 66906.0, 92587.0, 116764.0, 131149.0, 131000.0, 116385.0, 92232.0, 67528.0, 44955.0, 28363.0, 17618.0, 10315.0, 6324.0, 3725.0, 2250.0, 1329.0, 817.0, 522.0, 334.0, 196.0, 144.0, 95.0, 63.0, 35.0, 22.0, 17.0, 12.0, 6.0, 4.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.78125, -36.52197265625, -35.2626953125, -34.00341796875, -32.744140625, -31.48486328125, -30.2255859375, -28.96630859375, -27.70703125, -26.44775390625, -25.1884765625, -23.92919921875, -22.669921875, -21.41064453125, -20.1513671875, -18.89208984375, -17.6328125, -16.37353515625, -15.1142578125, -13.85498046875, -12.595703125, -11.33642578125, -10.0771484375, -8.81787109375, -7.55859375, -6.29931640625, -5.0400390625, -3.78076171875, -2.521484375, -1.26220703125, -0.0029296875, 1.25634765625, 2.515625, 3.77490234375, 5.0341796875, 6.29345703125, 7.552734375, 8.81201171875, 10.0712890625, 11.33056640625, 12.58984375, 13.84912109375, 15.1083984375, 16.36767578125, 17.626953125, 18.88623046875, 20.1455078125, 21.40478515625, 22.6640625, 23.92333984375, 25.1826171875, 26.44189453125, 27.701171875, 28.96044921875, 30.2197265625, 31.47900390625, 32.73828125, 33.99755859375, 35.2568359375, 36.51611328125, 37.775390625, 39.03466796875, 40.2939453125, 41.55322265625, 42.8125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 6.0, 8.0, 11.0, 11.0, 17.0, 24.0, 29.0, 34.0, 51.0, 42.0, 55.0, 56.0, 70.0, 74.0, 60.0, 80.0, 52.0, 68.0, 49.0, 46.0, 28.0, 23.0, 31.0, 22.0, 15.0, 12.0, 8.0, 7.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00592041015625, -0.005708158016204834, -0.005495905876159668, -0.005283653736114502, -0.005071401596069336, -0.00485914945602417, -0.004646897315979004, -0.004434645175933838, -0.004222393035888672, -0.004010140895843506, -0.00379788875579834, -0.003585636615753174, -0.003373384475708008, -0.003161132335662842, -0.0029488801956176758, -0.0027366280555725098, -0.0025243759155273438, -0.0023121237754821777, -0.0020998716354370117, -0.0018876194953918457, -0.0016753673553466797, -0.0014631152153015137, -0.0012508630752563477, -0.0010386109352111816, -0.0008263587951660156, -0.0006141066551208496, -0.0004018545150756836, -0.00018960237503051758, 2.2649765014648438e-05, 0.00023490190505981445, 0.00044715404510498047, 0.0006594061851501465, 0.0008716583251953125, 0.0010839104652404785, 0.0012961626052856445, 0.0015084147453308105, 0.0017206668853759766, 0.0019329190254211426, 0.0021451711654663086, 0.0023574233055114746, 0.0025696754455566406, 0.0027819275856018066, 0.0029941797256469727, 0.0032064318656921387, 0.0034186840057373047, 0.0036309361457824707, 0.0038431882858276367, 0.004055440425872803, 0.004267692565917969, 0.004479944705963135, 0.004692196846008301, 0.004904448986053467, 0.005116701126098633, 0.005328953266143799, 0.005541205406188965, 0.005753457546234131, 0.005965709686279297, 0.006177961826324463, 0.006390213966369629, 0.006602466106414795, 0.006814718246459961, 0.007026970386505127, 0.007239222526550293, 0.007451474666595459, 0.007663726806640625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 13.0, 14.0, 16.0, 32.0, 37.0, 93.0, 130.0, 213.0, 344.0, 526.0, 831.0, 1331.0, 2073.0, 3375.0, 4961.0, 8039.0, 12060.0, 17899.0, 25685.0, 36390.0, 48687.0, 63514.0, 77232.0, 89913.0, 97806.0, 100230.0, 96277.0, 86002.0, 72393.0, 57969.0, 44552.0, 32358.0, 22977.0, 15391.0, 10538.0, 6715.0, 4329.0, 2757.0, 1785.0, 1110.0, 748.0, 455.0, 286.0, 150.0, 114.0, 74.0, 73.0, 27.0, 16.0, 8.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-30.265625, -29.329345703125, -28.39306640625, -27.456787109375, -26.5205078125, -25.584228515625, -24.64794921875, -23.711669921875, -22.775390625, -21.839111328125, -20.90283203125, -19.966552734375, -19.0302734375, -18.093994140625, -17.15771484375, -16.221435546875, -15.28515625, -14.348876953125, -13.41259765625, -12.476318359375, -11.5400390625, -10.603759765625, -9.66748046875, -8.731201171875, -7.794921875, -6.858642578125, -5.92236328125, -4.986083984375, -4.0498046875, -3.113525390625, -2.17724609375, -1.240966796875, -0.3046875, 0.631591796875, 1.56787109375, 2.504150390625, 3.4404296875, 4.376708984375, 5.31298828125, 6.249267578125, 7.185546875, 8.121826171875, 9.05810546875, 9.994384765625, 10.9306640625, 11.866943359375, 12.80322265625, 13.739501953125, 14.67578125, 15.612060546875, 16.54833984375, 17.484619140625, 18.4208984375, 19.357177734375, 20.29345703125, 21.229736328125, 22.166015625, 23.102294921875, 24.03857421875, 24.974853515625, 25.9111328125, 26.847412109375, 27.78369140625, 28.719970703125, 29.65625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 2.0, 7.0, 11.0, 13.0, 12.0, 11.0, 15.0, 12.0, 30.0, 16.0, 21.0, 31.0, 37.0, 35.0, 37.0, 41.0, 42.0, 49.0, 46.0, 50.0, 53.0, 38.0, 43.0, 31.0, 31.0, 37.0, 38.0, 31.0, 27.0, 16.0, 28.0, 9.0, 14.0, 18.0, 11.0, 11.0, 4.0, 9.0, 9.0, 11.0, 4.0, 7.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.0625, -11.6485595703125, -11.234619140625, -10.8206787109375, -10.40673828125, -9.9927978515625, -9.578857421875, -9.1649169921875, -8.7509765625, -8.3370361328125, -7.923095703125, -7.5091552734375, -7.09521484375, -6.6812744140625, -6.267333984375, -5.8533935546875, -5.439453125, -5.0255126953125, -4.611572265625, -4.1976318359375, -3.78369140625, -3.3697509765625, -2.955810546875, -2.5418701171875, -2.1279296875, -1.7139892578125, -1.300048828125, -0.8861083984375, -0.47216796875, -0.0582275390625, 0.355712890625, 0.7696533203125, 1.18359375, 1.5975341796875, 2.011474609375, 2.4254150390625, 2.83935546875, 3.2532958984375, 3.667236328125, 4.0811767578125, 4.4951171875, 4.9090576171875, 5.322998046875, 5.7369384765625, 6.15087890625, 6.5648193359375, 6.978759765625, 7.3927001953125, 7.806640625, 8.2205810546875, 8.634521484375, 9.0484619140625, 9.46240234375, 9.8763427734375, 10.290283203125, 10.7042236328125, 11.1181640625, 11.5321044921875, 11.946044921875, 12.3599853515625, 12.77392578125, 13.1878662109375, 13.601806640625, 14.0157470703125, 14.4296875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 4.0, 6.0, 5.0, 11.0, 13.0, 17.0, 12.0, 21.0, 31.0, 22.0, 29.0, 31.0, 37.0, 31.0, 47.0, 56.0, 43.0, 48.0, 55.0, 49.0, 59.0, 33.0, 52.0, 37.0, 31.0, 34.0, 27.0, 34.0, 36.0, 15.0, 20.0, 9.0, 11.0, 6.0, 9.0, 6.0, 7.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.1883544921875, -120.39750671386719, -116.6066665649414, -112.81582641601562, -109.02497863769531, -105.234130859375, -101.44329071044922, -97.65245056152344, -93.86160278320312, -90.07075500488281, -86.27991485595703, -82.48907470703125, -78.69822692871094, -74.90737915039062, -71.11653900146484, -67.32569885253906, -63.53485107421875, -59.7440071105957, -55.953163146972656, -52.16231918334961, -48.37147521972656, -44.580631256103516, -40.78978729248047, -36.99894332885742, -33.208099365234375, -29.417255401611328, -25.62641143798828, -21.835567474365234, -18.044723510742188, -14.25387954711914, -10.463035583496094, -6.672191619873047, -2.88134765625, 0.9094963073730469, 4.700340270996094, 8.49118423461914, 12.282028198242188, 16.072872161865234, 19.86371612548828, 23.654560089111328, 27.445404052734375, 31.236248016357422, 35.02709197998047, 38.817935943603516, 42.60877990722656, 46.39962387084961, 50.190467834472656, 53.9813117980957, 57.77215576171875, 61.5629997253418, 65.35384368896484, 69.14468383789062, 72.93553161621094, 76.72637939453125, 80.51721954345703, 84.30805969238281, 88.09890747070312, 91.88975524902344, 95.68059539794922, 99.471435546875, 103.26228332519531, 107.05313110351562, 110.8439712524414, 114.63481140136719, 118.4256591796875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 6.0, 8.0, 9.0, 5.0, 5.0, 14.0, 21.0, 12.0, 10.0, 18.0, 29.0, 33.0, 23.0, 26.0, 28.0, 33.0, 30.0, 41.0, 44.0, 43.0, 34.0, 42.0, 45.0, 43.0, 43.0, 34.0, 47.0, 30.0, 42.0, 28.0, 29.0, 20.0, 27.0, 17.0, 17.0, 12.0, 15.0, 8.0, 7.0, 9.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-115.82787322998047, -112.46138763427734, -109.09489440917969, -105.72840881347656, -102.36192321777344, -98.99542999267578, -95.62894439697266, -92.262451171875, -88.89596557617188, -85.52947998046875, -82.1629867553711, -78.79650115966797, -75.43001556396484, -72.06352233886719, -68.69703674316406, -65.33055114746094, -61.96406173706055, -58.597572326660156, -55.23108673095703, -51.86459732055664, -48.49810791015625, -45.131622314453125, -41.765132904052734, -38.398643493652344, -35.03215789794922, -31.66567039489746, -28.29918098449707, -24.932693481445312, -21.566204071044922, -18.199716567993164, -14.833229064941406, -11.466739654541016, -8.100250244140625, -4.733761787414551, -1.3672738075256348, 1.9992141723632812, 5.3657026290893555, 8.73219108581543, 12.098678588867188, 15.465167999267578, 18.831655502319336, 22.198143005371094, 25.564632415771484, 28.931119918823242, 32.297607421875, 35.66409683227539, 39.03058624267578, 42.397071838378906, 45.7635612487793, 49.13005065917969, 52.49653625488281, 55.8630256652832, 59.229515075683594, 62.59600067138672, 65.96249389648438, 69.3289794921875, 72.69546508789062, 76.06195068359375, 79.4284439086914, 82.79492950439453, 86.16141510009766, 89.52790832519531, 92.89439392089844, 96.26087951660156, 99.62737274169922]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 10.0, 28.0, 29.0, 55.0, 78.0, 155.0, 295.0, 504.0, 853.0, 1403.0, 2463.0, 4208.0, 7071.0, 11659.0, 19053.0, 30279.0, 48254.0, 75335.0, 112316.0, 161737.0, 224440.0, 296067.0, 365620.0, 420919.0, 447949.0, 436023.0, 391642.0, 326860.0, 253659.0, 186370.0, 130409.0, 87753.0, 57413.0, 36010.0, 22674.0, 13904.0, 8401.0, 5127.0, 2917.0, 1825.0, 1003.0, 626.0, 363.0, 214.0, 128.0, 67.0, 50.0, 31.0, 17.0, 9.0, 2.0, 5.0, 3.0, 2.0, 2.0, 2.0], "bins": [-86.375, -83.7333984375, -81.091796875, -78.4501953125, -75.80859375, -73.1669921875, -70.525390625, -67.8837890625, -65.2421875, -62.6005859375, -59.958984375, -57.3173828125, -54.67578125, -52.0341796875, -49.392578125, -46.7509765625, -44.109375, -41.4677734375, -38.826171875, -36.1845703125, -33.54296875, -30.9013671875, -28.259765625, -25.6181640625, -22.9765625, -20.3349609375, -17.693359375, -15.0517578125, -12.41015625, -9.7685546875, -7.126953125, -4.4853515625, -1.84375, 0.7978515625, 3.439453125, 6.0810546875, 8.72265625, 11.3642578125, 14.005859375, 16.6474609375, 19.2890625, 21.9306640625, 24.572265625, 27.2138671875, 29.85546875, 32.4970703125, 35.138671875, 37.7802734375, 40.421875, 43.0634765625, 45.705078125, 48.3466796875, 50.98828125, 53.6298828125, 56.271484375, 58.9130859375, 61.5546875, 64.1962890625, 66.837890625, 69.4794921875, 72.12109375, 74.7626953125, 77.404296875, 80.0458984375, 82.6875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 5.0, 10.0, 9.0, 5.0, 4.0, 11.0, 16.0, 23.0, 8.0, 17.0, 32.0, 36.0, 18.0, 24.0, 22.0, 30.0, 40.0, 38.0, 51.0, 33.0, 42.0, 42.0, 39.0, 48.0, 44.0, 40.0, 40.0, 28.0, 40.0, 38.0, 21.0, 27.0, 20.0, 20.0, 19.0, 9.0, 16.0, 9.0, 7.0, 6.0, 4.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-104.0, -100.9638671875, -97.927734375, -94.8916015625, -91.85546875, -88.8193359375, -85.783203125, -82.7470703125, -79.7109375, -76.6748046875, -73.638671875, -70.6025390625, -67.56640625, -64.5302734375, -61.494140625, -58.4580078125, -55.421875, -52.3857421875, -49.349609375, -46.3134765625, -43.27734375, -40.2412109375, -37.205078125, -34.1689453125, -31.1328125, -28.0966796875, -25.060546875, -22.0244140625, -18.98828125, -15.9521484375, -12.916015625, -9.8798828125, -6.84375, -3.8076171875, -0.771484375, 2.2646484375, 5.30078125, 8.3369140625, 11.373046875, 14.4091796875, 17.4453125, 20.4814453125, 23.517578125, 26.5537109375, 29.58984375, 32.6259765625, 35.662109375, 38.6982421875, 41.734375, 44.7705078125, 47.806640625, 50.8427734375, 53.87890625, 56.9150390625, 59.951171875, 62.9873046875, 66.0234375, 69.0595703125, 72.095703125, 75.1318359375, 78.16796875, 81.2041015625, 84.240234375, 87.2763671875, 90.3125]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [3.0, 2.0, 7.0, 11.0, 26.0, 38.0, 49.0, 100.0, 142.0, 249.0, 457.0, 719.0, 1182.0, 2083.0, 3396.0, 5337.0, 8738.0, 13713.0, 21165.0, 32502.0, 48091.0, 69238.0, 97283.0, 133456.0, 175499.0, 220877.0, 268878.0, 310654.0, 343647.0, 360894.0, 359598.0, 340444.0, 306378.0, 262975.0, 216041.0, 170127.0, 128336.0, 94066.0, 66323.0, 45980.0, 30822.0, 20194.0, 13183.0, 8222.0, 5206.0, 3177.0, 1920.0, 1203.0, 682.0, 405.0, 240.0, 151.0, 77.0, 55.0, 38.0, 8.0, 5.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.375, -68.9912109375, -66.607421875, -64.2236328125, -61.83984375, -59.4560546875, -57.072265625, -54.6884765625, -52.3046875, -49.9208984375, -47.537109375, -45.1533203125, -42.76953125, -40.3857421875, -38.001953125, -35.6181640625, -33.234375, -30.8505859375, -28.466796875, -26.0830078125, -23.69921875, -21.3154296875, -18.931640625, -16.5478515625, -14.1640625, -11.7802734375, -9.396484375, -7.0126953125, -4.62890625, -2.2451171875, 0.138671875, 2.5224609375, 4.90625, 7.2900390625, 9.673828125, 12.0576171875, 14.44140625, 16.8251953125, 19.208984375, 21.5927734375, 23.9765625, 26.3603515625, 28.744140625, 31.1279296875, 33.51171875, 35.8955078125, 38.279296875, 40.6630859375, 43.046875, 45.4306640625, 47.814453125, 50.1982421875, 52.58203125, 54.9658203125, 57.349609375, 59.7333984375, 62.1171875, 64.5009765625, 66.884765625, 69.2685546875, 71.65234375, 74.0361328125, 76.419921875, 78.8037109375, 81.1875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 0.0, 3.0, 2.0, 6.0, 6.0, 4.0, 9.0, 12.0, 18.0, 14.0, 29.0, 37.0, 27.0, 30.0, 49.0, 50.0, 67.0, 81.0, 84.0, 89.0, 119.0, 117.0, 135.0, 134.0, 144.0, 179.0, 159.0, 181.0, 149.0, 173.0, 191.0, 172.0, 168.0, 149.0, 161.0, 152.0, 122.0, 119.0, 122.0, 92.0, 81.0, 64.0, 58.0, 65.0, 50.0, 46.0, 37.0, 31.0, 21.0, 20.0, 11.0, 12.0, 11.0, 4.0, 6.0, 5.0, 4.0, 1.0, 2.0, 2.0, 3.0], "bins": [-40.21875, -38.98095703125, -37.7431640625, -36.50537109375, -35.267578125, -34.02978515625, -32.7919921875, -31.55419921875, -30.31640625, -29.07861328125, -27.8408203125, -26.60302734375, -25.365234375, -24.12744140625, -22.8896484375, -21.65185546875, -20.4140625, -19.17626953125, -17.9384765625, -16.70068359375, -15.462890625, -14.22509765625, -12.9873046875, -11.74951171875, -10.51171875, -9.27392578125, -8.0361328125, -6.79833984375, -5.560546875, -4.32275390625, -3.0849609375, -1.84716796875, -0.609375, 0.62841796875, 1.8662109375, 3.10400390625, 4.341796875, 5.57958984375, 6.8173828125, 8.05517578125, 9.29296875, 10.53076171875, 11.7685546875, 13.00634765625, 14.244140625, 15.48193359375, 16.7197265625, 17.95751953125, 19.1953125, 20.43310546875, 21.6708984375, 22.90869140625, 24.146484375, 25.38427734375, 26.6220703125, 27.85986328125, 29.09765625, 30.33544921875, 31.5732421875, 32.81103515625, 34.048828125, 35.28662109375, 36.5244140625, 37.76220703125, 39.0]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 4.0, 8.0, 5.0, 9.0, 8.0, 14.0, 17.0, 21.0, 18.0, 29.0, 36.0, 34.0, 38.0, 38.0, 45.0, 35.0, 50.0, 50.0, 44.0, 55.0, 38.0, 45.0, 41.0, 35.0, 38.0, 35.0, 35.0, 26.0, 27.0, 30.0, 14.0, 10.0, 13.0, 13.0, 8.0, 9.0, 4.0, 4.0, 8.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-112.99324035644531, -109.22698974609375, -105.46073913574219, -101.69448852539062, -97.92823791503906, -94.1619873046875, -90.39573669433594, -86.62948608398438, -82.86323547363281, -79.09698486328125, -75.33073425292969, -71.56448364257812, -67.79823303222656, -64.031982421875, -60.2657356262207, -56.49948501586914, -52.733238220214844, -48.96698760986328, -45.20073699951172, -41.434486389160156, -37.668235778808594, -33.90198516845703, -30.135738372802734, -26.369487762451172, -22.60323715209961, -18.836986541748047, -15.0707368850708, -11.304487228393555, -7.538236618041992, -3.7719860076904297, -0.0057373046875, 3.7605133056640625, 7.526763916015625, 11.293014526367188, 15.059264183044434, 18.82551383972168, 22.591764450073242, 26.358015060424805, 30.124263763427734, 33.8905143737793, 37.65676498413086, 41.42301559448242, 45.189266204833984, 48.95551300048828, 52.721763610839844, 56.488014221191406, 60.25426483154297, 64.02051544189453, 67.7867660522461, 71.55301666259766, 75.31926727294922, 79.08551788330078, 82.85176849365234, 86.6180191040039, 90.38426208496094, 94.1505126953125, 97.91676330566406, 101.68301391601562, 105.44926452636719, 109.21551513671875, 112.98176574707031, 116.74801635742188, 120.51426696777344, 124.280517578125, 128.04676818847656]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 6.0, 3.0, 9.0, 11.0, 10.0, 10.0, 12.0, 9.0, 12.0, 17.0, 25.0, 12.0, 21.0, 23.0, 50.0, 37.0, 37.0, 35.0, 42.0, 43.0, 46.0, 53.0, 49.0, 33.0, 31.0, 48.0, 41.0, 37.0, 45.0, 36.0, 30.0, 19.0, 31.0, 25.0, 9.0, 12.0, 8.0, 4.0, 6.0, 3.0, 6.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-114.14955139160156, -110.68359375, -107.21763610839844, -103.75167083740234, -100.28571319580078, -96.81975555419922, -93.35379028320312, -89.88783264160156, -86.421875, -82.95591735839844, -79.48995971679688, -76.02399444580078, -72.55803680419922, -69.09207916259766, -65.62611389160156, -62.16015625, -58.69419860839844, -55.228240966796875, -51.76227951049805, -48.29631805419922, -44.830360412597656, -41.364402770996094, -37.898441314697266, -34.43247985839844, -30.966522216796875, -27.50056266784668, -24.034603118896484, -20.56864356994629, -17.102684020996094, -13.636724472045898, -10.170764923095703, -6.704805374145508, -3.2388458251953125, 0.2271137237548828, 3.693073272705078, 7.159032821655273, 10.624992370605469, 14.090951919555664, 17.55691146850586, 21.022871017456055, 24.48883056640625, 27.954790115356445, 31.42074966430664, 34.88671112060547, 38.35266876220703, 41.818626403808594, 45.28458786010742, 48.75054931640625, 52.21650695800781, 55.682464599609375, 59.1484260559082, 62.61438751220703, 66.0803451538086, 69.54630279541016, 73.01226806640625, 76.47822570800781, 79.94418334960938, 83.41014099121094, 86.8760986328125, 90.3420639038086, 93.80802154541016, 97.27397918701172, 100.73994445800781, 104.20590209960938, 107.67185974121094]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 10.0, 18.0, 24.0, 41.0, 62.0, 90.0, 128.0, 207.0, 309.0, 485.0, 743.0, 1211.0, 1872.0, 2998.0, 4817.0, 7538.0, 12072.0, 20172.0, 32397.0, 51587.0, 79186.0, 112930.0, 141850.0, 151234.0, 134364.0, 102680.0, 70481.0, 45262.0, 28009.0, 17445.0, 10641.0, 6361.0, 4150.0, 2613.0, 1654.0, 1030.0, 685.0, 472.0, 256.0, 172.0, 103.0, 70.0, 48.0, 33.0, 23.0, 12.0, 8.0, 2.0, 3.0, 4.0, 1.0, 2.0], "bins": [-74.0, -71.90673828125, -69.8134765625, -67.72021484375, -65.626953125, -63.53369140625, -61.4404296875, -59.34716796875, -57.25390625, -55.16064453125, -53.0673828125, -50.97412109375, -48.880859375, -46.78759765625, -44.6943359375, -42.60107421875, -40.5078125, -38.41455078125, -36.3212890625, -34.22802734375, -32.134765625, -30.04150390625, -27.9482421875, -25.85498046875, -23.76171875, -21.66845703125, -19.5751953125, -17.48193359375, -15.388671875, -13.29541015625, -11.2021484375, -9.10888671875, -7.015625, -4.92236328125, -2.8291015625, -0.73583984375, 1.357421875, 3.45068359375, 5.5439453125, 7.63720703125, 9.73046875, 11.82373046875, 13.9169921875, 16.01025390625, 18.103515625, 20.19677734375, 22.2900390625, 24.38330078125, 26.4765625, 28.56982421875, 30.6630859375, 32.75634765625, 34.849609375, 36.94287109375, 39.0361328125, 41.12939453125, 43.22265625, 45.31591796875, 47.4091796875, 49.50244140625, 51.595703125, 53.68896484375, 55.7822265625, 57.87548828125, 59.96875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 5.0, 5.0, 9.0, 10.0, 12.0, 9.0, 12.0, 8.0, 15.0, 20.0, 21.0, 13.0, 17.0, 36.0, 45.0, 38.0, 34.0, 37.0, 39.0, 48.0, 46.0, 51.0, 46.0, 35.0, 29.0, 55.0, 42.0, 35.0, 47.0, 31.0, 27.0, 22.0, 28.0, 23.0, 7.0, 11.0, 9.0, 5.0, 5.0, 3.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-113.375, -109.9248046875, -106.474609375, -103.0244140625, -99.57421875, -96.1240234375, -92.673828125, -89.2236328125, -85.7734375, -82.3232421875, -78.873046875, -75.4228515625, -71.97265625, -68.5224609375, -65.072265625, -61.6220703125, -58.171875, -54.7216796875, -51.271484375, -47.8212890625, -44.37109375, -40.9208984375, -37.470703125, -34.0205078125, -30.5703125, -27.1201171875, -23.669921875, -20.2197265625, -16.76953125, -13.3193359375, -9.869140625, -6.4189453125, -2.96875, 0.4814453125, 3.931640625, 7.3818359375, 10.83203125, 14.2822265625, 17.732421875, 21.1826171875, 24.6328125, 28.0830078125, 31.533203125, 34.9833984375, 38.43359375, 41.8837890625, 45.333984375, 48.7841796875, 52.234375, 55.6845703125, 59.134765625, 62.5849609375, 66.03515625, 69.4853515625, 72.935546875, 76.3857421875, 79.8359375, 83.2861328125, 86.736328125, 90.1865234375, 93.63671875, 97.0869140625, 100.537109375, 103.9873046875, 107.4375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 8.0, 7.0, 7.0, 15.0, 36.0, 35.0, 56.0, 73.0, 123.0, 161.0, 232.0, 297.0, 471.0, 696.0, 1120.0, 1799.0, 3118.0, 5435.0, 10558.0, 21628.0, 51249.0, 134216.0, 311948.0, 294638.0, 121183.0, 46514.0, 20182.0, 9687.0, 5313.0, 2796.0, 1724.0, 1057.0, 727.0, 456.0, 313.0, 194.0, 149.0, 91.0, 84.0, 48.0, 48.0, 23.0, 6.0, 12.0, 9.0, 5.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-137.125, -133.201171875, -129.27734375, -125.353515625, -121.4296875, -117.505859375, -113.58203125, -109.658203125, -105.734375, -101.810546875, -97.88671875, -93.962890625, -90.0390625, -86.115234375, -82.19140625, -78.267578125, -74.34375, -70.419921875, -66.49609375, -62.572265625, -58.6484375, -54.724609375, -50.80078125, -46.876953125, -42.953125, -39.029296875, -35.10546875, -31.181640625, -27.2578125, -23.333984375, -19.41015625, -15.486328125, -11.5625, -7.638671875, -3.71484375, 0.208984375, 4.1328125, 8.056640625, 11.98046875, 15.904296875, 19.828125, 23.751953125, 27.67578125, 31.599609375, 35.5234375, 39.447265625, 43.37109375, 47.294921875, 51.21875, 55.142578125, 59.06640625, 62.990234375, 66.9140625, 70.837890625, 74.76171875, 78.685546875, 82.609375, 86.533203125, 90.45703125, 94.380859375, 98.3046875, 102.228515625, 106.15234375, 110.076171875, 114.0]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 4.0, 3.0, 4.0, 5.0, 11.0, 7.0, 16.0, 16.0, 12.0, 18.0, 18.0, 12.0, 23.0, 20.0, 26.0, 35.0, 33.0, 34.0, 36.0, 48.0, 46.0, 48.0, 36.0, 34.0, 44.0, 30.0, 39.0, 37.0, 30.0, 36.0, 28.0, 35.0, 33.0, 22.0, 31.0, 13.0, 8.0, 14.0, 14.0, 9.0, 12.0, 7.0, 5.0, 4.0, 5.0, 7.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-67.4375, -65.4130859375, -63.388671875, -61.3642578125, -59.33984375, -57.3154296875, -55.291015625, -53.2666015625, -51.2421875, -49.2177734375, -47.193359375, -45.1689453125, -43.14453125, -41.1201171875, -39.095703125, -37.0712890625, -35.046875, -33.0224609375, -30.998046875, -28.9736328125, -26.94921875, -24.9248046875, -22.900390625, -20.8759765625, -18.8515625, -16.8271484375, -14.802734375, -12.7783203125, -10.75390625, -8.7294921875, -6.705078125, -4.6806640625, -2.65625, -0.6318359375, 1.392578125, 3.4169921875, 5.44140625, 7.4658203125, 9.490234375, 11.5146484375, 13.5390625, 15.5634765625, 17.587890625, 19.6123046875, 21.63671875, 23.6611328125, 25.685546875, 27.7099609375, 29.734375, 31.7587890625, 33.783203125, 35.8076171875, 37.83203125, 39.8564453125, 41.880859375, 43.9052734375, 45.9296875, 47.9541015625, 49.978515625, 52.0029296875, 54.02734375, 56.0517578125, 58.076171875, 60.1005859375, 62.125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 5.0, 8.0, 8.0, 23.0, 25.0, 60.0, 77.0, 121.0, 189.0, 334.0, 491.0, 806.0, 1388.0, 2367.0, 4615.0, 9166.0, 20136.0, 48352.0, 130248.0, 328651.0, 305254.0, 116127.0, 43332.0, 18274.0, 8365.0, 4389.0, 2258.0, 1343.0, 864.0, 493.0, 306.0, 173.0, 108.0, 74.0, 39.0, 33.0, 16.0, 14.0, 11.0, 7.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-56.34375, -54.52294921875, -52.7021484375, -50.88134765625, -49.060546875, -47.23974609375, -45.4189453125, -43.59814453125, -41.77734375, -39.95654296875, -38.1357421875, -36.31494140625, -34.494140625, -32.67333984375, -30.8525390625, -29.03173828125, -27.2109375, -25.39013671875, -23.5693359375, -21.74853515625, -19.927734375, -18.10693359375, -16.2861328125, -14.46533203125, -12.64453125, -10.82373046875, -9.0029296875, -7.18212890625, -5.361328125, -3.54052734375, -1.7197265625, 0.10107421875, 1.921875, 3.74267578125, 5.5634765625, 7.38427734375, 9.205078125, 11.02587890625, 12.8466796875, 14.66748046875, 16.48828125, 18.30908203125, 20.1298828125, 21.95068359375, 23.771484375, 25.59228515625, 27.4130859375, 29.23388671875, 31.0546875, 32.87548828125, 34.6962890625, 36.51708984375, 38.337890625, 40.15869140625, 41.9794921875, 43.80029296875, 45.62109375, 47.44189453125, 49.2626953125, 51.08349609375, 52.904296875, 54.72509765625, 56.5458984375, 58.36669921875, 60.1875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 3.0, 8.0, 8.0, 17.0, 17.0, 19.0, 27.0, 34.0, 38.0, 54.0, 50.0, 59.0, 67.0, 94.0, 72.0, 67.0, 73.0, 57.0, 50.0, 40.0, 29.0, 26.0, 21.0, 18.0, 13.0, 10.0, 11.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036144256591796875, -0.0035037994384765625, -0.0033931732177734375, -0.0032825469970703125, -0.0031719207763671875, -0.0030612945556640625, -0.0029506683349609375, -0.0028400421142578125, -0.0027294158935546875, -0.0026187896728515625, -0.0025081634521484375, -0.0023975372314453125, -0.0022869110107421875, -0.0021762847900390625, -0.0020656585693359375, -0.0019550323486328125, -0.0018444061279296875, -0.0017337799072265625, -0.0016231536865234375, -0.0015125274658203125, -0.0014019012451171875, -0.0012912750244140625, -0.0011806488037109375, -0.0010700225830078125, -0.0009593963623046875, -0.0008487701416015625, -0.0007381439208984375, -0.0006275177001953125, -0.0005168914794921875, -0.0004062652587890625, -0.0002956390380859375, -0.0001850128173828125, -7.43865966796875e-05, 3.62396240234375e-05, 0.0001468658447265625, 0.0002574920654296875, 0.0003681182861328125, 0.0004787445068359375, 0.0005893707275390625, 0.0006999969482421875, 0.0008106231689453125, 0.0009212493896484375, 0.0010318756103515625, 0.0011425018310546875, 0.0012531280517578125, 0.0013637542724609375, 0.0014743804931640625, 0.0015850067138671875, 0.0016956329345703125, 0.0018062591552734375, 0.0019168853759765625, 0.0020275115966796875, 0.0021381378173828125, 0.0022487640380859375, 0.0023593902587890625, 0.0024700164794921875, 0.0025806427001953125, 0.0026912689208984375, 0.0028018951416015625, 0.0029125213623046875, 0.0030231475830078125, 0.0031337738037109375, 0.0032444000244140625, 0.0033550262451171875, 0.0034656524658203125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 5.0, 3.0, 16.0, 13.0, 23.0, 40.0, 54.0, 55.0, 107.0, 141.0, 257.0, 406.0, 632.0, 865.0, 1347.0, 2105.0, 3524.0, 5607.0, 9257.0, 16121.0, 27587.0, 47329.0, 79241.0, 121530.0, 160856.0, 171937.0, 144327.0, 101609.0, 62970.0, 37199.0, 21175.0, 12585.0, 7419.0, 4413.0, 2769.0, 1740.0, 1138.0, 704.0, 469.0, 325.0, 225.0, 130.0, 105.0, 78.0, 42.0, 29.0, 16.0, 7.0, 10.0, 4.0, 6.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-48.9375, -47.37255859375, -45.8076171875, -44.24267578125, -42.677734375, -41.11279296875, -39.5478515625, -37.98291015625, -36.41796875, -34.85302734375, -33.2880859375, -31.72314453125, -30.158203125, -28.59326171875, -27.0283203125, -25.46337890625, -23.8984375, -22.33349609375, -20.7685546875, -19.20361328125, -17.638671875, -16.07373046875, -14.5087890625, -12.94384765625, -11.37890625, -9.81396484375, -8.2490234375, -6.68408203125, -5.119140625, -3.55419921875, -1.9892578125, -0.42431640625, 1.140625, 2.70556640625, 4.2705078125, 5.83544921875, 7.400390625, 8.96533203125, 10.5302734375, 12.09521484375, 13.66015625, 15.22509765625, 16.7900390625, 18.35498046875, 19.919921875, 21.48486328125, 23.0498046875, 24.61474609375, 26.1796875, 27.74462890625, 29.3095703125, 30.87451171875, 32.439453125, 34.00439453125, 35.5693359375, 37.13427734375, 38.69921875, 40.26416015625, 41.8291015625, 43.39404296875, 44.958984375, 46.52392578125, 48.0888671875, 49.65380859375, 51.21875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 6.0, 3.0, 8.0, 6.0, 10.0, 17.0, 23.0, 25.0, 29.0, 25.0, 49.0, 61.0, 56.0, 78.0, 102.0, 86.0, 81.0, 75.0, 48.0, 49.0, 37.0, 28.0, 29.0, 16.0, 12.0, 13.0, 9.0, 6.0, 0.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.46875, -22.7353515625, -22.001953125, -21.2685546875, -20.53515625, -19.8017578125, -19.068359375, -18.3349609375, -17.6015625, -16.8681640625, -16.134765625, -15.4013671875, -14.66796875, -13.9345703125, -13.201171875, -12.4677734375, -11.734375, -11.0009765625, -10.267578125, -9.5341796875, -8.80078125, -8.0673828125, -7.333984375, -6.6005859375, -5.8671875, -5.1337890625, -4.400390625, -3.6669921875, -2.93359375, -2.2001953125, -1.466796875, -0.7333984375, 0.0, 0.7333984375, 1.466796875, 2.2001953125, 2.93359375, 3.6669921875, 4.400390625, 5.1337890625, 5.8671875, 6.6005859375, 7.333984375, 8.0673828125, 8.80078125, 9.5341796875, 10.267578125, 11.0009765625, 11.734375, 12.4677734375, 13.201171875, 13.9345703125, 14.66796875, 15.4013671875, 16.134765625, 16.8681640625, 17.6015625, 18.3349609375, 19.068359375, 19.8017578125, 20.53515625, 21.2685546875, 22.001953125, 22.7353515625, 23.46875]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 2.0, 2.0, 2.0, 4.0, 2.0, 6.0, 5.0, 5.0, 8.0, 11.0, 14.0, 16.0, 22.0, 28.0, 28.0, 28.0, 34.0, 41.0, 38.0, 44.0, 47.0, 42.0, 50.0, 40.0, 52.0, 42.0, 44.0, 58.0, 46.0, 33.0, 30.0, 27.0, 37.0, 21.0, 19.0, 18.0, 9.0, 10.0, 10.0, 10.0, 9.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.34396362304688, -103.45259857177734, -99.56123352050781, -95.66986846923828, -91.77850341796875, -87.88713836669922, -83.99577331542969, -80.10440826416016, -76.21304321289062, -72.3216781616211, -68.43031311035156, -64.53894805908203, -60.6475830078125, -56.75621795654297, -52.86485290527344, -48.973487854003906, -45.08211898803711, -41.19075393676758, -37.29938888549805, -33.408023834228516, -29.516658782958984, -25.62529182434082, -21.73392677307129, -17.842561721801758, -13.951196670532227, -10.059831619262695, -6.168466091156006, -2.2771005630493164, 1.6142644882202148, 5.5056304931640625, 9.396995544433594, 13.288360595703125, 17.179725646972656, 21.071090698242188, 24.96245574951172, 28.85382080078125, 32.74518585205078, 36.63655090332031, 40.527915954589844, 44.419281005859375, 48.310646057128906, 52.20201110839844, 56.09337615966797, 59.9847412109375, 63.87610626220703, 67.76747131347656, 71.6588363647461, 75.55020141601562, 79.44157409667969, 83.33293914794922, 87.22430419921875, 91.11566925048828, 95.00703430175781, 98.89839935302734, 102.78976440429688, 106.6811294555664, 110.57249450683594, 114.46385955810547, 118.355224609375, 122.24658966064453, 126.13795471191406, 130.02932739257812, 133.92068481445312, 137.8120574951172, 141.7034149169922]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 4.0, 5.0, 6.0, 10.0, 11.0, 9.0, 13.0, 15.0, 19.0, 17.0, 18.0, 12.0, 32.0, 34.0, 24.0, 46.0, 37.0, 40.0, 43.0, 51.0, 53.0, 44.0, 33.0, 36.0, 38.0, 49.0, 49.0, 41.0, 28.0, 41.0, 20.0, 25.0, 21.0, 14.0, 17.0, 7.0, 7.0, 8.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-112.07254791259766, -108.63005065917969, -105.18756103515625, -101.74507141113281, -98.30257415771484, -94.86007690429688, -91.41758728027344, -87.97509765625, -84.53260040283203, -81.09010314941406, -77.64761352539062, -74.20512390136719, -70.76262664794922, -67.32012939453125, -63.87763977050781, -60.43514633178711, -56.992652893066406, -53.5501594543457, -50.107666015625, -46.6651725769043, -43.222679138183594, -39.78018569946289, -36.33769226074219, -32.895198822021484, -29.45270538330078, -26.010211944580078, -22.567718505859375, -19.125225067138672, -15.682731628417969, -12.240238189697266, -8.797744750976562, -5.355251312255859, -1.9127655029296875, 1.5297279357910156, 4.972221374511719, 8.414714813232422, 11.857208251953125, 15.299701690673828, 18.74219512939453, 22.184688568115234, 25.627182006835938, 29.06967544555664, 32.512168884277344, 35.95466232299805, 39.39715576171875, 42.83964920043945, 46.282142639160156, 49.72463607788086, 53.16712951660156, 56.609622955322266, 60.05211639404297, 63.49460983276367, 66.93710327148438, 70.37959289550781, 73.82209014892578, 77.26458740234375, 80.70707702636719, 84.14956665039062, 87.5920639038086, 91.03456115722656, 94.47705078125, 97.91954040527344, 101.3620376586914, 104.80453491210938, 108.24702453613281]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 8.0, 10.0, 27.0, 25.0, 56.0, 93.0, 144.0, 222.0, 336.0, 466.0, 724.0, 1053.0, 1643.0, 2373.0, 3372.0, 4610.0, 6848.0, 9409.0, 12685.0, 17090.0, 22102.0, 28335.0, 35559.0, 42897.0, 50587.0, 58192.0, 65116.0, 70136.0, 72939.0, 73374.0, 71903.0, 67847.0, 61450.0, 54416.0, 46528.0, 39001.0, 31466.0, 25048.0, 19192.0, 14464.0, 10872.0, 7750.0, 5625.0, 4024.0, 2793.0, 1899.0, 1279.0, 871.0, 611.0, 374.0, 269.0, 169.0, 113.0, 67.0, 31.0, 32.0, 15.0, 13.0, 5.0, 8.0, 3.0, 1.0], "bins": [-60.96875, -59.0166015625, -57.064453125, -55.1123046875, -53.16015625, -51.2080078125, -49.255859375, -47.3037109375, -45.3515625, -43.3994140625, -41.447265625, -39.4951171875, -37.54296875, -35.5908203125, -33.638671875, -31.6865234375, -29.734375, -27.7822265625, -25.830078125, -23.8779296875, -21.92578125, -19.9736328125, -18.021484375, -16.0693359375, -14.1171875, -12.1650390625, -10.212890625, -8.2607421875, -6.30859375, -4.3564453125, -2.404296875, -0.4521484375, 1.5, 3.4521484375, 5.404296875, 7.3564453125, 9.30859375, 11.2607421875, 13.212890625, 15.1650390625, 17.1171875, 19.0693359375, 21.021484375, 22.9736328125, 24.92578125, 26.8779296875, 28.830078125, 30.7822265625, 32.734375, 34.6865234375, 36.638671875, 38.5908203125, 40.54296875, 42.4951171875, 44.447265625, 46.3994140625, 48.3515625, 50.3037109375, 52.255859375, 54.2080078125, 56.16015625, 58.1123046875, 60.064453125, 62.0166015625, 63.96875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 9.0, 3.0, 5.0, 10.0, 6.0, 12.0, 10.0, 13.0, 11.0, 25.0, 15.0, 18.0, 14.0, 31.0, 32.0, 26.0, 43.0, 39.0, 39.0, 41.0, 50.0, 54.0, 45.0, 34.0, 35.0, 39.0, 50.0, 46.0, 40.0, 33.0, 35.0, 23.0, 22.0, 24.0, 13.0, 19.0, 6.0, 10.0, 4.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-107.875, -104.5546875, -101.234375, -97.9140625, -94.59375, -91.2734375, -87.953125, -84.6328125, -81.3125, -77.9921875, -74.671875, -71.3515625, -68.03125, -64.7109375, -61.390625, -58.0703125, -54.75, -51.4296875, -48.109375, -44.7890625, -41.46875, -38.1484375, -34.828125, -31.5078125, -28.1875, -24.8671875, -21.546875, -18.2265625, -14.90625, -11.5859375, -8.265625, -4.9453125, -1.625, 1.6953125, 5.015625, 8.3359375, 11.65625, 14.9765625, 18.296875, 21.6171875, 24.9375, 28.2578125, 31.578125, 34.8984375, 38.21875, 41.5390625, 44.859375, 48.1796875, 51.5, 54.8203125, 58.140625, 61.4609375, 64.78125, 68.1015625, 71.421875, 74.7421875, 78.0625, 81.3828125, 84.703125, 88.0234375, 91.34375, 94.6640625, 97.984375, 101.3046875, 104.625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 9.0, 10.0, 20.0, 23.0, 58.0, 87.0, 143.0, 271.0, 509.0, 896.0, 1462.0, 2498.0, 4379.0, 7037.0, 11583.0, 17711.0, 26533.0, 38244.0, 52625.0, 68259.0, 83463.0, 96359.0, 103305.0, 104508.0, 98348.0, 85806.0, 71018.0, 54682.0, 40516.0, 27837.0, 19020.0, 12463.0, 7611.0, 4587.0, 2782.0, 1697.0, 904.0, 573.0, 327.0, 197.0, 83.0, 46.0, 35.0, 17.0, 12.0, 6.0, 6.0, 0.0, 0.0, 1.0], "bins": [-104.5, -101.681640625, -98.86328125, -96.044921875, -93.2265625, -90.408203125, -87.58984375, -84.771484375, -81.953125, -79.134765625, -76.31640625, -73.498046875, -70.6796875, -67.861328125, -65.04296875, -62.224609375, -59.40625, -56.587890625, -53.76953125, -50.951171875, -48.1328125, -45.314453125, -42.49609375, -39.677734375, -36.859375, -34.041015625, -31.22265625, -28.404296875, -25.5859375, -22.767578125, -19.94921875, -17.130859375, -14.3125, -11.494140625, -8.67578125, -5.857421875, -3.0390625, -0.220703125, 2.59765625, 5.416015625, 8.234375, 11.052734375, 13.87109375, 16.689453125, 19.5078125, 22.326171875, 25.14453125, 27.962890625, 30.78125, 33.599609375, 36.41796875, 39.236328125, 42.0546875, 44.873046875, 47.69140625, 50.509765625, 53.328125, 56.146484375, 58.96484375, 61.783203125, 64.6015625, 67.419921875, 70.23828125, 73.056640625, 75.875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 9.0, 5.0, 5.0, 9.0, 3.0, 12.0, 9.0, 13.0, 23.0, 22.0, 20.0, 27.0, 17.0, 35.0, 29.0, 36.0, 31.0, 39.0, 44.0, 32.0, 38.0, 52.0, 35.0, 35.0, 38.0, 39.0, 44.0, 33.0, 45.0, 24.0, 34.0, 34.0, 18.0, 20.0, 18.0, 16.0, 7.0, 8.0, 12.0, 3.0, 3.0, 12.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-69.8125, -67.75341796875, -65.6943359375, -63.63525390625, -61.576171875, -59.51708984375, -57.4580078125, -55.39892578125, -53.33984375, -51.28076171875, -49.2216796875, -47.16259765625, -45.103515625, -43.04443359375, -40.9853515625, -38.92626953125, -36.8671875, -34.80810546875, -32.7490234375, -30.68994140625, -28.630859375, -26.57177734375, -24.5126953125, -22.45361328125, -20.39453125, -18.33544921875, -16.2763671875, -14.21728515625, -12.158203125, -10.09912109375, -8.0400390625, -5.98095703125, -3.921875, -1.86279296875, 0.1962890625, 2.25537109375, 4.314453125, 6.37353515625, 8.4326171875, 10.49169921875, 12.55078125, 14.60986328125, 16.6689453125, 18.72802734375, 20.787109375, 22.84619140625, 24.9052734375, 26.96435546875, 29.0234375, 31.08251953125, 33.1416015625, 35.20068359375, 37.259765625, 39.31884765625, 41.3779296875, 43.43701171875, 45.49609375, 47.55517578125, 49.6142578125, 51.67333984375, 53.732421875, 55.79150390625, 57.8505859375, 59.90966796875, 61.96875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 12.0, 6.0, 25.0, 30.0, 45.0, 59.0, 114.0, 159.0, 239.0, 411.0, 686.0, 1121.0, 1870.0, 3090.0, 5225.0, 8457.0, 13793.0, 22270.0, 34002.0, 50166.0, 70523.0, 91391.0, 109510.0, 119460.0, 118700.0, 107308.0, 88360.0, 67685.0, 47661.0, 32156.0, 20941.0, 13002.0, 7910.0, 4812.0, 2885.0, 1808.0, 1023.0, 611.0, 399.0, 247.0, 112.0, 101.0, 65.0, 38.0, 24.0, 13.0, 14.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-42.90625, -41.5625, -40.21875, -38.875, -37.53125, -36.1875, -34.84375, -33.5, -32.15625, -30.8125, -29.46875, -28.125, -26.78125, -25.4375, -24.09375, -22.75, -21.40625, -20.0625, -18.71875, -17.375, -16.03125, -14.6875, -13.34375, -12.0, -10.65625, -9.3125, -7.96875, -6.625, -5.28125, -3.9375, -2.59375, -1.25, 0.09375, 1.4375, 2.78125, 4.125, 5.46875, 6.8125, 8.15625, 9.5, 10.84375, 12.1875, 13.53125, 14.875, 16.21875, 17.5625, 18.90625, 20.25, 21.59375, 22.9375, 24.28125, 25.625, 26.96875, 28.3125, 29.65625, 31.0, 32.34375, 33.6875, 35.03125, 36.375, 37.71875, 39.0625, 40.40625, 41.75, 43.09375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 2.0, 3.0, 7.0, 1.0, 9.0, 11.0, 13.0, 12.0, 17.0, 25.0, 29.0, 32.0, 31.0, 60.0, 51.0, 37.0, 71.0, 58.0, 66.0, 54.0, 61.0, 52.0, 43.0, 34.0, 38.0, 39.0, 30.0, 27.0, 22.0, 17.0, 17.0, 10.0, 8.0, 1.0, 5.0, 4.0, 0.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006359100341796875, -0.006159663200378418, -0.005960226058959961, -0.005760788917541504, -0.005561351776123047, -0.00536191463470459, -0.005162477493286133, -0.004963040351867676, -0.004763603210449219, -0.004564166069030762, -0.004364728927612305, -0.004165291786193848, -0.003965854644775391, -0.0037664175033569336, -0.0035669803619384766, -0.0033675432205200195, -0.0031681060791015625, -0.0029686689376831055, -0.0027692317962646484, -0.0025697946548461914, -0.0023703575134277344, -0.0021709203720092773, -0.0019714832305908203, -0.0017720460891723633, -0.0015726089477539062, -0.0013731718063354492, -0.0011737346649169922, -0.0009742975234985352, -0.0007748603820800781, -0.0005754232406616211, -0.00037598609924316406, -0.00017654895782470703, 2.288818359375e-05, 0.00022232532501220703, 0.00042176246643066406, 0.0006211996078491211, 0.0008206367492675781, 0.0010200738906860352, 0.0012195110321044922, 0.0014189481735229492, 0.0016183853149414062, 0.0018178224563598633, 0.0020172595977783203, 0.0022166967391967773, 0.0024161338806152344, 0.0026155710220336914, 0.0028150081634521484, 0.0030144453048706055, 0.0032138824462890625, 0.0034133195877075195, 0.0036127567291259766, 0.0038121938705444336, 0.004011631011962891, 0.004211068153381348, 0.004410505294799805, 0.004609942436218262, 0.004809379577636719, 0.005008816719055176, 0.005208253860473633, 0.00540769100189209, 0.005607128143310547, 0.005806565284729004, 0.006006002426147461, 0.006205439567565918, 0.006404876708984375]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 14.0, 16.0, 14.0, 36.0, 60.0, 107.0, 183.0, 313.0, 487.0, 872.0, 1494.0, 2567.0, 4469.0, 7541.0, 12634.0, 20346.0, 31701.0, 46651.0, 65678.0, 86460.0, 103975.0, 115999.0, 117892.0, 109698.0, 93370.0, 73688.0, 53647.0, 36905.0, 24386.0, 15060.0, 9379.0, 5277.0, 3187.0, 1866.0, 1067.0, 630.0, 356.0, 208.0, 131.0, 82.0, 46.0, 26.0, 12.0, 11.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-44.875, -43.52294921875, -42.1708984375, -40.81884765625, -39.466796875, -38.11474609375, -36.7626953125, -35.41064453125, -34.05859375, -32.70654296875, -31.3544921875, -30.00244140625, -28.650390625, -27.29833984375, -25.9462890625, -24.59423828125, -23.2421875, -21.89013671875, -20.5380859375, -19.18603515625, -17.833984375, -16.48193359375, -15.1298828125, -13.77783203125, -12.42578125, -11.07373046875, -9.7216796875, -8.36962890625, -7.017578125, -5.66552734375, -4.3134765625, -2.96142578125, -1.609375, -0.25732421875, 1.0947265625, 2.44677734375, 3.798828125, 5.15087890625, 6.5029296875, 7.85498046875, 9.20703125, 10.55908203125, 11.9111328125, 13.26318359375, 14.615234375, 15.96728515625, 17.3193359375, 18.67138671875, 20.0234375, 21.37548828125, 22.7275390625, 24.07958984375, 25.431640625, 26.78369140625, 28.1357421875, 29.48779296875, 30.83984375, 32.19189453125, 33.5439453125, 34.89599609375, 36.248046875, 37.60009765625, 38.9521484375, 40.30419921875, 41.65625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 8.0, 5.0, 5.0, 2.0, 7.0, 7.0, 12.0, 16.0, 20.0, 19.0, 27.0, 16.0, 34.0, 27.0, 34.0, 34.0, 42.0, 47.0, 43.0, 36.0, 47.0, 59.0, 46.0, 43.0, 49.0, 37.0, 47.0, 36.0, 36.0, 33.0, 28.0, 17.0, 16.0, 16.0, 8.0, 10.0, 10.0, 11.0, 10.0, 2.0, 8.0, 1.0, 3.0, 1.0, 1.0], "bins": [-21.9375, -21.3887939453125, -20.840087890625, -20.2913818359375, -19.74267578125, -19.1939697265625, -18.645263671875, -18.0965576171875, -17.5478515625, -16.9991455078125, -16.450439453125, -15.9017333984375, -15.35302734375, -14.8043212890625, -14.255615234375, -13.7069091796875, -13.158203125, -12.6094970703125, -12.060791015625, -11.5120849609375, -10.96337890625, -10.4146728515625, -9.865966796875, -9.3172607421875, -8.7685546875, -8.2198486328125, -7.671142578125, -7.1224365234375, -6.57373046875, -6.0250244140625, -5.476318359375, -4.9276123046875, -4.37890625, -3.8302001953125, -3.281494140625, -2.7327880859375, -2.18408203125, -1.6353759765625, -1.086669921875, -0.5379638671875, 0.0107421875, 0.5594482421875, 1.108154296875, 1.6568603515625, 2.20556640625, 2.7542724609375, 3.302978515625, 3.8516845703125, 4.400390625, 4.9490966796875, 5.497802734375, 6.0465087890625, 6.59521484375, 7.1439208984375, 7.692626953125, 8.2413330078125, 8.7900390625, 9.3387451171875, 9.887451171875, 10.4361572265625, 10.98486328125, 11.5335693359375, 12.082275390625, 12.6309814453125, 13.1796875]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 9.0, 5.0, 8.0, 7.0, 8.0, 10.0, 14.0, 16.0, 16.0, 25.0, 21.0, 30.0, 32.0, 32.0, 35.0, 41.0, 56.0, 44.0, 32.0, 33.0, 51.0, 36.0, 39.0, 47.0, 26.0, 39.0, 42.0, 30.0, 34.0, 33.0, 28.0, 21.0, 23.0, 16.0, 21.0, 7.0, 5.0, 7.0, 6.0, 6.0, 4.0, 5.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.40325927734375, -107.7926254272461, -104.18199920654297, -100.57136535644531, -96.96073913574219, -93.35010528564453, -89.73947143554688, -86.12884521484375, -82.5182113647461, -78.90757751464844, -75.29695129394531, -71.68631744384766, -68.07568359375, -64.46505737304688, -60.85442352294922, -57.24379348754883, -53.63316345214844, -50.02253341674805, -46.411903381347656, -42.80126953125, -39.19063949584961, -35.58000946044922, -31.969377517700195, -28.358745574951172, -24.74811553955078, -21.13748550415039, -17.526853561401367, -13.91622257232666, -10.305591583251953, -6.6949615478515625, -3.084329605102539, 0.5263023376464844, 4.136924743652344, 7.747555732727051, 11.358186721801758, 14.968817710876465, 18.579448699951172, 22.190078735351562, 25.800710678100586, 29.41134262084961, 33.02197265625, 36.63260269165039, 40.24323272705078, 43.85386657714844, 47.46449661254883, 51.07512664794922, 54.685760498046875, 58.296390533447266, 61.907020568847656, 65.51765441894531, 69.12828063964844, 72.7389144897461, 76.34954833984375, 79.96017456054688, 83.57080841064453, 87.18144226074219, 90.79206848144531, 94.40270233154297, 98.0133285522461, 101.62396240234375, 105.23458862304688, 108.84522247314453, 112.45585632324219, 116.06648254394531, 119.67711639404297]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 8.0, 5.0, 6.0, 7.0, 12.0, 7.0, 8.0, 13.0, 7.0, 13.0, 15.0, 24.0, 25.0, 26.0, 40.0, 39.0, 32.0, 45.0, 38.0, 44.0, 43.0, 39.0, 30.0, 54.0, 52.0, 51.0, 36.0, 43.0, 45.0, 27.0, 27.0, 30.0, 26.0, 20.0, 17.0, 11.0, 9.0, 12.0, 2.0, 5.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.59342956542969, -113.98590087890625, -110.37837219238281, -106.77084350585938, -103.1633071899414, -99.55577850341797, -95.94824981689453, -92.3407211303711, -88.73318481445312, -85.12565612792969, -81.51812744140625, -77.91059875488281, -74.30306243896484, -70.6955337524414, -67.08800506591797, -63.48047637939453, -59.872947692871094, -56.265419006347656, -52.65788650512695, -49.050357818603516, -45.44282531738281, -41.835296630859375, -38.22776794433594, -34.6202392578125, -31.012706756591797, -27.405176162719727, -23.797645568847656, -20.19011688232422, -16.58258628845215, -12.975055694580078, -9.36752700805664, -5.75999641418457, -2.1524734497070312, 1.4550566673278809, 5.062586784362793, 8.670116424560547, 12.277647018432617, 15.885177612304688, 19.492706298828125, 23.100236892700195, 26.707767486572266, 30.315298080444336, 33.922828674316406, 37.530357360839844, 41.13788604736328, 44.745418548583984, 48.35294723510742, 51.960479736328125, 55.56800842285156, 59.175537109375, 62.7830696105957, 66.39059448242188, 69.99813079833984, 73.60565948486328, 77.21318817138672, 80.82071685791016, 84.42825317382812, 88.03578186035156, 91.643310546875, 95.25083923339844, 98.8583755493164, 102.46590423583984, 106.07343292236328, 109.68096160888672, 113.28849029541016]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 3.0, 9.0, 7.0, 17.0, 23.0, 26.0, 48.0, 72.0, 110.0, 147.0, 273.0, 453.0, 707.0, 1165.0, 1897.0, 2869.0, 4528.0, 6924.0, 10445.0, 16080.0, 24003.0, 36404.0, 51998.0, 73815.0, 101958.0, 137817.0, 181878.0, 228811.0, 277330.0, 321365.0, 351248.0, 366291.0, 361860.0, 337595.0, 297299.0, 251504.0, 203281.0, 157161.0, 117954.0, 85203.0, 60565.0, 41646.0, 28273.0, 18867.0, 12372.0, 8090.0, 5236.0, 3244.0, 2138.0, 1278.0, 812.0, 482.0, 299.0, 152.0, 104.0, 70.0, 42.0, 26.0, 11.0, 6.0, 3.0, 6.0, 3.0], "bins": [-74.625, -72.34375, -70.0625, -67.78125, -65.5, -63.21875, -60.9375, -58.65625, -56.375, -54.09375, -51.8125, -49.53125, -47.25, -44.96875, -42.6875, -40.40625, -38.125, -35.84375, -33.5625, -31.28125, -29.0, -26.71875, -24.4375, -22.15625, -19.875, -17.59375, -15.3125, -13.03125, -10.75, -8.46875, -6.1875, -3.90625, -1.625, 0.65625, 2.9375, 5.21875, 7.5, 9.78125, 12.0625, 14.34375, 16.625, 18.90625, 21.1875, 23.46875, 25.75, 28.03125, 30.3125, 32.59375, 34.875, 37.15625, 39.4375, 41.71875, 44.0, 46.28125, 48.5625, 50.84375, 53.125, 55.40625, 57.6875, 59.96875, 62.25, 64.53125, 66.8125, 69.09375, 71.375]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 7.0, 5.0, 5.0, 10.0, 8.0, 8.0, 10.0, 11.0, 11.0, 17.0, 11.0, 23.0, 24.0, 30.0, 37.0, 32.0, 52.0, 35.0, 42.0, 43.0, 38.0, 42.0, 38.0, 45.0, 58.0, 42.0, 36.0, 47.0, 39.0, 28.0, 31.0, 31.0, 28.0, 18.0, 12.0, 15.0, 8.0, 8.0, 4.0, 7.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.625, -102.3671875, -99.109375, -95.8515625, -92.59375, -89.3359375, -86.078125, -82.8203125, -79.5625, -76.3046875, -73.046875, -69.7890625, -66.53125, -63.2734375, -60.015625, -56.7578125, -53.5, -50.2421875, -46.984375, -43.7265625, -40.46875, -37.2109375, -33.953125, -30.6953125, -27.4375, -24.1796875, -20.921875, -17.6640625, -14.40625, -11.1484375, -7.890625, -4.6328125, -1.375, 1.8828125, 5.140625, 8.3984375, 11.65625, 14.9140625, 18.171875, 21.4296875, 24.6875, 27.9453125, 31.203125, 34.4609375, 37.71875, 40.9765625, 44.234375, 47.4921875, 50.75, 54.0078125, 57.265625, 60.5234375, 63.78125, 67.0390625, 70.296875, 73.5546875, 76.8125, 80.0703125, 83.328125, 86.5859375, 89.84375, 93.1015625, 96.359375, 99.6171875, 102.875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 6.0, 2.0, 10.0, 24.0, 39.0, 53.0, 95.0, 178.0, 271.0, 476.0, 716.0, 1311.0, 2119.0, 3324.0, 5322.0, 8343.0, 13183.0, 20135.0, 29774.0, 43922.0, 62890.0, 87115.0, 118165.0, 154433.0, 195803.0, 238673.0, 279023.0, 313088.0, 337616.0, 343849.0, 336954.0, 314610.0, 281169.0, 242100.0, 197803.0, 156346.0, 120369.0, 88773.0, 63931.0, 44729.0, 30703.0, 20261.0, 13365.0, 8730.0, 5579.0, 3504.0, 2137.0, 1304.0, 812.0, 475.0, 292.0, 172.0, 97.0, 53.0, 31.0, 15.0, 7.0, 11.0, 5.0, 3.0], "bins": [-80.25, -77.8564453125, -75.462890625, -73.0693359375, -70.67578125, -68.2822265625, -65.888671875, -63.4951171875, -61.1015625, -58.7080078125, -56.314453125, -53.9208984375, -51.52734375, -49.1337890625, -46.740234375, -44.3466796875, -41.953125, -39.5595703125, -37.166015625, -34.7724609375, -32.37890625, -29.9853515625, -27.591796875, -25.1982421875, -22.8046875, -20.4111328125, -18.017578125, -15.6240234375, -13.23046875, -10.8369140625, -8.443359375, -6.0498046875, -3.65625, -1.2626953125, 1.130859375, 3.5244140625, 5.91796875, 8.3115234375, 10.705078125, 13.0986328125, 15.4921875, 17.8857421875, 20.279296875, 22.6728515625, 25.06640625, 27.4599609375, 29.853515625, 32.2470703125, 34.640625, 37.0341796875, 39.427734375, 41.8212890625, 44.21484375, 46.6083984375, 49.001953125, 51.3955078125, 53.7890625, 56.1826171875, 58.576171875, 60.9697265625, 63.36328125, 65.7568359375, 68.150390625, 70.5439453125, 72.9375]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 9.0, 9.0, 11.0, 17.0, 24.0, 35.0, 38.0, 36.0, 58.0, 63.0, 63.0, 84.0, 108.0, 107.0, 146.0, 181.0, 172.0, 192.0, 180.0, 201.0, 199.0, 229.0, 201.0, 203.0, 192.0, 192.0, 166.0, 147.0, 131.0, 103.0, 100.0, 105.0, 70.0, 55.0, 58.0, 37.0, 42.0, 31.0, 24.0, 18.0, 15.0, 6.0, 7.0, 1.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.78125, -45.2939453125, -43.806640625, -42.3193359375, -40.83203125, -39.3447265625, -37.857421875, -36.3701171875, -34.8828125, -33.3955078125, -31.908203125, -30.4208984375, -28.93359375, -27.4462890625, -25.958984375, -24.4716796875, -22.984375, -21.4970703125, -20.009765625, -18.5224609375, -17.03515625, -15.5478515625, -14.060546875, -12.5732421875, -11.0859375, -9.5986328125, -8.111328125, -6.6240234375, -5.13671875, -3.6494140625, -2.162109375, -0.6748046875, 0.8125, 2.2998046875, 3.787109375, 5.2744140625, 6.76171875, 8.2490234375, 9.736328125, 11.2236328125, 12.7109375, 14.1982421875, 15.685546875, 17.1728515625, 18.66015625, 20.1474609375, 21.634765625, 23.1220703125, 24.609375, 26.0966796875, 27.583984375, 29.0712890625, 30.55859375, 32.0458984375, 33.533203125, 35.0205078125, 36.5078125, 37.9951171875, 39.482421875, 40.9697265625, 42.45703125, 43.9443359375, 45.431640625, 46.9189453125, 48.40625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 3.0, 6.0, 7.0, 6.0, 6.0, 12.0, 12.0, 14.0, 20.0, 25.0, 18.0, 31.0, 26.0, 29.0, 38.0, 39.0, 39.0, 46.0, 38.0, 37.0, 30.0, 38.0, 41.0, 49.0, 37.0, 31.0, 40.0, 33.0, 37.0, 24.0, 26.0, 29.0, 23.0, 15.0, 8.0, 26.0, 10.0, 11.0, 9.0, 5.0, 6.0, 6.0, 6.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-126.97412109375, -123.3863754272461, -119.79862213134766, -116.21087646484375, -112.62313079833984, -109.03538513183594, -105.4476318359375, -101.8598861694336, -98.27214050292969, -94.68439483642578, -91.09664154052734, -87.50889587402344, -83.92115020751953, -80.33340454101562, -76.74565124511719, -73.15790557861328, -69.57015991210938, -65.98241424560547, -62.3946647644043, -58.806915283203125, -55.21916961669922, -51.63142013549805, -48.043670654296875, -44.45592498779297, -40.86817169189453, -37.28042221069336, -33.69267654418945, -30.10492706298828, -26.517181396484375, -22.929431915283203, -19.341684341430664, -15.753936767578125, -12.166191101074219, -8.57844352722168, -4.990695476531982, -1.4029474258422852, 2.184800148010254, 5.772548675537109, 9.360296249389648, 12.948043823242188, 16.535791397094727, 20.123538970947266, 23.711286544799805, 27.299034118652344, 30.886783599853516, 34.47453308105469, 38.062278747558594, 41.6500244140625, 45.23777389526367, 48.825523376464844, 52.41326904296875, 56.00101852416992, 59.58876419067383, 63.176513671875, 66.7642593383789, 70.35200500488281, 73.93975830078125, 77.52750396728516, 81.1152572631836, 84.7030029296875, 88.2907485961914, 91.87849426269531, 95.46624755859375, 99.05399322509766, 102.64173889160156]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 10.0, 9.0, 11.0, 10.0, 4.0, 11.0, 13.0, 23.0, 27.0, 23.0, 23.0, 25.0, 34.0, 29.0, 30.0, 35.0, 29.0, 43.0, 34.0, 43.0, 44.0, 51.0, 42.0, 57.0, 37.0, 50.0, 28.0, 26.0, 37.0, 21.0, 24.0, 23.0, 18.0, 13.0, 9.0, 15.0, 15.0, 2.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-116.69853210449219, -113.23775482177734, -109.77698516845703, -106.31620788574219, -102.85543823242188, -99.39466094970703, -95.93388366699219, -92.47311401367188, -89.01233673095703, -85.55155944824219, -82.09078979492188, -78.63001251220703, -75.16923522949219, -71.70846557617188, -68.24768829345703, -64.78691101074219, -61.326141357421875, -57.8653678894043, -54.40459442138672, -50.943817138671875, -47.4830436706543, -44.02227020263672, -40.561492919921875, -37.1007194519043, -33.63994598388672, -30.17917251586914, -26.71839714050293, -23.25762176513672, -19.79684829711914, -16.336074829101562, -12.875299453735352, -9.41452407836914, -5.953758239746094, -2.492983818054199, 0.9677906036376953, 4.42856502532959, 7.889339447021484, 11.350112915039062, 14.810888290405273, 18.271663665771484, 21.732437133789062, 25.19321060180664, 28.65398597717285, 32.11476135253906, 35.57553482055664, 39.03630828857422, 42.49708557128906, 45.95785903930664, 49.41863250732422, 52.8794059753418, 56.340179443359375, 59.80095672607422, 63.2617301940918, 66.72250366210938, 70.18328094482422, 73.64405822753906, 77.10482788085938, 80.56560516357422, 84.02637481689453, 87.48715209960938, 90.94792175292969, 94.40869903564453, 97.86947631835938, 101.33024597167969, 104.79102325439453]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 8.0, 3.0, 8.0, 17.0, 12.0, 27.0, 49.0, 62.0, 125.0, 182.0, 287.0, 482.0, 809.0, 1211.0, 2217.0, 3353.0, 5840.0, 10021.0, 17100.0, 29826.0, 53301.0, 92484.0, 146607.0, 189583.0, 180556.0, 129652.0, 79055.0, 44939.0, 25093.0, 14544.0, 8387.0, 5083.0, 2996.0, 1826.0, 1106.0, 635.0, 427.0, 271.0, 143.0, 92.0, 53.0, 34.0, 19.0, 15.0, 8.0, 8.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-79.375, -76.8828125, -74.390625, -71.8984375, -69.40625, -66.9140625, -64.421875, -61.9296875, -59.4375, -56.9453125, -54.453125, -51.9609375, -49.46875, -46.9765625, -44.484375, -41.9921875, -39.5, -37.0078125, -34.515625, -32.0234375, -29.53125, -27.0390625, -24.546875, -22.0546875, -19.5625, -17.0703125, -14.578125, -12.0859375, -9.59375, -7.1015625, -4.609375, -2.1171875, 0.375, 2.8671875, 5.359375, 7.8515625, 10.34375, 12.8359375, 15.328125, 17.8203125, 20.3125, 22.8046875, 25.296875, 27.7890625, 30.28125, 32.7734375, 35.265625, 37.7578125, 40.25, 42.7421875, 45.234375, 47.7265625, 50.21875, 52.7109375, 55.203125, 57.6953125, 60.1875, 62.6796875, 65.171875, 67.6640625, 70.15625, 72.6484375, 75.140625, 77.6328125, 80.125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 6.0, 9.0, 12.0, 9.0, 9.0, 5.0, 13.0, 13.0, 21.0, 25.0, 28.0, 21.0, 26.0, 37.0, 25.0, 31.0, 35.0, 27.0, 44.0, 36.0, 40.0, 49.0, 47.0, 48.0, 51.0, 39.0, 45.0, 28.0, 29.0, 37.0, 20.0, 23.0, 23.0, 18.0, 13.0, 9.0, 14.0, 16.0, 2.0, 6.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-115.625, -112.193359375, -108.76171875, -105.330078125, -101.8984375, -98.466796875, -95.03515625, -91.603515625, -88.171875, -84.740234375, -81.30859375, -77.876953125, -74.4453125, -71.013671875, -67.58203125, -64.150390625, -60.71875, -57.287109375, -53.85546875, -50.423828125, -46.9921875, -43.560546875, -40.12890625, -36.697265625, -33.265625, -29.833984375, -26.40234375, -22.970703125, -19.5390625, -16.107421875, -12.67578125, -9.244140625, -5.8125, -2.380859375, 1.05078125, 4.482421875, 7.9140625, 11.345703125, 14.77734375, 18.208984375, 21.640625, 25.072265625, 28.50390625, 31.935546875, 35.3671875, 38.798828125, 42.23046875, 45.662109375, 49.09375, 52.525390625, 55.95703125, 59.388671875, 62.8203125, 66.251953125, 69.68359375, 73.115234375, 76.546875, 79.978515625, 83.41015625, 86.841796875, 90.2734375, 93.705078125, 97.13671875, 100.568359375, 104.0]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 6.0, 13.0, 19.0, 19.0, 24.0, 36.0, 53.0, 84.0, 104.0, 177.0, 242.0, 345.0, 584.0, 827.0, 1330.0, 2042.0, 3262.0, 5343.0, 8715.0, 15179.0, 27709.0, 57063.0, 129904.0, 262412.0, 268477.0, 136340.0, 60058.0, 28839.0, 15701.0, 8874.0, 5292.0, 3345.0, 2107.0, 1424.0, 893.0, 564.0, 368.0, 228.0, 173.0, 125.0, 80.0, 58.0, 36.0, 26.0, 16.0, 11.0, 11.0, 7.0, 7.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-102.375, -99.275390625, -96.17578125, -93.076171875, -89.9765625, -86.876953125, -83.77734375, -80.677734375, -77.578125, -74.478515625, -71.37890625, -68.279296875, -65.1796875, -62.080078125, -58.98046875, -55.880859375, -52.78125, -49.681640625, -46.58203125, -43.482421875, -40.3828125, -37.283203125, -34.18359375, -31.083984375, -27.984375, -24.884765625, -21.78515625, -18.685546875, -15.5859375, -12.486328125, -9.38671875, -6.287109375, -3.1875, -0.087890625, 3.01171875, 6.111328125, 9.2109375, 12.310546875, 15.41015625, 18.509765625, 21.609375, 24.708984375, 27.80859375, 30.908203125, 34.0078125, 37.107421875, 40.20703125, 43.306640625, 46.40625, 49.505859375, 52.60546875, 55.705078125, 58.8046875, 61.904296875, 65.00390625, 68.103515625, 71.203125, 74.302734375, 77.40234375, 80.501953125, 83.6015625, 86.701171875, 89.80078125, 92.900390625, 96.0]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 3.0, 7.0, 2.0, 13.0, 9.0, 8.0, 17.0, 15.0, 15.0, 25.0, 23.0, 24.0, 19.0, 31.0, 24.0, 32.0, 28.0, 37.0, 49.0, 34.0, 42.0, 48.0, 31.0, 48.0, 37.0, 37.0, 42.0, 27.0, 35.0, 25.0, 29.0, 36.0, 23.0, 16.0, 15.0, 13.0, 10.0, 15.0, 9.0, 11.0, 8.0, 5.0, 9.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-67.8125, -65.6943359375, -63.576171875, -61.4580078125, -59.33984375, -57.2216796875, -55.103515625, -52.9853515625, -50.8671875, -48.7490234375, -46.630859375, -44.5126953125, -42.39453125, -40.2763671875, -38.158203125, -36.0400390625, -33.921875, -31.8037109375, -29.685546875, -27.5673828125, -25.44921875, -23.3310546875, -21.212890625, -19.0947265625, -16.9765625, -14.8583984375, -12.740234375, -10.6220703125, -8.50390625, -6.3857421875, -4.267578125, -2.1494140625, -0.03125, 2.0869140625, 4.205078125, 6.3232421875, 8.44140625, 10.5595703125, 12.677734375, 14.7958984375, 16.9140625, 19.0322265625, 21.150390625, 23.2685546875, 25.38671875, 27.5048828125, 29.623046875, 31.7412109375, 33.859375, 35.9775390625, 38.095703125, 40.2138671875, 42.33203125, 44.4501953125, 46.568359375, 48.6865234375, 50.8046875, 52.9228515625, 55.041015625, 57.1591796875, 59.27734375, 61.3955078125, 63.513671875, 65.6318359375, 67.75]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 10.0, 7.0, 16.0, 10.0, 15.0, 22.0, 35.0, 48.0, 64.0, 83.0, 156.0, 197.0, 292.0, 433.0, 710.0, 1046.0, 1597.0, 2448.0, 4065.0, 6829.0, 11797.0, 21440.0, 42207.0, 87755.0, 184017.0, 283820.0, 200342.0, 96553.0, 46778.0, 23738.0, 12640.0, 7430.0, 4403.0, 2623.0, 1694.0, 1038.0, 697.0, 463.0, 338.0, 209.0, 156.0, 102.0, 71.0, 51.0, 32.0, 17.0, 25.0, 18.0, 11.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.40625, -39.03955078125, -37.6728515625, -36.30615234375, -34.939453125, -33.57275390625, -32.2060546875, -30.83935546875, -29.47265625, -28.10595703125, -26.7392578125, -25.37255859375, -24.005859375, -22.63916015625, -21.2724609375, -19.90576171875, -18.5390625, -17.17236328125, -15.8056640625, -14.43896484375, -13.072265625, -11.70556640625, -10.3388671875, -8.97216796875, -7.60546875, -6.23876953125, -4.8720703125, -3.50537109375, -2.138671875, -0.77197265625, 0.5947265625, 1.96142578125, 3.328125, 4.69482421875, 6.0615234375, 7.42822265625, 8.794921875, 10.16162109375, 11.5283203125, 12.89501953125, 14.26171875, 15.62841796875, 16.9951171875, 18.36181640625, 19.728515625, 21.09521484375, 22.4619140625, 23.82861328125, 25.1953125, 26.56201171875, 27.9287109375, 29.29541015625, 30.662109375, 32.02880859375, 33.3955078125, 34.76220703125, 36.12890625, 37.49560546875, 38.8623046875, 40.22900390625, 41.595703125, 42.96240234375, 44.3291015625, 45.69580078125, 47.0625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 4.0, 7.0, 6.0, 14.0, 24.0, 27.0, 22.0, 38.0, 57.0, 56.0, 92.0, 80.0, 97.0, 85.0, 93.0, 64.0, 67.0, 39.0, 42.0, 18.0, 16.0, 10.0, 5.0, 9.0, 5.0, 1.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0031147003173828125, -0.0030017197132110596, -0.0028887391090393066, -0.0027757585048675537, -0.0026627779006958008, -0.002549797296524048, -0.002436816692352295, -0.002323836088180542, -0.002210855484008789, -0.002097874879837036, -0.001984894275665283, -0.0018719136714935303, -0.0017589330673217773, -0.0016459524631500244, -0.0015329718589782715, -0.0014199912548065186, -0.0013070106506347656, -0.0011940300464630127, -0.0010810494422912598, -0.0009680688381195068, -0.0008550882339477539, -0.000742107629776001, -0.000629127025604248, -0.0005161464214324951, -0.0004031658172607422, -0.00029018521308898926, -0.00017720460891723633, -6.42240047454834e-05, 4.875659942626953e-05, 0.00016173720359802246, 0.0002747178077697754, 0.0003876984119415283, 0.0005006790161132812, 0.0006136596202850342, 0.0007266402244567871, 0.00083962082862854, 0.000952601432800293, 0.001065582036972046, 0.0011785626411437988, 0.0012915432453155518, 0.0014045238494873047, 0.0015175044536590576, 0.0016304850578308105, 0.0017434656620025635, 0.0018564462661743164, 0.0019694268703460693, 0.0020824074745178223, 0.002195388078689575, 0.002308368682861328, 0.002421349287033081, 0.002534329891204834, 0.002647310495376587, 0.00276029109954834, 0.0028732717037200928, 0.0029862523078918457, 0.0030992329120635986, 0.0032122135162353516, 0.0033251941204071045, 0.0034381747245788574, 0.0035511553287506104, 0.0036641359329223633, 0.003777116537094116, 0.003890097141265869, 0.004003077745437622, 0.004116058349609375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 4.0, 1.0, 6.0, 6.0, 14.0, 16.0, 24.0, 35.0, 39.0, 71.0, 116.0, 178.0, 266.0, 411.0, 631.0, 1123.0, 1912.0, 3323.0, 5626.0, 10530.0, 19594.0, 37250.0, 69364.0, 121041.0, 178541.0, 200711.0, 164187.0, 105752.0, 58764.0, 31512.0, 16621.0, 8954.0, 4816.0, 2895.0, 1636.0, 930.0, 615.0, 357.0, 232.0, 164.0, 108.0, 63.0, 44.0, 26.0, 13.0, 16.0, 6.0, 9.0, 4.0, 5.0, 3.0, 3.0, 1.0], "bins": [-66.375, -64.5498046875, -62.724609375, -60.8994140625, -59.07421875, -57.2490234375, -55.423828125, -53.5986328125, -51.7734375, -49.9482421875, -48.123046875, -46.2978515625, -44.47265625, -42.6474609375, -40.822265625, -38.9970703125, -37.171875, -35.3466796875, -33.521484375, -31.6962890625, -29.87109375, -28.0458984375, -26.220703125, -24.3955078125, -22.5703125, -20.7451171875, -18.919921875, -17.0947265625, -15.26953125, -13.4443359375, -11.619140625, -9.7939453125, -7.96875, -6.1435546875, -4.318359375, -2.4931640625, -0.66796875, 1.1572265625, 2.982421875, 4.8076171875, 6.6328125, 8.4580078125, 10.283203125, 12.1083984375, 13.93359375, 15.7587890625, 17.583984375, 19.4091796875, 21.234375, 23.0595703125, 24.884765625, 26.7099609375, 28.53515625, 30.3603515625, 32.185546875, 34.0107421875, 35.8359375, 37.6611328125, 39.486328125, 41.3115234375, 43.13671875, 44.9619140625, 46.787109375, 48.6123046875, 50.4375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 0.0, 5.0, 7.0, 6.0, 10.0, 9.0, 10.0, 13.0, 12.0, 16.0, 21.0, 24.0, 42.0, 32.0, 42.0, 54.0, 64.0, 68.0, 57.0, 54.0, 72.0, 47.0, 63.0, 43.0, 28.0, 24.0, 35.0, 25.0, 24.0, 21.0, 13.0, 9.0, 11.0, 4.0, 11.0, 6.0, 2.0, 7.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.25, -15.73974609375, -15.2294921875, -14.71923828125, -14.208984375, -13.69873046875, -13.1884765625, -12.67822265625, -12.16796875, -11.65771484375, -11.1474609375, -10.63720703125, -10.126953125, -9.61669921875, -9.1064453125, -8.59619140625, -8.0859375, -7.57568359375, -7.0654296875, -6.55517578125, -6.044921875, -5.53466796875, -5.0244140625, -4.51416015625, -4.00390625, -3.49365234375, -2.9833984375, -2.47314453125, -1.962890625, -1.45263671875, -0.9423828125, -0.43212890625, 0.078125, 0.58837890625, 1.0986328125, 1.60888671875, 2.119140625, 2.62939453125, 3.1396484375, 3.64990234375, 4.16015625, 4.67041015625, 5.1806640625, 5.69091796875, 6.201171875, 6.71142578125, 7.2216796875, 7.73193359375, 8.2421875, 8.75244140625, 9.2626953125, 9.77294921875, 10.283203125, 10.79345703125, 11.3037109375, 11.81396484375, 12.32421875, 12.83447265625, 13.3447265625, 13.85498046875, 14.365234375, 14.87548828125, 15.3857421875, 15.89599609375, 16.40625]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 1.0, 4.0, 6.0, 7.0, 9.0, 12.0, 7.0, 11.0, 20.0, 26.0, 18.0, 25.0, 33.0, 32.0, 46.0, 43.0, 40.0, 40.0, 41.0, 43.0, 39.0, 40.0, 35.0, 45.0, 38.0, 40.0, 29.0, 32.0, 38.0, 20.0, 18.0, 21.0, 25.0, 22.0, 18.0, 14.0, 12.0, 11.0, 7.0, 7.0, 5.0, 10.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-131.89218139648438, -128.23825073242188, -124.58432006835938, -120.93038940429688, -117.27645874023438, -113.62252807617188, -109.96859741210938, -106.31466674804688, -102.66073608398438, -99.00680541992188, -95.35287475585938, -91.69894409179688, -88.04501342773438, -84.39108276367188, -80.73715209960938, -77.08322143554688, -73.4292984008789, -69.7753677368164, -66.1214370727539, -62.467506408691406, -58.813575744628906, -55.159645080566406, -51.50571823120117, -47.85178756713867, -44.19785690307617, -40.54392623901367, -36.88999557495117, -33.23606872558594, -29.582136154174805, -25.928205490112305, -22.274276733398438, -18.620346069335938, -14.966407775878906, -11.312477111816406, -7.658547401428223, -4.004617691040039, -0.35068702697753906, 3.303243637084961, 6.957172393798828, 10.611103057861328, 14.265033721923828, 17.918964385986328, 21.572895050048828, 25.226823806762695, 28.880754470825195, 32.53468322753906, 36.18861389160156, 39.84254455566406, 43.49647521972656, 47.15040588378906, 50.80433654785156, 54.45826721191406, 58.11219787597656, 61.76612854003906, 65.42005920410156, 69.07398986816406, 72.72792053222656, 76.38185119628906, 80.03578186035156, 83.68971252441406, 87.34364318847656, 90.99757385253906, 94.65150451660156, 98.30543518066406, 101.95935821533203]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 9.0, 7.0, 8.0, 9.0, 7.0, 11.0, 6.0, 18.0, 17.0, 28.0, 32.0, 15.0, 29.0, 27.0, 34.0, 31.0, 33.0, 42.0, 37.0, 35.0, 46.0, 39.0, 52.0, 45.0, 55.0, 45.0, 32.0, 33.0, 24.0, 33.0, 28.0, 28.0, 20.0, 14.0, 16.0, 7.0, 10.0, 10.0, 9.0, 4.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-117.27581024169922, -113.78746032714844, -110.29911804199219, -106.8107681274414, -103.32241821289062, -99.83407592773438, -96.3457260131836, -92.85737609863281, -89.36903381347656, -85.88068389892578, -82.39234161376953, -78.90399169921875, -75.41564178466797, -71.92729187011719, -68.43894958496094, -64.95059967041016, -61.462249755859375, -57.97390365600586, -54.48555374145508, -50.99720764160156, -47.50885772705078, -44.020511627197266, -40.53216552734375, -37.04381561279297, -33.55546951293945, -30.067121505737305, -26.578773498535156, -23.09042739868164, -19.602079391479492, -16.113731384277344, -12.625385284423828, -9.13703727722168, -5.648689270019531, -2.160341739654541, 1.3280057907104492, 4.816352844238281, 8.30470085144043, 11.793048858642578, 15.281394958496094, 18.769742965698242, 22.25809097290039, 25.74643898010254, 29.234786987304688, 32.7231330871582, 36.21147918701172, 39.6998291015625, 43.188175201416016, 46.67652130126953, 50.16487121582031, 53.65321731567383, 57.14156723022461, 60.629913330078125, 64.1182632446289, 67.60661315917969, 71.09495544433594, 74.58330535888672, 78.0716552734375, 81.56000518798828, 85.04834747314453, 88.53669738769531, 92.0250473022461, 95.51339721679688, 99.00173950195312, 102.4900894165039, 105.97843170166016]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 8.0, 19.0, 25.0, 45.0, 86.0, 112.0, 207.0, 351.0, 599.0, 904.0, 1393.0, 2141.0, 3391.0, 5237.0, 7891.0, 11211.0, 15876.0, 22017.0, 29885.0, 38464.0, 48679.0, 58909.0, 68732.0, 76592.0, 82007.0, 84470.0, 83043.0, 78457.0, 69738.0, 60474.0, 50398.0, 40140.0, 31010.0, 23257.0, 16895.0, 11860.0, 8121.0, 5548.0, 3758.0, 2420.0, 1561.0, 1021.0, 601.0, 391.0, 244.0, 155.0, 88.0, 50.0, 27.0, 22.0, 15.0, 11.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-74.9375, -72.6376953125, -70.337890625, -68.0380859375, -65.73828125, -63.4384765625, -61.138671875, -58.8388671875, -56.5390625, -54.2392578125, -51.939453125, -49.6396484375, -47.33984375, -45.0400390625, -42.740234375, -40.4404296875, -38.140625, -35.8408203125, -33.541015625, -31.2412109375, -28.94140625, -26.6416015625, -24.341796875, -22.0419921875, -19.7421875, -17.4423828125, -15.142578125, -12.8427734375, -10.54296875, -8.2431640625, -5.943359375, -3.6435546875, -1.34375, 0.9560546875, 3.255859375, 5.5556640625, 7.85546875, 10.1552734375, 12.455078125, 14.7548828125, 17.0546875, 19.3544921875, 21.654296875, 23.9541015625, 26.25390625, 28.5537109375, 30.853515625, 33.1533203125, 35.453125, 37.7529296875, 40.052734375, 42.3525390625, 44.65234375, 46.9521484375, 49.251953125, 51.5517578125, 53.8515625, 56.1513671875, 58.451171875, 60.7509765625, 63.05078125, 65.3505859375, 67.650390625, 69.9501953125, 72.25]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 8.0, 8.0, 7.0, 9.0, 6.0, 13.0, 6.0, 18.0, 23.0, 25.0, 27.0, 21.0, 25.0, 27.0, 37.0, 34.0, 30.0, 42.0, 37.0, 39.0, 41.0, 41.0, 49.0, 50.0, 49.0, 47.0, 37.0, 26.0, 32.0, 31.0, 26.0, 26.0, 19.0, 16.0, 14.0, 5.0, 13.0, 10.0, 7.0, 3.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-113.8125, -110.416015625, -107.01953125, -103.623046875, -100.2265625, -96.830078125, -93.43359375, -90.037109375, -86.640625, -83.244140625, -79.84765625, -76.451171875, -73.0546875, -69.658203125, -66.26171875, -62.865234375, -59.46875, -56.072265625, -52.67578125, -49.279296875, -45.8828125, -42.486328125, -39.08984375, -35.693359375, -32.296875, -28.900390625, -25.50390625, -22.107421875, -18.7109375, -15.314453125, -11.91796875, -8.521484375, -5.125, -1.728515625, 1.66796875, 5.064453125, 8.4609375, 11.857421875, 15.25390625, 18.650390625, 22.046875, 25.443359375, 28.83984375, 32.236328125, 35.6328125, 39.029296875, 42.42578125, 45.822265625, 49.21875, 52.615234375, 56.01171875, 59.408203125, 62.8046875, 66.201171875, 69.59765625, 72.994140625, 76.390625, 79.787109375, 83.18359375, 86.580078125, 89.9765625, 93.373046875, 96.76953125, 100.166015625, 103.5625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 9.0, 22.0, 27.0, 32.0, 67.0, 93.0, 173.0, 288.0, 471.0, 736.0, 1166.0, 1850.0, 2860.0, 4453.0, 6870.0, 9951.0, 14582.0, 20478.0, 28338.0, 37386.0, 48455.0, 59582.0, 69717.0, 79201.0, 85570.0, 87243.0, 86073.0, 80382.0, 72040.0, 62265.0, 50143.0, 38990.0, 29951.0, 21702.0, 15808.0, 11033.0, 7188.0, 4866.0, 3169.0, 1989.0, 1288.0, 813.0, 493.0, 289.0, 190.0, 108.0, 67.0, 35.0, 25.0, 11.0, 14.0, 6.0, 3.0, 4.0, 2.0, 1.0], "bins": [-79.625, -77.2548828125, -74.884765625, -72.5146484375, -70.14453125, -67.7744140625, -65.404296875, -63.0341796875, -60.6640625, -58.2939453125, -55.923828125, -53.5537109375, -51.18359375, -48.8134765625, -46.443359375, -44.0732421875, -41.703125, -39.3330078125, -36.962890625, -34.5927734375, -32.22265625, -29.8525390625, -27.482421875, -25.1123046875, -22.7421875, -20.3720703125, -18.001953125, -15.6318359375, -13.26171875, -10.8916015625, -8.521484375, -6.1513671875, -3.78125, -1.4111328125, 0.958984375, 3.3291015625, 5.69921875, 8.0693359375, 10.439453125, 12.8095703125, 15.1796875, 17.5498046875, 19.919921875, 22.2900390625, 24.66015625, 27.0302734375, 29.400390625, 31.7705078125, 34.140625, 36.5107421875, 38.880859375, 41.2509765625, 43.62109375, 45.9912109375, 48.361328125, 50.7314453125, 53.1015625, 55.4716796875, 57.841796875, 60.2119140625, 62.58203125, 64.9521484375, 67.322265625, 69.6923828125, 72.0625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 5.0, 6.0, 7.0, 15.0, 5.0, 11.0, 15.0, 21.0, 12.0, 19.0, 23.0, 35.0, 36.0, 26.0, 32.0, 36.0, 37.0, 47.0, 49.0, 38.0, 43.0, 43.0, 47.0, 50.0, 26.0, 38.0, 36.0, 29.0, 28.0, 33.0, 34.0, 22.0, 20.0, 16.0, 12.0, 14.0, 8.0, 7.0, 6.0, 6.0, 3.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-78.25, -75.8623046875, -73.474609375, -71.0869140625, -68.69921875, -66.3115234375, -63.923828125, -61.5361328125, -59.1484375, -56.7607421875, -54.373046875, -51.9853515625, -49.59765625, -47.2099609375, -44.822265625, -42.4345703125, -40.046875, -37.6591796875, -35.271484375, -32.8837890625, -30.49609375, -28.1083984375, -25.720703125, -23.3330078125, -20.9453125, -18.5576171875, -16.169921875, -13.7822265625, -11.39453125, -9.0068359375, -6.619140625, -4.2314453125, -1.84375, 0.5439453125, 2.931640625, 5.3193359375, 7.70703125, 10.0947265625, 12.482421875, 14.8701171875, 17.2578125, 19.6455078125, 22.033203125, 24.4208984375, 26.80859375, 29.1962890625, 31.583984375, 33.9716796875, 36.359375, 38.7470703125, 41.134765625, 43.5224609375, 45.91015625, 48.2978515625, 50.685546875, 53.0732421875, 55.4609375, 57.8486328125, 60.236328125, 62.6240234375, 65.01171875, 67.3994140625, 69.787109375, 72.1748046875, 74.5625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 9.0, 13.0, 11.0, 31.0, 59.0, 78.0, 152.0, 282.0, 574.0, 1073.0, 2239.0, 4310.0, 8210.0, 15665.0, 28177.0, 48592.0, 76441.0, 108045.0, 136199.0, 149323.0, 141754.0, 116635.0, 84250.0, 54778.0, 32864.0, 18326.0, 9819.0, 5164.0, 2617.0, 1329.0, 683.0, 400.0, 170.0, 110.0, 55.0, 40.0, 32.0, 16.0, 6.0, 6.0, 1.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-52.5, -50.93896484375, -49.3779296875, -47.81689453125, -46.255859375, -44.69482421875, -43.1337890625, -41.57275390625, -40.01171875, -38.45068359375, -36.8896484375, -35.32861328125, -33.767578125, -32.20654296875, -30.6455078125, -29.08447265625, -27.5234375, -25.96240234375, -24.4013671875, -22.84033203125, -21.279296875, -19.71826171875, -18.1572265625, -16.59619140625, -15.03515625, -13.47412109375, -11.9130859375, -10.35205078125, -8.791015625, -7.22998046875, -5.6689453125, -4.10791015625, -2.546875, -0.98583984375, 0.5751953125, 2.13623046875, 3.697265625, 5.25830078125, 6.8193359375, 8.38037109375, 9.94140625, 11.50244140625, 13.0634765625, 14.62451171875, 16.185546875, 17.74658203125, 19.3076171875, 20.86865234375, 22.4296875, 23.99072265625, 25.5517578125, 27.11279296875, 28.673828125, 30.23486328125, 31.7958984375, 33.35693359375, 34.91796875, 36.47900390625, 38.0400390625, 39.60107421875, 41.162109375, 42.72314453125, 44.2841796875, 45.84521484375, 47.40625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 9.0, 9.0, 7.0, 9.0, 18.0, 11.0, 25.0, 30.0, 29.0, 33.0, 37.0, 41.0, 39.0, 38.0, 43.0, 52.0, 53.0, 56.0, 52.0, 43.0, 43.0, 50.0, 33.0, 38.0, 35.0, 30.0, 20.0, 19.0, 20.0, 11.0, 17.0, 6.0, 8.0, 5.0, 8.0, 3.0, 5.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.005550384521484375, -0.0053879618644714355, -0.005225539207458496, -0.005063116550445557, -0.004900693893432617, -0.004738271236419678, -0.004575848579406738, -0.004413425922393799, -0.004251003265380859, -0.00408858060836792, -0.0039261579513549805, -0.003763735294342041, -0.0036013126373291016, -0.003438889980316162, -0.0032764673233032227, -0.003114044666290283, -0.0029516220092773438, -0.0027891993522644043, -0.002626776695251465, -0.0024643540382385254, -0.002301931381225586, -0.0021395087242126465, -0.001977086067199707, -0.0018146634101867676, -0.0016522407531738281, -0.0014898180961608887, -0.0013273954391479492, -0.0011649727821350098, -0.0010025501251220703, -0.0008401274681091309, -0.0006777048110961914, -0.000515282154083252, -0.0003528594970703125, -0.00019043684005737305, -2.8014183044433594e-05, 0.00013440847396850586, 0.0002968311309814453, 0.00045925378799438477, 0.0006216764450073242, 0.0007840991020202637, 0.0009465217590332031, 0.0011089444160461426, 0.001271367073059082, 0.0014337897300720215, 0.001596212387084961, 0.0017586350440979004, 0.0019210577011108398, 0.0020834803581237793, 0.0022459030151367188, 0.002408325672149658, 0.0025707483291625977, 0.002733170986175537, 0.0028955936431884766, 0.003058016300201416, 0.0032204389572143555, 0.003382861614227295, 0.0035452842712402344, 0.003707706928253174, 0.0038701295852661133, 0.004032552242279053, 0.004194974899291992, 0.004357397556304932, 0.004519820213317871, 0.0046822428703308105, 0.00484466552734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 4.0, 6.0, 10.0, 25.0, 25.0, 60.0, 87.0, 121.0, 190.0, 290.0, 474.0, 721.0, 1155.0, 1679.0, 2593.0, 3778.0, 5695.0, 8217.0, 11518.0, 16089.0, 22651.0, 30404.0, 39738.0, 49797.0, 60747.0, 70535.0, 78943.0, 84735.0, 86548.0, 83946.0, 77054.0, 69060.0, 58043.0, 47065.0, 37129.0, 28752.0, 21263.0, 15459.0, 10804.0, 7555.0, 5225.0, 3533.0, 2372.0, 1603.0, 1043.0, 632.0, 445.0, 266.0, 181.0, 101.0, 75.0, 47.0, 32.0, 19.0, 11.0, 6.0, 5.0, 5.0, 0.0, 1.0, 1.0], "bins": [-30.390625, -29.422607421875, -28.45458984375, -27.486572265625, -26.5185546875, -25.550537109375, -24.58251953125, -23.614501953125, -22.646484375, -21.678466796875, -20.71044921875, -19.742431640625, -18.7744140625, -17.806396484375, -16.83837890625, -15.870361328125, -14.90234375, -13.934326171875, -12.96630859375, -11.998291015625, -11.0302734375, -10.062255859375, -9.09423828125, -8.126220703125, -7.158203125, -6.190185546875, -5.22216796875, -4.254150390625, -3.2861328125, -2.318115234375, -1.35009765625, -0.382080078125, 0.5859375, 1.553955078125, 2.52197265625, 3.489990234375, 4.4580078125, 5.426025390625, 6.39404296875, 7.362060546875, 8.330078125, 9.298095703125, 10.26611328125, 11.234130859375, 12.2021484375, 13.170166015625, 14.13818359375, 15.106201171875, 16.07421875, 17.042236328125, 18.01025390625, 18.978271484375, 19.9462890625, 20.914306640625, 21.88232421875, 22.850341796875, 23.818359375, 24.786376953125, 25.75439453125, 26.722412109375, 27.6904296875, 28.658447265625, 29.62646484375, 30.594482421875, 31.5625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 4.0, 16.0, 11.0, 13.0, 12.0, 15.0, 14.0, 21.0, 27.0, 21.0, 41.0, 29.0, 30.0, 53.0, 34.0, 44.0, 46.0, 48.0, 36.0, 49.0, 37.0, 38.0, 26.0, 45.0, 48.0, 38.0, 28.0, 27.0, 24.0, 19.0, 19.0, 6.0, 14.0, 16.0, 6.0, 7.0, 6.0, 7.0, 7.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-15.078125, -14.586669921875, -14.09521484375, -13.603759765625, -13.1123046875, -12.620849609375, -12.12939453125, -11.637939453125, -11.146484375, -10.655029296875, -10.16357421875, -9.672119140625, -9.1806640625, -8.689208984375, -8.19775390625, -7.706298828125, -7.21484375, -6.723388671875, -6.23193359375, -5.740478515625, -5.2490234375, -4.757568359375, -4.26611328125, -3.774658203125, -3.283203125, -2.791748046875, -2.30029296875, -1.808837890625, -1.3173828125, -0.825927734375, -0.33447265625, 0.156982421875, 0.6484375, 1.139892578125, 1.63134765625, 2.122802734375, 2.6142578125, 3.105712890625, 3.59716796875, 4.088623046875, 4.580078125, 5.071533203125, 5.56298828125, 6.054443359375, 6.5458984375, 7.037353515625, 7.52880859375, 8.020263671875, 8.51171875, 9.003173828125, 9.49462890625, 9.986083984375, 10.4775390625, 10.968994140625, 11.46044921875, 11.951904296875, 12.443359375, 12.934814453125, 13.42626953125, 13.917724609375, 14.4091796875, 14.900634765625, 15.39208984375, 15.883544921875, 16.375]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 1.0, 5.0, 4.0, 1.0, 10.0, 6.0, 15.0, 8.0, 9.0, 22.0, 24.0, 18.0, 29.0, 39.0, 37.0, 44.0, 44.0, 38.0, 45.0, 49.0, 35.0, 43.0, 44.0, 28.0, 36.0, 32.0, 42.0, 39.0, 34.0, 35.0, 18.0, 22.0, 28.0, 16.0, 19.0, 21.0, 13.0, 10.0, 12.0, 5.0, 4.0, 3.0, 4.0, 5.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.87712097167969, -102.23286437988281, -98.5886001586914, -94.94434356689453, -91.30007934570312, -87.65582275390625, -84.01156616210938, -80.3673095703125, -76.7230453491211, -73.07878875732422, -69.43452453613281, -65.79026794433594, -62.1460075378418, -58.501747131347656, -54.85749053955078, -51.21323013305664, -47.5689697265625, -43.92470932006836, -40.28044891357422, -36.636192321777344, -32.9919319152832, -29.347671508789062, -25.703413009643555, -22.059154510498047, -18.414894104003906, -14.770634651184082, -11.126375198364258, -7.482115745544434, -3.8378562927246094, -0.19359588623046875, 3.450662612915039, 7.094921112060547, 10.739173889160156, 14.38343334197998, 18.027692794799805, 21.671951293945312, 25.316211700439453, 28.960472106933594, 32.60472869873047, 36.24898910522461, 39.89324951171875, 43.53750991821289, 47.18177032470703, 50.826026916503906, 54.47028732299805, 58.11454772949219, 61.75880432128906, 65.40306091308594, 69.04732513427734, 72.69158172607422, 76.33584594726562, 79.9801025390625, 83.62435913085938, 87.26862335205078, 90.91287994384766, 94.55714416503906, 98.20140075683594, 101.84565734863281, 105.48992156982422, 109.1341781616211, 112.7784423828125, 116.42269897460938, 120.06695556640625, 123.71121215820312, 127.35547637939453]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 11.0, 8.0, 17.0, 9.0, 12.0, 18.0, 22.0, 20.0, 22.0, 22.0, 26.0, 31.0, 38.0, 28.0, 29.0, 36.0, 41.0, 40.0, 43.0, 40.0, 41.0, 40.0, 36.0, 46.0, 32.0, 30.0, 30.0, 36.0, 39.0, 20.0, 20.0, 22.0, 15.0, 11.0, 12.0, 10.0, 5.0, 6.0, 6.0, 7.0, 1.0, 5.0, 5.0, 0.0, 4.0, 0.0, 3.0], "bins": [-122.56629180908203, -119.14018249511719, -115.71406555175781, -112.28795623779297, -108.86184692382812, -105.43572998046875, -102.0096206665039, -98.58351135253906, -95.15739440917969, -91.73128509521484, -88.30516815185547, -84.87905883789062, -81.45294189453125, -78.0268325805664, -74.60072326660156, -71.17460632324219, -67.74849700927734, -64.3223876953125, -60.896270751953125, -57.47016143798828, -54.04404830932617, -50.61793518066406, -47.19182586669922, -43.76571273803711, -40.339599609375, -36.91348648071289, -33.48737335205078, -30.061264038085938, -26.635150909423828, -23.20903778076172, -19.782926559448242, -16.356815338134766, -12.930709838867188, -9.504597663879395, -6.078485488891602, -2.6523733139038086, 0.7737388610839844, 4.199851989746094, 7.62596321105957, 11.052074432373047, 14.478187561035156, 17.904300689697266, 21.330411911010742, 24.75652313232422, 28.182636260986328, 31.608749389648438, 35.03485870361328, 38.46097183227539, 41.8870849609375, 45.31319808959961, 48.73931121826172, 52.16542053222656, 55.59153366088867, 59.01764678955078, 62.443756103515625, 65.869873046875, 69.29598236083984, 72.72209167480469, 76.14820861816406, 79.5743179321289, 83.00042724609375, 86.42654418945312, 89.85265350341797, 93.27876281738281, 96.70487976074219]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 7.0, 11.0, 19.0, 41.0, 58.0, 82.0, 136.0, 230.0, 376.0, 644.0, 1023.0, 1679.0, 2746.0, 4343.0, 6747.0, 10501.0, 16596.0, 24941.0, 37055.0, 55360.0, 79316.0, 111270.0, 152219.0, 199090.0, 252809.0, 303435.0, 345140.0, 375728.0, 381285.0, 366420.0, 331559.0, 283413.0, 232251.0, 180695.0, 134509.0, 98320.0, 68446.0, 47348.0, 31635.0, 20639.0, 13464.0, 8632.0, 5365.0, 3320.0, 2090.0, 1311.0, 789.0, 510.0, 271.0, 149.0, 113.0, 53.0, 38.0, 27.0, 7.0, 14.0, 8.0, 6.0, 1.0, 3.0, 1.0], "bins": [-76.4375, -73.9951171875, -71.552734375, -69.1103515625, -66.66796875, -64.2255859375, -61.783203125, -59.3408203125, -56.8984375, -54.4560546875, -52.013671875, -49.5712890625, -47.12890625, -44.6865234375, -42.244140625, -39.8017578125, -37.359375, -34.9169921875, -32.474609375, -30.0322265625, -27.58984375, -25.1474609375, -22.705078125, -20.2626953125, -17.8203125, -15.3779296875, -12.935546875, -10.4931640625, -8.05078125, -5.6083984375, -3.166015625, -0.7236328125, 1.71875, 4.1611328125, 6.603515625, 9.0458984375, 11.48828125, 13.9306640625, 16.373046875, 18.8154296875, 21.2578125, 23.7001953125, 26.142578125, 28.5849609375, 31.02734375, 33.4697265625, 35.912109375, 38.3544921875, 40.796875, 43.2392578125, 45.681640625, 48.1240234375, 50.56640625, 53.0087890625, 55.451171875, 57.8935546875, 60.3359375, 62.7783203125, 65.220703125, 67.6630859375, 70.10546875, 72.5478515625, 74.990234375, 77.4326171875, 79.875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 5.0, 3.0, 7.0, 9.0, 10.0, 13.0, 10.0, 10.0, 20.0, 23.0, 20.0, 23.0, 25.0, 25.0, 25.0, 30.0, 38.0, 21.0, 37.0, 42.0, 36.0, 46.0, 45.0, 34.0, 40.0, 36.0, 38.0, 42.0, 28.0, 32.0, 36.0, 35.0, 26.0, 14.0, 22.0, 18.0, 12.0, 13.0, 10.0, 9.0, 8.0, 3.0, 5.0, 6.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-107.0625, -104.0205078125, -100.978515625, -97.9365234375, -94.89453125, -91.8525390625, -88.810546875, -85.7685546875, -82.7265625, -79.6845703125, -76.642578125, -73.6005859375, -70.55859375, -67.5166015625, -64.474609375, -61.4326171875, -58.390625, -55.3486328125, -52.306640625, -49.2646484375, -46.22265625, -43.1806640625, -40.138671875, -37.0966796875, -34.0546875, -31.0126953125, -27.970703125, -24.9287109375, -21.88671875, -18.8447265625, -15.802734375, -12.7607421875, -9.71875, -6.6767578125, -3.634765625, -0.5927734375, 2.44921875, 5.4912109375, 8.533203125, 11.5751953125, 14.6171875, 17.6591796875, 20.701171875, 23.7431640625, 26.78515625, 29.8271484375, 32.869140625, 35.9111328125, 38.953125, 41.9951171875, 45.037109375, 48.0791015625, 51.12109375, 54.1630859375, 57.205078125, 60.2470703125, 63.2890625, 66.3310546875, 69.373046875, 72.4150390625, 75.45703125, 78.4990234375, 81.541015625, 84.5830078125, 87.625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 10.0, 28.0, 53.0, 79.0, 153.0, 288.0, 467.0, 788.0, 1282.0, 2018.0, 3339.0, 5442.0, 8488.0, 13128.0, 20292.0, 30063.0, 44173.0, 62468.0, 87545.0, 118073.0, 153967.0, 194267.0, 236079.0, 275208.0, 309790.0, 332141.0, 341116.0, 335070.0, 314858.0, 281934.0, 243035.0, 201169.0, 158802.0, 122700.0, 91120.0, 66496.0, 46466.0, 32261.0, 21481.0, 13826.0, 9158.0, 5810.0, 3649.0, 2297.0, 1397.0, 818.0, 491.0, 299.0, 185.0, 88.0, 74.0, 36.0, 10.0, 11.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-74.5, -72.0634765625, -69.626953125, -67.1904296875, -64.75390625, -62.3173828125, -59.880859375, -57.4443359375, -55.0078125, -52.5712890625, -50.134765625, -47.6982421875, -45.26171875, -42.8251953125, -40.388671875, -37.9521484375, -35.515625, -33.0791015625, -30.642578125, -28.2060546875, -25.76953125, -23.3330078125, -20.896484375, -18.4599609375, -16.0234375, -13.5869140625, -11.150390625, -8.7138671875, -6.27734375, -3.8408203125, -1.404296875, 1.0322265625, 3.46875, 5.9052734375, 8.341796875, 10.7783203125, 13.21484375, 15.6513671875, 18.087890625, 20.5244140625, 22.9609375, 25.3974609375, 27.833984375, 30.2705078125, 32.70703125, 35.1435546875, 37.580078125, 40.0166015625, 42.453125, 44.8896484375, 47.326171875, 49.7626953125, 52.19921875, 54.6357421875, 57.072265625, 59.5087890625, 61.9453125, 64.3818359375, 66.818359375, 69.2548828125, 71.69140625, 74.1279296875, 76.564453125, 79.0009765625, 81.4375]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 8.0, 4.0, 12.0, 11.0, 16.0, 23.0, 31.0, 26.0, 27.0, 37.0, 65.0, 62.0, 78.0, 72.0, 87.0, 105.0, 122.0, 122.0, 148.0, 163.0, 160.0, 194.0, 152.0, 192.0, 194.0, 176.0, 162.0, 182.0, 168.0, 167.0, 143.0, 133.0, 107.0, 101.0, 103.0, 85.0, 75.0, 67.0, 61.0, 44.0, 35.0, 29.0, 38.0, 17.0, 18.0, 13.0, 18.0, 12.0, 4.0, 2.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.59375, -35.27001953125, -33.9462890625, -32.62255859375, -31.298828125, -29.97509765625, -28.6513671875, -27.32763671875, -26.00390625, -24.68017578125, -23.3564453125, -22.03271484375, -20.708984375, -19.38525390625, -18.0615234375, -16.73779296875, -15.4140625, -14.09033203125, -12.7666015625, -11.44287109375, -10.119140625, -8.79541015625, -7.4716796875, -6.14794921875, -4.82421875, -3.50048828125, -2.1767578125, -0.85302734375, 0.470703125, 1.79443359375, 3.1181640625, 4.44189453125, 5.765625, 7.08935546875, 8.4130859375, 9.73681640625, 11.060546875, 12.38427734375, 13.7080078125, 15.03173828125, 16.35546875, 17.67919921875, 19.0029296875, 20.32666015625, 21.650390625, 22.97412109375, 24.2978515625, 25.62158203125, 26.9453125, 28.26904296875, 29.5927734375, 30.91650390625, 32.240234375, 33.56396484375, 34.8876953125, 36.21142578125, 37.53515625, 38.85888671875, 40.1826171875, 41.50634765625, 42.830078125, 44.15380859375, 45.4775390625, 46.80126953125, 48.125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 6.0, 11.0, 8.0, 11.0, 18.0, 16.0, 22.0, 32.0, 26.0, 30.0, 28.0, 28.0, 50.0, 56.0, 47.0, 49.0, 51.0, 47.0, 52.0, 44.0, 48.0, 38.0, 44.0, 27.0, 22.0, 40.0, 27.0, 14.0, 27.0, 19.0, 12.0, 7.0, 6.0, 9.0, 4.0, 6.0, 4.0, 1.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.84194946289062, -106.7968978881836, -102.75184631347656, -98.70679473876953, -94.6617431640625, -90.61668395996094, -86.5716323852539, -82.52658081054688, -78.48152923583984, -74.43647766113281, -70.39142608642578, -66.34637451171875, -62.30131912231445, -58.25626754760742, -54.211212158203125, -50.166160583496094, -46.12110900878906, -42.07605743408203, -38.031005859375, -33.9859504699707, -29.940898895263672, -25.89584732055664, -21.850793838500977, -17.805740356445312, -13.760688781738281, -9.715636253356934, -5.670583724975586, -1.6255311965942383, 2.4195213317871094, 6.464572906494141, 10.509626388549805, 14.554679870605469, 18.5997314453125, 22.64478302001953, 26.689836502075195, 30.73488998413086, 34.77994155883789, 38.82499313354492, 42.87004852294922, 46.91510009765625, 50.96015167236328, 55.00520324707031, 59.050254821777344, 63.09531021118164, 67.14036560058594, 71.18540954589844, 75.23046875, 79.27552032470703, 83.32057189941406, 87.3656234741211, 91.41067504882812, 95.45572662353516, 99.50077819824219, 103.54583740234375, 107.59088897705078, 111.63594055175781, 115.68099212646484, 119.72604370117188, 123.7710952758789, 127.81614685058594, 131.8612060546875, 135.90625, 139.95130920410156, 143.99636840820312, 148.04141235351562]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 7.0, 10.0, 9.0, 7.0, 8.0, 12.0, 22.0, 24.0, 19.0, 25.0, 25.0, 28.0, 30.0, 28.0, 31.0, 39.0, 30.0, 42.0, 40.0, 41.0, 37.0, 46.0, 41.0, 48.0, 39.0, 45.0, 36.0, 26.0, 34.0, 25.0, 31.0, 23.0, 10.0, 21.0, 16.0, 11.0, 8.0, 4.0, 9.0, 5.0, 5.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-127.93498992919922, -124.26873016357422, -120.60247802734375, -116.93621826171875, -113.26996612548828, -109.60370635986328, -105.93745422363281, -102.27119445800781, -98.60493469238281, -94.93867492675781, -91.27242279052734, -87.60616302490234, -83.93991088867188, -80.27365112304688, -76.60739135742188, -72.9411392211914, -69.27488708496094, -65.60862731933594, -61.94237518310547, -58.27611541748047, -54.609859466552734, -50.943603515625, -47.277347564697266, -43.61109161376953, -39.94483184814453, -36.2785758972168, -32.61231994628906, -28.946062088012695, -25.279804229736328, -21.613548278808594, -17.94729232788086, -14.281034469604492, -10.614776611328125, -6.948519706726074, -3.2822632789611816, 0.38399314880371094, 4.050250053405762, 7.7165069580078125, 11.382762908935547, 15.049020767211914, 18.71527671813965, 22.381532669067383, 26.04779052734375, 29.714046478271484, 33.38030242919922, 37.04656219482422, 40.71281433105469, 44.37907409667969, 48.04533004760742, 51.711585998535156, 55.37784194946289, 59.044097900390625, 62.710357666015625, 66.37661743164062, 70.0428695678711, 73.7091293334961, 77.37538146972656, 81.04164123535156, 84.70789337158203, 88.37415313720703, 92.0404052734375, 95.7066650390625, 99.3729248046875, 103.03917694091797, 106.70543670654297]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 8.0, 7.0, 14.0, 22.0, 26.0, 20.0, 47.0, 58.0, 91.0, 154.0, 266.0, 409.0, 762.0, 1253.0, 2258.0, 4168.0, 7945.0, 14615.0, 28371.0, 55214.0, 102020.0, 163521.0, 206883.0, 186314.0, 125307.0, 71088.0, 37140.0, 18775.0, 9804.0, 5286.0, 2797.0, 1606.0, 892.0, 504.0, 328.0, 193.0, 134.0, 80.0, 42.0, 43.0, 25.0, 20.0, 16.0, 8.0, 8.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-86.75, -84.0966796875, -81.443359375, -78.7900390625, -76.13671875, -73.4833984375, -70.830078125, -68.1767578125, -65.5234375, -62.8701171875, -60.216796875, -57.5634765625, -54.91015625, -52.2568359375, -49.603515625, -46.9501953125, -44.296875, -41.6435546875, -38.990234375, -36.3369140625, -33.68359375, -31.0302734375, -28.376953125, -25.7236328125, -23.0703125, -20.4169921875, -17.763671875, -15.1103515625, -12.45703125, -9.8037109375, -7.150390625, -4.4970703125, -1.84375, 0.8095703125, 3.462890625, 6.1162109375, 8.76953125, 11.4228515625, 14.076171875, 16.7294921875, 19.3828125, 22.0361328125, 24.689453125, 27.3427734375, 29.99609375, 32.6494140625, 35.302734375, 37.9560546875, 40.609375, 43.2626953125, 45.916015625, 48.5693359375, 51.22265625, 53.8759765625, 56.529296875, 59.1826171875, 61.8359375, 64.4892578125, 67.142578125, 69.7958984375, 72.44921875, 75.1025390625, 77.755859375, 80.4091796875, 83.0625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 11.0, 7.0, 8.0, 8.0, 16.0, 18.0, 25.0, 20.0, 23.0, 26.0, 28.0, 31.0, 29.0, 31.0, 37.0, 31.0, 42.0, 41.0, 40.0, 39.0, 45.0, 44.0, 40.0, 43.0, 47.0, 33.0, 28.0, 31.0, 29.0, 30.0, 20.0, 12.0, 23.0, 14.0, 9.0, 8.0, 6.0, 7.0, 5.0, 6.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-128.0, -124.3427734375, -120.685546875, -117.0283203125, -113.37109375, -109.7138671875, -106.056640625, -102.3994140625, -98.7421875, -95.0849609375, -91.427734375, -87.7705078125, -84.11328125, -80.4560546875, -76.798828125, -73.1416015625, -69.484375, -65.8271484375, -62.169921875, -58.5126953125, -54.85546875, -51.1982421875, -47.541015625, -43.8837890625, -40.2265625, -36.5693359375, -32.912109375, -29.2548828125, -25.59765625, -21.9404296875, -18.283203125, -14.6259765625, -10.96875, -7.3115234375, -3.654296875, 0.0029296875, 3.66015625, 7.3173828125, 10.974609375, 14.6318359375, 18.2890625, 21.9462890625, 25.603515625, 29.2607421875, 32.91796875, 36.5751953125, 40.232421875, 43.8896484375, 47.546875, 51.2041015625, 54.861328125, 58.5185546875, 62.17578125, 65.8330078125, 69.490234375, 73.1474609375, 76.8046875, 80.4619140625, 84.119140625, 87.7763671875, 91.43359375, 95.0908203125, 98.748046875, 102.4052734375, 106.0625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 3.0, 2.0, 7.0, 4.0, 8.0, 9.0, 29.0, 35.0, 56.0, 60.0, 86.0, 142.0, 237.0, 316.0, 581.0, 872.0, 1528.0, 2789.0, 5278.0, 11076.0, 25443.0, 68623.0, 197461.0, 369080.0, 227797.0, 81635.0, 29547.0, 12542.0, 5881.0, 3061.0, 1648.0, 959.0, 621.0, 404.0, 215.0, 174.0, 103.0, 87.0, 43.0, 28.0, 28.0, 19.0, 15.0, 9.0, 8.0, 6.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-119.8125, -116.134765625, -112.45703125, -108.779296875, -105.1015625, -101.423828125, -97.74609375, -94.068359375, -90.390625, -86.712890625, -83.03515625, -79.357421875, -75.6796875, -72.001953125, -68.32421875, -64.646484375, -60.96875, -57.291015625, -53.61328125, -49.935546875, -46.2578125, -42.580078125, -38.90234375, -35.224609375, -31.546875, -27.869140625, -24.19140625, -20.513671875, -16.8359375, -13.158203125, -9.48046875, -5.802734375, -2.125, 1.552734375, 5.23046875, 8.908203125, 12.5859375, 16.263671875, 19.94140625, 23.619140625, 27.296875, 30.974609375, 34.65234375, 38.330078125, 42.0078125, 45.685546875, 49.36328125, 53.041015625, 56.71875, 60.396484375, 64.07421875, 67.751953125, 71.4296875, 75.107421875, 78.78515625, 82.462890625, 86.140625, 89.818359375, 93.49609375, 97.173828125, 100.8515625, 104.529296875, 108.20703125, 111.884765625, 115.5625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 8.0, 11.0, 10.0, 12.0, 9.0, 20.0, 22.0, 18.0, 19.0, 25.0, 26.0, 28.0, 27.0, 30.0, 30.0, 43.0, 33.0, 29.0, 47.0, 48.0, 38.0, 35.0, 47.0, 28.0, 35.0, 47.0, 27.0, 29.0, 28.0, 30.0, 19.0, 22.0, 17.0, 15.0, 17.0, 16.0, 9.0, 10.0, 8.0, 13.0, 8.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-79.0625, -76.87255859375, -74.6826171875, -72.49267578125, -70.302734375, -68.11279296875, -65.9228515625, -63.73291015625, -61.54296875, -59.35302734375, -57.1630859375, -54.97314453125, -52.783203125, -50.59326171875, -48.4033203125, -46.21337890625, -44.0234375, -41.83349609375, -39.6435546875, -37.45361328125, -35.263671875, -33.07373046875, -30.8837890625, -28.69384765625, -26.50390625, -24.31396484375, -22.1240234375, -19.93408203125, -17.744140625, -15.55419921875, -13.3642578125, -11.17431640625, -8.984375, -6.79443359375, -4.6044921875, -2.41455078125, -0.224609375, 1.96533203125, 4.1552734375, 6.34521484375, 8.53515625, 10.72509765625, 12.9150390625, 15.10498046875, 17.294921875, 19.48486328125, 21.6748046875, 23.86474609375, 26.0546875, 28.24462890625, 30.4345703125, 32.62451171875, 34.814453125, 37.00439453125, 39.1943359375, 41.38427734375, 43.57421875, 45.76416015625, 47.9541015625, 50.14404296875, 52.333984375, 54.52392578125, 56.7138671875, 58.90380859375, 61.09375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 2.0, 4.0, 5.0, 9.0, 8.0, 18.0, 11.0, 17.0, 25.0, 40.0, 61.0, 81.0, 131.0, 172.0, 248.0, 328.0, 562.0, 892.0, 1564.0, 2831.0, 5919.0, 13905.0, 37794.0, 134532.0, 472292.0, 269980.0, 66841.0, 21933.0, 8895.0, 4053.0, 2157.0, 1177.0, 705.0, 410.0, 273.0, 206.0, 122.0, 113.0, 59.0, 50.0, 38.0, 22.0, 18.0, 10.0, 10.0, 10.0, 10.0, 10.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-87.4375, -84.7666015625, -82.095703125, -79.4248046875, -76.75390625, -74.0830078125, -71.412109375, -68.7412109375, -66.0703125, -63.3994140625, -60.728515625, -58.0576171875, -55.38671875, -52.7158203125, -50.044921875, -47.3740234375, -44.703125, -42.0322265625, -39.361328125, -36.6904296875, -34.01953125, -31.3486328125, -28.677734375, -26.0068359375, -23.3359375, -20.6650390625, -17.994140625, -15.3232421875, -12.65234375, -9.9814453125, -7.310546875, -4.6396484375, -1.96875, 0.7021484375, 3.373046875, 6.0439453125, 8.71484375, 11.3857421875, 14.056640625, 16.7275390625, 19.3984375, 22.0693359375, 24.740234375, 27.4111328125, 30.08203125, 32.7529296875, 35.423828125, 38.0947265625, 40.765625, 43.4365234375, 46.107421875, 48.7783203125, 51.44921875, 54.1201171875, 56.791015625, 59.4619140625, 62.1328125, 64.8037109375, 67.474609375, 70.1455078125, 72.81640625, 75.4873046875, 78.158203125, 80.8291015625, 83.5]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 8.0, 27.0, 50.0, 59.0, 83.0, 119.0, 114.0, 128.0, 125.0, 93.0, 73.0, 50.0, 23.0, 20.0, 11.0, 10.0, 1.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0069122314453125, -0.006736338138580322, -0.0065604448318481445, -0.006384551525115967, -0.006208658218383789, -0.006032764911651611, -0.005856871604919434, -0.005680978298187256, -0.005505084991455078, -0.0053291916847229, -0.005153298377990723, -0.004977405071258545, -0.004801511764526367, -0.0046256184577941895, -0.004449725151062012, -0.004273831844329834, -0.004097938537597656, -0.0039220452308654785, -0.0037461519241333008, -0.003570258617401123, -0.0033943653106689453, -0.0032184720039367676, -0.00304257869720459, -0.002866685390472412, -0.0026907920837402344, -0.0025148987770080566, -0.002339005470275879, -0.002163112163543701, -0.0019872188568115234, -0.0018113255500793457, -0.001635432243347168, -0.0014595389366149902, -0.0012836456298828125, -0.0011077523231506348, -0.000931859016418457, -0.0007559657096862793, -0.0005800724029541016, -0.00040417909622192383, -0.0002282857894897461, -5.239248275756836e-05, 0.00012350082397460938, 0.0002993941307067871, 0.00047528743743896484, 0.0006511807441711426, 0.0008270740509033203, 0.001002967357635498, 0.0011788606643676758, 0.0013547539710998535, 0.0015306472778320312, 0.001706540584564209, 0.0018824338912963867, 0.0020583271980285645, 0.002234220504760742, 0.00241011381149292, 0.0025860071182250977, 0.0027619004249572754, 0.002937793731689453, 0.003113687038421631, 0.0032895803451538086, 0.0034654736518859863, 0.003641366958618164, 0.003817260265350342, 0.0039931535720825195, 0.004169046878814697, 0.004344940185546875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 3.0, 1.0, 4.0, 10.0, 11.0, 14.0, 21.0, 25.0, 27.0, 35.0, 61.0, 82.0, 128.0, 221.0, 326.0, 509.0, 871.0, 1456.0, 2781.0, 4982.0, 9729.0, 19352.0, 39751.0, 83938.0, 163575.0, 238497.0, 219600.0, 132791.0, 65854.0, 31366.0, 15218.0, 7693.0, 4145.0, 2198.0, 1233.0, 725.0, 453.0, 260.0, 193.0, 136.0, 74.0, 68.0, 36.0, 23.0, 24.0, 24.0, 16.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-77.625, -75.2607421875, -72.896484375, -70.5322265625, -68.16796875, -65.8037109375, -63.439453125, -61.0751953125, -58.7109375, -56.3466796875, -53.982421875, -51.6181640625, -49.25390625, -46.8896484375, -44.525390625, -42.1611328125, -39.796875, -37.4326171875, -35.068359375, -32.7041015625, -30.33984375, -27.9755859375, -25.611328125, -23.2470703125, -20.8828125, -18.5185546875, -16.154296875, -13.7900390625, -11.42578125, -9.0615234375, -6.697265625, -4.3330078125, -1.96875, 0.3955078125, 2.759765625, 5.1240234375, 7.48828125, 9.8525390625, 12.216796875, 14.5810546875, 16.9453125, 19.3095703125, 21.673828125, 24.0380859375, 26.40234375, 28.7666015625, 31.130859375, 33.4951171875, 35.859375, 38.2236328125, 40.587890625, 42.9521484375, 45.31640625, 47.6806640625, 50.044921875, 52.4091796875, 54.7734375, 57.1376953125, 59.501953125, 61.8662109375, 64.23046875, 66.5947265625, 68.958984375, 71.3232421875, 73.6875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 8.0, 8.0, 10.0, 24.0, 19.0, 17.0, 14.0, 19.0, 22.0, 48.0, 47.0, 46.0, 40.0, 54.0, 52.0, 55.0, 45.0, 56.0, 32.0, 54.0, 44.0, 44.0, 41.0, 28.0, 34.0, 27.0, 18.0, 17.0, 21.0, 9.0, 7.0, 6.0, 3.0, 8.0, 4.0, 2.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.90625, -18.32177734375, -17.7373046875, -17.15283203125, -16.568359375, -15.98388671875, -15.3994140625, -14.81494140625, -14.23046875, -13.64599609375, -13.0615234375, -12.47705078125, -11.892578125, -11.30810546875, -10.7236328125, -10.13916015625, -9.5546875, -8.97021484375, -8.3857421875, -7.80126953125, -7.216796875, -6.63232421875, -6.0478515625, -5.46337890625, -4.87890625, -4.29443359375, -3.7099609375, -3.12548828125, -2.541015625, -1.95654296875, -1.3720703125, -0.78759765625, -0.203125, 0.38134765625, 0.9658203125, 1.55029296875, 2.134765625, 2.71923828125, 3.3037109375, 3.88818359375, 4.47265625, 5.05712890625, 5.6416015625, 6.22607421875, 6.810546875, 7.39501953125, 7.9794921875, 8.56396484375, 9.1484375, 9.73291015625, 10.3173828125, 10.90185546875, 11.486328125, 12.07080078125, 12.6552734375, 13.23974609375, 13.82421875, 14.40869140625, 14.9931640625, 15.57763671875, 16.162109375, 16.74658203125, 17.3310546875, 17.91552734375, 18.5]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 1.0, 7.0, 4.0, 5.0, 5.0, 6.0, 13.0, 12.0, 10.0, 23.0, 20.0, 25.0, 27.0, 31.0, 29.0, 33.0, 33.0, 54.0, 47.0, 46.0, 47.0, 54.0, 59.0, 46.0, 47.0, 42.0, 38.0, 26.0, 27.0, 35.0, 22.0, 27.0, 26.0, 18.0, 17.0, 10.0, 8.0, 3.0, 7.0, 6.0, 7.0, 3.0, 2.0, 2.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.48670959472656, -98.48464965820312, -94.48259735107422, -90.48053741455078, -86.47848510742188, -82.47642517089844, -78.474365234375, -74.47230529785156, -70.47025299072266, -66.46819305419922, -62.46614074707031, -58.464080810546875, -54.4620246887207, -50.45996856689453, -46.457908630371094, -42.45585250854492, -38.45379638671875, -34.45174026489258, -30.449682235717773, -26.44762420654297, -22.445568084716797, -18.443511962890625, -14.44145393371582, -10.439395904541016, -6.437339782714844, -2.4352827072143555, 1.5667743682861328, 5.568831443786621, 9.57088851928711, 13.572944641113281, 17.575002670288086, 21.57706069946289, 25.579132080078125, 29.581188201904297, 33.58324432373047, 37.585304260253906, 41.58736038208008, 45.58941650390625, 49.59147644042969, 53.59353256225586, 57.59558868408203, 61.5976448059082, 65.59970092773438, 69.60176086425781, 73.60382080078125, 77.60587310791016, 81.6079330444336, 85.6099853515625, 89.61204528808594, 93.61410522460938, 97.61615753173828, 101.61821746826172, 105.62026977539062, 109.62232971191406, 113.6243896484375, 117.62644958496094, 121.62850189208984, 125.63056182861328, 129.6326141357422, 133.63467407226562, 137.63673400878906, 141.6387939453125, 145.64083862304688, 149.6428985595703, 153.64495849609375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 7.0, 10.0, 5.0, 13.0, 17.0, 14.0, 27.0, 22.0, 21.0, 31.0, 25.0, 33.0, 28.0, 37.0, 37.0, 32.0, 42.0, 30.0, 34.0, 46.0, 45.0, 46.0, 37.0, 44.0, 34.0, 34.0, 36.0, 33.0, 23.0, 26.0, 24.0, 21.0, 10.0, 15.0, 12.0, 9.0, 4.0, 10.0, 7.0, 1.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-129.37306213378906, -125.76629638671875, -122.15953063964844, -118.55276489257812, -114.94599914550781, -111.3392333984375, -107.73246765136719, -104.12570190429688, -100.51893615722656, -96.91217041015625, -93.30540466308594, -89.69863891601562, -86.09187316894531, -82.485107421875, -78.87834167480469, -75.27157592773438, -71.66480255126953, -68.05803680419922, -64.4512710571289, -60.844505310058594, -57.23773956298828, -53.63097381591797, -50.02420425415039, -46.41743850708008, -42.810672760009766, -39.20390701293945, -35.59714126586914, -31.990373611450195, -28.383607864379883, -24.77684211730957, -21.170074462890625, -17.563308715820312, -13.956550598144531, -10.349784851074219, -6.74301815032959, -3.136251449584961, 0.47051429748535156, 4.077280044555664, 7.684047698974609, 11.290813446044922, 14.897579193115234, 18.504344940185547, 22.11111068725586, 25.717878341674805, 29.324644088745117, 32.93141174316406, 36.538177490234375, 40.14494323730469, 43.751708984375, 47.35847473144531, 50.965240478515625, 54.57200622558594, 58.17877197265625, 61.78553771972656, 65.39230346679688, 68.99906921386719, 72.6058349609375, 76.21260070800781, 79.81936645507812, 83.42613220214844, 87.03289794921875, 90.63966369628906, 94.24642944335938, 97.85319519042969, 101.45996856689453]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 11.0, 17.0, 14.0, 27.0, 63.0, 82.0, 131.0, 213.0, 383.0, 631.0, 1016.0, 1535.0, 2419.0, 3632.0, 5485.0, 7967.0, 11477.0, 16210.0, 22083.0, 29471.0, 38134.0, 47066.0, 56509.0, 66368.0, 74225.0, 79294.0, 82121.0, 80978.0, 76636.0, 69574.0, 61083.0, 52420.0, 41998.0, 33083.0, 25219.0, 18791.0, 13465.0, 9658.0, 6500.0, 4444.0, 2975.0, 1936.0, 1214.0, 768.0, 490.0, 293.0, 185.0, 121.0, 64.0, 53.0, 15.0, 11.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0], "bins": [-71.1875, -69.0126953125, -66.837890625, -64.6630859375, -62.48828125, -60.3134765625, -58.138671875, -55.9638671875, -53.7890625, -51.6142578125, -49.439453125, -47.2646484375, -45.08984375, -42.9150390625, -40.740234375, -38.5654296875, -36.390625, -34.2158203125, -32.041015625, -29.8662109375, -27.69140625, -25.5166015625, -23.341796875, -21.1669921875, -18.9921875, -16.8173828125, -14.642578125, -12.4677734375, -10.29296875, -8.1181640625, -5.943359375, -3.7685546875, -1.59375, 0.5810546875, 2.755859375, 4.9306640625, 7.10546875, 9.2802734375, 11.455078125, 13.6298828125, 15.8046875, 17.9794921875, 20.154296875, 22.3291015625, 24.50390625, 26.6787109375, 28.853515625, 31.0283203125, 33.203125, 35.3779296875, 37.552734375, 39.7275390625, 41.90234375, 44.0771484375, 46.251953125, 48.4267578125, 50.6015625, 52.7763671875, 54.951171875, 57.1259765625, 59.30078125, 61.4755859375, 63.650390625, 65.8251953125, 68.0]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 8.0, 9.0, 7.0, 6.0, 14.0, 19.0, 13.0, 25.0, 23.0, 22.0, 30.0, 24.0, 33.0, 31.0, 36.0, 37.0, 33.0, 43.0, 29.0, 32.0, 45.0, 46.0, 44.0, 40.0, 45.0, 35.0, 35.0, 36.0, 31.0, 20.0, 30.0, 20.0, 23.0, 8.0, 18.0, 11.0, 8.0, 4.0, 10.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-126.0, -122.482421875, -118.96484375, -115.447265625, -111.9296875, -108.412109375, -104.89453125, -101.376953125, -97.859375, -94.341796875, -90.82421875, -87.306640625, -83.7890625, -80.271484375, -76.75390625, -73.236328125, -69.71875, -66.201171875, -62.68359375, -59.166015625, -55.6484375, -52.130859375, -48.61328125, -45.095703125, -41.578125, -38.060546875, -34.54296875, -31.025390625, -27.5078125, -23.990234375, -20.47265625, -16.955078125, -13.4375, -9.919921875, -6.40234375, -2.884765625, 0.6328125, 4.150390625, 7.66796875, 11.185546875, 14.703125, 18.220703125, 21.73828125, 25.255859375, 28.7734375, 32.291015625, 35.80859375, 39.326171875, 42.84375, 46.361328125, 49.87890625, 53.396484375, 56.9140625, 60.431640625, 63.94921875, 67.466796875, 70.984375, 74.501953125, 78.01953125, 81.537109375, 85.0546875, 88.572265625, 92.08984375, 95.607421875, 99.125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 15.0, 27.0, 59.0, 85.0, 129.0, 235.0, 397.0, 740.0, 1294.0, 2135.0, 3585.0, 6126.0, 9611.0, 15001.0, 22744.0, 33446.0, 46536.0, 62122.0, 77403.0, 91957.0, 101156.0, 103886.0, 100454.0, 90609.0, 76354.0, 61507.0, 46357.0, 32984.0, 22691.0, 14968.0, 9327.0, 5997.0, 3558.0, 2134.0, 1249.0, 732.0, 406.0, 227.0, 125.0, 67.0, 55.0, 29.0, 15.0, 8.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-86.375, -83.7158203125, -81.056640625, -78.3974609375, -75.73828125, -73.0791015625, -70.419921875, -67.7607421875, -65.1015625, -62.4423828125, -59.783203125, -57.1240234375, -54.46484375, -51.8056640625, -49.146484375, -46.4873046875, -43.828125, -41.1689453125, -38.509765625, -35.8505859375, -33.19140625, -30.5322265625, -27.873046875, -25.2138671875, -22.5546875, -19.8955078125, -17.236328125, -14.5771484375, -11.91796875, -9.2587890625, -6.599609375, -3.9404296875, -1.28125, 1.3779296875, 4.037109375, 6.6962890625, 9.35546875, 12.0146484375, 14.673828125, 17.3330078125, 19.9921875, 22.6513671875, 25.310546875, 27.9697265625, 30.62890625, 33.2880859375, 35.947265625, 38.6064453125, 41.265625, 43.9248046875, 46.583984375, 49.2431640625, 51.90234375, 54.5615234375, 57.220703125, 59.8798828125, 62.5390625, 65.1982421875, 67.857421875, 70.5166015625, 73.17578125, 75.8349609375, 78.494140625, 81.1533203125, 83.8125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 2.0, 1.0, 3.0, 3.0, 7.0, 7.0, 7.0, 16.0, 6.0, 20.0, 18.0, 21.0, 22.0, 30.0, 14.0, 42.0, 32.0, 35.0, 43.0, 48.0, 37.0, 48.0, 40.0, 50.0, 51.0, 42.0, 49.0, 26.0, 34.0, 37.0, 34.0, 34.0, 18.0, 19.0, 17.0, 13.0, 18.0, 16.0, 12.0, 10.0, 6.0, 8.0, 4.0, 2.0, 1.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.4375, -74.056640625, -71.67578125, -69.294921875, -66.9140625, -64.533203125, -62.15234375, -59.771484375, -57.390625, -55.009765625, -52.62890625, -50.248046875, -47.8671875, -45.486328125, -43.10546875, -40.724609375, -38.34375, -35.962890625, -33.58203125, -31.201171875, -28.8203125, -26.439453125, -24.05859375, -21.677734375, -19.296875, -16.916015625, -14.53515625, -12.154296875, -9.7734375, -7.392578125, -5.01171875, -2.630859375, -0.25, 2.130859375, 4.51171875, 6.892578125, 9.2734375, 11.654296875, 14.03515625, 16.416015625, 18.796875, 21.177734375, 23.55859375, 25.939453125, 28.3203125, 30.701171875, 33.08203125, 35.462890625, 37.84375, 40.224609375, 42.60546875, 44.986328125, 47.3671875, 49.748046875, 52.12890625, 54.509765625, 56.890625, 59.271484375, 61.65234375, 64.033203125, 66.4140625, 68.794921875, 71.17578125, 73.556640625, 75.9375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 1.0, 14.0, 22.0, 27.0, 56.0, 78.0, 159.0, 275.0, 426.0, 718.0, 1181.0, 2090.0, 3207.0, 5259.0, 8048.0, 12532.0, 19101.0, 27568.0, 39202.0, 52954.0, 67829.0, 82535.0, 93181.0, 100274.0, 101126.0, 95304.0, 84121.0, 69840.0, 54868.0, 40649.0, 29080.0, 20308.0, 13399.0, 8829.0, 5421.0, 3432.0, 2145.0, 1330.0, 762.0, 480.0, 282.0, 184.0, 113.0, 54.0, 33.0, 24.0, 14.0, 10.0, 5.0, 6.0, 3.0], "bins": [-38.09375, -37.066162109375, -36.03857421875, -35.010986328125, -33.9833984375, -32.955810546875, -31.92822265625, -30.900634765625, -29.873046875, -28.845458984375, -27.81787109375, -26.790283203125, -25.7626953125, -24.735107421875, -23.70751953125, -22.679931640625, -21.65234375, -20.624755859375, -19.59716796875, -18.569580078125, -17.5419921875, -16.514404296875, -15.48681640625, -14.459228515625, -13.431640625, -12.404052734375, -11.37646484375, -10.348876953125, -9.3212890625, -8.293701171875, -7.26611328125, -6.238525390625, -5.2109375, -4.183349609375, -3.15576171875, -2.128173828125, -1.1005859375, -0.072998046875, 0.95458984375, 1.982177734375, 3.009765625, 4.037353515625, 5.06494140625, 6.092529296875, 7.1201171875, 8.147705078125, 9.17529296875, 10.202880859375, 11.23046875, 12.258056640625, 13.28564453125, 14.313232421875, 15.3408203125, 16.368408203125, 17.39599609375, 18.423583984375, 19.451171875, 20.478759765625, 21.50634765625, 22.533935546875, 23.5615234375, 24.589111328125, 25.61669921875, 26.644287109375, 27.671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 7.0, 5.0, 10.0, 8.0, 12.0, 11.0, 11.0, 19.0, 26.0, 29.0, 35.0, 42.0, 56.0, 42.0, 41.0, 47.0, 55.0, 55.0, 44.0, 48.0, 53.0, 49.0, 46.0, 31.0, 39.0, 23.0, 47.0, 28.0, 18.0, 14.0, 17.0, 10.0, 12.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005527496337890625, -0.005363941192626953, -0.005200386047363281, -0.005036830902099609, -0.0048732757568359375, -0.004709720611572266, -0.004546165466308594, -0.004382610321044922, -0.00421905517578125, -0.004055500030517578, -0.0038919448852539062, -0.0037283897399902344, -0.0035648345947265625, -0.0034012794494628906, -0.0032377243041992188, -0.003074169158935547, -0.002910614013671875, -0.002747058868408203, -0.0025835037231445312, -0.0024199485778808594, -0.0022563934326171875, -0.0020928382873535156, -0.0019292831420898438, -0.0017657279968261719, -0.0016021728515625, -0.0014386177062988281, -0.0012750625610351562, -0.0011115074157714844, -0.0009479522705078125, -0.0007843971252441406, -0.0006208419799804688, -0.0004572868347167969, -0.000293731689453125, -0.00013017654418945312, 3.337860107421875e-05, 0.00019693374633789062, 0.0003604888916015625, 0.0005240440368652344, 0.0006875991821289062, 0.0008511543273925781, 0.00101470947265625, 0.0011782646179199219, 0.0013418197631835938, 0.0015053749084472656, 0.0016689300537109375, 0.0018324851989746094, 0.0019960403442382812, 0.002159595489501953, 0.002323150634765625, 0.002486705780029297, 0.0026502609252929688, 0.0028138160705566406, 0.0029773712158203125, 0.0031409263610839844, 0.0033044815063476562, 0.003468036651611328, 0.003631591796875, 0.003795146942138672, 0.003958702087402344, 0.004122257232666016, 0.0042858123779296875, 0.004449367523193359, 0.004612922668457031, 0.004776477813720703, 0.004940032958984375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 7.0, 12.0, 14.0, 28.0, 44.0, 69.0, 121.0, 189.0, 317.0, 468.0, 741.0, 1152.0, 1968.0, 3043.0, 4634.0, 7364.0, 11168.0, 16758.0, 24495.0, 34587.0, 46195.0, 60488.0, 74515.0, 87799.0, 96621.0, 99949.0, 96582.0, 87887.0, 75502.0, 61115.0, 47227.0, 34572.0, 24397.0, 16709.0, 11382.0, 7474.0, 4885.0, 2980.0, 1874.0, 1181.0, 785.0, 449.0, 296.0, 226.0, 120.0, 59.0, 40.0, 26.0, 16.0, 8.0, 8.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-35.4375, -34.31298828125, -33.1884765625, -32.06396484375, -30.939453125, -29.81494140625, -28.6904296875, -27.56591796875, -26.44140625, -25.31689453125, -24.1923828125, -23.06787109375, -21.943359375, -20.81884765625, -19.6943359375, -18.56982421875, -17.4453125, -16.32080078125, -15.1962890625, -14.07177734375, -12.947265625, -11.82275390625, -10.6982421875, -9.57373046875, -8.44921875, -7.32470703125, -6.2001953125, -5.07568359375, -3.951171875, -2.82666015625, -1.7021484375, -0.57763671875, 0.546875, 1.67138671875, 2.7958984375, 3.92041015625, 5.044921875, 6.16943359375, 7.2939453125, 8.41845703125, 9.54296875, 10.66748046875, 11.7919921875, 12.91650390625, 14.041015625, 15.16552734375, 16.2900390625, 17.41455078125, 18.5390625, 19.66357421875, 20.7880859375, 21.91259765625, 23.037109375, 24.16162109375, 25.2861328125, 26.41064453125, 27.53515625, 28.65966796875, 29.7841796875, 30.90869140625, 32.033203125, 33.15771484375, 34.2822265625, 35.40673828125, 36.53125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 0.0, 10.0, 6.0, 4.0, 11.0, 11.0, 14.0, 14.0, 13.0, 33.0, 27.0, 24.0, 30.0, 44.0, 40.0, 37.0, 61.0, 54.0, 41.0, 53.0, 43.0, 47.0, 40.0, 37.0, 33.0, 30.0, 35.0, 37.0, 27.0, 24.0, 25.0, 20.0, 21.0, 8.0, 9.0, 11.0, 3.0, 9.0, 3.0, 4.0, 5.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.578125, -16.043701171875, -15.50927734375, -14.974853515625, -14.4404296875, -13.906005859375, -13.37158203125, -12.837158203125, -12.302734375, -11.768310546875, -11.23388671875, -10.699462890625, -10.1650390625, -9.630615234375, -9.09619140625, -8.561767578125, -8.02734375, -7.492919921875, -6.95849609375, -6.424072265625, -5.8896484375, -5.355224609375, -4.82080078125, -4.286376953125, -3.751953125, -3.217529296875, -2.68310546875, -2.148681640625, -1.6142578125, -1.079833984375, -0.54541015625, -0.010986328125, 0.5234375, 1.057861328125, 1.59228515625, 2.126708984375, 2.6611328125, 3.195556640625, 3.72998046875, 4.264404296875, 4.798828125, 5.333251953125, 5.86767578125, 6.402099609375, 6.9365234375, 7.470947265625, 8.00537109375, 8.539794921875, 9.07421875, 9.608642578125, 10.14306640625, 10.677490234375, 11.2119140625, 11.746337890625, 12.28076171875, 12.815185546875, 13.349609375, 13.884033203125, 14.41845703125, 14.952880859375, 15.4873046875, 16.021728515625, 16.55615234375, 17.090576171875, 17.625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 6.0, 10.0, 7.0, 12.0, 12.0, 13.0, 13.0, 20.0, 29.0, 28.0, 26.0, 33.0, 48.0, 46.0, 49.0, 41.0, 51.0, 41.0, 48.0, 45.0, 60.0, 40.0, 37.0, 37.0, 34.0, 34.0, 31.0, 29.0, 25.0, 18.0, 9.0, 16.0, 12.0, 11.0, 7.0, 6.0, 5.0, 7.0, 4.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.46051788330078, -99.41128540039062, -95.362060546875, -91.31282806396484, -87.26359558105469, -83.21436309814453, -79.16513061523438, -75.11590576171875, -71.0666732788086, -67.01744079589844, -62.96821212768555, -58.918983459472656, -54.8697509765625, -50.820518493652344, -46.77128982543945, -42.72206115722656, -38.672828674316406, -34.62359619140625, -30.57436752319336, -26.525136947631836, -22.475906372070312, -18.42667579650879, -14.377445220947266, -10.328214645385742, -6.278984069824219, -2.2297534942626953, 1.8194770812988281, 5.868707656860352, 9.917938232421875, 13.967168807983398, 18.016399383544922, 22.065629959106445, 26.114852905273438, 30.16408348083496, 34.213314056396484, 38.262542724609375, 42.31177520751953, 46.36100769042969, 50.41023635864258, 54.45946502685547, 58.508697509765625, 62.55792999267578, 66.60716247558594, 70.65638732910156, 74.70561981201172, 78.75485229492188, 82.8040771484375, 86.85330963134766, 90.90254211425781, 94.95177459716797, 99.00100708007812, 103.05023193359375, 107.0994644165039, 111.14869689941406, 115.19792175292969, 119.24715423583984, 123.29638671875, 127.34561920166016, 131.3948516845703, 135.44407653808594, 139.49331665039062, 143.54254150390625, 147.59176635742188, 151.64100646972656, 155.6902313232422]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 6.0, 3.0, 9.0, 15.0, 9.0, 13.0, 16.0, 22.0, 15.0, 23.0, 28.0, 34.0, 39.0, 34.0, 28.0, 25.0, 29.0, 47.0, 41.0, 40.0, 29.0, 55.0, 52.0, 45.0, 32.0, 38.0, 32.0, 36.0, 24.0, 29.0, 25.0, 17.0, 28.0, 15.0, 12.0, 9.0, 8.0, 5.0, 10.0, 4.0, 4.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-113.9129867553711, -110.26800537109375, -106.62301635742188, -102.97803497314453, -99.33305358886719, -95.68806457519531, -92.04308319091797, -88.39810180664062, -84.75311279296875, -81.1081314086914, -77.46314239501953, -73.81816101074219, -70.17317962646484, -66.5281982421875, -62.883209228515625, -59.23822784423828, -55.59324645996094, -51.94826126098633, -48.303279876708984, -44.658294677734375, -41.01331329345703, -37.36832809448242, -33.72334289550781, -30.078359603881836, -26.43337631225586, -22.788393020629883, -19.143409729003906, -15.498424530029297, -11.85344123840332, -8.208457946777344, -4.563472747802734, -0.9184894561767578, 2.7264938354492188, 6.3714776039123535, 10.016461372375488, 13.661445617675781, 17.306428909301758, 20.951412200927734, 24.596397399902344, 28.24138069152832, 31.886363983154297, 35.531349182128906, 39.17633056640625, 42.82131576538086, 46.46630096435547, 50.11128234863281, 53.75626754760742, 57.40125274658203, 61.046234130859375, 64.69121551513672, 68.3362045288086, 71.98118591308594, 75.62616729736328, 79.27114868164062, 82.9161376953125, 86.56111907958984, 90.20610046386719, 93.85108184814453, 97.4960708618164, 101.14105224609375, 104.7860336303711, 108.43101501464844, 112.07600402832031, 115.72098541259766, 119.36597442626953]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 7.0, 7.0, 17.0, 26.0, 56.0, 83.0, 142.0, 219.0, 401.0, 663.0, 1124.0, 1818.0, 3124.0, 4995.0, 7877.0, 12256.0, 19460.0, 29363.0, 44280.0, 64598.0, 92487.0, 126904.0, 169587.0, 218368.0, 269454.0, 316206.0, 353565.0, 372489.0, 372583.0, 351497.0, 313435.0, 265728.0, 215985.0, 166811.0, 123988.0, 90110.0, 62757.0, 42929.0, 28719.0, 18426.0, 11967.0, 7750.0, 4659.0, 2943.0, 1822.0, 1048.0, 632.0, 367.0, 227.0, 134.0, 101.0, 49.0, 30.0, 14.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.5625, -75.0576171875, -72.552734375, -70.0478515625, -67.54296875, -65.0380859375, -62.533203125, -60.0283203125, -57.5234375, -55.0185546875, -52.513671875, -50.0087890625, -47.50390625, -44.9990234375, -42.494140625, -39.9892578125, -37.484375, -34.9794921875, -32.474609375, -29.9697265625, -27.46484375, -24.9599609375, -22.455078125, -19.9501953125, -17.4453125, -14.9404296875, -12.435546875, -9.9306640625, -7.42578125, -4.9208984375, -2.416015625, 0.0888671875, 2.59375, 5.0986328125, 7.603515625, 10.1083984375, 12.61328125, 15.1181640625, 17.623046875, 20.1279296875, 22.6328125, 25.1376953125, 27.642578125, 30.1474609375, 32.65234375, 35.1572265625, 37.662109375, 40.1669921875, 42.671875, 45.1767578125, 47.681640625, 50.1865234375, 52.69140625, 55.1962890625, 57.701171875, 60.2060546875, 62.7109375, 65.2158203125, 67.720703125, 70.2255859375, 72.73046875, 75.2353515625, 77.740234375, 80.2451171875, 82.75]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 5.0, 4.0, 6.0, 19.0, 11.0, 17.0, 18.0, 21.0, 18.0, 28.0, 29.0, 37.0, 35.0, 31.0, 27.0, 29.0, 51.0, 39.0, 40.0, 32.0, 56.0, 45.0, 42.0, 46.0, 33.0, 34.0, 35.0, 25.0, 30.0, 26.0, 22.0, 25.0, 16.0, 11.0, 8.0, 8.0, 6.0, 9.0, 6.0, 4.0, 4.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-105.875, -102.50390625, -99.1328125, -95.76171875, -92.390625, -89.01953125, -85.6484375, -82.27734375, -78.90625, -75.53515625, -72.1640625, -68.79296875, -65.421875, -62.05078125, -58.6796875, -55.30859375, -51.9375, -48.56640625, -45.1953125, -41.82421875, -38.453125, -35.08203125, -31.7109375, -28.33984375, -24.96875, -21.59765625, -18.2265625, -14.85546875, -11.484375, -8.11328125, -4.7421875, -1.37109375, 2.0, 5.37109375, 8.7421875, 12.11328125, 15.484375, 18.85546875, 22.2265625, 25.59765625, 28.96875, 32.33984375, 35.7109375, 39.08203125, 42.453125, 45.82421875, 49.1953125, 52.56640625, 55.9375, 59.30859375, 62.6796875, 66.05078125, 69.421875, 72.79296875, 76.1640625, 79.53515625, 82.90625, 86.27734375, 89.6484375, 93.01953125, 96.390625, 99.76171875, 103.1328125, 106.50390625, 109.875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 18.0, 36.0, 79.0, 126.0, 216.0, 405.0, 708.0, 1173.0, 2043.0, 3464.0, 5797.0, 9469.0, 14909.0, 23300.0, 35250.0, 52296.0, 75882.0, 105721.0, 142650.0, 186998.0, 232026.0, 277341.0, 316749.0, 345264.0, 358688.0, 354396.0, 332621.0, 298428.0, 254114.0, 208363.0, 162706.0, 122744.0, 89358.0, 62510.0, 42672.0, 28247.0, 18394.0, 11424.0, 7221.0, 4317.0, 2639.0, 1496.0, 913.0, 483.0, 305.0, 155.0, 86.0, 34.0, 30.0, 12.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.3125, -78.6669921875, -76.021484375, -73.3759765625, -70.73046875, -68.0849609375, -65.439453125, -62.7939453125, -60.1484375, -57.5029296875, -54.857421875, -52.2119140625, -49.56640625, -46.9208984375, -44.275390625, -41.6298828125, -38.984375, -36.3388671875, -33.693359375, -31.0478515625, -28.40234375, -25.7568359375, -23.111328125, -20.4658203125, -17.8203125, -15.1748046875, -12.529296875, -9.8837890625, -7.23828125, -4.5927734375, -1.947265625, 0.6982421875, 3.34375, 5.9892578125, 8.634765625, 11.2802734375, 13.92578125, 16.5712890625, 19.216796875, 21.8623046875, 24.5078125, 27.1533203125, 29.798828125, 32.4443359375, 35.08984375, 37.7353515625, 40.380859375, 43.0263671875, 45.671875, 48.3173828125, 50.962890625, 53.6083984375, 56.25390625, 58.8994140625, 61.544921875, 64.1904296875, 66.8359375, 69.4814453125, 72.126953125, 74.7724609375, 77.41796875, 80.0634765625, 82.708984375, 85.3544921875, 88.0]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 11.0, 13.0, 18.0, 16.0, 26.0, 44.0, 40.0, 61.0, 72.0, 77.0, 91.0, 95.0, 126.0, 144.0, 147.0, 165.0, 186.0, 205.0, 210.0, 206.0, 228.0, 228.0, 214.0, 178.0, 185.0, 177.0, 166.0, 167.0, 110.0, 92.0, 68.0, 66.0, 56.0, 36.0, 32.0, 27.0, 27.0, 17.0, 14.0, 13.0, 7.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-53.03125, -51.38671875, -49.7421875, -48.09765625, -46.453125, -44.80859375, -43.1640625, -41.51953125, -39.875, -38.23046875, -36.5859375, -34.94140625, -33.296875, -31.65234375, -30.0078125, -28.36328125, -26.71875, -25.07421875, -23.4296875, -21.78515625, -20.140625, -18.49609375, -16.8515625, -15.20703125, -13.5625, -11.91796875, -10.2734375, -8.62890625, -6.984375, -5.33984375, -3.6953125, -2.05078125, -0.40625, 1.23828125, 2.8828125, 4.52734375, 6.171875, 7.81640625, 9.4609375, 11.10546875, 12.75, 14.39453125, 16.0390625, 17.68359375, 19.328125, 20.97265625, 22.6171875, 24.26171875, 25.90625, 27.55078125, 29.1953125, 30.83984375, 32.484375, 34.12890625, 35.7734375, 37.41796875, 39.0625, 40.70703125, 42.3515625, 43.99609375, 45.640625, 47.28515625, 48.9296875, 50.57421875, 52.21875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 3.0, 3.0, 6.0, 6.0, 11.0, 8.0, 9.0, 22.0, 15.0, 17.0, 24.0, 29.0, 34.0, 30.0, 50.0, 43.0, 45.0, 44.0, 31.0, 48.0, 35.0, 40.0, 39.0, 37.0, 37.0, 43.0, 34.0, 44.0, 31.0, 34.0, 28.0, 18.0, 14.0, 14.0, 13.0, 19.0, 10.0, 8.0, 2.0, 6.0, 12.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-114.12509155273438, -110.19347381591797, -106.2618637084961, -102.33024597167969, -98.39862823486328, -94.4670181274414, -90.535400390625, -86.60379028320312, -82.67217254638672, -78.74055480957031, -74.80894470214844, -70.87732696533203, -66.94570922851562, -63.01409912109375, -59.082481384277344, -55.1508674621582, -51.2192497253418, -47.287635803222656, -43.35601806640625, -39.42440414428711, -35.49279022216797, -31.561174392700195, -27.629558563232422, -23.69794464111328, -19.766328811645508, -15.83471393585205, -11.903099060058594, -7.97148323059082, -4.039868354797363, -0.10825347900390625, 3.823362350463867, 7.754976272583008, 11.686592102050781, 15.618206977844238, 19.549821853637695, 23.48143768310547, 27.41305160522461, 31.344667434692383, 35.276283264160156, 39.2078971862793, 43.13951110839844, 47.07112503051758, 51.002742767333984, 54.934356689453125, 58.865970611572266, 62.797584533691406, 66.72920227050781, 70.66081237792969, 74.59243774414062, 78.52405548095703, 82.4556655883789, 86.38728332519531, 90.31890106201172, 94.2505111694336, 98.18212890625, 102.11373901367188, 106.04535675048828, 109.97697448730469, 113.90858459472656, 117.84020233154297, 121.77182006835938, 125.70343017578125, 129.63504028320312, 133.56666564941406, 137.49827575683594]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 7.0, 1.0, 6.0, 9.0, 8.0, 5.0, 11.0, 13.0, 16.0, 14.0, 23.0, 18.0, 27.0, 28.0, 28.0, 38.0, 19.0, 36.0, 36.0, 38.0, 37.0, 33.0, 33.0, 42.0, 47.0, 41.0, 31.0, 34.0, 44.0, 40.0, 35.0, 34.0, 25.0, 17.0, 21.0, 22.0, 17.0, 13.0, 9.0, 10.0, 12.0, 6.0, 2.0, 5.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-106.30992126464844, -102.78382873535156, -99.25772857666016, -95.73163604736328, -92.20553588867188, -88.679443359375, -85.15335083007812, -81.62725067138672, -78.10115051269531, -74.57505798339844, -71.04895782470703, -67.52286529541016, -63.99676513671875, -60.470672607421875, -56.944576263427734, -53.418479919433594, -49.89238739013672, -46.36629104614258, -42.84019470214844, -39.31410217285156, -35.788002014160156, -32.26190948486328, -28.73581314086914, -25.209716796875, -21.68362045288086, -18.15752410888672, -14.631428718566895, -11.10533332824707, -7.57923698425293, -4.053140640258789, -0.5270462036132812, 2.9990501403808594, 6.525154113769531, 10.051250457763672, 13.577345848083496, 17.10344123840332, 20.62953758239746, 24.1556339263916, 27.68172836303711, 31.20782470703125, 34.73392105102539, 38.26001739501953, 41.78611373901367, 45.31221008300781, 48.83830261230469, 52.364402770996094, 55.89049530029297, 59.41659164428711, 62.94268798828125, 66.46878051757812, 69.99488067626953, 73.5209732055664, 77.04707336425781, 80.57316589355469, 84.09925842285156, 87.62535858154297, 91.15145874023438, 94.67755126953125, 98.20365142822266, 101.72974395751953, 105.25584411621094, 108.78193664550781, 112.30802917480469, 115.8341293334961, 119.36022186279297]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 6.0, 4.0, 6.0, 7.0, 11.0, 21.0, 32.0, 36.0, 57.0, 75.0, 126.0, 169.0, 255.0, 366.0, 636.0, 873.0, 1319.0, 2046.0, 3098.0, 4819.0, 7490.0, 11921.0, 18756.0, 28697.0, 44012.0, 64760.0, 89403.0, 113945.0, 130232.0, 129567.0, 114752.0, 89747.0, 64993.0, 44966.0, 29211.0, 18687.0, 11859.0, 7538.0, 4822.0, 3199.0, 2067.0, 1282.0, 891.0, 585.0, 386.0, 267.0, 192.0, 132.0, 81.0, 40.0, 37.0, 34.0, 21.0, 12.0, 8.0, 6.0, 3.0, 3.0, 0.0, 4.0], "bins": [-50.59375, -49.06103515625, -47.5283203125, -45.99560546875, -44.462890625, -42.93017578125, -41.3974609375, -39.86474609375, -38.33203125, -36.79931640625, -35.2666015625, -33.73388671875, -32.201171875, -30.66845703125, -29.1357421875, -27.60302734375, -26.0703125, -24.53759765625, -23.0048828125, -21.47216796875, -19.939453125, -18.40673828125, -16.8740234375, -15.34130859375, -13.80859375, -12.27587890625, -10.7431640625, -9.21044921875, -7.677734375, -6.14501953125, -4.6123046875, -3.07958984375, -1.546875, -0.01416015625, 1.5185546875, 3.05126953125, 4.583984375, 6.11669921875, 7.6494140625, 9.18212890625, 10.71484375, 12.24755859375, 13.7802734375, 15.31298828125, 16.845703125, 18.37841796875, 19.9111328125, 21.44384765625, 22.9765625, 24.50927734375, 26.0419921875, 27.57470703125, 29.107421875, 30.64013671875, 32.1728515625, 33.70556640625, 35.23828125, 36.77099609375, 38.3037109375, 39.83642578125, 41.369140625, 42.90185546875, 44.4345703125, 45.96728515625, 47.5]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 7.0, 1.0, 6.0, 9.0, 8.0, 5.0, 10.0, 13.0, 19.0, 14.0, 21.0, 20.0, 26.0, 26.0, 29.0, 39.0, 19.0, 37.0, 36.0, 34.0, 38.0, 37.0, 30.0, 44.0, 46.0, 39.0, 30.0, 37.0, 44.0, 40.0, 33.0, 36.0, 23.0, 22.0, 18.0, 22.0, 16.0, 14.0, 8.0, 13.0, 9.0, 6.0, 3.0, 4.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-106.0625, -102.5380859375, -99.013671875, -95.4892578125, -91.96484375, -88.4404296875, -84.916015625, -81.3916015625, -77.8671875, -74.3427734375, -70.818359375, -67.2939453125, -63.76953125, -60.2451171875, -56.720703125, -53.1962890625, -49.671875, -46.1474609375, -42.623046875, -39.0986328125, -35.57421875, -32.0498046875, -28.525390625, -25.0009765625, -21.4765625, -17.9521484375, -14.427734375, -10.9033203125, -7.37890625, -3.8544921875, -0.330078125, 3.1943359375, 6.71875, 10.2431640625, 13.767578125, 17.2919921875, 20.81640625, 24.3408203125, 27.865234375, 31.3896484375, 34.9140625, 38.4384765625, 41.962890625, 45.4873046875, 49.01171875, 52.5361328125, 56.060546875, 59.5849609375, 63.109375, 66.6337890625, 70.158203125, 73.6826171875, 77.20703125, 80.7314453125, 84.255859375, 87.7802734375, 91.3046875, 94.8291015625, 98.353515625, 101.8779296875, 105.40234375, 108.9267578125, 112.451171875, 115.9755859375, 119.5]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 5.0, 6.0, 8.0, 11.0, 17.0, 28.0, 37.0, 49.0, 70.0, 145.0, 215.0, 360.0, 561.0, 1001.0, 1688.0, 3212.0, 6476.0, 14135.0, 35367.0, 98882.0, 258296.0, 346095.0, 175573.0, 62369.0, 23568.0, 9840.0, 4836.0, 2478.0, 1291.0, 734.0, 436.0, 284.0, 173.0, 114.0, 57.0, 39.0, 42.0, 23.0, 13.0, 5.0, 10.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.5625, -96.2744140625, -92.986328125, -89.6982421875, -86.41015625, -83.1220703125, -79.833984375, -76.5458984375, -73.2578125, -69.9697265625, -66.681640625, -63.3935546875, -60.10546875, -56.8173828125, -53.529296875, -50.2412109375, -46.953125, -43.6650390625, -40.376953125, -37.0888671875, -33.80078125, -30.5126953125, -27.224609375, -23.9365234375, -20.6484375, -17.3603515625, -14.072265625, -10.7841796875, -7.49609375, -4.2080078125, -0.919921875, 2.3681640625, 5.65625, 8.9443359375, 12.232421875, 15.5205078125, 18.80859375, 22.0966796875, 25.384765625, 28.6728515625, 31.9609375, 35.2490234375, 38.537109375, 41.8251953125, 45.11328125, 48.4013671875, 51.689453125, 54.9775390625, 58.265625, 61.5537109375, 64.841796875, 68.1298828125, 71.41796875, 74.7060546875, 77.994140625, 81.2822265625, 84.5703125, 87.8583984375, 91.146484375, 94.4345703125, 97.72265625, 101.0107421875, 104.298828125, 107.5869140625, 110.875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 1.0, 3.0, 6.0, 4.0, 7.0, 4.0, 10.0, 17.0, 9.0, 21.0, 17.0, 13.0, 23.0, 26.0, 26.0, 26.0, 32.0, 31.0, 42.0, 34.0, 52.0, 25.0, 40.0, 37.0, 40.0, 51.0, 40.0, 48.0, 34.0, 33.0, 41.0, 23.0, 28.0, 32.0, 24.0, 23.0, 20.0, 20.0, 5.0, 11.0, 6.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-74.3125, -71.845703125, -69.37890625, -66.912109375, -64.4453125, -61.978515625, -59.51171875, -57.044921875, -54.578125, -52.111328125, -49.64453125, -47.177734375, -44.7109375, -42.244140625, -39.77734375, -37.310546875, -34.84375, -32.376953125, -29.91015625, -27.443359375, -24.9765625, -22.509765625, -20.04296875, -17.576171875, -15.109375, -12.642578125, -10.17578125, -7.708984375, -5.2421875, -2.775390625, -0.30859375, 2.158203125, 4.625, 7.091796875, 9.55859375, 12.025390625, 14.4921875, 16.958984375, 19.42578125, 21.892578125, 24.359375, 26.826171875, 29.29296875, 31.759765625, 34.2265625, 36.693359375, 39.16015625, 41.626953125, 44.09375, 46.560546875, 49.02734375, 51.494140625, 53.9609375, 56.427734375, 58.89453125, 61.361328125, 63.828125, 66.294921875, 68.76171875, 71.228515625, 73.6953125, 76.162109375, 78.62890625, 81.095703125, 83.5625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 7.0, 6.0, 10.0, 12.0, 12.0, 18.0, 33.0, 36.0, 47.0, 77.0, 118.0, 163.0, 251.0, 341.0, 525.0, 730.0, 1189.0, 1716.0, 2704.0, 4204.0, 6780.0, 11723.0, 21009.0, 39038.0, 79091.0, 166098.0, 276596.0, 214764.0, 105965.0, 51457.0, 26348.0, 14646.0, 8504.0, 5104.0, 3174.0, 2064.0, 1356.0, 854.0, 567.0, 397.0, 242.0, 178.0, 109.0, 97.0, 59.0, 44.0, 33.0, 26.0, 18.0, 13.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-45.0625, -43.763671875, -42.46484375, -41.166015625, -39.8671875, -38.568359375, -37.26953125, -35.970703125, -34.671875, -33.373046875, -32.07421875, -30.775390625, -29.4765625, -28.177734375, -26.87890625, -25.580078125, -24.28125, -22.982421875, -21.68359375, -20.384765625, -19.0859375, -17.787109375, -16.48828125, -15.189453125, -13.890625, -12.591796875, -11.29296875, -9.994140625, -8.6953125, -7.396484375, -6.09765625, -4.798828125, -3.5, -2.201171875, -0.90234375, 0.396484375, 1.6953125, 2.994140625, 4.29296875, 5.591796875, 6.890625, 8.189453125, 9.48828125, 10.787109375, 12.0859375, 13.384765625, 14.68359375, 15.982421875, 17.28125, 18.580078125, 19.87890625, 21.177734375, 22.4765625, 23.775390625, 25.07421875, 26.373046875, 27.671875, 28.970703125, 30.26953125, 31.568359375, 32.8671875, 34.166015625, 35.46484375, 36.763671875, 38.0625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 15.0, 7.0, 8.0, 12.0, 18.0, 22.0, 24.0, 35.0, 31.0, 38.0, 41.0, 71.0, 51.0, 56.0, 58.0, 55.0, 56.0, 50.0, 57.0, 53.0, 39.0, 29.0, 34.0, 35.0, 28.0, 13.0, 13.0, 14.0, 9.0, 6.0, 4.0, 5.0, 7.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0022945404052734375, -0.0022280514240264893, -0.002161562442779541, -0.0020950734615325928, -0.0020285844802856445, -0.0019620954990386963, -0.001895606517791748, -0.0018291175365447998, -0.0017626285552978516, -0.0016961395740509033, -0.001629650592803955, -0.0015631616115570068, -0.0014966726303100586, -0.0014301836490631104, -0.0013636946678161621, -0.0012972056865692139, -0.0012307167053222656, -0.0011642277240753174, -0.0010977387428283691, -0.001031249761581421, -0.0009647607803344727, -0.0008982717990875244, -0.0008317828178405762, -0.0007652938365936279, -0.0006988048553466797, -0.0006323158740997314, -0.0005658268928527832, -0.000499337911605835, -0.0004328489303588867, -0.0003663599491119385, -0.00029987096786499023, -0.000233381986618042, -0.00016689300537109375, -0.00010040402412414551, -3.3915042877197266e-05, 3.2573938369750977e-05, 9.906291961669922e-05, 0.00016555190086364746, 0.0002320408821105957, 0.00029852986335754395, 0.0003650188446044922, 0.00043150782585144043, 0.0004979968070983887, 0.0005644857883453369, 0.0006309747695922852, 0.0006974637508392334, 0.0007639527320861816, 0.0008304417133331299, 0.0008969306945800781, 0.0009634196758270264, 0.0010299086570739746, 0.0010963976383209229, 0.001162886619567871, 0.0012293756008148193, 0.0012958645820617676, 0.0013623535633087158, 0.001428842544555664, 0.0014953315258026123, 0.0015618205070495605, 0.0016283094882965088, 0.001694798469543457, 0.0017612874507904053, 0.0018277764320373535, 0.0018942654132843018, 0.00196075439453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 2.0, 6.0, 11.0, 17.0, 20.0, 35.0, 57.0, 108.0, 156.0, 199.0, 281.0, 421.0, 695.0, 986.0, 1537.0, 2374.0, 3571.0, 5387.0, 8432.0, 12818.0, 19637.0, 29705.0, 44104.0, 64009.0, 87070.0, 111337.0, 126887.0, 127925.0, 112610.0, 88474.0, 65296.0, 45186.0, 30350.0, 20052.0, 13473.0, 8724.0, 5742.0, 3721.0, 2378.0, 1571.0, 1087.0, 689.0, 498.0, 314.0, 230.0, 121.0, 82.0, 57.0, 44.0, 28.0, 21.0, 12.0, 6.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-36.0625, -34.86181640625, -33.6611328125, -32.46044921875, -31.259765625, -30.05908203125, -28.8583984375, -27.65771484375, -26.45703125, -25.25634765625, -24.0556640625, -22.85498046875, -21.654296875, -20.45361328125, -19.2529296875, -18.05224609375, -16.8515625, -15.65087890625, -14.4501953125, -13.24951171875, -12.048828125, -10.84814453125, -9.6474609375, -8.44677734375, -7.24609375, -6.04541015625, -4.8447265625, -3.64404296875, -2.443359375, -1.24267578125, -0.0419921875, 1.15869140625, 2.359375, 3.56005859375, 4.7607421875, 5.96142578125, 7.162109375, 8.36279296875, 9.5634765625, 10.76416015625, 11.96484375, 13.16552734375, 14.3662109375, 15.56689453125, 16.767578125, 17.96826171875, 19.1689453125, 20.36962890625, 21.5703125, 22.77099609375, 23.9716796875, 25.17236328125, 26.373046875, 27.57373046875, 28.7744140625, 29.97509765625, 31.17578125, 32.37646484375, 33.5771484375, 34.77783203125, 35.978515625, 37.17919921875, 38.3798828125, 39.58056640625, 40.78125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 7.0, 8.0, 6.0, 8.0, 11.0, 9.0, 26.0, 17.0, 22.0, 21.0, 43.0, 45.0, 55.0, 46.0, 48.0, 55.0, 48.0, 54.0, 43.0, 45.0, 39.0, 49.0, 39.0, 40.0, 30.0, 32.0, 18.0, 23.0, 21.0, 19.0, 14.0, 15.0, 9.0, 7.0, 7.0, 8.0, 6.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.390625, -15.850830078125, -15.31103515625, -14.771240234375, -14.2314453125, -13.691650390625, -13.15185546875, -12.612060546875, -12.072265625, -11.532470703125, -10.99267578125, -10.452880859375, -9.9130859375, -9.373291015625, -8.83349609375, -8.293701171875, -7.75390625, -7.214111328125, -6.67431640625, -6.134521484375, -5.5947265625, -5.054931640625, -4.51513671875, -3.975341796875, -3.435546875, -2.895751953125, -2.35595703125, -1.816162109375, -1.2763671875, -0.736572265625, -0.19677734375, 0.343017578125, 0.8828125, 1.422607421875, 1.96240234375, 2.502197265625, 3.0419921875, 3.581787109375, 4.12158203125, 4.661376953125, 5.201171875, 5.740966796875, 6.28076171875, 6.820556640625, 7.3603515625, 7.900146484375, 8.43994140625, 8.979736328125, 9.51953125, 10.059326171875, 10.59912109375, 11.138916015625, 11.6787109375, 12.218505859375, 12.75830078125, 13.298095703125, 13.837890625, 14.377685546875, 14.91748046875, 15.457275390625, 15.9970703125, 16.536865234375, 17.07666015625, 17.616455078125, 18.15625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 5.0, 5.0, 5.0, 10.0, 12.0, 13.0, 14.0, 16.0, 24.0, 30.0, 30.0, 29.0, 38.0, 53.0, 47.0, 44.0, 41.0, 43.0, 36.0, 41.0, 46.0, 40.0, 37.0, 42.0, 46.0, 35.0, 41.0, 25.0, 31.0, 18.0, 15.0, 15.0, 18.0, 11.0, 10.0, 9.0, 7.0, 8.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-125.12088775634766, -120.9701156616211, -116.8193359375, -112.66856384277344, -108.51779174804688, -104.36701965332031, -100.21624755859375, -96.06546783447266, -91.9146957397461, -87.76392364501953, -83.61314392089844, -79.46237182617188, -75.31159973144531, -71.16082763671875, -67.01005554199219, -62.859275817871094, -58.70850372314453, -54.55773162841797, -50.40695571899414, -46.25617980957031, -42.10540771484375, -37.95463562011719, -33.80385971069336, -29.653085708618164, -25.50231170654297, -21.351537704467773, -17.200763702392578, -13.049989700317383, -8.899215698242188, -4.748441696166992, -0.5976676940917969, 3.5531063079833984, 7.7038726806640625, 11.854646682739258, 16.005420684814453, 20.15619468688965, 24.306968688964844, 28.45774269104004, 32.608516693115234, 36.75929260253906, 40.910064697265625, 45.06083679199219, 49.211612701416016, 53.362388610839844, 57.513160705566406, 61.66393280029297, 65.81471252441406, 69.96548461914062, 74.11625671386719, 78.26702880859375, 82.41780090332031, 86.5685806274414, 90.71935272216797, 94.87012481689453, 99.02090454101562, 103.17167663574219, 107.32244873046875, 111.47322082519531, 115.62399291992188, 119.77477264404297, 123.92554473876953, 128.07632446289062, 132.2270965576172, 136.37786865234375, 140.5286407470703]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 3.0, 8.0, 8.0, 10.0, 12.0, 13.0, 10.0, 18.0, 22.0, 19.0, 29.0, 27.0, 23.0, 34.0, 33.0, 31.0, 38.0, 34.0, 37.0, 35.0, 38.0, 55.0, 42.0, 33.0, 35.0, 31.0, 48.0, 34.0, 26.0, 36.0, 23.0, 27.0, 20.0, 22.0, 13.0, 17.0, 6.0, 9.0, 13.0, 4.0, 4.0, 5.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-106.82785034179688, -103.26084899902344, -99.69384765625, -96.12684631347656, -92.55984497070312, -88.99284362792969, -85.42584228515625, -81.85884094238281, -78.29183959960938, -74.72483825683594, -71.1578369140625, -67.59083557128906, -64.02383422851562, -60.45683288574219, -56.88983154296875, -53.32283020019531, -49.755828857421875, -46.18882751464844, -42.621826171875, -39.05482482910156, -35.487823486328125, -31.920822143554688, -28.35382080078125, -24.786819458007812, -21.219818115234375, -17.652816772460938, -14.0858154296875, -10.518814086914062, -6.951812744140625, -3.3848114013671875, 0.18218994140625, 3.7491912841796875, 7.316184997558594, 10.883186340332031, 14.450187683105469, 18.017189025878906, 21.584190368652344, 25.15119171142578, 28.71819305419922, 32.285194396972656, 35.852195739746094, 39.41919708251953, 42.98619842529297, 46.553199768066406, 50.120201110839844, 53.68720245361328, 57.25420379638672, 60.821205139160156, 64.3882064819336, 67.95520782470703, 71.52220916748047, 75.0892105102539, 78.65621185302734, 82.22321319580078, 85.79021453857422, 89.35721588134766, 92.9242172241211, 96.49121856689453, 100.05821990966797, 103.6252212524414, 107.19222259521484, 110.75922393798828, 114.32622528076172, 117.89322662353516, 121.4602279663086]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 4.0, 7.0, 12.0, 19.0, 26.0, 36.0, 70.0, 126.0, 170.0, 281.0, 481.0, 721.0, 1215.0, 1710.0, 2758.0, 3928.0, 5908.0, 8767.0, 12152.0, 16987.0, 22963.0, 30430.0, 38849.0, 47466.0, 57300.0, 66055.0, 73282.0, 78489.0, 81228.0, 79785.0, 75541.0, 68814.0, 59880.0, 50984.0, 41629.0, 32851.0, 25462.0, 18637.0, 13867.0, 9620.0, 6695.0, 4574.0, 3101.0, 2029.0, 1320.0, 840.0, 583.0, 322.0, 232.0, 151.0, 85.0, 50.0, 35.0, 16.0, 12.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-68.875, -66.62890625, -64.3828125, -62.13671875, -59.890625, -57.64453125, -55.3984375, -53.15234375, -50.90625, -48.66015625, -46.4140625, -44.16796875, -41.921875, -39.67578125, -37.4296875, -35.18359375, -32.9375, -30.69140625, -28.4453125, -26.19921875, -23.953125, -21.70703125, -19.4609375, -17.21484375, -14.96875, -12.72265625, -10.4765625, -8.23046875, -5.984375, -3.73828125, -1.4921875, 0.75390625, 3.0, 5.24609375, 7.4921875, 9.73828125, 11.984375, 14.23046875, 16.4765625, 18.72265625, 20.96875, 23.21484375, 25.4609375, 27.70703125, 29.953125, 32.19921875, 34.4453125, 36.69140625, 38.9375, 41.18359375, 43.4296875, 45.67578125, 47.921875, 50.16796875, 52.4140625, 54.66015625, 56.90625, 59.15234375, 61.3984375, 63.64453125, 65.890625, 68.13671875, 70.3828125, 72.62890625, 74.875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 7.0, 8.0, 8.0, 9.0, 11.0, 17.0, 11.0, 18.0, 20.0, 19.0, 29.0, 28.0, 27.0, 35.0, 29.0, 32.0, 40.0, 35.0, 32.0, 42.0, 34.0, 53.0, 46.0, 28.0, 38.0, 36.0, 47.0, 29.0, 25.0, 35.0, 25.0, 28.0, 19.0, 17.0, 16.0, 14.0, 7.0, 7.0, 14.0, 3.0, 4.0, 9.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-102.8125, -99.3505859375, -95.888671875, -92.4267578125, -88.96484375, -85.5029296875, -82.041015625, -78.5791015625, -75.1171875, -71.6552734375, -68.193359375, -64.7314453125, -61.26953125, -57.8076171875, -54.345703125, -50.8837890625, -47.421875, -43.9599609375, -40.498046875, -37.0361328125, -33.57421875, -30.1123046875, -26.650390625, -23.1884765625, -19.7265625, -16.2646484375, -12.802734375, -9.3408203125, -5.87890625, -2.4169921875, 1.044921875, 4.5068359375, 7.96875, 11.4306640625, 14.892578125, 18.3544921875, 21.81640625, 25.2783203125, 28.740234375, 32.2021484375, 35.6640625, 39.1259765625, 42.587890625, 46.0498046875, 49.51171875, 52.9736328125, 56.435546875, 59.8974609375, 63.359375, 66.8212890625, 70.283203125, 73.7451171875, 77.20703125, 80.6689453125, 84.130859375, 87.5927734375, 91.0546875, 94.5166015625, 97.978515625, 101.4404296875, 104.90234375, 108.3642578125, 111.826171875, 115.2880859375, 118.75]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 13.0, 18.0, 26.0, 40.0, 104.0, 113.0, 201.0, 333.0, 521.0, 761.0, 1177.0, 1752.0, 2666.0, 4055.0, 5955.0, 8315.0, 12109.0, 16722.0, 22696.0, 29177.0, 37207.0, 45961.0, 55162.0, 63359.0, 70624.0, 75760.0, 77959.0, 78291.0, 74851.0, 68978.0, 62173.0, 53047.0, 44007.0, 35198.0, 27600.0, 20758.0, 15483.0, 11156.0, 8040.0, 5454.0, 3746.0, 2378.0, 1665.0, 1109.0, 660.0, 474.0, 269.0, 163.0, 110.0, 67.0, 48.0, 25.0, 13.0, 10.0, 2.0, 4.0, 0.0, 2.0], "bins": [-69.625, -67.5078125, -65.390625, -63.2734375, -61.15625, -59.0390625, -56.921875, -54.8046875, -52.6875, -50.5703125, -48.453125, -46.3359375, -44.21875, -42.1015625, -39.984375, -37.8671875, -35.75, -33.6328125, -31.515625, -29.3984375, -27.28125, -25.1640625, -23.046875, -20.9296875, -18.8125, -16.6953125, -14.578125, -12.4609375, -10.34375, -8.2265625, -6.109375, -3.9921875, -1.875, 0.2421875, 2.359375, 4.4765625, 6.59375, 8.7109375, 10.828125, 12.9453125, 15.0625, 17.1796875, 19.296875, 21.4140625, 23.53125, 25.6484375, 27.765625, 29.8828125, 32.0, 34.1171875, 36.234375, 38.3515625, 40.46875, 42.5859375, 44.703125, 46.8203125, 48.9375, 51.0546875, 53.171875, 55.2890625, 57.40625, 59.5234375, 61.640625, 63.7578125, 65.875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 3.0, 7.0, 6.0, 8.0, 8.0, 12.0, 7.0, 6.0, 9.0, 13.0, 13.0, 20.0, 22.0, 21.0, 25.0, 22.0, 24.0, 35.0, 36.0, 34.0, 34.0, 29.0, 36.0, 42.0, 35.0, 33.0, 30.0, 36.0, 28.0, 37.0, 37.0, 24.0, 25.0, 23.0, 30.0, 22.0, 17.0, 21.0, 15.0, 19.0, 22.0, 14.0, 9.0, 12.0, 8.0, 8.0, 2.0, 7.0, 7.0, 2.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-58.375, -56.4287109375, -54.482421875, -52.5361328125, -50.58984375, -48.6435546875, -46.697265625, -44.7509765625, -42.8046875, -40.8583984375, -38.912109375, -36.9658203125, -35.01953125, -33.0732421875, -31.126953125, -29.1806640625, -27.234375, -25.2880859375, -23.341796875, -21.3955078125, -19.44921875, -17.5029296875, -15.556640625, -13.6103515625, -11.6640625, -9.7177734375, -7.771484375, -5.8251953125, -3.87890625, -1.9326171875, 0.013671875, 1.9599609375, 3.90625, 5.8525390625, 7.798828125, 9.7451171875, 11.69140625, 13.6376953125, 15.583984375, 17.5302734375, 19.4765625, 21.4228515625, 23.369140625, 25.3154296875, 27.26171875, 29.2080078125, 31.154296875, 33.1005859375, 35.046875, 36.9931640625, 38.939453125, 40.8857421875, 42.83203125, 44.7783203125, 46.724609375, 48.6708984375, 50.6171875, 52.5634765625, 54.509765625, 56.4560546875, 58.40234375, 60.3486328125, 62.294921875, 64.2412109375, 66.1875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 7.0, 8.0, 15.0, 26.0, 36.0, 59.0, 111.0, 195.0, 288.0, 501.0, 819.0, 1360.0, 2189.0, 3503.0, 5903.0, 9360.0, 14244.0, 21534.0, 31177.0, 43489.0, 57332.0, 73100.0, 86684.0, 96179.0, 101596.0, 99833.0, 92118.0, 79461.0, 65096.0, 50655.0, 36993.0, 26142.0, 17750.0, 11580.0, 7454.0, 4511.0, 2843.0, 1760.0, 1033.0, 662.0, 375.0, 235.0, 148.0, 81.0, 49.0, 29.0, 18.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0], "bins": [-39.90625, -38.7900390625, -37.673828125, -36.5576171875, -35.44140625, -34.3251953125, -33.208984375, -32.0927734375, -30.9765625, -29.8603515625, -28.744140625, -27.6279296875, -26.51171875, -25.3955078125, -24.279296875, -23.1630859375, -22.046875, -20.9306640625, -19.814453125, -18.6982421875, -17.58203125, -16.4658203125, -15.349609375, -14.2333984375, -13.1171875, -12.0009765625, -10.884765625, -9.7685546875, -8.65234375, -7.5361328125, -6.419921875, -5.3037109375, -4.1875, -3.0712890625, -1.955078125, -0.8388671875, 0.27734375, 1.3935546875, 2.509765625, 3.6259765625, 4.7421875, 5.8583984375, 6.974609375, 8.0908203125, 9.20703125, 10.3232421875, 11.439453125, 12.5556640625, 13.671875, 14.7880859375, 15.904296875, 17.0205078125, 18.13671875, 19.2529296875, 20.369140625, 21.4853515625, 22.6015625, 23.7177734375, 24.833984375, 25.9501953125, 27.06640625, 28.1826171875, 29.298828125, 30.4150390625, 31.53125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 9.0, 13.0, 14.0, 11.0, 13.0, 18.0, 28.0, 25.0, 24.0, 33.0, 39.0, 32.0, 33.0, 49.0, 44.0, 37.0, 49.0, 44.0, 42.0, 45.0, 29.0, 41.0, 27.0, 30.0, 38.0, 28.0, 22.0, 23.0, 25.0, 27.0, 22.0, 19.0, 11.0, 10.0, 7.0, 5.0, 9.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004322052001953125, -0.004174411296844482, -0.00402677059173584, -0.0038791298866271973, -0.0037314891815185547, -0.003583848476409912, -0.0034362077713012695, -0.003288567066192627, -0.0031409263610839844, -0.002993285655975342, -0.0028456449508666992, -0.0026980042457580566, -0.002550363540649414, -0.0024027228355407715, -0.002255082130432129, -0.0021074414253234863, -0.0019598007202148438, -0.0018121600151062012, -0.0016645193099975586, -0.001516878604888916, -0.0013692378997802734, -0.0012215971946716309, -0.0010739564895629883, -0.0009263157844543457, -0.0007786750793457031, -0.0006310343742370605, -0.00048339366912841797, -0.0003357529640197754, -0.0001881122589111328, -4.0471553802490234e-05, 0.00010716915130615234, 0.0002548098564147949, 0.0004024505615234375, 0.0005500912666320801, 0.0006977319717407227, 0.0008453726768493652, 0.0009930133819580078, 0.0011406540870666504, 0.001288294792175293, 0.0014359354972839355, 0.0015835762023925781, 0.0017312169075012207, 0.0018788576126098633, 0.002026498317718506, 0.0021741390228271484, 0.002321779727935791, 0.0024694204330444336, 0.002617061138153076, 0.0027647018432617188, 0.0029123425483703613, 0.003059983253479004, 0.0032076239585876465, 0.003355264663696289, 0.0035029053688049316, 0.0036505460739135742, 0.003798186779022217, 0.003945827484130859, 0.004093468189239502, 0.0042411088943481445, 0.004388749599456787, 0.00453639030456543, 0.004684031009674072, 0.004831671714782715, 0.004979312419891357, 0.005126953125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 4.0, 18.0, 16.0, 32.0, 64.0, 85.0, 160.0, 300.0, 448.0, 792.0, 1362.0, 2302.0, 3704.0, 6321.0, 10157.0, 16055.0, 24145.0, 34311.0, 48350.0, 63440.0, 79075.0, 92829.0, 101664.0, 104732.0, 99928.0, 89438.0, 75565.0, 59415.0, 44600.0, 31467.0, 21338.0, 14012.0, 8807.0, 5540.0, 3345.0, 1915.0, 1147.0, 714.0, 396.0, 229.0, 134.0, 77.0, 51.0, 34.0, 12.0, 12.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-38.125, -36.82666015625, -35.5283203125, -34.22998046875, -32.931640625, -31.63330078125, -30.3349609375, -29.03662109375, -27.73828125, -26.43994140625, -25.1416015625, -23.84326171875, -22.544921875, -21.24658203125, -19.9482421875, -18.64990234375, -17.3515625, -16.05322265625, -14.7548828125, -13.45654296875, -12.158203125, -10.85986328125, -9.5615234375, -8.26318359375, -6.96484375, -5.66650390625, -4.3681640625, -3.06982421875, -1.771484375, -0.47314453125, 0.8251953125, 2.12353515625, 3.421875, 4.72021484375, 6.0185546875, 7.31689453125, 8.615234375, 9.91357421875, 11.2119140625, 12.51025390625, 13.80859375, 15.10693359375, 16.4052734375, 17.70361328125, 19.001953125, 20.30029296875, 21.5986328125, 22.89697265625, 24.1953125, 25.49365234375, 26.7919921875, 28.09033203125, 29.388671875, 30.68701171875, 31.9853515625, 33.28369140625, 34.58203125, 35.88037109375, 37.1787109375, 38.47705078125, 39.775390625, 41.07373046875, 42.3720703125, 43.67041015625, 44.96875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 2.0, 9.0, 9.0, 9.0, 11.0, 12.0, 12.0, 16.0, 19.0, 21.0, 36.0, 29.0, 25.0, 33.0, 34.0, 34.0, 52.0, 48.0, 58.0, 47.0, 48.0, 50.0, 39.0, 47.0, 31.0, 38.0, 38.0, 31.0, 29.0, 20.0, 23.0, 13.0, 18.0, 13.0, 13.0, 3.0, 4.0, 9.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.796875, -18.20166015625, -17.6064453125, -17.01123046875, -16.416015625, -15.82080078125, -15.2255859375, -14.63037109375, -14.03515625, -13.43994140625, -12.8447265625, -12.24951171875, -11.654296875, -11.05908203125, -10.4638671875, -9.86865234375, -9.2734375, -8.67822265625, -8.0830078125, -7.48779296875, -6.892578125, -6.29736328125, -5.7021484375, -5.10693359375, -4.51171875, -3.91650390625, -3.3212890625, -2.72607421875, -2.130859375, -1.53564453125, -0.9404296875, -0.34521484375, 0.25, 0.84521484375, 1.4404296875, 2.03564453125, 2.630859375, 3.22607421875, 3.8212890625, 4.41650390625, 5.01171875, 5.60693359375, 6.2021484375, 6.79736328125, 7.392578125, 7.98779296875, 8.5830078125, 9.17822265625, 9.7734375, 10.36865234375, 10.9638671875, 11.55908203125, 12.154296875, 12.74951171875, 13.3447265625, 13.93994140625, 14.53515625, 15.13037109375, 15.7255859375, 16.32080078125, 16.916015625, 17.51123046875, 18.1064453125, 18.70166015625, 19.296875]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 11.0, 13.0, 14.0, 12.0, 13.0, 22.0, 20.0, 36.0, 36.0, 39.0, 38.0, 35.0, 40.0, 44.0, 55.0, 49.0, 50.0, 41.0, 48.0, 44.0, 44.0, 43.0, 35.0, 32.0, 26.0, 24.0, 19.0, 16.0, 17.0, 16.0, 19.0, 7.0, 10.0, 4.0, 3.0, 8.0, 6.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-121.75225067138672, -117.50408935546875, -113.25592803955078, -109.00776672363281, -104.75960540771484, -100.51144409179688, -96.26327514648438, -92.01512145996094, -87.76695251464844, -83.51879119873047, -79.2706298828125, -75.02246856689453, -70.77430725097656, -66.5261459350586, -62.27798080444336, -58.02981948852539, -53.78166198730469, -49.53350067138672, -45.28533935546875, -41.03717803955078, -36.78901672363281, -32.540855407714844, -28.29269027709961, -24.04452896118164, -19.796367645263672, -15.548206329345703, -11.300044059753418, -7.051881790161133, -2.803720474243164, 1.4444408416748047, 5.692604064941406, 9.940765380859375, 14.188919067382812, 18.43708038330078, 22.68524169921875, 26.93340492248535, 31.18156623840332, 35.429725646972656, 39.67789077758789, 43.92605209350586, 48.17421340942383, 52.4223747253418, 56.670536041259766, 60.918701171875, 65.16686248779297, 69.41502380371094, 73.6631851196289, 77.91134643554688, 82.15950775146484, 86.40766906738281, 90.65583038330078, 94.90399169921875, 99.15215301513672, 103.40031433105469, 107.64848327636719, 111.89663696289062, 116.14480590820312, 120.3929672241211, 124.64112854003906, 128.88929748535156, 133.137451171875, 137.3856201171875, 141.63377380371094, 145.88194274902344, 150.13009643554688]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 7.0, 6.0, 9.0, 10.0, 11.0, 16.0, 15.0, 21.0, 13.0, 27.0, 35.0, 31.0, 43.0, 30.0, 41.0, 38.0, 39.0, 34.0, 47.0, 42.0, 56.0, 42.0, 32.0, 42.0, 39.0, 32.0, 39.0, 29.0, 23.0, 24.0, 35.0, 17.0, 13.0, 13.0, 13.0, 6.0, 11.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-117.27759552001953, -113.27005767822266, -109.26251220703125, -105.25497436523438, -101.2474365234375, -97.2398910522461, -93.23235321044922, -89.22480773925781, -85.21726989746094, -81.20973205566406, -77.20218658447266, -73.19464874267578, -69.18710327148438, -65.1795654296875, -61.172027587890625, -57.164485931396484, -53.156944274902344, -49.1494026184082, -45.14186096191406, -41.13432312011719, -37.12678146362305, -33.119239807128906, -29.1117000579834, -25.10416030883789, -21.09661865234375, -17.08907699584961, -13.081537246704102, -9.073996543884277, -5.066455841064453, -1.0589141845703125, 2.9486255645751953, 6.956165313720703, 10.963714599609375, 14.9712553024292, 18.978796005249023, 22.98633575439453, 26.993877410888672, 31.001419067382812, 35.00895690917969, 39.01649856567383, 43.02404022216797, 47.03158187866211, 51.03912353515625, 55.046661376953125, 59.054203033447266, 63.061744689941406, 67.06928253173828, 71.07682800292969, 75.08436584472656, 79.09190368652344, 83.09944915771484, 87.10698699951172, 91.11453247070312, 95.1220703125, 99.12960815429688, 103.13714599609375, 107.14469146728516, 111.15222930908203, 115.15977478027344, 119.16731262207031, 123.17485046386719, 127.1823959350586, 131.18994140625, 135.19747924804688, 139.20501708984375]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 5.0, 5.0, 10.0, 19.0, 46.0, 54.0, 93.0, 165.0, 318.0, 536.0, 970.0, 1724.0, 2873.0, 5067.0, 8392.0, 13796.0, 22350.0, 35420.0, 55074.0, 83215.0, 120536.0, 167658.0, 225683.0, 286246.0, 342303.0, 388816.0, 411650.0, 404311.0, 374568.0, 323961.0, 264193.0, 203681.0, 149225.0, 105958.0, 71458.0, 47238.0, 30065.0, 18629.0, 11475.0, 6906.0, 4019.0, 2394.0, 1347.0, 822.0, 449.0, 261.0, 147.0, 74.0, 42.0, 21.0, 16.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.625, -80.8203125, -78.015625, -75.2109375, -72.40625, -69.6015625, -66.796875, -63.9921875, -61.1875, -58.3828125, -55.578125, -52.7734375, -49.96875, -47.1640625, -44.359375, -41.5546875, -38.75, -35.9453125, -33.140625, -30.3359375, -27.53125, -24.7265625, -21.921875, -19.1171875, -16.3125, -13.5078125, -10.703125, -7.8984375, -5.09375, -2.2890625, 0.515625, 3.3203125, 6.125, 8.9296875, 11.734375, 14.5390625, 17.34375, 20.1484375, 22.953125, 25.7578125, 28.5625, 31.3671875, 34.171875, 36.9765625, 39.78125, 42.5859375, 45.390625, 48.1953125, 51.0, 53.8046875, 56.609375, 59.4140625, 62.21875, 65.0234375, 67.828125, 70.6328125, 73.4375, 76.2421875, 79.046875, 81.8515625, 84.65625, 87.4609375, 90.265625, 93.0703125, 95.875]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 9.0, 7.0, 5.0, 6.0, 13.0, 10.0, 20.0, 17.0, 16.0, 18.0, 32.0, 30.0, 32.0, 46.0, 30.0, 37.0, 41.0, 36.0, 41.0, 36.0, 49.0, 50.0, 42.0, 34.0, 38.0, 40.0, 29.0, 39.0, 25.0, 35.0, 19.0, 37.0, 12.0, 14.0, 10.0, 14.0, 9.0, 7.0, 6.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-104.9375, -101.333984375, -97.73046875, -94.126953125, -90.5234375, -86.919921875, -83.31640625, -79.712890625, -76.109375, -72.505859375, -68.90234375, -65.298828125, -61.6953125, -58.091796875, -54.48828125, -50.884765625, -47.28125, -43.677734375, -40.07421875, -36.470703125, -32.8671875, -29.263671875, -25.66015625, -22.056640625, -18.453125, -14.849609375, -11.24609375, -7.642578125, -4.0390625, -0.435546875, 3.16796875, 6.771484375, 10.375, 13.978515625, 17.58203125, 21.185546875, 24.7890625, 28.392578125, 31.99609375, 35.599609375, 39.203125, 42.806640625, 46.41015625, 50.013671875, 53.6171875, 57.220703125, 60.82421875, 64.427734375, 68.03125, 71.634765625, 75.23828125, 78.841796875, 82.4453125, 86.048828125, 89.65234375, 93.255859375, 96.859375, 100.462890625, 104.06640625, 107.669921875, 111.2734375, 114.876953125, 118.48046875, 122.083984375, 125.6875]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 7.0, 12.0, 24.0, 47.0, 67.0, 133.0, 279.0, 423.0, 798.0, 1309.0, 2198.0, 3833.0, 6440.0, 10102.0, 16208.0, 25273.0, 38242.0, 56219.0, 80516.0, 111506.0, 149404.0, 192874.0, 237564.0, 282149.0, 320155.0, 346395.0, 355459.0, 349122.0, 326719.0, 292061.0, 247299.0, 202420.0, 157891.0, 118981.0, 85784.0, 60835.0, 41637.0, 27687.0, 17682.0, 11276.0, 7097.0, 4164.0, 2433.0, 1551.0, 901.0, 529.0, 284.0, 128.0, 93.0, 35.0, 29.0, 11.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-84.8125, -82.12890625, -79.4453125, -76.76171875, -74.078125, -71.39453125, -68.7109375, -66.02734375, -63.34375, -60.66015625, -57.9765625, -55.29296875, -52.609375, -49.92578125, -47.2421875, -44.55859375, -41.875, -39.19140625, -36.5078125, -33.82421875, -31.140625, -28.45703125, -25.7734375, -23.08984375, -20.40625, -17.72265625, -15.0390625, -12.35546875, -9.671875, -6.98828125, -4.3046875, -1.62109375, 1.0625, 3.74609375, 6.4296875, 9.11328125, 11.796875, 14.48046875, 17.1640625, 19.84765625, 22.53125, 25.21484375, 27.8984375, 30.58203125, 33.265625, 35.94921875, 38.6328125, 41.31640625, 44.0, 46.68359375, 49.3671875, 52.05078125, 54.734375, 57.41796875, 60.1015625, 62.78515625, 65.46875, 68.15234375, 70.8359375, 73.51953125, 76.203125, 78.88671875, 81.5703125, 84.25390625, 86.9375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 3.0, 7.0, 11.0, 22.0, 20.0, 25.0, 43.0, 55.0, 44.0, 73.0, 76.0, 103.0, 107.0, 112.0, 131.0, 151.0, 162.0, 198.0, 200.0, 223.0, 227.0, 222.0, 192.0, 185.0, 199.0, 169.0, 182.0, 167.0, 130.0, 125.0, 102.0, 91.0, 68.0, 52.0, 44.0, 30.0, 32.0, 20.0, 23.0, 11.0, 10.0, 8.0, 10.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-58.375, -56.70703125, -55.0390625, -53.37109375, -51.703125, -50.03515625, -48.3671875, -46.69921875, -45.03125, -43.36328125, -41.6953125, -40.02734375, -38.359375, -36.69140625, -35.0234375, -33.35546875, -31.6875, -30.01953125, -28.3515625, -26.68359375, -25.015625, -23.34765625, -21.6796875, -20.01171875, -18.34375, -16.67578125, -15.0078125, -13.33984375, -11.671875, -10.00390625, -8.3359375, -6.66796875, -5.0, -3.33203125, -1.6640625, 0.00390625, 1.671875, 3.33984375, 5.0078125, 6.67578125, 8.34375, 10.01171875, 11.6796875, 13.34765625, 15.015625, 16.68359375, 18.3515625, 20.01953125, 21.6875, 23.35546875, 25.0234375, 26.69140625, 28.359375, 30.02734375, 31.6953125, 33.36328125, 35.03125, 36.69921875, 38.3671875, 40.03515625, 41.703125, 43.37109375, 45.0390625, 46.70703125, 48.375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 6.0, 2.0, 5.0, 5.0, 8.0, 16.0, 5.0, 23.0, 17.0, 15.0, 21.0, 29.0, 21.0, 35.0, 34.0, 37.0, 45.0, 50.0, 35.0, 34.0, 38.0, 34.0, 44.0, 36.0, 36.0, 33.0, 44.0, 34.0, 23.0, 41.0, 28.0, 24.0, 19.0, 28.0, 19.0, 21.0, 8.0, 9.0, 10.0, 6.0, 6.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-110.3650894165039, -106.53553009033203, -102.70597839355469, -98.87641906738281, -95.04685974121094, -91.21730041503906, -87.38774108886719, -83.55818939208984, -79.72863006591797, -75.8990707397461, -72.06951904296875, -68.23995971679688, -64.410400390625, -60.580841064453125, -56.751285552978516, -52.921730041503906, -49.09217071533203, -45.262611389160156, -41.43305587768555, -37.60350036621094, -33.77394104003906, -29.94438362121582, -26.114826202392578, -22.285268783569336, -18.455711364746094, -14.626153945922852, -10.79659652709961, -6.967039108276367, -3.137481689453125, 0.6920757293701172, 4.521633148193359, 8.351190567016602, 12.180740356445312, 16.010297775268555, 19.839855194091797, 23.66941261291504, 27.49897003173828, 31.328527450561523, 35.158084869384766, 38.987640380859375, 42.81719970703125, 46.646759033203125, 50.476314544677734, 54.305870056152344, 58.13542938232422, 61.964988708496094, 65.79454040527344, 69.62409973144531, 73.45365905761719, 77.28321838378906, 81.11277770996094, 84.94232940673828, 88.77188873291016, 92.60144805908203, 96.43099975585938, 100.26055908203125, 104.09011840820312, 107.919677734375, 111.74923706054688, 115.57878875732422, 119.4083480834961, 123.23790740966797, 127.06745910644531, 130.8970184326172, 134.72657775878906]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 6.0, 8.0, 10.0, 4.0, 8.0, 10.0, 17.0, 17.0, 22.0, 17.0, 20.0, 29.0, 13.0, 39.0, 34.0, 39.0, 35.0, 49.0, 28.0, 45.0, 33.0, 36.0, 42.0, 48.0, 45.0, 36.0, 26.0, 32.0, 33.0, 35.0, 31.0, 24.0, 22.0, 12.0, 12.0, 15.0, 8.0, 12.0, 10.0, 9.0, 9.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-114.84429931640625, -111.15113830566406, -107.45797729492188, -103.76481628417969, -100.0716552734375, -96.37849426269531, -92.6853256225586, -88.9921646118164, -85.29900360107422, -81.60584259033203, -77.91268157958984, -74.21952056884766, -70.52635192871094, -66.83319091796875, -63.14002990722656, -59.446868896484375, -55.75370788574219, -52.060546875, -48.36738586425781, -44.67422103881836, -40.98106002807617, -37.287899017333984, -33.59473419189453, -29.901573181152344, -26.208412170410156, -22.51525115966797, -18.82208824157715, -15.128926277160645, -11.43576431274414, -7.742603302001953, -4.049440383911133, -0.3562774658203125, 3.3368759155273438, 7.030037879943848, 10.723199844360352, 14.416361808776855, 18.10952377319336, 21.802684783935547, 25.495847702026367, 29.189010620117188, 32.882171630859375, 36.57533264160156, 40.26849365234375, 43.9616584777832, 47.65481948852539, 51.34798049926758, 55.04114532470703, 58.73430633544922, 62.427467346191406, 66.1206283569336, 69.81378936767578, 73.50695037841797, 77.20011901855469, 80.89328002929688, 84.58644104003906, 88.27960205078125, 91.97276306152344, 95.66592407226562, 99.35908508300781, 103.05224609375, 106.74540710449219, 110.43856811523438, 114.1317367553711, 117.82489776611328, 121.51805877685547]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 7.0, 8.0, 18.0, 15.0, 37.0, 56.0, 97.0, 167.0, 247.0, 429.0, 662.0, 1166.0, 1897.0, 3377.0, 5979.0, 10938.0, 19914.0, 36238.0, 66156.0, 110712.0, 162650.0, 190830.0, 167257.0, 115225.0, 68603.0, 38417.0, 20990.0, 11544.0, 6371.0, 3547.0, 1999.0, 1221.0, 682.0, 421.0, 246.0, 174.0, 94.0, 60.0, 40.0, 22.0, 3.0, 11.0, 10.0, 9.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-68.9375, -66.751953125, -64.56640625, -62.380859375, -60.1953125, -58.009765625, -55.82421875, -53.638671875, -51.453125, -49.267578125, -47.08203125, -44.896484375, -42.7109375, -40.525390625, -38.33984375, -36.154296875, -33.96875, -31.783203125, -29.59765625, -27.412109375, -25.2265625, -23.041015625, -20.85546875, -18.669921875, -16.484375, -14.298828125, -12.11328125, -9.927734375, -7.7421875, -5.556640625, -3.37109375, -1.185546875, 1.0, 3.185546875, 5.37109375, 7.556640625, 9.7421875, 11.927734375, 14.11328125, 16.298828125, 18.484375, 20.669921875, 22.85546875, 25.041015625, 27.2265625, 29.412109375, 31.59765625, 33.783203125, 35.96875, 38.154296875, 40.33984375, 42.525390625, 44.7109375, 46.896484375, 49.08203125, 51.267578125, 53.453125, 55.638671875, 57.82421875, 60.009765625, 62.1953125, 64.380859375, 66.56640625, 68.751953125, 70.9375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 3.0, 2.0, 4.0, 8.0, 6.0, 10.0, 5.0, 7.0, 10.0, 19.0, 14.0, 24.0, 16.0, 24.0, 25.0, 21.0, 34.0, 33.0, 37.0, 39.0, 48.0, 28.0, 50.0, 27.0, 36.0, 46.0, 46.0, 42.0, 34.0, 29.0, 33.0, 31.0, 36.0, 29.0, 26.0, 20.0, 13.0, 11.0, 15.0, 7.0, 15.0, 8.0, 9.0, 9.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-114.0, -110.318359375, -106.63671875, -102.955078125, -99.2734375, -95.591796875, -91.91015625, -88.228515625, -84.546875, -80.865234375, -77.18359375, -73.501953125, -69.8203125, -66.138671875, -62.45703125, -58.775390625, -55.09375, -51.412109375, -47.73046875, -44.048828125, -40.3671875, -36.685546875, -33.00390625, -29.322265625, -25.640625, -21.958984375, -18.27734375, -14.595703125, -10.9140625, -7.232421875, -3.55078125, 0.130859375, 3.8125, 7.494140625, 11.17578125, 14.857421875, 18.5390625, 22.220703125, 25.90234375, 29.583984375, 33.265625, 36.947265625, 40.62890625, 44.310546875, 47.9921875, 51.673828125, 55.35546875, 59.037109375, 62.71875, 66.400390625, 70.08203125, 73.763671875, 77.4453125, 81.126953125, 84.80859375, 88.490234375, 92.171875, 95.853515625, 99.53515625, 103.216796875, 106.8984375, 110.580078125, 114.26171875, 117.943359375, 121.625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 10.0, 19.0, 22.0, 23.0, 62.0, 73.0, 110.0, 135.0, 242.0, 350.0, 514.0, 722.0, 1051.0, 1702.0, 2852.0, 5198.0, 9997.0, 20636.0, 47853.0, 113005.0, 235424.0, 289808.0, 176828.0, 76883.0, 32522.0, 14766.0, 7252.0, 3852.0, 2291.0, 1435.0, 953.0, 594.0, 433.0, 285.0, 197.0, 136.0, 103.0, 66.0, 36.0, 36.0, 29.0, 18.0, 8.0, 7.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-83.8125, -81.2158203125, -78.619140625, -76.0224609375, -73.42578125, -70.8291015625, -68.232421875, -65.6357421875, -63.0390625, -60.4423828125, -57.845703125, -55.2490234375, -52.65234375, -50.0556640625, -47.458984375, -44.8623046875, -42.265625, -39.6689453125, -37.072265625, -34.4755859375, -31.87890625, -29.2822265625, -26.685546875, -24.0888671875, -21.4921875, -18.8955078125, -16.298828125, -13.7021484375, -11.10546875, -8.5087890625, -5.912109375, -3.3154296875, -0.71875, 1.8779296875, 4.474609375, 7.0712890625, 9.66796875, 12.2646484375, 14.861328125, 17.4580078125, 20.0546875, 22.6513671875, 25.248046875, 27.8447265625, 30.44140625, 33.0380859375, 35.634765625, 38.2314453125, 40.828125, 43.4248046875, 46.021484375, 48.6181640625, 51.21484375, 53.8115234375, 56.408203125, 59.0048828125, 61.6015625, 64.1982421875, 66.794921875, 69.3916015625, 71.98828125, 74.5849609375, 77.181640625, 79.7783203125, 82.375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 2.0, 10.0, 8.0, 13.0, 15.0, 17.0, 14.0, 23.0, 19.0, 26.0, 30.0, 20.0, 24.0, 34.0, 35.0, 28.0, 38.0, 41.0, 34.0, 40.0, 41.0, 33.0, 45.0, 44.0, 45.0, 29.0, 35.0, 28.0, 32.0, 27.0, 31.0, 22.0, 22.0, 18.0, 12.0, 14.0, 8.0, 5.0, 5.0, 1.0, 8.0, 6.0, 8.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-80.125, -77.7294921875, -75.333984375, -72.9384765625, -70.54296875, -68.1474609375, -65.751953125, -63.3564453125, -60.9609375, -58.5654296875, -56.169921875, -53.7744140625, -51.37890625, -48.9833984375, -46.587890625, -44.1923828125, -41.796875, -39.4013671875, -37.005859375, -34.6103515625, -32.21484375, -29.8193359375, -27.423828125, -25.0283203125, -22.6328125, -20.2373046875, -17.841796875, -15.4462890625, -13.05078125, -10.6552734375, -8.259765625, -5.8642578125, -3.46875, -1.0732421875, 1.322265625, 3.7177734375, 6.11328125, 8.5087890625, 10.904296875, 13.2998046875, 15.6953125, 18.0908203125, 20.486328125, 22.8818359375, 25.27734375, 27.6728515625, 30.068359375, 32.4638671875, 34.859375, 37.2548828125, 39.650390625, 42.0458984375, 44.44140625, 46.8369140625, 49.232421875, 51.6279296875, 54.0234375, 56.4189453125, 58.814453125, 61.2099609375, 63.60546875, 66.0009765625, 68.396484375, 70.7919921875, 73.1875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 11.0, 12.0, 11.0, 24.0, 35.0, 69.0, 98.0, 152.0, 294.0, 603.0, 1099.0, 2190.0, 4797.0, 11639.0, 32886.0, 125852.0, 479349.0, 288608.0, 66104.0, 20161.0, 7744.0, 3427.0, 1606.0, 811.0, 408.0, 193.0, 128.0, 87.0, 53.0, 41.0, 14.0, 9.0, 11.0, 9.0, 4.0, 8.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.1875, -77.494140625, -74.80078125, -72.107421875, -69.4140625, -66.720703125, -64.02734375, -61.333984375, -58.640625, -55.947265625, -53.25390625, -50.560546875, -47.8671875, -45.173828125, -42.48046875, -39.787109375, -37.09375, -34.400390625, -31.70703125, -29.013671875, -26.3203125, -23.626953125, -20.93359375, -18.240234375, -15.546875, -12.853515625, -10.16015625, -7.466796875, -4.7734375, -2.080078125, 0.61328125, 3.306640625, 6.0, 8.693359375, 11.38671875, 14.080078125, 16.7734375, 19.466796875, 22.16015625, 24.853515625, 27.546875, 30.240234375, 32.93359375, 35.626953125, 38.3203125, 41.013671875, 43.70703125, 46.400390625, 49.09375, 51.787109375, 54.48046875, 57.173828125, 59.8671875, 62.560546875, 65.25390625, 67.947265625, 70.640625, 73.333984375, 76.02734375, 78.720703125, 81.4140625, 84.107421875, 86.80078125, 89.494140625, 92.1875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 15.0, 12.0, 26.0, 26.0, 23.0, 32.0, 45.0, 46.0, 52.0, 63.0, 52.0, 66.0, 64.0, 58.0, 56.0, 53.0, 41.0, 47.0, 39.0, 35.0, 31.0, 22.0, 17.0, 22.0, 19.0, 10.0, 5.0, 3.0, 8.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020732879638671875, -0.0020008981227874756, -0.0019285082817077637, -0.0018561184406280518, -0.0017837285995483398, -0.001711338758468628, -0.001638948917388916, -0.001566559076309204, -0.0014941692352294922, -0.0014217793941497803, -0.0013493895530700684, -0.0012769997119903564, -0.0012046098709106445, -0.0011322200298309326, -0.0010598301887512207, -0.0009874403476715088, -0.0009150505065917969, -0.000842660665512085, -0.000770270824432373, -0.0006978809833526611, -0.0006254911422729492, -0.0005531013011932373, -0.0004807114601135254, -0.0004083216190338135, -0.00033593177795410156, -0.00026354193687438965, -0.00019115209579467773, -0.00011876225471496582, -4.6372413635253906e-05, 2.6017427444458008e-05, 9.840726852416992e-05, 0.00017079710960388184, 0.00024318695068359375, 0.00031557679176330566, 0.0003879666328430176, 0.0004603564739227295, 0.0005327463150024414, 0.0006051361560821533, 0.0006775259971618652, 0.0007499158382415771, 0.0008223056793212891, 0.000894695520401001, 0.0009670853614807129, 0.0010394752025604248, 0.0011118650436401367, 0.0011842548847198486, 0.0012566447257995605, 0.0013290345668792725, 0.0014014244079589844, 0.0014738142490386963, 0.0015462040901184082, 0.0016185939311981201, 0.001690983772277832, 0.001763373613357544, 0.0018357634544372559, 0.0019081532955169678, 0.0019805431365966797, 0.0020529329776763916, 0.0021253228187561035, 0.0021977126598358154, 0.0022701025009155273, 0.0023424923419952393, 0.002414882183074951, 0.002487272024154663, 0.002559661865234375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 3.0, 9.0, 10.0, 16.0, 12.0, 21.0, 31.0, 37.0, 47.0, 73.0, 87.0, 143.0, 200.0, 290.0, 435.0, 571.0, 866.0, 1318.0, 1987.0, 3196.0, 5121.0, 8404.0, 13851.0, 23444.0, 38928.0, 64010.0, 99481.0, 140760.0, 165448.0, 156000.0, 119171.0, 79258.0, 49500.0, 29526.0, 17671.0, 10474.0, 6521.0, 4070.0, 2505.0, 1582.0, 1061.0, 732.0, 517.0, 336.0, 221.0, 174.0, 135.0, 91.0, 53.0, 44.0, 41.0, 32.0, 14.0, 9.0, 8.0, 5.0, 7.0, 2.0, 4.0, 4.0], "bins": [-52.90625, -51.2900390625, -49.673828125, -48.0576171875, -46.44140625, -44.8251953125, -43.208984375, -41.5927734375, -39.9765625, -38.3603515625, -36.744140625, -35.1279296875, -33.51171875, -31.8955078125, -30.279296875, -28.6630859375, -27.046875, -25.4306640625, -23.814453125, -22.1982421875, -20.58203125, -18.9658203125, -17.349609375, -15.7333984375, -14.1171875, -12.5009765625, -10.884765625, -9.2685546875, -7.65234375, -6.0361328125, -4.419921875, -2.8037109375, -1.1875, 0.4287109375, 2.044921875, 3.6611328125, 5.27734375, 6.8935546875, 8.509765625, 10.1259765625, 11.7421875, 13.3583984375, 14.974609375, 16.5908203125, 18.20703125, 19.8232421875, 21.439453125, 23.0556640625, 24.671875, 26.2880859375, 27.904296875, 29.5205078125, 31.13671875, 32.7529296875, 34.369140625, 35.9853515625, 37.6015625, 39.2177734375, 40.833984375, 42.4501953125, 44.06640625, 45.6826171875, 47.298828125, 48.9150390625, 50.53125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 3.0, 5.0, 6.0, 5.0, 6.0, 11.0, 19.0, 15.0, 24.0, 14.0, 26.0, 25.0, 39.0, 55.0, 40.0, 54.0, 56.0, 50.0, 41.0, 65.0, 54.0, 59.0, 33.0, 45.0, 43.0, 45.0, 39.0, 28.0, 29.0, 16.0, 3.0, 9.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.453125, -15.968505859375, -15.48388671875, -14.999267578125, -14.5146484375, -14.030029296875, -13.54541015625, -13.060791015625, -12.576171875, -12.091552734375, -11.60693359375, -11.122314453125, -10.6376953125, -10.153076171875, -9.66845703125, -9.183837890625, -8.69921875, -8.214599609375, -7.72998046875, -7.245361328125, -6.7607421875, -6.276123046875, -5.79150390625, -5.306884765625, -4.822265625, -4.337646484375, -3.85302734375, -3.368408203125, -2.8837890625, -2.399169921875, -1.91455078125, -1.429931640625, -0.9453125, -0.460693359375, 0.02392578125, 0.508544921875, 0.9931640625, 1.477783203125, 1.96240234375, 2.447021484375, 2.931640625, 3.416259765625, 3.90087890625, 4.385498046875, 4.8701171875, 5.354736328125, 5.83935546875, 6.323974609375, 6.80859375, 7.293212890625, 7.77783203125, 8.262451171875, 8.7470703125, 9.231689453125, 9.71630859375, 10.200927734375, 10.685546875, 11.170166015625, 11.65478515625, 12.139404296875, 12.6240234375, 13.108642578125, 13.59326171875, 14.077880859375, 14.5625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 7.0, 2.0, 14.0, 8.0, 7.0, 15.0, 17.0, 16.0, 28.0, 18.0, 21.0, 27.0, 31.0, 35.0, 46.0, 30.0, 42.0, 47.0, 48.0, 30.0, 43.0, 45.0, 33.0, 22.0, 46.0, 36.0, 29.0, 39.0, 20.0, 28.0, 24.0, 23.0, 17.0, 21.0, 19.0, 17.0, 7.0, 8.0, 11.0, 4.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-115.20955657958984, -111.4174575805664, -107.62535858154297, -103.83325958251953, -100.0411605834961, -96.24905395507812, -92.45695495605469, -88.66485595703125, -84.87275695800781, -81.08065795898438, -77.28855895996094, -73.4964599609375, -69.70436096191406, -65.91226196289062, -62.12015914916992, -58.32805633544922, -54.53596115112305, -50.74386215209961, -46.95176315307617, -43.15966033935547, -39.36756134033203, -35.575462341308594, -31.783363342285156, -27.991262435913086, -24.19916343688965, -20.40706443786621, -16.61496353149414, -12.822864532470703, -9.03076457977295, -5.238664627075195, -1.4465656280517578, 2.3455352783203125, 6.13763427734375, 9.929734230041504, 13.721834182739258, 17.513933181762695, 21.306034088134766, 25.098133087158203, 28.89023208618164, 32.682334899902344, 36.47443389892578, 40.26653289794922, 44.058631896972656, 47.850730895996094, 51.6428337097168, 55.434932708740234, 59.22703170776367, 63.019134521484375, 66.81123352050781, 70.60333251953125, 74.39543151855469, 78.18753051757812, 81.97962951660156, 85.771728515625, 89.56382751464844, 93.3559341430664, 97.14802551269531, 100.94012451171875, 104.73222351074219, 108.52432250976562, 112.31642150878906, 116.1085205078125, 119.90061950683594, 123.6927261352539, 127.48482513427734]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 6.0, 7.0, 8.0, 8.0, 4.0, 11.0, 10.0, 17.0, 20.0, 16.0, 14.0, 22.0, 28.0, 24.0, 29.0, 36.0, 39.0, 33.0, 43.0, 41.0, 42.0, 35.0, 31.0, 36.0, 48.0, 56.0, 27.0, 30.0, 37.0, 25.0, 29.0, 32.0, 22.0, 25.0, 22.0, 6.0, 15.0, 11.0, 9.0, 12.0, 11.0, 6.0, 5.0, 4.0, 0.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-114.09246063232422, -110.42713928222656, -106.7618179321289, -103.09649658203125, -99.43116760253906, -95.7658462524414, -92.10052490234375, -88.4352035522461, -84.76988220214844, -81.10456085205078, -77.43923950195312, -73.77391052246094, -70.10858917236328, -66.44326782226562, -62.77794647216797, -59.11262512207031, -55.447296142578125, -51.78197479248047, -48.11664962768555, -44.45132827758789, -40.78600311279297, -37.12068176269531, -33.455360412597656, -29.790037155151367, -26.124713897705078, -22.45939064025879, -18.7940673828125, -15.128746032714844, -11.463422775268555, -7.798099517822266, -4.132778167724609, -0.4674549102783203, 3.1978607177734375, 6.863183498382568, 10.5285062789917, 14.193828582763672, 17.85915184020996, 21.52447509765625, 25.189796447753906, 28.855119705200195, 32.520442962646484, 36.18576431274414, 39.85108947753906, 43.51641082763672, 47.181732177734375, 50.8470573425293, 54.51237869262695, 58.177703857421875, 61.84302520751953, 65.50834655761719, 69.17366790771484, 72.8389892578125, 76.50431823730469, 80.16963958740234, 83.8349609375, 87.50028228759766, 91.16560363769531, 94.83092498779297, 98.49624633789062, 102.16157531738281, 105.82689666748047, 109.49221801757812, 113.15753936767578, 116.82286071777344, 120.48818969726562]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [5.0, 5.0, 5.0, 12.0, 18.0, 23.0, 46.0, 70.0, 140.0, 172.0, 288.0, 417.0, 648.0, 996.0, 1465.0, 2159.0, 3203.0, 4466.0, 6454.0, 9165.0, 12336.0, 16493.0, 21846.0, 28099.0, 35095.0, 42933.0, 51227.0, 59027.0, 65501.0, 70630.0, 73486.0, 74230.0, 71984.0, 68188.0, 61929.0, 54869.0, 46892.0, 38818.0, 31660.0, 24924.0, 18911.0, 14466.0, 10727.0, 7539.0, 5421.0, 3768.0, 2608.0, 1793.0, 1178.0, 763.0, 545.0, 356.0, 217.0, 140.0, 87.0, 47.0, 28.0, 14.0, 20.0, 9.0, 7.0, 6.0, 0.0, 2.0], "bins": [-64.4375, -62.375, -60.3125, -58.25, -56.1875, -54.125, -52.0625, -50.0, -47.9375, -45.875, -43.8125, -41.75, -39.6875, -37.625, -35.5625, -33.5, -31.4375, -29.375, -27.3125, -25.25, -23.1875, -21.125, -19.0625, -17.0, -14.9375, -12.875, -10.8125, -8.75, -6.6875, -4.625, -2.5625, -0.5, 1.5625, 3.625, 5.6875, 7.75, 9.8125, 11.875, 13.9375, 16.0, 18.0625, 20.125, 22.1875, 24.25, 26.3125, 28.375, 30.4375, 32.5, 34.5625, 36.625, 38.6875, 40.75, 42.8125, 44.875, 46.9375, 49.0, 51.0625, 53.125, 55.1875, 57.25, 59.3125, 61.375, 63.4375, 65.5, 67.5625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 7.0, 6.0, 8.0, 7.0, 5.0, 10.0, 15.0, 15.0, 19.0, 14.0, 17.0, 25.0, 26.0, 25.0, 26.0, 35.0, 44.0, 34.0, 38.0, 43.0, 42.0, 35.0, 31.0, 34.0, 48.0, 56.0, 26.0, 32.0, 33.0, 27.0, 36.0, 25.0, 23.0, 24.0, 20.0, 11.0, 14.0, 8.0, 10.0, 11.0, 12.0, 7.0, 3.0, 4.0, 0.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-109.875, -106.3291015625, -102.783203125, -99.2373046875, -95.69140625, -92.1455078125, -88.599609375, -85.0537109375, -81.5078125, -77.9619140625, -74.416015625, -70.8701171875, -67.32421875, -63.7783203125, -60.232421875, -56.6865234375, -53.140625, -49.5947265625, -46.048828125, -42.5029296875, -38.95703125, -35.4111328125, -31.865234375, -28.3193359375, -24.7734375, -21.2275390625, -17.681640625, -14.1357421875, -10.58984375, -7.0439453125, -3.498046875, 0.0478515625, 3.59375, 7.1396484375, 10.685546875, 14.2314453125, 17.77734375, 21.3232421875, 24.869140625, 28.4150390625, 31.9609375, 35.5068359375, 39.052734375, 42.5986328125, 46.14453125, 49.6904296875, 53.236328125, 56.7822265625, 60.328125, 63.8740234375, 67.419921875, 70.9658203125, 74.51171875, 78.0576171875, 81.603515625, 85.1494140625, 88.6953125, 92.2412109375, 95.787109375, 99.3330078125, 102.87890625, 106.4248046875, 109.970703125, 113.5166015625, 117.0625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 6.0, 14.0, 18.0, 43.0, 61.0, 79.0, 149.0, 214.0, 369.0, 541.0, 825.0, 1333.0, 1917.0, 2892.0, 4312.0, 6182.0, 8810.0, 12158.0, 16781.0, 22246.0, 28889.0, 36724.0, 45647.0, 53618.0, 61722.0, 69069.0, 74741.0, 77119.0, 76678.0, 74072.0, 69233.0, 61487.0, 53588.0, 44884.0, 36532.0, 28666.0, 22044.0, 16120.0, 11855.0, 8428.0, 6133.0, 4175.0, 2786.0, 1814.0, 1299.0, 817.0, 547.0, 365.0, 209.0, 137.0, 91.0, 42.0, 27.0, 20.0, 14.0, 12.0, 12.0, 2.0, 0.0, 1.0], "bins": [-65.0625, -63.02734375, -60.9921875, -58.95703125, -56.921875, -54.88671875, -52.8515625, -50.81640625, -48.78125, -46.74609375, -44.7109375, -42.67578125, -40.640625, -38.60546875, -36.5703125, -34.53515625, -32.5, -30.46484375, -28.4296875, -26.39453125, -24.359375, -22.32421875, -20.2890625, -18.25390625, -16.21875, -14.18359375, -12.1484375, -10.11328125, -8.078125, -6.04296875, -4.0078125, -1.97265625, 0.0625, 2.09765625, 4.1328125, 6.16796875, 8.203125, 10.23828125, 12.2734375, 14.30859375, 16.34375, 18.37890625, 20.4140625, 22.44921875, 24.484375, 26.51953125, 28.5546875, 30.58984375, 32.625, 34.66015625, 36.6953125, 38.73046875, 40.765625, 42.80078125, 44.8359375, 46.87109375, 48.90625, 50.94140625, 52.9765625, 55.01171875, 57.046875, 59.08203125, 61.1171875, 63.15234375, 65.1875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 9.0, 5.0, 4.0, 4.0, 5.0, 8.0, 10.0, 13.0, 15.0, 17.0, 14.0, 27.0, 21.0, 26.0, 38.0, 26.0, 17.0, 36.0, 33.0, 32.0, 47.0, 46.0, 38.0, 36.0, 40.0, 45.0, 40.0, 48.0, 33.0, 29.0, 24.0, 39.0, 27.0, 26.0, 23.0, 22.0, 11.0, 14.0, 9.0, 9.0, 8.0, 12.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-85.0625, -82.578125, -80.09375, -77.609375, -75.125, -72.640625, -70.15625, -67.671875, -65.1875, -62.703125, -60.21875, -57.734375, -55.25, -52.765625, -50.28125, -47.796875, -45.3125, -42.828125, -40.34375, -37.859375, -35.375, -32.890625, -30.40625, -27.921875, -25.4375, -22.953125, -20.46875, -17.984375, -15.5, -13.015625, -10.53125, -8.046875, -5.5625, -3.078125, -0.59375, 1.890625, 4.375, 6.859375, 9.34375, 11.828125, 14.3125, 16.796875, 19.28125, 21.765625, 24.25, 26.734375, 29.21875, 31.703125, 34.1875, 36.671875, 39.15625, 41.640625, 44.125, 46.609375, 49.09375, 51.578125, 54.0625, 56.546875, 59.03125, 61.515625, 64.0, 66.484375, 68.96875, 71.453125, 73.9375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 6.0, 23.0, 22.0, 29.0, 59.0, 83.0, 118.0, 196.0, 336.0, 510.0, 820.0, 1413.0, 2227.0, 3515.0, 5358.0, 8439.0, 13164.0, 19397.0, 27819.0, 38184.0, 50996.0, 64028.0, 77451.0, 88642.0, 95037.0, 97050.0, 92366.0, 83676.0, 71409.0, 58324.0, 44820.0, 33135.0, 23807.0, 16249.0, 10815.0, 7032.0, 4587.0, 2756.0, 1817.0, 1115.0, 633.0, 424.0, 241.0, 163.0, 96.0, 56.0, 38.0, 30.0, 19.0, 11.0, 12.0, 1.0, 5.0, 2.0, 2.0], "bins": [-36.53125, -35.46533203125, -34.3994140625, -33.33349609375, -32.267578125, -31.20166015625, -30.1357421875, -29.06982421875, -28.00390625, -26.93798828125, -25.8720703125, -24.80615234375, -23.740234375, -22.67431640625, -21.6083984375, -20.54248046875, -19.4765625, -18.41064453125, -17.3447265625, -16.27880859375, -15.212890625, -14.14697265625, -13.0810546875, -12.01513671875, -10.94921875, -9.88330078125, -8.8173828125, -7.75146484375, -6.685546875, -5.61962890625, -4.5537109375, -3.48779296875, -2.421875, -1.35595703125, -0.2900390625, 0.77587890625, 1.841796875, 2.90771484375, 3.9736328125, 5.03955078125, 6.10546875, 7.17138671875, 8.2373046875, 9.30322265625, 10.369140625, 11.43505859375, 12.5009765625, 13.56689453125, 14.6328125, 15.69873046875, 16.7646484375, 17.83056640625, 18.896484375, 19.96240234375, 21.0283203125, 22.09423828125, 23.16015625, 24.22607421875, 25.2919921875, 26.35791015625, 27.423828125, 28.48974609375, 29.5556640625, 30.62158203125, 31.6875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 7.0, 5.0, 4.0, 5.0, 6.0, 8.0, 14.0, 18.0, 19.0, 18.0, 19.0, 24.0, 30.0, 27.0, 43.0, 37.0, 42.0, 55.0, 44.0, 44.0, 44.0, 62.0, 48.0, 47.0, 44.0, 47.0, 37.0, 23.0, 28.0, 22.0, 24.0, 23.0, 20.0, 13.0, 15.0, 9.0, 9.0, 4.0, 3.0, 7.0, 3.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.00499725341796875, -0.004838407039642334, -0.004679560661315918, -0.004520714282989502, -0.004361867904663086, -0.00420302152633667, -0.004044175148010254, -0.003885328769683838, -0.003726482391357422, -0.003567636013031006, -0.00340878963470459, -0.003249943256378174, -0.003091096878051758, -0.002932250499725342, -0.0027734041213989258, -0.0026145577430725098, -0.0024557113647460938, -0.0022968649864196777, -0.0021380186080932617, -0.0019791722297668457, -0.0018203258514404297, -0.0016614794731140137, -0.0015026330947875977, -0.0013437867164611816, -0.0011849403381347656, -0.0010260939598083496, -0.0008672475814819336, -0.0007084012031555176, -0.0005495548248291016, -0.00039070844650268555, -0.00023186206817626953, -7.301568984985352e-05, 8.58306884765625e-05, 0.0002446770668029785, 0.00040352344512939453, 0.0005623698234558105, 0.0007212162017822266, 0.0008800625801086426, 0.0010389089584350586, 0.0011977553367614746, 0.0013566017150878906, 0.0015154480934143066, 0.0016742944717407227, 0.0018331408500671387, 0.0019919872283935547, 0.0021508336067199707, 0.0023096799850463867, 0.0024685263633728027, 0.0026273727416992188, 0.0027862191200256348, 0.0029450654983520508, 0.003103911876678467, 0.003262758255004883, 0.003421604633331299, 0.003580451011657715, 0.003739297389984131, 0.003898143768310547, 0.004056990146636963, 0.004215836524963379, 0.004374682903289795, 0.004533529281616211, 0.004692375659942627, 0.004851222038269043, 0.005010068416595459, 0.005168914794921875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 6.0, 8.0, 15.0, 18.0, 36.0, 64.0, 83.0, 148.0, 234.0, 384.0, 607.0, 960.0, 1573.0, 2492.0, 3788.0, 5718.0, 9079.0, 13166.0, 19014.0, 26802.0, 36420.0, 48627.0, 60716.0, 73414.0, 83883.0, 90988.0, 93301.0, 91284.0, 83961.0, 73325.0, 60507.0, 47940.0, 36258.0, 26849.0, 18987.0, 13232.0, 8785.0, 5758.0, 3732.0, 2370.0, 1475.0, 964.0, 634.0, 376.0, 213.0, 141.0, 96.0, 57.0, 28.0, 19.0, 6.0, 9.0, 6.0, 3.0, 4.0], "bins": [-43.0625, -41.84912109375, -40.6357421875, -39.42236328125, -38.208984375, -36.99560546875, -35.7822265625, -34.56884765625, -33.35546875, -32.14208984375, -30.9287109375, -29.71533203125, -28.501953125, -27.28857421875, -26.0751953125, -24.86181640625, -23.6484375, -22.43505859375, -21.2216796875, -20.00830078125, -18.794921875, -17.58154296875, -16.3681640625, -15.15478515625, -13.94140625, -12.72802734375, -11.5146484375, -10.30126953125, -9.087890625, -7.87451171875, -6.6611328125, -5.44775390625, -4.234375, -3.02099609375, -1.8076171875, -0.59423828125, 0.619140625, 1.83251953125, 3.0458984375, 4.25927734375, 5.47265625, 6.68603515625, 7.8994140625, 9.11279296875, 10.326171875, 11.53955078125, 12.7529296875, 13.96630859375, 15.1796875, 16.39306640625, 17.6064453125, 18.81982421875, 20.033203125, 21.24658203125, 22.4599609375, 23.67333984375, 24.88671875, 26.10009765625, 27.3134765625, 28.52685546875, 29.740234375, 30.95361328125, 32.1669921875, 33.38037109375, 34.59375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 8.0, 3.0, 4.0, 14.0, 15.0, 8.0, 8.0, 18.0, 21.0, 22.0, 20.0, 30.0, 35.0, 35.0, 30.0, 40.0, 30.0, 35.0, 36.0, 40.0, 48.0, 48.0, 52.0, 44.0, 40.0, 45.0, 28.0, 27.0, 43.0, 34.0, 22.0, 20.0, 20.0, 10.0, 13.0, 12.0, 16.0, 9.0, 6.0, 1.0, 3.0, 4.0, 5.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.984375, -16.41162109375, -15.8388671875, -15.26611328125, -14.693359375, -14.12060546875, -13.5478515625, -12.97509765625, -12.40234375, -11.82958984375, -11.2568359375, -10.68408203125, -10.111328125, -9.53857421875, -8.9658203125, -8.39306640625, -7.8203125, -7.24755859375, -6.6748046875, -6.10205078125, -5.529296875, -4.95654296875, -4.3837890625, -3.81103515625, -3.23828125, -2.66552734375, -2.0927734375, -1.52001953125, -0.947265625, -0.37451171875, 0.1982421875, 0.77099609375, 1.34375, 1.91650390625, 2.4892578125, 3.06201171875, 3.634765625, 4.20751953125, 4.7802734375, 5.35302734375, 5.92578125, 6.49853515625, 7.0712890625, 7.64404296875, 8.216796875, 8.78955078125, 9.3623046875, 9.93505859375, 10.5078125, 11.08056640625, 11.6533203125, 12.22607421875, 12.798828125, 13.37158203125, 13.9443359375, 14.51708984375, 15.08984375, 15.66259765625, 16.2353515625, 16.80810546875, 17.380859375, 17.95361328125, 18.5263671875, 19.09912109375, 19.671875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 4.0, 1.0, 5.0, 7.0, 4.0, 6.0, 7.0, 5.0, 15.0, 19.0, 16.0, 15.0, 26.0, 20.0, 29.0, 33.0, 27.0, 28.0, 27.0, 44.0, 40.0, 31.0, 43.0, 45.0, 32.0, 40.0, 35.0, 32.0, 39.0, 36.0, 30.0, 31.0, 25.0, 25.0, 20.0, 23.0, 24.0, 21.0, 16.0, 16.0, 12.0, 7.0, 13.0, 6.0, 4.0, 7.0, 6.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-102.24903106689453, -98.68536376953125, -95.12168884277344, -91.55801391601562, -87.99434661865234, -84.43067932128906, -80.86700439453125, -77.30332946777344, -73.73966217041016, -70.17599487304688, -66.61231994628906, -63.048648834228516, -59.48497772216797, -55.92130661010742, -52.357635498046875, -48.79396438598633, -45.23029327392578, -41.666622161865234, -38.10295104980469, -34.53927993774414, -30.975608825683594, -27.411937713623047, -23.8482666015625, -20.284595489501953, -16.720924377441406, -13.15725326538086, -9.593582153320312, -6.029911041259766, -2.4662399291992188, 1.0974311828613281, 4.661102294921875, 8.224773406982422, 11.7884521484375, 15.352123260498047, 18.915794372558594, 22.47946548461914, 26.043136596679688, 29.606807708740234, 33.17047882080078, 36.73414993286133, 40.297821044921875, 43.86149215698242, 47.42516326904297, 50.988834381103516, 54.55250549316406, 58.11617660522461, 61.679847717285156, 65.24351501464844, 68.80718994140625, 72.37086486816406, 75.93453216552734, 79.49819946289062, 83.06187438964844, 86.62554931640625, 90.18921661376953, 93.75288391113281, 97.31655883789062, 100.88023376464844, 104.44390106201172, 108.007568359375, 111.57124328613281, 115.13491821289062, 118.6985855102539, 122.26225280761719, 125.825927734375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 2.0, 10.0, 7.0, 11.0, 9.0, 8.0, 17.0, 13.0, 20.0, 14.0, 27.0, 24.0, 26.0, 25.0, 29.0, 32.0, 36.0, 28.0, 49.0, 36.0, 36.0, 51.0, 48.0, 43.0, 49.0, 41.0, 41.0, 28.0, 33.0, 32.0, 17.0, 26.0, 22.0, 21.0, 13.0, 14.0, 11.0, 8.0, 9.0, 9.0, 5.0, 6.0, 3.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-118.46182250976562, -114.5029067993164, -110.54398345947266, -106.58506774902344, -102.62614440917969, -98.66722869873047, -94.70831298828125, -90.7493896484375, -86.79046630859375, -82.83155059814453, -78.87262725830078, -74.91371154785156, -70.95478820800781, -66.9958724975586, -63.03695297241211, -59.078033447265625, -55.119117736816406, -51.16019821166992, -47.20127868652344, -43.24236297607422, -39.28343963623047, -35.32452392578125, -31.365604400634766, -27.40668487548828, -23.447765350341797, -19.488845825195312, -15.529927253723145, -11.571008682250977, -7.612089157104492, -3.653169631958008, 0.30574798583984375, 4.264667510986328, 8.223587036132812, 12.182506561279297, 16.14142608642578, 20.100343704223633, 24.059263229370117, 28.0181827545166, 31.977100372314453, 35.93601989746094, 39.89493942260742, 43.853858947753906, 47.81277847290039, 51.771697998046875, 55.730613708496094, 59.689537048339844, 63.64845275878906, 67.60737609863281, 71.56629180908203, 75.52520751953125, 79.484130859375, 83.44304656982422, 87.40196990966797, 91.36088562011719, 95.31980895996094, 99.27872467041016, 103.23764038085938, 107.1965560913086, 111.15547943115234, 115.11439514160156, 119.07331848144531, 123.03223419189453, 126.99114990234375, 130.9500732421875, 134.90899658203125]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 9.0, 9.0, 32.0, 48.0, 70.0, 137.0, 215.0, 403.0, 651.0, 1093.0, 1752.0, 3179.0, 4975.0, 8091.0, 12676.0, 19949.0, 30461.0, 45873.0, 66693.0, 94080.0, 131332.0, 173974.0, 223421.0, 273055.0, 317274.0, 352932.0, 370493.0, 368814.0, 346309.0, 311258.0, 263142.0, 214057.0, 165207.0, 123342.0, 89304.0, 61845.0, 42222.0, 28099.0, 18237.0, 11588.0, 7207.0, 4348.0, 2603.0, 1526.0, 990.0, 556.0, 319.0, 197.0, 116.0, 61.0, 32.0, 16.0, 14.0, 2.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.8125, -76.1767578125, -73.541015625, -70.9052734375, -68.26953125, -65.6337890625, -62.998046875, -60.3623046875, -57.7265625, -55.0908203125, -52.455078125, -49.8193359375, -47.18359375, -44.5478515625, -41.912109375, -39.2763671875, -36.640625, -34.0048828125, -31.369140625, -28.7333984375, -26.09765625, -23.4619140625, -20.826171875, -18.1904296875, -15.5546875, -12.9189453125, -10.283203125, -7.6474609375, -5.01171875, -2.3759765625, 0.259765625, 2.8955078125, 5.53125, 8.1669921875, 10.802734375, 13.4384765625, 16.07421875, 18.7099609375, 21.345703125, 23.9814453125, 26.6171875, 29.2529296875, 31.888671875, 34.5244140625, 37.16015625, 39.7958984375, 42.431640625, 45.0673828125, 47.703125, 50.3388671875, 52.974609375, 55.6103515625, 58.24609375, 60.8818359375, 63.517578125, 66.1533203125, 68.7890625, 71.4248046875, 74.060546875, 76.6962890625, 79.33203125, 81.9677734375, 84.603515625, 87.2392578125, 89.875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 9.0, 12.0, 11.0, 7.0, 17.0, 12.0, 22.0, 16.0, 26.0, 22.0, 27.0, 28.0, 34.0, 27.0, 35.0, 38.0, 39.0, 39.0, 46.0, 42.0, 53.0, 39.0, 43.0, 44.0, 40.0, 28.0, 38.0, 21.0, 22.0, 22.0, 26.0, 18.0, 14.0, 14.0, 9.0, 9.0, 5.0, 12.0, 5.0, 4.0, 3.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-107.75, -104.1494140625, -100.548828125, -96.9482421875, -93.34765625, -89.7470703125, -86.146484375, -82.5458984375, -78.9453125, -75.3447265625, -71.744140625, -68.1435546875, -64.54296875, -60.9423828125, -57.341796875, -53.7412109375, -50.140625, -46.5400390625, -42.939453125, -39.3388671875, -35.73828125, -32.1376953125, -28.537109375, -24.9365234375, -21.3359375, -17.7353515625, -14.134765625, -10.5341796875, -6.93359375, -3.3330078125, 0.267578125, 3.8681640625, 7.46875, 11.0693359375, 14.669921875, 18.2705078125, 21.87109375, 25.4716796875, 29.072265625, 32.6728515625, 36.2734375, 39.8740234375, 43.474609375, 47.0751953125, 50.67578125, 54.2763671875, 57.876953125, 61.4775390625, 65.078125, 68.6787109375, 72.279296875, 75.8798828125, 79.48046875, 83.0810546875, 86.681640625, 90.2822265625, 93.8828125, 97.4833984375, 101.083984375, 104.6845703125, 108.28515625, 111.8857421875, 115.486328125, 119.0869140625, 122.6875]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 11.0, 8.0, 26.0, 46.0, 83.0, 147.0, 270.0, 440.0, 765.0, 1346.0, 2224.0, 3729.0, 6167.0, 9983.0, 15402.0, 23835.0, 35613.0, 52458.0, 74220.0, 100995.0, 136405.0, 174718.0, 216624.0, 257482.0, 294408.0, 322565.0, 338933.0, 339754.0, 325906.0, 300482.0, 265175.0, 223018.0, 181555.0, 141616.0, 106967.0, 78158.0, 55287.0, 38078.0, 25707.0, 16636.0, 10564.0, 6551.0, 4111.0, 2344.0, 1454.0, 872.0, 509.0, 308.0, 156.0, 81.0, 52.0, 30.0, 16.0, 2.0, 7.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-82.4375, -79.78515625, -77.1328125, -74.48046875, -71.828125, -69.17578125, -66.5234375, -63.87109375, -61.21875, -58.56640625, -55.9140625, -53.26171875, -50.609375, -47.95703125, -45.3046875, -42.65234375, -40.0, -37.34765625, -34.6953125, -32.04296875, -29.390625, -26.73828125, -24.0859375, -21.43359375, -18.78125, -16.12890625, -13.4765625, -10.82421875, -8.171875, -5.51953125, -2.8671875, -0.21484375, 2.4375, 5.08984375, 7.7421875, 10.39453125, 13.046875, 15.69921875, 18.3515625, 21.00390625, 23.65625, 26.30859375, 28.9609375, 31.61328125, 34.265625, 36.91796875, 39.5703125, 42.22265625, 44.875, 47.52734375, 50.1796875, 52.83203125, 55.484375, 58.13671875, 60.7890625, 63.44140625, 66.09375, 68.74609375, 71.3984375, 74.05078125, 76.703125, 79.35546875, 82.0078125, 84.66015625, 87.3125]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 7.0, 6.0, 10.0, 8.0, 28.0, 19.0, 29.0, 29.0, 46.0, 44.0, 63.0, 78.0, 70.0, 98.0, 109.0, 122.0, 119.0, 148.0, 171.0, 159.0, 178.0, 192.0, 202.0, 194.0, 199.0, 200.0, 169.0, 177.0, 158.0, 164.0, 124.0, 127.0, 107.0, 78.0, 85.0, 72.0, 59.0, 49.0, 39.0, 30.0, 32.0, 18.0, 19.0, 9.0, 9.0, 8.0, 8.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.3125, -46.72705078125, -45.1416015625, -43.55615234375, -41.970703125, -40.38525390625, -38.7998046875, -37.21435546875, -35.62890625, -34.04345703125, -32.4580078125, -30.87255859375, -29.287109375, -27.70166015625, -26.1162109375, -24.53076171875, -22.9453125, -21.35986328125, -19.7744140625, -18.18896484375, -16.603515625, -15.01806640625, -13.4326171875, -11.84716796875, -10.26171875, -8.67626953125, -7.0908203125, -5.50537109375, -3.919921875, -2.33447265625, -0.7490234375, 0.83642578125, 2.421875, 4.00732421875, 5.5927734375, 7.17822265625, 8.763671875, 10.34912109375, 11.9345703125, 13.52001953125, 15.10546875, 16.69091796875, 18.2763671875, 19.86181640625, 21.447265625, 23.03271484375, 24.6181640625, 26.20361328125, 27.7890625, 29.37451171875, 30.9599609375, 32.54541015625, 34.130859375, 35.71630859375, 37.3017578125, 38.88720703125, 40.47265625, 42.05810546875, 43.6435546875, 45.22900390625, 46.814453125, 48.39990234375, 49.9853515625, 51.57080078125, 53.15625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 4.0, 8.0, 6.0, 16.0, 10.0, 13.0, 12.0, 18.0, 19.0, 27.0, 27.0, 25.0, 22.0, 26.0, 31.0, 38.0, 38.0, 44.0, 38.0, 41.0, 34.0, 40.0, 30.0, 42.0, 38.0, 31.0, 25.0, 33.0, 35.0, 28.0, 29.0, 26.0, 24.0, 16.0, 11.0, 14.0, 15.0, 10.0, 7.0, 14.0, 3.0, 8.0, 4.0, 5.0, 4.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-115.63526916503906, -112.03148651123047, -108.42770385742188, -104.82392120361328, -101.22013854980469, -97.6163558959961, -94.0125732421875, -90.4087905883789, -86.80500793457031, -83.20122528076172, -79.59744262695312, -75.99365997314453, -72.38987731933594, -68.78609466552734, -65.18231201171875, -61.578529357910156, -57.97474670410156, -54.37096405029297, -50.767181396484375, -47.16339874267578, -43.55961608886719, -39.955833435058594, -36.35205078125, -32.748268127441406, -29.144485473632812, -25.54070281982422, -21.936920166015625, -18.33313751220703, -14.729354858398438, -11.125572204589844, -7.52178955078125, -3.9180068969726562, -0.3142242431640625, 3.2895584106445312, 6.893341064453125, 10.497123718261719, 14.100906372070312, 17.704689025878906, 21.3084716796875, 24.912254333496094, 28.516036987304688, 32.11981964111328, 35.723602294921875, 39.32738494873047, 42.93116760253906, 46.534950256347656, 50.13873291015625, 53.742515563964844, 57.34629821777344, 60.95008087158203, 64.55386352539062, 68.15764617919922, 71.76142883300781, 75.3652114868164, 78.968994140625, 82.5727767944336, 86.17655944824219, 89.78034210205078, 93.38412475585938, 96.98790740966797, 100.59169006347656, 104.19547271728516, 107.79925537109375, 111.40303802490234, 115.00682067871094]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 5.0, 6.0, 7.0, 11.0, 17.0, 18.0, 11.0, 17.0, 13.0, 26.0, 24.0, 28.0, 29.0, 34.0, 42.0, 33.0, 37.0, 43.0, 54.0, 52.0, 35.0, 51.0, 49.0, 43.0, 32.0, 37.0, 38.0, 31.0, 28.0, 33.0, 20.0, 16.0, 16.0, 19.0, 8.0, 8.0, 5.0, 6.0, 6.0, 3.0, 0.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-145.06556701660156, -140.752685546875, -136.4398193359375, -132.126953125, -127.81407165527344, -123.5011978149414, -119.18832397460938, -114.87545013427734, -110.56257629394531, -106.24970245361328, -101.93682861328125, -97.62395477294922, -93.31108093261719, -88.99820709228516, -84.68533325195312, -80.3724594116211, -76.05958557128906, -71.74671173095703, -67.433837890625, -63.12096405029297, -58.80809020996094, -54.495216369628906, -50.182342529296875, -45.869468688964844, -41.55659484863281, -37.24372100830078, -32.93084716796875, -28.61797332763672, -24.305099487304688, -19.992225646972656, -15.679351806640625, -11.366477966308594, -7.0536041259765625, -2.7407302856445312, 1.5721435546875, 5.885017395019531, 10.197891235351562, 14.510765075683594, 18.823638916015625, 23.136512756347656, 27.449386596679688, 31.76226043701172, 36.07513427734375, 40.38800811767578, 44.70088195800781, 49.013755798339844, 53.326629638671875, 57.639503479003906, 61.95237731933594, 66.26525115966797, 70.578125, 74.89099884033203, 79.20387268066406, 83.5167465209961, 87.82962036132812, 92.14249420166016, 96.45536804199219, 100.76824188232422, 105.08111572265625, 109.39398956298828, 113.70686340332031, 118.01973724365234, 122.33261108398438, 126.6454849243164, 130.95835876464844]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [5.0, 2.0, 5.0, 6.0, 11.0, 12.0, 26.0, 26.0, 63.0, 88.0, 137.0, 178.0, 273.0, 466.0, 598.0, 888.0, 1346.0, 1996.0, 2913.0, 4436.0, 6698.0, 10091.0, 14967.0, 21982.0, 32285.0, 45672.0, 62732.0, 81315.0, 99160.0, 110771.0, 113581.0, 105673.0, 88868.0, 71053.0, 52485.0, 37507.0, 26080.0, 17951.0, 11660.0, 8066.0, 5392.0, 3691.0, 2378.0, 1611.0, 1105.0, 739.0, 537.0, 335.0, 214.0, 173.0, 124.0, 68.0, 48.0, 36.0, 16.0, 16.0, 5.0, 9.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.28125, -37.9814453125, -36.681640625, -35.3818359375, -34.08203125, -32.7822265625, -31.482421875, -30.1826171875, -28.8828125, -27.5830078125, -26.283203125, -24.9833984375, -23.68359375, -22.3837890625, -21.083984375, -19.7841796875, -18.484375, -17.1845703125, -15.884765625, -14.5849609375, -13.28515625, -11.9853515625, -10.685546875, -9.3857421875, -8.0859375, -6.7861328125, -5.486328125, -4.1865234375, -2.88671875, -1.5869140625, -0.287109375, 1.0126953125, 2.3125, 3.6123046875, 4.912109375, 6.2119140625, 7.51171875, 8.8115234375, 10.111328125, 11.4111328125, 12.7109375, 14.0107421875, 15.310546875, 16.6103515625, 17.91015625, 19.2099609375, 20.509765625, 21.8095703125, 23.109375, 24.4091796875, 25.708984375, 27.0087890625, 28.30859375, 29.6083984375, 30.908203125, 32.2080078125, 33.5078125, 34.8076171875, 36.107421875, 37.4072265625, 38.70703125, 40.0068359375, 41.306640625, 42.6064453125, 43.90625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 5.0, 7.0, 5.0, 11.0, 18.0, 15.0, 14.0, 17.0, 14.0, 25.0, 23.0, 28.0, 26.0, 39.0, 39.0, 33.0, 40.0, 43.0, 54.0, 50.0, 37.0, 47.0, 51.0, 44.0, 36.0, 37.0, 37.0, 28.0, 26.0, 34.0, 21.0, 17.0, 15.0, 18.0, 9.0, 8.0, 5.0, 6.0, 6.0, 2.0, 1.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.625, -140.318359375, -136.01171875, -131.705078125, -127.3984375, -123.091796875, -118.78515625, -114.478515625, -110.171875, -105.865234375, -101.55859375, -97.251953125, -92.9453125, -88.638671875, -84.33203125, -80.025390625, -75.71875, -71.412109375, -67.10546875, -62.798828125, -58.4921875, -54.185546875, -49.87890625, -45.572265625, -41.265625, -36.958984375, -32.65234375, -28.345703125, -24.0390625, -19.732421875, -15.42578125, -11.119140625, -6.8125, -2.505859375, 1.80078125, 6.107421875, 10.4140625, 14.720703125, 19.02734375, 23.333984375, 27.640625, 31.947265625, 36.25390625, 40.560546875, 44.8671875, 49.173828125, 53.48046875, 57.787109375, 62.09375, 66.400390625, 70.70703125, 75.013671875, 79.3203125, 83.626953125, 87.93359375, 92.240234375, 96.546875, 100.853515625, 105.16015625, 109.466796875, 113.7734375, 118.080078125, 122.38671875, 126.693359375, 131.0]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 7.0, 7.0, 4.0, 8.0, 13.0, 21.0, 31.0, 47.0, 67.0, 80.0, 129.0, 188.0, 218.0, 395.0, 518.0, 783.0, 1157.0, 1634.0, 2706.0, 4537.0, 7487.0, 13227.0, 23798.0, 43445.0, 81517.0, 143327.0, 207495.0, 203948.0, 137223.0, 77709.0, 41616.0, 22898.0, 12722.0, 7411.0, 4294.0, 2640.0, 1661.0, 1092.0, 733.0, 530.0, 425.0, 236.0, 177.0, 131.0, 83.0, 51.0, 46.0, 27.0, 17.0, 18.0, 8.0, 7.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-57.3125, -55.3994140625, -53.486328125, -51.5732421875, -49.66015625, -47.7470703125, -45.833984375, -43.9208984375, -42.0078125, -40.0947265625, -38.181640625, -36.2685546875, -34.35546875, -32.4423828125, -30.529296875, -28.6162109375, -26.703125, -24.7900390625, -22.876953125, -20.9638671875, -19.05078125, -17.1376953125, -15.224609375, -13.3115234375, -11.3984375, -9.4853515625, -7.572265625, -5.6591796875, -3.74609375, -1.8330078125, 0.080078125, 1.9931640625, 3.90625, 5.8193359375, 7.732421875, 9.6455078125, 11.55859375, 13.4716796875, 15.384765625, 17.2978515625, 19.2109375, 21.1240234375, 23.037109375, 24.9501953125, 26.86328125, 28.7763671875, 30.689453125, 32.6025390625, 34.515625, 36.4287109375, 38.341796875, 40.2548828125, 42.16796875, 44.0810546875, 45.994140625, 47.9072265625, 49.8203125, 51.7333984375, 53.646484375, 55.5595703125, 57.47265625, 59.3857421875, 61.298828125, 63.2119140625, 65.125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 5.0, 4.0, 5.0, 4.0, 18.0, 13.0, 22.0, 17.0, 18.0, 31.0, 23.0, 24.0, 15.0, 32.0, 41.0, 34.0, 50.0, 41.0, 42.0, 45.0, 50.0, 37.0, 39.0, 35.0, 42.0, 42.0, 36.0, 33.0, 33.0, 34.0, 23.0, 25.0, 14.0, 11.0, 15.0, 8.0, 6.0, 9.0, 8.0, 4.0, 0.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-89.875, -87.19921875, -84.5234375, -81.84765625, -79.171875, -76.49609375, -73.8203125, -71.14453125, -68.46875, -65.79296875, -63.1171875, -60.44140625, -57.765625, -55.08984375, -52.4140625, -49.73828125, -47.0625, -44.38671875, -41.7109375, -39.03515625, -36.359375, -33.68359375, -31.0078125, -28.33203125, -25.65625, -22.98046875, -20.3046875, -17.62890625, -14.953125, -12.27734375, -9.6015625, -6.92578125, -4.25, -1.57421875, 1.1015625, 3.77734375, 6.453125, 9.12890625, 11.8046875, 14.48046875, 17.15625, 19.83203125, 22.5078125, 25.18359375, 27.859375, 30.53515625, 33.2109375, 35.88671875, 38.5625, 41.23828125, 43.9140625, 46.58984375, 49.265625, 51.94140625, 54.6171875, 57.29296875, 59.96875, 62.64453125, 65.3203125, 67.99609375, 70.671875, 73.34765625, 76.0234375, 78.69921875, 81.375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 7.0, 3.0, 10.0, 14.0, 14.0, 22.0, 48.0, 45.0, 74.0, 96.0, 145.0, 219.0, 316.0, 449.0, 600.0, 850.0, 1355.0, 2029.0, 3114.0, 5170.0, 8505.0, 15290.0, 28180.0, 56249.0, 122236.0, 256192.0, 274186.0, 137880.0, 62886.0, 31266.0, 16151.0, 9211.0, 5483.0, 3360.0, 2147.0, 1508.0, 952.0, 712.0, 425.0, 321.0, 223.0, 148.0, 134.0, 103.0, 75.0, 46.0, 41.0, 20.0, 22.0, 15.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 2.0], "bins": [-45.96875, -44.57861328125, -43.1884765625, -41.79833984375, -40.408203125, -39.01806640625, -37.6279296875, -36.23779296875, -34.84765625, -33.45751953125, -32.0673828125, -30.67724609375, -29.287109375, -27.89697265625, -26.5068359375, -25.11669921875, -23.7265625, -22.33642578125, -20.9462890625, -19.55615234375, -18.166015625, -16.77587890625, -15.3857421875, -13.99560546875, -12.60546875, -11.21533203125, -9.8251953125, -8.43505859375, -7.044921875, -5.65478515625, -4.2646484375, -2.87451171875, -1.484375, -0.09423828125, 1.2958984375, 2.68603515625, 4.076171875, 5.46630859375, 6.8564453125, 8.24658203125, 9.63671875, 11.02685546875, 12.4169921875, 13.80712890625, 15.197265625, 16.58740234375, 17.9775390625, 19.36767578125, 20.7578125, 22.14794921875, 23.5380859375, 24.92822265625, 26.318359375, 27.70849609375, 29.0986328125, 30.48876953125, 31.87890625, 33.26904296875, 34.6591796875, 36.04931640625, 37.439453125, 38.82958984375, 40.2197265625, 41.60986328125, 43.0]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 2.0, 4.0, 9.0, 11.0, 14.0, 13.0, 15.0, 24.0, 43.0, 37.0, 55.0, 53.0, 57.0, 66.0, 57.0, 88.0, 55.0, 60.0, 58.0, 53.0, 50.0, 40.0, 32.0, 22.0, 15.0, 20.0, 8.0, 8.0, 11.0, 6.0, 5.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0025730133056640625, -0.0025026053190231323, -0.002432197332382202, -0.002361789345741272, -0.002291381359100342, -0.0022209733724594116, -0.0021505653858184814, -0.0020801573991775513, -0.002009749412536621, -0.001939341425895691, -0.0018689334392547607, -0.0017985254526138306, -0.0017281174659729004, -0.0016577094793319702, -0.00158730149269104, -0.0015168935060501099, -0.0014464855194091797, -0.0013760775327682495, -0.0013056695461273193, -0.0012352615594863892, -0.001164853572845459, -0.0010944455862045288, -0.0010240375995635986, -0.0009536296129226685, -0.0008832216262817383, -0.0008128136396408081, -0.0007424056529998779, -0.0006719976663589478, -0.0006015896797180176, -0.0005311816930770874, -0.0004607737064361572, -0.00039036571979522705, -0.0003199577331542969, -0.0002495497465133667, -0.00017914175987243652, -0.00010873377323150635, -3.832578659057617e-05, 3.2082200050354004e-05, 0.00010249018669128418, 0.00017289817333221436, 0.00024330615997314453, 0.0003137141466140747, 0.0003841221332550049, 0.00045453011989593506, 0.0005249381065368652, 0.0005953460931777954, 0.0006657540798187256, 0.0007361620664596558, 0.0008065700531005859, 0.0008769780397415161, 0.0009473860263824463, 0.0010177940130233765, 0.0010882019996643066, 0.0011586099863052368, 0.001229017972946167, 0.0012994259595870972, 0.0013698339462280273, 0.0014402419328689575, 0.0015106499195098877, 0.0015810579061508179, 0.001651465892791748, 0.0017218738794326782, 0.0017922818660736084, 0.0018626898527145386, 0.0019330978393554688]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 6.0, 6.0, 12.0, 24.0, 23.0, 44.0, 73.0, 85.0, 137.0, 259.0, 329.0, 477.0, 785.0, 1208.0, 1902.0, 2910.0, 4625.0, 7575.0, 12276.0, 20642.0, 34734.0, 56122.0, 87336.0, 124478.0, 152532.0, 156412.0, 131471.0, 94413.0, 61136.0, 37873.0, 22562.0, 13626.0, 8451.0, 5056.0, 3194.0, 2006.0, 1327.0, 858.0, 516.0, 367.0, 226.0, 154.0, 111.0, 80.0, 32.0, 32.0, 22.0, 11.0, 7.0, 10.0, 6.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-52.4375, -50.85302734375, -49.2685546875, -47.68408203125, -46.099609375, -44.51513671875, -42.9306640625, -41.34619140625, -39.76171875, -38.17724609375, -36.5927734375, -35.00830078125, -33.423828125, -31.83935546875, -30.2548828125, -28.67041015625, -27.0859375, -25.50146484375, -23.9169921875, -22.33251953125, -20.748046875, -19.16357421875, -17.5791015625, -15.99462890625, -14.41015625, -12.82568359375, -11.2412109375, -9.65673828125, -8.072265625, -6.48779296875, -4.9033203125, -3.31884765625, -1.734375, -0.14990234375, 1.4345703125, 3.01904296875, 4.603515625, 6.18798828125, 7.7724609375, 9.35693359375, 10.94140625, 12.52587890625, 14.1103515625, 15.69482421875, 17.279296875, 18.86376953125, 20.4482421875, 22.03271484375, 23.6171875, 25.20166015625, 26.7861328125, 28.37060546875, 29.955078125, 31.53955078125, 33.1240234375, 34.70849609375, 36.29296875, 37.87744140625, 39.4619140625, 41.04638671875, 42.630859375, 44.21533203125, 45.7998046875, 47.38427734375, 48.96875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 0.0, 2.0, 3.0, 9.0, 7.0, 5.0, 10.0, 10.0, 17.0, 14.0, 17.0, 28.0, 46.0, 43.0, 54.0, 64.0, 77.0, 65.0, 66.0, 75.0, 67.0, 64.0, 62.0, 38.0, 39.0, 31.0, 19.0, 18.0, 12.0, 8.0, 6.0, 4.0, 7.0, 1.0, 7.0, 4.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.03125, -21.32958984375, -20.6279296875, -19.92626953125, -19.224609375, -18.52294921875, -17.8212890625, -17.11962890625, -16.41796875, -15.71630859375, -15.0146484375, -14.31298828125, -13.611328125, -12.90966796875, -12.2080078125, -11.50634765625, -10.8046875, -10.10302734375, -9.4013671875, -8.69970703125, -7.998046875, -7.29638671875, -6.5947265625, -5.89306640625, -5.19140625, -4.48974609375, -3.7880859375, -3.08642578125, -2.384765625, -1.68310546875, -0.9814453125, -0.27978515625, 0.421875, 1.12353515625, 1.8251953125, 2.52685546875, 3.228515625, 3.93017578125, 4.6318359375, 5.33349609375, 6.03515625, 6.73681640625, 7.4384765625, 8.14013671875, 8.841796875, 9.54345703125, 10.2451171875, 10.94677734375, 11.6484375, 12.35009765625, 13.0517578125, 13.75341796875, 14.455078125, 15.15673828125, 15.8583984375, 16.56005859375, 17.26171875, 17.96337890625, 18.6650390625, 19.36669921875, 20.068359375, 20.77001953125, 21.4716796875, 22.17333984375, 22.875]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 3.0, 3.0, 7.0, 7.0, 16.0, 10.0, 12.0, 8.0, 20.0, 20.0, 19.0, 20.0, 22.0, 26.0, 30.0, 25.0, 21.0, 32.0, 43.0, 41.0, 39.0, 27.0, 38.0, 45.0, 36.0, 34.0, 41.0, 36.0, 23.0, 29.0, 36.0, 23.0, 25.0, 20.0, 32.0, 21.0, 15.0, 13.0, 14.0, 11.0, 8.0, 15.0, 7.0, 2.0, 8.0, 6.0, 3.0, 1.0, 1.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-108.71739959716797, -105.21744537353516, -101.71749114990234, -98.21753692626953, -94.71758270263672, -91.2176284790039, -87.7176742553711, -84.21772003173828, -80.71776580810547, -77.21781158447266, -73.71785736083984, -70.21790313720703, -66.71794891357422, -63.217994689941406, -59.718040466308594, -56.21808624267578, -52.71813201904297, -49.218177795410156, -45.718223571777344, -42.21826934814453, -38.71831512451172, -35.218360900878906, -31.718406677246094, -28.21845245361328, -24.71849822998047, -21.218544006347656, -17.718589782714844, -14.218635559082031, -10.718681335449219, -7.218727111816406, -3.7187728881835938, -0.21881866455078125, 3.2811355590820312, 6.781089782714844, 10.281044006347656, 13.780998229980469, 17.28095245361328, 20.780906677246094, 24.280860900878906, 27.78081512451172, 31.28076934814453, 34.780723571777344, 38.280677795410156, 41.78063201904297, 45.28058624267578, 48.780540466308594, 52.280494689941406, 55.78044891357422, 59.28040313720703, 62.780357360839844, 66.28031158447266, 69.78026580810547, 73.28022003173828, 76.7801742553711, 80.2801284790039, 83.78008270263672, 87.28003692626953, 90.77999114990234, 94.27994537353516, 97.77989959716797, 101.27985382080078, 104.7798080444336, 108.2797622680664, 111.77971649169922, 115.27967071533203]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 9.0, 8.0, 10.0, 13.0, 14.0, 12.0, 18.0, 14.0, 20.0, 20.0, 28.0, 36.0, 27.0, 35.0, 35.0, 29.0, 45.0, 43.0, 39.0, 41.0, 44.0, 52.0, 37.0, 46.0, 35.0, 38.0, 30.0, 37.0, 15.0, 29.0, 31.0, 18.0, 15.0, 15.0, 11.0, 12.0, 7.0, 5.0, 4.0, 6.0, 3.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-141.22442626953125, -137.1237335205078, -133.0230255126953, -128.92233276367188, -124.8216323852539, -120.72093200683594, -116.6202392578125, -112.51953887939453, -108.41883850097656, -104.3181381225586, -100.21743774414062, -96.11674499511719, -92.01604461669922, -87.91534423828125, -83.81465148925781, -79.71395111083984, -75.61325073242188, -71.5125503540039, -67.41184997558594, -63.3111572265625, -59.21045684814453, -55.10975646972656, -51.00905990600586, -46.908363342285156, -42.80766296386719, -38.70696258544922, -34.606266021728516, -30.50556755065918, -26.404869079589844, -22.304170608520508, -18.203472137451172, -14.102773666381836, -10.002067565917969, -5.901369094848633, -1.8006706237792969, 2.300027847290039, 6.400726318359375, 10.501424789428711, 14.602123260498047, 18.702821731567383, 22.80352020263672, 26.904218673706055, 31.00491714477539, 35.105613708496094, 39.20631408691406, 43.30701446533203, 47.407711029052734, 51.50840759277344, 55.609107971191406, 59.709808349609375, 63.81050491333008, 67.91120147705078, 72.01190185546875, 76.11260223388672, 80.21330261230469, 84.31399536132812, 88.4146957397461, 92.51539611816406, 96.6160888671875, 100.71678924560547, 104.81748962402344, 108.9181900024414, 113.01889038085938, 117.11958312988281, 121.22028350830078]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 9.0, 13.0, 22.0, 43.0, 63.0, 119.0, 190.0, 333.0, 584.0, 983.0, 1491.0, 2424.0, 3831.0, 6259.0, 9249.0, 13829.0, 19924.0, 27355.0, 36915.0, 47906.0, 59038.0, 70305.0, 79769.0, 86582.0, 88838.0, 87556.0, 82044.0, 72999.0, 62170.0, 51024.0, 40080.0, 30388.0, 21874.0, 15138.0, 10389.0, 6906.0, 4527.0, 2931.0, 1819.0, 1094.0, 662.0, 392.0, 203.0, 124.0, 73.0, 38.0, 21.0, 14.0, 10.0, 7.0, 7.0, 1.0, 0.0, 0.0, 1.0], "bins": [-82.4375, -79.9873046875, -77.537109375, -75.0869140625, -72.63671875, -70.1865234375, -67.736328125, -65.2861328125, -62.8359375, -60.3857421875, -57.935546875, -55.4853515625, -53.03515625, -50.5849609375, -48.134765625, -45.6845703125, -43.234375, -40.7841796875, -38.333984375, -35.8837890625, -33.43359375, -30.9833984375, -28.533203125, -26.0830078125, -23.6328125, -21.1826171875, -18.732421875, -16.2822265625, -13.83203125, -11.3818359375, -8.931640625, -6.4814453125, -4.03125, -1.5810546875, 0.869140625, 3.3193359375, 5.76953125, 8.2197265625, 10.669921875, 13.1201171875, 15.5703125, 18.0205078125, 20.470703125, 22.9208984375, 25.37109375, 27.8212890625, 30.271484375, 32.7216796875, 35.171875, 37.6220703125, 40.072265625, 42.5224609375, 44.97265625, 47.4228515625, 49.873046875, 52.3232421875, 54.7734375, 57.2236328125, 59.673828125, 62.1240234375, 64.57421875, 67.0244140625, 69.474609375, 71.9248046875, 74.375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 7.0, 10.0, 6.0, 12.0, 14.0, 14.0, 12.0, 16.0, 17.0, 18.0, 23.0, 32.0, 31.0, 28.0, 34.0, 32.0, 34.0, 47.0, 43.0, 37.0, 45.0, 40.0, 51.0, 38.0, 46.0, 32.0, 40.0, 30.0, 36.0, 16.0, 33.0, 25.0, 16.0, 15.0, 16.0, 11.0, 12.0, 7.0, 5.0, 4.0, 5.0, 4.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-136.375, -132.4052734375, -128.435546875, -124.4658203125, -120.49609375, -116.5263671875, -112.556640625, -108.5869140625, -104.6171875, -100.6474609375, -96.677734375, -92.7080078125, -88.73828125, -84.7685546875, -80.798828125, -76.8291015625, -72.859375, -68.8896484375, -64.919921875, -60.9501953125, -56.98046875, -53.0107421875, -49.041015625, -45.0712890625, -41.1015625, -37.1318359375, -33.162109375, -29.1923828125, -25.22265625, -21.2529296875, -17.283203125, -13.3134765625, -9.34375, -5.3740234375, -1.404296875, 2.5654296875, 6.53515625, 10.5048828125, 14.474609375, 18.4443359375, 22.4140625, 26.3837890625, 30.353515625, 34.3232421875, 38.29296875, 42.2626953125, 46.232421875, 50.2021484375, 54.171875, 58.1416015625, 62.111328125, 66.0810546875, 70.05078125, 74.0205078125, 77.990234375, 81.9599609375, 85.9296875, 89.8994140625, 93.869140625, 97.8388671875, 101.80859375, 105.7783203125, 109.748046875, 113.7177734375, 117.6875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 8.0, 19.0, 30.0, 65.0, 82.0, 185.0, 320.0, 529.0, 904.0, 1431.0, 2424.0, 3882.0, 6011.0, 9219.0, 13736.0, 19744.0, 27700.0, 36952.0, 47485.0, 59640.0, 71244.0, 81354.0, 87340.0, 89722.0, 88468.0, 82628.0, 73545.0, 62450.0, 50560.0, 38733.0, 28772.0, 21039.0, 14724.0, 9877.0, 6658.0, 4250.0, 2688.0, 1643.0, 990.0, 593.0, 392.0, 214.0, 130.0, 77.0, 34.0, 30.0, 15.0, 16.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-74.125, -71.779296875, -69.43359375, -67.087890625, -64.7421875, -62.396484375, -60.05078125, -57.705078125, -55.359375, -53.013671875, -50.66796875, -48.322265625, -45.9765625, -43.630859375, -41.28515625, -38.939453125, -36.59375, -34.248046875, -31.90234375, -29.556640625, -27.2109375, -24.865234375, -22.51953125, -20.173828125, -17.828125, -15.482421875, -13.13671875, -10.791015625, -8.4453125, -6.099609375, -3.75390625, -1.408203125, 0.9375, 3.283203125, 5.62890625, 7.974609375, 10.3203125, 12.666015625, 15.01171875, 17.357421875, 19.703125, 22.048828125, 24.39453125, 26.740234375, 29.0859375, 31.431640625, 33.77734375, 36.123046875, 38.46875, 40.814453125, 43.16015625, 45.505859375, 47.8515625, 50.197265625, 52.54296875, 54.888671875, 57.234375, 59.580078125, 61.92578125, 64.271484375, 66.6171875, 68.962890625, 71.30859375, 73.654296875, 76.0]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 11.0, 6.0, 6.0, 12.0, 16.0, 12.0, 11.0, 16.0, 16.0, 16.0, 19.0, 26.0, 29.0, 36.0, 32.0, 39.0, 32.0, 51.0, 39.0, 48.0, 36.0, 41.0, 33.0, 45.0, 38.0, 46.0, 50.0, 32.0, 27.0, 26.0, 15.0, 15.0, 23.0, 14.0, 17.0, 12.0, 11.0, 7.0, 6.0, 6.0, 8.0, 9.0, 2.0, 3.0, 1.0, 9.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-87.8125, -85.2294921875, -82.646484375, -80.0634765625, -77.48046875, -74.8974609375, -72.314453125, -69.7314453125, -67.1484375, -64.5654296875, -61.982421875, -59.3994140625, -56.81640625, -54.2333984375, -51.650390625, -49.0673828125, -46.484375, -43.9013671875, -41.318359375, -38.7353515625, -36.15234375, -33.5693359375, -30.986328125, -28.4033203125, -25.8203125, -23.2373046875, -20.654296875, -18.0712890625, -15.48828125, -12.9052734375, -10.322265625, -7.7392578125, -5.15625, -2.5732421875, 0.009765625, 2.5927734375, 5.17578125, 7.7587890625, 10.341796875, 12.9248046875, 15.5078125, 18.0908203125, 20.673828125, 23.2568359375, 25.83984375, 28.4228515625, 31.005859375, 33.5888671875, 36.171875, 38.7548828125, 41.337890625, 43.9208984375, 46.50390625, 49.0869140625, 51.669921875, 54.2529296875, 56.8359375, 59.4189453125, 62.001953125, 64.5849609375, 67.16796875, 69.7509765625, 72.333984375, 74.9169921875, 77.5]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [5.0, 3.0, 6.0, 4.0, 12.0, 23.0, 37.0, 46.0, 71.0, 133.0, 185.0, 279.0, 440.0, 701.0, 1099.0, 1680.0, 2693.0, 4035.0, 6107.0, 8990.0, 13179.0, 18673.0, 25696.0, 34453.0, 44360.0, 55399.0, 65298.0, 76011.0, 82705.0, 87111.0, 86788.0, 82803.0, 75059.0, 65218.0, 53664.0, 43068.0, 32766.0, 24444.0, 17420.0, 12528.0, 8718.0, 5753.0, 3810.0, 2574.0, 1643.0, 1061.0, 661.0, 415.0, 263.0, 192.0, 110.0, 61.0, 34.0, 41.0, 19.0, 8.0, 9.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0], "bins": [-29.765625, -28.771240234375, -27.77685546875, -26.782470703125, -25.7880859375, -24.793701171875, -23.79931640625, -22.804931640625, -21.810546875, -20.816162109375, -19.82177734375, -18.827392578125, -17.8330078125, -16.838623046875, -15.84423828125, -14.849853515625, -13.85546875, -12.861083984375, -11.86669921875, -10.872314453125, -9.8779296875, -8.883544921875, -7.88916015625, -6.894775390625, -5.900390625, -4.906005859375, -3.91162109375, -2.917236328125, -1.9228515625, -0.928466796875, 0.06591796875, 1.060302734375, 2.0546875, 3.049072265625, 4.04345703125, 5.037841796875, 6.0322265625, 7.026611328125, 8.02099609375, 9.015380859375, 10.009765625, 11.004150390625, 11.99853515625, 12.992919921875, 13.9873046875, 14.981689453125, 15.97607421875, 16.970458984375, 17.96484375, 18.959228515625, 19.95361328125, 20.947998046875, 21.9423828125, 22.936767578125, 23.93115234375, 24.925537109375, 25.919921875, 26.914306640625, 27.90869140625, 28.903076171875, 29.8974609375, 30.891845703125, 31.88623046875, 32.880615234375, 33.875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 8.0, 8.0, 13.0, 11.0, 16.0, 20.0, 22.0, 19.0, 32.0, 29.0, 42.0, 37.0, 33.0, 38.0, 51.0, 47.0, 44.0, 39.0, 48.0, 49.0, 36.0, 51.0, 42.0, 38.0, 35.0, 37.0, 21.0, 23.0, 17.0, 10.0, 14.0, 18.0, 8.0, 11.0, 7.0, 6.0, 12.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005649566650390625, -0.005496382713317871, -0.005343198776245117, -0.005190014839172363, -0.005036830902099609, -0.0048836469650268555, -0.0047304630279541016, -0.004577279090881348, -0.004424095153808594, -0.00427091121673584, -0.004117727279663086, -0.003964543342590332, -0.003811359405517578, -0.0036581754684448242, -0.0035049915313720703, -0.0033518075942993164, -0.0031986236572265625, -0.0030454397201538086, -0.0028922557830810547, -0.0027390718460083008, -0.002585887908935547, -0.002432703971862793, -0.002279520034790039, -0.002126336097717285, -0.0019731521606445312, -0.0018199682235717773, -0.0016667842864990234, -0.0015136003494262695, -0.0013604164123535156, -0.0012072324752807617, -0.0010540485382080078, -0.0009008646011352539, -0.0007476806640625, -0.0005944967269897461, -0.0004413127899169922, -0.0002881288528442383, -0.00013494491577148438, 1.823902130126953e-05, 0.00017142295837402344, 0.00032460689544677734, 0.00047779083251953125, 0.0006309747695922852, 0.0007841587066650391, 0.000937342643737793, 0.0010905265808105469, 0.0012437105178833008, 0.0013968944549560547, 0.0015500783920288086, 0.0017032623291015625, 0.0018564462661743164, 0.0020096302032470703, 0.0021628141403198242, 0.002315998077392578, 0.002469182014465332, 0.002622365951538086, 0.00277554988861084, 0.0029287338256835938, 0.0030819177627563477, 0.0032351016998291016, 0.0033882856369018555, 0.0035414695739746094, 0.0036946535110473633, 0.003847837448120117, 0.004001021385192871, 0.004154205322265625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 9.0, 14.0, 16.0, 38.0, 51.0, 91.0, 132.0, 179.0, 336.0, 583.0, 815.0, 1376.0, 2171.0, 3295.0, 5050.0, 7660.0, 11434.0, 16626.0, 23582.0, 32736.0, 43426.0, 55029.0, 67766.0, 78457.0, 87254.0, 92231.0, 91102.0, 86317.0, 77752.0, 65754.0, 53978.0, 41648.0, 31396.0, 22587.0, 15904.0, 10972.0, 7400.0, 4749.0, 3110.0, 2017.0, 1287.0, 861.0, 512.0, 326.0, 169.0, 139.0, 83.0, 50.0, 32.0, 23.0, 12.0, 7.0, 3.0, 1.0, 5.0, 1.0, 3.0], "bins": [-40.65625, -39.421875, -38.1875, -36.953125, -35.71875, -34.484375, -33.25, -32.015625, -30.78125, -29.546875, -28.3125, -27.078125, -25.84375, -24.609375, -23.375, -22.140625, -20.90625, -19.671875, -18.4375, -17.203125, -15.96875, -14.734375, -13.5, -12.265625, -11.03125, -9.796875, -8.5625, -7.328125, -6.09375, -4.859375, -3.625, -2.390625, -1.15625, 0.078125, 1.3125, 2.546875, 3.78125, 5.015625, 6.25, 7.484375, 8.71875, 9.953125, 11.1875, 12.421875, 13.65625, 14.890625, 16.125, 17.359375, 18.59375, 19.828125, 21.0625, 22.296875, 23.53125, 24.765625, 26.0, 27.234375, 28.46875, 29.703125, 30.9375, 32.171875, 33.40625, 34.640625, 35.875, 37.109375, 38.34375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 5.0, 10.0, 7.0, 11.0, 8.0, 17.0, 6.0, 16.0, 20.0, 21.0, 20.0, 23.0, 22.0, 34.0, 42.0, 45.0, 30.0, 46.0, 39.0, 49.0, 46.0, 42.0, 34.0, 43.0, 38.0, 46.0, 35.0, 46.0, 25.0, 20.0, 29.0, 14.0, 18.0, 13.0, 16.0, 14.0, 7.0, 7.0, 6.0, 3.0, 9.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.71875, -17.156494140625, -16.59423828125, -16.031982421875, -15.4697265625, -14.907470703125, -14.34521484375, -13.782958984375, -13.220703125, -12.658447265625, -12.09619140625, -11.533935546875, -10.9716796875, -10.409423828125, -9.84716796875, -9.284912109375, -8.72265625, -8.160400390625, -7.59814453125, -7.035888671875, -6.4736328125, -5.911376953125, -5.34912109375, -4.786865234375, -4.224609375, -3.662353515625, -3.10009765625, -2.537841796875, -1.9755859375, -1.413330078125, -0.85107421875, -0.288818359375, 0.2734375, 0.835693359375, 1.39794921875, 1.960205078125, 2.5224609375, 3.084716796875, 3.64697265625, 4.209228515625, 4.771484375, 5.333740234375, 5.89599609375, 6.458251953125, 7.0205078125, 7.582763671875, 8.14501953125, 8.707275390625, 9.26953125, 9.831787109375, 10.39404296875, 10.956298828125, 11.5185546875, 12.080810546875, 12.64306640625, 13.205322265625, 13.767578125, 14.329833984375, 14.89208984375, 15.454345703125, 16.0166015625, 16.578857421875, 17.14111328125, 17.703369140625, 18.265625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 0.0, 4.0, 3.0, 6.0, 8.0, 8.0, 9.0, 6.0, 18.0, 14.0, 16.0, 20.0, 19.0, 21.0, 21.0, 28.0, 34.0, 34.0, 29.0, 38.0, 39.0, 30.0, 54.0, 44.0, 35.0, 36.0, 30.0, 41.0, 30.0, 33.0, 33.0, 35.0, 28.0, 26.0, 24.0, 22.0, 15.0, 17.0, 18.0, 11.0, 7.0, 10.0, 6.0, 7.0, 10.0, 5.0, 7.0, 7.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0], "bins": [-122.96511840820312, -119.38027954101562, -115.79544830322266, -112.21061706542969, -108.62577819824219, -105.04093933105469, -101.45610809326172, -97.87127685546875, -94.28643798828125, -90.70159912109375, -87.11676788330078, -83.53193664550781, -79.94709777832031, -76.36225891113281, -72.77742767333984, -69.19259643554688, -65.60775756835938, -62.02292251586914, -58.438087463378906, -54.85325241088867, -51.26841735839844, -47.6835823059082, -44.09874725341797, -40.513912200927734, -36.9290771484375, -33.344242095947266, -29.75940704345703, -26.174571990966797, -22.589736938476562, -19.004901885986328, -15.420066833496094, -11.83523178100586, -8.250396728515625, -4.665561676025391, -1.0807266235351562, 2.504108428955078, 6.0889434814453125, 9.673778533935547, 13.258613586425781, 16.843448638916016, 20.42828369140625, 24.013118743896484, 27.59795379638672, 31.182788848876953, 34.76762390136719, 38.35245895385742, 41.937294006347656, 45.52212905883789, 49.106964111328125, 52.69179916381836, 56.276634216308594, 59.86146926879883, 63.44630432128906, 67.03114318847656, 70.61597442626953, 74.2008056640625, 77.78564453125, 81.3704833984375, 84.95531463623047, 88.54014587402344, 92.12498474121094, 95.70982360839844, 99.2946548461914, 102.87948608398438, 106.46432495117188]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 7.0, 5.0, 5.0, 7.0, 16.0, 9.0, 17.0, 15.0, 16.0, 19.0, 15.0, 24.0, 33.0, 24.0, 33.0, 42.0, 36.0, 42.0, 37.0, 51.0, 42.0, 37.0, 44.0, 40.0, 34.0, 48.0, 47.0, 30.0, 32.0, 42.0, 32.0, 20.0, 25.0, 20.0, 12.0, 6.0, 9.0, 9.0, 7.0, 4.0, 5.0, 1.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.89109802246094, -129.4365997314453, -124.98210144042969, -120.52760314941406, -116.07310485839844, -111.61860656738281, -107.16410827636719, -102.70960998535156, -98.25511169433594, -93.80061340332031, -89.34611511230469, -84.89161682128906, -80.43711853027344, -75.98262023925781, -71.52812194824219, -67.07362365722656, -62.61912536621094, -58.16462707519531, -53.71012878417969, -49.25563049316406, -44.80113220214844, -40.34663391113281, -35.89213562011719, -31.437637329101562, -26.983139038085938, -22.528640747070312, -18.074142456054688, -13.619644165039062, -9.165145874023438, -4.7106475830078125, -0.2561492919921875, 4.1983489990234375, 8.65283203125, 13.107330322265625, 17.56182861328125, 22.016326904296875, 26.4708251953125, 30.925323486328125, 35.37982177734375, 39.834320068359375, 44.288818359375, 48.743316650390625, 53.19781494140625, 57.652313232421875, 62.1068115234375, 66.56130981445312, 71.01580810546875, 75.47030639648438, 79.9248046875, 84.37930297851562, 88.83380126953125, 93.28829956054688, 97.7427978515625, 102.19729614257812, 106.65179443359375, 111.10629272460938, 115.560791015625, 120.01528930664062, 124.46978759765625, 128.92428588867188, 133.3787841796875, 137.83328247070312, 142.28778076171875, 146.74227905273438, 151.19677734375]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [4.0, 2.0, 9.0, 7.0, 15.0, 33.0, 56.0, 98.0, 157.0, 295.0, 521.0, 894.0, 1568.0, 2614.0, 4349.0, 7015.0, 11589.0, 18141.0, 28325.0, 42669.0, 63693.0, 91694.0, 127245.0, 170718.0, 220748.0, 270710.0, 318020.0, 353830.0, 373188.0, 372409.0, 352937.0, 315639.0, 268281.0, 217296.0, 168664.0, 124984.0, 89560.0, 62474.0, 41865.0, 27147.0, 17558.0, 10920.0, 6631.0, 4035.0, 2384.0, 1418.0, 848.0, 444.0, 261.0, 161.0, 77.0, 54.0, 21.0, 15.0, 3.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.875, -78.0830078125, -75.291015625, -72.4990234375, -69.70703125, -66.9150390625, -64.123046875, -61.3310546875, -58.5390625, -55.7470703125, -52.955078125, -50.1630859375, -47.37109375, -44.5791015625, -41.787109375, -38.9951171875, -36.203125, -33.4111328125, -30.619140625, -27.8271484375, -25.03515625, -22.2431640625, -19.451171875, -16.6591796875, -13.8671875, -11.0751953125, -8.283203125, -5.4912109375, -2.69921875, 0.0927734375, 2.884765625, 5.6767578125, 8.46875, 11.2607421875, 14.052734375, 16.8447265625, 19.63671875, 22.4287109375, 25.220703125, 28.0126953125, 30.8046875, 33.5966796875, 36.388671875, 39.1806640625, 41.97265625, 44.7646484375, 47.556640625, 50.3486328125, 53.140625, 55.9326171875, 58.724609375, 61.5166015625, 64.30859375, 67.1005859375, 69.892578125, 72.6845703125, 75.4765625, 78.2685546875, 81.060546875, 83.8525390625, 86.64453125, 89.4365234375, 92.228515625, 95.0205078125, 97.8125]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 6.0, 4.0, 11.0, 14.0, 9.0, 24.0, 6.0, 20.0, 21.0, 14.0, 21.0, 40.0, 32.0, 22.0, 44.0, 35.0, 45.0, 48.0, 38.0, 43.0, 40.0, 39.0, 42.0, 44.0, 43.0, 42.0, 29.0, 36.0, 33.0, 31.0, 20.0, 27.0, 17.0, 11.0, 5.0, 10.0, 9.0, 6.0, 3.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.8125, -116.7490234375, -112.685546875, -108.6220703125, -104.55859375, -100.4951171875, -96.431640625, -92.3681640625, -88.3046875, -84.2412109375, -80.177734375, -76.1142578125, -72.05078125, -67.9873046875, -63.923828125, -59.8603515625, -55.796875, -51.7333984375, -47.669921875, -43.6064453125, -39.54296875, -35.4794921875, -31.416015625, -27.3525390625, -23.2890625, -19.2255859375, -15.162109375, -11.0986328125, -7.03515625, -2.9716796875, 1.091796875, 5.1552734375, 9.21875, 13.2822265625, 17.345703125, 21.4091796875, 25.47265625, 29.5361328125, 33.599609375, 37.6630859375, 41.7265625, 45.7900390625, 49.853515625, 53.9169921875, 57.98046875, 62.0439453125, 66.107421875, 70.1708984375, 74.234375, 78.2978515625, 82.361328125, 86.4248046875, 90.48828125, 94.5517578125, 98.615234375, 102.6787109375, 106.7421875, 110.8056640625, 114.869140625, 118.9326171875, 122.99609375, 127.0595703125, 131.123046875, 135.1865234375, 139.25]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 6.0, 21.0, 31.0, 68.0, 90.0, 173.0, 259.0, 477.0, 805.0, 1297.0, 2169.0, 3491.0, 5637.0, 8788.0, 13544.0, 20611.0, 30392.0, 43563.0, 61918.0, 84576.0, 113381.0, 145981.0, 182193.0, 221133.0, 256931.0, 287919.0, 311530.0, 323633.0, 321790.0, 308784.0, 283949.0, 252791.0, 214554.0, 177296.0, 140534.0, 109072.0, 81786.0, 59108.0, 41649.0, 28489.0, 19305.0, 12681.0, 8119.0, 5348.0, 3332.0, 2035.0, 1272.0, 742.0, 455.0, 265.0, 132.0, 90.0, 43.0, 28.0, 18.0, 5.0, 3.0, 1.0, 0.0, 3.0], "bins": [-82.8125, -80.21875, -77.625, -75.03125, -72.4375, -69.84375, -67.25, -64.65625, -62.0625, -59.46875, -56.875, -54.28125, -51.6875, -49.09375, -46.5, -43.90625, -41.3125, -38.71875, -36.125, -33.53125, -30.9375, -28.34375, -25.75, -23.15625, -20.5625, -17.96875, -15.375, -12.78125, -10.1875, -7.59375, -5.0, -2.40625, 0.1875, 2.78125, 5.375, 7.96875, 10.5625, 13.15625, 15.75, 18.34375, 20.9375, 23.53125, 26.125, 28.71875, 31.3125, 33.90625, 36.5, 39.09375, 41.6875, 44.28125, 46.875, 49.46875, 52.0625, 54.65625, 57.25, 59.84375, 62.4375, 65.03125, 67.625, 70.21875, 72.8125, 75.40625, 78.0, 80.59375, 83.1875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 5.0, 0.0, 4.0, 4.0, 4.0, 9.0, 23.0, 18.0, 28.0, 45.0, 51.0, 51.0, 67.0, 69.0, 87.0, 112.0, 128.0, 150.0, 158.0, 183.0, 178.0, 210.0, 222.0, 216.0, 228.0, 220.0, 192.0, 226.0, 182.0, 171.0, 128.0, 133.0, 106.0, 96.0, 79.0, 68.0, 63.0, 43.0, 37.0, 28.0, 19.0, 12.0, 6.0, 9.0, 8.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.40625, -52.53173828125, -50.6572265625, -48.78271484375, -46.908203125, -45.03369140625, -43.1591796875, -41.28466796875, -39.41015625, -37.53564453125, -35.6611328125, -33.78662109375, -31.912109375, -30.03759765625, -28.1630859375, -26.28857421875, -24.4140625, -22.53955078125, -20.6650390625, -18.79052734375, -16.916015625, -15.04150390625, -13.1669921875, -11.29248046875, -9.41796875, -7.54345703125, -5.6689453125, -3.79443359375, -1.919921875, -0.04541015625, 1.8291015625, 3.70361328125, 5.578125, 7.45263671875, 9.3271484375, 11.20166015625, 13.076171875, 14.95068359375, 16.8251953125, 18.69970703125, 20.57421875, 22.44873046875, 24.3232421875, 26.19775390625, 28.072265625, 29.94677734375, 31.8212890625, 33.69580078125, 35.5703125, 37.44482421875, 39.3193359375, 41.19384765625, 43.068359375, 44.94287109375, 46.8173828125, 48.69189453125, 50.56640625, 52.44091796875, 54.3154296875, 56.18994140625, 58.064453125, 59.93896484375, 61.8134765625, 63.68798828125, 65.5625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 8.0, 6.0, 0.0, 7.0, 7.0, 8.0, 11.0, 15.0, 11.0, 12.0, 24.0, 18.0, 26.0, 26.0, 19.0, 24.0, 26.0, 26.0, 31.0, 27.0, 35.0, 36.0, 40.0, 39.0, 48.0, 30.0, 39.0, 30.0, 39.0, 33.0, 27.0, 31.0, 27.0, 30.0, 20.0, 17.0, 24.0, 20.0, 11.0, 13.0, 10.0, 12.0, 18.0, 9.0, 7.0, 6.0, 10.0, 0.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 3.0], "bins": [-112.40511322021484, -109.0595703125, -105.71402740478516, -102.36848449707031, -99.02294921875, -95.67739868164062, -92.33186340332031, -88.98632049560547, -85.64077758789062, -82.29523468017578, -78.94969177246094, -75.6041488647461, -72.25860595703125, -68.91307067871094, -65.5675277709961, -62.22198486328125, -58.876441955566406, -55.53089904785156, -52.18535614013672, -48.83981704711914, -45.4942741394043, -42.14873123168945, -38.803192138671875, -35.45764923095703, -32.11210632324219, -28.766563415527344, -25.421022415161133, -22.075481414794922, -18.729938507080078, -15.384395599365234, -12.038854598999023, -8.693313598632812, -5.347770690917969, -2.0022287368774414, 1.343313217163086, 4.688855171203613, 8.03439712524414, 11.379940032958984, 14.725481033325195, 18.071022033691406, 21.41656494140625, 24.762107849121094, 28.107648849487305, 31.453189849853516, 34.79873275756836, 38.1442756652832, 41.48981475830078, 44.835357666015625, 48.18090057373047, 51.52644348144531, 54.871986389160156, 58.217525482177734, 61.56306838989258, 64.90861511230469, 68.254150390625, 71.59969329833984, 74.94523620605469, 78.29077911376953, 81.63632202148438, 84.98186492919922, 88.32740783691406, 91.67294311523438, 95.01848602294922, 98.36402893066406, 101.7095718383789]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 4.0, 4.0, 11.0, 12.0, 10.0, 12.0, 15.0, 15.0, 14.0, 11.0, 25.0, 18.0, 21.0, 34.0, 35.0, 27.0, 36.0, 35.0, 47.0, 37.0, 42.0, 40.0, 44.0, 37.0, 35.0, 42.0, 44.0, 26.0, 38.0, 38.0, 25.0, 28.0, 17.0, 16.0, 17.0, 16.0, 13.0, 13.0, 14.0, 7.0, 6.0, 3.0, 6.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0], "bins": [-138.41529846191406, -134.32073974609375, -130.22618103027344, -126.13162231445312, -122.03706359863281, -117.9425048828125, -113.84794616699219, -109.75338745117188, -105.65882873535156, -101.56427001953125, -97.46971130371094, -93.37515258789062, -89.28059387207031, -85.18603515625, -81.09147644042969, -76.99691772460938, -72.9023666381836, -68.80780792236328, -64.71324920654297, -60.618690490722656, -56.524131774902344, -52.42957305908203, -48.335018157958984, -44.24045944213867, -40.14590072631836, -36.05134201049805, -31.956783294677734, -27.862226486206055, -23.767667770385742, -19.67310905456543, -15.57855224609375, -11.483993530273438, -7.389442443847656, -3.294884204864502, 0.7996740341186523, 4.894231796264648, 8.988790512084961, 13.083349227905273, 17.177906036376953, 21.272464752197266, 25.367023468017578, 29.46158218383789, 33.5561408996582, 37.65069580078125, 41.74525451660156, 45.839813232421875, 49.93437194824219, 54.0289306640625, 58.12348937988281, 62.218048095703125, 66.31260681152344, 70.40716552734375, 74.50172424316406, 78.59628295898438, 82.69084167480469, 86.785400390625, 90.87995910644531, 94.97451782226562, 99.06907653808594, 103.16363525390625, 107.25819396972656, 111.35275268554688, 115.44731140136719, 119.5418701171875, 123.63642120361328]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 4.0, 6.0, 2.0, 4.0, 7.0, 15.0, 29.0, 41.0, 54.0, 81.0, 122.0, 180.0, 268.0, 439.0, 704.0, 1065.0, 1532.0, 2488.0, 3773.0, 5974.0, 8805.0, 13334.0, 19983.0, 29786.0, 42544.0, 58867.0, 78454.0, 96758.0, 111376.0, 114792.0, 108997.0, 94062.0, 74653.0, 56423.0, 40093.0, 27839.0, 18748.0, 12507.0, 8151.0, 5568.0, 3493.0, 2330.0, 1487.0, 938.0, 616.0, 427.0, 232.0, 176.0, 112.0, 72.0, 55.0, 35.0, 23.0, 13.0, 13.0, 6.0, 8.0, 2.0, 1.0, 1.0, 2.0], "bins": [-43.9375, -42.58203125, -41.2265625, -39.87109375, -38.515625, -37.16015625, -35.8046875, -34.44921875, -33.09375, -31.73828125, -30.3828125, -29.02734375, -27.671875, -26.31640625, -24.9609375, -23.60546875, -22.25, -20.89453125, -19.5390625, -18.18359375, -16.828125, -15.47265625, -14.1171875, -12.76171875, -11.40625, -10.05078125, -8.6953125, -7.33984375, -5.984375, -4.62890625, -3.2734375, -1.91796875, -0.5625, 0.79296875, 2.1484375, 3.50390625, 4.859375, 6.21484375, 7.5703125, 8.92578125, 10.28125, 11.63671875, 12.9921875, 14.34765625, 15.703125, 17.05859375, 18.4140625, 19.76953125, 21.125, 22.48046875, 23.8359375, 25.19140625, 26.546875, 27.90234375, 29.2578125, 30.61328125, 31.96875, 33.32421875, 34.6796875, 36.03515625, 37.390625, 38.74609375, 40.1015625, 41.45703125, 42.8125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 4.0, 5.0, 11.0, 13.0, 7.0, 13.0, 15.0, 15.0, 13.0, 12.0, 23.0, 18.0, 21.0, 36.0, 33.0, 27.0, 36.0, 35.0, 50.0, 35.0, 40.0, 38.0, 47.0, 38.0, 35.0, 39.0, 48.0, 25.0, 38.0, 37.0, 27.0, 26.0, 17.0, 17.0, 18.0, 16.0, 14.0, 13.0, 11.0, 10.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0], "bins": [-137.875, -133.7822265625, -129.689453125, -125.5966796875, -121.50390625, -117.4111328125, -113.318359375, -109.2255859375, -105.1328125, -101.0400390625, -96.947265625, -92.8544921875, -88.76171875, -84.6689453125, -80.576171875, -76.4833984375, -72.390625, -68.2978515625, -64.205078125, -60.1123046875, -56.01953125, -51.9267578125, -47.833984375, -43.7412109375, -39.6484375, -35.5556640625, -31.462890625, -27.3701171875, -23.27734375, -19.1845703125, -15.091796875, -10.9990234375, -6.90625, -2.8134765625, 1.279296875, 5.3720703125, 9.46484375, 13.5576171875, 17.650390625, 21.7431640625, 25.8359375, 29.9287109375, 34.021484375, 38.1142578125, 42.20703125, 46.2998046875, 50.392578125, 54.4853515625, 58.578125, 62.6708984375, 66.763671875, 70.8564453125, 74.94921875, 79.0419921875, 83.134765625, 87.2275390625, 91.3203125, 95.4130859375, 99.505859375, 103.5986328125, 107.69140625, 111.7841796875, 115.876953125, 119.9697265625, 124.0625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 8.0, 3.0, 8.0, 25.0, 14.0, 36.0, 46.0, 63.0, 110.0, 125.0, 175.0, 266.0, 402.0, 609.0, 927.0, 1389.0, 2008.0, 3186.0, 5243.0, 8615.0, 14907.0, 26135.0, 47184.0, 84480.0, 143749.0, 201497.0, 195870.0, 133148.0, 77005.0, 42511.0, 23742.0, 13450.0, 7884.0, 4850.0, 3059.0, 1939.0, 1257.0, 854.0, 578.0, 361.0, 251.0, 193.0, 121.0, 93.0, 63.0, 45.0, 27.0, 19.0, 14.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-65.0, -63.025390625, -61.05078125, -59.076171875, -57.1015625, -55.126953125, -53.15234375, -51.177734375, -49.203125, -47.228515625, -45.25390625, -43.279296875, -41.3046875, -39.330078125, -37.35546875, -35.380859375, -33.40625, -31.431640625, -29.45703125, -27.482421875, -25.5078125, -23.533203125, -21.55859375, -19.583984375, -17.609375, -15.634765625, -13.66015625, -11.685546875, -9.7109375, -7.736328125, -5.76171875, -3.787109375, -1.8125, 0.162109375, 2.13671875, 4.111328125, 6.0859375, 8.060546875, 10.03515625, 12.009765625, 13.984375, 15.958984375, 17.93359375, 19.908203125, 21.8828125, 23.857421875, 25.83203125, 27.806640625, 29.78125, 31.755859375, 33.73046875, 35.705078125, 37.6796875, 39.654296875, 41.62890625, 43.603515625, 45.578125, 47.552734375, 49.52734375, 51.501953125, 53.4765625, 55.451171875, 57.42578125, 59.400390625, 61.375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 5.0, 6.0, 7.0, 21.0, 15.0, 21.0, 25.0, 22.0, 19.0, 24.0, 25.0, 34.0, 38.0, 46.0, 51.0, 44.0, 58.0, 49.0, 45.0, 38.0, 39.0, 33.0, 36.0, 33.0, 31.0, 27.0, 29.0, 34.0, 24.0, 21.0, 12.0, 11.0, 16.0, 14.0, 9.0, 10.0, 4.0, 8.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.875, -74.970703125, -72.06640625, -69.162109375, -66.2578125, -63.353515625, -60.44921875, -57.544921875, -54.640625, -51.736328125, -48.83203125, -45.927734375, -43.0234375, -40.119140625, -37.21484375, -34.310546875, -31.40625, -28.501953125, -25.59765625, -22.693359375, -19.7890625, -16.884765625, -13.98046875, -11.076171875, -8.171875, -5.267578125, -2.36328125, 0.541015625, 3.4453125, 6.349609375, 9.25390625, 12.158203125, 15.0625, 17.966796875, 20.87109375, 23.775390625, 26.6796875, 29.583984375, 32.48828125, 35.392578125, 38.296875, 41.201171875, 44.10546875, 47.009765625, 49.9140625, 52.818359375, 55.72265625, 58.626953125, 61.53125, 64.435546875, 67.33984375, 70.244140625, 73.1484375, 76.052734375, 78.95703125, 81.861328125, 84.765625, 87.669921875, 90.57421875, 93.478515625, 96.3828125, 99.287109375, 102.19140625, 105.095703125, 108.0]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 6.0, 0.0, 5.0, 5.0, 10.0, 24.0, 27.0, 28.0, 45.0, 62.0, 100.0, 163.0, 190.0, 292.0, 427.0, 567.0, 806.0, 1140.0, 1781.0, 2623.0, 3777.0, 5938.0, 9409.0, 15593.0, 26525.0, 46654.0, 86383.0, 160444.0, 240253.0, 195461.0, 108814.0, 58351.0, 32175.0, 18455.0, 11381.0, 6878.0, 4433.0, 3031.0, 1983.0, 1266.0, 972.0, 635.0, 451.0, 300.0, 200.0, 156.0, 110.0, 75.0, 52.0, 42.0, 24.0, 10.0, 14.0, 8.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.625, -34.50048828125, -33.3759765625, -32.25146484375, -31.126953125, -30.00244140625, -28.8779296875, -27.75341796875, -26.62890625, -25.50439453125, -24.3798828125, -23.25537109375, -22.130859375, -21.00634765625, -19.8818359375, -18.75732421875, -17.6328125, -16.50830078125, -15.3837890625, -14.25927734375, -13.134765625, -12.01025390625, -10.8857421875, -9.76123046875, -8.63671875, -7.51220703125, -6.3876953125, -5.26318359375, -4.138671875, -3.01416015625, -1.8896484375, -0.76513671875, 0.359375, 1.48388671875, 2.6083984375, 3.73291015625, 4.857421875, 5.98193359375, 7.1064453125, 8.23095703125, 9.35546875, 10.47998046875, 11.6044921875, 12.72900390625, 13.853515625, 14.97802734375, 16.1025390625, 17.22705078125, 18.3515625, 19.47607421875, 20.6005859375, 21.72509765625, 22.849609375, 23.97412109375, 25.0986328125, 26.22314453125, 27.34765625, 28.47216796875, 29.5966796875, 30.72119140625, 31.845703125, 32.97021484375, 34.0947265625, 35.21923828125, 36.34375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 10.0, 4.0, 6.0, 13.0, 7.0, 13.0, 18.0, 24.0, 24.0, 23.0, 40.0, 38.0, 47.0, 41.0, 56.0, 54.0, 58.0, 52.0, 41.0, 58.0, 47.0, 48.0, 42.0, 29.0, 36.0, 32.0, 29.0, 17.0, 17.0, 8.0, 15.0, 10.0, 19.0, 7.0, 6.0, 3.0, 4.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.001956939697265625, -0.0019006282091140747, -0.0018443167209625244, -0.0017880052328109741, -0.0017316937446594238, -0.0016753822565078735, -0.0016190707683563232, -0.001562759280204773, -0.0015064477920532227, -0.0014501363039016724, -0.001393824815750122, -0.0013375133275985718, -0.0012812018394470215, -0.0012248903512954712, -0.001168578863143921, -0.0011122673749923706, -0.0010559558868408203, -0.00099964439868927, -0.0009433329105377197, -0.0008870214223861694, -0.0008307099342346191, -0.0007743984460830688, -0.0007180869579315186, -0.0006617754697799683, -0.000605463981628418, -0.0005491524934768677, -0.0004928410053253174, -0.0004365295171737671, -0.0003802180290222168, -0.0003239065408706665, -0.0002675950527191162, -0.00021128356456756592, -0.00015497207641601562, -9.866058826446533e-05, -4.234910011291504e-05, 1.3962388038635254e-05, 7.027387619018555e-05, 0.00012658536434173584, 0.00018289685249328613, 0.00023920834064483643, 0.0002955198287963867, 0.000351831316947937, 0.0004081428050994873, 0.0004644542932510376, 0.0005207657814025879, 0.0005770772695541382, 0.0006333887577056885, 0.0006897002458572388, 0.0007460117340087891, 0.0008023232221603394, 0.0008586347103118896, 0.0009149461984634399, 0.0009712576866149902, 0.0010275691747665405, 0.0010838806629180908, 0.0011401921510696411, 0.0011965036392211914, 0.0012528151273727417, 0.001309126615524292, 0.0013654381036758423, 0.0014217495918273926, 0.0014780610799789429, 0.0015343725681304932, 0.0015906840562820435, 0.0016469955444335938]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 8.0, 10.0, 13.0, 18.0, 25.0, 43.0, 57.0, 83.0, 149.0, 225.0, 327.0, 521.0, 820.0, 1285.0, 2049.0, 3130.0, 4983.0, 7502.0, 11909.0, 18528.0, 28382.0, 42664.0, 61634.0, 86383.0, 110361.0, 128220.0, 129973.0, 115851.0, 92182.0, 67396.0, 45984.0, 30647.0, 20285.0, 13148.0, 8417.0, 5492.0, 3584.0, 2243.0, 1384.0, 919.0, 607.0, 393.0, 257.0, 159.0, 111.0, 60.0, 55.0, 35.0, 23.0, 9.0, 9.0, 0.0, 3.0, 1.0, 4.0], "bins": [-45.65625, -44.35595703125, -43.0556640625, -41.75537109375, -40.455078125, -39.15478515625, -37.8544921875, -36.55419921875, -35.25390625, -33.95361328125, -32.6533203125, -31.35302734375, -30.052734375, -28.75244140625, -27.4521484375, -26.15185546875, -24.8515625, -23.55126953125, -22.2509765625, -20.95068359375, -19.650390625, -18.35009765625, -17.0498046875, -15.74951171875, -14.44921875, -13.14892578125, -11.8486328125, -10.54833984375, -9.248046875, -7.94775390625, -6.6474609375, -5.34716796875, -4.046875, -2.74658203125, -1.4462890625, -0.14599609375, 1.154296875, 2.45458984375, 3.7548828125, 5.05517578125, 6.35546875, 7.65576171875, 8.9560546875, 10.25634765625, 11.556640625, 12.85693359375, 14.1572265625, 15.45751953125, 16.7578125, 18.05810546875, 19.3583984375, 20.65869140625, 21.958984375, 23.25927734375, 24.5595703125, 25.85986328125, 27.16015625, 28.46044921875, 29.7607421875, 31.06103515625, 32.361328125, 33.66162109375, 34.9619140625, 36.26220703125, 37.5625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 7.0, 6.0, 3.0, 8.0, 9.0, 18.0, 4.0, 16.0, 22.0, 17.0, 26.0, 22.0, 30.0, 37.0, 40.0, 40.0, 36.0, 39.0, 34.0, 45.0, 41.0, 47.0, 49.0, 51.0, 41.0, 30.0, 43.0, 29.0, 29.0, 30.0, 29.0, 20.0, 7.0, 19.0, 13.0, 10.0, 10.0, 10.0, 9.0, 5.0, 9.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0], "bins": [-14.015625, -13.6339111328125, -13.252197265625, -12.8704833984375, -12.48876953125, -12.1070556640625, -11.725341796875, -11.3436279296875, -10.9619140625, -10.5802001953125, -10.198486328125, -9.8167724609375, -9.43505859375, -9.0533447265625, -8.671630859375, -8.2899169921875, -7.908203125, -7.5264892578125, -7.144775390625, -6.7630615234375, -6.38134765625, -5.9996337890625, -5.617919921875, -5.2362060546875, -4.8544921875, -4.4727783203125, -4.091064453125, -3.7093505859375, -3.32763671875, -2.9459228515625, -2.564208984375, -2.1824951171875, -1.80078125, -1.4190673828125, -1.037353515625, -0.6556396484375, -0.27392578125, 0.1077880859375, 0.489501953125, 0.8712158203125, 1.2529296875, 1.6346435546875, 2.016357421875, 2.3980712890625, 2.77978515625, 3.1614990234375, 3.543212890625, 3.9249267578125, 4.306640625, 4.6883544921875, 5.070068359375, 5.4517822265625, 5.83349609375, 6.2152099609375, 6.596923828125, 6.9786376953125, 7.3603515625, 7.7420654296875, 8.123779296875, 8.5054931640625, 8.88720703125, 9.2689208984375, 9.650634765625, 10.0323486328125, 10.4140625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 4.0, 4.0, 4.0, 6.0, 8.0, 8.0, 7.0, 10.0, 18.0, 12.0, 17.0, 22.0, 24.0, 24.0, 24.0, 32.0, 20.0, 25.0, 37.0, 35.0, 27.0, 23.0, 45.0, 49.0, 43.0, 42.0, 29.0, 34.0, 44.0, 29.0, 27.0, 29.0, 33.0, 22.0, 25.0, 26.0, 19.0, 13.0, 10.0, 21.0, 6.0, 16.0, 12.0, 8.0, 7.0, 8.0, 4.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-107.47471618652344, -104.03538513183594, -100.5960464477539, -97.15670776367188, -93.71737670898438, -90.27804565429688, -86.83870697021484, -83.39936828613281, -79.96003723144531, -76.52070617675781, -73.08136749267578, -69.64202880859375, -66.20269775390625, -62.763362884521484, -59.32402801513672, -55.88469314575195, -52.44535827636719, -49.00602340698242, -45.566688537597656, -42.12735366821289, -38.688018798828125, -35.24868392944336, -31.809349060058594, -28.370014190673828, -24.930679321289062, -21.491344451904297, -18.05200958251953, -14.612674713134766, -11.17333984375, -7.734004974365234, -4.294670104980469, -0.8553352355957031, 2.5840072631835938, 6.023342132568359, 9.462677001953125, 12.90201187133789, 16.341346740722656, 19.780681610107422, 23.220016479492188, 26.659351348876953, 30.09868621826172, 33.538021087646484, 36.97735595703125, 40.416690826416016, 43.85602569580078, 47.29536056518555, 50.73469543457031, 54.17403030395508, 57.613365173339844, 61.05270004272461, 64.49203491210938, 67.93136596679688, 71.3707046508789, 74.81004333496094, 78.24937438964844, 81.68870544433594, 85.12804412841797, 88.5673828125, 92.0067138671875, 95.446044921875, 98.88538360595703, 102.32472229003906, 105.76405334472656, 109.20338439941406, 112.6427230834961]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 7.0, 3.0, 4.0, 9.0, 10.0, 12.0, 11.0, 12.0, 18.0, 16.0, 12.0, 16.0, 23.0, 26.0, 28.0, 38.0, 18.0, 41.0, 43.0, 35.0, 47.0, 34.0, 40.0, 46.0, 38.0, 37.0, 44.0, 36.0, 35.0, 38.0, 31.0, 30.0, 28.0, 13.0, 17.0, 19.0, 15.0, 15.0, 11.0, 12.0, 9.0, 9.0, 3.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-138.04246520996094, -133.94769287109375, -129.8529052734375, -125.75813293457031, -121.66336059570312, -117.56858825683594, -113.47380828857422, -109.3790283203125, -105.28425598144531, -101.18948364257812, -97.0947036743164, -92.99992370605469, -88.9051513671875, -84.81037902832031, -80.7155990600586, -76.62081909179688, -72.52604675292969, -68.4312744140625, -64.33649444580078, -60.24171829223633, -56.146942138671875, -52.05216598510742, -47.95738983154297, -43.862613677978516, -39.76783752441406, -35.67306137084961, -31.578285217285156, -27.483509063720703, -23.38873291015625, -19.293956756591797, -15.199180603027344, -11.10440444946289, -7.0096435546875, -2.914867401123047, 1.1799087524414062, 5.274684906005859, 9.369461059570312, 13.464237213134766, 17.55901336669922, 21.653789520263672, 25.748565673828125, 29.843341827392578, 33.93811798095703, 38.032894134521484, 42.12767028808594, 46.22244644165039, 50.317222595214844, 54.4119987487793, 58.50677490234375, 62.6015510559082, 66.69632720947266, 70.79110717773438, 74.88587951660156, 78.98065185546875, 83.07543182373047, 87.17021179199219, 91.26498413085938, 95.35975646972656, 99.45453643798828, 103.54931640625, 107.64408874511719, 111.73886108398438, 115.8336410522461, 119.92842102050781, 124.023193359375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 9.0, 18.0, 21.0, 22.0, 58.0, 66.0, 101.0, 229.0, 388.0, 522.0, 885.0, 1300.0, 2088.0, 3217.0, 4752.0, 6923.0, 10153.0, 14279.0, 19568.0, 25893.0, 34064.0, 42746.0, 51951.0, 61641.0, 69346.0, 76534.0, 79867.0, 80428.0, 78210.0, 72004.0, 65335.0, 56341.0, 46920.0, 37878.0, 29433.0, 22132.0, 16511.0, 11821.0, 8345.0, 5689.0, 3868.0, 2580.0, 1610.0, 1023.0, 690.0, 431.0, 274.0, 173.0, 81.0, 63.0, 31.0, 27.0, 13.0, 5.0, 5.0, 0.0, 2.0, 2.0], "bins": [-74.75, -72.5, -70.25, -68.0, -65.75, -63.5, -61.25, -59.0, -56.75, -54.5, -52.25, -50.0, -47.75, -45.5, -43.25, -41.0, -38.75, -36.5, -34.25, -32.0, -29.75, -27.5, -25.25, -23.0, -20.75, -18.5, -16.25, -14.0, -11.75, -9.5, -7.25, -5.0, -2.75, -0.5, 1.75, 4.0, 6.25, 8.5, 10.75, 13.0, 15.25, 17.5, 19.75, 22.0, 24.25, 26.5, 28.75, 31.0, 33.25, 35.5, 37.75, 40.0, 42.25, 44.5, 46.75, 49.0, 51.25, 53.5, 55.75, 58.0, 60.25, 62.5, 64.75, 67.0, 69.25]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 6.0, 3.0, 4.0, 8.0, 11.0, 10.0, 10.0, 13.0, 19.0, 15.0, 12.0, 17.0, 22.0, 27.0, 27.0, 37.0, 21.0, 40.0, 45.0, 35.0, 48.0, 35.0, 38.0, 45.0, 37.0, 40.0, 43.0, 37.0, 40.0, 30.0, 34.0, 30.0, 27.0, 12.0, 20.0, 17.0, 17.0, 15.0, 10.0, 14.0, 9.0, 6.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0], "bins": [-135.25, -131.2412109375, -127.232421875, -123.2236328125, -119.21484375, -115.2060546875, -111.197265625, -107.1884765625, -103.1796875, -99.1708984375, -95.162109375, -91.1533203125, -87.14453125, -83.1357421875, -79.126953125, -75.1181640625, -71.109375, -67.1005859375, -63.091796875, -59.0830078125, -55.07421875, -51.0654296875, -47.056640625, -43.0478515625, -39.0390625, -35.0302734375, -31.021484375, -27.0126953125, -23.00390625, -18.9951171875, -14.986328125, -10.9775390625, -6.96875, -2.9599609375, 1.048828125, 5.0576171875, 9.06640625, 13.0751953125, 17.083984375, 21.0927734375, 25.1015625, 29.1103515625, 33.119140625, 37.1279296875, 41.13671875, 45.1455078125, 49.154296875, 53.1630859375, 57.171875, 61.1806640625, 65.189453125, 69.1982421875, 73.20703125, 77.2158203125, 81.224609375, 85.2333984375, 89.2421875, 93.2509765625, 97.259765625, 101.2685546875, 105.27734375, 109.2861328125, 113.294921875, 117.3037109375, 121.3125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 10.0, 2.0, 9.0, 26.0, 36.0, 73.0, 95.0, 149.0, 281.0, 419.0, 739.0, 1229.0, 2127.0, 3314.0, 5275.0, 7967.0, 12265.0, 17764.0, 24672.0, 34152.0, 44603.0, 56396.0, 67877.0, 78585.0, 86023.0, 90371.0, 89759.0, 84630.0, 76166.0, 65818.0, 53526.0, 41873.0, 31590.0, 23261.0, 16369.0, 11181.0, 7351.0, 4813.0, 2970.0, 1899.0, 1204.0, 714.0, 384.0, 260.0, 153.0, 78.0, 50.0, 19.0, 21.0, 6.0, 9.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.9375, -71.5439453125, -69.150390625, -66.7568359375, -64.36328125, -61.9697265625, -59.576171875, -57.1826171875, -54.7890625, -52.3955078125, -50.001953125, -47.6083984375, -45.21484375, -42.8212890625, -40.427734375, -38.0341796875, -35.640625, -33.2470703125, -30.853515625, -28.4599609375, -26.06640625, -23.6728515625, -21.279296875, -18.8857421875, -16.4921875, -14.0986328125, -11.705078125, -9.3115234375, -6.91796875, -4.5244140625, -2.130859375, 0.2626953125, 2.65625, 5.0498046875, 7.443359375, 9.8369140625, 12.23046875, 14.6240234375, 17.017578125, 19.4111328125, 21.8046875, 24.1982421875, 26.591796875, 28.9853515625, 31.37890625, 33.7724609375, 36.166015625, 38.5595703125, 40.953125, 43.3466796875, 45.740234375, 48.1337890625, 50.52734375, 52.9208984375, 55.314453125, 57.7080078125, 60.1015625, 62.4951171875, 64.888671875, 67.2822265625, 69.67578125, 72.0693359375, 74.462890625, 76.8564453125, 79.25]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 7.0, 4.0, 8.0, 6.0, 9.0, 16.0, 25.0, 34.0, 21.0, 30.0, 39.0, 41.0, 37.0, 36.0, 48.0, 54.0, 40.0, 44.0, 48.0, 45.0, 53.0, 49.0, 45.0, 27.0, 36.0, 34.0, 34.0, 26.0, 19.0, 20.0, 21.0, 9.0, 11.0, 13.0, 3.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.1875, -85.98046875, -82.7734375, -79.56640625, -76.359375, -73.15234375, -69.9453125, -66.73828125, -63.53125, -60.32421875, -57.1171875, -53.91015625, -50.703125, -47.49609375, -44.2890625, -41.08203125, -37.875, -34.66796875, -31.4609375, -28.25390625, -25.046875, -21.83984375, -18.6328125, -15.42578125, -12.21875, -9.01171875, -5.8046875, -2.59765625, 0.609375, 3.81640625, 7.0234375, 10.23046875, 13.4375, 16.64453125, 19.8515625, 23.05859375, 26.265625, 29.47265625, 32.6796875, 35.88671875, 39.09375, 42.30078125, 45.5078125, 48.71484375, 51.921875, 55.12890625, 58.3359375, 61.54296875, 64.75, 67.95703125, 71.1640625, 74.37109375, 77.578125, 80.78515625, 83.9921875, 87.19921875, 90.40625, 93.61328125, 96.8203125, 100.02734375, 103.234375, 106.44140625, 109.6484375, 112.85546875, 116.0625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 5.0, 9.0, 11.0, 18.0, 23.0, 48.0, 74.0, 139.0, 248.0, 351.0, 652.0, 1128.0, 2023.0, 3215.0, 5240.0, 8073.0, 12721.0, 19058.0, 27278.0, 37531.0, 50985.0, 63990.0, 77322.0, 89154.0, 96301.0, 98352.0, 93708.0, 84819.0, 71958.0, 58644.0, 45183.0, 33110.0, 23416.0, 16064.0, 10417.0, 6670.0, 4235.0, 2567.0, 1553.0, 891.0, 583.0, 326.0, 176.0, 121.0, 69.0, 46.0, 30.0, 10.0, 12.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.9375, -33.74462890625, -32.5517578125, -31.35888671875, -30.166015625, -28.97314453125, -27.7802734375, -26.58740234375, -25.39453125, -24.20166015625, -23.0087890625, -21.81591796875, -20.623046875, -19.43017578125, -18.2373046875, -17.04443359375, -15.8515625, -14.65869140625, -13.4658203125, -12.27294921875, -11.080078125, -9.88720703125, -8.6943359375, -7.50146484375, -6.30859375, -5.11572265625, -3.9228515625, -2.72998046875, -1.537109375, -0.34423828125, 0.8486328125, 2.04150390625, 3.234375, 4.42724609375, 5.6201171875, 6.81298828125, 8.005859375, 9.19873046875, 10.3916015625, 11.58447265625, 12.77734375, 13.97021484375, 15.1630859375, 16.35595703125, 17.548828125, 18.74169921875, 19.9345703125, 21.12744140625, 22.3203125, 23.51318359375, 24.7060546875, 25.89892578125, 27.091796875, 28.28466796875, 29.4775390625, 30.67041015625, 31.86328125, 33.05615234375, 34.2490234375, 35.44189453125, 36.634765625, 37.82763671875, 39.0205078125, 40.21337890625, 41.40625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 3.0, 4.0, 5.0, 2.0, 2.0, 6.0, 11.0, 8.0, 12.0, 9.0, 11.0, 17.0, 18.0, 19.0, 24.0, 29.0, 35.0, 37.0, 39.0, 33.0, 43.0, 50.0, 39.0, 40.0, 33.0, 41.0, 45.0, 47.0, 40.0, 32.0, 44.0, 32.0, 27.0, 22.0, 19.0, 26.0, 21.0, 18.0, 14.0, 12.0, 11.0, 4.0, 4.0, 6.0, 1.0, 6.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.00485992431640625, -0.004708528518676758, -0.004557132720947266, -0.0044057369232177734, -0.004254341125488281, -0.004102945327758789, -0.003951549530029297, -0.0038001537322998047, -0.0036487579345703125, -0.0034973621368408203, -0.003345966339111328, -0.003194570541381836, -0.0030431747436523438, -0.0028917789459228516, -0.0027403831481933594, -0.002588987350463867, -0.002437591552734375, -0.002286195755004883, -0.0021347999572753906, -0.0019834041595458984, -0.0018320083618164062, -0.001680612564086914, -0.0015292167663574219, -0.0013778209686279297, -0.0012264251708984375, -0.0010750293731689453, -0.0009236335754394531, -0.0007722377777099609, -0.0006208419799804688, -0.00046944618225097656, -0.0003180503845214844, -0.0001666545867919922, -1.52587890625e-05, 0.0001361370086669922, 0.0002875328063964844, 0.00043892860412597656, 0.0005903244018554688, 0.0007417201995849609, 0.0008931159973144531, 0.0010445117950439453, 0.0011959075927734375, 0.0013473033905029297, 0.0014986991882324219, 0.001650094985961914, 0.0018014907836914062, 0.0019528865814208984, 0.0021042823791503906, 0.002255678176879883, 0.002407073974609375, 0.002558469772338867, 0.0027098655700683594, 0.0028612613677978516, 0.0030126571655273438, 0.003164052963256836, 0.003315448760986328, 0.0034668445587158203, 0.0036182403564453125, 0.0037696361541748047, 0.003921031951904297, 0.004072427749633789, 0.004223823547363281, 0.0043752193450927734, 0.004526615142822266, 0.004678010940551758, 0.00482940673828125]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 14.0, 14.0, 28.0, 38.0, 56.0, 128.0, 196.0, 311.0, 498.0, 850.0, 1282.0, 2167.0, 3610.0, 5350.0, 8320.0, 12663.0, 18185.0, 26078.0, 36034.0, 47828.0, 60148.0, 72372.0, 83590.0, 90636.0, 93659.0, 91517.0, 84906.0, 74072.0, 61943.0, 49076.0, 37668.0, 27663.0, 19638.0, 13286.0, 9014.0, 5901.0, 3807.0, 2393.0, 1363.0, 888.0, 536.0, 332.0, 214.0, 139.0, 61.0, 28.0, 28.0, 18.0, 8.0, 9.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-40.65625, -39.32666015625, -37.9970703125, -36.66748046875, -35.337890625, -34.00830078125, -32.6787109375, -31.34912109375, -30.01953125, -28.68994140625, -27.3603515625, -26.03076171875, -24.701171875, -23.37158203125, -22.0419921875, -20.71240234375, -19.3828125, -18.05322265625, -16.7236328125, -15.39404296875, -14.064453125, -12.73486328125, -11.4052734375, -10.07568359375, -8.74609375, -7.41650390625, -6.0869140625, -4.75732421875, -3.427734375, -2.09814453125, -0.7685546875, 0.56103515625, 1.890625, 3.22021484375, 4.5498046875, 5.87939453125, 7.208984375, 8.53857421875, 9.8681640625, 11.19775390625, 12.52734375, 13.85693359375, 15.1865234375, 16.51611328125, 17.845703125, 19.17529296875, 20.5048828125, 21.83447265625, 23.1640625, 24.49365234375, 25.8232421875, 27.15283203125, 28.482421875, 29.81201171875, 31.1416015625, 32.47119140625, 33.80078125, 35.13037109375, 36.4599609375, 37.78955078125, 39.119140625, 40.44873046875, 41.7783203125, 43.10791015625, 44.4375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 4.0, 9.0, 12.0, 6.0, 10.0, 13.0, 14.0, 15.0, 29.0, 24.0, 25.0, 30.0, 31.0, 37.0, 39.0, 47.0, 37.0, 57.0, 35.0, 49.0, 45.0, 47.0, 52.0, 33.0, 27.0, 26.0, 36.0, 33.0, 22.0, 23.0, 14.0, 17.0, 12.0, 18.0, 11.0, 15.0, 3.0, 8.0, 4.0, 8.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-18.4375, -17.78759765625, -17.1376953125, -16.48779296875, -15.837890625, -15.18798828125, -14.5380859375, -13.88818359375, -13.23828125, -12.58837890625, -11.9384765625, -11.28857421875, -10.638671875, -9.98876953125, -9.3388671875, -8.68896484375, -8.0390625, -7.38916015625, -6.7392578125, -6.08935546875, -5.439453125, -4.78955078125, -4.1396484375, -3.48974609375, -2.83984375, -2.18994140625, -1.5400390625, -0.89013671875, -0.240234375, 0.40966796875, 1.0595703125, 1.70947265625, 2.359375, 3.00927734375, 3.6591796875, 4.30908203125, 4.958984375, 5.60888671875, 6.2587890625, 6.90869140625, 7.55859375, 8.20849609375, 8.8583984375, 9.50830078125, 10.158203125, 10.80810546875, 11.4580078125, 12.10791015625, 12.7578125, 13.40771484375, 14.0576171875, 14.70751953125, 15.357421875, 16.00732421875, 16.6572265625, 17.30712890625, 17.95703125, 18.60693359375, 19.2568359375, 19.90673828125, 20.556640625, 21.20654296875, 21.8564453125, 22.50634765625, 23.15625]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 7.0, 5.0, 6.0, 5.0, 9.0, 21.0, 13.0, 3.0, 16.0, 16.0, 16.0, 21.0, 23.0, 16.0, 16.0, 32.0, 27.0, 24.0, 42.0, 42.0, 33.0, 32.0, 39.0, 30.0, 38.0, 37.0, 48.0, 37.0, 46.0, 30.0, 32.0, 32.0, 22.0, 19.0, 25.0, 13.0, 18.0, 14.0, 13.0, 11.0, 13.0, 13.0, 10.0, 6.0, 8.0, 7.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0], "bins": [-111.53697967529297, -108.14422607421875, -104.75147247314453, -101.35871887207031, -97.96597290039062, -94.5732192993164, -91.18046569824219, -87.78771209716797, -84.39495849609375, -81.00220489501953, -77.60945129394531, -74.21670532226562, -70.8239517211914, -67.43119812011719, -64.03844451904297, -60.64569091796875, -57.2529411315918, -53.86018753051758, -50.467437744140625, -47.074684143066406, -43.68193054199219, -40.28917694091797, -36.896427154541016, -33.5036735534668, -30.11092185974121, -26.718170166015625, -23.325416564941406, -19.93266487121582, -16.539913177490234, -13.147159576416016, -9.75440788269043, -6.361654281616211, -2.968902587890625, 0.42384982109069824, 3.8166022300720215, 7.209354400634766, 10.602107048034668, 13.99485969543457, 17.387611389160156, 20.780364990234375, 24.17311668395996, 27.565868377685547, 30.958621978759766, 34.35137176513672, 37.74412536621094, 41.136878967285156, 44.529632568359375, 47.922386169433594, 51.31513595581055, 54.707889556884766, 58.10063934326172, 61.49339294433594, 64.88614654541016, 68.27890014648438, 71.67164611816406, 75.06440734863281, 78.4571533203125, 81.84990692138672, 85.24266052246094, 88.63540649414062, 92.02816009521484, 95.42091369628906, 98.81366729736328, 102.2064208984375, 105.59917449951172]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 1.0, 3.0, 6.0, 10.0, 5.0, 10.0, 12.0, 14.0, 9.0, 17.0, 32.0, 31.0, 23.0, 31.0, 31.0, 39.0, 40.0, 39.0, 32.0, 42.0, 37.0, 46.0, 43.0, 43.0, 60.0, 28.0, 46.0, 36.0, 34.0, 26.0, 31.0, 33.0, 18.0, 26.0, 7.0, 13.0, 12.0, 10.0, 8.0, 8.0, 3.0, 4.0, 3.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-158.3901824951172, -153.63934326171875, -148.88848876953125, -144.1376495361328, -139.38681030273438, -134.63597106933594, -129.8851318359375, -125.13427734375, -120.38343811035156, -115.63259887695312, -110.88175201416016, -106.13090515136719, -101.38006591796875, -96.62922668457031, -91.87837982177734, -87.12753295898438, -82.37669372558594, -77.6258544921875, -72.87500762939453, -68.12416076660156, -63.373321533203125, -58.62247848510742, -53.87163543701172, -49.120792388916016, -44.36994934082031, -39.61910629272461, -34.868263244628906, -30.117420196533203, -25.3665771484375, -20.615734100341797, -15.864891052246094, -11.11404800415039, -6.3632049560546875, -1.6123619079589844, 3.1384811401367188, 7.889324188232422, 12.640167236328125, 17.391010284423828, 22.14185333251953, 26.892696380615234, 31.643539428710938, 36.39438247680664, 41.145225524902344, 45.89606857299805, 50.64691162109375, 55.39775466918945, 60.148597717285156, 64.89944458007812, 69.65028381347656, 74.401123046875, 79.15196990966797, 83.90281677246094, 88.65365600585938, 93.40449523925781, 98.15534210205078, 102.90618896484375, 107.65702819824219, 112.40786743164062, 117.1587142944336, 121.90956115722656, 126.660400390625, 131.41123962402344, 136.16207885742188, 140.91293334960938, 145.6637725830078]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 13.0, 23.0, 33.0, 42.0, 112.0, 167.0, 276.0, 442.0, 703.0, 1288.0, 2028.0, 3188.0, 5321.0, 8502.0, 13379.0, 20527.0, 30969.0, 45522.0, 66194.0, 92982.0, 125042.0, 164448.0, 208586.0, 254009.0, 296304.0, 329611.0, 350009.0, 353872.0, 339861.0, 313291.0, 273570.0, 229079.0, 184349.0, 141089.0, 105721.0, 76412.0, 53664.0, 36560.0, 24501.0, 16232.0, 10047.0, 6374.0, 3991.0, 2360.0, 1476.0, 896.0, 521.0, 270.0, 189.0, 111.0, 62.0, 33.0, 24.0, 10.0, 7.0, 2.0, 1.0, 1.0], "bins": [-90.6875, -87.95703125, -85.2265625, -82.49609375, -79.765625, -77.03515625, -74.3046875, -71.57421875, -68.84375, -66.11328125, -63.3828125, -60.65234375, -57.921875, -55.19140625, -52.4609375, -49.73046875, -47.0, -44.26953125, -41.5390625, -38.80859375, -36.078125, -33.34765625, -30.6171875, -27.88671875, -25.15625, -22.42578125, -19.6953125, -16.96484375, -14.234375, -11.50390625, -8.7734375, -6.04296875, -3.3125, -0.58203125, 2.1484375, 4.87890625, 7.609375, 10.33984375, 13.0703125, 15.80078125, 18.53125, 21.26171875, 23.9921875, 26.72265625, 29.453125, 32.18359375, 34.9140625, 37.64453125, 40.375, 43.10546875, 45.8359375, 48.56640625, 51.296875, 54.02734375, 56.7578125, 59.48828125, 62.21875, 64.94921875, 67.6796875, 70.41015625, 73.140625, 75.87109375, 78.6015625, 81.33203125, 84.0625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 1.0, 6.0, 6.0, 7.0, 7.0, 9.0, 14.0, 8.0, 15.0, 15.0, 32.0, 27.0, 22.0, 32.0, 35.0, 36.0, 42.0, 38.0, 30.0, 36.0, 50.0, 41.0, 38.0, 47.0, 50.0, 39.0, 43.0, 40.0, 34.0, 21.0, 36.0, 29.0, 19.0, 23.0, 15.0, 9.0, 12.0, 13.0, 6.0, 9.0, 4.0, 5.0, 2.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.375, -142.984375, -138.59375, -134.203125, -129.8125, -125.421875, -121.03125, -116.640625, -112.25, -107.859375, -103.46875, -99.078125, -94.6875, -90.296875, -85.90625, -81.515625, -77.125, -72.734375, -68.34375, -63.953125, -59.5625, -55.171875, -50.78125, -46.390625, -42.0, -37.609375, -33.21875, -28.828125, -24.4375, -20.046875, -15.65625, -11.265625, -6.875, -2.484375, 1.90625, 6.296875, 10.6875, 15.078125, 19.46875, 23.859375, 28.25, 32.640625, 37.03125, 41.421875, 45.8125, 50.203125, 54.59375, 58.984375, 63.375, 67.765625, 72.15625, 76.546875, 80.9375, 85.328125, 89.71875, 94.109375, 98.5, 102.890625, 107.28125, 111.671875, 116.0625, 120.453125, 124.84375, 129.234375, 133.625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 4.0, 11.0, 13.0, 28.0, 62.0, 109.0, 216.0, 357.0, 561.0, 1000.0, 1650.0, 2789.0, 4511.0, 7321.0, 11797.0, 18038.0, 28021.0, 41214.0, 59518.0, 83848.0, 113828.0, 149967.0, 189349.0, 231464.0, 270053.0, 304576.0, 329590.0, 339247.0, 335237.0, 317754.0, 287825.0, 249814.0, 208608.0, 167293.0, 129865.0, 96191.0, 69976.0, 49027.0, 33496.0, 22177.0, 14265.0, 9309.0, 5717.0, 3491.0, 2130.0, 1264.0, 764.0, 428.0, 227.0, 145.0, 74.0, 25.0, 23.0, 15.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-86.875, -84.0478515625, -81.220703125, -78.3935546875, -75.56640625, -72.7392578125, -69.912109375, -67.0849609375, -64.2578125, -61.4306640625, -58.603515625, -55.7763671875, -52.94921875, -50.1220703125, -47.294921875, -44.4677734375, -41.640625, -38.8134765625, -35.986328125, -33.1591796875, -30.33203125, -27.5048828125, -24.677734375, -21.8505859375, -19.0234375, -16.1962890625, -13.369140625, -10.5419921875, -7.71484375, -4.8876953125, -2.060546875, 0.7666015625, 3.59375, 6.4208984375, 9.248046875, 12.0751953125, 14.90234375, 17.7294921875, 20.556640625, 23.3837890625, 26.2109375, 29.0380859375, 31.865234375, 34.6923828125, 37.51953125, 40.3466796875, 43.173828125, 46.0009765625, 48.828125, 51.6552734375, 54.482421875, 57.3095703125, 60.13671875, 62.9638671875, 65.791015625, 68.6181640625, 71.4453125, 74.2724609375, 77.099609375, 79.9267578125, 82.75390625, 85.5810546875, 88.408203125, 91.2353515625, 94.0625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 9.0, 8.0, 10.0, 17.0, 12.0, 18.0, 23.0, 35.0, 29.0, 35.0, 45.0, 57.0, 69.0, 90.0, 102.0, 99.0, 94.0, 121.0, 125.0, 142.0, 151.0, 170.0, 154.0, 167.0, 174.0, 164.0, 166.0, 177.0, 152.0, 136.0, 157.0, 138.0, 137.0, 126.0, 92.0, 86.0, 103.0, 78.0, 72.0, 52.0, 52.0, 42.0, 35.0, 33.0, 29.0, 17.0, 23.0, 11.0, 12.0, 6.0, 4.0, 10.0, 6.0, 5.0, 1.0, 1.0, 3.0], "bins": [-51.1875, -49.61865234375, -48.0498046875, -46.48095703125, -44.912109375, -43.34326171875, -41.7744140625, -40.20556640625, -38.63671875, -37.06787109375, -35.4990234375, -33.93017578125, -32.361328125, -30.79248046875, -29.2236328125, -27.65478515625, -26.0859375, -24.51708984375, -22.9482421875, -21.37939453125, -19.810546875, -18.24169921875, -16.6728515625, -15.10400390625, -13.53515625, -11.96630859375, -10.3974609375, -8.82861328125, -7.259765625, -5.69091796875, -4.1220703125, -2.55322265625, -0.984375, 0.58447265625, 2.1533203125, 3.72216796875, 5.291015625, 6.85986328125, 8.4287109375, 9.99755859375, 11.56640625, 13.13525390625, 14.7041015625, 16.27294921875, 17.841796875, 19.41064453125, 20.9794921875, 22.54833984375, 24.1171875, 25.68603515625, 27.2548828125, 28.82373046875, 30.392578125, 31.96142578125, 33.5302734375, 35.09912109375, 36.66796875, 38.23681640625, 39.8056640625, 41.37451171875, 42.943359375, 44.51220703125, 46.0810546875, 47.64990234375, 49.21875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 4.0, 7.0, 15.0, 11.0, 7.0, 16.0, 9.0, 13.0, 15.0, 17.0, 22.0, 22.0, 26.0, 21.0, 29.0, 32.0, 43.0, 29.0, 31.0, 39.0, 29.0, 39.0, 32.0, 38.0, 43.0, 34.0, 33.0, 40.0, 30.0, 31.0, 28.0, 28.0, 20.0, 19.0, 23.0, 20.0, 16.0, 11.0, 10.0, 12.0, 8.0, 12.0, 5.0, 7.0, 5.0, 3.0, 4.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-112.55011749267578, -108.86033630371094, -105.1705551147461, -101.48077392578125, -97.79100036621094, -94.1012191772461, -90.41143798828125, -86.7216567993164, -83.03187561035156, -79.34209442138672, -75.65231323242188, -71.96253967285156, -68.27275848388672, -64.58297729492188, -60.89319610595703, -57.20341491699219, -53.513641357421875, -49.82386016845703, -46.13408279418945, -42.44430160522461, -38.75452423095703, -35.06474304199219, -31.374961853027344, -27.685182571411133, -23.995403289794922, -20.30562400817871, -16.6158447265625, -12.926063537597656, -9.236284255981445, -5.546504974365234, -1.8567237854003906, 1.8330554962158203, 5.5228271484375, 9.212606430053711, 12.902386665344238, 16.592166900634766, 20.281946182250977, 23.971725463867188, 27.66150665283203, 31.351285934448242, 35.04106521606445, 38.7308464050293, 42.420623779296875, 46.11040496826172, 49.80018615722656, 53.48996353149414, 57.179744720458984, 60.86952209472656, 64.5593032836914, 68.24908447265625, 71.9388656616211, 75.62864685058594, 79.31842041015625, 83.0082015991211, 86.69798278808594, 90.38776397705078, 94.07754516601562, 97.76732635498047, 101.45710754394531, 105.14688110351562, 108.83666229248047, 112.52644348144531, 116.21622467041016, 119.906005859375, 123.59577941894531]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 8.0, 8.0, 7.0, 11.0, 15.0, 23.0, 19.0, 14.0, 18.0, 20.0, 22.0, 41.0, 26.0, 31.0, 32.0, 36.0, 38.0, 40.0, 33.0, 48.0, 43.0, 53.0, 53.0, 37.0, 38.0, 38.0, 29.0, 36.0, 36.0, 20.0, 20.0, 20.0, 20.0, 21.0, 10.0, 12.0, 8.0, 3.0, 6.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-154.86753845214844, -150.0020751953125, -145.13661193847656, -140.27114868164062, -135.4056854248047, -130.54022216796875, -125.67475128173828, -120.80928802490234, -115.9438247680664, -111.07836151123047, -106.21289825439453, -101.3474349975586, -96.48196411132812, -91.61650085449219, -86.75103759765625, -81.88557434082031, -77.02011108398438, -72.15464782714844, -67.2891845703125, -62.4237174987793, -57.55825424194336, -52.69279098510742, -47.82732391357422, -42.96186065673828, -38.096397399902344, -33.230934143066406, -28.365468978881836, -23.500003814697266, -18.634540557861328, -13.76907730102539, -8.90361213684082, -4.03814697265625, 0.82733154296875, 5.692795753479004, 10.558259963989258, 15.423724174499512, 20.289188385009766, 25.154651641845703, 30.020116806030273, 34.885581970214844, 39.75104522705078, 44.61650848388672, 49.481971740722656, 54.34743881225586, 59.2129020690918, 64.078369140625, 68.94383239746094, 73.80929565429688, 78.67475891113281, 83.54022216796875, 88.40568542480469, 93.27114868164062, 98.13661193847656, 103.0020751953125, 107.86754608154297, 112.7330093383789, 117.59847259521484, 122.46393585205078, 127.32939910888672, 132.1948699951172, 137.06033325195312, 141.92579650878906, 146.791259765625, 151.65672302246094, 156.52218627929688]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 5.0, 3.0, 6.0, 4.0, 6.0, 12.0, 16.0, 15.0, 22.0, 25.0, 45.0, 66.0, 96.0, 178.0, 229.0, 387.0, 729.0, 1428.0, 3441.0, 9106.0, 25812.0, 75159.0, 183868.0, 292662.0, 253777.0, 128202.0, 46773.0, 15966.0, 5735.0, 2289.0, 1036.0, 563.0, 309.0, 184.0, 137.0, 77.0, 59.0, 35.0, 38.0, 25.0, 14.0, 10.0, 10.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.125, -99.412109375, -95.69921875, -91.986328125, -88.2734375, -84.560546875, -80.84765625, -77.134765625, -73.421875, -69.708984375, -65.99609375, -62.283203125, -58.5703125, -54.857421875, -51.14453125, -47.431640625, -43.71875, -40.005859375, -36.29296875, -32.580078125, -28.8671875, -25.154296875, -21.44140625, -17.728515625, -14.015625, -10.302734375, -6.58984375, -2.876953125, 0.8359375, 4.548828125, 8.26171875, 11.974609375, 15.6875, 19.400390625, 23.11328125, 26.826171875, 30.5390625, 34.251953125, 37.96484375, 41.677734375, 45.390625, 49.103515625, 52.81640625, 56.529296875, 60.2421875, 63.955078125, 67.66796875, 71.380859375, 75.09375, 78.806640625, 82.51953125, 86.232421875, 89.9453125, 93.658203125, 97.37109375, 101.083984375, 104.796875, 108.509765625, 112.22265625, 115.935546875, 119.6484375, 123.361328125, 127.07421875, 130.787109375, 134.5]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 7.0, 7.0, 7.0, 12.0, 16.0, 20.0, 21.0, 14.0, 16.0, 21.0, 23.0, 38.0, 29.0, 29.0, 34.0, 30.0, 42.0, 37.0, 36.0, 46.0, 44.0, 51.0, 55.0, 37.0, 38.0, 32.0, 34.0, 40.0, 33.0, 22.0, 20.0, 19.0, 19.0, 22.0, 12.0, 11.0, 7.0, 5.0, 6.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-154.5, -149.65625, -144.8125, -139.96875, -135.125, -130.28125, -125.4375, -120.59375, -115.75, -110.90625, -106.0625, -101.21875, -96.375, -91.53125, -86.6875, -81.84375, -77.0, -72.15625, -67.3125, -62.46875, -57.625, -52.78125, -47.9375, -43.09375, -38.25, -33.40625, -28.5625, -23.71875, -18.875, -14.03125, -9.1875, -4.34375, 0.5, 5.34375, 10.1875, 15.03125, 19.875, 24.71875, 29.5625, 34.40625, 39.25, 44.09375, 48.9375, 53.78125, 58.625, 63.46875, 68.3125, 73.15625, 78.0, 82.84375, 87.6875, 92.53125, 97.375, 102.21875, 107.0625, 111.90625, 116.75, 121.59375, 126.4375, 131.28125, 136.125, 140.96875, 145.8125, 150.65625, 155.5]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 11.0, 9.0, 18.0, 13.0, 28.0, 30.0, 42.0, 34.0, 60.0, 79.0, 124.0, 155.0, 204.0, 313.0, 464.0, 649.0, 1123.0, 1861.0, 3214.0, 5837.0, 11559.0, 24319.0, 54876.0, 122390.0, 233635.0, 271842.0, 168971.0, 78277.0, 34533.0, 15710.0, 7754.0, 4138.0, 2301.0, 1426.0, 787.0, 548.0, 371.0, 245.0, 143.0, 120.0, 76.0, 60.0, 62.0, 38.0, 27.0, 27.0, 15.0, 10.0, 10.0, 2.0, 7.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-87.9375, -85.2080078125, -82.478515625, -79.7490234375, -77.01953125, -74.2900390625, -71.560546875, -68.8310546875, -66.1015625, -63.3720703125, -60.642578125, -57.9130859375, -55.18359375, -52.4541015625, -49.724609375, -46.9951171875, -44.265625, -41.5361328125, -38.806640625, -36.0771484375, -33.34765625, -30.6181640625, -27.888671875, -25.1591796875, -22.4296875, -19.7001953125, -16.970703125, -14.2412109375, -11.51171875, -8.7822265625, -6.052734375, -3.3232421875, -0.59375, 2.1357421875, 4.865234375, 7.5947265625, 10.32421875, 13.0537109375, 15.783203125, 18.5126953125, 21.2421875, 23.9716796875, 26.701171875, 29.4306640625, 32.16015625, 34.8896484375, 37.619140625, 40.3486328125, 43.078125, 45.8076171875, 48.537109375, 51.2666015625, 53.99609375, 56.7255859375, 59.455078125, 62.1845703125, 64.9140625, 67.6435546875, 70.373046875, 73.1025390625, 75.83203125, 78.5615234375, 81.291015625, 84.0205078125, 86.75]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 3.0, 5.0, 8.0, 13.0, 5.0, 7.0, 13.0, 18.0, 12.0, 19.0, 20.0, 28.0, 25.0, 33.0, 29.0, 37.0, 31.0, 39.0, 29.0, 29.0, 36.0, 35.0, 35.0, 32.0, 37.0, 46.0, 36.0, 46.0, 38.0, 37.0, 28.0, 28.0, 24.0, 26.0, 23.0, 17.0, 17.0, 11.0, 16.0, 7.0, 4.0, 8.0, 3.0, 5.0, 3.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-88.75, -85.9150390625, -83.080078125, -80.2451171875, -77.41015625, -74.5751953125, -71.740234375, -68.9052734375, -66.0703125, -63.2353515625, -60.400390625, -57.5654296875, -54.73046875, -51.8955078125, -49.060546875, -46.2255859375, -43.390625, -40.5556640625, -37.720703125, -34.8857421875, -32.05078125, -29.2158203125, -26.380859375, -23.5458984375, -20.7109375, -17.8759765625, -15.041015625, -12.2060546875, -9.37109375, -6.5361328125, -3.701171875, -0.8662109375, 1.96875, 4.8037109375, 7.638671875, 10.4736328125, 13.30859375, 16.1435546875, 18.978515625, 21.8134765625, 24.6484375, 27.4833984375, 30.318359375, 33.1533203125, 35.98828125, 38.8232421875, 41.658203125, 44.4931640625, 47.328125, 50.1630859375, 52.998046875, 55.8330078125, 58.66796875, 61.5029296875, 64.337890625, 67.1728515625, 70.0078125, 72.8427734375, 75.677734375, 78.5126953125, 81.34765625, 84.1826171875, 87.017578125, 89.8525390625, 92.6875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 10.0, 10.0, 17.0, 28.0, 51.0, 53.0, 83.0, 121.0, 172.0, 268.0, 402.0, 564.0, 834.0, 1180.0, 1890.0, 2817.0, 4609.0, 7426.0, 12938.0, 23193.0, 44642.0, 91865.0, 195416.0, 290327.0, 185883.0, 86633.0, 42333.0, 22326.0, 12527.0, 7262.0, 4513.0, 2776.0, 1773.0, 1205.0, 745.0, 512.0, 345.0, 261.0, 186.0, 113.0, 63.0, 62.0, 32.0, 33.0, 20.0, 12.0, 7.0, 8.0, 5.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-43.71875, -42.3720703125, -41.025390625, -39.6787109375, -38.33203125, -36.9853515625, -35.638671875, -34.2919921875, -32.9453125, -31.5986328125, -30.251953125, -28.9052734375, -27.55859375, -26.2119140625, -24.865234375, -23.5185546875, -22.171875, -20.8251953125, -19.478515625, -18.1318359375, -16.78515625, -15.4384765625, -14.091796875, -12.7451171875, -11.3984375, -10.0517578125, -8.705078125, -7.3583984375, -6.01171875, -4.6650390625, -3.318359375, -1.9716796875, -0.625, 0.7216796875, 2.068359375, 3.4150390625, 4.76171875, 6.1083984375, 7.455078125, 8.8017578125, 10.1484375, 11.4951171875, 12.841796875, 14.1884765625, 15.53515625, 16.8818359375, 18.228515625, 19.5751953125, 20.921875, 22.2685546875, 23.615234375, 24.9619140625, 26.30859375, 27.6552734375, 29.001953125, 30.3486328125, 31.6953125, 33.0419921875, 34.388671875, 35.7353515625, 37.08203125, 38.4287109375, 39.775390625, 41.1220703125, 42.46875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 2.0, 6.0, 4.0, 6.0, 13.0, 17.0, 20.0, 23.0, 24.0, 30.0, 38.0, 28.0, 45.0, 36.0, 54.0, 49.0, 51.0, 44.0, 50.0, 45.0, 43.0, 47.0, 44.0, 38.0, 35.0, 35.0, 22.0, 27.0, 27.0, 21.0, 16.0, 11.0, 10.0, 8.0, 9.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018205642700195312, -0.0017643868923187256, -0.00170820951461792, -0.0016520321369171143, -0.0015958547592163086, -0.001539677381515503, -0.0014835000038146973, -0.0014273226261138916, -0.001371145248413086, -0.0013149678707122803, -0.0012587904930114746, -0.001202613115310669, -0.0011464357376098633, -0.0010902583599090576, -0.001034080982208252, -0.0009779036045074463, -0.0009217262268066406, -0.000865548849105835, -0.0008093714714050293, -0.0007531940937042236, -0.000697016716003418, -0.0006408393383026123, -0.0005846619606018066, -0.000528484582901001, -0.0004723072052001953, -0.00041612982749938965, -0.000359952449798584, -0.0003037750720977783, -0.00024759769439697266, -0.000191420316696167, -0.00013524293899536133, -7.906556129455566e-05, -2.288818359375e-05, 3.3289194107055664e-05, 8.946657180786133e-05, 0.000145643949508667, 0.00020182132720947266, 0.0002579987049102783, 0.000314176082611084, 0.00037035346031188965, 0.0004265308380126953, 0.000482708215713501, 0.0005388855934143066, 0.0005950629711151123, 0.000651240348815918, 0.0007074177265167236, 0.0007635951042175293, 0.000819772481918335, 0.0008759498596191406, 0.0009321272373199463, 0.000988304615020752, 0.0010444819927215576, 0.0011006593704223633, 0.001156836748123169, 0.0012130141258239746, 0.0012691915035247803, 0.001325368881225586, 0.0013815462589263916, 0.0014377236366271973, 0.001493901014328003, 0.0015500783920288086, 0.0016062557697296143, 0.00166243314743042, 0.0017186105251312256, 0.0017747879028320312]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 8.0, 5.0, 8.0, 12.0, 21.0, 36.0, 38.0, 63.0, 120.0, 157.0, 265.0, 357.0, 592.0, 900.0, 1495.0, 2398.0, 3960.0, 6687.0, 11504.0, 20084.0, 34838.0, 59580.0, 97523.0, 141086.0, 172145.0, 164967.0, 126759.0, 83266.0, 49847.0, 28928.0, 16768.0, 9633.0, 5644.0, 3354.0, 2034.0, 1255.0, 783.0, 483.0, 334.0, 203.0, 144.0, 100.0, 61.0, 38.0, 22.0, 25.0, 13.0, 10.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0], "bins": [-59.5625, -57.8525390625, -56.142578125, -54.4326171875, -52.72265625, -51.0126953125, -49.302734375, -47.5927734375, -45.8828125, -44.1728515625, -42.462890625, -40.7529296875, -39.04296875, -37.3330078125, -35.623046875, -33.9130859375, -32.203125, -30.4931640625, -28.783203125, -27.0732421875, -25.36328125, -23.6533203125, -21.943359375, -20.2333984375, -18.5234375, -16.8134765625, -15.103515625, -13.3935546875, -11.68359375, -9.9736328125, -8.263671875, -6.5537109375, -4.84375, -3.1337890625, -1.423828125, 0.2861328125, 1.99609375, 3.7060546875, 5.416015625, 7.1259765625, 8.8359375, 10.5458984375, 12.255859375, 13.9658203125, 15.67578125, 17.3857421875, 19.095703125, 20.8056640625, 22.515625, 24.2255859375, 25.935546875, 27.6455078125, 29.35546875, 31.0654296875, 32.775390625, 34.4853515625, 36.1953125, 37.9052734375, 39.615234375, 41.3251953125, 43.03515625, 44.7451171875, 46.455078125, 48.1650390625, 49.875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 4.0, 6.0, 6.0, 9.0, 11.0, 14.0, 13.0, 17.0, 23.0, 28.0, 29.0, 39.0, 37.0, 50.0, 55.0, 51.0, 74.0, 77.0, 54.0, 71.0, 66.0, 41.0, 33.0, 42.0, 35.0, 23.0, 17.0, 14.0, 18.0, 13.0, 6.0, 3.0, 5.0, 7.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-22.40625, -21.8482666015625, -21.290283203125, -20.7322998046875, -20.17431640625, -19.6163330078125, -19.058349609375, -18.5003662109375, -17.9423828125, -17.3843994140625, -16.826416015625, -16.2684326171875, -15.71044921875, -15.1524658203125, -14.594482421875, -14.0364990234375, -13.478515625, -12.9205322265625, -12.362548828125, -11.8045654296875, -11.24658203125, -10.6885986328125, -10.130615234375, -9.5726318359375, -9.0146484375, -8.4566650390625, -7.898681640625, -7.3406982421875, -6.78271484375, -6.2247314453125, -5.666748046875, -5.1087646484375, -4.55078125, -3.9927978515625, -3.434814453125, -2.8768310546875, -2.31884765625, -1.7608642578125, -1.202880859375, -0.6448974609375, -0.0869140625, 0.4710693359375, 1.029052734375, 1.5870361328125, 2.14501953125, 2.7030029296875, 3.260986328125, 3.8189697265625, 4.376953125, 4.9349365234375, 5.492919921875, 6.0509033203125, 6.60888671875, 7.1668701171875, 7.724853515625, 8.2828369140625, 8.8408203125, 9.3988037109375, 9.956787109375, 10.5147705078125, 11.07275390625, 11.6307373046875, 12.188720703125, 12.7467041015625, 13.3046875]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [4.0, 3.0, 0.0, 1.0, 2.0, 5.0, 5.0, 8.0, 6.0, 10.0, 9.0, 11.0, 15.0, 12.0, 9.0, 16.0, 14.0, 14.0, 21.0, 14.0, 29.0, 30.0, 29.0, 28.0, 28.0, 31.0, 37.0, 35.0, 30.0, 37.0, 42.0, 33.0, 24.0, 28.0, 41.0, 48.0, 28.0, 22.0, 42.0, 28.0, 17.0, 23.0, 20.0, 18.0, 17.0, 17.0, 10.0, 8.0, 5.0, 8.0, 8.0, 7.0, 7.0, 2.0, 7.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-107.73114776611328, -104.18449401855469, -100.63784790039062, -97.09119415283203, -93.54454040527344, -89.99789428710938, -86.45124053955078, -82.90458679199219, -79.35794067382812, -75.81128692626953, -72.26464080810547, -68.71798706054688, -65.17133331298828, -61.62468338012695, -58.078033447265625, -54.53137969970703, -50.98472595214844, -47.43807601928711, -43.891422271728516, -40.34477233886719, -36.798118591308594, -33.251468658447266, -29.704818725585938, -26.158166885375977, -22.611515045166016, -19.064863204956055, -15.51821231842041, -11.971561431884766, -8.424909591674805, -4.878257751464844, -1.3316078186035156, 2.2150440216064453, 5.761695861816406, 9.308347702026367, 12.854998588562012, 16.401649475097656, 19.948301315307617, 23.494953155517578, 27.041603088378906, 30.588254928588867, 34.13490676879883, 37.681556701660156, 41.22821044921875, 44.77486038208008, 48.321510314941406, 51.8681640625, 55.41481399536133, 58.961463928222656, 62.50811767578125, 66.05477142333984, 69.6014175415039, 73.1480712890625, 76.6947250366211, 80.24137878417969, 83.78802490234375, 87.33467864990234, 90.88133239746094, 94.42798614501953, 97.9746322631836, 101.52128601074219, 105.06793975830078, 108.61459350585938, 112.16123962402344, 115.70789337158203, 119.2545394897461]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 9.0, 8.0, 6.0, 12.0, 17.0, 16.0, 21.0, 15.0, 16.0, 19.0, 28.0, 33.0, 38.0, 27.0, 25.0, 34.0, 38.0, 40.0, 46.0, 44.0, 36.0, 52.0, 53.0, 43.0, 36.0, 31.0, 47.0, 28.0, 36.0, 18.0, 28.0, 18.0, 17.0, 20.0, 9.0, 12.0, 7.0, 5.0, 6.0, 6.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-156.04119873046875, -151.15054321289062, -146.25990295410156, -141.36924743652344, -136.47860717773438, -131.58795166015625, -126.69730377197266, -121.80665588378906, -116.91600799560547, -112.02536010742188, -107.13471221923828, -102.24406433105469, -97.35340881347656, -92.4627685546875, -87.57211303710938, -82.68146514892578, -77.79081726074219, -72.9001693725586, -68.009521484375, -63.11886978149414, -58.22822189331055, -53.33757400512695, -48.446922302246094, -43.5562744140625, -38.665626525878906, -33.77497863769531, -28.884328842163086, -23.99367904663086, -19.103031158447266, -14.212383270263672, -9.321733474731445, -4.431083679199219, 0.4595489501953125, 5.350197792053223, 10.240846633911133, 15.131495475769043, 20.022144317626953, 24.912792205810547, 29.803442001342773, 34.694091796875, 39.584739685058594, 44.47538757324219, 49.36603546142578, 54.25668716430664, 59.147335052490234, 64.03797912597656, 68.92863464355469, 73.81928253173828, 78.70993041992188, 83.60057830810547, 88.49122619628906, 93.38187408447266, 98.27252197265625, 103.16317749023438, 108.05382537841797, 112.94447326660156, 117.83512115478516, 122.72576904296875, 127.61641693115234, 132.50706481933594, 137.39772033691406, 142.28836059570312, 147.17901611328125, 152.06967163085938, 156.96031188964844]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 9.0, 3.0, 21.0, 13.0, 33.0, 56.0, 95.0, 129.0, 219.0, 348.0, 553.0, 831.0, 1372.0, 2143.0, 3078.0, 4664.0, 6992.0, 9893.0, 13632.0, 18766.0, 24971.0, 32634.0, 40905.0, 49233.0, 58315.0, 66259.0, 72940.0, 76832.0, 77984.0, 76509.0, 72637.0, 66452.0, 58196.0, 49353.0, 40988.0, 32462.0, 25201.0, 19103.0, 13923.0, 9948.0, 7043.0, 4658.0, 3236.0, 2130.0, 1369.0, 912.0, 548.0, 392.0, 225.0, 130.0, 99.0, 50.0, 38.0, 20.0, 9.0, 8.0, 5.0, 2.0, 0.0, 1.0, 2.0], "bins": [-72.375, -70.078125, -67.78125, -65.484375, -63.1875, -60.890625, -58.59375, -56.296875, -54.0, -51.703125, -49.40625, -47.109375, -44.8125, -42.515625, -40.21875, -37.921875, -35.625, -33.328125, -31.03125, -28.734375, -26.4375, -24.140625, -21.84375, -19.546875, -17.25, -14.953125, -12.65625, -10.359375, -8.0625, -5.765625, -3.46875, -1.171875, 1.125, 3.421875, 5.71875, 8.015625, 10.3125, 12.609375, 14.90625, 17.203125, 19.5, 21.796875, 24.09375, 26.390625, 28.6875, 30.984375, 33.28125, 35.578125, 37.875, 40.171875, 42.46875, 44.765625, 47.0625, 49.359375, 51.65625, 53.953125, 56.25, 58.546875, 60.84375, 63.140625, 65.4375, 67.734375, 70.03125, 72.328125, 74.625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 8.0, 10.0, 5.0, 9.0, 18.0, 16.0, 23.0, 13.0, 12.0, 24.0, 28.0, 36.0, 35.0, 29.0, 24.0, 34.0, 38.0, 39.0, 42.0, 46.0, 36.0, 57.0, 51.0, 48.0, 30.0, 32.0, 46.0, 26.0, 34.0, 23.0, 28.0, 16.0, 18.0, 20.0, 10.0, 12.0, 7.0, 6.0, 5.0, 5.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-152.0, -147.236328125, -142.47265625, -137.708984375, -132.9453125, -128.181640625, -123.41796875, -118.654296875, -113.890625, -109.126953125, -104.36328125, -99.599609375, -94.8359375, -90.072265625, -85.30859375, -80.544921875, -75.78125, -71.017578125, -66.25390625, -61.490234375, -56.7265625, -51.962890625, -47.19921875, -42.435546875, -37.671875, -32.908203125, -28.14453125, -23.380859375, -18.6171875, -13.853515625, -9.08984375, -4.326171875, 0.4375, 5.201171875, 9.96484375, 14.728515625, 19.4921875, 24.255859375, 29.01953125, 33.783203125, 38.546875, 43.310546875, 48.07421875, 52.837890625, 57.6015625, 62.365234375, 67.12890625, 71.892578125, 76.65625, 81.419921875, 86.18359375, 90.947265625, 95.7109375, 100.474609375, 105.23828125, 110.001953125, 114.765625, 119.529296875, 124.29296875, 129.056640625, 133.8203125, 138.583984375, 143.34765625, 148.111328125, 152.875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 6.0, 7.0, 15.0, 32.0, 44.0, 86.0, 126.0, 187.0, 347.0, 581.0, 946.0, 1435.0, 2268.0, 3605.0, 5329.0, 8018.0, 11759.0, 16472.0, 22756.0, 30370.0, 38924.0, 48510.0, 58750.0, 67654.0, 75534.0, 80918.0, 82961.0, 81382.0, 77318.0, 69286.0, 60751.0, 50164.0, 40955.0, 31819.0, 24045.0, 17661.0, 12331.0, 8733.0, 5952.0, 3880.0, 2509.0, 1604.0, 984.0, 602.0, 367.0, 240.0, 144.0, 84.0, 46.0, 33.0, 19.0, 6.0, 9.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-68.125, -65.8232421875, -63.521484375, -61.2197265625, -58.91796875, -56.6162109375, -54.314453125, -52.0126953125, -49.7109375, -47.4091796875, -45.107421875, -42.8056640625, -40.50390625, -38.2021484375, -35.900390625, -33.5986328125, -31.296875, -28.9951171875, -26.693359375, -24.3916015625, -22.08984375, -19.7880859375, -17.486328125, -15.1845703125, -12.8828125, -10.5810546875, -8.279296875, -5.9775390625, -3.67578125, -1.3740234375, 0.927734375, 3.2294921875, 5.53125, 7.8330078125, 10.134765625, 12.4365234375, 14.73828125, 17.0400390625, 19.341796875, 21.6435546875, 23.9453125, 26.2470703125, 28.548828125, 30.8505859375, 33.15234375, 35.4541015625, 37.755859375, 40.0576171875, 42.359375, 44.6611328125, 46.962890625, 49.2646484375, 51.56640625, 53.8681640625, 56.169921875, 58.4716796875, 60.7734375, 63.0751953125, 65.376953125, 67.6787109375, 69.98046875, 72.2822265625, 74.583984375, 76.8857421875, 79.1875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 2.0, 5.0, 6.0, 3.0, 8.0, 6.0, 7.0, 15.0, 13.0, 13.0, 27.0, 17.0, 18.0, 22.0, 23.0, 28.0, 23.0, 34.0, 29.0, 46.0, 42.0, 34.0, 35.0, 39.0, 45.0, 33.0, 46.0, 39.0, 33.0, 43.0, 39.0, 26.0, 24.0, 28.0, 29.0, 14.0, 18.0, 18.0, 10.0, 15.0, 9.0, 17.0, 4.0, 2.0, 3.0, 6.0, 2.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-94.4375, -91.6494140625, -88.861328125, -86.0732421875, -83.28515625, -80.4970703125, -77.708984375, -74.9208984375, -72.1328125, -69.3447265625, -66.556640625, -63.7685546875, -60.98046875, -58.1923828125, -55.404296875, -52.6162109375, -49.828125, -47.0400390625, -44.251953125, -41.4638671875, -38.67578125, -35.8876953125, -33.099609375, -30.3115234375, -27.5234375, -24.7353515625, -21.947265625, -19.1591796875, -16.37109375, -13.5830078125, -10.794921875, -8.0068359375, -5.21875, -2.4306640625, 0.357421875, 3.1455078125, 5.93359375, 8.7216796875, 11.509765625, 14.2978515625, 17.0859375, 19.8740234375, 22.662109375, 25.4501953125, 28.23828125, 31.0263671875, 33.814453125, 36.6025390625, 39.390625, 42.1787109375, 44.966796875, 47.7548828125, 50.54296875, 53.3310546875, 56.119140625, 58.9072265625, 61.6953125, 64.4833984375, 67.271484375, 70.0595703125, 72.84765625, 75.6357421875, 78.423828125, 81.2119140625, 84.0]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 6.0, 11.0, 20.0, 33.0, 39.0, 73.0, 135.0, 193.0, 337.0, 550.0, 888.0, 1251.0, 2081.0, 3055.0, 4802.0, 6815.0, 9973.0, 14281.0, 20340.0, 27004.0, 36058.0, 46309.0, 56715.0, 67436.0, 76361.0, 83320.0, 85976.0, 85016.0, 80411.0, 72296.0, 62653.0, 51626.0, 41573.0, 31987.0, 24330.0, 17182.0, 12335.0, 8471.0, 5856.0, 3712.0, 2511.0, 1678.0, 1024.0, 699.0, 414.0, 281.0, 183.0, 109.0, 64.0, 35.0, 25.0, 6.0, 7.0, 5.0, 5.0, 2.0, 1.0, 2.0], "bins": [-38.46875, -37.294921875, -36.12109375, -34.947265625, -33.7734375, -32.599609375, -31.42578125, -30.251953125, -29.078125, -27.904296875, -26.73046875, -25.556640625, -24.3828125, -23.208984375, -22.03515625, -20.861328125, -19.6875, -18.513671875, -17.33984375, -16.166015625, -14.9921875, -13.818359375, -12.64453125, -11.470703125, -10.296875, -9.123046875, -7.94921875, -6.775390625, -5.6015625, -4.427734375, -3.25390625, -2.080078125, -0.90625, 0.267578125, 1.44140625, 2.615234375, 3.7890625, 4.962890625, 6.13671875, 7.310546875, 8.484375, 9.658203125, 10.83203125, 12.005859375, 13.1796875, 14.353515625, 15.52734375, 16.701171875, 17.875, 19.048828125, 20.22265625, 21.396484375, 22.5703125, 23.744140625, 24.91796875, 26.091796875, 27.265625, 28.439453125, 29.61328125, 30.787109375, 31.9609375, 33.134765625, 34.30859375, 35.482421875, 36.65625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 6.0, 10.0, 8.0, 5.0, 12.0, 12.0, 12.0, 21.0, 21.0, 25.0, 25.0, 28.0, 23.0, 36.0, 30.0, 35.0, 33.0, 39.0, 41.0, 40.0, 39.0, 54.0, 47.0, 38.0, 46.0, 35.0, 23.0, 17.0, 25.0, 36.0, 20.0, 27.0, 21.0, 12.0, 12.0, 14.0, 13.0, 11.0, 8.0, 9.0, 3.0, 3.0, 3.0, 9.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.00542449951171875, -0.005262613296508789, -0.005100727081298828, -0.004938840866088867, -0.004776954650878906, -0.004615068435668945, -0.004453182220458984, -0.0042912960052490234, -0.0041294097900390625, -0.0039675235748291016, -0.0038056373596191406, -0.0036437511444091797, -0.0034818649291992188, -0.003319978713989258, -0.003158092498779297, -0.002996206283569336, -0.002834320068359375, -0.002672433853149414, -0.002510547637939453, -0.002348661422729492, -0.0021867752075195312, -0.0020248889923095703, -0.0018630027770996094, -0.0017011165618896484, -0.0015392303466796875, -0.0013773441314697266, -0.0012154579162597656, -0.0010535717010498047, -0.0008916854858398438, -0.0007297992706298828, -0.0005679130554199219, -0.00040602684020996094, -0.000244140625, -8.225440979003906e-05, 7.963180541992188e-05, 0.0002415180206298828, 0.00040340423583984375, 0.0005652904510498047, 0.0007271766662597656, 0.0008890628814697266, 0.0010509490966796875, 0.0012128353118896484, 0.0013747215270996094, 0.0015366077423095703, 0.0016984939575195312, 0.0018603801727294922, 0.002022266387939453, 0.002184152603149414, 0.002346038818359375, 0.002507925033569336, 0.002669811248779297, 0.002831697463989258, 0.0029935836791992188, 0.0031554698944091797, 0.0033173561096191406, 0.0034792423248291016, 0.0036411285400390625, 0.0038030147552490234, 0.003964900970458984, 0.004126787185668945, 0.004288673400878906, 0.004450559616088867, 0.004612445831298828, 0.004774332046508789, 0.00493621826171875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 17.0, 32.0, 48.0, 62.0, 94.0, 179.0, 256.0, 475.0, 737.0, 1338.0, 2038.0, 3385.0, 5255.0, 8429.0, 12778.0, 19338.0, 27366.0, 38031.0, 50447.0, 64349.0, 77626.0, 87353.0, 95070.0, 97138.0, 93226.0, 84309.0, 72586.0, 58412.0, 45397.0, 33219.0, 23981.0, 16108.0, 10909.0, 7033.0, 4486.0, 2716.0, 1684.0, 1028.0, 626.0, 397.0, 274.0, 119.0, 86.0, 48.0, 28.0, 17.0, 7.0, 4.0, 6.0, 3.0, 1.0, 0.0, 3.0], "bins": [-50.84375, -49.361328125, -47.87890625, -46.396484375, -44.9140625, -43.431640625, -41.94921875, -40.466796875, -38.984375, -37.501953125, -36.01953125, -34.537109375, -33.0546875, -31.572265625, -30.08984375, -28.607421875, -27.125, -25.642578125, -24.16015625, -22.677734375, -21.1953125, -19.712890625, -18.23046875, -16.748046875, -15.265625, -13.783203125, -12.30078125, -10.818359375, -9.3359375, -7.853515625, -6.37109375, -4.888671875, -3.40625, -1.923828125, -0.44140625, 1.041015625, 2.5234375, 4.005859375, 5.48828125, 6.970703125, 8.453125, 9.935546875, 11.41796875, 12.900390625, 14.3828125, 15.865234375, 17.34765625, 18.830078125, 20.3125, 21.794921875, 23.27734375, 24.759765625, 26.2421875, 27.724609375, 29.20703125, 30.689453125, 32.171875, 33.654296875, 35.13671875, 36.619140625, 38.1015625, 39.583984375, 41.06640625, 42.548828125, 44.03125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 9.0, 7.0, 11.0, 13.0, 21.0, 20.0, 33.0, 19.0, 32.0, 31.0, 41.0, 45.0, 46.0, 58.0, 52.0, 51.0, 60.0, 55.0, 52.0, 41.0, 41.0, 39.0, 36.0, 37.0, 21.0, 30.0, 25.0, 23.0, 7.0, 6.0, 7.0, 8.0, 6.0, 7.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.8125, -25.99365234375, -25.1748046875, -24.35595703125, -23.537109375, -22.71826171875, -21.8994140625, -21.08056640625, -20.26171875, -19.44287109375, -18.6240234375, -17.80517578125, -16.986328125, -16.16748046875, -15.3486328125, -14.52978515625, -13.7109375, -12.89208984375, -12.0732421875, -11.25439453125, -10.435546875, -9.61669921875, -8.7978515625, -7.97900390625, -7.16015625, -6.34130859375, -5.5224609375, -4.70361328125, -3.884765625, -3.06591796875, -2.2470703125, -1.42822265625, -0.609375, 0.20947265625, 1.0283203125, 1.84716796875, 2.666015625, 3.48486328125, 4.3037109375, 5.12255859375, 5.94140625, 6.76025390625, 7.5791015625, 8.39794921875, 9.216796875, 10.03564453125, 10.8544921875, 11.67333984375, 12.4921875, 13.31103515625, 14.1298828125, 14.94873046875, 15.767578125, 16.58642578125, 17.4052734375, 18.22412109375, 19.04296875, 19.86181640625, 20.6806640625, 21.49951171875, 22.318359375, 23.13720703125, 23.9560546875, 24.77490234375, 25.59375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 4.0, 5.0, 6.0, 9.0, 5.0, 10.0, 6.0, 15.0, 17.0, 14.0, 13.0, 17.0, 22.0, 19.0, 22.0, 24.0, 28.0, 38.0, 27.0, 33.0, 30.0, 30.0, 33.0, 39.0, 29.0, 38.0, 42.0, 35.0, 30.0, 34.0, 28.0, 29.0, 36.0, 40.0, 25.0, 17.0, 15.0, 14.0, 16.0, 13.0, 13.0, 12.0, 9.0, 14.0, 10.0, 5.0, 6.0, 7.0, 3.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-114.6191635131836, -111.02305603027344, -107.42694854736328, -103.83084106445312, -100.2347412109375, -96.63863372802734, -93.04252624511719, -89.44641876220703, -85.85031127929688, -82.25420379638672, -78.65809631347656, -75.06199645996094, -71.46588897705078, -67.86978149414062, -64.27367401123047, -60.67756652832031, -57.08146667480469, -53.48535919189453, -49.88925552368164, -46.293148040771484, -42.697044372558594, -39.10093688964844, -35.50482940673828, -31.908723831176758, -28.312618255615234, -24.71651268005371, -21.120407104492188, -17.52429962158203, -13.928194046020508, -10.332088470458984, -6.735980987548828, -3.1398754119873047, 0.4562225341796875, 4.052328586578369, 7.648434638977051, 11.24454116821289, 14.840646743774414, 18.436752319335938, 22.032859802246094, 25.628965377807617, 29.22507095336914, 32.8211784362793, 36.41728210449219, 40.013389587402344, 43.6094970703125, 47.20560073852539, 50.80170822143555, 54.39781188964844, 57.993919372558594, 61.59002685546875, 65.1861343383789, 68.78224182128906, 72.37834167480469, 75.97444915771484, 79.570556640625, 83.16666412353516, 86.76277160644531, 90.35887908935547, 93.95498657226562, 97.55108642578125, 101.1471939086914, 104.74330139160156, 108.33940887451172, 111.93551635742188, 115.5316162109375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 8.0, 6.0, 9.0, 13.0, 8.0, 13.0, 17.0, 32.0, 15.0, 20.0, 30.0, 23.0, 35.0, 29.0, 41.0, 40.0, 37.0, 56.0, 45.0, 38.0, 48.0, 50.0, 37.0, 42.0, 52.0, 38.0, 32.0, 41.0, 27.0, 21.0, 30.0, 13.0, 14.0, 12.0, 11.0, 8.0, 2.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-190.7880401611328, -185.23580932617188, -179.68357849121094, -174.13134765625, -168.5791015625, -163.02687072753906, -157.47463989257812, -151.9224090576172, -146.37017822265625, -140.8179473876953, -135.26571655273438, -129.71348571777344, -124.16124725341797, -118.60901641845703, -113.05677795410156, -107.50454711914062, -101.95231628417969, -96.40008544921875, -90.84785461425781, -85.29561614990234, -79.7433853149414, -74.19115447998047, -68.638916015625, -63.08668518066406, -57.534454345703125, -51.98222351074219, -46.429988861083984, -40.87775421142578, -35.325523376464844, -29.773290634155273, -24.221057891845703, -18.6688232421875, -13.116607666015625, -7.564374923706055, -2.0121421813964844, 3.540090560913086, 9.092323303222656, 14.644556045532227, 20.196788787841797, 25.7490234375, 31.301254272460938, 36.853485107421875, 42.40571975708008, 47.95795440673828, 53.51018524169922, 59.062416076660156, 64.61465454101562, 70.16688537597656, 75.7191162109375, 81.27134704589844, 86.82357788085938, 92.37581634521484, 97.92804718017578, 103.48027801513672, 109.03251647949219, 114.58474731445312, 120.13697814941406, 125.689208984375, 131.24143981933594, 136.79367065429688, 142.34591674804688, 147.8981475830078, 153.45037841796875, 159.0026092529297, 164.55484008789062]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 6.0, 7.0, 12.0, 21.0, 46.0, 91.0, 132.0, 207.0, 322.0, 615.0, 990.0, 1578.0, 2753.0, 4515.0, 7529.0, 12129.0, 19335.0, 30196.0, 45964.0, 68272.0, 98225.0, 136476.0, 182456.0, 233699.0, 286128.0, 331417.0, 364431.0, 378682.0, 373100.0, 348501.0, 306620.0, 256224.0, 204315.0, 155312.0, 113548.0, 80211.0, 54200.0, 35784.0, 23121.0, 14460.0, 9205.0, 5424.0, 3266.0, 1995.0, 1178.0, 627.0, 402.0, 226.0, 127.0, 96.0, 53.0, 28.0, 14.0, 10.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-98.5, -95.3935546875, -92.287109375, -89.1806640625, -86.07421875, -82.9677734375, -79.861328125, -76.7548828125, -73.6484375, -70.5419921875, -67.435546875, -64.3291015625, -61.22265625, -58.1162109375, -55.009765625, -51.9033203125, -48.796875, -45.6904296875, -42.583984375, -39.4775390625, -36.37109375, -33.2646484375, -30.158203125, -27.0517578125, -23.9453125, -20.8388671875, -17.732421875, -14.6259765625, -11.51953125, -8.4130859375, -5.306640625, -2.2001953125, 0.90625, 4.0126953125, 7.119140625, 10.2255859375, 13.33203125, 16.4384765625, 19.544921875, 22.6513671875, 25.7578125, 28.8642578125, 31.970703125, 35.0771484375, 38.18359375, 41.2900390625, 44.396484375, 47.5029296875, 50.609375, 53.7158203125, 56.822265625, 59.9287109375, 63.03515625, 66.1416015625, 69.248046875, 72.3544921875, 75.4609375, 78.5673828125, 81.673828125, 84.7802734375, 87.88671875, 90.9931640625, 94.099609375, 97.2060546875, 100.3125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 7.0, 9.0, 12.0, 7.0, 16.0, 16.0, 21.0, 23.0, 18.0, 27.0, 25.0, 35.0, 30.0, 40.0, 35.0, 41.0, 50.0, 46.0, 38.0, 47.0, 47.0, 41.0, 42.0, 54.0, 41.0, 35.0, 36.0, 27.0, 28.0, 24.0, 19.0, 14.0, 11.0, 14.0, 5.0, 6.0, 3.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-185.875, -180.50390625, -175.1328125, -169.76171875, -164.390625, -159.01953125, -153.6484375, -148.27734375, -142.90625, -137.53515625, -132.1640625, -126.79296875, -121.421875, -116.05078125, -110.6796875, -105.30859375, -99.9375, -94.56640625, -89.1953125, -83.82421875, -78.453125, -73.08203125, -67.7109375, -62.33984375, -56.96875, -51.59765625, -46.2265625, -40.85546875, -35.484375, -30.11328125, -24.7421875, -19.37109375, -14.0, -8.62890625, -3.2578125, 2.11328125, 7.484375, 12.85546875, 18.2265625, 23.59765625, 28.96875, 34.33984375, 39.7109375, 45.08203125, 50.453125, 55.82421875, 61.1953125, 66.56640625, 71.9375, 77.30859375, 82.6796875, 88.05078125, 93.421875, 98.79296875, 104.1640625, 109.53515625, 114.90625, 120.27734375, 125.6484375, 131.01953125, 136.390625, 141.76171875, 147.1328125, 152.50390625, 157.875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 9.0, 16.0, 27.0, 31.0, 79.0, 138.0, 241.0, 414.0, 678.0, 1184.0, 2066.0, 3205.0, 5366.0, 8580.0, 13661.0, 20859.0, 31484.0, 46373.0, 67254.0, 92971.0, 124651.0, 161935.0, 203993.0, 244892.0, 283821.0, 313857.0, 333828.0, 340053.0, 330553.0, 307927.0, 276134.0, 235750.0, 194622.0, 154722.0, 118819.0, 87681.0, 62118.0, 43522.0, 28896.0, 19190.0, 12567.0, 7919.0, 4871.0, 2964.0, 1783.0, 1080.0, 636.0, 361.0, 214.0, 134.0, 62.0, 32.0, 23.0, 20.0, 9.0, 9.0, 1.0, 2.0], "bins": [-101.375, -98.33984375, -95.3046875, -92.26953125, -89.234375, -86.19921875, -83.1640625, -80.12890625, -77.09375, -74.05859375, -71.0234375, -67.98828125, -64.953125, -61.91796875, -58.8828125, -55.84765625, -52.8125, -49.77734375, -46.7421875, -43.70703125, -40.671875, -37.63671875, -34.6015625, -31.56640625, -28.53125, -25.49609375, -22.4609375, -19.42578125, -16.390625, -13.35546875, -10.3203125, -7.28515625, -4.25, -1.21484375, 1.8203125, 4.85546875, 7.890625, 10.92578125, 13.9609375, 16.99609375, 20.03125, 23.06640625, 26.1015625, 29.13671875, 32.171875, 35.20703125, 38.2421875, 41.27734375, 44.3125, 47.34765625, 50.3828125, 53.41796875, 56.453125, 59.48828125, 62.5234375, 65.55859375, 68.59375, 71.62890625, 74.6640625, 77.69921875, 80.734375, 83.76953125, 86.8046875, 89.83984375, 92.875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 8.0, 18.0, 17.0, 17.0, 28.0, 19.0, 42.0, 42.0, 56.0, 82.0, 76.0, 69.0, 107.0, 123.0, 122.0, 131.0, 156.0, 134.0, 165.0, 206.0, 170.0, 198.0, 184.0, 201.0, 178.0, 181.0, 164.0, 140.0, 146.0, 134.0, 122.0, 115.0, 95.0, 82.0, 67.0, 55.0, 45.0, 30.0, 46.0, 31.0, 14.0, 16.0, 9.0, 15.0, 5.0, 6.0, 2.0, 5.0, 1.0, 0.0, 2.0, 2.0], "bins": [-65.9375, -64.0029296875, -62.068359375, -60.1337890625, -58.19921875, -56.2646484375, -54.330078125, -52.3955078125, -50.4609375, -48.5263671875, -46.591796875, -44.6572265625, -42.72265625, -40.7880859375, -38.853515625, -36.9189453125, -34.984375, -33.0498046875, -31.115234375, -29.1806640625, -27.24609375, -25.3115234375, -23.376953125, -21.4423828125, -19.5078125, -17.5732421875, -15.638671875, -13.7041015625, -11.76953125, -9.8349609375, -7.900390625, -5.9658203125, -4.03125, -2.0966796875, -0.162109375, 1.7724609375, 3.70703125, 5.6416015625, 7.576171875, 9.5107421875, 11.4453125, 13.3798828125, 15.314453125, 17.2490234375, 19.18359375, 21.1181640625, 23.052734375, 24.9873046875, 26.921875, 28.8564453125, 30.791015625, 32.7255859375, 34.66015625, 36.5947265625, 38.529296875, 40.4638671875, 42.3984375, 44.3330078125, 46.267578125, 48.2021484375, 50.13671875, 52.0712890625, 54.005859375, 55.9404296875, 57.875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [6.0, 2.0, 4.0, 5.0, 4.0, 7.0, 5.0, 6.0, 11.0, 9.0, 8.0, 17.0, 18.0, 16.0, 17.0, 26.0, 19.0, 30.0, 26.0, 32.0, 36.0, 35.0, 41.0, 40.0, 32.0, 44.0, 35.0, 42.0, 46.0, 33.0, 42.0, 31.0, 33.0, 25.0, 28.0, 24.0, 20.0, 25.0, 21.0, 20.0, 12.0, 12.0, 9.0, 11.0, 12.0, 8.0, 10.0, 6.0, 7.0, 0.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.97655487060547, -113.53524017333984, -109.09392547607422, -104.6526107788086, -100.2113037109375, -95.76998901367188, -91.32867431640625, -86.88735961914062, -82.446044921875, -78.00473022460938, -73.56341552734375, -69.12210083007812, -64.6807861328125, -60.23947525024414, -55.79816436767578, -51.356849670410156, -46.91553497314453, -42.474220275878906, -38.03290557861328, -33.59159469604492, -29.150279998779297, -24.708965301513672, -20.26765251159668, -15.826339721679688, -11.385025024414062, -6.943711280822754, -2.5023975372314453, 1.9389162063598633, 6.380229949951172, 10.821544647216797, 15.262857437133789, 19.70417022705078, 24.145477294921875, 28.5867919921875, 33.028106689453125, 37.469417572021484, 41.91073226928711, 46.352046966552734, 50.793357849121094, 55.23467254638672, 59.675987243652344, 64.11730194091797, 68.5586166381836, 72.99993133544922, 77.44123840332031, 81.88255310058594, 86.32386779785156, 90.76518249511719, 95.20649719238281, 99.64781188964844, 104.08912658691406, 108.53044128417969, 112.97175598144531, 117.41307067871094, 121.85437774658203, 126.29569244384766, 130.73699951171875, 135.17831420898438, 139.61962890625, 144.06094360351562, 148.50225830078125, 152.94357299804688, 157.3848876953125, 161.82620239257812, 166.26751708984375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 7.0, 4.0, 7.0, 10.0, 9.0, 11.0, 15.0, 11.0, 21.0, 14.0, 21.0, 23.0, 31.0, 28.0, 36.0, 26.0, 44.0, 40.0, 42.0, 26.0, 35.0, 46.0, 35.0, 45.0, 50.0, 47.0, 33.0, 31.0, 41.0, 35.0, 30.0, 30.0, 14.0, 23.0, 19.0, 11.0, 16.0, 6.0, 7.0, 7.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-188.596435546875, -183.07728576660156, -177.55813598632812, -172.03897094726562, -166.5198211669922, -161.00067138671875, -155.4815216064453, -149.96237182617188, -144.44320678710938, -138.92405700683594, -133.4049072265625, -127.88574981689453, -122.36659240722656, -116.84744262695312, -111.32829284667969, -105.80914306640625, -100.28999328613281, -94.77084350585938, -89.2516860961914, -83.73253631591797, -78.21337890625, -72.69422912597656, -67.17507934570312, -61.65592575073242, -56.13677215576172, -50.617618560791016, -45.09846496582031, -39.579315185546875, -34.06016159057617, -28.54100799560547, -23.02185821533203, -17.502704620361328, -11.983551025390625, -6.464398384094238, -0.9452457427978516, 4.573905944824219, 10.093059539794922, 15.612213134765625, 21.131362915039062, 26.650516510009766, 32.16967010498047, 37.68882369995117, 43.207977294921875, 48.72712707519531, 54.246280670166016, 59.76543426513672, 65.28458404541016, 70.80374145507812, 76.32289123535156, 81.842041015625, 87.36119842529297, 92.8803482055664, 98.39950561523438, 103.91865539550781, 109.43780517578125, 114.95695495605469, 120.47611236572266, 125.9952621459961, 131.51441955566406, 137.0335693359375, 142.55271911621094, 148.07186889648438, 153.59103393554688, 159.1101837158203, 164.62933349609375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 6.0, 4.0, 7.0, 17.0, 10.0, 17.0, 31.0, 40.0, 69.0, 96.0, 138.0, 212.0, 388.0, 572.0, 946.0, 1446.0, 2514.0, 4120.0, 6979.0, 11693.0, 19350.0, 31308.0, 49967.0, 73888.0, 101247.0, 125292.0, 136979.0, 132398.0, 111564.0, 83635.0, 57522.0, 37267.0, 23385.0, 14108.0, 8394.0, 4992.0, 3005.0, 1816.0, 1103.0, 736.0, 442.0, 303.0, 174.0, 151.0, 82.0, 56.0, 25.0, 23.0, 15.0, 16.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.25, -47.64501953125, -46.0400390625, -44.43505859375, -42.830078125, -41.22509765625, -39.6201171875, -38.01513671875, -36.41015625, -34.80517578125, -33.2001953125, -31.59521484375, -29.990234375, -28.38525390625, -26.7802734375, -25.17529296875, -23.5703125, -21.96533203125, -20.3603515625, -18.75537109375, -17.150390625, -15.54541015625, -13.9404296875, -12.33544921875, -10.73046875, -9.12548828125, -7.5205078125, -5.91552734375, -4.310546875, -2.70556640625, -1.1005859375, 0.50439453125, 2.109375, 3.71435546875, 5.3193359375, 6.92431640625, 8.529296875, 10.13427734375, 11.7392578125, 13.34423828125, 14.94921875, 16.55419921875, 18.1591796875, 19.76416015625, 21.369140625, 22.97412109375, 24.5791015625, 26.18408203125, 27.7890625, 29.39404296875, 30.9990234375, 32.60400390625, 34.208984375, 35.81396484375, 37.4189453125, 39.02392578125, 40.62890625, 42.23388671875, 43.8388671875, 45.44384765625, 47.048828125, 48.65380859375, 50.2587890625, 51.86376953125, 53.46875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 7.0, 4.0, 7.0, 11.0, 10.0, 11.0, 14.0, 11.0, 22.0, 18.0, 17.0, 24.0, 35.0, 26.0, 31.0, 34.0, 44.0, 39.0, 36.0, 28.0, 39.0, 45.0, 35.0, 47.0, 45.0, 48.0, 38.0, 29.0, 41.0, 33.0, 33.0, 24.0, 15.0, 26.0, 16.0, 12.0, 12.0, 6.0, 8.0, 7.0, 7.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-189.875, -184.33984375, -178.8046875, -173.26953125, -167.734375, -162.19921875, -156.6640625, -151.12890625, -145.59375, -140.05859375, -134.5234375, -128.98828125, -123.453125, -117.91796875, -112.3828125, -106.84765625, -101.3125, -95.77734375, -90.2421875, -84.70703125, -79.171875, -73.63671875, -68.1015625, -62.56640625, -57.03125, -51.49609375, -45.9609375, -40.42578125, -34.890625, -29.35546875, -23.8203125, -18.28515625, -12.75, -7.21484375, -1.6796875, 3.85546875, 9.390625, 14.92578125, 20.4609375, 25.99609375, 31.53125, 37.06640625, 42.6015625, 48.13671875, 53.671875, 59.20703125, 64.7421875, 70.27734375, 75.8125, 81.34765625, 86.8828125, 92.41796875, 97.953125, 103.48828125, 109.0234375, 114.55859375, 120.09375, 125.62890625, 131.1640625, 136.69921875, 142.234375, 147.76953125, 153.3046875, 158.83984375, 164.375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 6.0, 21.0, 23.0, 22.0, 50.0, 50.0, 96.0, 131.0, 216.0, 343.0, 574.0, 918.0, 1550.0, 2536.0, 4646.0, 8576.0, 17115.0, 34014.0, 66115.0, 125029.0, 199909.0, 226042.0, 165865.0, 94016.0, 48629.0, 24331.0, 12384.0, 6392.0, 3704.0, 2019.0, 1221.0, 709.0, 456.0, 277.0, 195.0, 104.0, 79.0, 68.0, 46.0, 29.0, 16.0, 8.0, 12.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-78.625, -76.26171875, -73.8984375, -71.53515625, -69.171875, -66.80859375, -64.4453125, -62.08203125, -59.71875, -57.35546875, -54.9921875, -52.62890625, -50.265625, -47.90234375, -45.5390625, -43.17578125, -40.8125, -38.44921875, -36.0859375, -33.72265625, -31.359375, -28.99609375, -26.6328125, -24.26953125, -21.90625, -19.54296875, -17.1796875, -14.81640625, -12.453125, -10.08984375, -7.7265625, -5.36328125, -3.0, -0.63671875, 1.7265625, 4.08984375, 6.453125, 8.81640625, 11.1796875, 13.54296875, 15.90625, 18.26953125, 20.6328125, 22.99609375, 25.359375, 27.72265625, 30.0859375, 32.44921875, 34.8125, 37.17578125, 39.5390625, 41.90234375, 44.265625, 46.62890625, 48.9921875, 51.35546875, 53.71875, 56.08203125, 58.4453125, 60.80859375, 63.171875, 65.53515625, 67.8984375, 70.26171875, 72.625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 4.0, 15.0, 9.0, 8.0, 15.0, 17.0, 13.0, 19.0, 16.0, 18.0, 22.0, 26.0, 20.0, 22.0, 29.0, 32.0, 33.0, 32.0, 39.0, 29.0, 42.0, 32.0, 48.0, 32.0, 36.0, 41.0, 32.0, 41.0, 30.0, 25.0, 32.0, 18.0, 18.0, 27.0, 17.0, 16.0, 14.0, 18.0, 17.0, 7.0, 5.0, 6.0, 5.0, 5.0, 4.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0], "bins": [-101.375, -98.3642578125, -95.353515625, -92.3427734375, -89.33203125, -86.3212890625, -83.310546875, -80.2998046875, -77.2890625, -74.2783203125, -71.267578125, -68.2568359375, -65.24609375, -62.2353515625, -59.224609375, -56.2138671875, -53.203125, -50.1923828125, -47.181640625, -44.1708984375, -41.16015625, -38.1494140625, -35.138671875, -32.1279296875, -29.1171875, -26.1064453125, -23.095703125, -20.0849609375, -17.07421875, -14.0634765625, -11.052734375, -8.0419921875, -5.03125, -2.0205078125, 0.990234375, 4.0009765625, 7.01171875, 10.0224609375, 13.033203125, 16.0439453125, 19.0546875, 22.0654296875, 25.076171875, 28.0869140625, 31.09765625, 34.1083984375, 37.119140625, 40.1298828125, 43.140625, 46.1513671875, 49.162109375, 52.1728515625, 55.18359375, 58.1943359375, 61.205078125, 64.2158203125, 67.2265625, 70.2373046875, 73.248046875, 76.2587890625, 79.26953125, 82.2802734375, 85.291015625, 88.3017578125, 91.3125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 0.0, 4.0, 7.0, 9.0, 13.0, 12.0, 18.0, 30.0, 38.0, 65.0, 106.0, 170.0, 242.0, 330.0, 479.0, 704.0, 1055.0, 1617.0, 2509.0, 4174.0, 7085.0, 12247.0, 22394.0, 43445.0, 90225.0, 192964.0, 290930.0, 191670.0, 89416.0, 43869.0, 22073.0, 12098.0, 6970.0, 4178.0, 2642.0, 1550.0, 1042.0, 692.0, 472.0, 304.0, 246.0, 144.0, 101.0, 60.0, 54.0, 39.0, 18.0, 14.0, 6.0, 8.0, 10.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-47.4375, -45.9775390625, -44.517578125, -43.0576171875, -41.59765625, -40.1376953125, -38.677734375, -37.2177734375, -35.7578125, -34.2978515625, -32.837890625, -31.3779296875, -29.91796875, -28.4580078125, -26.998046875, -25.5380859375, -24.078125, -22.6181640625, -21.158203125, -19.6982421875, -18.23828125, -16.7783203125, -15.318359375, -13.8583984375, -12.3984375, -10.9384765625, -9.478515625, -8.0185546875, -6.55859375, -5.0986328125, -3.638671875, -2.1787109375, -0.71875, 0.7412109375, 2.201171875, 3.6611328125, 5.12109375, 6.5810546875, 8.041015625, 9.5009765625, 10.9609375, 12.4208984375, 13.880859375, 15.3408203125, 16.80078125, 18.2607421875, 19.720703125, 21.1806640625, 22.640625, 24.1005859375, 25.560546875, 27.0205078125, 28.48046875, 29.9404296875, 31.400390625, 32.8603515625, 34.3203125, 35.7802734375, 37.240234375, 38.7001953125, 40.16015625, 41.6201171875, 43.080078125, 44.5400390625, 46.0]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 2.0, 2.0, 4.0, 4.0, 10.0, 7.0, 5.0, 11.0, 22.0, 23.0, 24.0, 31.0, 40.0, 26.0, 31.0, 38.0, 46.0, 43.0, 47.0, 52.0, 46.0, 45.0, 67.0, 36.0, 43.0, 38.0, 34.0, 43.0, 34.0, 27.0, 20.0, 14.0, 16.0, 14.0, 13.0, 13.0, 10.0, 8.0, 8.0, 3.0, 0.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0018663406372070312, -0.0018041878938674927, -0.001742035150527954, -0.0016798824071884155, -0.001617729663848877, -0.0015555769205093384, -0.0014934241771697998, -0.0014312714338302612, -0.0013691186904907227, -0.001306965947151184, -0.0012448132038116455, -0.001182660460472107, -0.0011205077171325684, -0.0010583549737930298, -0.0009962022304534912, -0.0009340494871139526, -0.0008718967437744141, -0.0008097440004348755, -0.0007475912570953369, -0.0006854385137557983, -0.0006232857704162598, -0.0005611330270767212, -0.0004989802837371826, -0.00043682754039764404, -0.00037467479705810547, -0.0003125220537185669, -0.0002503693103790283, -0.00018821656703948975, -0.00012606382369995117, -6.39110803604126e-05, -1.7583370208740234e-06, 6.039440631866455e-05, 0.00012254714965820312, 0.0001846998929977417, 0.0002468526363372803, 0.00030900537967681885, 0.0003711581230163574, 0.000433310866355896, 0.0004954636096954346, 0.0005576163530349731, 0.0006197690963745117, 0.0006819218397140503, 0.0007440745830535889, 0.0008062273263931274, 0.000868380069732666, 0.0009305328130722046, 0.0009926855564117432, 0.0010548382997512817, 0.0011169910430908203, 0.0011791437864303589, 0.0012412965297698975, 0.001303449273109436, 0.0013656020164489746, 0.0014277547597885132, 0.0014899075031280518, 0.0015520602464675903, 0.001614212989807129, 0.0016763657331466675, 0.001738518476486206, 0.0018006712198257446, 0.0018628239631652832, 0.0019249767065048218, 0.0019871294498443604, 0.002049282193183899, 0.0021114349365234375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 12.0, 10.0, 25.0, 22.0, 37.0, 68.0, 105.0, 147.0, 250.0, 425.0, 713.0, 1166.0, 2070.0, 3442.0, 6119.0, 11346.0, 20124.0, 35210.0, 60839.0, 98578.0, 141273.0, 170654.0, 165278.0, 127136.0, 84390.0, 51157.0, 29603.0, 16667.0, 9319.0, 5170.0, 2925.0, 1703.0, 1008.0, 622.0, 338.0, 218.0, 126.0, 98.0, 60.0, 38.0, 21.0, 10.0, 10.0, 8.0, 5.0, 5.0, 2.0, 4.0, 0.0, 2.0], "bins": [-59.6875, -58.02197265625, -56.3564453125, -54.69091796875, -53.025390625, -51.35986328125, -49.6943359375, -48.02880859375, -46.36328125, -44.69775390625, -43.0322265625, -41.36669921875, -39.701171875, -38.03564453125, -36.3701171875, -34.70458984375, -33.0390625, -31.37353515625, -29.7080078125, -28.04248046875, -26.376953125, -24.71142578125, -23.0458984375, -21.38037109375, -19.71484375, -18.04931640625, -16.3837890625, -14.71826171875, -13.052734375, -11.38720703125, -9.7216796875, -8.05615234375, -6.390625, -4.72509765625, -3.0595703125, -1.39404296875, 0.271484375, 1.93701171875, 3.6025390625, 5.26806640625, 6.93359375, 8.59912109375, 10.2646484375, 11.93017578125, 13.595703125, 15.26123046875, 16.9267578125, 18.59228515625, 20.2578125, 21.92333984375, 23.5888671875, 25.25439453125, 26.919921875, 28.58544921875, 30.2509765625, 31.91650390625, 33.58203125, 35.24755859375, 36.9130859375, 38.57861328125, 40.244140625, 41.90966796875, 43.5751953125, 45.24072265625, 46.90625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 9.0, 3.0, 6.0, 6.0, 9.0, 14.0, 22.0, 34.0, 36.0, 31.0, 44.0, 49.0, 45.0, 57.0, 59.0, 52.0, 58.0, 55.0, 52.0, 56.0, 46.0, 49.0, 33.0, 35.0, 27.0, 23.0, 17.0, 9.0, 14.0, 11.0, 9.0, 5.0, 5.0, 5.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.8125, -22.125732421875, -21.43896484375, -20.752197265625, -20.0654296875, -19.378662109375, -18.69189453125, -18.005126953125, -17.318359375, -16.631591796875, -15.94482421875, -15.258056640625, -14.5712890625, -13.884521484375, -13.19775390625, -12.510986328125, -11.82421875, -11.137451171875, -10.45068359375, -9.763916015625, -9.0771484375, -8.390380859375, -7.70361328125, -7.016845703125, -6.330078125, -5.643310546875, -4.95654296875, -4.269775390625, -3.5830078125, -2.896240234375, -2.20947265625, -1.522705078125, -0.8359375, -0.149169921875, 0.53759765625, 1.224365234375, 1.9111328125, 2.597900390625, 3.28466796875, 3.971435546875, 4.658203125, 5.344970703125, 6.03173828125, 6.718505859375, 7.4052734375, 8.092041015625, 8.77880859375, 9.465576171875, 10.15234375, 10.839111328125, 11.52587890625, 12.212646484375, 12.8994140625, 13.586181640625, 14.27294921875, 14.959716796875, 15.646484375, 16.333251953125, 17.02001953125, 17.706787109375, 18.3935546875, 19.080322265625, 19.76708984375, 20.453857421875, 21.140625]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 3.0, 6.0, 3.0, 7.0, 2.0, 9.0, 13.0, 6.0, 7.0, 21.0, 20.0, 22.0, 15.0, 23.0, 21.0, 21.0, 24.0, 28.0, 45.0, 36.0, 30.0, 43.0, 46.0, 33.0, 40.0, 46.0, 41.0, 35.0, 37.0, 44.0, 31.0, 26.0, 23.0, 21.0, 28.0, 21.0, 18.0, 15.0, 17.0, 8.0, 12.0, 13.0, 10.0, 12.0, 9.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.23580169677734, -118.74876403808594, -114.26173400878906, -109.77469635009766, -105.28766632080078, -100.80062866210938, -96.3135986328125, -91.8265609741211, -87.33952331542969, -82.85248565673828, -78.3654556274414, -73.87841796875, -69.39138793945312, -64.90435028076172, -60.41731643676758, -55.93028259277344, -51.44325256347656, -46.95621871948242, -42.46918487548828, -37.982147216796875, -33.4951171875, -29.008081436157227, -24.521045684814453, -20.034011840820312, -15.546977996826172, -11.059944152832031, -6.572909355163574, -2.085874557495117, 2.4011592864990234, 6.888193130493164, 11.375228881835938, 15.862262725830078, 20.349288940429688, 24.836322784423828, 29.32335662841797, 33.810394287109375, 38.29742431640625, 42.784461975097656, 47.2714958190918, 51.75852966308594, 56.24556350708008, 60.73259735107422, 65.21963500976562, 69.7066650390625, 74.1937026977539, 78.68073272705078, 83.16777038574219, 87.65480041503906, 92.14183807373047, 96.62887573242188, 101.11590576171875, 105.60294342041016, 110.08997344970703, 114.57701110839844, 119.06404113769531, 123.55107879638672, 128.03811645507812, 132.525146484375, 137.01219177246094, 141.4992218017578, 145.9862518310547, 150.47328186035156, 154.9603271484375, 159.44735717773438, 163.93438720703125]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 7.0, 6.0, 10.0, 7.0, 14.0, 21.0, 13.0, 21.0, 22.0, 21.0, 25.0, 29.0, 31.0, 31.0, 46.0, 41.0, 28.0, 35.0, 45.0, 49.0, 36.0, 47.0, 40.0, 44.0, 41.0, 41.0, 40.0, 29.0, 41.0, 17.0, 16.0, 28.0, 22.0, 14.0, 7.0, 6.0, 5.0, 10.0, 5.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-199.10166931152344, -193.3509063720703, -187.60015869140625, -181.84939575195312, -176.09864807128906, -170.34788513183594, -164.59713745117188, -158.84637451171875, -153.09561157226562, -147.3448486328125, -141.59410095214844, -135.8433380126953, -130.09259033203125, -124.34182739257812, -118.59107208251953, -112.84031677246094, -107.08956909179688, -101.33881378173828, -95.58805847167969, -89.83729553222656, -84.0865478515625, -78.33578491210938, -72.58502960205078, -66.83427429199219, -61.083518981933594, -55.332763671875, -49.582008361816406, -43.83124923706055, -38.08049392700195, -32.32973861694336, -26.5789794921875, -20.828224182128906, -15.077468872070312, -9.326712608337402, -3.575956344604492, 2.1748008728027344, 7.925556182861328, 13.676311492919922, 19.42707061767578, 25.177825927734375, 30.92858123779297, 36.67933654785156, 42.430091857910156, 48.180850982666016, 53.93160629272461, 59.6823616027832, 65.43312072753906, 71.18387603759766, 76.93463134765625, 82.68538665771484, 88.43614196777344, 94.18690490722656, 99.93765258789062, 105.68841552734375, 111.43917083740234, 117.18992614746094, 122.94068145751953, 128.69143676757812, 134.44219970703125, 140.1929473876953, 145.94371032714844, 151.6944580078125, 157.44522094726562, 163.19598388671875, 168.9467315673828]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 8.0, 14.0, 23.0, 21.0, 27.0, 67.0, 66.0, 117.0, 213.0, 268.0, 391.0, 701.0, 1122.0, 1763.0, 3166.0, 5136.0, 8974.0, 15044.0, 24477.0, 37167.0, 54384.0, 73217.0, 92624.0, 107733.0, 115845.0, 113852.0, 103612.0, 86863.0, 67461.0, 48648.0, 32596.0, 20979.0, 13049.0, 7628.0, 4447.0, 2738.0, 1588.0, 958.0, 555.0, 333.0, 239.0, 142.0, 102.0, 67.0, 37.0, 32.0, 24.0, 21.0, 9.0, 2.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-122.6875, -118.9521484375, -115.216796875, -111.4814453125, -107.74609375, -104.0107421875, -100.275390625, -96.5400390625, -92.8046875, -89.0693359375, -85.333984375, -81.5986328125, -77.86328125, -74.1279296875, -70.392578125, -66.6572265625, -62.921875, -59.1865234375, -55.451171875, -51.7158203125, -47.98046875, -44.2451171875, -40.509765625, -36.7744140625, -33.0390625, -29.3037109375, -25.568359375, -21.8330078125, -18.09765625, -14.3623046875, -10.626953125, -6.8916015625, -3.15625, 0.5791015625, 4.314453125, 8.0498046875, 11.78515625, 15.5205078125, 19.255859375, 22.9912109375, 26.7265625, 30.4619140625, 34.197265625, 37.9326171875, 41.66796875, 45.4033203125, 49.138671875, 52.8740234375, 56.609375, 60.3447265625, 64.080078125, 67.8154296875, 71.55078125, 75.2861328125, 79.021484375, 82.7568359375, 86.4921875, 90.2275390625, 93.962890625, 97.6982421875, 101.43359375, 105.1689453125, 108.904296875, 112.6396484375, 116.375]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 6.0, 6.0, 11.0, 9.0, 12.0, 19.0, 17.0, 18.0, 19.0, 27.0, 23.0, 29.0, 32.0, 31.0, 47.0, 41.0, 31.0, 34.0, 43.0, 50.0, 33.0, 48.0, 42.0, 47.0, 39.0, 38.0, 41.0, 30.0, 38.0, 19.0, 14.0, 32.0, 19.0, 12.0, 9.0, 4.0, 7.0, 11.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-197.75, -192.02734375, -186.3046875, -180.58203125, -174.859375, -169.13671875, -163.4140625, -157.69140625, -151.96875, -146.24609375, -140.5234375, -134.80078125, -129.078125, -123.35546875, -117.6328125, -111.91015625, -106.1875, -100.46484375, -94.7421875, -89.01953125, -83.296875, -77.57421875, -71.8515625, -66.12890625, -60.40625, -54.68359375, -48.9609375, -43.23828125, -37.515625, -31.79296875, -26.0703125, -20.34765625, -14.625, -8.90234375, -3.1796875, 2.54296875, 8.265625, 13.98828125, 19.7109375, 25.43359375, 31.15625, 36.87890625, 42.6015625, 48.32421875, 54.046875, 59.76953125, 65.4921875, 71.21484375, 76.9375, 82.66015625, 88.3828125, 94.10546875, 99.828125, 105.55078125, 111.2734375, 116.99609375, 122.71875, 128.44140625, 134.1640625, 139.88671875, 145.609375, 151.33203125, 157.0546875, 162.77734375, 168.5]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 10.0, 18.0, 23.0, 36.0, 68.0, 101.0, 142.0, 222.0, 356.0, 545.0, 938.0, 1444.0, 2444.0, 4111.0, 6783.0, 10903.0, 17567.0, 27026.0, 40662.0, 57283.0, 77064.0, 95431.0, 107759.0, 114092.0, 110667.0, 98327.0, 82559.0, 62677.0, 45534.0, 30898.0, 20330.0, 12711.0, 7748.0, 4742.0, 2846.0, 1731.0, 1060.0, 598.0, 381.0, 254.0, 170.0, 110.0, 61.0, 49.0, 33.0, 14.0, 10.0, 10.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-119.6875, -115.7822265625, -111.876953125, -107.9716796875, -104.06640625, -100.1611328125, -96.255859375, -92.3505859375, -88.4453125, -84.5400390625, -80.634765625, -76.7294921875, -72.82421875, -68.9189453125, -65.013671875, -61.1083984375, -57.203125, -53.2978515625, -49.392578125, -45.4873046875, -41.58203125, -37.6767578125, -33.771484375, -29.8662109375, -25.9609375, -22.0556640625, -18.150390625, -14.2451171875, -10.33984375, -6.4345703125, -2.529296875, 1.3759765625, 5.28125, 9.1865234375, 13.091796875, 16.9970703125, 20.90234375, 24.8076171875, 28.712890625, 32.6181640625, 36.5234375, 40.4287109375, 44.333984375, 48.2392578125, 52.14453125, 56.0498046875, 59.955078125, 63.8603515625, 67.765625, 71.6708984375, 75.576171875, 79.4814453125, 83.38671875, 87.2919921875, 91.197265625, 95.1025390625, 99.0078125, 102.9130859375, 106.818359375, 110.7236328125, 114.62890625, 118.5341796875, 122.439453125, 126.3447265625, 130.25]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 8.0, 4.0, 6.0, 3.0, 14.0, 10.0, 19.0, 27.0, 28.0, 33.0, 31.0, 31.0, 33.0, 41.0, 35.0, 49.0, 48.0, 38.0, 50.0, 31.0, 47.0, 38.0, 38.0, 41.0, 48.0, 38.0, 34.0, 24.0, 20.0, 24.0, 19.0, 16.0, 12.0, 13.0, 8.0, 9.0, 8.0, 5.0, 6.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.9375, -100.0595703125, -96.181640625, -92.3037109375, -88.42578125, -84.5478515625, -80.669921875, -76.7919921875, -72.9140625, -69.0361328125, -65.158203125, -61.2802734375, -57.40234375, -53.5244140625, -49.646484375, -45.7685546875, -41.890625, -38.0126953125, -34.134765625, -30.2568359375, -26.37890625, -22.5009765625, -18.623046875, -14.7451171875, -10.8671875, -6.9892578125, -3.111328125, 0.7666015625, 4.64453125, 8.5224609375, 12.400390625, 16.2783203125, 20.15625, 24.0341796875, 27.912109375, 31.7900390625, 35.66796875, 39.5458984375, 43.423828125, 47.3017578125, 51.1796875, 55.0576171875, 58.935546875, 62.8134765625, 66.69140625, 70.5693359375, 74.447265625, 78.3251953125, 82.203125, 86.0810546875, 89.958984375, 93.8369140625, 97.71484375, 101.5927734375, 105.470703125, 109.3486328125, 113.2265625, 117.1044921875, 120.982421875, 124.8603515625, 128.73828125, 132.6162109375, 136.494140625, 140.3720703125, 144.25]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 6.0, 8.0, 10.0, 17.0, 26.0, 36.0, 43.0, 59.0, 93.0, 162.0, 226.0, 375.0, 605.0, 997.0, 1677.0, 2981.0, 5014.0, 8529.0, 14341.0, 23064.0, 36321.0, 54149.0, 74130.0, 95494.0, 112988.0, 120886.0, 118773.0, 105592.0, 86395.0, 64529.0, 44951.0, 29846.0, 18631.0, 11173.0, 6637.0, 4021.0, 2232.0, 1282.0, 818.0, 496.0, 306.0, 209.0, 123.0, 84.0, 75.0, 45.0, 34.0, 23.0, 19.0, 10.0, 9.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-53.90625, -52.26123046875, -50.6162109375, -48.97119140625, -47.326171875, -45.68115234375, -44.0361328125, -42.39111328125, -40.74609375, -39.10107421875, -37.4560546875, -35.81103515625, -34.166015625, -32.52099609375, -30.8759765625, -29.23095703125, -27.5859375, -25.94091796875, -24.2958984375, -22.65087890625, -21.005859375, -19.36083984375, -17.7158203125, -16.07080078125, -14.42578125, -12.78076171875, -11.1357421875, -9.49072265625, -7.845703125, -6.20068359375, -4.5556640625, -2.91064453125, -1.265625, 0.37939453125, 2.0244140625, 3.66943359375, 5.314453125, 6.95947265625, 8.6044921875, 10.24951171875, 11.89453125, 13.53955078125, 15.1845703125, 16.82958984375, 18.474609375, 20.11962890625, 21.7646484375, 23.40966796875, 25.0546875, 26.69970703125, 28.3447265625, 29.98974609375, 31.634765625, 33.27978515625, 34.9248046875, 36.56982421875, 38.21484375, 39.85986328125, 41.5048828125, 43.14990234375, 44.794921875, 46.43994140625, 48.0849609375, 49.72998046875, 51.375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 11.0, 5.0, 8.0, 6.0, 16.0, 12.0, 18.0, 24.0, 31.0, 35.0, 23.0, 38.0, 31.0, 30.0, 38.0, 40.0, 38.0, 49.0, 52.0, 56.0, 43.0, 40.0, 31.0, 39.0, 31.0, 32.0, 30.0, 28.0, 27.0, 19.0, 25.0, 14.0, 15.0, 10.0, 12.0, 7.0, 14.0, 7.0, 3.0, 1.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.006168365478515625, -0.005987107753753662, -0.005805850028991699, -0.005624592304229736, -0.0054433345794677734, -0.0052620768547058105, -0.005080819129943848, -0.004899561405181885, -0.004718303680419922, -0.004537045955657959, -0.004355788230895996, -0.004174530506134033, -0.00399327278137207, -0.0038120150566101074, -0.0036307573318481445, -0.0034494996070861816, -0.0032682418823242188, -0.003086984157562256, -0.002905726432800293, -0.00272446870803833, -0.002543210983276367, -0.0023619532585144043, -0.0021806955337524414, -0.0019994378089904785, -0.0018181800842285156, -0.0016369223594665527, -0.0014556646347045898, -0.001274406909942627, -0.001093149185180664, -0.0009118914604187012, -0.0007306337356567383, -0.0005493760108947754, -0.0003681182861328125, -0.0001868605613708496, -5.602836608886719e-06, 0.00017565488815307617, 0.00035691261291503906, 0.000538170337677002, 0.0007194280624389648, 0.0009006857872009277, 0.0010819435119628906, 0.0012632012367248535, 0.0014444589614868164, 0.0016257166862487793, 0.0018069744110107422, 0.001988232135772705, 0.002169489860534668, 0.002350747585296631, 0.0025320053100585938, 0.0027132630348205566, 0.0028945207595825195, 0.0030757784843444824, 0.0032570362091064453, 0.003438293933868408, 0.003619551658630371, 0.003800809383392334, 0.003982067108154297, 0.00416332483291626, 0.004344582557678223, 0.0045258402824401855, 0.0047070980072021484, 0.004888355731964111, 0.005069613456726074, 0.005250871181488037, 0.00543212890625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 10.0, 13.0, 20.0, 27.0, 50.0, 77.0, 144.0, 217.0, 347.0, 600.0, 925.0, 1490.0, 2479.0, 4016.0, 6012.0, 9341.0, 13860.0, 20181.0, 28695.0, 39191.0, 52146.0, 64681.0, 77869.0, 88383.0, 94659.0, 95188.0, 91385.0, 82426.0, 70459.0, 56581.0, 44183.0, 32577.0, 23409.0, 16267.0, 11089.0, 7242.0, 4671.0, 2942.0, 1773.0, 1127.0, 676.0, 458.0, 267.0, 166.0, 94.0, 73.0, 32.0, 17.0, 13.0, 2.0, 9.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-41.96875, -40.62353515625, -39.2783203125, -37.93310546875, -36.587890625, -35.24267578125, -33.8974609375, -32.55224609375, -31.20703125, -29.86181640625, -28.5166015625, -27.17138671875, -25.826171875, -24.48095703125, -23.1357421875, -21.79052734375, -20.4453125, -19.10009765625, -17.7548828125, -16.40966796875, -15.064453125, -13.71923828125, -12.3740234375, -11.02880859375, -9.68359375, -8.33837890625, -6.9931640625, -5.64794921875, -4.302734375, -2.95751953125, -1.6123046875, -0.26708984375, 1.078125, 2.42333984375, 3.7685546875, 5.11376953125, 6.458984375, 7.80419921875, 9.1494140625, 10.49462890625, 11.83984375, 13.18505859375, 14.5302734375, 15.87548828125, 17.220703125, 18.56591796875, 19.9111328125, 21.25634765625, 22.6015625, 23.94677734375, 25.2919921875, 26.63720703125, 27.982421875, 29.32763671875, 30.6728515625, 32.01806640625, 33.36328125, 34.70849609375, 36.0537109375, 37.39892578125, 38.744140625, 40.08935546875, 41.4345703125, 42.77978515625, 44.125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 6.0, 9.0, 8.0, 5.0, 17.0, 14.0, 10.0, 14.0, 31.0, 29.0, 27.0, 31.0, 28.0, 38.0, 35.0, 40.0, 46.0, 48.0, 32.0, 48.0, 47.0, 42.0, 41.0, 35.0, 39.0, 28.0, 29.0, 28.0, 22.0, 23.0, 25.0, 25.0, 16.0, 16.0, 10.0, 5.0, 10.0, 9.0, 7.0, 8.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.75, -20.0966796875, -19.443359375, -18.7900390625, -18.13671875, -17.4833984375, -16.830078125, -16.1767578125, -15.5234375, -14.8701171875, -14.216796875, -13.5634765625, -12.91015625, -12.2568359375, -11.603515625, -10.9501953125, -10.296875, -9.6435546875, -8.990234375, -8.3369140625, -7.68359375, -7.0302734375, -6.376953125, -5.7236328125, -5.0703125, -4.4169921875, -3.763671875, -3.1103515625, -2.45703125, -1.8037109375, -1.150390625, -0.4970703125, 0.15625, 0.8095703125, 1.462890625, 2.1162109375, 2.76953125, 3.4228515625, 4.076171875, 4.7294921875, 5.3828125, 6.0361328125, 6.689453125, 7.3427734375, 7.99609375, 8.6494140625, 9.302734375, 9.9560546875, 10.609375, 11.2626953125, 11.916015625, 12.5693359375, 13.22265625, 13.8759765625, 14.529296875, 15.1826171875, 15.8359375, 16.4892578125, 17.142578125, 17.7958984375, 18.44921875, 19.1025390625, 19.755859375, 20.4091796875, 21.0625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 5.0, 6.0, 6.0, 9.0, 7.0, 11.0, 21.0, 16.0, 18.0, 17.0, 24.0, 16.0, 21.0, 29.0, 37.0, 46.0, 37.0, 33.0, 40.0, 46.0, 44.0, 40.0, 48.0, 36.0, 38.0, 33.0, 30.0, 30.0, 43.0, 21.0, 34.0, 26.0, 16.0, 15.0, 12.0, 19.0, 13.0, 10.0, 10.0, 8.0, 5.0, 9.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-147.6806640625, -142.95852661132812, -138.23638916015625, -133.51425170898438, -128.7921142578125, -124.0699691772461, -119.34782409667969, -114.62568664550781, -109.90354919433594, -105.18141174316406, -100.45927429199219, -95.73712921142578, -91.0149917602539, -86.29285430908203, -81.57070922851562, -76.84857177734375, -72.12643432617188, -67.404296875, -62.68215560913086, -57.96001434326172, -53.237876892089844, -48.51573944091797, -43.79359817504883, -39.07145690917969, -34.34931945800781, -29.627180099487305, -24.905040740966797, -20.18290138244629, -15.460762023925781, -10.738622665405273, -6.016483306884766, -1.294342041015625, 3.42779541015625, 8.149934768676758, 12.872074127197266, 17.594213485717773, 22.31635284423828, 27.03849220275879, 31.760631561279297, 36.48277282714844, 41.20491027832031, 45.92704772949219, 50.64918899536133, 55.37133026123047, 60.093467712402344, 64.81560516357422, 69.53775024414062, 74.2598876953125, 78.98202514648438, 83.70416259765625, 88.42630004882812, 93.14844512939453, 97.8705825805664, 102.59272003173828, 107.31486511230469, 112.03700256347656, 116.75914001464844, 121.48127746582031, 126.20341491699219, 130.92555236816406, 135.647705078125, 140.36984252929688, 145.09197998046875, 149.81411743164062, 154.5362548828125]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 8.0, 7.0, 7.0, 10.0, 11.0, 18.0, 8.0, 13.0, 17.0, 19.0, 19.0, 23.0, 21.0, 26.0, 25.0, 27.0, 35.0, 26.0, 32.0, 31.0, 45.0, 30.0, 51.0, 43.0, 41.0, 37.0, 39.0, 43.0, 43.0, 31.0, 26.0, 30.0, 29.0, 22.0, 22.0, 16.0, 7.0, 5.0, 8.0, 11.0, 15.0, 10.0, 4.0, 6.0, 6.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-196.55799865722656, -190.81088256835938, -185.0637664794922, -179.316650390625, -173.5695343017578, -167.82241821289062, -162.07528686523438, -156.32818603515625, -150.5810546875, -144.8339385986328, -139.08682250976562, -133.33970642089844, -127.59259033203125, -121.84547424316406, -116.09835052490234, -110.35123443603516, -104.6041259765625, -98.85700988769531, -93.10989379882812, -87.36277770996094, -81.61566162109375, -75.86854553222656, -70.12142181396484, -64.37430572509766, -58.62718963623047, -52.88007354736328, -47.132957458496094, -41.38583755493164, -35.63872146606445, -29.891605377197266, -24.144485473632812, -18.397369384765625, -12.650253295898438, -6.903136253356934, -1.1560192108154297, 4.591098785400391, 10.338214874267578, 16.085330963134766, 21.83245086669922, 27.579566955566406, 33.326683044433594, 39.07379913330078, 44.82091522216797, 50.56803512573242, 56.31515121459961, 62.0622673034668, 67.80938720703125, 73.55650329589844, 79.30361938476562, 85.05073547363281, 90.7978515625, 96.54496765136719, 102.29208374023438, 108.03919982910156, 113.78632354736328, 119.53343963623047, 125.28055572509766, 131.02767944335938, 136.77479553222656, 142.52191162109375, 148.26902770996094, 154.01614379882812, 159.7632598876953, 165.5103759765625, 171.2574920654297]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 10.0, 14.0, 8.0, 23.0, 27.0, 39.0, 56.0, 88.0, 103.0, 170.0, 208.0, 317.0, 382.0, 522.0, 655.0, 859.0, 1174.0, 1429.0, 1770.0, 2099.0, 2602.0, 2967.0, 3279.0, 3781.0, 1008488.0, 3355.0, 2902.0, 2657.0, 2209.0, 1941.0, 1532.0, 1246.0, 966.0, 692.0, 536.0, 400.0, 284.0, 249.0, 181.0, 111.0, 84.0, 60.0, 39.0, 34.0, 22.0, 9.0, 9.0, 7.0, 5.0, 4.0, 1.0, 2.0, 2.0], "bins": [-1352.8056640625, -1314.2723388671875, -1275.739013671875, -1237.205810546875, -1198.6724853515625, -1160.13916015625, -1121.6058349609375, -1083.072509765625, -1044.5391845703125, -1006.005859375, -967.4725952148438, -928.9392700195312, -890.4059448242188, -851.8726806640625, -813.33935546875, -774.8060302734375, -736.2727661132812, -697.7394409179688, -659.2061767578125, -620.6728515625, -582.1395263671875, -543.606201171875, -505.07293701171875, -466.53961181640625, -428.0063171386719, -389.4730224609375, -350.939697265625, -312.4064025878906, -273.87310791015625, -235.33978271484375, -196.80648803710938, -158.27316284179688, -119.7398681640625, -81.20655822753906, -42.673255920410156, -4.13995361328125, 34.39335632324219, 72.92666625976562, 111.4599609375, 149.9932861328125, 188.52658081054688, 227.0598907470703, 265.59320068359375, 304.1264953613281, 342.6597900390625, 381.193115234375, 419.7264099121094, 458.2597351074219, 496.79302978515625, 535.3263549804688, 573.859619140625, 612.3929443359375, 650.92626953125, 689.4595947265625, 727.9928588867188, 766.5261840820312, 805.0594482421875, 843.5927734375, 882.1260375976562, 920.6593627929688, 959.1926879882812, 997.7259521484375, 1036.25927734375, 1074.7926025390625, 1113.325927734375]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 8.0, 10.0, 13.0, 12.0, 16.0, 18.0, 33.0, 40.0, 53.0, 78.0, 121.0, 232.0, 387.0, 820.0, 1403.0, 2595.0, 4650.0, 7988.0, 13413.0, 22328.0, 41217.0, 51304040.0, 29659.0, 17647.0, 10432.0, 6207.0, 3523.0, 1965.0, 1015.0, 601.0, 312.0, 182.0, 107.0, 58.0, 41.0, 23.0, 16.0, 20.0, 8.0, 4.0, 11.0, 7.0, 6.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0], "bins": [-1517.404541015625, -1468.8636474609375, -1420.3226318359375, -1371.78173828125, -1323.24072265625, -1274.6998291015625, -1226.158935546875, -1177.617919921875, -1129.0770263671875, -1080.5361328125, -1031.9951171875, -983.4542236328125, -934.9132690429688, -886.372314453125, -837.8313598632812, -789.2904052734375, -740.7494506835938, -692.20849609375, -643.6675415039062, -595.1265869140625, -546.585693359375, -498.04473876953125, -449.5037841796875, -400.9628601074219, -352.4219055175781, -303.8809509277344, -255.34002685546875, -206.799072265625, -158.2581329345703, -109.71719360351562, -61.176239013671875, -12.63531494140625, 35.9056396484375, 84.44657897949219, 132.98751831054688, 181.52847290039062, 230.0694122314453, 278.6103515625, 327.15130615234375, 375.6922302246094, 424.2331848144531, 472.7741394042969, 521.3150634765625, 569.8560180664062, 618.39697265625, 666.9378662109375, 715.4788818359375, 764.019775390625, 812.5607299804688, 861.1016845703125, 909.6426391601562, 958.18359375, 1006.7244873046875, 1055.265380859375, 1103.806396484375, 1152.3472900390625, 1200.8883056640625, 1249.42919921875, 1297.97021484375, 1346.5111083984375, 1395.0521240234375, 1443.593017578125, 1492.134033203125, 1540.6749267578125, 1589.2158203125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 5.0, 7.0, 12.0, 10.0, 23.0, 26.0, 43.0, 67.0, 106.0, 135.0, 237.0, 371.0, 523.0, 841.0, 1392.0, 2295.0, 3625.0, 6659.0, 11576.0, 22154.0, 44436.0, 96608.0, 228213.0, 599556.0, 1842686.0, 2210025.0, 729263.0, 271461.0, 112017.0, 50959.0, 25209.0, 13135.0, 7180.0, 4125.0, 2455.0, 1475.0, 894.0, 600.0, 360.0, 230.0, 153.0, 108.0, 65.0, 41.0, 30.0, 19.0, 15.0, 7.0, 7.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-130.625, -126.90234375, -123.1796875, -119.45703125, -115.734375, -112.01171875, -108.2890625, -104.56640625, -100.84375, -97.12109375, -93.3984375, -89.67578125, -85.953125, -82.23046875, -78.5078125, -74.78515625, -71.0625, -67.33984375, -63.6171875, -59.89453125, -56.171875, -52.44921875, -48.7265625, -45.00390625, -41.28125, -37.55859375, -33.8359375, -30.11328125, -26.390625, -22.66796875, -18.9453125, -15.22265625, -11.5, -7.77734375, -4.0546875, -0.33203125, 3.390625, 7.11328125, 10.8359375, 14.55859375, 18.28125, 22.00390625, 25.7265625, 29.44921875, 33.171875, 36.89453125, 40.6171875, 44.33984375, 48.0625, 51.78515625, 55.5078125, 59.23046875, 62.953125, 66.67578125, 70.3984375, 74.12109375, 77.84375, 81.56640625, 85.2890625, 89.01171875, 92.734375, 96.45703125, 100.1796875, 103.90234375, 107.625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 5.0, 3.0, 1.0, 3.0, 3.0, 5.0, 5.0, 6.0, 3.0, 2.0, 3.0, 9.0, 15.0, 18.0, 17.0, 18.0, 24.0, 16.0, 30.0, 41.0, 44.0, 36.0, 54.0, 93.0, 117.0, 254.0, 344.0, 255.0, 155.0, 69.0, 52.0, 47.0, 34.0, 38.0, 32.0, 31.0, 28.0, 21.0, 25.0, 17.0, 17.0, 11.0, 5.0, 10.0, 4.0, 2.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.5, -90.333984375, -87.16796875, -84.001953125, -80.8359375, -77.669921875, -74.50390625, -71.337890625, -68.171875, -65.005859375, -61.83984375, -58.673828125, -55.5078125, -52.341796875, -49.17578125, -46.009765625, -42.84375, -39.677734375, -36.51171875, -33.345703125, -30.1796875, -27.013671875, -23.84765625, -20.681640625, -17.515625, -14.349609375, -11.18359375, -8.017578125, -4.8515625, -1.685546875, 1.48046875, 4.646484375, 7.8125, 10.978515625, 14.14453125, 17.310546875, 20.4765625, 23.642578125, 26.80859375, 29.974609375, 33.140625, 36.306640625, 39.47265625, 42.638671875, 45.8046875, 48.970703125, 52.13671875, 55.302734375, 58.46875, 61.634765625, 64.80078125, 67.966796875, 71.1328125, 74.298828125, 77.46484375, 80.630859375, 83.796875, 86.962890625, 90.12890625, 93.294921875, 96.4609375, 99.626953125, 102.79296875, 105.958984375, 109.125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 3.0, 3.0, 11.0, 15.0, 49.0, 67.0, 78.0, 114.0, 166.0, 342.0, 498.0, 902.0, 1349.0, 2293.0, 3784.0, 6391.0, 11270.0, 19066.0, 33841.0, 59342.0, 103758.0, 180523.0, 318595.0, 658306.0, 1979736.0, 1676960.0, 563004.0, 285766.0, 164869.0, 94385.0, 53597.0, 30734.0, 17264.0, 10005.0, 5792.0, 3452.0, 1953.0, 1212.0, 691.0, 430.0, 298.0, 204.0, 132.0, 68.0, 33.0, 26.0, 20.0, 15.0, 8.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-41.8125, -40.4599609375, -39.107421875, -37.7548828125, -36.40234375, -35.0498046875, -33.697265625, -32.3447265625, -30.9921875, -29.6396484375, -28.287109375, -26.9345703125, -25.58203125, -24.2294921875, -22.876953125, -21.5244140625, -20.171875, -18.8193359375, -17.466796875, -16.1142578125, -14.76171875, -13.4091796875, -12.056640625, -10.7041015625, -9.3515625, -7.9990234375, -6.646484375, -5.2939453125, -3.94140625, -2.5888671875, -1.236328125, 0.1162109375, 1.46875, 2.8212890625, 4.173828125, 5.5263671875, 6.87890625, 8.2314453125, 9.583984375, 10.9365234375, 12.2890625, 13.6416015625, 14.994140625, 16.3466796875, 17.69921875, 19.0517578125, 20.404296875, 21.7568359375, 23.109375, 24.4619140625, 25.814453125, 27.1669921875, 28.51953125, 29.8720703125, 31.224609375, 32.5771484375, 33.9296875, 35.2822265625, 36.634765625, 37.9873046875, 39.33984375, 40.6923828125, 42.044921875, 43.3974609375, 44.75]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 11.0, 16.0, 11.0, 11.0, 16.0, 24.0, 19.0, 34.0, 32.0, 46.0, 35.0, 54.0, 42.0, 72.0, 178.0, 356.0, 401.0, 207.0, 99.0, 66.0, 36.0, 50.0, 38.0, 28.0, 22.0, 24.0, 17.0, 18.0, 18.0, 12.0, 10.0, 7.0, 5.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.75, -85.5859375, -82.421875, -79.2578125, -76.09375, -72.9296875, -69.765625, -66.6015625, -63.4375, -60.2734375, -57.109375, -53.9453125, -50.78125, -47.6171875, -44.453125, -41.2890625, -38.125, -34.9609375, -31.796875, -28.6328125, -25.46875, -22.3046875, -19.140625, -15.9765625, -12.8125, -9.6484375, -6.484375, -3.3203125, -0.15625, 3.0078125, 6.171875, 9.3359375, 12.5, 15.6640625, 18.828125, 21.9921875, 25.15625, 28.3203125, 31.484375, 34.6484375, 37.8125, 40.9765625, 44.140625, 47.3046875, 50.46875, 53.6328125, 56.796875, 59.9609375, 63.125, 66.2890625, 69.453125, 72.6171875, 75.78125, 78.9453125, 82.109375, 85.2734375, 88.4375, 91.6015625, 94.765625, 97.9296875, 101.09375, 104.2578125, 107.421875, 110.5859375, 113.75]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 5.0, 5.0, 10.0, 5.0, 12.0, 19.0, 19.0, 22.0, 30.0, 42.0, 39.0, 75.0, 103.0, 112.0, 154.0, 236.0, 313.0, 481.0, 637.0, 995.0, 1437.0, 2387.0, 4361.0, 8634.0, 19622.0, 48720.0, 165775.0, 5818959.0, 138874.0, 42751.0, 17422.0, 8106.0, 4229.0, 2309.0, 1412.0, 881.0, 549.0, 450.0, 300.0, 255.0, 160.0, 122.0, 91.0, 71.0, 59.0, 57.0, 37.0, 34.0, 9.0, 12.0, 16.0, 4.0, 11.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-154.875, -149.787109375, -144.69921875, -139.611328125, -134.5234375, -129.435546875, -124.34765625, -119.259765625, -114.171875, -109.083984375, -103.99609375, -98.908203125, -93.8203125, -88.732421875, -83.64453125, -78.556640625, -73.46875, -68.380859375, -63.29296875, -58.205078125, -53.1171875, -48.029296875, -42.94140625, -37.853515625, -32.765625, -27.677734375, -22.58984375, -17.501953125, -12.4140625, -7.326171875, -2.23828125, 2.849609375, 7.9375, 13.025390625, 18.11328125, 23.201171875, 28.2890625, 33.376953125, 38.46484375, 43.552734375, 48.640625, 53.728515625, 58.81640625, 63.904296875, 68.9921875, 74.080078125, 79.16796875, 84.255859375, 89.34375, 94.431640625, 99.51953125, 104.607421875, 109.6953125, 114.783203125, 119.87109375, 124.958984375, 130.046875, 135.134765625, 140.22265625, 145.310546875, 150.3984375, 155.486328125, 160.57421875, 165.662109375, 170.75]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 7.0, 2.0, 5.0, 6.0, 9.0, 10.0, 16.0, 12.0, 18.0, 24.0, 25.0, 28.0, 26.0, 36.0, 32.0, 41.0, 56.0, 51.0, 88.0, 275.0, 542.0, 258.0, 79.0, 46.0, 43.0, 45.0, 31.0, 30.0, 23.0, 19.0, 16.0, 20.0, 21.0, 17.0, 16.0, 16.0, 8.0, 9.0, 3.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-107.8125, -104.587890625, -101.36328125, -98.138671875, -94.9140625, -91.689453125, -88.46484375, -85.240234375, -82.015625, -78.791015625, -75.56640625, -72.341796875, -69.1171875, -65.892578125, -62.66796875, -59.443359375, -56.21875, -52.994140625, -49.76953125, -46.544921875, -43.3203125, -40.095703125, -36.87109375, -33.646484375, -30.421875, -27.197265625, -23.97265625, -20.748046875, -17.5234375, -14.298828125, -11.07421875, -7.849609375, -4.625, -1.400390625, 1.82421875, 5.048828125, 8.2734375, 11.498046875, 14.72265625, 17.947265625, 21.171875, 24.396484375, 27.62109375, 30.845703125, 34.0703125, 37.294921875, 40.51953125, 43.744140625, 46.96875, 50.193359375, 53.41796875, 56.642578125, 59.8671875, 63.091796875, 66.31640625, 69.541015625, 72.765625, 75.990234375, 79.21484375, 82.439453125, 85.6640625, 88.888671875, 92.11328125, 95.337890625, 98.5625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 7.0, 4.0, 14.0, 27.0, 63.0, 155.0, 475.0, 120.0, 61.0, 31.0, 24.0, 6.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3476.698486328125, -3386.476806640625, -3296.25537109375, -3206.03369140625, -3115.812255859375, -3025.590576171875, -2935.369140625, -2845.1474609375, -2754.92578125, -2664.7041015625, -2574.482666015625, -2484.260986328125, -2394.03955078125, -2303.81787109375, -2213.59619140625, -2123.374755859375, -2033.1533203125, -1942.9317626953125, -1852.710205078125, -1762.488525390625, -1672.26708984375, -1582.04541015625, -1491.8238525390625, -1401.602294921875, -1311.3807373046875, -1221.1591796875, -1130.9376220703125, -1040.716064453125, -950.4944458007812, -860.2728881835938, -770.05126953125, -679.8297119140625, -589.6083984375, -499.3868408203125, -409.1652526855469, -318.94366455078125, -228.72210693359375, -138.50054931640625, -48.2789306640625, 41.942626953125, 132.1641845703125, 222.38575744628906, 312.6073303222656, 402.82891845703125, 493.05047607421875, 583.2720336914062, 673.49365234375, 763.7152099609375, 853.936767578125, 944.1583251953125, 1034.3798828125, 1124.6015625, 1214.822998046875, 1305.044677734375, 1395.2662353515625, 1485.48779296875, 1575.7093505859375, 1665.930908203125, 1756.1524658203125, 1846.3740234375, 1936.595703125, 2026.817138671875, 2117.038818359375, 2207.26025390625, 2297.48193359375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 7.0, 2.0, 5.0, 14.0, 4.0, 12.0, 13.0, 17.0, 26.0, 44.0, 83.0, 329.0, 211.0, 85.0, 28.0, 22.0, 23.0, 14.0, 18.0, 10.0, 4.0, 7.0, 3.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4454.24169921875, -4326.3544921875, -4198.46728515625, -4070.580078125, -3942.693115234375, -3814.805908203125, -3686.918701171875, -3559.031494140625, -3431.14453125, -3303.25732421875, -3175.3701171875, -3047.48291015625, -2919.595947265625, -2791.708740234375, -2663.821533203125, -2535.934326171875, -2408.047119140625, -2280.159912109375, -2152.272705078125, -2024.3856201171875, -1896.49853515625, -1768.611328125, -1640.72412109375, -1512.8369140625, -1384.9498291015625, -1257.0626220703125, -1129.175537109375, -1001.288330078125, -873.4011840820312, -745.5140380859375, -617.6268310546875, -489.73968505859375, -361.852783203125, -233.9656219482422, -106.07846069335938, 21.8087158203125, 149.69586181640625, 277.5830078125, 405.47021484375, 533.3573608398438, 661.2445068359375, 789.1316528320312, 917.018798828125, 1044.906005859375, 1172.793212890625, 1300.6802978515625, 1428.5675048828125, 1556.45458984375, 1684.341796875, 1812.22900390625, 1940.1160888671875, 2068.00341796875, 2195.890380859375, 2323.777587890625, 2451.664794921875, 2579.552001953125, 2707.43896484375, 2835.326171875, 2963.21337890625, 3091.1005859375, 3218.987548828125, 3346.874755859375, 3474.761962890625, 3602.649169921875, 3730.536376953125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 11.0, 5.0, 20.0, 33.0, 23.0, 30.0, 48.0, 75.0, 80.0, 159.0, 205.0, 309.0, 468.0, 726.0, 1278.0, 1900.0, 3398.0, 6292.0, 12590.0, 28005.0, 77626.0, 384082.0, 3326240.0, 233234.0, 64804.0, 25474.0, 11865.0, 6237.0, 3406.0, 2064.0, 1273.0, 800.0, 520.0, 366.0, 203.0, 149.0, 86.0, 71.0, 31.0, 26.0, 26.0, 14.0, 9.0, 4.0, 5.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-12.1796875, -11.8035888671875, -11.427490234375, -11.0513916015625, -10.67529296875, -10.2991943359375, -9.923095703125, -9.5469970703125, -9.1708984375, -8.7947998046875, -8.418701171875, -8.0426025390625, -7.66650390625, -7.2904052734375, -6.914306640625, -6.5382080078125, -6.162109375, -5.7860107421875, -5.409912109375, -5.0338134765625, -4.65771484375, -4.2816162109375, -3.905517578125, -3.5294189453125, -3.1533203125, -2.7772216796875, -2.401123046875, -2.0250244140625, -1.64892578125, -1.2728271484375, -0.896728515625, -0.5206298828125, -0.14453125, 0.2315673828125, 0.607666015625, 0.9837646484375, 1.35986328125, 1.7359619140625, 2.112060546875, 2.4881591796875, 2.8642578125, 3.2403564453125, 3.616455078125, 3.9925537109375, 4.36865234375, 4.7447509765625, 5.120849609375, 5.4969482421875, 5.873046875, 6.2491455078125, 6.625244140625, 7.0013427734375, 7.37744140625, 7.7535400390625, 8.129638671875, 8.5057373046875, 8.8818359375, 9.2579345703125, 9.634033203125, 10.0101318359375, 10.38623046875, 10.7623291015625, 11.138427734375, 11.5145263671875, 11.890625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 3.0, 2.0, 6.0, 18.0, 15.0, 21.0, 25.0, 48.0, 90.0, 349.0, 211.0, 63.0, 32.0, 25.0, 25.0, 13.0, 7.0, 9.0, 7.0, 8.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.15234375, -2.080413818359375, -2.00848388671875, -1.936553955078125, -1.8646240234375, -1.792694091796875, -1.72076416015625, -1.648834228515625, -1.576904296875, -1.504974365234375, -1.43304443359375, -1.361114501953125, -1.2891845703125, -1.217254638671875, -1.14532470703125, -1.073394775390625, -1.00146484375, -0.929534912109375, -0.85760498046875, -0.785675048828125, -0.7137451171875, -0.641815185546875, -0.56988525390625, -0.497955322265625, -0.426025390625, -0.354095458984375, -0.28216552734375, -0.210235595703125, -0.1383056640625, -0.066375732421875, 0.00555419921875, 0.077484130859375, 0.1494140625, 0.221343994140625, 0.29327392578125, 0.365203857421875, 0.4371337890625, 0.509063720703125, 0.58099365234375, 0.652923583984375, 0.724853515625, 0.796783447265625, 0.86871337890625, 0.940643310546875, 1.0125732421875, 1.084503173828125, 1.15643310546875, 1.228363037109375, 1.30029296875, 1.372222900390625, 1.44415283203125, 1.516082763671875, 1.5880126953125, 1.659942626953125, 1.73187255859375, 1.803802490234375, 1.875732421875, 1.947662353515625, 2.01959228515625, 2.091522216796875, 2.1634521484375, 2.235382080078125, 2.30731201171875, 2.379241943359375, 2.451171875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 6.0, 8.0, 15.0, 16.0, 37.0, 41.0, 78.0, 116.0, 256.0, 743.0, 2384.0, 11446.0, 112565.0, 3310735.0, 717274.0, 31594.0, 4791.0, 1204.0, 406.0, 204.0, 107.0, 76.0, 43.0, 34.0, 24.0, 16.0, 20.0, 8.0, 9.0, 6.0, 6.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.921875, -20.218994140625, -19.51611328125, -18.813232421875, -18.1103515625, -17.407470703125, -16.70458984375, -16.001708984375, -15.298828125, -14.595947265625, -13.89306640625, -13.190185546875, -12.4873046875, -11.784423828125, -11.08154296875, -10.378662109375, -9.67578125, -8.972900390625, -8.27001953125, -7.567138671875, -6.8642578125, -6.161376953125, -5.45849609375, -4.755615234375, -4.052734375, -3.349853515625, -2.64697265625, -1.944091796875, -1.2412109375, -0.538330078125, 0.16455078125, 0.867431640625, 1.5703125, 2.273193359375, 2.97607421875, 3.678955078125, 4.3818359375, 5.084716796875, 5.78759765625, 6.490478515625, 7.193359375, 7.896240234375, 8.59912109375, 9.302001953125, 10.0048828125, 10.707763671875, 11.41064453125, 12.113525390625, 12.81640625, 13.519287109375, 14.22216796875, 14.925048828125, 15.6279296875, 16.330810546875, 17.03369140625, 17.736572265625, 18.439453125, 19.142333984375, 19.84521484375, 20.548095703125, 21.2509765625, 21.953857421875, 22.65673828125, 23.359619140625, 24.0625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 8.0, 11.0, 7.0, 16.0, 26.0, 27.0, 39.0, 59.0, 60.0, 71.0, 124.0, 145.0, 174.0, 256.0, 377.0, 476.0, 538.0, 447.0, 313.0, 243.0, 184.0, 129.0, 79.0, 66.0, 52.0, 29.0, 29.0, 19.0, 12.0, 11.0, 8.0, 4.0, 5.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.359375, -3.264312744140625, -3.16925048828125, -3.074188232421875, -2.9791259765625, -2.884063720703125, -2.78900146484375, -2.693939208984375, -2.598876953125, -2.503814697265625, -2.40875244140625, -2.313690185546875, -2.2186279296875, -2.123565673828125, -2.02850341796875, -1.933441162109375, -1.83837890625, -1.743316650390625, -1.64825439453125, -1.553192138671875, -1.4581298828125, -1.363067626953125, -1.26800537109375, -1.172943115234375, -1.077880859375, -0.982818603515625, -0.88775634765625, -0.792694091796875, -0.6976318359375, -0.602569580078125, -0.50750732421875, -0.412445068359375, -0.3173828125, -0.222320556640625, -0.12725830078125, -0.032196044921875, 0.0628662109375, 0.157928466796875, 0.25299072265625, 0.348052978515625, 0.443115234375, 0.538177490234375, 0.63323974609375, 0.728302001953125, 0.8233642578125, 0.918426513671875, 1.01348876953125, 1.108551025390625, 1.20361328125, 1.298675537109375, 1.39373779296875, 1.488800048828125, 1.5838623046875, 1.678924560546875, 1.77398681640625, 1.869049072265625, 1.964111328125, 2.059173583984375, 2.15423583984375, 2.249298095703125, 2.3443603515625, 2.439422607421875, 2.53448486328125, 2.629547119140625, 2.724609375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 6.0, 7.0, 10.0, 23.0, 31.0, 77.0, 138.0, 176.0, 224.0, 155.0, 81.0, 30.0, 23.0, 8.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.34321212768555, -36.83087158203125, -35.31853103637695, -33.806190490722656, -32.29384994506836, -30.781509399414062, -29.269168853759766, -27.75682830810547, -26.244487762451172, -24.732147216796875, -23.219806671142578, -21.70746612548828, -20.195125579833984, -18.682785034179688, -17.17044448852539, -15.65810489654541, -14.14576530456543, -12.633424758911133, -11.121084213256836, -9.608743667602539, -8.096403121948242, -6.5840630531311035, -5.071722984313965, -3.559382438659668, -2.047041893005371, -0.5347014665603638, 0.9776389598846436, 2.4899792671203613, 4.002319812774658, 5.514660358428955, 7.027000427246094, 8.53934097290039, 10.051681518554688, 11.564022064208984, 13.076362609863281, 14.588703155517578, 16.101043701171875, 17.613384246826172, 19.12572479248047, 20.638065338134766, 22.150405883789062, 23.66274642944336, 25.175086975097656, 26.687427520751953, 28.19976806640625, 29.712108612060547, 31.224449157714844, 32.73678970336914, 34.24913024902344, 35.761470794677734, 37.27381134033203, 38.78615188598633, 40.298492431640625, 41.81083297729492, 43.32317352294922, 44.835514068603516, 46.34785079956055, 47.860191345214844, 49.37253189086914, 50.88487243652344, 52.397212982177734, 53.90955352783203, 55.42189407348633, 56.934234619140625, 58.44657516479492]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 2.0, 4.0, 8.0, 4.0, 7.0, 8.0, 12.0, 13.0, 17.0, 18.0, 33.0, 28.0, 31.0, 41.0, 54.0, 42.0, 55.0, 50.0, 56.0, 49.0, 53.0, 54.0, 44.0, 46.0, 45.0, 38.0, 28.0, 32.0, 27.0, 16.0, 27.0, 6.0, 17.0, 9.0, 9.0, 10.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.040180206298828, -13.459205627441406, -12.8782320022583, -12.297257423400879, -11.716282844543457, -11.135309219360352, -10.55433464050293, -9.973360061645508, -9.392385482788086, -8.811410903930664, -8.230437278747559, -7.649462699890137, -7.068488121032715, -6.487514019012451, -5.9065399169921875, -5.325565338134766, -4.74459171295166, -4.1636176109313965, -3.5826430320739746, -3.001668930053711, -2.420694589614868, -1.8397202491760254, -1.2587461471557617, -0.6777715682983398, -0.09679746627807617, 0.4841768145561218, 1.0651510953903198, 1.646125316619873, 2.227099657058716, 2.8080739974975586, 3.3890480995178223, 3.970022678375244, 4.550996780395508, 5.1319708824157715, 5.712945461273193, 6.293919563293457, 6.874894142150879, 7.455868244171143, 8.036842346191406, 8.617816925048828, 9.19879150390625, 9.779766082763672, 10.360739707946777, 10.9417142868042, 11.522688865661621, 12.103662490844727, 12.684637069702148, 13.26561164855957, 13.846585273742676, 14.427559852600098, 15.008533477783203, 15.589508056640625, 16.170482635498047, 16.75145721435547, 17.33243179321289, 17.913406372070312, 18.4943790435791, 19.075353622436523, 19.656328201293945, 20.237300872802734, 20.818275451660156, 21.399250030517578, 21.980224609375, 22.561199188232422, 23.142173767089844]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 7.0, 12.0, 3.0, 19.0, 16.0, 37.0, 38.0, 51.0, 99.0, 153.0, 232.0, 342.0, 590.0, 1086.0, 1917.0, 4021.0, 9189.0, 25270.0, 121070.0, 745821.0, 99534.0, 22547.0, 8342.0, 3699.0, 1874.0, 1017.0, 596.0, 353.0, 198.0, 134.0, 89.0, 72.0, 44.0, 30.0, 15.0, 13.0, 11.0, 7.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.640625, -16.111572265625, -15.58251953125, -15.053466796875, -14.5244140625, -13.995361328125, -13.46630859375, -12.937255859375, -12.408203125, -11.879150390625, -11.35009765625, -10.821044921875, -10.2919921875, -9.762939453125, -9.23388671875, -8.704833984375, -8.17578125, -7.646728515625, -7.11767578125, -6.588623046875, -6.0595703125, -5.530517578125, -5.00146484375, -4.472412109375, -3.943359375, -3.414306640625, -2.88525390625, -2.356201171875, -1.8271484375, -1.298095703125, -0.76904296875, -0.239990234375, 0.2890625, 0.818115234375, 1.34716796875, 1.876220703125, 2.4052734375, 2.934326171875, 3.46337890625, 3.992431640625, 4.521484375, 5.050537109375, 5.57958984375, 6.108642578125, 6.6376953125, 7.166748046875, 7.69580078125, 8.224853515625, 8.75390625, 9.282958984375, 9.81201171875, 10.341064453125, 10.8701171875, 11.399169921875, 11.92822265625, 12.457275390625, 12.986328125, 13.515380859375, 14.04443359375, 14.573486328125, 15.1025390625, 15.631591796875, 16.16064453125, 16.689697265625, 17.21875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 3.0, 3.0, 6.0, 4.0, 11.0, 11.0, 14.0, 16.0, 32.0, 49.0, 86.0, 146.0, 212.0, 157.0, 88.0, 54.0, 26.0, 21.0, 15.0, 11.0, 9.0, 4.0, 8.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.140625, -2.068328857421875, -1.99603271484375, -1.923736572265625, -1.8514404296875, -1.779144287109375, -1.70684814453125, -1.634552001953125, -1.562255859375, -1.489959716796875, -1.41766357421875, -1.345367431640625, -1.2730712890625, -1.200775146484375, -1.12847900390625, -1.056182861328125, -0.98388671875, -0.911590576171875, -0.83929443359375, -0.766998291015625, -0.6947021484375, -0.622406005859375, -0.55010986328125, -0.477813720703125, -0.405517578125, -0.333221435546875, -0.26092529296875, -0.188629150390625, -0.1163330078125, -0.044036865234375, 0.02825927734375, 0.100555419921875, 0.1728515625, 0.245147705078125, 0.31744384765625, 0.389739990234375, 0.4620361328125, 0.534332275390625, 0.60662841796875, 0.678924560546875, 0.751220703125, 0.823516845703125, 0.89581298828125, 0.968109130859375, 1.0404052734375, 1.112701416015625, 1.18499755859375, 1.257293701171875, 1.32958984375, 1.401885986328125, 1.47418212890625, 1.546478271484375, 1.6187744140625, 1.691070556640625, 1.76336669921875, 1.835662841796875, 1.907958984375, 1.980255126953125, 2.05255126953125, 2.124847412109375, 2.1971435546875, 2.269439697265625, 2.34173583984375, 2.414031982421875, 2.486328125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 2.0, 3.0, 6.0, 6.0, 9.0, 11.0, 16.0, 11.0, 16.0, 43.0, 49.0, 71.0, 114.0, 150.0, 244.0, 510.0, 1131.0, 3210.0, 13183.0, 187934.0, 803340.0, 29807.0, 5306.0, 1739.0, 720.0, 360.0, 196.0, 106.0, 69.0, 42.0, 45.0, 31.0, 23.0, 18.0, 2.0, 8.0, 8.0, 6.0, 1.0, 4.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.0625, -26.24755859375, -25.4326171875, -24.61767578125, -23.802734375, -22.98779296875, -22.1728515625, -21.35791015625, -20.54296875, -19.72802734375, -18.9130859375, -18.09814453125, -17.283203125, -16.46826171875, -15.6533203125, -14.83837890625, -14.0234375, -13.20849609375, -12.3935546875, -11.57861328125, -10.763671875, -9.94873046875, -9.1337890625, -8.31884765625, -7.50390625, -6.68896484375, -5.8740234375, -5.05908203125, -4.244140625, -3.42919921875, -2.6142578125, -1.79931640625, -0.984375, -0.16943359375, 0.6455078125, 1.46044921875, 2.275390625, 3.09033203125, 3.9052734375, 4.72021484375, 5.53515625, 6.35009765625, 7.1650390625, 7.97998046875, 8.794921875, 9.60986328125, 10.4248046875, 11.23974609375, 12.0546875, 12.86962890625, 13.6845703125, 14.49951171875, 15.314453125, 16.12939453125, 16.9443359375, 17.75927734375, 18.57421875, 19.38916015625, 20.2041015625, 21.01904296875, 21.833984375, 22.64892578125, 23.4638671875, 24.27880859375, 25.09375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 6.0, 10.0, 8.0, 14.0, 18.0, 22.0, 17.0, 25.0, 23.0, 37.0, 35.0, 42.0, 33.0, 39.0, 40.0, 39.0, 38.0, 45.0, 45.0, 43.0, 35.0, 37.0, 33.0, 37.0, 35.0, 35.0, 30.0, 26.0, 21.0, 23.0, 14.0, 21.0, 22.0, 15.0, 10.0, 6.0, 4.0, 6.0, 6.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.5625, -7.3349609375, -7.107421875, -6.8798828125, -6.65234375, -6.4248046875, -6.197265625, -5.9697265625, -5.7421875, -5.5146484375, -5.287109375, -5.0595703125, -4.83203125, -4.6044921875, -4.376953125, -4.1494140625, -3.921875, -3.6943359375, -3.466796875, -3.2392578125, -3.01171875, -2.7841796875, -2.556640625, -2.3291015625, -2.1015625, -1.8740234375, -1.646484375, -1.4189453125, -1.19140625, -0.9638671875, -0.736328125, -0.5087890625, -0.28125, -0.0537109375, 0.173828125, 0.4013671875, 0.62890625, 0.8564453125, 1.083984375, 1.3115234375, 1.5390625, 1.7666015625, 1.994140625, 2.2216796875, 2.44921875, 2.6767578125, 2.904296875, 3.1318359375, 3.359375, 3.5869140625, 3.814453125, 4.0419921875, 4.26953125, 4.4970703125, 4.724609375, 4.9521484375, 5.1796875, 5.4072265625, 5.634765625, 5.8623046875, 6.08984375, 6.3173828125, 6.544921875, 6.7724609375, 7.0]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 2.0, 2.0, 6.0, 8.0, 16.0, 23.0, 23.0, 40.0, 37.0, 72.0, 95.0, 124.0, 192.0, 348.0, 647.0, 1294.0, 3357.0, 13182.0, 200029.0, 796535.0, 23853.0, 4987.0, 1726.0, 784.0, 404.0, 264.0, 159.0, 90.0, 67.0, 63.0, 30.0, 28.0, 13.0, 17.0, 10.0, 7.0, 8.0, 1.0, 3.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.234375, -29.37451171875, -28.5146484375, -27.65478515625, -26.794921875, -25.93505859375, -25.0751953125, -24.21533203125, -23.35546875, -22.49560546875, -21.6357421875, -20.77587890625, -19.916015625, -19.05615234375, -18.1962890625, -17.33642578125, -16.4765625, -15.61669921875, -14.7568359375, -13.89697265625, -13.037109375, -12.17724609375, -11.3173828125, -10.45751953125, -9.59765625, -8.73779296875, -7.8779296875, -7.01806640625, -6.158203125, -5.29833984375, -4.4384765625, -3.57861328125, -2.71875, -1.85888671875, -0.9990234375, -0.13916015625, 0.720703125, 1.58056640625, 2.4404296875, 3.30029296875, 4.16015625, 5.02001953125, 5.8798828125, 6.73974609375, 7.599609375, 8.45947265625, 9.3193359375, 10.17919921875, 11.0390625, 11.89892578125, 12.7587890625, 13.61865234375, 14.478515625, 15.33837890625, 16.1982421875, 17.05810546875, 17.91796875, 18.77783203125, 19.6376953125, 20.49755859375, 21.357421875, 22.21728515625, 23.0771484375, 23.93701171875, 24.796875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 7.0, 11.0, 11.0, 12.0, 16.0, 18.0, 22.0, 33.0, 39.0, 34.0, 63.0, 83.0, 80.0, 73.0, 59.0, 61.0, 60.0, 78.0, 47.0, 34.0, 35.0, 20.0, 14.0, 18.0, 12.0, 8.0, 12.0, 8.0, 2.0, 6.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000308990478515625, -0.00029661133885383606, -0.0002842321991920471, -0.0002718530595302582, -0.00025947391986846924, -0.0002470947802066803, -0.00023471564054489136, -0.00022233650088310242, -0.00020995736122131348, -0.00019757822155952454, -0.0001851990818977356, -0.00017281994223594666, -0.00016044080257415771, -0.00014806166291236877, -0.00013568252325057983, -0.0001233033835887909, -0.00011092424392700195, -9.854510426521301e-05, -8.616596460342407e-05, -7.378682494163513e-05, -6.140768527984619e-05, -4.902854561805725e-05, -3.664940595626831e-05, -2.427026629447937e-05, -1.189112663269043e-05, 4.880130290985107e-07, 1.2867152690887451e-05, 2.524629235267639e-05, 3.762543201446533e-05, 5.000457167625427e-05, 6.238371133804321e-05, 7.476285099983215e-05, 8.71419906616211e-05, 9.952113032341003e-05, 0.00011190026998519897, 0.00012427940964698792, 0.00013665854930877686, 0.0001490376889705658, 0.00016141682863235474, 0.00017379596829414368, 0.00018617510795593262, 0.00019855424761772156, 0.0002109333872795105, 0.00022331252694129944, 0.00023569166660308838, 0.0002480708062648773, 0.00026044994592666626, 0.0002728290855884552, 0.00028520822525024414, 0.0002975873649120331, 0.000309966504573822, 0.00032234564423561096, 0.0003347247838973999, 0.00034710392355918884, 0.0003594830632209778, 0.0003718622028827667, 0.00038424134254455566, 0.0003966204822063446, 0.00040899962186813354, 0.0004213787615299225, 0.0004337579011917114, 0.00044613704085350037, 0.0004585161805152893, 0.00047089532017707825, 0.0004832744598388672]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 8.0, 3.0, 2.0, 10.0, 10.0, 8.0, 21.0, 26.0, 42.0, 66.0, 100.0, 202.0, 380.0, 866.0, 2336.0, 8424.0, 62663.0, 893032.0, 67357.0, 8878.0, 2367.0, 897.0, 380.0, 185.0, 118.0, 74.0, 40.0, 23.0, 14.0, 11.0, 5.0, 5.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.078125, -19.32080078125, -18.5634765625, -17.80615234375, -17.048828125, -16.29150390625, -15.5341796875, -14.77685546875, -14.01953125, -13.26220703125, -12.5048828125, -11.74755859375, -10.990234375, -10.23291015625, -9.4755859375, -8.71826171875, -7.9609375, -7.20361328125, -6.4462890625, -5.68896484375, -4.931640625, -4.17431640625, -3.4169921875, -2.65966796875, -1.90234375, -1.14501953125, -0.3876953125, 0.36962890625, 1.126953125, 1.88427734375, 2.6416015625, 3.39892578125, 4.15625, 4.91357421875, 5.6708984375, 6.42822265625, 7.185546875, 7.94287109375, 8.7001953125, 9.45751953125, 10.21484375, 10.97216796875, 11.7294921875, 12.48681640625, 13.244140625, 14.00146484375, 14.7587890625, 15.51611328125, 16.2734375, 17.03076171875, 17.7880859375, 18.54541015625, 19.302734375, 20.06005859375, 20.8173828125, 21.57470703125, 22.33203125, 23.08935546875, 23.8466796875, 24.60400390625, 25.361328125, 26.11865234375, 26.8759765625, 27.63330078125, 28.390625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 8.0, 3.0, 10.0, 7.0, 17.0, 8.0, 25.0, 31.0, 55.0, 78.0, 107.0, 110.0, 153.0, 100.0, 88.0, 53.0, 38.0, 27.0, 18.0, 15.0, 10.0, 11.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-12.4765625, -12.1422119140625, -11.807861328125, -11.4735107421875, -11.13916015625, -10.8048095703125, -10.470458984375, -10.1361083984375, -9.8017578125, -9.4674072265625, -9.133056640625, -8.7987060546875, -8.46435546875, -8.1300048828125, -7.795654296875, -7.4613037109375, -7.126953125, -6.7926025390625, -6.458251953125, -6.1239013671875, -5.78955078125, -5.4552001953125, -5.120849609375, -4.7864990234375, -4.4521484375, -4.1177978515625, -3.783447265625, -3.4490966796875, -3.11474609375, -2.7803955078125, -2.446044921875, -2.1116943359375, -1.77734375, -1.4429931640625, -1.108642578125, -0.7742919921875, -0.43994140625, -0.1055908203125, 0.228759765625, 0.5631103515625, 0.8974609375, 1.2318115234375, 1.566162109375, 1.9005126953125, 2.23486328125, 2.5692138671875, 2.903564453125, 3.2379150390625, 3.572265625, 3.9066162109375, 4.240966796875, 4.5753173828125, 4.90966796875, 5.2440185546875, 5.578369140625, 5.9127197265625, 6.2470703125, 6.5814208984375, 6.915771484375, 7.2501220703125, 7.58447265625, 7.9188232421875, 8.253173828125, 8.5875244140625, 8.921875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 5.0, 2.0, 6.0, 15.0, 29.0, 81.0, 244.0, 390.0, 144.0, 32.0, 20.0, 12.0, 12.0, 7.0, 4.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.83003234863281, -72.04130554199219, -66.2525863647461, -60.463863372802734, -54.675140380859375, -48.886417388916016, -43.097694396972656, -37.3089714050293, -31.520248413085938, -25.731525421142578, -19.94280242919922, -14.15407943725586, -8.3653564453125, -2.5766334533691406, 3.2120895385742188, 9.000812530517578, 14.789535522460938, 20.578258514404297, 26.366981506347656, 32.155704498291016, 37.944427490234375, 43.733150482177734, 49.521873474121094, 55.31059646606445, 61.09931945800781, 66.88804626464844, 72.67676544189453, 78.46548461914062, 84.25421142578125, 90.04293823242188, 95.83165740966797, 101.62037658691406, 107.40911865234375, 113.19784545898438, 118.98656463623047, 124.77528381347656, 130.5640106201172, 136.3527374267578, 142.14144897460938, 147.93017578125, 153.71890258789062, 159.50762939453125, 165.29635620117188, 171.08506774902344, 176.87379455566406, 182.6625213623047, 188.45123291015625, 194.23995971679688, 200.0286865234375, 205.81741333007812, 211.60614013671875, 217.3948516845703, 223.18357849121094, 228.97230529785156, 234.76101684570312, 240.54974365234375, 246.33847045898438, 252.127197265625, 257.9159240722656, 263.70465087890625, 269.49334716796875, 275.2820739746094, 281.07080078125, 286.8595275878906, 292.64825439453125]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 4.0, 4.0, 2.0, 6.0, 10.0, 12.0, 15.0, 17.0, 27.0, 48.0, 69.0, 115.0, 112.0, 141.0, 134.0, 70.0, 52.0, 48.0, 28.0, 25.0, 11.0, 8.0, 8.0, 5.0, 8.0, 8.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-139.07284545898438, -135.01824951171875, -130.9636688232422, -126.90907287597656, -122.85448455810547, -118.79989624023438, -114.74530029296875, -110.69071197509766, -106.63612365722656, -102.58153533935547, -98.52693939208984, -94.47235107421875, -90.41776275634766, -86.36317443847656, -82.30857849121094, -78.25399017333984, -74.19939422607422, -70.14480590820312, -66.0902099609375, -62.035621643066406, -57.98103332519531, -53.92644119262695, -49.871849060058594, -45.8172607421875, -41.76266860961914, -37.70807647705078, -33.65348815917969, -29.598896026611328, -25.5443058013916, -21.489715576171875, -17.435123443603516, -13.380533218383789, -9.325942993164062, -5.271352291107178, -1.216761589050293, 2.83782958984375, 6.892419815063477, 10.947010040283203, 15.001602172851562, 19.05619239807129, 23.110782623291016, 27.165372848510742, 31.21996307373047, 35.27455520629883, 39.32914733886719, 43.38373565673828, 47.43832778930664, 51.492919921875, 55.547508239746094, 59.60210037231445, 63.65668869018555, 67.7112808227539, 71.765869140625, 75.82046508789062, 79.87505340576172, 83.92964172363281, 87.98423767089844, 92.03882598876953, 96.09342193603516, 100.14801025390625, 104.20259857177734, 108.25718688964844, 112.31178283691406, 116.36637115478516, 120.42095947265625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 4.0, 11.0, 9.0, 22.0, 40.0, 73.0, 209.0, 651.0, 2825.0, 18310.0, 2748162.0, 1402296.0, 17867.0, 2750.0, 642.0, 231.0, 72.0, 31.0, 26.0, 12.0, 10.0, 8.0, 3.0, 1.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.25, -69.4697265625, -66.689453125, -63.9091796875, -61.12890625, -58.3486328125, -55.568359375, -52.7880859375, -50.0078125, -47.2275390625, -44.447265625, -41.6669921875, -38.88671875, -36.1064453125, -33.326171875, -30.5458984375, -27.765625, -24.9853515625, -22.205078125, -19.4248046875, -16.64453125, -13.8642578125, -11.083984375, -8.3037109375, -5.5234375, -2.7431640625, 0.037109375, 2.8173828125, 5.59765625, 8.3779296875, 11.158203125, 13.9384765625, 16.71875, 19.4990234375, 22.279296875, 25.0595703125, 27.83984375, 30.6201171875, 33.400390625, 36.1806640625, 38.9609375, 41.7412109375, 44.521484375, 47.3017578125, 50.08203125, 52.8623046875, 55.642578125, 58.4228515625, 61.203125, 63.9833984375, 66.763671875, 69.5439453125, 72.32421875, 75.1044921875, 77.884765625, 80.6650390625, 83.4453125, 86.2255859375, 89.005859375, 91.7861328125, 94.56640625, 97.3466796875, 100.126953125, 102.9072265625, 105.6875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 0.0, 7.0, 5.0, 5.0, 9.0, 7.0, 10.0, 17.0, 24.0, 35.0, 35.0, 56.0, 58.0, 84.0, 100.0, 110.0, 101.0, 84.0, 59.0, 37.0, 36.0, 23.0, 14.0, 17.0, 12.0, 6.0, 8.0, 6.0, 5.0, 7.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6279296875, -1.580413818359375, -1.53289794921875, -1.485382080078125, -1.4378662109375, -1.390350341796875, -1.34283447265625, -1.295318603515625, -1.247802734375, -1.200286865234375, -1.15277099609375, -1.105255126953125, -1.0577392578125, -1.010223388671875, -0.96270751953125, -0.915191650390625, -0.86767578125, -0.820159912109375, -0.77264404296875, -0.725128173828125, -0.6776123046875, -0.630096435546875, -0.58258056640625, -0.535064697265625, -0.487548828125, -0.440032958984375, -0.39251708984375, -0.345001220703125, -0.2974853515625, -0.249969482421875, -0.20245361328125, -0.154937744140625, -0.107421875, -0.059906005859375, -0.01239013671875, 0.035125732421875, 0.0826416015625, 0.130157470703125, 0.17767333984375, 0.225189208984375, 0.272705078125, 0.320220947265625, 0.36773681640625, 0.415252685546875, 0.4627685546875, 0.510284423828125, 0.55780029296875, 0.605316162109375, 0.65283203125, 0.700347900390625, 0.74786376953125, 0.795379638671875, 0.8428955078125, 0.890411376953125, 0.93792724609375, 0.985443115234375, 1.032958984375, 1.080474853515625, 1.12799072265625, 1.175506591796875, 1.2230224609375, 1.270538330078125, 1.31805419921875, 1.365570068359375, 1.4130859375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 3.0, 4.0, 4.0, 4.0, 7.0, 14.0, 11.0, 21.0, 20.0, 25.0, 27.0, 65.0, 113.0, 206.0, 541.0, 1649.0, 6377.0, 42899.0, 1173556.0, 2898740.0, 59422.0, 7687.0, 1764.0, 588.0, 226.0, 96.0, 64.0, 46.0, 21.0, 17.0, 13.0, 13.0, 7.0, 8.0, 3.0, 9.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.5, -40.021484375, -38.54296875, -37.064453125, -35.5859375, -34.107421875, -32.62890625, -31.150390625, -29.671875, -28.193359375, -26.71484375, -25.236328125, -23.7578125, -22.279296875, -20.80078125, -19.322265625, -17.84375, -16.365234375, -14.88671875, -13.408203125, -11.9296875, -10.451171875, -8.97265625, -7.494140625, -6.015625, -4.537109375, -3.05859375, -1.580078125, -0.1015625, 1.376953125, 2.85546875, 4.333984375, 5.8125, 7.291015625, 8.76953125, 10.248046875, 11.7265625, 13.205078125, 14.68359375, 16.162109375, 17.640625, 19.119140625, 20.59765625, 22.076171875, 23.5546875, 25.033203125, 26.51171875, 27.990234375, 29.46875, 30.947265625, 32.42578125, 33.904296875, 35.3828125, 36.861328125, 38.33984375, 39.818359375, 41.296875, 42.775390625, 44.25390625, 45.732421875, 47.2109375, 48.689453125, 50.16796875, 51.646484375, 53.125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 1.0, 8.0, 9.0, 4.0, 8.0, 12.0, 8.0, 8.0, 8.0, 27.0, 31.0, 42.0, 43.0, 61.0, 61.0, 117.0, 161.0, 237.0, 447.0, 987.0, 705.0, 314.0, 216.0, 154.0, 89.0, 65.0, 46.0, 39.0, 34.0, 26.0, 19.0, 19.0, 13.0, 11.0, 7.0, 8.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.732421875, -2.646697998046875, -2.56097412109375, -2.475250244140625, -2.3895263671875, -2.303802490234375, -2.21807861328125, -2.132354736328125, -2.046630859375, -1.960906982421875, -1.87518310546875, -1.789459228515625, -1.7037353515625, -1.618011474609375, -1.53228759765625, -1.446563720703125, -1.36083984375, -1.275115966796875, -1.18939208984375, -1.103668212890625, -1.0179443359375, -0.932220458984375, -0.84649658203125, -0.760772705078125, -0.675048828125, -0.589324951171875, -0.50360107421875, -0.417877197265625, -0.3321533203125, -0.246429443359375, -0.16070556640625, -0.074981689453125, 0.0107421875, 0.096466064453125, 0.18218994140625, 0.267913818359375, 0.3536376953125, 0.439361572265625, 0.52508544921875, 0.610809326171875, 0.696533203125, 0.782257080078125, 0.86798095703125, 0.953704833984375, 1.0394287109375, 1.125152587890625, 1.21087646484375, 1.296600341796875, 1.38232421875, 1.468048095703125, 1.55377197265625, 1.639495849609375, 1.7252197265625, 1.810943603515625, 1.89666748046875, 1.982391357421875, 2.068115234375, 2.153839111328125, 2.23956298828125, 2.325286865234375, 2.4110107421875, 2.496734619140625, 2.58245849609375, 2.668182373046875, 2.75390625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 10.0, 23.0, 67.0, 227.0, 380.0, 216.0, 63.0, 12.0, 7.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.6811752319336, -118.24066162109375, -115.80015563964844, -113.3596420288086, -110.91913604736328, -108.47862243652344, -106.03811645507812, -103.59760284423828, -101.15708923339844, -98.7165756225586, -96.27606964111328, -93.83555603027344, -91.39505004882812, -88.95453643798828, -86.51403045654297, -84.07351684570312, -81.63301086425781, -79.19249725341797, -76.75199127197266, -74.31147766113281, -71.8709716796875, -69.43045806884766, -66.98995208740234, -64.5494384765625, -62.10892868041992, -59.668418884277344, -57.227909088134766, -54.78739929199219, -52.346885681152344, -49.90637969970703, -47.46586608886719, -45.02535629272461, -42.58485412597656, -40.144344329833984, -37.703834533691406, -35.26332473754883, -32.82281494140625, -30.38230323791504, -27.941791534423828, -25.50128173828125, -23.060771942138672, -20.620262145996094, -18.179752349853516, -15.739240646362305, -13.298730850219727, -10.858221054077148, -8.417710304260254, -5.977199554443359, -3.5366897583007812, -1.096179485321045, 1.3443307876586914, 3.7848410606384277, 6.225351333618164, 8.665861129760742, 11.106371879577637, 13.546882629394531, 15.98739242553711, 18.427902221679688, 20.868412017822266, 23.308923721313477, 25.749433517456055, 28.189943313598633, 30.630455017089844, 33.07096481323242, 35.511474609375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 4.0, 7.0, 9.0, 7.0, 3.0, 19.0, 20.0, 29.0, 31.0, 34.0, 40.0, 75.0, 69.0, 71.0, 61.0, 61.0, 75.0, 60.0, 57.0, 46.0, 41.0, 27.0, 25.0, 27.0, 26.0, 18.0, 17.0, 5.0, 8.0, 6.0, 0.0, 4.0, 6.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.11478042602539, -16.550708770751953, -15.986639022827148, -15.422568321228027, -14.858497619628906, -14.294426918029785, -13.730356216430664, -13.166285514831543, -12.602214813232422, -12.0381441116333, -11.47407341003418, -10.910002708435059, -10.345932006835938, -9.781861305236816, -9.217790603637695, -8.653719902038574, -8.089649200439453, -7.525578498840332, -6.961507797241211, -6.39743709564209, -5.833366394042969, -5.269295692443848, -4.705224990844727, -4.1411542892456055, -3.5770835876464844, -3.0130128860473633, -2.448942184448242, -1.884871482849121, -1.32080078125, -0.7567300796508789, -0.1926593780517578, 0.3714113235473633, 0.9354820251464844, 1.4995527267456055, 2.0636234283447266, 2.6276941299438477, 3.1917648315429688, 3.75583553314209, 4.319906234741211, 4.883976936340332, 5.448047637939453, 6.012118339538574, 6.576189041137695, 7.140259742736816, 7.7043304443359375, 8.268401145935059, 8.83247184753418, 9.3965425491333, 9.960613250732422, 10.524683952331543, 11.088754653930664, 11.652825355529785, 12.216896057128906, 12.780966758728027, 13.345037460327148, 13.90910816192627, 14.47317886352539, 15.037249565124512, 15.601320266723633, 16.165390014648438, 16.729461669921875, 17.293533325195312, 17.857603073120117, 18.421672821044922, 18.98574447631836]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 4.0, 6.0, 5.0, 6.0, 12.0, 16.0, 11.0, 30.0, 27.0, 49.0, 71.0, 100.0, 161.0, 240.0, 411.0, 676.0, 1221.0, 2285.0, 4989.0, 12407.0, 38088.0, 210411.0, 643607.0, 94676.0, 23048.0, 8162.0, 3628.0, 1794.0, 958.0, 558.0, 311.0, 188.0, 122.0, 91.0, 62.0, 45.0, 18.0, 17.0, 15.0, 5.0, 10.0, 8.0, 3.0, 1.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 3.0], "bins": [-29.78125, -28.9375, -28.09375, -27.25, -26.40625, -25.5625, -24.71875, -23.875, -23.03125, -22.1875, -21.34375, -20.5, -19.65625, -18.8125, -17.96875, -17.125, -16.28125, -15.4375, -14.59375, -13.75, -12.90625, -12.0625, -11.21875, -10.375, -9.53125, -8.6875, -7.84375, -7.0, -6.15625, -5.3125, -4.46875, -3.625, -2.78125, -1.9375, -1.09375, -0.25, 0.59375, 1.4375, 2.28125, 3.125, 3.96875, 4.8125, 5.65625, 6.5, 7.34375, 8.1875, 9.03125, 9.875, 10.71875, 11.5625, 12.40625, 13.25, 14.09375, 14.9375, 15.78125, 16.625, 17.46875, 18.3125, 19.15625, 20.0, 20.84375, 21.6875, 22.53125, 23.375, 24.21875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 6.0, 8.0, 11.0, 15.0, 15.0, 29.0, 39.0, 51.0, 63.0, 99.0, 107.0, 113.0, 117.0, 82.0, 69.0, 53.0, 35.0, 26.0, 17.0, 10.0, 11.0, 6.0, 4.0, 6.0, 6.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6142578125, -1.5457611083984375, -1.477264404296875, -1.4087677001953125, -1.34027099609375, -1.2717742919921875, -1.203277587890625, -1.1347808837890625, -1.0662841796875, -0.9977874755859375, -0.929290771484375, -0.8607940673828125, -0.79229736328125, -0.7238006591796875, -0.655303955078125, -0.5868072509765625, -0.518310546875, -0.4498138427734375, -0.381317138671875, -0.3128204345703125, -0.24432373046875, -0.1758270263671875, -0.107330322265625, -0.0388336181640625, 0.0296630859375, 0.0981597900390625, 0.166656494140625, 0.2351531982421875, 0.30364990234375, 0.3721466064453125, 0.440643310546875, 0.5091400146484375, 0.57763671875, 0.6461334228515625, 0.714630126953125, 0.7831268310546875, 0.85162353515625, 0.9201202392578125, 0.988616943359375, 1.0571136474609375, 1.1256103515625, 1.1941070556640625, 1.262603759765625, 1.3311004638671875, 1.39959716796875, 1.4680938720703125, 1.536590576171875, 1.6050872802734375, 1.673583984375, 1.7420806884765625, 1.810577392578125, 1.8790740966796875, 1.94757080078125, 2.0160675048828125, 2.084564208984375, 2.1530609130859375, 2.2215576171875, 2.2900543212890625, 2.358551025390625, 2.4270477294921875, 2.49554443359375, 2.5640411376953125, 2.632537841796875, 2.7010345458984375, 2.76953125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 1.0, 6.0, 7.0, 4.0, 12.0, 27.0, 43.0, 85.0, 435.0, 23286.0, 1022732.0, 1588.0, 167.0, 54.0, 33.0, 13.0, 11.0, 11.0, 8.0, 7.0, 4.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.875, -113.203125, -108.53125, -103.859375, -99.1875, -94.515625, -89.84375, -85.171875, -80.5, -75.828125, -71.15625, -66.484375, -61.8125, -57.140625, -52.46875, -47.796875, -43.125, -38.453125, -33.78125, -29.109375, -24.4375, -19.765625, -15.09375, -10.421875, -5.75, -1.078125, 3.59375, 8.265625, 12.9375, 17.609375, 22.28125, 26.953125, 31.625, 36.296875, 40.96875, 45.640625, 50.3125, 54.984375, 59.65625, 64.328125, 69.0, 73.671875, 78.34375, 83.015625, 87.6875, 92.359375, 97.03125, 101.703125, 106.375, 111.046875, 115.71875, 120.390625, 125.0625, 129.734375, 134.40625, 139.078125, 143.75, 148.421875, 153.09375, 157.765625, 162.4375, 167.109375, 171.78125, 176.453125, 181.125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 1.0, 7.0, 15.0, 12.0, 14.0, 22.0, 28.0, 29.0, 26.0, 21.0, 31.0, 35.0, 36.0, 55.0, 53.0, 42.0, 43.0, 54.0, 47.0, 58.0, 54.0, 44.0, 46.0, 45.0, 37.0, 22.0, 17.0, 19.0, 20.0, 14.0, 12.0, 13.0, 7.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.96875, -5.737060546875, -5.50537109375, -5.273681640625, -5.0419921875, -4.810302734375, -4.57861328125, -4.346923828125, -4.115234375, -3.883544921875, -3.65185546875, -3.420166015625, -3.1884765625, -2.956787109375, -2.72509765625, -2.493408203125, -2.26171875, -2.030029296875, -1.79833984375, -1.566650390625, -1.3349609375, -1.103271484375, -0.87158203125, -0.639892578125, -0.408203125, -0.176513671875, 0.05517578125, 0.286865234375, 0.5185546875, 0.750244140625, 0.98193359375, 1.213623046875, 1.4453125, 1.677001953125, 1.90869140625, 2.140380859375, 2.3720703125, 2.603759765625, 2.83544921875, 3.067138671875, 3.298828125, 3.530517578125, 3.76220703125, 3.993896484375, 4.2255859375, 4.457275390625, 4.68896484375, 4.920654296875, 5.15234375, 5.384033203125, 5.61572265625, 5.847412109375, 6.0791015625, 6.310791015625, 6.54248046875, 6.774169921875, 7.005859375, 7.237548828125, 7.46923828125, 7.700927734375, 7.9326171875, 8.164306640625, 8.39599609375, 8.627685546875, 8.859375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 6.0, 1.0, 4.0, 6.0, 8.0, 10.0, 18.0, 26.0, 26.0, 51.0, 143.0, 956.0, 229834.0, 815805.0, 1289.0, 177.0, 64.0, 38.0, 18.0, 14.0, 12.0, 8.0, 12.0, 7.0, 5.0, 4.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-174.25, -167.55859375, -160.8671875, -154.17578125, -147.484375, -140.79296875, -134.1015625, -127.41015625, -120.71875, -114.02734375, -107.3359375, -100.64453125, -93.953125, -87.26171875, -80.5703125, -73.87890625, -67.1875, -60.49609375, -53.8046875, -47.11328125, -40.421875, -33.73046875, -27.0390625, -20.34765625, -13.65625, -6.96484375, -0.2734375, 6.41796875, 13.109375, 19.80078125, 26.4921875, 33.18359375, 39.875, 46.56640625, 53.2578125, 59.94921875, 66.640625, 73.33203125, 80.0234375, 86.71484375, 93.40625, 100.09765625, 106.7890625, 113.48046875, 120.171875, 126.86328125, 133.5546875, 140.24609375, 146.9375, 153.62890625, 160.3203125, 167.01171875, 173.703125, 180.39453125, 187.0859375, 193.77734375, 200.46875, 207.16015625, 213.8515625, 220.54296875, 227.234375, 233.92578125, 240.6171875, 247.30859375, 254.0]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 9.0, 10.0, 14.0, 21.0, 24.0, 30.0, 29.0, 60.0, 59.0, 90.0, 101.0, 89.0, 98.0, 79.0, 58.0, 57.0, 38.0, 35.0, 23.0, 21.0, 13.0, 4.0, 6.0, 4.0, 3.0, 6.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00070953369140625, -0.0006870478391647339, -0.0006645619869232178, -0.0006420761346817017, -0.0006195902824401855, -0.0005971044301986694, -0.0005746185779571533, -0.0005521327257156372, -0.0005296468734741211, -0.000507161021232605, -0.00048467516899108887, -0.00046218931674957275, -0.00043970346450805664, -0.00041721761226654053, -0.0003947317600250244, -0.0003722459077835083, -0.0003497600555419922, -0.0003272742033004761, -0.00030478835105895996, -0.00028230249881744385, -0.00025981664657592773, -0.00023733079433441162, -0.0002148449420928955, -0.0001923590898513794, -0.00016987323760986328, -0.00014738738536834717, -0.00012490153312683105, -0.00010241568088531494, -7.992982864379883e-05, -5.7443976402282715e-05, -3.49581241607666e-05, -1.2472271919250488e-05, 1.0013580322265625e-05, 3.249943256378174e-05, 5.498528480529785e-05, 7.747113704681396e-05, 9.995698928833008e-05, 0.0001224428415298462, 0.0001449286937713623, 0.00016741454601287842, 0.00018990039825439453, 0.00021238625049591064, 0.00023487210273742676, 0.00025735795497894287, 0.000279843807220459, 0.0003023296594619751, 0.0003248155117034912, 0.0003473013639450073, 0.00036978721618652344, 0.00039227306842803955, 0.00041475892066955566, 0.0004372447729110718, 0.0004597306251525879, 0.000482216477394104, 0.0005047023296356201, 0.0005271881818771362, 0.0005496740341186523, 0.0005721598863601685, 0.0005946457386016846, 0.0006171315908432007, 0.0006396174430847168, 0.0006621032953262329, 0.000684589147567749, 0.0007070749998092651, 0.0007295608520507812]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 4.0, 9.0, 11.0, 19.0, 18.0, 26.0, 27.0, 56.0, 46.0, 113.0, 107.0, 189.0, 270.0, 417.0, 659.0, 1062.0, 1764.0, 3136.0, 6093.0, 13327.0, 35088.0, 185546.0, 680232.0, 77939.0, 22312.0, 9403.0, 4424.0, 2482.0, 1355.0, 816.0, 524.0, 330.0, 222.0, 140.0, 102.0, 89.0, 57.0, 34.0, 27.0, 23.0, 16.0, 13.0, 8.0, 5.0, 1.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0], "bins": [-52.125, -50.60498046875, -49.0849609375, -47.56494140625, -46.044921875, -44.52490234375, -43.0048828125, -41.48486328125, -39.96484375, -38.44482421875, -36.9248046875, -35.40478515625, -33.884765625, -32.36474609375, -30.8447265625, -29.32470703125, -27.8046875, -26.28466796875, -24.7646484375, -23.24462890625, -21.724609375, -20.20458984375, -18.6845703125, -17.16455078125, -15.64453125, -14.12451171875, -12.6044921875, -11.08447265625, -9.564453125, -8.04443359375, -6.5244140625, -5.00439453125, -3.484375, -1.96435546875, -0.4443359375, 1.07568359375, 2.595703125, 4.11572265625, 5.6357421875, 7.15576171875, 8.67578125, 10.19580078125, 11.7158203125, 13.23583984375, 14.755859375, 16.27587890625, 17.7958984375, 19.31591796875, 20.8359375, 22.35595703125, 23.8759765625, 25.39599609375, 26.916015625, 28.43603515625, 29.9560546875, 31.47607421875, 32.99609375, 34.51611328125, 36.0361328125, 37.55615234375, 39.076171875, 40.59619140625, 42.1162109375, 43.63623046875, 45.15625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 4.0, 2.0, 4.0, 3.0, 12.0, 11.0, 11.0, 13.0, 19.0, 46.0, 77.0, 134.0, 241.0, 164.0, 95.0, 54.0, 27.0, 22.0, 18.0, 9.0, 8.0, 6.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-40.125, -38.8603515625, -37.595703125, -36.3310546875, -35.06640625, -33.8017578125, -32.537109375, -31.2724609375, -30.0078125, -28.7431640625, -27.478515625, -26.2138671875, -24.94921875, -23.6845703125, -22.419921875, -21.1552734375, -19.890625, -18.6259765625, -17.361328125, -16.0966796875, -14.83203125, -13.5673828125, -12.302734375, -11.0380859375, -9.7734375, -8.5087890625, -7.244140625, -5.9794921875, -4.71484375, -3.4501953125, -2.185546875, -0.9208984375, 0.34375, 1.6083984375, 2.873046875, 4.1376953125, 5.40234375, 6.6669921875, 7.931640625, 9.1962890625, 10.4609375, 11.7255859375, 12.990234375, 14.2548828125, 15.51953125, 16.7841796875, 18.048828125, 19.3134765625, 20.578125, 21.8427734375, 23.107421875, 24.3720703125, 25.63671875, 26.9013671875, 28.166015625, 29.4306640625, 30.6953125, 31.9599609375, 33.224609375, 34.4892578125, 35.75390625, 37.0185546875, 38.283203125, 39.5478515625, 40.8125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 13.0, 15.0, 35.0, 63.0, 129.0, 260.0, 244.0, 151.0, 47.0, 33.0, 12.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-325.18994140625, -318.8143310546875, -312.438720703125, -306.0631103515625, -299.6875, -293.3118896484375, -286.936279296875, -280.5606689453125, -274.18505859375, -267.8094482421875, -261.433837890625, -255.0582275390625, -248.6826171875, -242.3070068359375, -235.931396484375, -229.5557861328125, -223.18016052246094, -216.80455017089844, -210.42893981933594, -204.05332946777344, -197.67771911621094, -191.30210876464844, -184.92648315429688, -178.55087280273438, -172.17526245117188, -165.79965209960938, -159.42404174804688, -153.04843139648438, -146.67282104492188, -140.29721069335938, -133.92160034179688, -127.54598236083984, -121.17036437988281, -114.79475402832031, -108.41914367675781, -102.04353332519531, -95.66792297363281, -89.29231262207031, -82.91669464111328, -76.54108428955078, -70.16547393798828, -63.78986358642578, -57.41425323486328, -51.038639068603516, -44.663028717041016, -38.287418365478516, -31.91180419921875, -25.53619384765625, -19.16058349609375, -12.784972190856934, -6.409360885620117, -0.033748626708984375, 6.341861724853516, 12.717472076416016, 19.09308624267578, 25.46869659423828, 31.84430694580078, 38.21991729736328, 44.59552764892578, 50.97114181518555, 57.34675216674805, 63.72236251831055, 70.09797668457031, 76.47358703613281, 82.84919738769531]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 7.0, 17.0, 20.0, 32.0, 49.0, 61.0, 69.0, 89.0, 97.0, 96.0, 113.0, 75.0, 78.0, 54.0, 44.0, 32.0, 27.0, 12.0, 6.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0], "bins": [-181.71389770507812, -177.78546142578125, -173.8570098876953, -169.92857360839844, -166.00013732910156, -162.07168579101562, -158.14324951171875, -154.21481323242188, -150.286376953125, -146.35794067382812, -142.4294891357422, -138.5010528564453, -134.57261657714844, -130.6441650390625, -126.71572875976562, -122.78729248046875, -118.85884094238281, -114.9303970336914, -111.00196075439453, -107.07351684570312, -103.14508056640625, -99.21663665771484, -95.28819274902344, -91.35975646972656, -87.43131256103516, -83.50286865234375, -79.57443237304688, -75.64598846435547, -71.71754455566406, -67.78910827636719, -63.86066436767578, -59.93222427368164, -56.00379180908203, -52.07535171508789, -48.14691162109375, -44.218467712402344, -40.2900276184082, -36.36158752441406, -32.433143615722656, -28.504703521728516, -24.576263427734375, -20.647823333740234, -16.71938133239746, -12.790940284729004, -8.862499237060547, -4.934059143066406, -1.0056171417236328, 2.9228248596191406, 6.851264953613281, 10.779706001281738, 14.708147048950195, 18.63658905029297, 22.56502914428711, 26.49346923828125, 30.421911239624023, 34.3503532409668, 38.27879333496094, 42.20723342895508, 46.13567352294922, 50.064117431640625, 53.992557525634766, 57.920997619628906, 61.84944152832031, 65.77787780761719, 69.7063217163086]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 6.0, 3.0, 9.0, 10.0, 16.0, 12.0, 19.0, 23.0, 36.0, 49.0, 70.0, 112.0, 129.0, 240.0, 450.0, 923.0, 2205.0, 6333.0, 29804.0, 441934.0, 3611181.0, 81845.0, 12846.0, 3610.0, 1295.0, 547.0, 277.0, 133.0, 63.0, 41.0, 32.0, 15.0, 8.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0], "bins": [-83.375, -81.53173828125, -79.6884765625, -77.84521484375, -76.001953125, -74.15869140625, -72.3154296875, -70.47216796875, -68.62890625, -66.78564453125, -64.9423828125, -63.09912109375, -61.255859375, -59.41259765625, -57.5693359375, -55.72607421875, -53.8828125, -52.03955078125, -50.1962890625, -48.35302734375, -46.509765625, -44.66650390625, -42.8232421875, -40.97998046875, -39.13671875, -37.29345703125, -35.4501953125, -33.60693359375, -31.763671875, -29.92041015625, -28.0771484375, -26.23388671875, -24.390625, -22.54736328125, -20.7041015625, -18.86083984375, -17.017578125, -15.17431640625, -13.3310546875, -11.48779296875, -9.64453125, -7.80126953125, -5.9580078125, -4.11474609375, -2.271484375, -0.42822265625, 1.4150390625, 3.25830078125, 5.1015625, 6.94482421875, 8.7880859375, 10.63134765625, 12.474609375, 14.31787109375, 16.1611328125, 18.00439453125, 19.84765625, 21.69091796875, 23.5341796875, 25.37744140625, 27.220703125, 29.06396484375, 30.9072265625, 32.75048828125, 34.59375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 11.0, 13.0, 11.0, 17.0, 19.0, 39.0, 53.0, 67.0, 83.0, 96.0, 120.0, 89.0, 90.0, 84.0, 58.0, 44.0, 30.0, 22.0, 16.0, 10.0, 12.0, 11.0, 2.0, 4.0, 2.0, 0.0, 2.0, 4.0], "bins": [-3.615234375, -3.5379791259765625, -3.460723876953125, -3.3834686279296875, -3.30621337890625, -3.2289581298828125, -3.151702880859375, -3.0744476318359375, -2.9971923828125, -2.9199371337890625, -2.842681884765625, -2.7654266357421875, -2.68817138671875, -2.6109161376953125, -2.533660888671875, -2.4564056396484375, -2.379150390625, -2.3018951416015625, -2.224639892578125, -2.1473846435546875, -2.07012939453125, -1.9928741455078125, -1.915618896484375, -1.8383636474609375, -1.7611083984375, -1.6838531494140625, -1.606597900390625, -1.5293426513671875, -1.45208740234375, -1.3748321533203125, -1.297576904296875, -1.2203216552734375, -1.14306640625, -1.0658111572265625, -0.988555908203125, -0.9113006591796875, -0.83404541015625, -0.7567901611328125, -0.679534912109375, -0.6022796630859375, -0.5250244140625, -0.4477691650390625, -0.370513916015625, -0.2932586669921875, -0.21600341796875, -0.1387481689453125, -0.061492919921875, 0.0157623291015625, 0.093017578125, 0.1702728271484375, 0.247528076171875, 0.3247833251953125, 0.40203857421875, 0.4792938232421875, 0.556549072265625, 0.6338043212890625, 0.7110595703125, 0.7883148193359375, 0.865570068359375, 0.9428253173828125, 1.02008056640625, 1.0973358154296875, 1.174591064453125, 1.2518463134765625, 1.3291015625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 8.0, 6.0, 7.0, 8.0, 12.0, 20.0, 43.0, 44.0, 77.0, 154.0, 329.0, 1290.0, 21415.0, 3967700.0, 198311.0, 3683.0, 599.0, 207.0, 140.0, 74.0, 52.0, 29.0, 20.0, 18.0, 13.0, 8.0, 2.0, 7.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.8125, -102.4765625, -99.140625, -95.8046875, -92.46875, -89.1328125, -85.796875, -82.4609375, -79.125, -75.7890625, -72.453125, -69.1171875, -65.78125, -62.4453125, -59.109375, -55.7734375, -52.4375, -49.1015625, -45.765625, -42.4296875, -39.09375, -35.7578125, -32.421875, -29.0859375, -25.75, -22.4140625, -19.078125, -15.7421875, -12.40625, -9.0703125, -5.734375, -2.3984375, 0.9375, 4.2734375, 7.609375, 10.9453125, 14.28125, 17.6171875, 20.953125, 24.2890625, 27.625, 30.9609375, 34.296875, 37.6328125, 40.96875, 44.3046875, 47.640625, 50.9765625, 54.3125, 57.6484375, 60.984375, 64.3203125, 67.65625, 70.9921875, 74.328125, 77.6640625, 81.0, 84.3359375, 87.671875, 91.0078125, 94.34375, 97.6796875, 101.015625, 104.3515625, 107.6875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 10.0, 5.0, 16.0, 16.0, 41.0, 78.0, 130.0, 198.0, 397.0, 866.0, 1243.0, 525.0, 254.0, 104.0, 73.0, 36.0, 18.0, 31.0, 8.0, 10.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8125, -4.6136474609375, -4.414794921875, -4.2159423828125, -4.01708984375, -3.8182373046875, -3.619384765625, -3.4205322265625, -3.2216796875, -3.0228271484375, -2.823974609375, -2.6251220703125, -2.42626953125, -2.2274169921875, -2.028564453125, -1.8297119140625, -1.630859375, -1.4320068359375, -1.233154296875, -1.0343017578125, -0.83544921875, -0.6365966796875, -0.437744140625, -0.2388916015625, -0.0400390625, 0.1588134765625, 0.357666015625, 0.5565185546875, 0.75537109375, 0.9542236328125, 1.153076171875, 1.3519287109375, 1.55078125, 1.7496337890625, 1.948486328125, 2.1473388671875, 2.34619140625, 2.5450439453125, 2.743896484375, 2.9427490234375, 3.1416015625, 3.3404541015625, 3.539306640625, 3.7381591796875, 3.93701171875, 4.1358642578125, 4.334716796875, 4.5335693359375, 4.732421875, 4.9312744140625, 5.130126953125, 5.3289794921875, 5.52783203125, 5.7266845703125, 5.925537109375, 6.1243896484375, 6.3232421875, 6.5220947265625, 6.720947265625, 6.9197998046875, 7.11865234375, 7.3175048828125, 7.516357421875, 7.7152099609375, 7.9140625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 10.0, 12.0, 43.0, 143.0, 330.0, 280.0, 120.0, 49.0, 14.0, 8.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.438289642333984, -26.4831600189209, -23.528030395507812, -20.57290267944336, -17.617773056030273, -14.662643432617188, -11.707515716552734, -8.752386093139648, -5.7972564697265625, -2.8421273231506348, 0.11300182342529297, 3.0681304931640625, 6.023260116577148, 8.978389739990234, 11.933517456054688, 14.888647079467773, 17.84377670288086, 20.798906326293945, 23.75403594970703, 26.709163665771484, 29.66429328918457, 32.619422912597656, 35.57455062866211, 38.52967834472656, 41.48480987548828, 44.439937591552734, 47.39506912231445, 50.350196838378906, 53.305328369140625, 56.26045608520508, 59.21558380126953, 62.17071533203125, 65.12583923339844, 68.08097076416016, 71.03609466552734, 73.99122619628906, 76.94635772705078, 79.9014892578125, 82.85661315917969, 85.8117446899414, 88.76687622070312, 91.72200775146484, 94.67713165283203, 97.63226318359375, 100.58739471435547, 103.54252624511719, 106.49765014648438, 109.4527816772461, 112.40790557861328, 115.363037109375, 118.31816101074219, 121.2732925415039, 124.22842407226562, 127.18354797363281, 130.138671875, 133.09381103515625, 136.04893493652344, 139.00405883789062, 141.95919799804688, 144.91432189941406, 147.86944580078125, 150.8245849609375, 153.7797088623047, 156.73483276367188, 159.68997192382812]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 8.0, 1.0, 0.0, 0.0, 1.0, 7.0, 11.0, 12.0, 10.0, 10.0, 16.0, 30.0, 34.0, 49.0, 48.0, 60.0, 52.0, 70.0, 64.0, 69.0, 65.0, 58.0, 62.0, 66.0, 43.0, 40.0, 27.0, 22.0, 21.0, 12.0, 7.0, 15.0, 8.0, 2.0, 7.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.70903778076172, -20.838333129882812, -19.967626571655273, -19.096921920776367, -18.22621726989746, -17.355510711669922, -16.484806060791016, -15.61410140991211, -14.743396759033203, -13.87269115447998, -13.001986503601074, -12.131280899047852, -11.260576248168945, -10.389870643615723, -9.5191650390625, -8.648460388183594, -7.777754783630371, -6.907049655914307, -6.036344528198242, -5.1656389236450195, -4.294934272766113, -3.4242286682128906, -2.553523540496826, -1.6828184127807617, -0.8121132850646973, 0.05859190225601196, 0.9292970895767212, 1.8000023365020752, 2.6707074642181396, 3.541412830352783, 4.412117958068848, 5.282823085784912, 6.153528213500977, 7.024233341217041, 7.8949384689331055, 8.765644073486328, 9.636348724365234, 10.507054328918457, 11.37775993347168, 12.248464584350586, 13.119169235229492, 13.989874839782715, 14.860579490661621, 15.731285095214844, 16.60198974609375, 17.472694396972656, 18.343400955200195, 19.2141056060791, 20.08481216430664, 20.955516815185547, 21.826223373413086, 22.696928024291992, 23.5676326751709, 24.438339233398438, 25.309043884277344, 26.17974853515625, 27.050453186035156, 27.921157836914062, 28.7918643951416, 29.662569046020508, 30.533273696899414, 31.403980255126953, 32.27468490600586, 33.145389556884766, 34.01609420776367]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 5.0, 2.0, 7.0, 2.0, 11.0, 23.0, 12.0, 20.0, 19.0, 26.0, 26.0, 35.0, 49.0, 114.0, 383.0, 1911.0, 11913.0, 115266.0, 670473.0, 222940.0, 21310.0, 2925.0, 628.0, 171.0, 75.0, 39.0, 31.0, 21.0, 16.0, 13.0, 14.0, 21.0, 12.0, 10.0, 5.0, 6.0, 4.0, 7.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.53125, -34.408203125, -33.28515625, -32.162109375, -31.0390625, -29.916015625, -28.79296875, -27.669921875, -26.546875, -25.423828125, -24.30078125, -23.177734375, -22.0546875, -20.931640625, -19.80859375, -18.685546875, -17.5625, -16.439453125, -15.31640625, -14.193359375, -13.0703125, -11.947265625, -10.82421875, -9.701171875, -8.578125, -7.455078125, -6.33203125, -5.208984375, -4.0859375, -2.962890625, -1.83984375, -0.716796875, 0.40625, 1.529296875, 2.65234375, 3.775390625, 4.8984375, 6.021484375, 7.14453125, 8.267578125, 9.390625, 10.513671875, 11.63671875, 12.759765625, 13.8828125, 15.005859375, 16.12890625, 17.251953125, 18.375, 19.498046875, 20.62109375, 21.744140625, 22.8671875, 23.990234375, 25.11328125, 26.236328125, 27.359375, 28.482421875, 29.60546875, 30.728515625, 31.8515625, 32.974609375, 34.09765625, 35.220703125, 36.34375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 7.0, 1.0, 8.0, 8.0, 18.0, 18.0, 27.0, 32.0, 34.0, 45.0, 58.0, 63.0, 63.0, 74.0, 74.0, 71.0, 62.0, 67.0, 57.0, 45.0, 36.0, 33.0, 33.0, 19.0, 14.0, 13.0, 9.0, 7.0, 0.0, 3.0, 4.0, 1.0, 6.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9345703125, -1.8672027587890625, -1.799835205078125, -1.7324676513671875, -1.66510009765625, -1.5977325439453125, -1.530364990234375, -1.4629974365234375, -1.3956298828125, -1.3282623291015625, -1.260894775390625, -1.1935272216796875, -1.12615966796875, -1.0587921142578125, -0.991424560546875, -0.9240570068359375, -0.856689453125, -0.7893218994140625, -0.721954345703125, -0.6545867919921875, -0.58721923828125, -0.5198516845703125, -0.452484130859375, -0.3851165771484375, -0.3177490234375, -0.2503814697265625, -0.183013916015625, -0.1156463623046875, -0.04827880859375, 0.0190887451171875, 0.086456298828125, 0.1538238525390625, 0.22119140625, 0.2885589599609375, 0.355926513671875, 0.4232940673828125, 0.49066162109375, 0.5580291748046875, 0.625396728515625, 0.6927642822265625, 0.7601318359375, 0.8274993896484375, 0.894866943359375, 0.9622344970703125, 1.02960205078125, 1.0969696044921875, 1.164337158203125, 1.2317047119140625, 1.299072265625, 1.3664398193359375, 1.433807373046875, 1.5011749267578125, 1.56854248046875, 1.6359100341796875, 1.703277587890625, 1.7706451416015625, 1.8380126953125, 1.9053802490234375, 1.972747802734375, 2.0401153564453125, 2.10748291015625, 2.1748504638671875, 2.242218017578125, 2.3095855712890625, 2.376953125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 7.0, 6.0, 13.0, 13.0, 26.0, 35.0, 36.0, 82.0, 113.0, 189.0, 255.0, 398.0, 654.0, 1205.0, 2227.0, 4394.0, 9971.0, 24027.0, 62784.0, 161936.0, 320266.0, 267223.0, 115971.0, 44104.0, 17444.0, 7289.0, 3471.0, 1748.0, 1013.0, 595.0, 381.0, 200.0, 151.0, 116.0, 73.0, 43.0, 36.0, 20.0, 13.0, 11.0, 8.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.6015625, -12.1317138671875, -11.661865234375, -11.1920166015625, -10.72216796875, -10.2523193359375, -9.782470703125, -9.3126220703125, -8.8427734375, -8.3729248046875, -7.903076171875, -7.4332275390625, -6.96337890625, -6.4935302734375, -6.023681640625, -5.5538330078125, -5.083984375, -4.6141357421875, -4.144287109375, -3.6744384765625, -3.20458984375, -2.7347412109375, -2.264892578125, -1.7950439453125, -1.3251953125, -0.8553466796875, -0.385498046875, 0.0843505859375, 0.55419921875, 1.0240478515625, 1.493896484375, 1.9637451171875, 2.43359375, 2.9034423828125, 3.373291015625, 3.8431396484375, 4.31298828125, 4.7828369140625, 5.252685546875, 5.7225341796875, 6.1923828125, 6.6622314453125, 7.132080078125, 7.6019287109375, 8.07177734375, 8.5416259765625, 9.011474609375, 9.4813232421875, 9.951171875, 10.4210205078125, 10.890869140625, 11.3607177734375, 11.83056640625, 12.3004150390625, 12.770263671875, 13.2401123046875, 13.7099609375, 14.1798095703125, 14.649658203125, 15.1195068359375, 15.58935546875, 16.0592041015625, 16.529052734375, 16.9989013671875, 17.46875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 3.0, 5.0, 6.0, 9.0, 13.0, 14.0, 22.0, 26.0, 20.0, 40.0, 45.0, 39.0, 46.0, 55.0, 61.0, 49.0, 59.0, 54.0, 47.0, 53.0, 55.0, 33.0, 38.0, 39.0, 42.0, 23.0, 20.0, 19.0, 16.0, 10.0, 11.0, 9.0, 11.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9140625, -10.5379638671875, -10.161865234375, -9.7857666015625, -9.40966796875, -9.0335693359375, -8.657470703125, -8.2813720703125, -7.9052734375, -7.5291748046875, -7.153076171875, -6.7769775390625, -6.40087890625, -6.0247802734375, -5.648681640625, -5.2725830078125, -4.896484375, -4.5203857421875, -4.144287109375, -3.7681884765625, -3.39208984375, -3.0159912109375, -2.639892578125, -2.2637939453125, -1.8876953125, -1.5115966796875, -1.135498046875, -0.7593994140625, -0.38330078125, -0.0072021484375, 0.368896484375, 0.7449951171875, 1.12109375, 1.4971923828125, 1.873291015625, 2.2493896484375, 2.62548828125, 3.0015869140625, 3.377685546875, 3.7537841796875, 4.1298828125, 4.5059814453125, 4.882080078125, 5.2581787109375, 5.63427734375, 6.0103759765625, 6.386474609375, 6.7625732421875, 7.138671875, 7.5147705078125, 7.890869140625, 8.2669677734375, 8.64306640625, 9.0191650390625, 9.395263671875, 9.7713623046875, 10.1474609375, 10.5235595703125, 10.899658203125, 11.2757568359375, 11.65185546875, 12.0279541015625, 12.404052734375, 12.7801513671875, 13.15625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 3.0, 3.0, 5.0, 2.0, 6.0, 11.0, 15.0, 30.0, 50.0, 53.0, 69.0, 79.0, 151.0, 221.0, 414.0, 728.0, 1317.0, 2682.0, 5576.0, 14457.0, 42000.0, 130481.0, 330748.0, 326567.0, 126779.0, 40669.0, 14128.0, 5680.0, 2471.0, 1335.0, 722.0, 396.0, 238.0, 128.0, 98.0, 76.0, 51.0, 33.0, 23.0, 17.0, 10.0, 10.0, 3.0, 8.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.015625, -14.5604248046875, -14.105224609375, -13.6500244140625, -13.19482421875, -12.7396240234375, -12.284423828125, -11.8292236328125, -11.3740234375, -10.9188232421875, -10.463623046875, -10.0084228515625, -9.55322265625, -9.0980224609375, -8.642822265625, -8.1876220703125, -7.732421875, -7.2772216796875, -6.822021484375, -6.3668212890625, -5.91162109375, -5.4564208984375, -5.001220703125, -4.5460205078125, -4.0908203125, -3.6356201171875, -3.180419921875, -2.7252197265625, -2.27001953125, -1.8148193359375, -1.359619140625, -0.9044189453125, -0.44921875, 0.0059814453125, 0.461181640625, 0.9163818359375, 1.37158203125, 1.8267822265625, 2.281982421875, 2.7371826171875, 3.1923828125, 3.6475830078125, 4.102783203125, 4.5579833984375, 5.01318359375, 5.4683837890625, 5.923583984375, 6.3787841796875, 6.833984375, 7.2891845703125, 7.744384765625, 8.1995849609375, 8.65478515625, 9.1099853515625, 9.565185546875, 10.0203857421875, 10.4755859375, 10.9307861328125, 11.385986328125, 11.8411865234375, 12.29638671875, 12.7515869140625, 13.206787109375, 13.6619873046875, 14.1171875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 11.0, 11.0, 12.0, 19.0, 18.0, 43.0, 60.0, 65.0, 84.0, 114.0, 105.0, 109.0, 89.0, 68.0, 47.0, 49.0, 28.0, 20.0, 12.0, 10.0, 7.0, 8.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024871826171875, -0.0024084150791168213, -0.0023296475410461426, -0.002250880002975464, -0.002172112464904785, -0.0020933449268341064, -0.0020145773887634277, -0.001935809850692749, -0.0018570423126220703, -0.0017782747745513916, -0.0016995072364807129, -0.0016207396984100342, -0.0015419721603393555, -0.0014632046222686768, -0.001384437084197998, -0.0013056695461273193, -0.0012269020080566406, -0.001148134469985962, -0.0010693669319152832, -0.0009905993938446045, -0.0009118318557739258, -0.0008330643177032471, -0.0007542967796325684, -0.0006755292415618896, -0.0005967617034912109, -0.0005179941654205322, -0.0004392266273498535, -0.0003604590892791748, -0.0002816915512084961, -0.00020292401313781738, -0.00012415647506713867, -4.538893699645996e-05, 3.337860107421875e-05, 0.00011214613914489746, 0.00019091367721557617, 0.0002696812152862549, 0.0003484487533569336, 0.0004272162914276123, 0.000505983829498291, 0.0005847513675689697, 0.0006635189056396484, 0.0007422864437103271, 0.0008210539817810059, 0.0008998215198516846, 0.0009785890579223633, 0.001057356595993042, 0.0011361241340637207, 0.0012148916721343994, 0.0012936592102050781, 0.0013724267482757568, 0.0014511942863464355, 0.0015299618244171143, 0.001608729362487793, 0.0016874969005584717, 0.0017662644386291504, 0.001845031976699829, 0.0019237995147705078, 0.0020025670528411865, 0.0020813345909118652, 0.002160102128982544, 0.0022388696670532227, 0.0023176372051239014, 0.00239640474319458, 0.002475172281265259, 0.0025539398193359375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 8.0, 6.0, 14.0, 14.0, 21.0, 33.0, 29.0, 41.0, 73.0, 141.0, 231.0, 367.0, 644.0, 1220.0, 2570.0, 6263.0, 20605.0, 103430.0, 504833.0, 329964.0, 56511.0, 12990.0, 4560.0, 1837.0, 901.0, 478.0, 251.0, 188.0, 121.0, 82.0, 44.0, 28.0, 14.0, 12.0, 6.0, 6.0, 7.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.609375, -21.8759765625, -21.142578125, -20.4091796875, -19.67578125, -18.9423828125, -18.208984375, -17.4755859375, -16.7421875, -16.0087890625, -15.275390625, -14.5419921875, -13.80859375, -13.0751953125, -12.341796875, -11.6083984375, -10.875, -10.1416015625, -9.408203125, -8.6748046875, -7.94140625, -7.2080078125, -6.474609375, -5.7412109375, -5.0078125, -4.2744140625, -3.541015625, -2.8076171875, -2.07421875, -1.3408203125, -0.607421875, 0.1259765625, 0.859375, 1.5927734375, 2.326171875, 3.0595703125, 3.79296875, 4.5263671875, 5.259765625, 5.9931640625, 6.7265625, 7.4599609375, 8.193359375, 8.9267578125, 9.66015625, 10.3935546875, 11.126953125, 11.8603515625, 12.59375, 13.3271484375, 14.060546875, 14.7939453125, 15.52734375, 16.2607421875, 16.994140625, 17.7275390625, 18.4609375, 19.1943359375, 19.927734375, 20.6611328125, 21.39453125, 22.1279296875, 22.861328125, 23.5947265625, 24.328125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 8.0, 8.0, 3.0, 7.0, 16.0, 27.0, 28.0, 44.0, 53.0, 58.0, 64.0, 82.0, 91.0, 105.0, 68.0, 83.0, 56.0, 42.0, 36.0, 29.0, 14.0, 21.0, 15.0, 7.0, 9.0, 5.0, 8.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.125, -7.8548583984375, -7.584716796875, -7.3145751953125, -7.04443359375, -6.7742919921875, -6.504150390625, -6.2340087890625, -5.9638671875, -5.6937255859375, -5.423583984375, -5.1534423828125, -4.88330078125, -4.6131591796875, -4.343017578125, -4.0728759765625, -3.802734375, -3.5325927734375, -3.262451171875, -2.9923095703125, -2.72216796875, -2.4520263671875, -2.181884765625, -1.9117431640625, -1.6416015625, -1.3714599609375, -1.101318359375, -0.8311767578125, -0.56103515625, -0.2908935546875, -0.020751953125, 0.2493896484375, 0.51953125, 0.7896728515625, 1.059814453125, 1.3299560546875, 1.60009765625, 1.8702392578125, 2.140380859375, 2.4105224609375, 2.6806640625, 2.9508056640625, 3.220947265625, 3.4910888671875, 3.76123046875, 4.0313720703125, 4.301513671875, 4.5716552734375, 4.841796875, 5.1119384765625, 5.382080078125, 5.6522216796875, 5.92236328125, 6.1925048828125, 6.462646484375, 6.7327880859375, 7.0029296875, 7.2730712890625, 7.543212890625, 7.8133544921875, 8.08349609375, 8.3536376953125, 8.623779296875, 8.8939208984375, 9.1640625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 14.0, 15.0, 49.0, 52.0, 127.0, 182.0, 170.0, 164.0, 99.0, 60.0, 32.0, 15.0, 10.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-236.9807586669922, -231.9921875, -227.00363159179688, -222.0150604248047, -217.0264892578125, -212.0379180908203, -207.0493621826172, -202.060791015625, -197.0722198486328, -192.08364868164062, -187.0950927734375, -182.1065216064453, -177.11795043945312, -172.12937927246094, -167.1408233642578, -162.15225219726562, -157.1636962890625, -152.1751251220703, -147.1865692138672, -142.197998046875, -137.2094268798828, -132.22085571289062, -127.2322998046875, -122.24372863769531, -117.25515747070312, -112.26659393310547, -107.27802276611328, -102.28945922851562, -97.30088806152344, -92.31232452392578, -87.32376098632812, -82.33518981933594, -77.34661102294922, -72.35804748535156, -67.36947631835938, -62.38091278076172, -57.39234161376953, -52.403778076171875, -47.41521072387695, -42.42664337158203, -37.43807601928711, -32.44950866699219, -27.460941314697266, -22.472375869750977, -17.483808517456055, -12.495241165161133, -7.506675720214844, -2.518108367919922, 2.470458984375, 7.459025859832764, 12.447592735290527, 17.436159133911133, 22.424726486206055, 27.413293838500977, 32.401859283447266, 37.39042663574219, 42.37899398803711, 47.36756134033203, 52.35612869262695, 57.344696044921875, 62.33325958251953, 67.32183074951172, 72.31039428710938, 77.29896545410156, 82.28752899169922]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 3.0, 5.0, 9.0, 12.0, 10.0, 12.0, 27.0, 19.0, 41.0, 34.0, 46.0, 44.0, 55.0, 46.0, 42.0, 63.0, 76.0, 69.0, 54.0, 56.0, 61.0, 43.0, 33.0, 25.0, 20.0, 29.0, 19.0, 13.0, 9.0, 8.0, 8.0, 2.0, 3.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-95.72776794433594, -93.0004653930664, -90.27315521240234, -87.54585266113281, -84.81855010986328, -82.09124755859375, -79.36393737792969, -76.63663482666016, -73.90933227539062, -71.1820297241211, -68.45471954345703, -65.7274169921875, -63.00011444091797, -60.27280807495117, -57.545501708984375, -54.818199157714844, -52.09089279174805, -49.36358642578125, -46.63628387451172, -43.90897750854492, -41.18167495727539, -38.454368591308594, -35.72706604003906, -32.999759674072266, -30.2724552154541, -27.545150756835938, -24.817846298217773, -22.09054183959961, -19.363235473632812, -16.63593292236328, -13.908626556396484, -11.18132209777832, -8.454017639160156, -5.726713180541992, -2.99940824508667, -0.27210330963134766, 2.4552011489868164, 5.1825056076049805, 7.909811019897461, 10.637115478515625, 13.364419937133789, 16.091724395751953, 18.819028854370117, 21.54633331298828, 24.273639678955078, 27.00094223022461, 29.728248596191406, 32.45555114746094, 35.182857513427734, 37.91016387939453, 40.63746643066406, 43.36477279663086, 46.09207534790039, 48.81938171386719, 51.54668426513672, 54.273990631103516, 57.00129699707031, 59.72860336303711, 62.45590591430664, 65.18321228027344, 67.91051483154297, 70.6378173828125, 73.36512756347656, 76.0924301147461, 78.81973266601562]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 7.0, 2.0, 8.0, 14.0, 12.0, 22.0, 25.0, 40.0, 66.0, 108.0, 224.0, 676.0, 2872.0, 17329.0, 407494.0, 3726111.0, 32954.0, 4672.0, 1032.0, 264.0, 127.0, 69.0, 43.0, 32.0, 17.0, 20.0, 18.0, 10.0, 6.0, 8.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.375, -97.251953125, -94.12890625, -91.005859375, -87.8828125, -84.759765625, -81.63671875, -78.513671875, -75.390625, -72.267578125, -69.14453125, -66.021484375, -62.8984375, -59.775390625, -56.65234375, -53.529296875, -50.40625, -47.283203125, -44.16015625, -41.037109375, -37.9140625, -34.791015625, -31.66796875, -28.544921875, -25.421875, -22.298828125, -19.17578125, -16.052734375, -12.9296875, -9.806640625, -6.68359375, -3.560546875, -0.4375, 2.685546875, 5.80859375, 8.931640625, 12.0546875, 15.177734375, 18.30078125, 21.423828125, 24.546875, 27.669921875, 30.79296875, 33.916015625, 37.0390625, 40.162109375, 43.28515625, 46.408203125, 49.53125, 52.654296875, 55.77734375, 58.900390625, 62.0234375, 65.146484375, 68.26953125, 71.392578125, 74.515625, 77.638671875, 80.76171875, 83.884765625, 87.0078125, 90.130859375, 93.25390625, 96.376953125, 99.5]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 3.0, 4.0, 12.0, 8.0, 10.0, 14.0, 17.0, 33.0, 35.0, 49.0, 44.0, 59.0, 66.0, 75.0, 69.0, 75.0, 77.0, 53.0, 49.0, 40.0, 51.0, 37.0, 23.0, 18.0, 16.0, 14.0, 16.0, 13.0, 9.0, 5.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.869140625, -2.7847900390625, -2.700439453125, -2.6160888671875, -2.53173828125, -2.4473876953125, -2.363037109375, -2.2786865234375, -2.1943359375, -2.1099853515625, -2.025634765625, -1.9412841796875, -1.85693359375, -1.7725830078125, -1.688232421875, -1.6038818359375, -1.51953125, -1.4351806640625, -1.350830078125, -1.2664794921875, -1.18212890625, -1.0977783203125, -1.013427734375, -0.9290771484375, -0.8447265625, -0.7603759765625, -0.676025390625, -0.5916748046875, -0.50732421875, -0.4229736328125, -0.338623046875, -0.2542724609375, -0.169921875, -0.0855712890625, -0.001220703125, 0.0831298828125, 0.16748046875, 0.2518310546875, 0.336181640625, 0.4205322265625, 0.5048828125, 0.5892333984375, 0.673583984375, 0.7579345703125, 0.84228515625, 0.9266357421875, 1.010986328125, 1.0953369140625, 1.1796875, 1.2640380859375, 1.348388671875, 1.4327392578125, 1.51708984375, 1.6014404296875, 1.685791015625, 1.7701416015625, 1.8544921875, 1.9388427734375, 2.023193359375, 2.1075439453125, 2.19189453125, 2.2762451171875, 2.360595703125, 2.4449462890625, 2.529296875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 9.0, 14.0, 17.0, 29.0, 44.0, 43.0, 67.0, 77.0, 80.0, 120.0, 167.0, 249.0, 786.0, 8127.0, 362943.0, 3784100.0, 33971.0, 2127.0, 381.0, 229.0, 182.0, 135.0, 97.0, 87.0, 51.0, 42.0, 37.0, 28.0, 17.0, 16.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.875, -63.9951171875, -61.115234375, -58.2353515625, -55.35546875, -52.4755859375, -49.595703125, -46.7158203125, -43.8359375, -40.9560546875, -38.076171875, -35.1962890625, -32.31640625, -29.4365234375, -26.556640625, -23.6767578125, -20.796875, -17.9169921875, -15.037109375, -12.1572265625, -9.27734375, -6.3974609375, -3.517578125, -0.6376953125, 2.2421875, 5.1220703125, 8.001953125, 10.8818359375, 13.76171875, 16.6416015625, 19.521484375, 22.4013671875, 25.28125, 28.1611328125, 31.041015625, 33.9208984375, 36.80078125, 39.6806640625, 42.560546875, 45.4404296875, 48.3203125, 51.2001953125, 54.080078125, 56.9599609375, 59.83984375, 62.7197265625, 65.599609375, 68.4794921875, 71.359375, 74.2392578125, 77.119140625, 79.9990234375, 82.87890625, 85.7587890625, 88.638671875, 91.5185546875, 94.3984375, 97.2783203125, 100.158203125, 103.0380859375, 105.91796875, 108.7978515625, 111.677734375, 114.5576171875, 117.4375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 4.0, 6.0, 11.0, 20.0, 21.0, 42.0, 64.0, 113.0, 222.0, 523.0, 1647.0, 820.0, 271.0, 129.0, 76.0, 38.0, 27.0, 11.0, 14.0, 8.0, 5.0, 6.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.140625, -3.8375244140625, -3.534423828125, -3.2313232421875, -2.92822265625, -2.6251220703125, -2.322021484375, -2.0189208984375, -1.7158203125, -1.4127197265625, -1.109619140625, -0.8065185546875, -0.50341796875, -0.2003173828125, 0.102783203125, 0.4058837890625, 0.708984375, 1.0120849609375, 1.315185546875, 1.6182861328125, 1.92138671875, 2.2244873046875, 2.527587890625, 2.8306884765625, 3.1337890625, 3.4368896484375, 3.739990234375, 4.0430908203125, 4.34619140625, 4.6492919921875, 4.952392578125, 5.2554931640625, 5.55859375, 5.8616943359375, 6.164794921875, 6.4678955078125, 6.77099609375, 7.0740966796875, 7.377197265625, 7.6802978515625, 7.9833984375, 8.2864990234375, 8.589599609375, 8.8927001953125, 9.19580078125, 9.4989013671875, 9.802001953125, 10.1051025390625, 10.408203125, 10.7113037109375, 11.014404296875, 11.3175048828125, 11.62060546875, 11.9237060546875, 12.226806640625, 12.5299072265625, 12.8330078125, 13.1361083984375, 13.439208984375, 13.7423095703125, 14.04541015625, 14.3485107421875, 14.651611328125, 14.9547119140625, 15.2578125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 6.0, 4.0, 20.0, 54.0, 111.0, 193.0, 247.0, 162.0, 107.0, 56.0, 18.0, 15.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.5120849609375, -101.46363830566406, -98.41519927978516, -95.36675262451172, -92.31830596923828, -89.26986694335938, -86.22142028808594, -83.1729736328125, -80.12452697753906, -77.07608032226562, -74.02764129638672, -70.97919464111328, -67.93074798583984, -64.88230895996094, -61.8338623046875, -58.78541564941406, -55.736976623535156, -52.688533782958984, -49.64008712768555, -46.591644287109375, -43.54319763183594, -40.494754791259766, -37.446311950683594, -34.397865295410156, -31.349422454833984, -28.30097770690918, -25.252532958984375, -22.204090118408203, -19.1556453704834, -16.107200622558594, -13.058757781982422, -10.010313034057617, -6.9618682861328125, -3.913424015045166, -0.8649797439575195, 2.1834640502929688, 5.231908798217773, 8.280353546142578, 11.32879638671875, 14.377241134643555, 17.42568588256836, 20.474130630493164, 23.52257537841797, 26.57101821899414, 29.619462966918945, 32.66790771484375, 35.71635055541992, 38.764793395996094, 41.81324005126953, 44.8616828918457, 47.91012954711914, 50.95857238769531, 54.00701904296875, 57.05546188354492, 60.103904724121094, 63.15235137939453, 66.20079040527344, 69.24923706054688, 72.29767608642578, 75.34612274169922, 78.39456939697266, 81.44300842285156, 84.491455078125, 87.53990173339844, 90.58834838867188]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 2.0, 5.0, 8.0, 10.0, 9.0, 10.0, 16.0, 18.0, 17.0, 20.0, 21.0, 27.0, 24.0, 39.0, 46.0, 36.0, 33.0, 41.0, 37.0, 39.0, 40.0, 40.0, 43.0, 34.0, 34.0, 35.0, 37.0, 37.0, 31.0, 39.0, 25.0, 23.0, 18.0, 19.0, 16.0, 13.0, 10.0, 7.0, 9.0, 6.0, 5.0, 8.0, 5.0, 1.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0], "bins": [-22.431995391845703, -21.747270584106445, -21.06254768371582, -20.377822875976562, -19.693099975585938, -19.00837516784668, -18.323652267456055, -17.638927459716797, -16.954204559326172, -16.269479751586914, -15.584756851196289, -14.900032997131348, -14.215309143066406, -13.530585289001465, -12.845861434936523, -12.161136627197266, -11.476412773132324, -10.791688919067383, -10.106965065002441, -9.4222412109375, -8.737517356872559, -8.052793502807617, -7.368069171905518, -6.683345317840576, -5.998621463775635, -5.313897609710693, -4.629173755645752, -3.9444496631622314, -3.25972580909729, -2.5750019550323486, -1.8902778625488281, -1.2055540084838867, -0.5208301544189453, 0.16389375925064087, 0.848617672920227, 1.533341646194458, 2.2180655002593994, 2.902789354324341, 3.5875134468078613, 4.272237300872803, 4.956961154937744, 5.6416850090026855, 6.326408863067627, 7.011133193969727, 7.695857048034668, 8.38058090209961, 9.06530475616455, 9.750028610229492, 10.434752464294434, 11.119476318359375, 11.804200172424316, 12.488924026489258, 13.1736478805542, 13.85837173461914, 14.543096542358398, 15.227819442749023, 15.912544250488281, 16.59726905822754, 17.281991958618164, 17.966716766357422, 18.651439666748047, 19.336164474487305, 20.02088737487793, 20.705612182617188, 21.390335083007812]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 4.0, 3.0, 2.0, 10.0, 10.0, 14.0, 23.0, 30.0, 43.0, 55.0, 114.0, 190.0, 413.0, 978.0, 3144.0, 16416.0, 143029.0, 618102.0, 233171.0, 26251.0, 4299.0, 1264.0, 449.0, 209.0, 122.0, 61.0, 35.0, 24.0, 18.0, 11.0, 14.0, 10.0, 8.0, 11.0, 3.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.5, -34.30126953125, -33.1025390625, -31.90380859375, -30.705078125, -29.50634765625, -28.3076171875, -27.10888671875, -25.91015625, -24.71142578125, -23.5126953125, -22.31396484375, -21.115234375, -19.91650390625, -18.7177734375, -17.51904296875, -16.3203125, -15.12158203125, -13.9228515625, -12.72412109375, -11.525390625, -10.32666015625, -9.1279296875, -7.92919921875, -6.73046875, -5.53173828125, -4.3330078125, -3.13427734375, -1.935546875, -0.73681640625, 0.4619140625, 1.66064453125, 2.859375, 4.05810546875, 5.2568359375, 6.45556640625, 7.654296875, 8.85302734375, 10.0517578125, 11.25048828125, 12.44921875, 13.64794921875, 14.8466796875, 16.04541015625, 17.244140625, 18.44287109375, 19.6416015625, 20.84033203125, 22.0390625, 23.23779296875, 24.4365234375, 25.63525390625, 26.833984375, 28.03271484375, 29.2314453125, 30.43017578125, 31.62890625, 32.82763671875, 34.0263671875, 35.22509765625, 36.423828125, 37.62255859375, 38.8212890625, 40.02001953125, 41.21875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 4.0, 6.0, 3.0, 10.0, 20.0, 29.0, 34.0, 33.0, 52.0, 75.0, 73.0, 65.0, 76.0, 93.0, 72.0, 67.0, 55.0, 57.0, 55.0, 29.0, 21.0, 18.0, 17.0, 14.0, 7.0, 3.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.95703125, -3.86297607421875, -3.7689208984375, -3.67486572265625, -3.580810546875, -3.48675537109375, -3.3927001953125, -3.29864501953125, -3.20458984375, -3.11053466796875, -3.0164794921875, -2.92242431640625, -2.828369140625, -2.73431396484375, -2.6402587890625, -2.54620361328125, -2.4521484375, -2.35809326171875, -2.2640380859375, -2.16998291015625, -2.075927734375, -1.98187255859375, -1.8878173828125, -1.79376220703125, -1.69970703125, -1.60565185546875, -1.5115966796875, -1.41754150390625, -1.323486328125, -1.22943115234375, -1.1353759765625, -1.04132080078125, -0.947265625, -0.85321044921875, -0.7591552734375, -0.66510009765625, -0.571044921875, -0.47698974609375, -0.3829345703125, -0.28887939453125, -0.19482421875, -0.10076904296875, -0.0067138671875, 0.08734130859375, 0.181396484375, 0.27545166015625, 0.3695068359375, 0.46356201171875, 0.5576171875, 0.65167236328125, 0.7457275390625, 0.83978271484375, 0.933837890625, 1.02789306640625, 1.1219482421875, 1.21600341796875, 1.31005859375, 1.40411376953125, 1.4981689453125, 1.59222412109375, 1.686279296875, 1.78033447265625, 1.8743896484375, 1.96844482421875, 2.0625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 5.0, 3.0, 7.0, 5.0, 8.0, 9.0, 25.0, 33.0, 58.0, 69.0, 76.0, 147.0, 178.0, 286.0, 383.0, 554.0, 878.0, 1418.0, 2755.0, 5891.0, 14159.0, 38385.0, 102726.0, 239161.0, 321248.0, 192235.0, 77601.0, 28922.0, 10775.0, 4710.0, 2263.0, 1180.0, 802.0, 465.0, 352.0, 209.0, 161.0, 116.0, 96.0, 68.0, 44.0, 27.0, 28.0, 15.0, 12.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9453125, -13.48583984375, -13.0263671875, -12.56689453125, -12.107421875, -11.64794921875, -11.1884765625, -10.72900390625, -10.26953125, -9.81005859375, -9.3505859375, -8.89111328125, -8.431640625, -7.97216796875, -7.5126953125, -7.05322265625, -6.59375, -6.13427734375, -5.6748046875, -5.21533203125, -4.755859375, -4.29638671875, -3.8369140625, -3.37744140625, -2.91796875, -2.45849609375, -1.9990234375, -1.53955078125, -1.080078125, -0.62060546875, -0.1611328125, 0.29833984375, 0.7578125, 1.21728515625, 1.6767578125, 2.13623046875, 2.595703125, 3.05517578125, 3.5146484375, 3.97412109375, 4.43359375, 4.89306640625, 5.3525390625, 5.81201171875, 6.271484375, 6.73095703125, 7.1904296875, 7.64990234375, 8.109375, 8.56884765625, 9.0283203125, 9.48779296875, 9.947265625, 10.40673828125, 10.8662109375, 11.32568359375, 11.78515625, 12.24462890625, 12.7041015625, 13.16357421875, 13.623046875, 14.08251953125, 14.5419921875, 15.00146484375, 15.4609375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 11.0, 4.0, 7.0, 17.0, 12.0, 22.0, 22.0, 21.0, 24.0, 22.0, 36.0, 43.0, 39.0, 37.0, 45.0, 46.0, 44.0, 40.0, 47.0, 50.0, 52.0, 47.0, 45.0, 35.0, 29.0, 35.0, 27.0, 29.0, 19.0, 21.0, 12.0, 23.0, 10.0, 7.0, 7.0, 6.0, 7.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.671875, -10.31298828125, -9.9541015625, -9.59521484375, -9.236328125, -8.87744140625, -8.5185546875, -8.15966796875, -7.80078125, -7.44189453125, -7.0830078125, -6.72412109375, -6.365234375, -6.00634765625, -5.6474609375, -5.28857421875, -4.9296875, -4.57080078125, -4.2119140625, -3.85302734375, -3.494140625, -3.13525390625, -2.7763671875, -2.41748046875, -2.05859375, -1.69970703125, -1.3408203125, -0.98193359375, -0.623046875, -0.26416015625, 0.0947265625, 0.45361328125, 0.8125, 1.17138671875, 1.5302734375, 1.88916015625, 2.248046875, 2.60693359375, 2.9658203125, 3.32470703125, 3.68359375, 4.04248046875, 4.4013671875, 4.76025390625, 5.119140625, 5.47802734375, 5.8369140625, 6.19580078125, 6.5546875, 6.91357421875, 7.2724609375, 7.63134765625, 7.990234375, 8.34912109375, 8.7080078125, 9.06689453125, 9.42578125, 9.78466796875, 10.1435546875, 10.50244140625, 10.861328125, 11.22021484375, 11.5791015625, 11.93798828125, 12.296875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 4.0, 4.0, 8.0, 12.0, 22.0, 40.0, 45.0, 73.0, 140.0, 182.0, 383.0, 700.0, 1578.0, 3714.0, 10005.0, 33693.0, 167955.0, 526403.0, 236937.0, 45598.0, 12778.0, 4490.0, 1878.0, 880.0, 405.0, 226.0, 131.0, 77.0, 65.0, 38.0, 25.0, 19.0, 13.0, 6.0, 5.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.453125, -21.74267578125, -21.0322265625, -20.32177734375, -19.611328125, -18.90087890625, -18.1904296875, -17.47998046875, -16.76953125, -16.05908203125, -15.3486328125, -14.63818359375, -13.927734375, -13.21728515625, -12.5068359375, -11.79638671875, -11.0859375, -10.37548828125, -9.6650390625, -8.95458984375, -8.244140625, -7.53369140625, -6.8232421875, -6.11279296875, -5.40234375, -4.69189453125, -3.9814453125, -3.27099609375, -2.560546875, -1.85009765625, -1.1396484375, -0.42919921875, 0.28125, 0.99169921875, 1.7021484375, 2.41259765625, 3.123046875, 3.83349609375, 4.5439453125, 5.25439453125, 5.96484375, 6.67529296875, 7.3857421875, 8.09619140625, 8.806640625, 9.51708984375, 10.2275390625, 10.93798828125, 11.6484375, 12.35888671875, 13.0693359375, 13.77978515625, 14.490234375, 15.20068359375, 15.9111328125, 16.62158203125, 17.33203125, 18.04248046875, 18.7529296875, 19.46337890625, 20.173828125, 20.88427734375, 21.5947265625, 22.30517578125, 23.015625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 1.0, 2.0, 5.0, 3.0, 2.0, 5.0, 10.0, 10.0, 18.0, 10.0, 21.0, 32.0, 47.0, 48.0, 56.0, 96.0, 95.0, 106.0, 99.0, 66.0, 60.0, 44.0, 23.0, 36.0, 22.0, 15.0, 14.0, 18.0, 7.0, 6.0, 4.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.002685546875, -0.0026152729988098145, -0.002544999122619629, -0.0024747252464294434, -0.002404451370239258, -0.0023341774940490723, -0.0022639036178588867, -0.002193629741668701, -0.0021233558654785156, -0.00205308198928833, -0.0019828081130981445, -0.001912534236907959, -0.0018422603607177734, -0.0017719864845275879, -0.0017017126083374023, -0.0016314387321472168, -0.0015611648559570312, -0.0014908909797668457, -0.0014206171035766602, -0.0013503432273864746, -0.001280069351196289, -0.0012097954750061035, -0.001139521598815918, -0.0010692477226257324, -0.0009989738464355469, -0.0009286999702453613, -0.0008584260940551758, -0.0007881522178649902, -0.0007178783416748047, -0.0006476044654846191, -0.0005773305892944336, -0.000507056713104248, -0.0004367828369140625, -0.00036650896072387695, -0.0002962350845336914, -0.00022596120834350586, -0.0001556873321533203, -8.541345596313477e-05, -1.5139579772949219e-05, 5.513429641723633e-05, 0.00012540817260742188, 0.00019568204879760742, 0.00026595592498779297, 0.0003362298011779785, 0.00040650367736816406, 0.0004767775535583496, 0.0005470514297485352, 0.0006173253059387207, 0.0006875991821289062, 0.0007578730583190918, 0.0008281469345092773, 0.0008984208106994629, 0.0009686946868896484, 0.001038968563079834, 0.0011092424392700195, 0.001179516315460205, 0.0012497901916503906, 0.0013200640678405762, 0.0013903379440307617, 0.0014606118202209473, 0.0015308856964111328, 0.0016011595726013184, 0.001671433448791504, 0.0017417073249816895, 0.001811981201171875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 2.0, 5.0, 5.0, 8.0, 7.0, 11.0, 31.0, 54.0, 72.0, 89.0, 170.0, 332.0, 608.0, 1353.0, 3384.0, 9842.0, 39566.0, 244841.0, 560544.0, 149027.0, 26245.0, 7190.0, 2617.0, 1165.0, 605.0, 322.0, 163.0, 114.0, 57.0, 30.0, 30.0, 15.0, 17.0, 9.0, 11.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.0, -21.196044921875, -20.39208984375, -19.588134765625, -18.7841796875, -17.980224609375, -17.17626953125, -16.372314453125, -15.568359375, -14.764404296875, -13.96044921875, -13.156494140625, -12.3525390625, -11.548583984375, -10.74462890625, -9.940673828125, -9.13671875, -8.332763671875, -7.52880859375, -6.724853515625, -5.9208984375, -5.116943359375, -4.31298828125, -3.509033203125, -2.705078125, -1.901123046875, -1.09716796875, -0.293212890625, 0.5107421875, 1.314697265625, 2.11865234375, 2.922607421875, 3.7265625, 4.530517578125, 5.33447265625, 6.138427734375, 6.9423828125, 7.746337890625, 8.55029296875, 9.354248046875, 10.158203125, 10.962158203125, 11.76611328125, 12.570068359375, 13.3740234375, 14.177978515625, 14.98193359375, 15.785888671875, 16.58984375, 17.393798828125, 18.19775390625, 19.001708984375, 19.8056640625, 20.609619140625, 21.41357421875, 22.217529296875, 23.021484375, 23.825439453125, 24.62939453125, 25.433349609375, 26.2373046875, 27.041259765625, 27.84521484375, 28.649169921875, 29.453125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 3.0, 8.0, 20.0, 19.0, 40.0, 62.0, 79.0, 103.0, 129.0, 124.0, 129.0, 110.0, 65.0, 34.0, 30.0, 22.0, 8.0, 10.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4375, -9.890869140625, -9.34423828125, -8.797607421875, -8.2509765625, -7.704345703125, -7.15771484375, -6.611083984375, -6.064453125, -5.517822265625, -4.97119140625, -4.424560546875, -3.8779296875, -3.331298828125, -2.78466796875, -2.238037109375, -1.69140625, -1.144775390625, -0.59814453125, -0.051513671875, 0.4951171875, 1.041748046875, 1.58837890625, 2.135009765625, 2.681640625, 3.228271484375, 3.77490234375, 4.321533203125, 4.8681640625, 5.414794921875, 5.96142578125, 6.508056640625, 7.0546875, 7.601318359375, 8.14794921875, 8.694580078125, 9.2412109375, 9.787841796875, 10.33447265625, 10.881103515625, 11.427734375, 11.974365234375, 12.52099609375, 13.067626953125, 13.6142578125, 14.160888671875, 14.70751953125, 15.254150390625, 15.80078125, 16.347412109375, 16.89404296875, 17.440673828125, 17.9873046875, 18.533935546875, 19.08056640625, 19.627197265625, 20.173828125, 20.720458984375, 21.26708984375, 21.813720703125, 22.3603515625, 22.906982421875, 23.45361328125, 24.000244140625, 24.546875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 5.0, 10.0, 22.0, 49.0, 123.0, 176.0, 215.0, 206.0, 115.0, 45.0, 14.0, 9.0, 10.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-234.92721557617188, -227.93663024902344, -220.94606018066406, -213.95547485351562, -206.96490478515625, -199.9743194580078, -192.98373413085938, -185.9931640625, -179.00259399414062, -172.0120086669922, -165.0214385986328, -158.03085327148438, -151.040283203125, -144.04969787597656, -137.05911254882812, -130.06854248046875, -123.07795715332031, -116.0873794555664, -109.0968017578125, -102.10621643066406, -95.11564636230469, -88.12506103515625, -81.13448333740234, -74.14390563964844, -67.15332794189453, -60.162750244140625, -53.17217254638672, -46.18159103393555, -39.19101333618164, -32.200435638427734, -25.209854125976562, -18.219276428222656, -11.22869873046875, -4.238120079040527, 2.7524585723876953, 9.743038177490234, 16.73361587524414, 23.724193572998047, 30.71477508544922, 37.705352783203125, 44.69593048095703, 51.68650817871094, 58.677085876464844, 65.66766357421875, 72.65824890136719, 79.64881896972656, 86.639404296875, 93.6299819946289, 100.62055969238281, 107.61113739013672, 114.60171508789062, 121.59230041503906, 128.58287048339844, 135.57345581054688, 142.56402587890625, 149.5546112060547, 156.54519653320312, 163.53578186035156, 170.52635192871094, 177.51693725585938, 184.50750732421875, 191.4980926513672, 198.48867797851562, 205.479248046875, 212.46981811523438]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 4.0, 0.0, 0.0, 4.0, 7.0, 8.0, 5.0, 6.0, 11.0, 13.0, 13.0, 14.0, 20.0, 17.0, 21.0, 32.0, 31.0, 36.0, 36.0, 42.0, 37.0, 35.0, 57.0, 38.0, 43.0, 44.0, 41.0, 50.0, 39.0, 37.0, 32.0, 42.0, 23.0, 30.0, 19.0, 23.0, 17.0, 11.0, 17.0, 3.0, 9.0, 10.0, 7.0, 6.0, 3.0, 1.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-66.568115234375, -64.40438842773438, -62.24066925048828, -60.07694625854492, -57.91322326660156, -55.74949645996094, -53.58577346801758, -51.42205047607422, -49.25832748413086, -47.0946044921875, -44.93088150024414, -42.76715850830078, -40.603431701660156, -38.43971252441406, -36.27598571777344, -34.11226272583008, -31.94853973388672, -29.78481674194336, -27.62109375, -25.457368850708008, -23.29364585876465, -21.12992286682129, -18.966197967529297, -16.802474975585938, -14.638751983642578, -12.475028991699219, -10.311305046081543, -8.147581100463867, -5.983858108520508, -3.8201351165771484, -1.6564111709594727, 0.5073127746582031, 2.6710357666015625, 4.83475923538208, 6.998482704162598, 9.162206649780273, 11.325929641723633, 13.489652633666992, 15.653376579284668, 17.817100524902344, 19.980823516845703, 22.144546508789062, 24.308269500732422, 26.471994400024414, 28.635717391967773, 30.799440383911133, 32.963165283203125, 35.126888275146484, 37.290611267089844, 39.4543342590332, 41.61805725097656, 43.78178024291992, 45.94550323486328, 48.109230041503906, 50.272953033447266, 52.436676025390625, 54.600399017333984, 56.764122009277344, 58.9278450012207, 61.09156799316406, 63.25529479980469, 65.41901397705078, 67.5827407836914, 69.7464599609375, 71.91018676757812]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 5.0, 3.0, 3.0, 10.0, 8.0, 24.0, 21.0, 31.0, 26.0, 65.0, 97.0, 139.0, 212.0, 411.0, 811.0, 2154.0, 6706.0, 24909.0, 169851.0, 3646212.0, 293459.0, 34831.0, 8809.0, 3005.0, 1214.0, 526.0, 268.0, 156.0, 113.0, 64.0, 38.0, 24.0, 29.0, 16.0, 8.0, 6.0, 6.0, 6.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.15625, -41.79052734375, -40.4248046875, -39.05908203125, -37.693359375, -36.32763671875, -34.9619140625, -33.59619140625, -32.23046875, -30.86474609375, -29.4990234375, -28.13330078125, -26.767578125, -25.40185546875, -24.0361328125, -22.67041015625, -21.3046875, -19.93896484375, -18.5732421875, -17.20751953125, -15.841796875, -14.47607421875, -13.1103515625, -11.74462890625, -10.37890625, -9.01318359375, -7.6474609375, -6.28173828125, -4.916015625, -3.55029296875, -2.1845703125, -0.81884765625, 0.546875, 1.91259765625, 3.2783203125, 4.64404296875, 6.009765625, 7.37548828125, 8.7412109375, 10.10693359375, 11.47265625, 12.83837890625, 14.2041015625, 15.56982421875, 16.935546875, 18.30126953125, 19.6669921875, 21.03271484375, 22.3984375, 23.76416015625, 25.1298828125, 26.49560546875, 27.861328125, 29.22705078125, 30.5927734375, 31.95849609375, 33.32421875, 34.68994140625, 36.0556640625, 37.42138671875, 38.787109375, 40.15283203125, 41.5185546875, 42.88427734375, 44.25]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 6.0, 5.0, 8.0, 15.0, 11.0, 17.0, 33.0, 26.0, 21.0, 39.0, 43.0, 43.0, 58.0, 73.0, 60.0, 55.0, 43.0, 52.0, 55.0, 54.0, 39.0, 38.0, 36.0, 39.0, 25.0, 21.0, 26.0, 17.0, 6.0, 6.0, 6.0, 6.0, 5.0, 7.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-3.044921875, -2.964935302734375, -2.88494873046875, -2.804962158203125, -2.7249755859375, -2.644989013671875, -2.56500244140625, -2.485015869140625, -2.405029296875, -2.325042724609375, -2.24505615234375, -2.165069580078125, -2.0850830078125, -2.005096435546875, -1.92510986328125, -1.845123291015625, -1.76513671875, -1.685150146484375, -1.60516357421875, -1.525177001953125, -1.4451904296875, -1.365203857421875, -1.28521728515625, -1.205230712890625, -1.125244140625, -1.045257568359375, -0.96527099609375, -0.885284423828125, -0.8052978515625, -0.725311279296875, -0.64532470703125, -0.565338134765625, -0.4853515625, -0.405364990234375, -0.32537841796875, -0.245391845703125, -0.1654052734375, -0.085418701171875, -0.00543212890625, 0.074554443359375, 0.154541015625, 0.234527587890625, 0.31451416015625, 0.394500732421875, 0.4744873046875, 0.554473876953125, 0.63446044921875, 0.714447021484375, 0.79443359375, 0.874420166015625, 0.95440673828125, 1.034393310546875, 1.1143798828125, 1.194366455078125, 1.27435302734375, 1.354339599609375, 1.434326171875, 1.514312744140625, 1.59429931640625, 1.674285888671875, 1.7542724609375, 1.834259033203125, 1.91424560546875, 1.994232177734375, 2.07421875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 4.0, 3.0, 9.0, 12.0, 11.0, 18.0, 13.0, 37.0, 40.0, 63.0, 115.0, 166.0, 342.0, 655.0, 1637.0, 6923.0, 129404.0, 3945832.0, 98761.0, 6665.0, 1851.0, 789.0, 370.0, 221.0, 101.0, 60.0, 44.0, 32.0, 21.0, 26.0, 14.0, 15.0, 6.0, 8.0, 6.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-82.875, -80.5380859375, -78.201171875, -75.8642578125, -73.52734375, -71.1904296875, -68.853515625, -66.5166015625, -64.1796875, -61.8427734375, -59.505859375, -57.1689453125, -54.83203125, -52.4951171875, -50.158203125, -47.8212890625, -45.484375, -43.1474609375, -40.810546875, -38.4736328125, -36.13671875, -33.7998046875, -31.462890625, -29.1259765625, -26.7890625, -24.4521484375, -22.115234375, -19.7783203125, -17.44140625, -15.1044921875, -12.767578125, -10.4306640625, -8.09375, -5.7568359375, -3.419921875, -1.0830078125, 1.25390625, 3.5908203125, 5.927734375, 8.2646484375, 10.6015625, 12.9384765625, 15.275390625, 17.6123046875, 19.94921875, 22.2861328125, 24.623046875, 26.9599609375, 29.296875, 31.6337890625, 33.970703125, 36.3076171875, 38.64453125, 40.9814453125, 43.318359375, 45.6552734375, 47.9921875, 50.3291015625, 52.666015625, 55.0029296875, 57.33984375, 59.6767578125, 62.013671875, 64.3505859375, 66.6875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 12.0, 14.0, 15.0, 36.0, 37.0, 60.0, 116.0, 182.0, 283.0, 646.0, 1159.0, 659.0, 340.0, 174.0, 100.0, 64.0, 43.0, 29.0, 29.0, 13.0, 14.0, 8.0, 7.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.4765625, -5.2529296875, -5.029296875, -4.8056640625, -4.58203125, -4.3583984375, -4.134765625, -3.9111328125, -3.6875, -3.4638671875, -3.240234375, -3.0166015625, -2.79296875, -2.5693359375, -2.345703125, -2.1220703125, -1.8984375, -1.6748046875, -1.451171875, -1.2275390625, -1.00390625, -0.7802734375, -0.556640625, -0.3330078125, -0.109375, 0.1142578125, 0.337890625, 0.5615234375, 0.78515625, 1.0087890625, 1.232421875, 1.4560546875, 1.6796875, 1.9033203125, 2.126953125, 2.3505859375, 2.57421875, 2.7978515625, 3.021484375, 3.2451171875, 3.46875, 3.6923828125, 3.916015625, 4.1396484375, 4.36328125, 4.5869140625, 4.810546875, 5.0341796875, 5.2578125, 5.4814453125, 5.705078125, 5.9287109375, 6.15234375, 6.3759765625, 6.599609375, 6.8232421875, 7.046875, 7.2705078125, 7.494140625, 7.7177734375, 7.94140625, 8.1650390625, 8.388671875, 8.6123046875, 8.8359375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 6.0, 3.0, 3.0, 13.0, 20.0, 34.0, 42.0, 62.0, 109.0, 120.0, 143.0, 121.0, 113.0, 74.0, 49.0, 29.0, 14.0, 18.0, 5.0, 9.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.70625305175781, -48.78070068359375, -46.85515213012695, -44.92959976196289, -43.004051208496094, -41.07849884033203, -39.15294647216797, -37.22739791870117, -35.301849365234375, -33.37629699707031, -31.450748443603516, -29.525196075439453, -27.599647521972656, -25.674095153808594, -23.748544692993164, -21.822994232177734, -19.897441864013672, -17.971891403198242, -16.046340942382812, -14.120789527893066, -12.195239067077637, -10.269688606262207, -8.344137191772461, -6.418586730957031, -4.493036270141602, -2.5674855709075928, -0.641934871673584, 1.283616065979004, 3.2091665267944336, 5.134716987609863, 7.060268402099609, 8.985818862915039, 10.911369323730469, 12.836919784545898, 14.762470245361328, 16.68802261352539, 18.613571166992188, 20.53912353515625, 22.46467399597168, 24.39022445678711, 26.31577491760254, 28.24132537841797, 30.1668758392334, 32.09242630004883, 34.01797866821289, 35.94352722167969, 37.86907958984375, 39.79463195800781, 41.72018051147461, 43.64573287963867, 45.57128143310547, 47.49683380126953, 49.42238235473633, 51.34793472290039, 53.27348327636719, 55.19903564453125, 57.12458801269531, 59.050140380859375, 60.97568893432617, 62.901241302490234, 64.82678985595703, 66.7523422241211, 68.67789459228516, 70.60343933105469, 72.52899169921875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 4.0, 9.0, 7.0, 21.0, 23.0, 35.0, 39.0, 33.0, 52.0, 50.0, 58.0, 67.0, 63.0, 63.0, 61.0, 65.0, 65.0, 57.0, 49.0, 36.0, 40.0, 28.0, 20.0, 18.0, 9.0, 12.0, 7.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-50.2838249206543, -49.11212921142578, -47.940433502197266, -46.76873779296875, -45.5970458984375, -44.425350189208984, -43.25365447998047, -42.08195877075195, -40.91026306152344, -39.73856735229492, -38.566871643066406, -37.39517593383789, -36.223480224609375, -35.051788330078125, -33.88009262084961, -32.708396911621094, -31.536701202392578, -30.365005493164062, -29.193309783935547, -28.021615982055664, -26.84992027282715, -25.678224563598633, -24.50653076171875, -23.334835052490234, -22.16313934326172, -20.991443634033203, -19.819747924804688, -18.648054122924805, -17.47635841369629, -16.304662704467773, -15.132967948913574, -13.961273193359375, -12.789581298828125, -11.61788558959961, -10.44619083404541, -9.274496078491211, -8.102800369262695, -6.931105136871338, -5.7594099044799805, -4.587715148925781, -3.4160194396972656, -2.244324207305908, -1.0726289749145508, 0.09906625747680664, 1.270761489868164, 2.4424567222595215, 3.614151954650879, 4.785846710205078, 5.957542419433594, 7.129237651824951, 8.300932884216309, 9.472627639770508, 10.644323348999023, 11.816019058227539, 12.987713813781738, 14.159408569335938, 15.331104278564453, 16.50279998779297, 17.674495697021484, 18.846189498901367, 20.017885208129883, 21.1895809173584, 22.36127471923828, 23.532970428466797, 24.704666137695312]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 7.0, 7.0, 8.0, 18.0, 27.0, 27.0, 57.0, 57.0, 119.0, 220.0, 391.0, 883.0, 2290.0, 8240.0, 41826.0, 251749.0, 545449.0, 161563.0, 26735.0, 5630.0, 1808.0, 684.0, 295.0, 181.0, 119.0, 43.0, 38.0, 31.0, 21.0, 8.0, 9.0, 3.0, 9.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-28.375, -27.440673828125, -26.50634765625, -25.572021484375, -24.6376953125, -23.703369140625, -22.76904296875, -21.834716796875, -20.900390625, -19.966064453125, -19.03173828125, -18.097412109375, -17.1630859375, -16.228759765625, -15.29443359375, -14.360107421875, -13.42578125, -12.491455078125, -11.55712890625, -10.622802734375, -9.6884765625, -8.754150390625, -7.81982421875, -6.885498046875, -5.951171875, -5.016845703125, -4.08251953125, -3.148193359375, -2.2138671875, -1.279541015625, -0.34521484375, 0.589111328125, 1.5234375, 2.457763671875, 3.39208984375, 4.326416015625, 5.2607421875, 6.195068359375, 7.12939453125, 8.063720703125, 8.998046875, 9.932373046875, 10.86669921875, 11.801025390625, 12.7353515625, 13.669677734375, 14.60400390625, 15.538330078125, 16.47265625, 17.406982421875, 18.34130859375, 19.275634765625, 20.2099609375, 21.144287109375, 22.07861328125, 23.012939453125, 23.947265625, 24.881591796875, 25.81591796875, 26.750244140625, 27.6845703125, 28.618896484375, 29.55322265625, 30.487548828125, 31.421875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 8.0, 3.0, 7.0, 12.0, 18.0, 11.0, 24.0, 37.0, 18.0, 38.0, 43.0, 53.0, 45.0, 47.0, 57.0, 55.0, 57.0, 47.0, 43.0, 60.0, 50.0, 44.0, 32.0, 43.0, 31.0, 27.0, 23.0, 22.0, 15.0, 8.0, 4.0, 4.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.947265625, -2.86199951171875, -2.7767333984375, -2.69146728515625, -2.606201171875, -2.52093505859375, -2.4356689453125, -2.35040283203125, -2.26513671875, -2.17987060546875, -2.0946044921875, -2.00933837890625, -1.924072265625, -1.83880615234375, -1.7535400390625, -1.66827392578125, -1.5830078125, -1.49774169921875, -1.4124755859375, -1.32720947265625, -1.241943359375, -1.15667724609375, -1.0714111328125, -0.98614501953125, -0.90087890625, -0.81561279296875, -0.7303466796875, -0.64508056640625, -0.559814453125, -0.47454833984375, -0.3892822265625, -0.30401611328125, -0.21875, -0.13348388671875, -0.0482177734375, 0.03704833984375, 0.122314453125, 0.20758056640625, 0.2928466796875, 0.37811279296875, 0.46337890625, 0.54864501953125, 0.6339111328125, 0.71917724609375, 0.804443359375, 0.88970947265625, 0.9749755859375, 1.06024169921875, 1.1455078125, 1.23077392578125, 1.3160400390625, 1.40130615234375, 1.486572265625, 1.57183837890625, 1.6571044921875, 1.74237060546875, 1.82763671875, 1.91290283203125, 1.9981689453125, 2.08343505859375, 2.168701171875, 2.25396728515625, 2.3392333984375, 2.42449951171875, 2.509765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 5.0, 3.0, 3.0, 8.0, 7.0, 7.0, 7.0, 11.0, 17.0, 22.0, 35.0, 40.0, 67.0, 79.0, 132.0, 164.0, 255.0, 338.0, 545.0, 802.0, 1438.0, 2434.0, 4797.0, 10687.0, 27482.0, 73153.0, 182664.0, 319578.0, 244575.0, 108073.0, 40412.0, 15983.0, 6835.0, 3119.0, 1694.0, 1043.0, 627.0, 435.0, 294.0, 190.0, 140.0, 104.0, 57.0, 50.0, 32.0, 38.0, 23.0, 18.0, 13.0, 7.0, 5.0, 6.0, 7.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-12.8203125, -12.388671875, -11.95703125, -11.525390625, -11.09375, -10.662109375, -10.23046875, -9.798828125, -9.3671875, -8.935546875, -8.50390625, -8.072265625, -7.640625, -7.208984375, -6.77734375, -6.345703125, -5.9140625, -5.482421875, -5.05078125, -4.619140625, -4.1875, -3.755859375, -3.32421875, -2.892578125, -2.4609375, -2.029296875, -1.59765625, -1.166015625, -0.734375, -0.302734375, 0.12890625, 0.560546875, 0.9921875, 1.423828125, 1.85546875, 2.287109375, 2.71875, 3.150390625, 3.58203125, 4.013671875, 4.4453125, 4.876953125, 5.30859375, 5.740234375, 6.171875, 6.603515625, 7.03515625, 7.466796875, 7.8984375, 8.330078125, 8.76171875, 9.193359375, 9.625, 10.056640625, 10.48828125, 10.919921875, 11.3515625, 11.783203125, 12.21484375, 12.646484375, 13.078125, 13.509765625, 13.94140625, 14.373046875, 14.8046875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 4.0, 7.0, 3.0, 6.0, 10.0, 7.0, 3.0, 11.0, 10.0, 15.0, 22.0, 13.0, 20.0, 30.0, 31.0, 29.0, 36.0, 24.0, 47.0, 45.0, 41.0, 43.0, 37.0, 34.0, 34.0, 40.0, 52.0, 40.0, 37.0, 29.0, 33.0, 30.0, 23.0, 19.0, 21.0, 21.0, 14.0, 10.0, 13.0, 11.0, 6.0, 13.0, 4.0, 7.0, 6.0, 6.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.8515625, -10.5196533203125, -10.187744140625, -9.8558349609375, -9.52392578125, -9.1920166015625, -8.860107421875, -8.5281982421875, -8.1962890625, -7.8643798828125, -7.532470703125, -7.2005615234375, -6.86865234375, -6.5367431640625, -6.204833984375, -5.8729248046875, -5.541015625, -5.2091064453125, -4.877197265625, -4.5452880859375, -4.21337890625, -3.8814697265625, -3.549560546875, -3.2176513671875, -2.8857421875, -2.5538330078125, -2.221923828125, -1.8900146484375, -1.55810546875, -1.2261962890625, -0.894287109375, -0.5623779296875, -0.23046875, 0.1014404296875, 0.433349609375, 0.7652587890625, 1.09716796875, 1.4290771484375, 1.760986328125, 2.0928955078125, 2.4248046875, 2.7567138671875, 3.088623046875, 3.4205322265625, 3.75244140625, 4.0843505859375, 4.416259765625, 4.7481689453125, 5.080078125, 5.4119873046875, 5.743896484375, 6.0758056640625, 6.40771484375, 6.7396240234375, 7.071533203125, 7.4034423828125, 7.7353515625, 8.0672607421875, 8.399169921875, 8.7310791015625, 9.06298828125, 9.3948974609375, 9.726806640625, 10.0587158203125, 10.390625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 5.0, 4.0, 13.0, 11.0, 31.0, 39.0, 45.0, 101.0, 193.0, 340.0, 764.0, 1801.0, 5680.0, 23094.0, 159950.0, 650600.0, 172333.0, 24142.0, 5927.0, 1933.0, 746.0, 350.0, 182.0, 91.0, 66.0, 38.0, 31.0, 15.0, 8.0, 5.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-27.765625, -27.06298828125, -26.3603515625, -25.65771484375, -24.955078125, -24.25244140625, -23.5498046875, -22.84716796875, -22.14453125, -21.44189453125, -20.7392578125, -20.03662109375, -19.333984375, -18.63134765625, -17.9287109375, -17.22607421875, -16.5234375, -15.82080078125, -15.1181640625, -14.41552734375, -13.712890625, -13.01025390625, -12.3076171875, -11.60498046875, -10.90234375, -10.19970703125, -9.4970703125, -8.79443359375, -8.091796875, -7.38916015625, -6.6865234375, -5.98388671875, -5.28125, -4.57861328125, -3.8759765625, -3.17333984375, -2.470703125, -1.76806640625, -1.0654296875, -0.36279296875, 0.33984375, 1.04248046875, 1.7451171875, 2.44775390625, 3.150390625, 3.85302734375, 4.5556640625, 5.25830078125, 5.9609375, 6.66357421875, 7.3662109375, 8.06884765625, 8.771484375, 9.47412109375, 10.1767578125, 10.87939453125, 11.58203125, 12.28466796875, 12.9873046875, 13.68994140625, 14.392578125, 15.09521484375, 15.7978515625, 16.50048828125, 17.203125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 9.0, 3.0, 9.0, 5.0, 10.0, 10.0, 20.0, 18.0, 32.0, 39.0, 40.0, 40.0, 57.0, 77.0, 85.0, 80.0, 72.0, 54.0, 65.0, 60.0, 44.0, 24.0, 35.0, 16.0, 18.0, 15.0, 9.0, 5.0, 8.0, 5.0, 6.0, 6.0, 6.0, 0.0, 8.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0015048980712890625, -0.0014551281929016113, -0.0014053583145141602, -0.001355588436126709, -0.0013058185577392578, -0.0012560486793518066, -0.0012062788009643555, -0.0011565089225769043, -0.0011067390441894531, -0.001056969165802002, -0.0010071992874145508, -0.0009574294090270996, -0.0009076595306396484, -0.0008578896522521973, -0.0008081197738647461, -0.0007583498954772949, -0.0007085800170898438, -0.0006588101387023926, -0.0006090402603149414, -0.0005592703819274902, -0.0005095005035400391, -0.0004597306251525879, -0.0004099607467651367, -0.00036019086837768555, -0.0003104209899902344, -0.0002606511116027832, -0.00021088123321533203, -0.00016111135482788086, -0.00011134147644042969, -6.157159805297852e-05, -1.1801719665527344e-05, 3.796815872192383e-05, 8.7738037109375e-05, 0.00013750791549682617, 0.00018727779388427734, 0.00023704767227172852, 0.0002868175506591797, 0.00033658742904663086, 0.00038635730743408203, 0.0004361271858215332, 0.0004858970642089844, 0.0005356669425964355, 0.0005854368209838867, 0.0006352066993713379, 0.0006849765777587891, 0.0007347464561462402, 0.0007845163345336914, 0.0008342862129211426, 0.0008840560913085938, 0.0009338259696960449, 0.000983595848083496, 0.0010333657264709473, 0.0010831356048583984, 0.0011329054832458496, 0.0011826753616333008, 0.001232445240020752, 0.0012822151184082031, 0.0013319849967956543, 0.0013817548751831055, 0.0014315247535705566, 0.0014812946319580078, 0.001531064510345459, 0.0015808343887329102, 0.0016306042671203613, 0.0016803741455078125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 6.0, 3.0, 1.0, 3.0, 8.0, 5.0, 14.0, 18.0, 25.0, 40.0, 52.0, 92.0, 132.0, 238.0, 480.0, 808.0, 1650.0, 3719.0, 9297.0, 28158.0, 134758.0, 555573.0, 247042.0, 43998.0, 12920.0, 4982.0, 2130.0, 1023.0, 587.0, 300.0, 155.0, 125.0, 70.0, 45.0, 26.0, 20.0, 12.0, 11.0, 9.0, 5.0, 8.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.0625, -17.45361328125, -16.8447265625, -16.23583984375, -15.626953125, -15.01806640625, -14.4091796875, -13.80029296875, -13.19140625, -12.58251953125, -11.9736328125, -11.36474609375, -10.755859375, -10.14697265625, -9.5380859375, -8.92919921875, -8.3203125, -7.71142578125, -7.1025390625, -6.49365234375, -5.884765625, -5.27587890625, -4.6669921875, -4.05810546875, -3.44921875, -2.84033203125, -2.2314453125, -1.62255859375, -1.013671875, -0.40478515625, 0.2041015625, 0.81298828125, 1.421875, 2.03076171875, 2.6396484375, 3.24853515625, 3.857421875, 4.46630859375, 5.0751953125, 5.68408203125, 6.29296875, 6.90185546875, 7.5107421875, 8.11962890625, 8.728515625, 9.33740234375, 9.9462890625, 10.55517578125, 11.1640625, 11.77294921875, 12.3818359375, 12.99072265625, 13.599609375, 14.20849609375, 14.8173828125, 15.42626953125, 16.03515625, 16.64404296875, 17.2529296875, 17.86181640625, 18.470703125, 19.07958984375, 19.6884765625, 20.29736328125, 20.90625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 7.0, 11.0, 10.0, 21.0, 27.0, 37.0, 33.0, 40.0, 66.0, 82.0, 73.0, 63.0, 72.0, 78.0, 75.0, 55.0, 60.0, 44.0, 20.0, 23.0, 25.0, 19.0, 8.0, 13.0, 10.0, 3.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.6015625, -9.3111572265625, -9.020751953125, -8.7303466796875, -8.43994140625, -8.1495361328125, -7.859130859375, -7.5687255859375, -7.2783203125, -6.9879150390625, -6.697509765625, -6.4071044921875, -6.11669921875, -5.8262939453125, -5.535888671875, -5.2454833984375, -4.955078125, -4.6646728515625, -4.374267578125, -4.0838623046875, -3.79345703125, -3.5030517578125, -3.212646484375, -2.9222412109375, -2.6318359375, -2.3414306640625, -2.051025390625, -1.7606201171875, -1.47021484375, -1.1798095703125, -0.889404296875, -0.5989990234375, -0.30859375, -0.0181884765625, 0.272216796875, 0.5626220703125, 0.85302734375, 1.1434326171875, 1.433837890625, 1.7242431640625, 2.0146484375, 2.3050537109375, 2.595458984375, 2.8858642578125, 3.17626953125, 3.4666748046875, 3.757080078125, 4.0474853515625, 4.337890625, 4.6282958984375, 4.918701171875, 5.2091064453125, 5.49951171875, 5.7899169921875, 6.080322265625, 6.3707275390625, 6.6611328125, 6.9515380859375, 7.241943359375, 7.5323486328125, 7.82275390625, 8.1131591796875, 8.403564453125, 8.6939697265625, 8.984375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 20.0, 55.0, 100.0, 186.0, 210.0, 200.0, 137.0, 46.0, 25.0, 9.0, 5.0, 9.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-365.9214782714844, -358.5467529296875, -351.1720275878906, -343.79730224609375, -336.4225769042969, -329.0478515625, -321.6731262207031, -314.29840087890625, -306.9236755371094, -299.5489501953125, -292.1742248535156, -284.79949951171875, -277.4247741699219, -270.050048828125, -262.6753234863281, -255.30059814453125, -247.92588806152344, -240.55116271972656, -233.1764373779297, -225.8017120361328, -218.42698669433594, -211.05226135253906, -203.67755126953125, -196.30282592773438, -188.9281005859375, -181.55337524414062, -174.17864990234375, -166.80392456054688, -159.42919921875, -152.05447387695312, -144.67974853515625, -137.30502319335938, -129.93028259277344, -122.55555725097656, -115.18083190917969, -107.80610656738281, -100.43138122558594, -93.05665588378906, -85.68193817138672, -78.30721282958984, -70.93248748779297, -63.557762145996094, -56.18303680419922, -48.80831527709961, -41.433589935302734, -34.05886459350586, -26.68414306640625, -19.309417724609375, -11.9346923828125, -4.559967994689941, 2.814756393432617, 10.18947982788086, 17.564205169677734, 24.93893051147461, 32.31365203857422, 39.688377380371094, 47.06310272216797, 54.437828063964844, 61.81255340576172, 69.18727111816406, 76.56199645996094, 83.93672180175781, 91.31144714355469, 98.68617248535156, 106.06089782714844]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 6.0, 5.0, 5.0, 11.0, 15.0, 17.0, 21.0, 25.0, 25.0, 37.0, 23.0, 29.0, 37.0, 46.0, 41.0, 47.0, 56.0, 46.0, 55.0, 38.0, 54.0, 46.0, 44.0, 29.0, 46.0, 36.0, 26.0, 25.0, 23.0, 18.0, 16.0, 13.0, 8.0, 8.0, 6.0, 6.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-84.3667984008789, -81.9338607788086, -79.50093078613281, -77.0679931640625, -74.63506317138672, -72.2021255493164, -69.76919555664062, -67.33625793457031, -64.9033203125, -62.47038650512695, -60.037452697753906, -57.60451889038086, -55.17158508300781, -52.7386474609375, -50.30571365356445, -47.872779846191406, -45.439849853515625, -43.00691604614258, -40.57398223876953, -38.141048431396484, -35.70811462402344, -33.275177001953125, -30.842243194580078, -28.40930938720703, -25.976375579833984, -23.543441772460938, -21.11050796508789, -18.67757225036621, -16.244638442993164, -13.811704635620117, -11.378769874572754, -8.94583511352539, -6.5128936767578125, -4.079959392547607, -1.6470251083374023, 0.7859091758728027, 3.218843460083008, 5.651777267456055, 8.084712028503418, 10.517646789550781, 12.950580596923828, 15.383514404296875, 17.816448211669922, 20.2493839263916, 22.68231773376465, 25.115251541137695, 27.548187255859375, 29.981121063232422, 32.41405487060547, 34.846988677978516, 37.27992248535156, 39.71285629272461, 42.145790100097656, 44.57872772216797, 47.011661529541016, 49.44459533691406, 51.87752914428711, 54.310462951660156, 56.7433967590332, 59.17633056640625, 61.60926818847656, 64.04219818115234, 66.47513580322266, 68.90806579589844, 71.34100341796875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 8.0, 5.0, 6.0, 9.0, 13.0, 16.0, 14.0, 20.0, 31.0, 28.0, 32.0, 61.0, 64.0, 95.0, 142.0, 198.0, 260.0, 405.0, 647.0, 1106.0, 2218.0, 4889.0, 12751.0, 48425.0, 672236.0, 3328495.0, 89726.0, 19423.0, 6727.0, 2861.0, 1448.0, 759.0, 431.0, 232.0, 164.0, 113.0, 62.0, 44.0, 35.0, 14.0, 19.0, 13.0, 9.0, 11.0, 5.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-41.53125, -40.3828125, -39.234375, -38.0859375, -36.9375, -35.7890625, -34.640625, -33.4921875, -32.34375, -31.1953125, -30.046875, -28.8984375, -27.75, -26.6015625, -25.453125, -24.3046875, -23.15625, -22.0078125, -20.859375, -19.7109375, -18.5625, -17.4140625, -16.265625, -15.1171875, -13.96875, -12.8203125, -11.671875, -10.5234375, -9.375, -8.2265625, -7.078125, -5.9296875, -4.78125, -3.6328125, -2.484375, -1.3359375, -0.1875, 0.9609375, 2.109375, 3.2578125, 4.40625, 5.5546875, 6.703125, 7.8515625, 9.0, 10.1484375, 11.296875, 12.4453125, 13.59375, 14.7421875, 15.890625, 17.0390625, 18.1875, 19.3359375, 20.484375, 21.6328125, 22.78125, 23.9296875, 25.078125, 26.2265625, 27.375, 28.5234375, 29.671875, 30.8203125, 31.96875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 4.0, 5.0, 13.0, 14.0, 24.0, 29.0, 31.0, 41.0, 58.0, 69.0, 65.0, 61.0, 65.0, 67.0, 81.0, 60.0, 78.0, 58.0, 46.0, 27.0, 37.0, 22.0, 17.0, 12.0, 7.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.203125, -4.083343505859375, -3.96356201171875, -3.843780517578125, -3.7239990234375, -3.604217529296875, -3.48443603515625, -3.364654541015625, -3.244873046875, -3.125091552734375, -3.00531005859375, -2.885528564453125, -2.7657470703125, -2.645965576171875, -2.52618408203125, -2.406402587890625, -2.28662109375, -2.166839599609375, -2.04705810546875, -1.927276611328125, -1.8074951171875, -1.687713623046875, -1.56793212890625, -1.448150634765625, -1.328369140625, -1.208587646484375, -1.08880615234375, -0.969024658203125, -0.8492431640625, -0.729461669921875, -0.60968017578125, -0.489898681640625, -0.3701171875, -0.250335693359375, -0.13055419921875, -0.010772705078125, 0.1090087890625, 0.228790283203125, 0.34857177734375, 0.468353271484375, 0.588134765625, 0.707916259765625, 0.82769775390625, 0.947479248046875, 1.0672607421875, 1.187042236328125, 1.30682373046875, 1.426605224609375, 1.54638671875, 1.666168212890625, 1.78594970703125, 1.905731201171875, 2.0255126953125, 2.145294189453125, 2.26507568359375, 2.384857177734375, 2.504638671875, 2.624420166015625, 2.74420166015625, 2.863983154296875, 2.9837646484375, 3.103546142578125, 3.22332763671875, 3.343109130859375, 3.462890625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 7.0, 8.0, 8.0, 18.0, 18.0, 23.0, 55.0, 66.0, 100.0, 178.0, 318.0, 681.0, 2604.0, 26381.0, 3989997.0, 165971.0, 5664.0, 1145.0, 436.0, 247.0, 127.0, 81.0, 56.0, 34.0, 13.0, 21.0, 8.0, 8.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.4375, -95.4287109375, -92.419921875, -89.4111328125, -86.40234375, -83.3935546875, -80.384765625, -77.3759765625, -74.3671875, -71.3583984375, -68.349609375, -65.3408203125, -62.33203125, -59.3232421875, -56.314453125, -53.3056640625, -50.296875, -47.2880859375, -44.279296875, -41.2705078125, -38.26171875, -35.2529296875, -32.244140625, -29.2353515625, -26.2265625, -23.2177734375, -20.208984375, -17.2001953125, -14.19140625, -11.1826171875, -8.173828125, -5.1650390625, -2.15625, 0.8525390625, 3.861328125, 6.8701171875, 9.87890625, 12.8876953125, 15.896484375, 18.9052734375, 21.9140625, 24.9228515625, 27.931640625, 30.9404296875, 33.94921875, 36.9580078125, 39.966796875, 42.9755859375, 45.984375, 48.9931640625, 52.001953125, 55.0107421875, 58.01953125, 61.0283203125, 64.037109375, 67.0458984375, 70.0546875, 73.0634765625, 76.072265625, 79.0810546875, 82.08984375, 85.0986328125, 88.107421875, 91.1162109375, 94.125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 8.0, 15.0, 20.0, 54.0, 138.0, 728.0, 2379.0, 517.0, 124.0, 59.0, 20.0, 11.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-26.625, -26.01171875, -25.3984375, -24.78515625, -24.171875, -23.55859375, -22.9453125, -22.33203125, -21.71875, -21.10546875, -20.4921875, -19.87890625, -19.265625, -18.65234375, -18.0390625, -17.42578125, -16.8125, -16.19921875, -15.5859375, -14.97265625, -14.359375, -13.74609375, -13.1328125, -12.51953125, -11.90625, -11.29296875, -10.6796875, -10.06640625, -9.453125, -8.83984375, -8.2265625, -7.61328125, -7.0, -6.38671875, -5.7734375, -5.16015625, -4.546875, -3.93359375, -3.3203125, -2.70703125, -2.09375, -1.48046875, -0.8671875, -0.25390625, 0.359375, 0.97265625, 1.5859375, 2.19921875, 2.8125, 3.42578125, 4.0390625, 4.65234375, 5.265625, 5.87890625, 6.4921875, 7.10546875, 7.71875, 8.33203125, 8.9453125, 9.55859375, 10.171875, 10.78515625, 11.3984375, 12.01171875, 12.625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 14.0, 27.0, 74.0, 132.0, 229.0, 218.0, 157.0, 66.0, 51.0, 13.0, 9.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-121.55551147460938, -118.52092742919922, -115.48634338378906, -112.4517593383789, -109.41717529296875, -106.3825912475586, -103.34800720214844, -100.31341552734375, -97.27883911132812, -94.24425506591797, -91.20967102050781, -88.17508697509766, -85.1405029296875, -82.10591888427734, -79.07133483886719, -76.0367431640625, -73.00215911865234, -69.96757507324219, -66.93299102783203, -63.898406982421875, -60.86382293701172, -57.82923889160156, -54.79465103149414, -51.760066986083984, -48.72548294067383, -45.69089889526367, -42.656314849853516, -39.621726989746094, -36.58714294433594, -33.55255889892578, -30.517974853515625, -27.48339080810547, -24.448814392089844, -21.414230346679688, -18.37964630126953, -15.345060348510742, -12.310476303100586, -9.27589225769043, -6.241306304931641, -3.2067222595214844, -0.17213821411132812, 2.8624463081359863, 5.897030830383301, 8.931615829467773, 11.96619987487793, 15.000783920288086, 18.035369873046875, 21.06995391845703, 24.104537963867188, 27.139122009277344, 30.1737060546875, 33.208290100097656, 36.24287414550781, 39.27745819091797, 42.31204605102539, 45.34663009643555, 48.3812141418457, 51.41579818725586, 54.450382232666016, 57.48497009277344, 60.519554138183594, 63.55413818359375, 66.5887222290039, 69.62330627441406, 72.65789031982422]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 0.0, 5.0, 6.0, 1.0, 7.0, 12.0, 18.0, 22.0, 24.0, 29.0, 26.0, 31.0, 34.0, 43.0, 61.0, 56.0, 46.0, 67.0, 49.0, 67.0, 50.0, 62.0, 46.0, 42.0, 39.0, 32.0, 26.0, 22.0, 16.0, 13.0, 14.0, 11.0, 8.0, 8.0, 4.0, 4.0, 2.0, 0.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-33.97541809082031, -32.917293548583984, -31.859169006347656, -30.801042556762695, -29.742918014526367, -28.68479347229004, -27.626667022705078, -26.56854248046875, -25.510417938232422, -24.452293395996094, -23.394168853759766, -22.336042404174805, -21.277917861938477, -20.21979331970215, -19.161666870117188, -18.10354232788086, -17.04541778564453, -15.987293243408203, -14.929167747497559, -13.871042251586914, -12.812917709350586, -11.754793167114258, -10.696667671203613, -9.638542175292969, -8.58041763305664, -7.522292613983154, -6.464167594909668, -5.406042575836182, -4.347917556762695, -3.289792537689209, -2.2316675186157227, -1.1735424995422363, -0.11541748046875, 0.9427075386047363, 2.0008325576782227, 3.058957576751709, 4.117082595825195, 5.175207614898682, 6.233332633972168, 7.291457653045654, 8.34958267211914, 9.407707214355469, 10.465832710266113, 11.523958206176758, 12.582082748413086, 13.640207290649414, 14.698332786560059, 15.756458282470703, 16.81458282470703, 17.87270736694336, 18.930831909179688, 19.98895835876465, 21.047082901000977, 22.105207443237305, 23.163333892822266, 24.221458435058594, 25.279582977294922, 26.33770751953125, 27.395832061767578, 28.45395851135254, 29.512083053588867, 30.570207595825195, 31.628334045410156, 32.686458587646484, 33.74458312988281]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 0.0, 1.0, 5.0, 2.0, 4.0, 5.0, 6.0, 7.0, 13.0, 22.0, 34.0, 42.0, 58.0, 103.0, 181.0, 288.0, 559.0, 1075.0, 2637.0, 7405.0, 26601.0, 112657.0, 398704.0, 364915.0, 98439.0, 23345.0, 6818.0, 2341.0, 1050.0, 518.0, 245.0, 162.0, 106.0, 65.0, 40.0, 31.0, 14.0, 10.0, 14.0, 10.0, 5.0, 5.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-29.9375, -29.148681640625, -28.35986328125, -27.571044921875, -26.7822265625, -25.993408203125, -25.20458984375, -24.415771484375, -23.626953125, -22.838134765625, -22.04931640625, -21.260498046875, -20.4716796875, -19.682861328125, -18.89404296875, -18.105224609375, -17.31640625, -16.527587890625, -15.73876953125, -14.949951171875, -14.1611328125, -13.372314453125, -12.58349609375, -11.794677734375, -11.005859375, -10.217041015625, -9.42822265625, -8.639404296875, -7.8505859375, -7.061767578125, -6.27294921875, -5.484130859375, -4.6953125, -3.906494140625, -3.11767578125, -2.328857421875, -1.5400390625, -0.751220703125, 0.03759765625, 0.826416015625, 1.615234375, 2.404052734375, 3.19287109375, 3.981689453125, 4.7705078125, 5.559326171875, 6.34814453125, 7.136962890625, 7.92578125, 8.714599609375, 9.50341796875, 10.292236328125, 11.0810546875, 11.869873046875, 12.65869140625, 13.447509765625, 14.236328125, 15.025146484375, 15.81396484375, 16.602783203125, 17.3916015625, 18.180419921875, 18.96923828125, 19.758056640625, 20.546875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [4.0, 3.0, 4.0, 5.0, 5.0, 3.0, 4.0, 4.0, 9.0, 9.0, 14.0, 15.0, 4.0, 25.0, 17.0, 20.0, 19.0, 29.0, 39.0, 35.0, 38.0, 47.0, 54.0, 43.0, 51.0, 43.0, 49.0, 45.0, 46.0, 42.0, 43.0, 28.0, 37.0, 29.0, 20.0, 28.0, 17.0, 19.0, 18.0, 10.0, 11.0, 7.0, 9.0, 4.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.23828125, -2.14996337890625, -2.0616455078125, -1.97332763671875, -1.885009765625, -1.79669189453125, -1.7083740234375, -1.62005615234375, -1.53173828125, -1.44342041015625, -1.3551025390625, -1.26678466796875, -1.178466796875, -1.09014892578125, -1.0018310546875, -0.91351318359375, -0.8251953125, -0.73687744140625, -0.6485595703125, -0.56024169921875, -0.471923828125, -0.38360595703125, -0.2952880859375, -0.20697021484375, -0.11865234375, -0.03033447265625, 0.0579833984375, 0.14630126953125, 0.234619140625, 0.32293701171875, 0.4112548828125, 0.49957275390625, 0.587890625, 0.67620849609375, 0.7645263671875, 0.85284423828125, 0.941162109375, 1.02947998046875, 1.1177978515625, 1.20611572265625, 1.29443359375, 1.38275146484375, 1.4710693359375, 1.55938720703125, 1.647705078125, 1.73602294921875, 1.8243408203125, 1.91265869140625, 2.0009765625, 2.08929443359375, 2.1776123046875, 2.26593017578125, 2.354248046875, 2.44256591796875, 2.5308837890625, 2.61920166015625, 2.70751953125, 2.79583740234375, 2.8841552734375, 2.97247314453125, 3.060791015625, 3.14910888671875, 3.2374267578125, 3.32574462890625, 3.4140625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 7.0, 13.0, 15.0, 12.0, 19.0, 27.0, 28.0, 39.0, 45.0, 89.0, 121.0, 150.0, 214.0, 346.0, 472.0, 887.0, 1574.0, 3401.0, 8628.0, 26045.0, 85225.0, 249814.0, 385548.0, 191798.0, 62080.0, 18874.0, 6860.0, 2844.0, 1339.0, 709.0, 463.0, 256.0, 182.0, 123.0, 87.0, 59.0, 43.0, 30.0, 18.0, 18.0, 18.0, 8.0, 9.0, 4.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.140625, -17.596923828125, -17.05322265625, -16.509521484375, -15.9658203125, -15.422119140625, -14.87841796875, -14.334716796875, -13.791015625, -13.247314453125, -12.70361328125, -12.159912109375, -11.6162109375, -11.072509765625, -10.52880859375, -9.985107421875, -9.44140625, -8.897705078125, -8.35400390625, -7.810302734375, -7.2666015625, -6.722900390625, -6.17919921875, -5.635498046875, -5.091796875, -4.548095703125, -4.00439453125, -3.460693359375, -2.9169921875, -2.373291015625, -1.82958984375, -1.285888671875, -0.7421875, -0.198486328125, 0.34521484375, 0.888916015625, 1.4326171875, 1.976318359375, 2.52001953125, 3.063720703125, 3.607421875, 4.151123046875, 4.69482421875, 5.238525390625, 5.7822265625, 6.325927734375, 6.86962890625, 7.413330078125, 7.95703125, 8.500732421875, 9.04443359375, 9.588134765625, 10.1318359375, 10.675537109375, 11.21923828125, 11.762939453125, 12.306640625, 12.850341796875, 13.39404296875, 13.937744140625, 14.4814453125, 15.025146484375, 15.56884765625, 16.112548828125, 16.65625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 8.0, 3.0, 9.0, 15.0, 12.0, 15.0, 21.0, 15.0, 22.0, 30.0, 27.0, 34.0, 36.0, 39.0, 53.0, 45.0, 42.0, 47.0, 48.0, 58.0, 56.0, 49.0, 38.0, 36.0, 32.0, 29.0, 41.0, 22.0, 26.0, 24.0, 15.0, 10.0, 11.0, 6.0, 7.0, 5.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.84375, -11.382080078125, -10.92041015625, -10.458740234375, -9.9970703125, -9.535400390625, -9.07373046875, -8.612060546875, -8.150390625, -7.688720703125, -7.22705078125, -6.765380859375, -6.3037109375, -5.842041015625, -5.38037109375, -4.918701171875, -4.45703125, -3.995361328125, -3.53369140625, -3.072021484375, -2.6103515625, -2.148681640625, -1.68701171875, -1.225341796875, -0.763671875, -0.302001953125, 0.15966796875, 0.621337890625, 1.0830078125, 1.544677734375, 2.00634765625, 2.468017578125, 2.9296875, 3.391357421875, 3.85302734375, 4.314697265625, 4.7763671875, 5.238037109375, 5.69970703125, 6.161376953125, 6.623046875, 7.084716796875, 7.54638671875, 8.008056640625, 8.4697265625, 8.931396484375, 9.39306640625, 9.854736328125, 10.31640625, 10.778076171875, 11.23974609375, 11.701416015625, 12.1630859375, 12.624755859375, 13.08642578125, 13.548095703125, 14.009765625, 14.471435546875, 14.93310546875, 15.394775390625, 15.8564453125, 16.318115234375, 16.77978515625, 17.241455078125, 17.703125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0, 7.0, 8.0, 19.0, 19.0, 33.0, 37.0, 75.0, 101.0, 161.0, 292.0, 596.0, 1243.0, 2909.0, 9928.0, 66567.0, 681506.0, 253574.0, 22851.0, 5002.0, 1781.0, 770.0, 418.0, 248.0, 134.0, 84.0, 51.0, 30.0, 23.0, 26.0, 10.0, 8.0, 12.0, 6.0, 3.0, 6.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.359375, -23.54052734375, -22.7216796875, -21.90283203125, -21.083984375, -20.26513671875, -19.4462890625, -18.62744140625, -17.80859375, -16.98974609375, -16.1708984375, -15.35205078125, -14.533203125, -13.71435546875, -12.8955078125, -12.07666015625, -11.2578125, -10.43896484375, -9.6201171875, -8.80126953125, -7.982421875, -7.16357421875, -6.3447265625, -5.52587890625, -4.70703125, -3.88818359375, -3.0693359375, -2.25048828125, -1.431640625, -0.61279296875, 0.2060546875, 1.02490234375, 1.84375, 2.66259765625, 3.4814453125, 4.30029296875, 5.119140625, 5.93798828125, 6.7568359375, 7.57568359375, 8.39453125, 9.21337890625, 10.0322265625, 10.85107421875, 11.669921875, 12.48876953125, 13.3076171875, 14.12646484375, 14.9453125, 15.76416015625, 16.5830078125, 17.40185546875, 18.220703125, 19.03955078125, 19.8583984375, 20.67724609375, 21.49609375, 22.31494140625, 23.1337890625, 23.95263671875, 24.771484375, 25.59033203125, 26.4091796875, 27.22802734375, 28.046875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 4.0, 3.0, 5.0, 5.0, 4.0, 9.0, 20.0, 32.0, 62.0, 98.0, 191.0, 226.0, 160.0, 90.0, 44.0, 22.0, 8.0, 6.0, 5.0, 8.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005054473876953125, -0.004902482032775879, -0.004750490188598633, -0.004598498344421387, -0.004446506500244141, -0.0042945146560668945, -0.0041425228118896484, -0.003990530967712402, -0.0038385391235351562, -0.00368654727935791, -0.003534555435180664, -0.003382563591003418, -0.003230571746826172, -0.0030785799026489258, -0.0029265880584716797, -0.0027745962142944336, -0.0026226043701171875, -0.0024706125259399414, -0.0023186206817626953, -0.0021666288375854492, -0.002014636993408203, -0.001862645149230957, -0.001710653305053711, -0.0015586614608764648, -0.0014066696166992188, -0.0012546777725219727, -0.0011026859283447266, -0.0009506940841674805, -0.0007987022399902344, -0.0006467103958129883, -0.0004947185516357422, -0.0003427267074584961, -0.00019073486328125, -3.8743019104003906e-05, 0.00011324882507324219, 0.0002652406692504883, 0.0004172325134277344, 0.0005692243576049805, 0.0007212162017822266, 0.0008732080459594727, 0.0010251998901367188, 0.0011771917343139648, 0.001329183578491211, 0.001481175422668457, 0.0016331672668457031, 0.0017851591110229492, 0.0019371509552001953, 0.0020891427993774414, 0.0022411346435546875, 0.0023931264877319336, 0.0025451183319091797, 0.0026971101760864258, 0.002849102020263672, 0.003001093864440918, 0.003153085708618164, 0.00330507755279541, 0.0034570693969726562, 0.0036090612411499023, 0.0037610530853271484, 0.0039130449295043945, 0.004065036773681641, 0.004217028617858887, 0.004369020462036133, 0.004521012306213379, 0.004673004150390625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 8.0, 5.0, 9.0, 10.0, 21.0, 35.0, 70.0, 103.0, 183.0, 353.0, 720.0, 1854.0, 5847.0, 35892.0, 685032.0, 293947.0, 18009.0, 3833.0, 1411.0, 570.0, 280.0, 147.0, 70.0, 40.0, 31.0, 19.0, 13.0, 8.0, 8.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.703125, -26.631103515625, -25.55908203125, -24.487060546875, -23.4150390625, -22.343017578125, -21.27099609375, -20.198974609375, -19.126953125, -18.054931640625, -16.98291015625, -15.910888671875, -14.8388671875, -13.766845703125, -12.69482421875, -11.622802734375, -10.55078125, -9.478759765625, -8.40673828125, -7.334716796875, -6.2626953125, -5.190673828125, -4.11865234375, -3.046630859375, -1.974609375, -0.902587890625, 0.16943359375, 1.241455078125, 2.3134765625, 3.385498046875, 4.45751953125, 5.529541015625, 6.6015625, 7.673583984375, 8.74560546875, 9.817626953125, 10.8896484375, 11.961669921875, 13.03369140625, 14.105712890625, 15.177734375, 16.249755859375, 17.32177734375, 18.393798828125, 19.4658203125, 20.537841796875, 21.60986328125, 22.681884765625, 23.75390625, 24.825927734375, 25.89794921875, 26.969970703125, 28.0419921875, 29.114013671875, 30.18603515625, 31.258056640625, 32.330078125, 33.402099609375, 34.47412109375, 35.546142578125, 36.6181640625, 37.690185546875, 38.76220703125, 39.834228515625, 40.90625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 7.0, 10.0, 5.0, 19.0, 31.0, 56.0, 75.0, 91.0, 142.0, 144.0, 117.0, 87.0, 61.0, 46.0, 33.0, 27.0, 10.0, 6.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.015625, -11.56201171875, -11.1083984375, -10.65478515625, -10.201171875, -9.74755859375, -9.2939453125, -8.84033203125, -8.38671875, -7.93310546875, -7.4794921875, -7.02587890625, -6.572265625, -6.11865234375, -5.6650390625, -5.21142578125, -4.7578125, -4.30419921875, -3.8505859375, -3.39697265625, -2.943359375, -2.48974609375, -2.0361328125, -1.58251953125, -1.12890625, -0.67529296875, -0.2216796875, 0.23193359375, 0.685546875, 1.13916015625, 1.5927734375, 2.04638671875, 2.5, 2.95361328125, 3.4072265625, 3.86083984375, 4.314453125, 4.76806640625, 5.2216796875, 5.67529296875, 6.12890625, 6.58251953125, 7.0361328125, 7.48974609375, 7.943359375, 8.39697265625, 8.8505859375, 9.30419921875, 9.7578125, 10.21142578125, 10.6650390625, 11.11865234375, 11.572265625, 12.02587890625, 12.4794921875, 12.93310546875, 13.38671875, 13.84033203125, 14.2939453125, 14.74755859375, 15.201171875, 15.65478515625, 16.1083984375, 16.56201171875, 17.015625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 9.0, 51.0, 123.0, 316.0, 310.0, 130.0, 41.0, 16.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-688.1822509765625, -674.6695556640625, -661.1568603515625, -647.6441040039062, -634.1314086914062, -620.6187133789062, -607.1060180664062, -593.5933227539062, -580.08056640625, -566.56787109375, -553.05517578125, -539.5424194335938, -526.0297241210938, -512.5170288085938, -499.00433349609375, -485.4916076660156, -471.97894287109375, -458.46624755859375, -444.9535217285156, -431.4408264160156, -417.9281005859375, -404.4154052734375, -390.9027099609375, -377.3899841308594, -363.87725830078125, -350.36456298828125, -336.8518371582031, -323.3391418457031, -309.826416015625, -296.313720703125, -282.801025390625, -269.2882995605469, -255.77560424804688, -242.2628936767578, -228.75018310546875, -215.23748779296875, -201.7247772216797, -188.21206665039062, -174.69935607910156, -161.1866455078125, -147.6739501953125, -134.16123962402344, -120.6485366821289, -107.13582611083984, -93.62312316894531, -80.11041259765625, -66.59770202636719, -53.084999084472656, -39.57228088378906, -26.059574127197266, -12.546865463256836, 0.9658432006835938, 14.47854995727539, 27.991256713867188, 41.50396728515625, 55.01667022705078, 68.52938079833984, 82.0420913696289, 95.55479431152344, 109.0675048828125, 122.58021545410156, 136.09292602539062, 149.60562133789062, 163.1183319091797, 176.63104248046875]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 7.0, 6.0, 10.0, 7.0, 7.0, 13.0, 12.0, 22.0, 24.0, 27.0, 37.0, 39.0, 51.0, 50.0, 40.0, 56.0, 48.0, 39.0, 42.0, 57.0, 59.0, 55.0, 30.0, 48.0, 34.0, 29.0, 32.0, 26.0, 20.0, 20.0, 9.0, 7.0, 16.0, 6.0, 7.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-107.59994506835938, -104.49720001220703, -101.39446258544922, -98.29171752929688, -95.18898010253906, -92.08623504638672, -88.98348999023438, -85.88075256347656, -82.77800750732422, -79.67526245117188, -76.57252502441406, -73.46977996826172, -70.36703491210938, -67.26429748535156, -64.16155242919922, -61.05881118774414, -57.95606994628906, -54.853328704833984, -51.750587463378906, -48.64784240722656, -45.545101165771484, -42.442359924316406, -39.33961486816406, -36.236873626708984, -33.134132385253906, -30.031391143798828, -26.928647994995117, -23.825904846191406, -20.723163604736328, -17.62042236328125, -14.517679214477539, -11.414936065673828, -8.312202453613281, -5.209460258483887, -2.106718063354492, 0.9960241317749023, 4.098766326904297, 7.201508522033691, 10.304250717163086, 13.406993865966797, 16.509735107421875, 19.612476348876953, 22.715219497680664, 25.817962646484375, 28.920703887939453, 32.02344512939453, 35.126190185546875, 38.22893142700195, 41.33167266845703, 44.43441390991211, 47.53715515136719, 50.63990020751953, 53.74264144897461, 56.84538269042969, 59.94812774658203, 63.05086898803711, 66.15361022949219, 69.25635528564453, 72.35909271240234, 75.46183776855469, 78.5645751953125, 81.66732025146484, 84.77006530761719, 87.872802734375, 90.97554779052734]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 12.0, 5.0, 11.0, 14.0, 11.0, 22.0, 26.0, 32.0, 45.0, 65.0, 113.0, 143.0, 226.0, 330.0, 512.0, 876.0, 1491.0, 2909.0, 5942.0, 15361.0, 48040.0, 258409.0, 3270423.0, 483913.0, 69313.0, 20343.0, 7927.0, 3591.0, 1792.0, 972.0, 540.0, 304.0, 194.0, 136.0, 69.0, 51.0, 39.0, 24.0, 14.0, 17.0, 8.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.921875, -31.0, -30.078125, -29.15625, -28.234375, -27.3125, -26.390625, -25.46875, -24.546875, -23.625, -22.703125, -21.78125, -20.859375, -19.9375, -19.015625, -18.09375, -17.171875, -16.25, -15.328125, -14.40625, -13.484375, -12.5625, -11.640625, -10.71875, -9.796875, -8.875, -7.953125, -7.03125, -6.109375, -5.1875, -4.265625, -3.34375, -2.421875, -1.5, -0.578125, 0.34375, 1.265625, 2.1875, 3.109375, 4.03125, 4.953125, 5.875, 6.796875, 7.71875, 8.640625, 9.5625, 10.484375, 11.40625, 12.328125, 13.25, 14.171875, 15.09375, 16.015625, 16.9375, 17.859375, 18.78125, 19.703125, 20.625, 21.546875, 22.46875, 23.390625, 24.3125, 25.234375, 26.15625, 27.078125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 4.0, 5.0, 8.0, 10.0, 21.0, 17.0, 25.0, 23.0, 46.0, 55.0, 43.0, 67.0, 64.0, 56.0, 50.0, 68.0, 57.0, 53.0, 68.0, 54.0, 38.0, 44.0, 38.0, 25.0, 22.0, 12.0, 14.0, 4.0, 6.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.84765625, -4.716644287109375, -4.58563232421875, -4.454620361328125, -4.3236083984375, -4.192596435546875, -4.06158447265625, -3.930572509765625, -3.799560546875, -3.668548583984375, -3.53753662109375, -3.406524658203125, -3.2755126953125, -3.144500732421875, -3.01348876953125, -2.882476806640625, -2.75146484375, -2.620452880859375, -2.48944091796875, -2.358428955078125, -2.2274169921875, -2.096405029296875, -1.96539306640625, -1.834381103515625, -1.703369140625, -1.572357177734375, -1.44134521484375, -1.310333251953125, -1.1793212890625, -1.048309326171875, -0.91729736328125, -0.786285400390625, -0.6552734375, -0.524261474609375, -0.39324951171875, -0.262237548828125, -0.1312255859375, -0.000213623046875, 0.13079833984375, 0.261810302734375, 0.392822265625, 0.523834228515625, 0.65484619140625, 0.785858154296875, 0.9168701171875, 1.047882080078125, 1.17889404296875, 1.309906005859375, 1.44091796875, 1.571929931640625, 1.70294189453125, 1.833953857421875, 1.9649658203125, 2.095977783203125, 2.22698974609375, 2.358001708984375, 2.489013671875, 2.620025634765625, 2.75103759765625, 2.882049560546875, 3.0130615234375, 3.144073486328125, 3.27508544921875, 3.406097412109375, 3.537109375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 7.0, 26.0, 28.0, 50.0, 90.0, 135.0, 322.0, 1072.0, 50975.0, 4137410.0, 3104.0, 497.0, 245.0, 128.0, 80.0, 46.0, 30.0, 21.0, 10.0, 7.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-112.0, -103.5390625, -95.078125, -86.6171875, -78.15625, -69.6953125, -61.234375, -52.7734375, -44.3125, -35.8515625, -27.390625, -18.9296875, -10.46875, -2.0078125, 6.453125, 14.9140625, 23.375, 31.8359375, 40.296875, 48.7578125, 57.21875, 65.6796875, 74.140625, 82.6015625, 91.0625, 99.5234375, 107.984375, 116.4453125, 124.90625, 133.3671875, 141.828125, 150.2890625, 158.75, 167.2109375, 175.671875, 184.1328125, 192.59375, 201.0546875, 209.515625, 217.9765625, 226.4375, 234.8984375, 243.359375, 251.8203125, 260.28125, 268.7421875, 277.203125, 285.6640625, 294.125, 302.5859375, 311.046875, 319.5078125, 327.96875, 336.4296875, 344.890625, 353.3515625, 361.8125, 370.2734375, 378.734375, 387.1953125, 395.65625, 404.1171875, 412.578125, 421.0390625, 429.5]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 6.0, 17.0, 48.0, 143.0, 579.0, 2543.0, 571.0, 111.0, 44.0, 13.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.03125, -9.73388671875, -8.4365234375, -7.13916015625, -5.841796875, -4.54443359375, -3.2470703125, -1.94970703125, -0.65234375, 0.64501953125, 1.9423828125, 3.23974609375, 4.537109375, 5.83447265625, 7.1318359375, 8.42919921875, 9.7265625, 11.02392578125, 12.3212890625, 13.61865234375, 14.916015625, 16.21337890625, 17.5107421875, 18.80810546875, 20.10546875, 21.40283203125, 22.7001953125, 23.99755859375, 25.294921875, 26.59228515625, 27.8896484375, 29.18701171875, 30.484375, 31.78173828125, 33.0791015625, 34.37646484375, 35.673828125, 36.97119140625, 38.2685546875, 39.56591796875, 40.86328125, 42.16064453125, 43.4580078125, 44.75537109375, 46.052734375, 47.35009765625, 48.6474609375, 49.94482421875, 51.2421875, 52.53955078125, 53.8369140625, 55.13427734375, 56.431640625, 57.72900390625, 59.0263671875, 60.32373046875, 61.62109375, 62.91845703125, 64.2158203125, 65.51318359375, 66.810546875, 68.10791015625, 69.4052734375, 70.70263671875, 72.0]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 18.0, 43.0, 175.0, 370.0, 264.0, 67.0, 37.0, 13.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-473.6034851074219, -463.6739501953125, -453.74444580078125, -443.81494140625, -433.8854064941406, -423.95587158203125, -414.0263671875, -404.09686279296875, -394.1673278808594, -384.23779296875, -374.30828857421875, -364.3787841796875, -354.4492492675781, -344.51971435546875, -334.5902099609375, -324.66070556640625, -314.7311706542969, -304.8016357421875, -294.87213134765625, -284.942626953125, -275.0130920410156, -265.08355712890625, -255.154052734375, -245.2245330810547, -235.29501342773438, -225.36549377441406, -215.43597412109375, -205.50645446777344, -195.57693481445312, -185.6474151611328, -175.7178955078125, -165.7883758544922, -155.85882568359375, -145.92930603027344, -135.99978637695312, -126.07026672363281, -116.1407470703125, -106.21122741699219, -96.28170776367188, -86.35218811035156, -76.42266845703125, -66.49314880371094, -56.563629150390625, -46.63410949707031, -36.70458984375, -26.775070190429688, -16.845550537109375, -6.9160308837890625, 3.01348876953125, 12.943008422851562, 22.872528076171875, 32.80204772949219, 42.7315673828125, 52.66108703613281, 62.590606689453125, 72.52012634277344, 82.44964599609375, 92.37916564941406, 102.30868530273438, 112.23820495605469, 122.167724609375, 132.0972442626953, 142.02676391601562, 151.95628356933594, 161.88580322265625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 10.0, 13.0, 15.0, 35.0, 45.0, 42.0, 72.0, 79.0, 86.0, 89.0, 81.0, 99.0, 76.0, 52.0, 68.0, 33.0, 43.0, 19.0, 15.0, 7.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.61752319335938, -110.95903015136719, -107.300537109375, -103.64204406738281, -99.9835433959961, -96.3250503540039, -92.66655731201172, -89.00806427001953, -85.34956359863281, -81.69107055664062, -78.03257751464844, -74.37408447265625, -70.71558380126953, -67.05709075927734, -63.398597717285156, -59.74010467529297, -56.08161163330078, -52.423118591308594, -48.76462173461914, -45.10612869262695, -41.4476318359375, -37.78913879394531, -34.130645751953125, -30.472150802612305, -26.813655853271484, -23.155160903930664, -19.496665954589844, -15.838172912597656, -12.179677963256836, -8.521183013916016, -4.862689971923828, -1.2041950225830078, 2.4542999267578125, 6.112794399261475, 9.771288871765137, 13.42978286743164, 17.08827781677246, 20.74677276611328, 24.40526580810547, 28.06376075744629, 31.72225570678711, 35.3807487487793, 39.03924560546875, 42.69773864746094, 46.356231689453125, 50.01472854614258, 53.673221588134766, 57.33171844482422, 60.990211486816406, 64.6487045288086, 68.30719757080078, 71.9656982421875, 75.62419128417969, 79.28268432617188, 82.94117736816406, 86.59967041015625, 90.25816345214844, 93.91665649414062, 97.57514953613281, 101.233642578125, 104.89214324951172, 108.5506362915039, 112.2091293334961, 115.86762237548828, 119.526123046875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 7.0, 9.0, 13.0, 11.0, 21.0, 31.0, 46.0, 56.0, 80.0, 121.0, 187.0, 289.0, 467.0, 778.0, 1457.0, 2715.0, 5717.0, 14907.0, 43724.0, 143313.0, 407143.0, 290541.0, 90064.0, 27764.0, 9978.0, 4175.0, 2053.0, 1089.0, 622.0, 400.0, 231.0, 179.0, 111.0, 79.0, 49.0, 38.0, 32.0, 12.0, 16.0, 6.0, 7.0, 4.0, 3.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.765625, -26.892578125, -26.01953125, -25.146484375, -24.2734375, -23.400390625, -22.52734375, -21.654296875, -20.78125, -19.908203125, -19.03515625, -18.162109375, -17.2890625, -16.416015625, -15.54296875, -14.669921875, -13.796875, -12.923828125, -12.05078125, -11.177734375, -10.3046875, -9.431640625, -8.55859375, -7.685546875, -6.8125, -5.939453125, -5.06640625, -4.193359375, -3.3203125, -2.447265625, -1.57421875, -0.701171875, 0.171875, 1.044921875, 1.91796875, 2.791015625, 3.6640625, 4.537109375, 5.41015625, 6.283203125, 7.15625, 8.029296875, 8.90234375, 9.775390625, 10.6484375, 11.521484375, 12.39453125, 13.267578125, 14.140625, 15.013671875, 15.88671875, 16.759765625, 17.6328125, 18.505859375, 19.37890625, 20.251953125, 21.125, 21.998046875, 22.87109375, 23.744140625, 24.6171875, 25.490234375, 26.36328125, 27.236328125, 28.109375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 4.0, 4.0, 8.0, 5.0, 23.0, 19.0, 23.0, 36.0, 40.0, 34.0, 44.0, 61.0, 67.0, 65.0, 73.0, 76.0, 69.0, 65.0, 51.0, 55.0, 36.0, 30.0, 32.0, 20.0, 16.0, 7.0, 12.0, 5.0, 4.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.81640625, -6.6346435546875, -6.452880859375, -6.2711181640625, -6.08935546875, -5.9075927734375, -5.725830078125, -5.5440673828125, -5.3623046875, -5.1805419921875, -4.998779296875, -4.8170166015625, -4.63525390625, -4.4534912109375, -4.271728515625, -4.0899658203125, -3.908203125, -3.7264404296875, -3.544677734375, -3.3629150390625, -3.18115234375, -2.9993896484375, -2.817626953125, -2.6358642578125, -2.4541015625, -2.2723388671875, -2.090576171875, -1.9088134765625, -1.72705078125, -1.5452880859375, -1.363525390625, -1.1817626953125, -1.0, -0.8182373046875, -0.636474609375, -0.4547119140625, -0.27294921875, -0.0911865234375, 0.090576171875, 0.2723388671875, 0.4541015625, 0.6358642578125, 0.817626953125, 0.9993896484375, 1.18115234375, 1.3629150390625, 1.544677734375, 1.7264404296875, 1.908203125, 2.0899658203125, 2.271728515625, 2.4534912109375, 2.63525390625, 2.8170166015625, 2.998779296875, 3.1805419921875, 3.3623046875, 3.5440673828125, 3.725830078125, 3.9075927734375, 4.08935546875, 4.2711181640625, 4.452880859375, 4.6346435546875, 4.81640625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 4.0, 6.0, 8.0, 13.0, 9.0, 19.0, 23.0, 19.0, 44.0, 65.0, 78.0, 112.0, 213.0, 370.0, 750.0, 1811.0, 4766.0, 15268.0, 54457.0, 208797.0, 472345.0, 210141.0, 55502.0, 15378.0, 4868.0, 1732.0, 822.0, 346.0, 217.0, 107.0, 74.0, 56.0, 38.0, 29.0, 17.0, 18.0, 13.0, 5.0, 4.0, 4.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.546875, -18.836181640625, -18.12548828125, -17.414794921875, -16.7041015625, -15.993408203125, -15.28271484375, -14.572021484375, -13.861328125, -13.150634765625, -12.43994140625, -11.729248046875, -11.0185546875, -10.307861328125, -9.59716796875, -8.886474609375, -8.17578125, -7.465087890625, -6.75439453125, -6.043701171875, -5.3330078125, -4.622314453125, -3.91162109375, -3.200927734375, -2.490234375, -1.779541015625, -1.06884765625, -0.358154296875, 0.3525390625, 1.063232421875, 1.77392578125, 2.484619140625, 3.1953125, 3.906005859375, 4.61669921875, 5.327392578125, 6.0380859375, 6.748779296875, 7.45947265625, 8.170166015625, 8.880859375, 9.591552734375, 10.30224609375, 11.012939453125, 11.7236328125, 12.434326171875, 13.14501953125, 13.855712890625, 14.56640625, 15.277099609375, 15.98779296875, 16.698486328125, 17.4091796875, 18.119873046875, 18.83056640625, 19.541259765625, 20.251953125, 20.962646484375, 21.67333984375, 22.384033203125, 23.0947265625, 23.805419921875, 24.51611328125, 25.226806640625, 25.9375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 1.0, 5.0, 4.0, 5.0, 11.0, 5.0, 9.0, 17.0, 15.0, 11.0, 22.0, 27.0, 27.0, 32.0, 25.0, 44.0, 33.0, 46.0, 44.0, 41.0, 33.0, 49.0, 49.0, 59.0, 47.0, 43.0, 42.0, 24.0, 30.0, 29.0, 30.0, 26.0, 13.0, 19.0, 13.0, 13.0, 11.0, 10.0, 8.0, 7.0, 9.0, 4.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-16.84375, -16.3577880859375, -15.871826171875, -15.3858642578125, -14.89990234375, -14.4139404296875, -13.927978515625, -13.4420166015625, -12.9560546875, -12.4700927734375, -11.984130859375, -11.4981689453125, -11.01220703125, -10.5262451171875, -10.040283203125, -9.5543212890625, -9.068359375, -8.5823974609375, -8.096435546875, -7.6104736328125, -7.12451171875, -6.6385498046875, -6.152587890625, -5.6666259765625, -5.1806640625, -4.6947021484375, -4.208740234375, -3.7227783203125, -3.23681640625, -2.7508544921875, -2.264892578125, -1.7789306640625, -1.29296875, -0.8070068359375, -0.321044921875, 0.1649169921875, 0.65087890625, 1.1368408203125, 1.622802734375, 2.1087646484375, 2.5947265625, 3.0806884765625, 3.566650390625, 4.0526123046875, 4.53857421875, 5.0245361328125, 5.510498046875, 5.9964599609375, 6.482421875, 6.9683837890625, 7.454345703125, 7.9403076171875, 8.42626953125, 8.9122314453125, 9.398193359375, 9.8841552734375, 10.3701171875, 10.8560791015625, 11.342041015625, 11.8280029296875, 12.31396484375, 12.7999267578125, 13.285888671875, 13.7718505859375, 14.2578125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 1.0, 3.0, 9.0, 5.0, 12.0, 26.0, 35.0, 34.0, 61.0, 74.0, 142.0, 249.0, 465.0, 931.0, 1834.0, 4235.0, 11719.0, 45954.0, 382282.0, 516006.0, 60955.0, 14311.0, 4905.0, 2054.0, 1001.0, 523.0, 276.0, 167.0, 101.0, 58.0, 46.0, 24.0, 21.0, 15.0, 8.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.609375, -20.83984375, -20.0703125, -19.30078125, -18.53125, -17.76171875, -16.9921875, -16.22265625, -15.453125, -14.68359375, -13.9140625, -13.14453125, -12.375, -11.60546875, -10.8359375, -10.06640625, -9.296875, -8.52734375, -7.7578125, -6.98828125, -6.21875, -5.44921875, -4.6796875, -3.91015625, -3.140625, -2.37109375, -1.6015625, -0.83203125, -0.0625, 0.70703125, 1.4765625, 2.24609375, 3.015625, 3.78515625, 4.5546875, 5.32421875, 6.09375, 6.86328125, 7.6328125, 8.40234375, 9.171875, 9.94140625, 10.7109375, 11.48046875, 12.25, 13.01953125, 13.7890625, 14.55859375, 15.328125, 16.09765625, 16.8671875, 17.63671875, 18.40625, 19.17578125, 19.9453125, 20.71484375, 21.484375, 22.25390625, 23.0234375, 23.79296875, 24.5625, 25.33203125, 26.1015625, 26.87109375, 27.640625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 4.0, 4.0, 5.0, 5.0, 10.0, 13.0, 19.0, 36.0, 41.0, 59.0, 76.0, 70.0, 118.0, 122.0, 115.0, 82.0, 48.0, 44.0, 37.0, 21.0, 19.0, 7.0, 14.0, 5.0, 7.0, 6.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018291473388671875, -0.0017619132995605469, -0.0016946792602539062, -0.0016274452209472656, -0.001560211181640625, -0.0014929771423339844, -0.0014257431030273438, -0.0013585090637207031, -0.0012912750244140625, -0.0012240409851074219, -0.0011568069458007812, -0.0010895729064941406, -0.0010223388671875, -0.0009551048278808594, -0.0008878707885742188, -0.0008206367492675781, -0.0007534027099609375, -0.0006861686706542969, -0.0006189346313476562, -0.0005517005920410156, -0.000484466552734375, -0.0004172325134277344, -0.00034999847412109375, -0.0002827644348144531, -0.0002155303955078125, -0.00014829635620117188, -8.106231689453125e-05, -1.3828277587890625e-05, 5.340576171875e-05, 0.00012063980102539062, 0.00018787384033203125, 0.0002551078796386719, 0.0003223419189453125, 0.0003895759582519531, 0.00045680999755859375, 0.0005240440368652344, 0.000591278076171875, 0.0006585121154785156, 0.0007257461547851562, 0.0007929801940917969, 0.0008602142333984375, 0.0009274482727050781, 0.0009946823120117188, 0.0010619163513183594, 0.001129150390625, 0.0011963844299316406, 0.0012636184692382812, 0.0013308525085449219, 0.0013980865478515625, 0.0014653205871582031, 0.0015325546264648438, 0.0015997886657714844, 0.001667022705078125, 0.0017342567443847656, 0.0018014907836914062, 0.0018687248229980469, 0.0019359588623046875, 0.002003192901611328, 0.0020704269409179688, 0.0021376609802246094, 0.00220489501953125, 0.0022721290588378906, 0.0023393630981445312, 0.002406597137451172, 0.0024738311767578125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 9.0, 15.0, 10.0, 15.0, 35.0, 55.0, 86.0, 178.0, 380.0, 785.0, 2035.0, 6398.0, 30063.0, 468801.0, 497709.0, 31538.0, 6621.0, 2175.0, 825.0, 397.0, 194.0, 89.0, 53.0, 36.0, 26.0, 8.0, 9.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.375, -38.21728515625, -37.0595703125, -35.90185546875, -34.744140625, -33.58642578125, -32.4287109375, -31.27099609375, -30.11328125, -28.95556640625, -27.7978515625, -26.64013671875, -25.482421875, -24.32470703125, -23.1669921875, -22.00927734375, -20.8515625, -19.69384765625, -18.5361328125, -17.37841796875, -16.220703125, -15.06298828125, -13.9052734375, -12.74755859375, -11.58984375, -10.43212890625, -9.2744140625, -8.11669921875, -6.958984375, -5.80126953125, -4.6435546875, -3.48583984375, -2.328125, -1.17041015625, -0.0126953125, 1.14501953125, 2.302734375, 3.46044921875, 4.6181640625, 5.77587890625, 6.93359375, 8.09130859375, 9.2490234375, 10.40673828125, 11.564453125, 12.72216796875, 13.8798828125, 15.03759765625, 16.1953125, 17.35302734375, 18.5107421875, 19.66845703125, 20.826171875, 21.98388671875, 23.1416015625, 24.29931640625, 25.45703125, 26.61474609375, 27.7724609375, 28.93017578125, 30.087890625, 31.24560546875, 32.4033203125, 33.56103515625, 34.71875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 6.0, 4.0, 5.0, 11.0, 8.0, 11.0, 10.0, 11.0, 21.0, 24.0, 45.0, 50.0, 67.0, 112.0, 115.0, 104.0, 103.0, 72.0, 49.0, 40.0, 22.0, 27.0, 21.0, 14.0, 8.0, 11.0, 13.0, 4.0, 1.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.03125, -13.59228515625, -13.1533203125, -12.71435546875, -12.275390625, -11.83642578125, -11.3974609375, -10.95849609375, -10.51953125, -10.08056640625, -9.6416015625, -9.20263671875, -8.763671875, -8.32470703125, -7.8857421875, -7.44677734375, -7.0078125, -6.56884765625, -6.1298828125, -5.69091796875, -5.251953125, -4.81298828125, -4.3740234375, -3.93505859375, -3.49609375, -3.05712890625, -2.6181640625, -2.17919921875, -1.740234375, -1.30126953125, -0.8623046875, -0.42333984375, 0.015625, 0.45458984375, 0.8935546875, 1.33251953125, 1.771484375, 2.21044921875, 2.6494140625, 3.08837890625, 3.52734375, 3.96630859375, 4.4052734375, 4.84423828125, 5.283203125, 5.72216796875, 6.1611328125, 6.60009765625, 7.0390625, 7.47802734375, 7.9169921875, 8.35595703125, 8.794921875, 9.23388671875, 9.6728515625, 10.11181640625, 10.55078125, 10.98974609375, 11.4287109375, 11.86767578125, 12.306640625, 12.74560546875, 13.1845703125, 13.62353515625, 14.0625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 8.0, 11.0, 26.0, 46.0, 87.0, 114.0, 157.0, 172.0, 149.0, 96.0, 59.0, 35.0, 16.0, 13.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-237.11306762695312, -229.74993896484375, -222.38681030273438, -215.023681640625, -207.66055297851562, -200.29742431640625, -192.93431091308594, -185.57118225097656, -178.2080535888672, -170.8449249267578, -163.48179626464844, -156.11866760253906, -148.75555419921875, -141.39242553710938, -134.029296875, -126.66616821289062, -119.30303955078125, -111.93991088867188, -104.5767822265625, -97.21366119384766, -89.85053253173828, -82.4874038696289, -75.12428283691406, -67.76115417480469, -60.39802551269531, -53.03489685058594, -45.67177200317383, -38.30864715576172, -30.945518493652344, -23.58238983154297, -16.21926498413086, -8.85614013671875, -1.493011474609375, 5.870115280151367, 13.23324203491211, 20.59636878967285, 27.959495544433594, 35.32262420654297, 42.68574905395508, 50.04887390136719, 57.41200256347656, 64.77513122558594, 72.13825988769531, 79.50138092041016, 86.86450958251953, 94.2276382446289, 101.59075927734375, 108.95388793945312, 116.3170166015625, 123.68014526367188, 131.04327392578125, 138.40640258789062, 145.76953125, 153.13265991210938, 160.4957733154297, 167.85890197753906, 175.22203063964844, 182.5851593017578, 189.9482879638672, 197.31141662597656, 204.67453002929688, 212.03765869140625, 219.40078735351562, 226.763916015625, 234.12704467773438]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 8.0, 7.0, 10.0, 10.0, 12.0, 17.0, 19.0, 19.0, 22.0, 21.0, 21.0, 25.0, 35.0, 35.0, 32.0, 37.0, 41.0, 38.0, 43.0, 37.0, 41.0, 44.0, 40.0, 39.0, 40.0, 28.0, 35.0, 32.0, 29.0, 28.0, 27.0, 14.0, 19.0, 17.0, 13.0, 4.0, 7.0, 13.0, 5.0, 9.0, 7.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0], "bins": [-96.47310638427734, -93.6259994506836, -90.77890014648438, -87.93179321289062, -85.08468627929688, -82.23758697509766, -79.3904800415039, -76.54338073730469, -73.69627380371094, -70.84916687011719, -68.00206756591797, -65.15496063232422, -62.307857513427734, -59.46075439453125, -56.6136474609375, -53.766544342041016, -50.91944122314453, -48.07233810424805, -45.22523498535156, -42.37812805175781, -39.53102493286133, -36.683921813964844, -33.836814880371094, -30.98971176147461, -28.142608642578125, -25.29550552368164, -22.448400497436523, -19.601295471191406, -16.754192352294922, -13.907088279724121, -11.05998420715332, -8.212879180908203, -5.36578369140625, -2.518679618835449, 0.32842445373535156, 3.1755285263061523, 6.022632598876953, 8.869736671447754, 11.716840744018555, 14.563945770263672, 17.411048889160156, 20.25815200805664, 23.105257034301758, 25.952362060546875, 28.79946517944336, 31.646568298339844, 34.493675231933594, 37.34077835083008, 40.18788146972656, 43.03498458862305, 45.88208770751953, 48.72919464111328, 51.576297760009766, 54.42340087890625, 57.2705078125, 60.117610931396484, 62.96471405029297, 65.81182098388672, 68.65892028808594, 71.50602722167969, 74.35313415527344, 77.20023345947266, 80.0473403930664, 82.89443969726562, 85.74154663085938]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 10.0, 5.0, 12.0, 16.0, 17.0, 24.0, 37.0, 57.0, 81.0, 136.0, 199.0, 340.0, 662.0, 1413.0, 3232.0, 9927.0, 55222.0, 3784611.0, 306428.0, 22728.0, 5509.0, 1902.0, 796.0, 393.0, 204.0, 116.0, 71.0, 52.0, 24.0, 20.0, 11.0, 12.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-71.8125, -69.91064453125, -68.0087890625, -66.10693359375, -64.205078125, -62.30322265625, -60.4013671875, -58.49951171875, -56.59765625, -54.69580078125, -52.7939453125, -50.89208984375, -48.990234375, -47.08837890625, -45.1865234375, -43.28466796875, -41.3828125, -39.48095703125, -37.5791015625, -35.67724609375, -33.775390625, -31.87353515625, -29.9716796875, -28.06982421875, -26.16796875, -24.26611328125, -22.3642578125, -20.46240234375, -18.560546875, -16.65869140625, -14.7568359375, -12.85498046875, -10.953125, -9.05126953125, -7.1494140625, -5.24755859375, -3.345703125, -1.44384765625, 0.4580078125, 2.35986328125, 4.26171875, 6.16357421875, 8.0654296875, 9.96728515625, 11.869140625, 13.77099609375, 15.6728515625, 17.57470703125, 19.4765625, 21.37841796875, 23.2802734375, 25.18212890625, 27.083984375, 28.98583984375, 30.8876953125, 32.78955078125, 34.69140625, 36.59326171875, 38.4951171875, 40.39697265625, 42.298828125, 44.20068359375, 46.1025390625, 48.00439453125, 49.90625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 0.0, 1.0, 4.0, 5.0, 3.0, 5.0, 7.0, 7.0, 8.0, 13.0, 15.0, 15.0, 28.0, 37.0, 36.0, 32.0, 53.0, 59.0, 68.0, 57.0, 61.0, 63.0, 60.0, 60.0, 57.0, 50.0, 32.0, 33.0, 26.0, 21.0, 24.0, 18.0, 11.0, 7.0, 7.0, 6.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-6.1875, -6.02276611328125, -5.8580322265625, -5.69329833984375, -5.528564453125, -5.36383056640625, -5.1990966796875, -5.03436279296875, -4.86962890625, -4.70489501953125, -4.5401611328125, -4.37542724609375, -4.210693359375, -4.04595947265625, -3.8812255859375, -3.71649169921875, -3.5517578125, -3.38702392578125, -3.2222900390625, -3.05755615234375, -2.892822265625, -2.72808837890625, -2.5633544921875, -2.39862060546875, -2.23388671875, -2.06915283203125, -1.9044189453125, -1.73968505859375, -1.574951171875, -1.41021728515625, -1.2454833984375, -1.08074951171875, -0.916015625, -0.75128173828125, -0.5865478515625, -0.42181396484375, -0.257080078125, -0.09234619140625, 0.0723876953125, 0.23712158203125, 0.40185546875, 0.56658935546875, 0.7313232421875, 0.89605712890625, 1.060791015625, 1.22552490234375, 1.3902587890625, 1.55499267578125, 1.7197265625, 1.88446044921875, 2.0491943359375, 2.21392822265625, 2.378662109375, 2.54339599609375, 2.7081298828125, 2.87286376953125, 3.03759765625, 3.20233154296875, 3.3670654296875, 3.53179931640625, 3.696533203125, 3.86126708984375, 4.0260009765625, 4.19073486328125, 4.35546875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 6.0, 7.0, 8.0, 19.0, 26.0, 43.0, 47.0, 63.0, 85.0, 366.0, 4857.0, 3895099.0, 290180.0, 2889.0, 267.0, 92.0, 74.0, 50.0, 37.0, 27.0, 20.0, 13.0, 9.0, 8.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.25, -84.6875, -78.125, -71.5625, -65.0, -58.4375, -51.875, -45.3125, -38.75, -32.1875, -25.625, -19.0625, -12.5, -5.9375, 0.625, 7.1875, 13.75, 20.3125, 26.875, 33.4375, 40.0, 46.5625, 53.125, 59.6875, 66.25, 72.8125, 79.375, 85.9375, 92.5, 99.0625, 105.625, 112.1875, 118.75, 125.3125, 131.875, 138.4375, 145.0, 151.5625, 158.125, 164.6875, 171.25, 177.8125, 184.375, 190.9375, 197.5, 204.0625, 210.625, 217.1875, 223.75, 230.3125, 236.875, 243.4375, 250.0, 256.5625, 263.125, 269.6875, 276.25, 282.8125, 289.375, 295.9375, 302.5, 309.0625, 315.625, 322.1875, 328.75]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 3.0, 5.0, 13.0, 17.0, 39.0, 84.0, 401.0, 2735.0, 561.0, 123.0, 46.0, 23.0, 10.0, 11.0, 13.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3203125, -10.2528076171875, -9.185302734375, -8.1177978515625, -7.05029296875, -5.9827880859375, -4.915283203125, -3.8477783203125, -2.7802734375, -1.7127685546875, -0.645263671875, 0.4222412109375, 1.48974609375, 2.5572509765625, 3.624755859375, 4.6922607421875, 5.759765625, 6.8272705078125, 7.894775390625, 8.9622802734375, 10.02978515625, 11.0972900390625, 12.164794921875, 13.2322998046875, 14.2998046875, 15.3673095703125, 16.434814453125, 17.5023193359375, 18.56982421875, 19.6373291015625, 20.704833984375, 21.7723388671875, 22.83984375, 23.9073486328125, 24.974853515625, 26.0423583984375, 27.10986328125, 28.1773681640625, 29.244873046875, 30.3123779296875, 31.3798828125, 32.4473876953125, 33.514892578125, 34.5823974609375, 35.64990234375, 36.7174072265625, 37.784912109375, 38.8524169921875, 39.919921875, 40.9874267578125, 42.054931640625, 43.1224365234375, 44.18994140625, 45.2574462890625, 46.324951171875, 47.3924560546875, 48.4599609375, 49.5274658203125, 50.594970703125, 51.6624755859375, 52.72998046875, 53.7974853515625, 54.864990234375, 55.9324951171875, 57.0]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 9.0, 27.0, 54.0, 189.0, 294.0, 232.0, 111.0, 44.0, 17.0, 13.0, 2.0, 6.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-253.0552215576172, -246.34535217285156, -239.63548278808594, -232.92562866210938, -226.21575927734375, -219.50588989257812, -212.7960205078125, -206.08615112304688, -199.37628173828125, -192.66641235351562, -185.95654296875, -179.24667358398438, -172.5368194580078, -165.8269500732422, -159.11708068847656, -152.40721130371094, -145.69735717773438, -138.98748779296875, -132.27761840820312, -125.56775665283203, -118.85789489746094, -112.14802551269531, -105.43815612792969, -98.72828674316406, -92.01842498779297, -85.30855560302734, -78.59869384765625, -71.88882446289062, -65.178955078125, -58.469093322753906, -51.75922393798828, -45.04935836791992, -38.339508056640625, -31.629642486572266, -24.919775009155273, -18.20990753173828, -11.500041961669922, -4.7901763916015625, 1.9196929931640625, 8.629558563232422, 15.339424133300781, 22.04928970336914, 28.759157180786133, 35.469024658203125, 42.178890228271484, 48.888755798339844, 55.59862518310547, 62.30849075317383, 69.01835632324219, 75.72822570800781, 82.4380874633789, 89.14795684814453, 95.85781860351562, 102.56768798828125, 109.27755737304688, 115.9874267578125, 122.6972885131836, 129.4071502685547, 136.1170196533203, 142.82688903808594, 149.53675842285156, 156.24661254882812, 162.95648193359375, 169.66635131835938, 176.376220703125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 5.0, 6.0, 6.0, 29.0, 33.0, 38.0, 50.0, 59.0, 65.0, 88.0, 86.0, 98.0, 79.0, 70.0, 66.0, 70.0, 48.0, 34.0, 23.0, 14.0, 14.0, 10.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-126.77935791015625, -123.48429107666016, -120.1892318725586, -116.8941650390625, -113.59910583496094, -110.30403900146484, -107.00897216796875, -103.71391296386719, -100.4188461303711, -97.123779296875, -93.82872009277344, -90.53365325927734, -87.23858642578125, -83.94352722167969, -80.6484603881836, -77.3533935546875, -74.05833435058594, -70.76326751708984, -67.46820831298828, -64.17314147949219, -60.87807846069336, -57.58301544189453, -54.28794860839844, -50.99288558959961, -47.69782257080078, -44.40275955200195, -41.107696533203125, -37.81262969970703, -34.5175666809082, -31.222503662109375, -27.927438735961914, -24.632373809814453, -21.337310791015625, -18.042247772216797, -14.747182846069336, -11.452118873596191, -8.157054901123047, -4.861991882324219, -1.5669269561767578, 1.7281379699707031, 5.023200988769531, 8.318264961242676, 11.61332893371582, 14.908392906188965, 18.20345687866211, 21.498519897460938, 24.7935848236084, 28.08864974975586, 31.383712768554688, 34.678775787353516, 37.973838806152344, 41.26890563964844, 44.563968658447266, 47.859031677246094, 51.15409851074219, 54.449161529541016, 57.744224548339844, 61.03928756713867, 64.3343505859375, 67.6294174194336, 70.92448425292969, 74.21954345703125, 77.51461029052734, 80.80967712402344, 84.104736328125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 4.0, 6.0, 5.0, 7.0, 12.0, 10.0, 18.0, 13.0, 26.0, 24.0, 32.0, 65.0, 68.0, 132.0, 170.0, 291.0, 415.0, 707.0, 1265.0, 2354.0, 4825.0, 10843.0, 28616.0, 93797.0, 351536.0, 391052.0, 106746.0, 32323.0, 12109.0, 5155.0, 2473.0, 1337.0, 759.0, 453.0, 284.0, 185.0, 117.0, 96.0, 63.0, 42.0, 38.0, 20.0, 12.0, 11.0, 9.0, 10.0, 3.0, 5.0, 4.0, 9.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-32.1875, -31.0400390625, -29.892578125, -28.7451171875, -27.59765625, -26.4501953125, -25.302734375, -24.1552734375, -23.0078125, -21.8603515625, -20.712890625, -19.5654296875, -18.41796875, -17.2705078125, -16.123046875, -14.9755859375, -13.828125, -12.6806640625, -11.533203125, -10.3857421875, -9.23828125, -8.0908203125, -6.943359375, -5.7958984375, -4.6484375, -3.5009765625, -2.353515625, -1.2060546875, -0.05859375, 1.0888671875, 2.236328125, 3.3837890625, 4.53125, 5.6787109375, 6.826171875, 7.9736328125, 9.12109375, 10.2685546875, 11.416015625, 12.5634765625, 13.7109375, 14.8583984375, 16.005859375, 17.1533203125, 18.30078125, 19.4482421875, 20.595703125, 21.7431640625, 22.890625, 24.0380859375, 25.185546875, 26.3330078125, 27.48046875, 28.6279296875, 29.775390625, 30.9228515625, 32.0703125, 33.2177734375, 34.365234375, 35.5126953125, 36.66015625, 37.8076171875, 38.955078125, 40.1025390625, 41.25]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 4.0, 10.0, 8.0, 9.0, 13.0, 25.0, 37.0, 24.0, 37.0, 38.0, 41.0, 70.0, 61.0, 60.0, 77.0, 64.0, 73.0, 50.0, 50.0, 58.0, 34.0, 28.0, 33.0, 36.0, 11.0, 8.0, 14.0, 7.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.5703125, -8.342529296875, -8.11474609375, -7.886962890625, -7.6591796875, -7.431396484375, -7.20361328125, -6.975830078125, -6.748046875, -6.520263671875, -6.29248046875, -6.064697265625, -5.8369140625, -5.609130859375, -5.38134765625, -5.153564453125, -4.92578125, -4.697998046875, -4.47021484375, -4.242431640625, -4.0146484375, -3.786865234375, -3.55908203125, -3.331298828125, -3.103515625, -2.875732421875, -2.64794921875, -2.420166015625, -2.1923828125, -1.964599609375, -1.73681640625, -1.509033203125, -1.28125, -1.053466796875, -0.82568359375, -0.597900390625, -0.3701171875, -0.142333984375, 0.08544921875, 0.313232421875, 0.541015625, 0.768798828125, 0.99658203125, 1.224365234375, 1.4521484375, 1.679931640625, 1.90771484375, 2.135498046875, 2.36328125, 2.591064453125, 2.81884765625, 3.046630859375, 3.2744140625, 3.502197265625, 3.72998046875, 3.957763671875, 4.185546875, 4.413330078125, 4.64111328125, 4.868896484375, 5.0966796875, 5.324462890625, 5.55224609375, 5.780029296875, 6.0078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 7.0, 7.0, 11.0, 26.0, 19.0, 32.0, 31.0, 43.0, 54.0, 76.0, 99.0, 157.0, 253.0, 429.0, 879.0, 1872.0, 4635.0, 13565.0, 51477.0, 266393.0, 539618.0, 126731.0, 27855.0, 8164.0, 3033.0, 1356.0, 625.0, 363.0, 209.0, 147.0, 98.0, 60.0, 49.0, 38.0, 26.0, 31.0, 18.0, 14.0, 14.0, 7.0, 7.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-33.0, -31.873046875, -30.74609375, -29.619140625, -28.4921875, -27.365234375, -26.23828125, -25.111328125, -23.984375, -22.857421875, -21.73046875, -20.603515625, -19.4765625, -18.349609375, -17.22265625, -16.095703125, -14.96875, -13.841796875, -12.71484375, -11.587890625, -10.4609375, -9.333984375, -8.20703125, -7.080078125, -5.953125, -4.826171875, -3.69921875, -2.572265625, -1.4453125, -0.318359375, 0.80859375, 1.935546875, 3.0625, 4.189453125, 5.31640625, 6.443359375, 7.5703125, 8.697265625, 9.82421875, 10.951171875, 12.078125, 13.205078125, 14.33203125, 15.458984375, 16.5859375, 17.712890625, 18.83984375, 19.966796875, 21.09375, 22.220703125, 23.34765625, 24.474609375, 25.6015625, 26.728515625, 27.85546875, 28.982421875, 30.109375, 31.236328125, 32.36328125, 33.490234375, 34.6171875, 35.744140625, 36.87109375, 37.998046875, 39.125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 8.0, 3.0, 7.0, 2.0, 12.0, 7.0, 9.0, 19.0, 10.0, 15.0, 30.0, 21.0, 20.0, 31.0, 22.0, 40.0, 22.0, 45.0, 43.0, 47.0, 38.0, 40.0, 35.0, 48.0, 41.0, 30.0, 49.0, 36.0, 34.0, 30.0, 27.0, 26.0, 15.0, 14.0, 24.0, 21.0, 18.0, 12.0, 13.0, 9.0, 7.0, 5.0, 6.0, 3.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-21.0625, -20.42578125, -19.7890625, -19.15234375, -18.515625, -17.87890625, -17.2421875, -16.60546875, -15.96875, -15.33203125, -14.6953125, -14.05859375, -13.421875, -12.78515625, -12.1484375, -11.51171875, -10.875, -10.23828125, -9.6015625, -8.96484375, -8.328125, -7.69140625, -7.0546875, -6.41796875, -5.78125, -5.14453125, -4.5078125, -3.87109375, -3.234375, -2.59765625, -1.9609375, -1.32421875, -0.6875, -0.05078125, 0.5859375, 1.22265625, 1.859375, 2.49609375, 3.1328125, 3.76953125, 4.40625, 5.04296875, 5.6796875, 6.31640625, 6.953125, 7.58984375, 8.2265625, 8.86328125, 9.5, 10.13671875, 10.7734375, 11.41015625, 12.046875, 12.68359375, 13.3203125, 13.95703125, 14.59375, 15.23046875, 15.8671875, 16.50390625, 17.140625, 17.77734375, 18.4140625, 19.05078125, 19.6875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 9.0, 23.0, 24.0, 57.0, 93.0, 193.0, 442.0, 1088.0, 3333.0, 12521.0, 93431.0, 816959.0, 101808.0, 13122.0, 3392.0, 1129.0, 491.0, 216.0, 100.0, 48.0, 33.0, 15.0, 5.0, 7.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.40625, -41.10205078125, -39.7978515625, -38.49365234375, -37.189453125, -35.88525390625, -34.5810546875, -33.27685546875, -31.97265625, -30.66845703125, -29.3642578125, -28.06005859375, -26.755859375, -25.45166015625, -24.1474609375, -22.84326171875, -21.5390625, -20.23486328125, -18.9306640625, -17.62646484375, -16.322265625, -15.01806640625, -13.7138671875, -12.40966796875, -11.10546875, -9.80126953125, -8.4970703125, -7.19287109375, -5.888671875, -4.58447265625, -3.2802734375, -1.97607421875, -0.671875, 0.63232421875, 1.9365234375, 3.24072265625, 4.544921875, 5.84912109375, 7.1533203125, 8.45751953125, 9.76171875, 11.06591796875, 12.3701171875, 13.67431640625, 14.978515625, 16.28271484375, 17.5869140625, 18.89111328125, 20.1953125, 21.49951171875, 22.8037109375, 24.10791015625, 25.412109375, 26.71630859375, 28.0205078125, 29.32470703125, 30.62890625, 31.93310546875, 33.2373046875, 34.54150390625, 35.845703125, 37.14990234375, 38.4541015625, 39.75830078125, 41.0625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 13.0, 10.0, 25.0, 21.0, 46.0, 78.0, 84.0, 150.0, 198.0, 150.0, 80.0, 40.0, 30.0, 16.0, 10.0, 13.0, 10.0, 1.0, 5.0, 6.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00411224365234375, -0.003972172737121582, -0.003832101821899414, -0.003692030906677246, -0.003551959991455078, -0.00341188907623291, -0.003271818161010742, -0.0031317472457885742, -0.0029916763305664062, -0.0028516054153442383, -0.0027115345001220703, -0.0025714635848999023, -0.0024313926696777344, -0.0022913217544555664, -0.0021512508392333984, -0.0020111799240112305, -0.0018711090087890625, -0.0017310380935668945, -0.0015909671783447266, -0.0014508962631225586, -0.0013108253479003906, -0.0011707544326782227, -0.0010306835174560547, -0.0008906126022338867, -0.0007505416870117188, -0.0006104707717895508, -0.0004703998565673828, -0.00033032894134521484, -0.00019025802612304688, -5.0187110900878906e-05, 8.988380432128906e-05, 0.00022995471954345703, 0.000370025634765625, 0.000510096549987793, 0.0006501674652099609, 0.0007902383804321289, 0.0009303092956542969, 0.0010703802108764648, 0.0012104511260986328, 0.0013505220413208008, 0.0014905929565429688, 0.0016306638717651367, 0.0017707347869873047, 0.0019108057022094727, 0.0020508766174316406, 0.0021909475326538086, 0.0023310184478759766, 0.0024710893630981445, 0.0026111602783203125, 0.0027512311935424805, 0.0028913021087646484, 0.0030313730239868164, 0.0031714439392089844, 0.0033115148544311523, 0.0034515857696533203, 0.0035916566848754883, 0.0037317276000976562, 0.0038717985153198242, 0.004011869430541992, 0.00415194034576416, 0.004292011260986328, 0.004432082176208496, 0.004572153091430664, 0.004712224006652832, 0.004852294921875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 5.0, 12.0, 10.0, 15.0, 32.0, 48.0, 90.0, 149.0, 243.0, 537.0, 1092.0, 2717.0, 8867.0, 45454.0, 689362.0, 266488.0, 24089.0, 5659.0, 1865.0, 842.0, 406.0, 222.0, 127.0, 67.0, 40.0, 30.0, 23.0, 12.0, 8.0, 9.0, 3.0, 6.0, 4.0, 7.0, 1.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-47.78125, -46.48388671875, -45.1865234375, -43.88916015625, -42.591796875, -41.29443359375, -39.9970703125, -38.69970703125, -37.40234375, -36.10498046875, -34.8076171875, -33.51025390625, -32.212890625, -30.91552734375, -29.6181640625, -28.32080078125, -27.0234375, -25.72607421875, -24.4287109375, -23.13134765625, -21.833984375, -20.53662109375, -19.2392578125, -17.94189453125, -16.64453125, -15.34716796875, -14.0498046875, -12.75244140625, -11.455078125, -10.15771484375, -8.8603515625, -7.56298828125, -6.265625, -4.96826171875, -3.6708984375, -2.37353515625, -1.076171875, 0.22119140625, 1.5185546875, 2.81591796875, 4.11328125, 5.41064453125, 6.7080078125, 8.00537109375, 9.302734375, 10.60009765625, 11.8974609375, 13.19482421875, 14.4921875, 15.78955078125, 17.0869140625, 18.38427734375, 19.681640625, 20.97900390625, 22.2763671875, 23.57373046875, 24.87109375, 26.16845703125, 27.4658203125, 28.76318359375, 30.060546875, 31.35791015625, 32.6552734375, 33.95263671875, 35.25]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 7.0, 3.0, 3.0, 2.0, 10.0, 11.0, 13.0, 26.0, 34.0, 39.0, 62.0, 68.0, 110.0, 135.0, 122.0, 99.0, 70.0, 52.0, 38.0, 23.0, 17.0, 9.0, 9.0, 7.0, 9.0, 7.0, 7.0, 3.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.671875, -19.07470703125, -18.4775390625, -17.88037109375, -17.283203125, -16.68603515625, -16.0888671875, -15.49169921875, -14.89453125, -14.29736328125, -13.7001953125, -13.10302734375, -12.505859375, -11.90869140625, -11.3115234375, -10.71435546875, -10.1171875, -9.52001953125, -8.9228515625, -8.32568359375, -7.728515625, -7.13134765625, -6.5341796875, -5.93701171875, -5.33984375, -4.74267578125, -4.1455078125, -3.54833984375, -2.951171875, -2.35400390625, -1.7568359375, -1.15966796875, -0.5625, 0.03466796875, 0.6318359375, 1.22900390625, 1.826171875, 2.42333984375, 3.0205078125, 3.61767578125, 4.21484375, 4.81201171875, 5.4091796875, 6.00634765625, 6.603515625, 7.20068359375, 7.7978515625, 8.39501953125, 8.9921875, 9.58935546875, 10.1865234375, 10.78369140625, 11.380859375, 11.97802734375, 12.5751953125, 13.17236328125, 13.76953125, 14.36669921875, 14.9638671875, 15.56103515625, 16.158203125, 16.75537109375, 17.3525390625, 17.94970703125, 18.546875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 13.0, 17.0, 49.0, 79.0, 122.0, 162.0, 226.0, 158.0, 94.0, 50.0, 18.0, 11.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-443.2331237792969, -431.9515075683594, -420.6698913574219, -409.38824462890625, -398.10662841796875, -386.82501220703125, -375.54339599609375, -364.26177978515625, -352.98016357421875, -341.69854736328125, -330.41693115234375, -319.13531494140625, -307.8536682128906, -296.5720520019531, -285.2904357910156, -274.0088195800781, -262.7271728515625, -251.445556640625, -240.16392517089844, -228.88230895996094, -217.60069274902344, -206.31906127929688, -195.03744506835938, -183.75582885742188, -172.47421264648438, -161.19259643554688, -149.9109649658203, -138.6293487548828, -127.34773254394531, -116.06610870361328, -104.78448486328125, -93.50286865234375, -82.22125244140625, -70.93962860107422, -59.65801239013672, -48.37638854980469, -37.09476852416992, -25.813148498535156, -14.531524658203125, -3.249908447265625, 8.031715393066406, 19.313335418701172, 30.59495735168457, 41.87657928466797, 53.158199310302734, 64.4398193359375, 75.72144317626953, 87.00305938720703, 98.28468322753906, 109.5663070678711, 120.8479232788086, 132.12954711914062, 143.41116333007812, 154.69277954101562, 165.9744110107422, 177.2560272216797, 188.53765869140625, 199.81927490234375, 211.1009063720703, 222.3825225830078, 233.6641387939453, 244.94577026367188, 256.2273864746094, 267.5090026855469, 278.7906188964844]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 8.0, 5.0, 12.0, 18.0, 22.0, 34.0, 42.0, 56.0, 69.0, 58.0, 58.0, 86.0, 83.0, 68.0, 67.0, 67.0, 48.0, 50.0, 57.0, 38.0, 25.0, 13.0, 9.0, 10.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-255.7662353515625, -248.75341796875, -241.7406005859375, -234.727783203125, -227.7149658203125, -220.7021484375, -213.6893310546875, -206.676513671875, -199.6636962890625, -192.65087890625, -185.6380615234375, -178.625244140625, -171.6124267578125, -164.599609375, -157.5867919921875, -150.573974609375, -143.5611572265625, -136.54833984375, -129.5355224609375, -122.522705078125, -115.5098876953125, -108.4970703125, -101.4842529296875, -94.471435546875, -87.45860290527344, -80.44578552246094, -73.43296813964844, -66.42015075683594, -59.40733337402344, -52.39451217651367, -45.38169479370117, -38.36887741088867, -31.356063842773438, -24.343246459960938, -17.330429077148438, -10.317609786987305, -3.3047924041748047, 3.708026885986328, 10.720844268798828, 17.733661651611328, 24.746479034423828, 31.759296417236328, 38.77211380004883, 45.784934997558594, 52.797752380371094, 59.810569763183594, 66.8233871459961, 73.8362045288086, 80.8490219116211, 87.8618392944336, 94.8746566772461, 101.8874740600586, 108.9002914428711, 115.91311645507812, 122.92593383789062, 129.93875122070312, 136.95156860351562, 143.96438598632812, 150.97720336914062, 157.99002075195312, 165.00283813476562, 172.01565551757812, 179.02847290039062, 186.04129028320312, 193.05410766601562]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 1.0, 6.0, 10.0, 11.0, 10.0, 21.0, 14.0, 30.0, 33.0, 32.0, 57.0, 67.0, 57.0, 96.0, 107.0, 121.0, 178.0, 246.0, 383.0, 590.0, 902.0, 1617.0, 2690.0, 5164.0, 10370.0, 23585.0, 83345.0, 2735943.0, 1216937.0, 68542.0, 21254.0, 9808.0, 5111.0, 2851.0, 1649.0, 881.0, 531.0, 316.0, 206.0, 148.0, 95.0, 81.0, 41.0, 45.0, 29.0, 26.0, 18.0, 4.0, 6.0, 3.0, 7.0, 5.0, 1.0, 2.0, 2.0, 1.0], "bins": [-56.34375, -54.77587890625, -53.2080078125, -51.64013671875, -50.072265625, -48.50439453125, -46.9365234375, -45.36865234375, -43.80078125, -42.23291015625, -40.6650390625, -39.09716796875, -37.529296875, -35.96142578125, -34.3935546875, -32.82568359375, -31.2578125, -29.68994140625, -28.1220703125, -26.55419921875, -24.986328125, -23.41845703125, -21.8505859375, -20.28271484375, -18.71484375, -17.14697265625, -15.5791015625, -14.01123046875, -12.443359375, -10.87548828125, -9.3076171875, -7.73974609375, -6.171875, -4.60400390625, -3.0361328125, -1.46826171875, 0.099609375, 1.66748046875, 3.2353515625, 4.80322265625, 6.37109375, 7.93896484375, 9.5068359375, 11.07470703125, 12.642578125, 14.21044921875, 15.7783203125, 17.34619140625, 18.9140625, 20.48193359375, 22.0498046875, 23.61767578125, 25.185546875, 26.75341796875, 28.3212890625, 29.88916015625, 31.45703125, 33.02490234375, 34.5927734375, 36.16064453125, 37.728515625, 39.29638671875, 40.8642578125, 42.43212890625, 44.0]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 11.0, 11.0, 24.0, 23.0, 32.0, 37.0, 36.0, 53.0, 66.0, 60.0, 83.0, 71.0, 55.0, 65.0, 68.0, 65.0, 61.0, 37.0, 30.0, 29.0, 19.0, 18.0, 9.0, 11.0, 7.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-10.7265625, -10.46923828125, -10.2119140625, -9.95458984375, -9.697265625, -9.43994140625, -9.1826171875, -8.92529296875, -8.66796875, -8.41064453125, -8.1533203125, -7.89599609375, -7.638671875, -7.38134765625, -7.1240234375, -6.86669921875, -6.609375, -6.35205078125, -6.0947265625, -5.83740234375, -5.580078125, -5.32275390625, -5.0654296875, -4.80810546875, -4.55078125, -4.29345703125, -4.0361328125, -3.77880859375, -3.521484375, -3.26416015625, -3.0068359375, -2.74951171875, -2.4921875, -2.23486328125, -1.9775390625, -1.72021484375, -1.462890625, -1.20556640625, -0.9482421875, -0.69091796875, -0.43359375, -0.17626953125, 0.0810546875, 0.33837890625, 0.595703125, 0.85302734375, 1.1103515625, 1.36767578125, 1.625, 1.88232421875, 2.1396484375, 2.39697265625, 2.654296875, 2.91162109375, 3.1689453125, 3.42626953125, 3.68359375, 3.94091796875, 4.1982421875, 4.45556640625, 4.712890625, 4.97021484375, 5.2275390625, 5.48486328125, 5.7421875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 8.0, 5.0, 18.0, 13.0, 26.0, 43.0, 62.0, 111.0, 273.0, 1077.0, 7526.0, 213800.0, 3947913.0, 20281.0, 2255.0, 476.0, 163.0, 79.0, 46.0, 33.0, 26.0, 20.0, 12.0, 11.0, 8.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.1875, -80.8662109375, -75.544921875, -70.2236328125, -64.90234375, -59.5810546875, -54.259765625, -48.9384765625, -43.6171875, -38.2958984375, -32.974609375, -27.6533203125, -22.33203125, -17.0107421875, -11.689453125, -6.3681640625, -1.046875, 4.2744140625, 9.595703125, 14.9169921875, 20.23828125, 25.5595703125, 30.880859375, 36.2021484375, 41.5234375, 46.8447265625, 52.166015625, 57.4873046875, 62.80859375, 68.1298828125, 73.451171875, 78.7724609375, 84.09375, 89.4150390625, 94.736328125, 100.0576171875, 105.37890625, 110.7001953125, 116.021484375, 121.3427734375, 126.6640625, 131.9853515625, 137.306640625, 142.6279296875, 147.94921875, 153.2705078125, 158.591796875, 163.9130859375, 169.234375, 174.5556640625, 179.876953125, 185.1982421875, 190.51953125, 195.8408203125, 201.162109375, 206.4833984375, 211.8046875, 217.1259765625, 222.447265625, 227.7685546875, 233.08984375, 238.4111328125, 243.732421875, 249.0537109375, 254.375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 9.0, 6.0, 11.0, 17.0, 34.0, 54.0, 97.0, 267.0, 1386.0, 1710.0, 254.0, 90.0, 54.0, 31.0, 22.0, 11.0, 10.0, 2.0, 6.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.828125, -19.607177734375, -18.38623046875, -17.165283203125, -15.9443359375, -14.723388671875, -13.50244140625, -12.281494140625, -11.060546875, -9.839599609375, -8.61865234375, -7.397705078125, -6.1767578125, -4.955810546875, -3.73486328125, -2.513916015625, -1.29296875, -0.072021484375, 1.14892578125, 2.369873046875, 3.5908203125, 4.811767578125, 6.03271484375, 7.253662109375, 8.474609375, 9.695556640625, 10.91650390625, 12.137451171875, 13.3583984375, 14.579345703125, 15.80029296875, 17.021240234375, 18.2421875, 19.463134765625, 20.68408203125, 21.905029296875, 23.1259765625, 24.346923828125, 25.56787109375, 26.788818359375, 28.009765625, 29.230712890625, 30.45166015625, 31.672607421875, 32.8935546875, 34.114501953125, 35.33544921875, 36.556396484375, 37.77734375, 38.998291015625, 40.21923828125, 41.440185546875, 42.6611328125, 43.882080078125, 45.10302734375, 46.323974609375, 47.544921875, 48.765869140625, 49.98681640625, 51.207763671875, 52.4287109375, 53.649658203125, 54.87060546875, 56.091552734375, 57.3125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 6.0, 2.0, 8.0, 15.0, 9.0, 16.0, 32.0, 40.0, 47.0, 69.0, 97.0, 108.0, 126.0, 117.0, 74.0, 52.0, 52.0, 27.0, 21.0, 17.0, 7.0, 8.0, 15.0, 5.0, 9.0, 4.0, 1.0, 3.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-125.87464141845703, -122.41179656982422, -118.94894409179688, -115.48609924316406, -112.02325439453125, -108.5604019165039, -105.0975570678711, -101.63470458984375, -98.17185974121094, -94.70901489257812, -91.24616241455078, -87.78331756591797, -84.32046508789062, -80.85762023925781, -77.394775390625, -73.93193054199219, -70.46907806396484, -67.00623321533203, -63.54338073730469, -60.080535888671875, -56.6176872253418, -53.15483856201172, -49.691993713378906, -46.22914505004883, -42.76629638671875, -39.30344772338867, -35.840599060058594, -32.37775421142578, -28.914905548095703, -25.452056884765625, -21.98921012878418, -18.526363372802734, -15.063522338867188, -11.600674629211426, -8.137826919555664, -4.674979209899902, -1.2121315002441406, 2.2507171630859375, 5.713563919067383, 9.176410675048828, 12.639259338378906, 16.102108001708984, 19.56495475769043, 23.027801513671875, 26.490650177001953, 29.95349884033203, 33.416343688964844, 36.87919235229492, 40.342041015625, 43.80488967895508, 47.267738342285156, 50.73058319091797, 54.19343185424805, 57.656280517578125, 61.11912536621094, 64.58197021484375, 68.0448226928711, 71.5076675415039, 74.97052001953125, 78.43336486816406, 81.89620971679688, 85.35906219482422, 88.82190704345703, 92.28475952148438, 95.74760437011719]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 11.0, 6.0, 11.0, 12.0, 11.0, 15.0, 21.0, 29.0, 32.0, 31.0, 42.0, 33.0, 43.0, 63.0, 64.0, 55.0, 60.0, 48.0, 55.0, 60.0, 51.0, 47.0, 30.0, 26.0, 29.0, 27.0, 19.0, 25.0, 9.0, 10.0, 7.0, 10.0, 5.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.40242767333984, -91.37747192382812, -88.3525161743164, -85.32756042480469, -82.30260467529297, -79.27764892578125, -76.25269317626953, -73.22773742675781, -70.2027816772461, -67.17782592773438, -64.15287017822266, -61.12791442871094, -58.10295867919922, -55.0780029296875, -52.05304718017578, -49.02809143066406, -46.003135681152344, -42.978179931640625, -39.953224182128906, -36.92826843261719, -33.90331268310547, -30.87835693359375, -27.85340118408203, -24.828445434570312, -21.803489685058594, -18.778533935546875, -15.753578186035156, -12.728622436523438, -9.703666687011719, -6.6787109375, -3.6537551879882812, -0.6287994384765625, 2.3961639404296875, 5.421119689941406, 8.446075439453125, 11.471031188964844, 14.495986938476562, 17.52094268798828, 20.5458984375, 23.57085418701172, 26.595809936523438, 29.620765686035156, 32.645721435546875, 35.670677185058594, 38.69563293457031, 41.72058868408203, 44.74554443359375, 47.77050018310547, 50.79545593261719, 53.820411682128906, 56.845367431640625, 59.870323181152344, 62.89527893066406, 65.92023468017578, 68.9451904296875, 71.97014617919922, 74.99510192871094, 78.02005767822266, 81.04501342773438, 84.0699691772461, 87.09492492675781, 90.11988067626953, 93.14483642578125, 96.16979217529297, 99.19474792480469]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 4.0, 15.0, 10.0, 7.0, 16.0, 12.0, 18.0, 32.0, 54.0, 81.0, 84.0, 138.0, 232.0, 348.0, 569.0, 991.0, 1784.0, 3509.0, 7293.0, 16767.0, 44687.0, 151636.0, 524759.0, 201692.0, 56023.0, 20341.0, 8517.0, 3946.0, 2128.0, 1077.0, 669.0, 365.0, 254.0, 137.0, 104.0, 76.0, 40.0, 41.0, 25.0, 18.0, 12.0, 12.0, 9.0, 8.0, 5.0, 5.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.90625, -35.7001953125, -34.494140625, -33.2880859375, -32.08203125, -30.8759765625, -29.669921875, -28.4638671875, -27.2578125, -26.0517578125, -24.845703125, -23.6396484375, -22.43359375, -21.2275390625, -20.021484375, -18.8154296875, -17.609375, -16.4033203125, -15.197265625, -13.9912109375, -12.78515625, -11.5791015625, -10.373046875, -9.1669921875, -7.9609375, -6.7548828125, -5.548828125, -4.3427734375, -3.13671875, -1.9306640625, -0.724609375, 0.4814453125, 1.6875, 2.8935546875, 4.099609375, 5.3056640625, 6.51171875, 7.7177734375, 8.923828125, 10.1298828125, 11.3359375, 12.5419921875, 13.748046875, 14.9541015625, 16.16015625, 17.3662109375, 18.572265625, 19.7783203125, 20.984375, 22.1904296875, 23.396484375, 24.6025390625, 25.80859375, 27.0146484375, 28.220703125, 29.4267578125, 30.6328125, 31.8388671875, 33.044921875, 34.2509765625, 35.45703125, 36.6630859375, 37.869140625, 39.0751953125, 40.28125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 1.0, 14.0, 16.0, 18.0, 19.0, 39.0, 32.0, 33.0, 58.0, 56.0, 50.0, 64.0, 40.0, 61.0, 67.0, 66.0, 66.0, 45.0, 44.0, 41.0, 31.0, 41.0, 23.0, 21.0, 16.0, 9.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.25, -8.98138427734375, -8.7127685546875, -8.44415283203125, -8.175537109375, -7.90692138671875, -7.6383056640625, -7.36968994140625, -7.10107421875, -6.83245849609375, -6.5638427734375, -6.29522705078125, -6.026611328125, -5.75799560546875, -5.4893798828125, -5.22076416015625, -4.9521484375, -4.68353271484375, -4.4149169921875, -4.14630126953125, -3.877685546875, -3.60906982421875, -3.3404541015625, -3.07183837890625, -2.80322265625, -2.53460693359375, -2.2659912109375, -1.99737548828125, -1.728759765625, -1.46014404296875, -1.1915283203125, -0.92291259765625, -0.654296875, -0.38568115234375, -0.1170654296875, 0.15155029296875, 0.420166015625, 0.68878173828125, 0.9573974609375, 1.22601318359375, 1.49462890625, 1.76324462890625, 2.0318603515625, 2.30047607421875, 2.569091796875, 2.83770751953125, 3.1063232421875, 3.37493896484375, 3.6435546875, 3.91217041015625, 4.1807861328125, 4.44940185546875, 4.718017578125, 4.98663330078125, 5.2552490234375, 5.52386474609375, 5.79248046875, 6.06109619140625, 6.3297119140625, 6.59832763671875, 6.866943359375, 7.13555908203125, 7.4041748046875, 7.67279052734375, 7.94140625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 10.0, 7.0, 9.0, 19.0, 26.0, 39.0, 72.0, 75.0, 142.0, 277.0, 594.0, 1379.0, 3915.0, 14010.0, 73451.0, 630447.0, 275729.0, 35633.0, 8194.0, 2498.0, 1008.0, 439.0, 232.0, 124.0, 73.0, 43.0, 30.0, 26.0, 18.0, 12.0, 10.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-58.0, -56.23193359375, -54.4638671875, -52.69580078125, -50.927734375, -49.15966796875, -47.3916015625, -45.62353515625, -43.85546875, -42.08740234375, -40.3193359375, -38.55126953125, -36.783203125, -35.01513671875, -33.2470703125, -31.47900390625, -29.7109375, -27.94287109375, -26.1748046875, -24.40673828125, -22.638671875, -20.87060546875, -19.1025390625, -17.33447265625, -15.56640625, -13.79833984375, -12.0302734375, -10.26220703125, -8.494140625, -6.72607421875, -4.9580078125, -3.18994140625, -1.421875, 0.34619140625, 2.1142578125, 3.88232421875, 5.650390625, 7.41845703125, 9.1865234375, 10.95458984375, 12.72265625, 14.49072265625, 16.2587890625, 18.02685546875, 19.794921875, 21.56298828125, 23.3310546875, 25.09912109375, 26.8671875, 28.63525390625, 30.4033203125, 32.17138671875, 33.939453125, 35.70751953125, 37.4755859375, 39.24365234375, 41.01171875, 42.77978515625, 44.5478515625, 46.31591796875, 48.083984375, 49.85205078125, 51.6201171875, 53.38818359375, 55.15625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 3.0, 3.0, 9.0, 9.0, 7.0, 8.0, 16.0, 12.0, 11.0, 29.0, 24.0, 40.0, 38.0, 43.0, 37.0, 50.0, 71.0, 28.0, 59.0, 54.0, 52.0, 51.0, 41.0, 42.0, 37.0, 30.0, 38.0, 24.0, 31.0, 17.0, 21.0, 22.0, 12.0, 8.0, 7.0, 7.0, 4.0, 0.0, 3.0, 1.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.9375, -30.945556640625, -29.95361328125, -28.961669921875, -27.9697265625, -26.977783203125, -25.98583984375, -24.993896484375, -24.001953125, -23.010009765625, -22.01806640625, -21.026123046875, -20.0341796875, -19.042236328125, -18.05029296875, -17.058349609375, -16.06640625, -15.074462890625, -14.08251953125, -13.090576171875, -12.0986328125, -11.106689453125, -10.11474609375, -9.122802734375, -8.130859375, -7.138916015625, -6.14697265625, -5.155029296875, -4.1630859375, -3.171142578125, -2.17919921875, -1.187255859375, -0.1953125, 0.796630859375, 1.78857421875, 2.780517578125, 3.7724609375, 4.764404296875, 5.75634765625, 6.748291015625, 7.740234375, 8.732177734375, 9.72412109375, 10.716064453125, 11.7080078125, 12.699951171875, 13.69189453125, 14.683837890625, 15.67578125, 16.667724609375, 17.65966796875, 18.651611328125, 19.6435546875, 20.635498046875, 21.62744140625, 22.619384765625, 23.611328125, 24.603271484375, 25.59521484375, 26.587158203125, 27.5791015625, 28.571044921875, 29.56298828125, 30.554931640625, 31.546875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 9.0, 6.0, 6.0, 15.0, 19.0, 23.0, 45.0, 94.0, 130.0, 207.0, 322.0, 528.0, 967.0, 1759.0, 3644.0, 8556.0, 26581.0, 153484.0, 759601.0, 64483.0, 16138.0, 6037.0, 2729.0, 1364.0, 727.0, 411.0, 247.0, 144.0, 101.0, 65.0, 35.0, 25.0, 21.0, 9.0, 3.0, 6.0, 3.0, 5.0, 3.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-48.03125, -46.7080078125, -45.384765625, -44.0615234375, -42.73828125, -41.4150390625, -40.091796875, -38.7685546875, -37.4453125, -36.1220703125, -34.798828125, -33.4755859375, -32.15234375, -30.8291015625, -29.505859375, -28.1826171875, -26.859375, -25.5361328125, -24.212890625, -22.8896484375, -21.56640625, -20.2431640625, -18.919921875, -17.5966796875, -16.2734375, -14.9501953125, -13.626953125, -12.3037109375, -10.98046875, -9.6572265625, -8.333984375, -7.0107421875, -5.6875, -4.3642578125, -3.041015625, -1.7177734375, -0.39453125, 0.9287109375, 2.251953125, 3.5751953125, 4.8984375, 6.2216796875, 7.544921875, 8.8681640625, 10.19140625, 11.5146484375, 12.837890625, 14.1611328125, 15.484375, 16.8076171875, 18.130859375, 19.4541015625, 20.77734375, 22.1005859375, 23.423828125, 24.7470703125, 26.0703125, 27.3935546875, 28.716796875, 30.0400390625, 31.36328125, 32.6865234375, 34.009765625, 35.3330078125, 36.65625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 2.0, 6.0, 7.0, 5.0, 5.0, 11.0, 9.0, 18.0, 19.0, 34.0, 48.0, 105.0, 264.0, 208.0, 93.0, 38.0, 22.0, 23.0, 10.0, 14.0, 10.0, 9.0, 6.0, 4.0, 3.0, 5.0, 5.0, 1.0, 0.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.00494384765625, -0.004788637161254883, -0.004633426666259766, -0.0044782161712646484, -0.004323005676269531, -0.004167795181274414, -0.004012584686279297, -0.0038573741912841797, -0.0037021636962890625, -0.0035469532012939453, -0.003391742706298828, -0.003236532211303711, -0.0030813217163085938, -0.0029261112213134766, -0.0027709007263183594, -0.002615690231323242, -0.002460479736328125, -0.002305269241333008, -0.0021500587463378906, -0.0019948482513427734, -0.0018396377563476562, -0.001684427261352539, -0.0015292167663574219, -0.0013740062713623047, -0.0012187957763671875, -0.0010635852813720703, -0.0009083747863769531, -0.0007531642913818359, -0.0005979537963867188, -0.00044274330139160156, -0.0002875328063964844, -0.0001323223114013672, 2.288818359375e-05, 0.0001780986785888672, 0.0003333091735839844, 0.0004885196685791016, 0.0006437301635742188, 0.0007989406585693359, 0.0009541511535644531, 0.0011093616485595703, 0.0012645721435546875, 0.0014197826385498047, 0.0015749931335449219, 0.001730203628540039, 0.0018854141235351562, 0.0020406246185302734, 0.0021958351135253906, 0.002351045608520508, 0.002506256103515625, 0.002661466598510742, 0.0028166770935058594, 0.0029718875885009766, 0.0031270980834960938, 0.003282308578491211, 0.003437519073486328, 0.0035927295684814453, 0.0037479400634765625, 0.0039031505584716797, 0.004058361053466797, 0.004213571548461914, 0.004368782043457031, 0.0045239925384521484, 0.004679203033447266, 0.004834413528442383, 0.0049896240234375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 5.0, 10.0, 12.0, 23.0, 27.0, 43.0, 83.0, 144.0, 287.0, 677.0, 1994.0, 7802.0, 50189.0, 905467.0, 68774.0, 9212.0, 2347.0, 741.0, 323.0, 152.0, 73.0, 59.0, 36.0, 22.0, 17.0, 8.0, 7.0, 4.0, 4.0, 4.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-84.9375, -82.79052734375, -80.6435546875, -78.49658203125, -76.349609375, -74.20263671875, -72.0556640625, -69.90869140625, -67.76171875, -65.61474609375, -63.4677734375, -61.32080078125, -59.173828125, -57.02685546875, -54.8798828125, -52.73291015625, -50.5859375, -48.43896484375, -46.2919921875, -44.14501953125, -41.998046875, -39.85107421875, -37.7041015625, -35.55712890625, -33.41015625, -31.26318359375, -29.1162109375, -26.96923828125, -24.822265625, -22.67529296875, -20.5283203125, -18.38134765625, -16.234375, -14.08740234375, -11.9404296875, -9.79345703125, -7.646484375, -5.49951171875, -3.3525390625, -1.20556640625, 0.94140625, 3.08837890625, 5.2353515625, 7.38232421875, 9.529296875, 11.67626953125, 13.8232421875, 15.97021484375, 18.1171875, 20.26416015625, 22.4111328125, 24.55810546875, 26.705078125, 28.85205078125, 30.9990234375, 33.14599609375, 35.29296875, 37.43994140625, 39.5869140625, 41.73388671875, 43.880859375, 46.02783203125, 48.1748046875, 50.32177734375, 52.46875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 3.0, 4.0, 8.0, 7.0, 11.0, 14.0, 27.0, 34.0, 34.0, 69.0, 158.0, 255.0, 154.0, 70.0, 49.0, 32.0, 16.0, 14.0, 9.0, 14.0, 6.0, 7.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.21875, -39.05322265625, -37.8876953125, -36.72216796875, -35.556640625, -34.39111328125, -33.2255859375, -32.06005859375, -30.89453125, -29.72900390625, -28.5634765625, -27.39794921875, -26.232421875, -25.06689453125, -23.9013671875, -22.73583984375, -21.5703125, -20.40478515625, -19.2392578125, -18.07373046875, -16.908203125, -15.74267578125, -14.5771484375, -13.41162109375, -12.24609375, -11.08056640625, -9.9150390625, -8.74951171875, -7.583984375, -6.41845703125, -5.2529296875, -4.08740234375, -2.921875, -1.75634765625, -0.5908203125, 0.57470703125, 1.740234375, 2.90576171875, 4.0712890625, 5.23681640625, 6.40234375, 7.56787109375, 8.7333984375, 9.89892578125, 11.064453125, 12.22998046875, 13.3955078125, 14.56103515625, 15.7265625, 16.89208984375, 18.0576171875, 19.22314453125, 20.388671875, 21.55419921875, 22.7197265625, 23.88525390625, 25.05078125, 26.21630859375, 27.3818359375, 28.54736328125, 29.712890625, 30.87841796875, 32.0439453125, 33.20947265625, 34.375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 8.0, 7.0, 10.0, 23.0, 44.0, 84.0, 145.0, 226.0, 197.0, 124.0, 72.0, 32.0, 21.0, 10.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-508.4537048339844, -493.4522399902344, -478.45074462890625, -463.44927978515625, -448.4477844238281, -433.4463195800781, -418.44482421875, -403.443359375, -388.44189453125, -373.4404296875, -358.4389343261719, -343.4374694824219, -328.43597412109375, -313.43450927734375, -298.43304443359375, -283.4315490722656, -268.4300537109375, -253.42857360839844, -238.42709350585938, -223.42562866210938, -208.42413330078125, -193.42266845703125, -178.4211883544922, -163.41970825195312, -148.41822814941406, -133.416748046875, -118.41526794433594, -103.4137954711914, -88.41231536865234, -73.41083526611328, -58.40936279296875, -43.40788269042969, -28.4063720703125, -13.40489387512207, 1.5965843200683594, 16.598060607910156, 31.59954071044922, 46.60102081298828, 61.60249328613281, 76.60397338867188, 91.60545349121094, 106.60693359375, 121.60841369628906, 136.60989379882812, 151.61135864257812, 166.61285400390625, 181.61431884765625, 196.6157989501953, 211.61727905273438, 226.61875915527344, 241.6202392578125, 256.6217041015625, 271.6231994628906, 286.6246643066406, 301.62615966796875, 316.62762451171875, 331.62908935546875, 346.63055419921875, 361.6320495605469, 376.6335144042969, 391.635009765625, 406.636474609375, 421.637939453125, 436.6394348144531, 451.64093017578125]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 9.0, 12.0, 2.0, 10.0, 12.0, 10.0, 12.0, 21.0, 13.0, 19.0, 35.0, 38.0, 24.0, 33.0, 35.0, 43.0, 39.0, 60.0, 44.0, 49.0, 52.0, 35.0, 44.0, 42.0, 38.0, 27.0, 30.0, 28.0, 41.0, 21.0, 25.0, 17.0, 20.0, 16.0, 12.0, 7.0, 6.0, 7.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.48416137695312, -155.19436645507812, -149.9045867919922, -144.6147918701172, -139.3249969482422, -134.03521728515625, -128.74542236328125, -123.45563507080078, -118.16584777832031, -112.87606048583984, -107.58626556396484, -102.29647827148438, -97.0066909790039, -91.71690368652344, -86.42710876464844, -81.13732147216797, -75.84752655029297, -70.5577392578125, -65.2679443359375, -59.97815704345703, -54.68836975097656, -49.39857864379883, -44.108787536621094, -38.819000244140625, -33.52920913696289, -28.23941993713379, -22.949630737304688, -17.659839630126953, -12.370050430297852, -7.08026123046875, -1.7904701232910156, 3.499317169189453, 8.789108276367188, 14.078897476196289, 19.36868667602539, 24.658477783203125, 29.948266983032227, 35.23805618286133, 40.52784729003906, 45.81763458251953, 51.107425689697266, 56.397216796875, 61.68700408935547, 66.97679138183594, 72.26658630371094, 77.5563735961914, 82.84616088867188, 88.13595581054688, 93.42574310302734, 98.71553039550781, 104.00532531738281, 109.29511260986328, 114.58489990234375, 119.87469482421875, 125.16448211669922, 130.4542694091797, 135.7440643310547, 141.0338592529297, 146.32363891601562, 151.61343383789062, 156.90322875976562, 162.19300842285156, 167.48280334472656, 172.7725830078125, 178.0623779296875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 4.0, 3.0, 1.0, 4.0, 3.0, 0.0, 4.0, 3.0, 5.0, 5.0, 4.0, 16.0, 14.0, 22.0, 35.0, 54.0, 48.0, 86.0, 115.0, 159.0, 249.0, 373.0, 623.0, 1095.0, 1914.0, 4001.0, 9785.0, 39600.0, 3220982.0, 867434.0, 30800.0, 8892.0, 3646.0, 1771.0, 970.0, 562.0, 324.0, 215.0, 160.0, 93.0, 74.0, 37.0, 27.0, 16.0, 19.0, 17.0, 9.0, 5.0, 7.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-90.875, -88.115234375, -85.35546875, -82.595703125, -79.8359375, -77.076171875, -74.31640625, -71.556640625, -68.796875, -66.037109375, -63.27734375, -60.517578125, -57.7578125, -54.998046875, -52.23828125, -49.478515625, -46.71875, -43.958984375, -41.19921875, -38.439453125, -35.6796875, -32.919921875, -30.16015625, -27.400390625, -24.640625, -21.880859375, -19.12109375, -16.361328125, -13.6015625, -10.841796875, -8.08203125, -5.322265625, -2.5625, 0.197265625, 2.95703125, 5.716796875, 8.4765625, 11.236328125, 13.99609375, 16.755859375, 19.515625, 22.275390625, 25.03515625, 27.794921875, 30.5546875, 33.314453125, 36.07421875, 38.833984375, 41.59375, 44.353515625, 47.11328125, 49.873046875, 52.6328125, 55.392578125, 58.15234375, 60.912109375, 63.671875, 66.431640625, 69.19140625, 71.951171875, 74.7109375, 77.470703125, 80.23046875, 82.990234375, 85.75]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 7.0, 5.0, 7.0, 6.0, 16.0, 18.0, 19.0, 19.0, 20.0, 25.0, 38.0, 43.0, 49.0, 53.0, 49.0, 55.0, 49.0, 54.0, 70.0, 38.0, 50.0, 47.0, 43.0, 46.0, 36.0, 28.0, 25.0, 25.0, 17.0, 13.0, 7.0, 10.0, 5.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.6484375, -8.39520263671875, -8.1419677734375, -7.88873291015625, -7.635498046875, -7.38226318359375, -7.1290283203125, -6.87579345703125, -6.62255859375, -6.36932373046875, -6.1160888671875, -5.86285400390625, -5.609619140625, -5.35638427734375, -5.1031494140625, -4.84991455078125, -4.5966796875, -4.34344482421875, -4.0902099609375, -3.83697509765625, -3.583740234375, -3.33050537109375, -3.0772705078125, -2.82403564453125, -2.57080078125, -2.31756591796875, -2.0643310546875, -1.81109619140625, -1.557861328125, -1.30462646484375, -1.0513916015625, -0.79815673828125, -0.544921875, -0.29168701171875, -0.0384521484375, 0.21478271484375, 0.468017578125, 0.72125244140625, 0.9744873046875, 1.22772216796875, 1.48095703125, 1.73419189453125, 1.9874267578125, 2.24066162109375, 2.493896484375, 2.74713134765625, 3.0003662109375, 3.25360107421875, 3.5068359375, 3.76007080078125, 4.0133056640625, 4.26654052734375, 4.519775390625, 4.77301025390625, 5.0262451171875, 5.27947998046875, 5.53271484375, 5.78594970703125, 6.0391845703125, 6.29241943359375, 6.545654296875, 6.79888916015625, 7.0521240234375, 7.30535888671875, 7.55859375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 8.0, 12.0, 19.0, 21.0, 33.0, 39.0, 54.0, 80.0, 113.0, 492.0, 14742.0, 4155189.0, 22407.0, 676.0, 102.0, 84.0, 60.0, 53.0, 39.0, 11.0, 17.0, 16.0, 8.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-193.125, -182.123046875, -171.12109375, -160.119140625, -149.1171875, -138.115234375, -127.11328125, -116.111328125, -105.109375, -94.107421875, -83.10546875, -72.103515625, -61.1015625, -50.099609375, -39.09765625, -28.095703125, -17.09375, -6.091796875, 4.91015625, 15.912109375, 26.9140625, 37.916015625, 48.91796875, 59.919921875, 70.921875, 81.923828125, 92.92578125, 103.927734375, 114.9296875, 125.931640625, 136.93359375, 147.935546875, 158.9375, 169.939453125, 180.94140625, 191.943359375, 202.9453125, 213.947265625, 224.94921875, 235.951171875, 246.953125, 257.955078125, 268.95703125, 279.958984375, 290.9609375, 301.962890625, 312.96484375, 323.966796875, 334.96875, 345.970703125, 356.97265625, 367.974609375, 378.9765625, 389.978515625, 400.98046875, 411.982421875, 422.984375, 433.986328125, 444.98828125, 455.990234375, 466.9921875, 477.994140625, 488.99609375, 499.998046875, 511.0]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 6.0, 5.0, 14.0, 19.0, 27.0, 66.0, 411.0, 3188.0, 243.0, 52.0, 30.0, 10.0, 10.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.609375, -21.334228515625, -19.05908203125, -16.783935546875, -14.5087890625, -12.233642578125, -9.95849609375, -7.683349609375, -5.408203125, -3.133056640625, -0.85791015625, 1.417236328125, 3.6923828125, 5.967529296875, 8.24267578125, 10.517822265625, 12.79296875, 15.068115234375, 17.34326171875, 19.618408203125, 21.8935546875, 24.168701171875, 26.44384765625, 28.718994140625, 30.994140625, 33.269287109375, 35.54443359375, 37.819580078125, 40.0947265625, 42.369873046875, 44.64501953125, 46.920166015625, 49.1953125, 51.470458984375, 53.74560546875, 56.020751953125, 58.2958984375, 60.571044921875, 62.84619140625, 65.121337890625, 67.396484375, 69.671630859375, 71.94677734375, 74.221923828125, 76.4970703125, 78.772216796875, 81.04736328125, 83.322509765625, 85.59765625, 87.872802734375, 90.14794921875, 92.423095703125, 94.6982421875, 96.973388671875, 99.24853515625, 101.523681640625, 103.798828125, 106.073974609375, 108.34912109375, 110.624267578125, 112.8994140625, 115.174560546875, 117.44970703125, 119.724853515625, 122.0]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 9.0, 15.0, 28.0, 31.0, 68.0, 158.0, 203.0, 205.0, 127.0, 61.0, 35.0, 22.0, 14.0, 7.0, 6.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-278.16131591796875, -271.1591796875, -264.1570739746094, -257.1549377441406, -250.15283203125, -243.1507110595703, -236.14859008789062, -229.14645385742188, -222.14434814453125, -215.14222717285156, -208.14010620117188, -201.1379852294922, -194.1358642578125, -187.1337432861328, -180.13162231445312, -173.12948608398438, -166.1273651123047, -159.125244140625, -152.1231231689453, -145.12100219726562, -138.11888122558594, -131.11676025390625, -124.11463165283203, -117.11251068115234, -110.11038970947266, -103.10826873779297, -96.10614776611328, -89.10401916503906, -82.10189819335938, -75.09977722167969, -68.09765625, -61.09553527832031, -54.09342956542969, -47.09130859375, -40.08918762207031, -33.08706283569336, -26.084941864013672, -19.082820892333984, -12.080696105957031, -5.078575134277344, 1.9235458374023438, 8.925667762756348, 15.927789688110352, 22.929912567138672, 29.93203353881836, 36.93415451049805, 43.936279296875, 50.93840026855469, 57.940521240234375, 64.94264221191406, 71.94476318359375, 78.94688415527344, 85.94900512695312, 92.95112609863281, 99.95325469970703, 106.95537567138672, 113.9574966430664, 120.9596176147461, 127.96173858642578, 134.9638671875, 141.9659881591797, 148.96810913085938, 155.97023010253906, 162.97235107421875, 169.97447204589844]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 11.0, 11.0, 20.0, 37.0, 49.0, 51.0, 64.0, 103.0, 86.0, 115.0, 81.0, 96.0, 72.0, 61.0, 41.0, 31.0, 26.0, 19.0, 15.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-202.77987670898438, -197.08584594726562, -191.39181518554688, -185.69778442382812, -180.00375366210938, -174.3097381591797, -168.61570739746094, -162.9216766357422, -157.22764587402344, -151.5336151123047, -145.83958435058594, -140.1455535888672, -134.4515380859375, -128.75750732421875, -123.0634765625, -117.36944580078125, -111.6754150390625, -105.98138427734375, -100.287353515625, -94.59333038330078, -88.89929962158203, -83.20526885986328, -77.51124572753906, -71.81721496582031, -66.12318420410156, -60.42915344238281, -54.73512649536133, -49.041099548339844, -43.347068786621094, -37.653038024902344, -31.95901107788086, -26.264984130859375, -20.570953369140625, -14.876924514770508, -9.18289566040039, -3.4888668060302734, 2.2051620483398438, 7.899190902709961, 13.593219757080078, 19.287246704101562, 24.981277465820312, 30.67530632019043, 36.36933517456055, 42.06336212158203, 47.75739288330078, 53.45142364501953, 59.145450592041016, 64.8394775390625, 70.53350830078125, 76.2275390625, 81.92156982421875, 87.61559295654297, 93.30962371826172, 99.00365447998047, 104.69767761230469, 110.39170837402344, 116.08573913574219, 121.77976989746094, 127.47380065917969, 133.16783142089844, 138.86184692382812, 144.55587768554688, 150.24990844726562, 155.94393920898438, 161.63796997070312]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 1.0, 2.0, 6.0, 10.0, 6.0, 11.0, 20.0, 25.0, 22.0, 33.0, 42.0, 65.0, 114.0, 173.0, 268.0, 467.0, 711.0, 1333.0, 2608.0, 5578.0, 12750.0, 33156.0, 104723.0, 519687.0, 263670.0, 63324.0, 22253.0, 8917.0, 3948.0, 1967.0, 1027.0, 634.0, 338.0, 227.0, 142.0, 87.0, 53.0, 44.0, 28.0, 21.0, 16.0, 8.0, 14.0, 9.0, 6.0, 5.0, 4.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-54.375, -52.76611328125, -51.1572265625, -49.54833984375, -47.939453125, -46.33056640625, -44.7216796875, -43.11279296875, -41.50390625, -39.89501953125, -38.2861328125, -36.67724609375, -35.068359375, -33.45947265625, -31.8505859375, -30.24169921875, -28.6328125, -27.02392578125, -25.4150390625, -23.80615234375, -22.197265625, -20.58837890625, -18.9794921875, -17.37060546875, -15.76171875, -14.15283203125, -12.5439453125, -10.93505859375, -9.326171875, -7.71728515625, -6.1083984375, -4.49951171875, -2.890625, -1.28173828125, 0.3271484375, 1.93603515625, 3.544921875, 5.15380859375, 6.7626953125, 8.37158203125, 9.98046875, 11.58935546875, 13.1982421875, 14.80712890625, 16.416015625, 18.02490234375, 19.6337890625, 21.24267578125, 22.8515625, 24.46044921875, 26.0693359375, 27.67822265625, 29.287109375, 30.89599609375, 32.5048828125, 34.11376953125, 35.72265625, 37.33154296875, 38.9404296875, 40.54931640625, 42.158203125, 43.76708984375, 45.3759765625, 46.98486328125, 48.59375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 11.0, 7.0, 13.0, 16.0, 23.0, 42.0, 41.0, 40.0, 64.0, 56.0, 73.0, 77.0, 93.0, 83.0, 63.0, 63.0, 61.0, 45.0, 42.0, 27.0, 25.0, 10.0, 16.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.9453125, -15.4927978515625, -15.040283203125, -14.5877685546875, -14.13525390625, -13.6827392578125, -13.230224609375, -12.7777099609375, -12.3251953125, -11.8726806640625, -11.420166015625, -10.9676513671875, -10.51513671875, -10.0626220703125, -9.610107421875, -9.1575927734375, -8.705078125, -8.2525634765625, -7.800048828125, -7.3475341796875, -6.89501953125, -6.4425048828125, -5.989990234375, -5.5374755859375, -5.0849609375, -4.6324462890625, -4.179931640625, -3.7274169921875, -3.27490234375, -2.8223876953125, -2.369873046875, -1.9173583984375, -1.46484375, -1.0123291015625, -0.559814453125, -0.1072998046875, 0.34521484375, 0.7977294921875, 1.250244140625, 1.7027587890625, 2.1552734375, 2.6077880859375, 3.060302734375, 3.5128173828125, 3.96533203125, 4.4178466796875, 4.870361328125, 5.3228759765625, 5.775390625, 6.2279052734375, 6.680419921875, 7.1329345703125, 7.58544921875, 8.0379638671875, 8.490478515625, 8.9429931640625, 9.3955078125, 9.8480224609375, 10.300537109375, 10.7530517578125, 11.20556640625, 11.6580810546875, 12.110595703125, 12.5631103515625, 13.015625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 7.0, 9.0, 13.0, 13.0, 34.0, 57.0, 83.0, 177.0, 461.0, 1257.0, 4042.0, 16873.0, 112606.0, 767363.0, 121419.0, 17802.0, 4165.0, 1313.0, 443.0, 170.0, 70.0, 53.0, 28.0, 16.0, 19.0, 9.0, 9.0, 5.0, 5.0, 4.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-74.875, -72.572265625, -70.26953125, -67.966796875, -65.6640625, -63.361328125, -61.05859375, -58.755859375, -56.453125, -54.150390625, -51.84765625, -49.544921875, -47.2421875, -44.939453125, -42.63671875, -40.333984375, -38.03125, -35.728515625, -33.42578125, -31.123046875, -28.8203125, -26.517578125, -24.21484375, -21.912109375, -19.609375, -17.306640625, -15.00390625, -12.701171875, -10.3984375, -8.095703125, -5.79296875, -3.490234375, -1.1875, 1.115234375, 3.41796875, 5.720703125, 8.0234375, 10.326171875, 12.62890625, 14.931640625, 17.234375, 19.537109375, 21.83984375, 24.142578125, 26.4453125, 28.748046875, 31.05078125, 33.353515625, 35.65625, 37.958984375, 40.26171875, 42.564453125, 44.8671875, 47.169921875, 49.47265625, 51.775390625, 54.078125, 56.380859375, 58.68359375, 60.986328125, 63.2890625, 65.591796875, 67.89453125, 70.197265625, 72.5]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 5.0, 14.0, 15.0, 16.0, 21.0, 32.0, 46.0, 42.0, 52.0, 46.0, 62.0, 51.0, 73.0, 73.0, 49.0, 56.0, 46.0, 54.0, 51.0, 44.0, 31.0, 27.0, 15.0, 22.0, 17.0, 8.0, 10.0, 5.0, 6.0, 0.0, 5.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.5625, -48.037109375, -46.51171875, -44.986328125, -43.4609375, -41.935546875, -40.41015625, -38.884765625, -37.359375, -35.833984375, -34.30859375, -32.783203125, -31.2578125, -29.732421875, -28.20703125, -26.681640625, -25.15625, -23.630859375, -22.10546875, -20.580078125, -19.0546875, -17.529296875, -16.00390625, -14.478515625, -12.953125, -11.427734375, -9.90234375, -8.376953125, -6.8515625, -5.326171875, -3.80078125, -2.275390625, -0.75, 0.775390625, 2.30078125, 3.826171875, 5.3515625, 6.876953125, 8.40234375, 9.927734375, 11.453125, 12.978515625, 14.50390625, 16.029296875, 17.5546875, 19.080078125, 20.60546875, 22.130859375, 23.65625, 25.181640625, 26.70703125, 28.232421875, 29.7578125, 31.283203125, 32.80859375, 34.333984375, 35.859375, 37.384765625, 38.91015625, 40.435546875, 41.9609375, 43.486328125, 45.01171875, 46.537109375, 48.0625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 5.0, 4.0, 20.0, 14.0, 29.0, 41.0, 61.0, 104.0, 202.0, 332.0, 614.0, 1149.0, 2233.0, 4513.0, 11476.0, 48392.0, 761116.0, 182590.0, 21752.0, 7171.0, 3242.0, 1558.0, 864.0, 447.0, 255.0, 134.0, 92.0, 54.0, 25.0, 21.0, 10.0, 5.0, 5.0, 7.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-55.59375, -54.0390625, -52.484375, -50.9296875, -49.375, -47.8203125, -46.265625, -44.7109375, -43.15625, -41.6015625, -40.046875, -38.4921875, -36.9375, -35.3828125, -33.828125, -32.2734375, -30.71875, -29.1640625, -27.609375, -26.0546875, -24.5, -22.9453125, -21.390625, -19.8359375, -18.28125, -16.7265625, -15.171875, -13.6171875, -12.0625, -10.5078125, -8.953125, -7.3984375, -5.84375, -4.2890625, -2.734375, -1.1796875, 0.375, 1.9296875, 3.484375, 5.0390625, 6.59375, 8.1484375, 9.703125, 11.2578125, 12.8125, 14.3671875, 15.921875, 17.4765625, 19.03125, 20.5859375, 22.140625, 23.6953125, 25.25, 26.8046875, 28.359375, 29.9140625, 31.46875, 33.0234375, 34.578125, 36.1328125, 37.6875, 39.2421875, 40.796875, 42.3515625, 43.90625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 5.0, 13.0, 20.0, 47.0, 94.0, 264.0, 351.0, 97.0, 45.0, 18.0, 15.0, 7.0, 3.0, 5.0, 6.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01373291015625, -0.013414323329925537, -0.013095736503601074, -0.012777149677276611, -0.012458562850952148, -0.012139976024627686, -0.011821389198303223, -0.01150280237197876, -0.011184215545654297, -0.010865628719329834, -0.010547041893005371, -0.010228455066680908, -0.009909868240356445, -0.009591281414031982, -0.00927269458770752, -0.008954107761383057, -0.008635520935058594, -0.00831693410873413, -0.007998347282409668, -0.007679760456085205, -0.007361173629760742, -0.007042586803436279, -0.006723999977111816, -0.0064054131507873535, -0.006086826324462891, -0.005768239498138428, -0.005449652671813965, -0.005131065845489502, -0.004812479019165039, -0.004493892192840576, -0.004175305366516113, -0.0038567185401916504, -0.0035381317138671875, -0.0032195448875427246, -0.0029009580612182617, -0.002582371234893799, -0.002263784408569336, -0.001945197582244873, -0.0016266107559204102, -0.0013080239295959473, -0.0009894371032714844, -0.0006708502769470215, -0.0003522634506225586, -3.36766242980957e-05, 0.0002849102020263672, 0.0006034970283508301, 0.000922083854675293, 0.0012406706809997559, 0.0015592575073242188, 0.0018778443336486816, 0.0021964311599731445, 0.0025150179862976074, 0.0028336048126220703, 0.003152191638946533, 0.003470778465270996, 0.003789365291595459, 0.004107952117919922, 0.004426538944244385, 0.004745125770568848, 0.0050637125968933105, 0.0053822994232177734, 0.005700886249542236, 0.006019473075866699, 0.006338059902191162, 0.006656646728515625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 8.0, 10.0, 18.0, 30.0, 53.0, 83.0, 159.0, 392.0, 974.0, 3110.0, 15799.0, 907246.0, 110497.0, 7179.0, 1833.0, 636.0, 257.0, 116.0, 65.0, 41.0, 17.0, 7.0, 9.0, 3.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.4375, -73.2236328125, -70.009765625, -66.7958984375, -63.58203125, -60.3681640625, -57.154296875, -53.9404296875, -50.7265625, -47.5126953125, -44.298828125, -41.0849609375, -37.87109375, -34.6572265625, -31.443359375, -28.2294921875, -25.015625, -21.8017578125, -18.587890625, -15.3740234375, -12.16015625, -8.9462890625, -5.732421875, -2.5185546875, 0.6953125, 3.9091796875, 7.123046875, 10.3369140625, 13.55078125, 16.7646484375, 19.978515625, 23.1923828125, 26.40625, 29.6201171875, 32.833984375, 36.0478515625, 39.26171875, 42.4755859375, 45.689453125, 48.9033203125, 52.1171875, 55.3310546875, 58.544921875, 61.7587890625, 64.97265625, 68.1865234375, 71.400390625, 74.6142578125, 77.828125, 81.0419921875, 84.255859375, 87.4697265625, 90.68359375, 93.8974609375, 97.111328125, 100.3251953125, 103.5390625, 106.7529296875, 109.966796875, 113.1806640625, 116.39453125, 119.6083984375, 122.822265625, 126.0361328125, 129.25]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 9.0, 6.0, 10.0, 12.0, 19.0, 29.0, 55.0, 111.0, 252.0, 224.0, 115.0, 85.0, 22.0, 14.0, 8.0, 6.0, 5.0, 2.0, 3.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.375, -33.83056640625, -32.2861328125, -30.74169921875, -29.197265625, -27.65283203125, -26.1083984375, -24.56396484375, -23.01953125, -21.47509765625, -19.9306640625, -18.38623046875, -16.841796875, -15.29736328125, -13.7529296875, -12.20849609375, -10.6640625, -9.11962890625, -7.5751953125, -6.03076171875, -4.486328125, -2.94189453125, -1.3974609375, 0.14697265625, 1.69140625, 3.23583984375, 4.7802734375, 6.32470703125, 7.869140625, 9.41357421875, 10.9580078125, 12.50244140625, 14.046875, 15.59130859375, 17.1357421875, 18.68017578125, 20.224609375, 21.76904296875, 23.3134765625, 24.85791015625, 26.40234375, 27.94677734375, 29.4912109375, 31.03564453125, 32.580078125, 34.12451171875, 35.6689453125, 37.21337890625, 38.7578125, 40.30224609375, 41.8466796875, 43.39111328125, 44.935546875, 46.47998046875, 48.0244140625, 49.56884765625, 51.11328125, 52.65771484375, 54.2021484375, 55.74658203125, 57.291015625, 58.83544921875, 60.3798828125, 61.92431640625, 63.46875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 15.0, 24.0, 62.0, 97.0, 209.0, 266.0, 142.0, 93.0, 54.0, 18.0, 12.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-458.1123046875, -437.78912353515625, -417.4659729003906, -397.142822265625, -376.81964111328125, -356.4964599609375, -336.1733093261719, -315.85015869140625, -295.5269775390625, -275.20379638671875, -254.88064575195312, -234.55747985839844, -214.23431396484375, -193.91114807128906, -173.58798217773438, -153.2648162841797, -132.941650390625, -112.61848449707031, -92.29531860351562, -71.97215270996094, -51.64898681640625, -31.325820922851562, -11.002655029296875, 9.320510864257812, 29.6436767578125, 49.96684265136719, 70.29000854492188, 90.61317443847656, 110.93634033203125, 131.25950622558594, 151.58267211914062, 171.9058380126953, 192.22900390625, 212.5521697998047, 232.87533569335938, 253.19850158691406, 273.52166748046875, 293.8448486328125, 314.1679992675781, 334.49114990234375, 354.8143310546875, 375.13751220703125, 395.4606628417969, 415.7838134765625, 436.10699462890625, 456.43017578125, 476.7533264160156, 497.07647705078125, 517.399658203125, 537.7228393554688, 558.0460205078125, 578.369140625, 598.6923217773438, 619.0155029296875, 639.338623046875, 659.6618041992188, 679.9849853515625, 700.3081665039062, 720.63134765625, 740.9544677734375, 761.2776489257812, 781.600830078125, 801.9239501953125, 822.2471313476562, 842.5703125]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 0.0, 3.0, 3.0, 4.0, 7.0, 7.0, 9.0, 17.0, 11.0, 18.0, 24.0, 22.0, 33.0, 32.0, 37.0, 45.0, 46.0, 35.0, 51.0, 47.0, 46.0, 60.0, 49.0, 41.0, 51.0, 47.0, 36.0, 31.0, 33.0, 23.0, 30.0, 16.0, 14.0, 10.0, 15.0, 10.0, 9.0, 7.0, 6.0, 7.0, 4.0, 2.0, 9.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-246.58033752441406, -239.5565643310547, -232.53277587890625, -225.50900268554688, -218.48521423339844, -211.46144104003906, -204.43765258789062, -197.41387939453125, -190.39010620117188, -183.3663330078125, -176.34254455566406, -169.3187713623047, -162.29498291015625, -155.27120971679688, -148.2474365234375, -141.22364807128906, -134.19985961914062, -127.17607879638672, -120.15229797363281, -113.12852478027344, -106.10474395751953, -99.08096313476562, -92.05718231201172, -85.03340148925781, -78.00962829589844, -70.98584747314453, -63.96207046508789, -56.938289642333984, -49.914512634277344, -42.89073181152344, -35.86695098876953, -28.84317398071289, -21.81939697265625, -14.795618057250977, -7.771838188171387, -0.7480583190917969, 6.275720596313477, 13.29949951171875, 20.323280334472656, 27.347057342529297, 34.3708381652832, 41.39461898803711, 48.41839599609375, 55.442176818847656, 62.46595764160156, 69.48973083496094, 76.51351928710938, 83.53729248046875, 90.56107330322266, 97.58485412597656, 104.60863494873047, 111.63241577148438, 118.65618896484375, 125.67996978759766, 132.70375061035156, 139.72752380371094, 146.75131225585938, 153.77508544921875, 160.7988739013672, 167.82264709472656, 174.846435546875, 181.87020874023438, 188.89398193359375, 195.9177703857422, 202.94154357910156]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 4.0, 9.0, 9.0, 20.0, 26.0, 29.0, 38.0, 51.0, 90.0, 125.0, 164.0, 302.0, 468.0, 872.0, 1614.0, 3113.0, 6470.0, 15188.0, 52160.0, 3589375.0, 466218.0, 34485.0, 12292.0, 5406.0, 2609.0, 1354.0, 741.0, 379.0, 240.0, 131.0, 82.0, 73.0, 36.0, 30.0, 16.0, 21.0, 11.0, 9.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-103.3125, -100.0703125, -96.828125, -93.5859375, -90.34375, -87.1015625, -83.859375, -80.6171875, -77.375, -74.1328125, -70.890625, -67.6484375, -64.40625, -61.1640625, -57.921875, -54.6796875, -51.4375, -48.1953125, -44.953125, -41.7109375, -38.46875, -35.2265625, -31.984375, -28.7421875, -25.5, -22.2578125, -19.015625, -15.7734375, -12.53125, -9.2890625, -6.046875, -2.8046875, 0.4375, 3.6796875, 6.921875, 10.1640625, 13.40625, 16.6484375, 19.890625, 23.1328125, 26.375, 29.6171875, 32.859375, 36.1015625, 39.34375, 42.5859375, 45.828125, 49.0703125, 52.3125, 55.5546875, 58.796875, 62.0390625, 65.28125, 68.5234375, 71.765625, 75.0078125, 78.25, 81.4921875, 84.734375, 87.9765625, 91.21875, 94.4609375, 97.703125, 100.9453125, 104.1875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 8.0, 10.0, 9.0, 13.0, 23.0, 26.0, 33.0, 35.0, 44.0, 56.0, 61.0, 69.0, 83.0, 73.0, 55.0, 69.0, 61.0, 48.0, 43.0, 43.0, 37.0, 33.0, 19.0, 16.0, 13.0, 7.0, 10.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.8515625, -14.42236328125, -13.9931640625, -13.56396484375, -13.134765625, -12.70556640625, -12.2763671875, -11.84716796875, -11.41796875, -10.98876953125, -10.5595703125, -10.13037109375, -9.701171875, -9.27197265625, -8.8427734375, -8.41357421875, -7.984375, -7.55517578125, -7.1259765625, -6.69677734375, -6.267578125, -5.83837890625, -5.4091796875, -4.97998046875, -4.55078125, -4.12158203125, -3.6923828125, -3.26318359375, -2.833984375, -2.40478515625, -1.9755859375, -1.54638671875, -1.1171875, -0.68798828125, -0.2587890625, 0.17041015625, 0.599609375, 1.02880859375, 1.4580078125, 1.88720703125, 2.31640625, 2.74560546875, 3.1748046875, 3.60400390625, 4.033203125, 4.46240234375, 4.8916015625, 5.32080078125, 5.75, 6.17919921875, 6.6083984375, 7.03759765625, 7.466796875, 7.89599609375, 8.3251953125, 8.75439453125, 9.18359375, 9.61279296875, 10.0419921875, 10.47119140625, 10.900390625, 11.32958984375, 11.7587890625, 12.18798828125, 12.6171875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 11.0, 19.0, 46.0, 71.0, 156.0, 350.0, 753.0, 1814.0, 4954.0, 17210.0, 163963.0, 3946743.0, 43580.0, 9340.0, 3059.0, 1193.0, 513.0, 237.0, 124.0, 70.0, 24.0, 18.0, 9.0, 3.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-168.5, -163.435546875, -158.37109375, -153.306640625, -148.2421875, -143.177734375, -138.11328125, -133.048828125, -127.984375, -122.919921875, -117.85546875, -112.791015625, -107.7265625, -102.662109375, -97.59765625, -92.533203125, -87.46875, -82.404296875, -77.33984375, -72.275390625, -67.2109375, -62.146484375, -57.08203125, -52.017578125, -46.953125, -41.888671875, -36.82421875, -31.759765625, -26.6953125, -21.630859375, -16.56640625, -11.501953125, -6.4375, -1.373046875, 3.69140625, 8.755859375, 13.8203125, 18.884765625, 23.94921875, 29.013671875, 34.078125, 39.142578125, 44.20703125, 49.271484375, 54.3359375, 59.400390625, 64.46484375, 69.529296875, 74.59375, 79.658203125, 84.72265625, 89.787109375, 94.8515625, 99.916015625, 104.98046875, 110.044921875, 115.109375, 120.173828125, 125.23828125, 130.302734375, 135.3671875, 140.431640625, 145.49609375, 150.560546875, 155.625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 5.0, 5.0, 11.0, 5.0, 7.0, 10.0, 15.0, 20.0, 19.0, 41.0, 82.0, 261.0, 2248.0, 921.0, 198.0, 76.0, 36.0, 25.0, 11.0, 14.0, 16.0, 11.0, 7.0, 9.0, 8.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.53125, -37.35888671875, -36.1865234375, -35.01416015625, -33.841796875, -32.66943359375, -31.4970703125, -30.32470703125, -29.15234375, -27.97998046875, -26.8076171875, -25.63525390625, -24.462890625, -23.29052734375, -22.1181640625, -20.94580078125, -19.7734375, -18.60107421875, -17.4287109375, -16.25634765625, -15.083984375, -13.91162109375, -12.7392578125, -11.56689453125, -10.39453125, -9.22216796875, -8.0498046875, -6.87744140625, -5.705078125, -4.53271484375, -3.3603515625, -2.18798828125, -1.015625, 0.15673828125, 1.3291015625, 2.50146484375, 3.673828125, 4.84619140625, 6.0185546875, 7.19091796875, 8.36328125, 9.53564453125, 10.7080078125, 11.88037109375, 13.052734375, 14.22509765625, 15.3974609375, 16.56982421875, 17.7421875, 18.91455078125, 20.0869140625, 21.25927734375, 22.431640625, 23.60400390625, 24.7763671875, 25.94873046875, 27.12109375, 28.29345703125, 29.4658203125, 30.63818359375, 31.810546875, 32.98291015625, 34.1552734375, 35.32763671875, 36.5]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 24.0, 107.0, 414.0, 303.0, 94.0, 37.0, 9.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-236.54135131835938, -218.01744079589844, -199.49354553222656, -180.96963500976562, -162.44573974609375, -143.9218292236328, -125.39791870117188, -106.8740234375, -88.35011291503906, -69.82621002197266, -51.302303314208984, -32.77839660644531, -14.254493713378906, 4.2694091796875, 22.793319702148438, 41.31721496582031, 59.84112548828125, 78.36502838134766, 96.88893127441406, 115.412841796875, 133.93673706054688, 152.4606475830078, 170.98455810546875, 189.50845336914062, 208.03236389160156, 226.5562744140625, 245.08016967773438, 263.60406494140625, 282.12799072265625, 300.6518859863281, 319.17578125, 337.69970703125, 356.22357177734375, 374.7474670410156, 393.2713928222656, 411.7952880859375, 430.3191833496094, 448.84307861328125, 467.36700439453125, 485.8908996582031, 504.414794921875, 522.938720703125, 541.4625854492188, 559.9865112304688, 578.5104370117188, 597.0343017578125, 615.5582275390625, 634.0821533203125, 652.6060791015625, 671.1300048828125, 689.6538696289062, 708.1777954101562, 726.7017211914062, 745.2255859375, 763.74951171875, 782.2734375, 800.7973022460938, 819.3212280273438, 837.8450927734375, 856.3690185546875, 874.8929443359375, 893.4168090820312, 911.9407348632812, 930.464599609375, 948.988525390625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 4.0, 3.0, 7.0, 10.0, 28.0, 16.0, 33.0, 24.0, 48.0, 43.0, 46.0, 40.0, 45.0, 51.0, 54.0, 48.0, 59.0, 62.0, 56.0, 37.0, 39.0, 47.0, 44.0, 43.0, 28.0, 17.0, 17.0, 16.0, 16.0, 4.0, 5.0, 6.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-172.2137908935547, -167.89244079589844, -163.57107543945312, -159.24972534179688, -154.92837524414062, -150.60702514648438, -146.28565979003906, -141.9643096923828, -137.6429443359375, -133.32159423828125, -129.00022888183594, -124.67887878417969, -120.35752868652344, -116.03617095947266, -111.71481323242188, -107.39346313476562, -103.07211303710938, -98.7507553100586, -94.42940521240234, -90.10804748535156, -85.78669738769531, -81.46533966064453, -77.14398193359375, -72.8226318359375, -68.50127410888672, -64.17991638183594, -59.85856628417969, -55.537208557128906, -51.21585464477539, -46.894500732421875, -42.573143005371094, -38.25178909301758, -33.930419921875, -29.609066009521484, -25.287710189819336, -20.966354370117188, -16.645000457763672, -12.323646545410156, -8.002290725708008, -3.6809349060058594, 0.6404190063476562, 4.961773872375488, 9.28312873840332, 13.604483604431152, 17.925838470458984, 22.2471923828125, 26.56854820251465, 30.889904022216797, 35.21125793457031, 39.53261184692383, 43.853965759277344, 48.175323486328125, 52.49667739868164, 56.818031311035156, 61.13938903808594, 65.46073913574219, 69.78209686279297, 74.10345458984375, 78.4248046875, 82.74616241455078, 87.06752014160156, 91.38887023925781, 95.7102279663086, 100.03158569335938, 104.35293579101562]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 5.0, 11.0, 10.0, 14.0, 12.0, 24.0, 28.0, 40.0, 55.0, 107.0, 140.0, 210.0, 331.0, 536.0, 953.0, 1539.0, 3003.0, 5571.0, 10883.0, 22691.0, 53146.0, 141974.0, 398074.0, 253634.0, 87339.0, 34821.0, 15926.0, 7960.0, 4097.0, 2189.0, 1290.0, 732.0, 410.0, 258.0, 185.0, 110.0, 77.0, 49.0, 38.0, 26.0, 19.0, 14.0, 9.0, 3.0, 6.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-46.9375, -45.5048828125, -44.072265625, -42.6396484375, -41.20703125, -39.7744140625, -38.341796875, -36.9091796875, -35.4765625, -34.0439453125, -32.611328125, -31.1787109375, -29.74609375, -28.3134765625, -26.880859375, -25.4482421875, -24.015625, -22.5830078125, -21.150390625, -19.7177734375, -18.28515625, -16.8525390625, -15.419921875, -13.9873046875, -12.5546875, -11.1220703125, -9.689453125, -8.2568359375, -6.82421875, -5.3916015625, -3.958984375, -2.5263671875, -1.09375, 0.3388671875, 1.771484375, 3.2041015625, 4.63671875, 6.0693359375, 7.501953125, 8.9345703125, 10.3671875, 11.7998046875, 13.232421875, 14.6650390625, 16.09765625, 17.5302734375, 18.962890625, 20.3955078125, 21.828125, 23.2607421875, 24.693359375, 26.1259765625, 27.55859375, 28.9912109375, 30.423828125, 31.8564453125, 33.2890625, 34.7216796875, 36.154296875, 37.5869140625, 39.01953125, 40.4521484375, 41.884765625, 43.3173828125, 44.75]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 9.0, 9.0, 12.0, 14.0, 22.0, 17.0, 27.0, 39.0, 37.0, 49.0, 60.0, 59.0, 63.0, 58.0, 73.0, 76.0, 49.0, 58.0, 56.0, 42.0, 31.0, 34.0, 29.0, 23.0, 15.0, 12.0, 18.0, 1.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.25, -15.77490234375, -15.2998046875, -14.82470703125, -14.349609375, -13.87451171875, -13.3994140625, -12.92431640625, -12.44921875, -11.97412109375, -11.4990234375, -11.02392578125, -10.548828125, -10.07373046875, -9.5986328125, -9.12353515625, -8.6484375, -8.17333984375, -7.6982421875, -7.22314453125, -6.748046875, -6.27294921875, -5.7978515625, -5.32275390625, -4.84765625, -4.37255859375, -3.8974609375, -3.42236328125, -2.947265625, -2.47216796875, -1.9970703125, -1.52197265625, -1.046875, -0.57177734375, -0.0966796875, 0.37841796875, 0.853515625, 1.32861328125, 1.8037109375, 2.27880859375, 2.75390625, 3.22900390625, 3.7041015625, 4.17919921875, 4.654296875, 5.12939453125, 5.6044921875, 6.07958984375, 6.5546875, 7.02978515625, 7.5048828125, 7.97998046875, 8.455078125, 8.93017578125, 9.4052734375, 9.88037109375, 10.35546875, 10.83056640625, 11.3056640625, 11.78076171875, 12.255859375, 12.73095703125, 13.2060546875, 13.68115234375, 14.15625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 11.0, 9.0, 21.0, 18.0, 30.0, 34.0, 42.0, 58.0, 77.0, 110.0, 162.0, 252.0, 387.0, 682.0, 1458.0, 4233.0, 14744.0, 67656.0, 536393.0, 355211.0, 49335.0, 11322.0, 3322.0, 1219.0, 582.0, 339.0, 236.0, 146.0, 101.0, 89.0, 60.0, 41.0, 31.0, 30.0, 29.0, 14.0, 14.0, 12.0, 10.0, 7.0, 3.0, 6.0, 7.0, 3.0, 2.0, 0.0, 3.0, 2.0], "bins": [-81.8125, -79.46875, -77.125, -74.78125, -72.4375, -70.09375, -67.75, -65.40625, -63.0625, -60.71875, -58.375, -56.03125, -53.6875, -51.34375, -49.0, -46.65625, -44.3125, -41.96875, -39.625, -37.28125, -34.9375, -32.59375, -30.25, -27.90625, -25.5625, -23.21875, -20.875, -18.53125, -16.1875, -13.84375, -11.5, -9.15625, -6.8125, -4.46875, -2.125, 0.21875, 2.5625, 4.90625, 7.25, 9.59375, 11.9375, 14.28125, 16.625, 18.96875, 21.3125, 23.65625, 26.0, 28.34375, 30.6875, 33.03125, 35.375, 37.71875, 40.0625, 42.40625, 44.75, 47.09375, 49.4375, 51.78125, 54.125, 56.46875, 58.8125, 61.15625, 63.5, 65.84375, 68.1875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 6.0, 5.0, 8.0, 16.0, 10.0, 12.0, 14.0, 17.0, 21.0, 22.0, 27.0, 30.0, 28.0, 36.0, 44.0, 36.0, 32.0, 55.0, 41.0, 37.0, 42.0, 58.0, 47.0, 41.0, 36.0, 31.0, 38.0, 22.0, 31.0, 22.0, 18.0, 18.0, 18.0, 18.0, 14.0, 12.0, 13.0, 5.0, 9.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.21875, -44.6357421875, -43.052734375, -41.4697265625, -39.88671875, -38.3037109375, -36.720703125, -35.1376953125, -33.5546875, -31.9716796875, -30.388671875, -28.8056640625, -27.22265625, -25.6396484375, -24.056640625, -22.4736328125, -20.890625, -19.3076171875, -17.724609375, -16.1416015625, -14.55859375, -12.9755859375, -11.392578125, -9.8095703125, -8.2265625, -6.6435546875, -5.060546875, -3.4775390625, -1.89453125, -0.3115234375, 1.271484375, 2.8544921875, 4.4375, 6.0205078125, 7.603515625, 9.1865234375, 10.76953125, 12.3525390625, 13.935546875, 15.5185546875, 17.1015625, 18.6845703125, 20.267578125, 21.8505859375, 23.43359375, 25.0166015625, 26.599609375, 28.1826171875, 29.765625, 31.3486328125, 32.931640625, 34.5146484375, 36.09765625, 37.6806640625, 39.263671875, 40.8466796875, 42.4296875, 44.0126953125, 45.595703125, 47.1787109375, 48.76171875, 50.3447265625, 51.927734375, 53.5107421875, 55.09375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 6.0, 9.0, 10.0, 21.0, 26.0, 41.0, 53.0, 84.0, 98.0, 159.0, 320.0, 465.0, 751.0, 1476.0, 2734.0, 5823.0, 13637.0, 45827.0, 441539.0, 462924.0, 46552.0, 13843.0, 5867.0, 2759.0, 1404.0, 852.0, 467.0, 305.0, 187.0, 97.0, 60.0, 50.0, 32.0, 16.0, 19.0, 7.0, 8.0, 2.0, 9.0, 5.0, 2.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.96875, -36.5087890625, -35.048828125, -33.5888671875, -32.12890625, -30.6689453125, -29.208984375, -27.7490234375, -26.2890625, -24.8291015625, -23.369140625, -21.9091796875, -20.44921875, -18.9892578125, -17.529296875, -16.0693359375, -14.609375, -13.1494140625, -11.689453125, -10.2294921875, -8.76953125, -7.3095703125, -5.849609375, -4.3896484375, -2.9296875, -1.4697265625, -0.009765625, 1.4501953125, 2.91015625, 4.3701171875, 5.830078125, 7.2900390625, 8.75, 10.2099609375, 11.669921875, 13.1298828125, 14.58984375, 16.0498046875, 17.509765625, 18.9697265625, 20.4296875, 21.8896484375, 23.349609375, 24.8095703125, 26.26953125, 27.7294921875, 29.189453125, 30.6494140625, 32.109375, 33.5693359375, 35.029296875, 36.4892578125, 37.94921875, 39.4091796875, 40.869140625, 42.3291015625, 43.7890625, 45.2490234375, 46.708984375, 48.1689453125, 49.62890625, 51.0888671875, 52.548828125, 54.0087890625, 55.46875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 6.0, 4.0, 6.0, 10.0, 17.0, 14.0, 19.0, 35.0, 56.0, 99.0, 244.0, 208.0, 114.0, 47.0, 40.0, 21.0, 20.0, 10.0, 10.0, 5.0, 2.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00836181640625, -0.008082389831542969, -0.0078029632568359375, -0.007523536682128906, -0.007244110107421875, -0.006964683532714844, -0.0066852569580078125, -0.006405830383300781, -0.00612640380859375, -0.005846977233886719, -0.0055675506591796875, -0.005288124084472656, -0.005008697509765625, -0.004729270935058594, -0.0044498443603515625, -0.004170417785644531, -0.0038909912109375, -0.0036115646362304688, -0.0033321380615234375, -0.0030527114868164062, -0.002773284912109375, -0.0024938583374023438, -0.0022144317626953125, -0.0019350051879882812, -0.00165557861328125, -0.0013761520385742188, -0.0010967254638671875, -0.0008172988891601562, -0.000537872314453125, -0.00025844573974609375, 2.09808349609375e-05, 0.00030040740966796875, 0.000579833984375, 0.0008592605590820312, 0.0011386871337890625, 0.0014181137084960938, 0.001697540283203125, 0.0019769668579101562, 0.0022563934326171875, 0.0025358200073242188, 0.00281524658203125, 0.0030946731567382812, 0.0033740997314453125, 0.0036535263061523438, 0.003932952880859375, 0.004212379455566406, 0.0044918060302734375, 0.004771232604980469, 0.0050506591796875, 0.005330085754394531, 0.0056095123291015625, 0.005888938903808594, 0.006168365478515625, 0.006447792053222656, 0.0067272186279296875, 0.007006645202636719, 0.00728607177734375, 0.007565498352050781, 0.007844924926757812, 0.008124351501464844, 0.008403778076171875, 0.008683204650878906, 0.008962631225585938, 0.009242057800292969, 0.009521484375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 5.0, 3.0, 4.0, 7.0, 6.0, 9.0, 13.0, 14.0, 27.0, 40.0, 55.0, 128.0, 206.0, 418.0, 913.0, 2492.0, 9473.0, 85730.0, 902411.0, 37287.0, 5975.0, 1790.0, 731.0, 339.0, 185.0, 102.0, 64.0, 37.0, 27.0, 16.0, 16.0, 8.0, 8.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-95.6875, -92.3125, -88.9375, -85.5625, -82.1875, -78.8125, -75.4375, -72.0625, -68.6875, -65.3125, -61.9375, -58.5625, -55.1875, -51.8125, -48.4375, -45.0625, -41.6875, -38.3125, -34.9375, -31.5625, -28.1875, -24.8125, -21.4375, -18.0625, -14.6875, -11.3125, -7.9375, -4.5625, -1.1875, 2.1875, 5.5625, 8.9375, 12.3125, 15.6875, 19.0625, 22.4375, 25.8125, 29.1875, 32.5625, 35.9375, 39.3125, 42.6875, 46.0625, 49.4375, 52.8125, 56.1875, 59.5625, 62.9375, 66.3125, 69.6875, 73.0625, 76.4375, 79.8125, 83.1875, 86.5625, 89.9375, 93.3125, 96.6875, 100.0625, 103.4375, 106.8125, 110.1875, 113.5625, 116.9375, 120.3125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 6.0, 7.0, 9.0, 10.0, 18.0, 21.0, 26.0, 51.0, 87.0, 122.0, 174.0, 145.0, 102.0, 58.0, 30.0, 25.0, 21.0, 22.0, 13.0, 9.0, 13.0, 6.0, 1.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-42.78125, -41.1767578125, -39.572265625, -37.9677734375, -36.36328125, -34.7587890625, -33.154296875, -31.5498046875, -29.9453125, -28.3408203125, -26.736328125, -25.1318359375, -23.52734375, -21.9228515625, -20.318359375, -18.7138671875, -17.109375, -15.5048828125, -13.900390625, -12.2958984375, -10.69140625, -9.0869140625, -7.482421875, -5.8779296875, -4.2734375, -2.6689453125, -1.064453125, 0.5400390625, 2.14453125, 3.7490234375, 5.353515625, 6.9580078125, 8.5625, 10.1669921875, 11.771484375, 13.3759765625, 14.98046875, 16.5849609375, 18.189453125, 19.7939453125, 21.3984375, 23.0029296875, 24.607421875, 26.2119140625, 27.81640625, 29.4208984375, 31.025390625, 32.6298828125, 34.234375, 35.8388671875, 37.443359375, 39.0478515625, 40.65234375, 42.2568359375, 43.861328125, 45.4658203125, 47.0703125, 48.6748046875, 50.279296875, 51.8837890625, 53.48828125, 55.0927734375, 56.697265625, 58.3017578125, 59.90625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 8.0, 4.0, 7.0, 20.0, 32.0, 32.0, 42.0, 87.0, 83.0, 132.0, 131.0, 118.0, 99.0, 74.0, 44.0, 29.0, 13.0, 11.0, 14.0, 5.0, 3.0, 1.0, 4.0, 0.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-456.236083984375, -442.46307373046875, -428.6900634765625, -414.91705322265625, -401.14404296875, -387.37103271484375, -373.5980224609375, -359.82501220703125, -346.052001953125, -332.27899169921875, -318.5059814453125, -304.73297119140625, -290.9599609375, -277.18695068359375, -263.4139404296875, -249.64093017578125, -235.86793518066406, -222.0949249267578, -208.32191467285156, -194.5489044189453, -180.77589416503906, -167.00289916992188, -153.22988891601562, -139.45687866210938, -125.6838607788086, -111.91085052490234, -98.1378402709961, -84.36483764648438, -70.59182739257812, -56.818817138671875, -43.045806884765625, -29.272796630859375, -15.499786376953125, -1.7267770767211914, 12.046232223510742, 25.81924057006836, 39.59225082397461, 53.365257263183594, 67.13826751708984, 80.9112777709961, 94.68428802490234, 108.4572982788086, 122.23030853271484, 136.00331115722656, 149.7763214111328, 163.54933166503906, 177.3223419189453, 191.09535217285156, 204.8683624267578, 218.64137268066406, 232.4143829345703, 246.18739318847656, 259.96038818359375, 273.7333984375, 287.50640869140625, 301.2794189453125, 315.05242919921875, 328.825439453125, 342.59844970703125, 356.3714599609375, 370.14447021484375, 383.91748046875, 397.69049072265625, 411.4635009765625, 425.23651123046875]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 6.0, 9.0, 7.0, 6.0, 5.0, 14.0, 10.0, 16.0, 18.0, 20.0, 25.0, 36.0, 23.0, 40.0, 38.0, 29.0, 32.0, 39.0, 43.0, 44.0, 47.0, 45.0, 47.0, 44.0, 39.0, 31.0, 42.0, 37.0, 19.0, 29.0, 27.0, 21.0, 22.0, 16.0, 15.0, 14.0, 8.0, 11.0, 5.0, 8.0, 8.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-282.01031494140625, -273.06591796875, -264.12152099609375, -255.1771240234375, -246.2327117919922, -237.28831481933594, -228.3439178466797, -219.39952087402344, -210.45510864257812, -201.51071166992188, -192.56631469726562, -183.62191772460938, -174.67750549316406, -165.7331085205078, -156.78871154785156, -147.8443145751953, -138.89991760253906, -129.9555206298828, -121.01111602783203, -112.06671905517578, -103.122314453125, -94.17791748046875, -85.2335205078125, -76.28912353515625, -67.34471893310547, -58.40031814575195, -49.45591735839844, -40.51152038574219, -31.567119598388672, -22.622718811035156, -13.678321838378906, -4.733921051025391, 4.210479736328125, 13.154879570007324, 22.099279403686523, 31.043678283691406, 39.98807907104492, 48.93247985839844, 57.87687683105469, 66.82127380371094, 75.76567840576172, 84.71007537841797, 93.65447998046875, 102.598876953125, 111.54327392578125, 120.48767852783203, 129.43206787109375, 138.37648010253906, 147.3208770751953, 156.26527404785156, 165.2096710205078, 174.15408325195312, 183.09848022460938, 192.04287719726562, 200.98727416992188, 209.93167114257812, 218.87606811523438, 227.82046508789062, 236.76486206054688, 245.70925903320312, 254.65367126464844, 263.59808349609375, 272.54248046875, 281.48687744140625, 290.4312744140625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 9.0, 11.0, 13.0, 15.0, 20.0, 20.0, 47.0, 72.0, 108.0, 163.0, 205.0, 366.0, 609.0, 983.0, 1626.0, 3022.0, 5924.0, 13733.0, 55604.0, 3632983.0, 428131.0, 29861.0, 9972.0, 4615.0, 2537.0, 1416.0, 855.0, 491.0, 334.0, 183.0, 116.0, 77.0, 62.0, 32.0, 17.0, 13.0, 10.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-100.0, -96.953125, -93.90625, -90.859375, -87.8125, -84.765625, -81.71875, -78.671875, -75.625, -72.578125, -69.53125, -66.484375, -63.4375, -60.390625, -57.34375, -54.296875, -51.25, -48.203125, -45.15625, -42.109375, -39.0625, -36.015625, -32.96875, -29.921875, -26.875, -23.828125, -20.78125, -17.734375, -14.6875, -11.640625, -8.59375, -5.546875, -2.5, 0.546875, 3.59375, 6.640625, 9.6875, 12.734375, 15.78125, 18.828125, 21.875, 24.921875, 27.96875, 31.015625, 34.0625, 37.109375, 40.15625, 43.203125, 46.25, 49.296875, 52.34375, 55.390625, 58.4375, 61.484375, 64.53125, 67.578125, 70.625, 73.671875, 76.71875, 79.765625, 82.8125, 85.859375, 88.90625, 91.953125, 95.0]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 9.0, 8.0, 5.0, 14.0, 21.0, 27.0, 24.0, 32.0, 42.0, 38.0, 55.0, 79.0, 64.0, 65.0, 69.0, 71.0, 63.0, 59.0, 45.0, 54.0, 28.0, 32.0, 27.0, 19.0, 15.0, 12.0, 9.0, 7.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.25, -17.731201171875, -17.21240234375, -16.693603515625, -16.1748046875, -15.656005859375, -15.13720703125, -14.618408203125, -14.099609375, -13.580810546875, -13.06201171875, -12.543212890625, -12.0244140625, -11.505615234375, -10.98681640625, -10.468017578125, -9.94921875, -9.430419921875, -8.91162109375, -8.392822265625, -7.8740234375, -7.355224609375, -6.83642578125, -6.317626953125, -5.798828125, -5.280029296875, -4.76123046875, -4.242431640625, -3.7236328125, -3.204833984375, -2.68603515625, -2.167236328125, -1.6484375, -1.129638671875, -0.61083984375, -0.092041015625, 0.4267578125, 0.945556640625, 1.46435546875, 1.983154296875, 2.501953125, 3.020751953125, 3.53955078125, 4.058349609375, 4.5771484375, 5.095947265625, 5.61474609375, 6.133544921875, 6.65234375, 7.171142578125, 7.68994140625, 8.208740234375, 8.7275390625, 9.246337890625, 9.76513671875, 10.283935546875, 10.802734375, 11.321533203125, 11.84033203125, 12.359130859375, 12.8779296875, 13.396728515625, 13.91552734375, 14.434326171875, 14.953125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 9.0, 7.0, 14.0, 30.0, 44.0, 71.0, 125.0, 223.0, 382.0, 768.0, 1509.0, 3364.0, 8506.0, 28440.0, 408813.0, 3673988.0, 47244.0, 11997.0, 4470.0, 2066.0, 1024.0, 532.0, 251.0, 174.0, 99.0, 55.0, 36.0, 15.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-142.25, -137.826171875, -133.40234375, -128.978515625, -124.5546875, -120.130859375, -115.70703125, -111.283203125, -106.859375, -102.435546875, -98.01171875, -93.587890625, -89.1640625, -84.740234375, -80.31640625, -75.892578125, -71.46875, -67.044921875, -62.62109375, -58.197265625, -53.7734375, -49.349609375, -44.92578125, -40.501953125, -36.078125, -31.654296875, -27.23046875, -22.806640625, -18.3828125, -13.958984375, -9.53515625, -5.111328125, -0.6875, 3.736328125, 8.16015625, 12.583984375, 17.0078125, 21.431640625, 25.85546875, 30.279296875, 34.703125, 39.126953125, 43.55078125, 47.974609375, 52.3984375, 56.822265625, 61.24609375, 65.669921875, 70.09375, 74.517578125, 78.94140625, 83.365234375, 87.7890625, 92.212890625, 96.63671875, 101.060546875, 105.484375, 109.908203125, 114.33203125, 118.755859375, 123.1796875, 127.603515625, 132.02734375, 136.451171875, 140.875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 5.0, 2.0, 5.0, 11.0, 7.0, 9.0, 9.0, 12.0, 15.0, 21.0, 24.0, 41.0, 78.0, 164.0, 630.0, 2312.0, 405.0, 121.0, 70.0, 40.0, 19.0, 18.0, 11.0, 10.0, 11.0, 4.0, 3.0, 1.0, 4.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.96875, -43.43798828125, -41.9072265625, -40.37646484375, -38.845703125, -37.31494140625, -35.7841796875, -34.25341796875, -32.72265625, -31.19189453125, -29.6611328125, -28.13037109375, -26.599609375, -25.06884765625, -23.5380859375, -22.00732421875, -20.4765625, -18.94580078125, -17.4150390625, -15.88427734375, -14.353515625, -12.82275390625, -11.2919921875, -9.76123046875, -8.23046875, -6.69970703125, -5.1689453125, -3.63818359375, -2.107421875, -0.57666015625, 0.9541015625, 2.48486328125, 4.015625, 5.54638671875, 7.0771484375, 8.60791015625, 10.138671875, 11.66943359375, 13.2001953125, 14.73095703125, 16.26171875, 17.79248046875, 19.3232421875, 20.85400390625, 22.384765625, 23.91552734375, 25.4462890625, 26.97705078125, 28.5078125, 30.03857421875, 31.5693359375, 33.10009765625, 34.630859375, 36.16162109375, 37.6923828125, 39.22314453125, 40.75390625, 42.28466796875, 43.8154296875, 45.34619140625, 46.876953125, 48.40771484375, 49.9384765625, 51.46923828125, 53.0]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 18.0, 38.0, 111.0, 315.0, 369.0, 105.0, 30.0, 9.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-893.8897705078125, -867.6461181640625, -841.4025268554688, -815.1588745117188, -788.915283203125, -762.671630859375, -736.427978515625, -710.184326171875, -683.9407348632812, -657.6970825195312, -631.4534912109375, -605.2098388671875, -578.9661865234375, -552.7225952148438, -526.4789428710938, -500.2353210449219, -473.99169921875, -447.7480773925781, -421.50445556640625, -395.26080322265625, -369.0171813964844, -342.7735595703125, -316.5299072265625, -290.2862854003906, -264.04266357421875, -237.79904174804688, -211.55540466308594, -185.311767578125, -159.06814575195312, -132.82452392578125, -106.58088684082031, -80.33724975585938, -54.09368896484375, -27.850059509277344, -1.6064300537109375, 24.63719940185547, 50.880828857421875, 77.12445068359375, 103.36808776855469, 129.61172485351562, 155.8553466796875, 182.09896850585938, 208.3426055908203, 234.58624267578125, 260.8298645019531, 287.073486328125, 313.317138671875, 339.5607604980469, 365.80438232421875, 392.0480041503906, 418.2916259765625, 444.5352783203125, 470.7789001464844, 497.02252197265625, 523.2661743164062, 549.509765625, 575.75341796875, 601.9970703125, 628.2406616210938, 654.4843139648438, 680.7279052734375, 706.9715576171875, 733.2152099609375, 759.4588623046875, 785.7024536132812]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 4.0, 1.0, 4.0, 4.0, 10.0, 6.0, 12.0, 11.0, 21.0, 18.0, 9.0, 33.0, 33.0, 33.0, 36.0, 31.0, 36.0, 46.0, 33.0, 46.0, 50.0, 48.0, 33.0, 50.0, 49.0, 35.0, 31.0, 44.0, 40.0, 32.0, 37.0, 14.0, 22.0, 19.0, 17.0, 19.0, 10.0, 5.0, 9.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-171.67056274414062, -166.81753540039062, -161.96449279785156, -157.11146545410156, -152.2584228515625, -147.4053955078125, -142.55235290527344, -137.69932556152344, -132.84628295898438, -127.99324798583984, -123.14021301269531, -118.28717803955078, -113.43414306640625, -108.58111572265625, -103.72808074951172, -98.87504577636719, -94.02201843261719, -89.16898345947266, -84.31594848632812, -79.4629135131836, -74.60987854003906, -69.75685119628906, -64.90381622314453, -60.05078125, -55.19774627685547, -50.34471130371094, -45.491676330566406, -40.63864517211914, -35.78561019897461, -30.932575225830078, -26.07954216003418, -21.22650909423828, -16.373458862304688, -11.520424842834473, -6.667390823364258, -1.814356803894043, 3.038677215576172, 7.891712188720703, 12.744745254516602, 17.5977783203125, 22.45081329345703, 27.303848266601562, 32.156883239746094, 37.00991439819336, 41.86294937133789, 46.71598434448242, 51.56901550292969, 56.42205047607422, 61.27508544921875, 66.12812042236328, 70.98115539550781, 75.83419036865234, 80.68722534179688, 85.54025268554688, 90.3932876586914, 95.24632263183594, 100.09935760498047, 104.952392578125, 109.80542755126953, 114.65846252441406, 119.51148986816406, 124.36453247070312, 129.21755981445312, 134.07058715820312, 138.9236297607422]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 9.0, 17.0, 16.0, 18.0, 25.0, 38.0, 61.0, 100.0, 161.0, 254.0, 391.0, 630.0, 1065.0, 1775.0, 3145.0, 5723.0, 11104.0, 22190.0, 48791.0, 122635.0, 305707.0, 305559.0, 123463.0, 48741.0, 22274.0, 11390.0, 5763.0, 3034.0, 1788.0, 1021.0, 604.0, 416.0, 215.0, 145.0, 87.0, 65.0, 42.0, 27.0, 23.0, 17.0, 8.0, 5.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-49.46875, -47.9697265625, -46.470703125, -44.9716796875, -43.47265625, -41.9736328125, -40.474609375, -38.9755859375, -37.4765625, -35.9775390625, -34.478515625, -32.9794921875, -31.48046875, -29.9814453125, -28.482421875, -26.9833984375, -25.484375, -23.9853515625, -22.486328125, -20.9873046875, -19.48828125, -17.9892578125, -16.490234375, -14.9912109375, -13.4921875, -11.9931640625, -10.494140625, -8.9951171875, -7.49609375, -5.9970703125, -4.498046875, -2.9990234375, -1.5, -0.0009765625, 1.498046875, 2.9970703125, 4.49609375, 5.9951171875, 7.494140625, 8.9931640625, 10.4921875, 11.9912109375, 13.490234375, 14.9892578125, 16.48828125, 17.9873046875, 19.486328125, 20.9853515625, 22.484375, 23.9833984375, 25.482421875, 26.9814453125, 28.48046875, 29.9794921875, 31.478515625, 32.9775390625, 34.4765625, 35.9755859375, 37.474609375, 38.9736328125, 40.47265625, 41.9716796875, 43.470703125, 44.9697265625, 46.46875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 7.0, 4.0, 8.0, 12.0, 27.0, 18.0, 28.0, 27.0, 41.0, 32.0, 38.0, 58.0, 47.0, 47.0, 56.0, 37.0, 54.0, 65.0, 59.0, 50.0, 39.0, 46.0, 37.0, 23.0, 24.0, 30.0, 25.0, 21.0, 16.0, 6.0, 7.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.640625, -16.1328125, -15.625, -15.1171875, -14.609375, -14.1015625, -13.59375, -13.0859375, -12.578125, -12.0703125, -11.5625, -11.0546875, -10.546875, -10.0390625, -9.53125, -9.0234375, -8.515625, -8.0078125, -7.5, -6.9921875, -6.484375, -5.9765625, -5.46875, -4.9609375, -4.453125, -3.9453125, -3.4375, -2.9296875, -2.421875, -1.9140625, -1.40625, -0.8984375, -0.390625, 0.1171875, 0.625, 1.1328125, 1.640625, 2.1484375, 2.65625, 3.1640625, 3.671875, 4.1796875, 4.6875, 5.1953125, 5.703125, 6.2109375, 6.71875, 7.2265625, 7.734375, 8.2421875, 8.75, 9.2578125, 9.765625, 10.2734375, 10.78125, 11.2890625, 11.796875, 12.3046875, 12.8125, 13.3203125, 13.828125, 14.3359375, 14.84375, 15.3515625, 15.859375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 3.0, 4.0, 5.0, 9.0, 15.0, 27.0, 21.0, 46.0, 56.0, 73.0, 136.0, 218.0, 313.0, 542.0, 1228.0, 3201.0, 13654.0, 105863.0, 755984.0, 143542.0, 17020.0, 3681.0, 1309.0, 625.0, 359.0, 208.0, 115.0, 91.0, 59.0, 37.0, 32.0, 24.0, 17.0, 11.0, 8.0, 5.0, 10.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-117.4375, -113.5947265625, -109.751953125, -105.9091796875, -102.06640625, -98.2236328125, -94.380859375, -90.5380859375, -86.6953125, -82.8525390625, -79.009765625, -75.1669921875, -71.32421875, -67.4814453125, -63.638671875, -59.7958984375, -55.953125, -52.1103515625, -48.267578125, -44.4248046875, -40.58203125, -36.7392578125, -32.896484375, -29.0537109375, -25.2109375, -21.3681640625, -17.525390625, -13.6826171875, -9.83984375, -5.9970703125, -2.154296875, 1.6884765625, 5.53125, 9.3740234375, 13.216796875, 17.0595703125, 20.90234375, 24.7451171875, 28.587890625, 32.4306640625, 36.2734375, 40.1162109375, 43.958984375, 47.8017578125, 51.64453125, 55.4873046875, 59.330078125, 63.1728515625, 67.015625, 70.8583984375, 74.701171875, 78.5439453125, 82.38671875, 86.2294921875, 90.072265625, 93.9150390625, 97.7578125, 101.6005859375, 105.443359375, 109.2861328125, 113.12890625, 116.9716796875, 120.814453125, 124.6572265625, 128.5]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 4.0, 2.0, 8.0, 2.0, 12.0, 11.0, 18.0, 15.0, 20.0, 20.0, 19.0, 23.0, 34.0, 44.0, 31.0, 44.0, 52.0, 51.0, 40.0, 46.0, 41.0, 52.0, 42.0, 57.0, 37.0, 34.0, 31.0, 42.0, 25.0, 26.0, 22.0, 19.0, 20.0, 14.0, 11.0, 8.0, 7.0, 9.0, 4.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.1875, -62.9384765625, -60.689453125, -58.4404296875, -56.19140625, -53.9423828125, -51.693359375, -49.4443359375, -47.1953125, -44.9462890625, -42.697265625, -40.4482421875, -38.19921875, -35.9501953125, -33.701171875, -31.4521484375, -29.203125, -26.9541015625, -24.705078125, -22.4560546875, -20.20703125, -17.9580078125, -15.708984375, -13.4599609375, -11.2109375, -8.9619140625, -6.712890625, -4.4638671875, -2.21484375, 0.0341796875, 2.283203125, 4.5322265625, 6.78125, 9.0302734375, 11.279296875, 13.5283203125, 15.77734375, 18.0263671875, 20.275390625, 22.5244140625, 24.7734375, 27.0224609375, 29.271484375, 31.5205078125, 33.76953125, 36.0185546875, 38.267578125, 40.5166015625, 42.765625, 45.0146484375, 47.263671875, 49.5126953125, 51.76171875, 54.0107421875, 56.259765625, 58.5087890625, 60.7578125, 63.0068359375, 65.255859375, 67.5048828125, 69.75390625, 72.0029296875, 74.251953125, 76.5009765625, 78.75]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 12.0, 8.0, 22.0, 20.0, 39.0, 54.0, 59.0, 114.0, 149.0, 261.0, 426.0, 647.0, 1296.0, 2711.0, 6195.0, 17941.0, 70297.0, 585568.0, 298627.0, 42492.0, 12363.0, 4712.0, 2005.0, 1042.0, 530.0, 357.0, 207.0, 119.0, 99.0, 50.0, 43.0, 25.0, 17.0, 13.0, 11.0, 7.0, 3.0, 2.0, 1.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-69.0, -67.07470703125, -65.1494140625, -63.22412109375, -61.298828125, -59.37353515625, -57.4482421875, -55.52294921875, -53.59765625, -51.67236328125, -49.7470703125, -47.82177734375, -45.896484375, -43.97119140625, -42.0458984375, -40.12060546875, -38.1953125, -36.27001953125, -34.3447265625, -32.41943359375, -30.494140625, -28.56884765625, -26.6435546875, -24.71826171875, -22.79296875, -20.86767578125, -18.9423828125, -17.01708984375, -15.091796875, -13.16650390625, -11.2412109375, -9.31591796875, -7.390625, -5.46533203125, -3.5400390625, -1.61474609375, 0.310546875, 2.23583984375, 4.1611328125, 6.08642578125, 8.01171875, 9.93701171875, 11.8623046875, 13.78759765625, 15.712890625, 17.63818359375, 19.5634765625, 21.48876953125, 23.4140625, 25.33935546875, 27.2646484375, 29.18994140625, 31.115234375, 33.04052734375, 34.9658203125, 36.89111328125, 38.81640625, 40.74169921875, 42.6669921875, 44.59228515625, 46.517578125, 48.44287109375, 50.3681640625, 52.29345703125, 54.21875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 4.0, 2.0, 12.0, 17.0, 24.0, 62.0, 86.0, 174.0, 264.0, 165.0, 59.0, 49.0, 24.0, 20.0, 14.0, 6.0, 7.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0156097412109375, -0.015169739723205566, -0.014729738235473633, -0.0142897367477417, -0.013849735260009766, -0.013409733772277832, -0.012969732284545898, -0.012529730796813965, -0.012089729309082031, -0.011649727821350098, -0.011209726333618164, -0.01076972484588623, -0.010329723358154297, -0.009889721870422363, -0.00944972038269043, -0.009009718894958496, -0.008569717407226562, -0.008129715919494629, -0.007689714431762695, -0.007249712944030762, -0.006809711456298828, -0.0063697099685668945, -0.005929708480834961, -0.005489706993103027, -0.005049705505371094, -0.00460970401763916, -0.0041697025299072266, -0.003729701042175293, -0.0032896995544433594, -0.0028496980667114258, -0.002409696578979492, -0.0019696950912475586, -0.001529693603515625, -0.0010896921157836914, -0.0006496906280517578, -0.00020968914031982422, 0.00023031234741210938, 0.000670313835144043, 0.0011103153228759766, 0.0015503168106079102, 0.0019903182983398438, 0.0024303197860717773, 0.002870321273803711, 0.0033103227615356445, 0.003750324249267578, 0.004190325736999512, 0.004630327224731445, 0.005070328712463379, 0.0055103302001953125, 0.005950331687927246, 0.00639033317565918, 0.006830334663391113, 0.007270336151123047, 0.0077103376388549805, 0.008150339126586914, 0.008590340614318848, 0.009030342102050781, 0.009470343589782715, 0.009910345077514648, 0.010350346565246582, 0.010790348052978516, 0.01123034954071045, 0.011670351028442383, 0.012110352516174316, 0.01255035400390625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 2.0, 2.0, 6.0, 3.0, 3.0, 5.0, 8.0, 14.0, 21.0, 26.0, 30.0, 54.0, 95.0, 111.0, 179.0, 371.0, 766.0, 1731.0, 5024.0, 18848.0, 154179.0, 785690.0, 63602.0, 11503.0, 3481.0, 1359.0, 572.0, 327.0, 209.0, 97.0, 71.0, 35.0, 44.0, 29.0, 15.0, 13.0, 5.0, 7.0, 7.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0], "bins": [-100.375, -97.6123046875, -94.849609375, -92.0869140625, -89.32421875, -86.5615234375, -83.798828125, -81.0361328125, -78.2734375, -75.5107421875, -72.748046875, -69.9853515625, -67.22265625, -64.4599609375, -61.697265625, -58.9345703125, -56.171875, -53.4091796875, -50.646484375, -47.8837890625, -45.12109375, -42.3583984375, -39.595703125, -36.8330078125, -34.0703125, -31.3076171875, -28.544921875, -25.7822265625, -23.01953125, -20.2568359375, -17.494140625, -14.7314453125, -11.96875, -9.2060546875, -6.443359375, -3.6806640625, -0.91796875, 1.8447265625, 4.607421875, 7.3701171875, 10.1328125, 12.8955078125, 15.658203125, 18.4208984375, 21.18359375, 23.9462890625, 26.708984375, 29.4716796875, 32.234375, 34.9970703125, 37.759765625, 40.5224609375, 43.28515625, 46.0478515625, 48.810546875, 51.5732421875, 54.3359375, 57.0986328125, 59.861328125, 62.6240234375, 65.38671875, 68.1494140625, 70.912109375, 73.6748046875, 76.4375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 6.0, 1.0, 12.0, 8.0, 6.0, 8.0, 10.0, 24.0, 39.0, 43.0, 78.0, 100.0, 90.0, 122.0, 110.0, 93.0, 94.0, 43.0, 29.0, 30.0, 10.0, 10.0, 9.0, 7.0, 13.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-63.25, -61.552734375, -59.85546875, -58.158203125, -56.4609375, -54.763671875, -53.06640625, -51.369140625, -49.671875, -47.974609375, -46.27734375, -44.580078125, -42.8828125, -41.185546875, -39.48828125, -37.791015625, -36.09375, -34.396484375, -32.69921875, -31.001953125, -29.3046875, -27.607421875, -25.91015625, -24.212890625, -22.515625, -20.818359375, -19.12109375, -17.423828125, -15.7265625, -14.029296875, -12.33203125, -10.634765625, -8.9375, -7.240234375, -5.54296875, -3.845703125, -2.1484375, -0.451171875, 1.24609375, 2.943359375, 4.640625, 6.337890625, 8.03515625, 9.732421875, 11.4296875, 13.126953125, 14.82421875, 16.521484375, 18.21875, 19.916015625, 21.61328125, 23.310546875, 25.0078125, 26.705078125, 28.40234375, 30.099609375, 31.796875, 33.494140625, 35.19140625, 36.888671875, 38.5859375, 40.283203125, 41.98046875, 43.677734375, 45.375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 16.0, 43.0, 121.0, 275.0, 285.0, 150.0, 63.0, 25.0, 8.0, 9.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2168.21337890625, -2124.948486328125, -2081.68359375, -2038.4185791015625, -1995.1536865234375, -1951.8887939453125, -1908.623779296875, -1865.35888671875, -1822.093994140625, -1778.8291015625, -1735.564208984375, -1692.2991943359375, -1649.0343017578125, -1605.7694091796875, -1562.50439453125, -1519.239501953125, -1475.974609375, -1432.709716796875, -1389.44482421875, -1346.1798095703125, -1302.9149169921875, -1259.6500244140625, -1216.385009765625, -1173.1201171875, -1129.855224609375, -1086.59033203125, -1043.325439453125, -1000.0604248046875, -956.7955322265625, -913.5306396484375, -870.2656860351562, -827.000732421875, -783.7359008789062, -740.470947265625, -697.2060546875, -653.941162109375, -610.6762084960938, -567.4112548828125, -524.1463623046875, -480.8814392089844, -437.61651611328125, -394.3515930175781, -351.086669921875, -307.8217468261719, -264.55682373046875, -221.29190063476562, -178.0269775390625, -134.76205444335938, -91.49713134765625, -48.232208251953125, -4.96728515625, 38.297637939453125, 81.56256103515625, 124.82748413085938, 168.0924072265625, 211.35733032226562, 254.62225341796875, 297.8871765136719, 341.152099609375, 384.4170227050781, 427.68194580078125, 470.9468688964844, 514.2117919921875, 557.4766845703125, 600.7416381835938]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 3.0, 7.0, 8.0, 11.0, 12.0, 8.0, 17.0, 10.0, 21.0, 20.0, 22.0, 24.0, 27.0, 28.0, 32.0, 30.0, 28.0, 28.0, 52.0, 34.0, 45.0, 47.0, 45.0, 34.0, 29.0, 45.0, 45.0, 35.0, 20.0, 29.0, 32.0, 25.0, 19.0, 21.0, 11.0, 19.0, 19.0, 14.0, 6.0, 9.0, 6.0, 2.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-337.964599609375, -328.0608825683594, -318.1571350097656, -308.25341796875, -298.34967041015625, -288.4459533691406, -278.5422058105469, -268.63848876953125, -258.7347412109375, -248.8310089111328, -238.92727661132812, -229.02354431152344, -219.11981201171875, -209.21609497070312, -199.31236267089844, -189.40863037109375, -179.50491333007812, -169.60118103027344, -159.69744873046875, -149.79371643066406, -139.88998413085938, -129.98626708984375, -120.08253479003906, -110.17880249023438, -100.27507019042969, -90.371337890625, -80.46760559082031, -70.56388092041016, -60.66014862060547, -50.75641632080078, -40.85268783569336, -30.948959350585938, -21.045257568359375, -11.14152717590332, -1.2377967834472656, 8.665933609008789, 18.569664001464844, 28.47339630126953, 38.37712478637695, 48.280853271484375, 58.18458557128906, 68.08831787109375, 77.99205017089844, 87.8957748413086, 97.79950714111328, 107.70323944091797, 117.60696411132812, 127.51069641113281, 137.4144287109375, 147.3181610107422, 157.22189331054688, 167.12562561035156, 177.02935791015625, 186.93307495117188, 196.83680725097656, 206.74053955078125, 216.64427185058594, 226.54800415039062, 236.4517364501953, 246.35546875, 256.2591857910156, 266.1629333496094, 276.066650390625, 285.97039794921875, 295.8741149902344]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 7.0, 2.0, 13.0, 12.0, 10.0, 17.0, 33.0, 37.0, 40.0, 88.0, 115.0, 164.0, 239.0, 426.0, 721.0, 1445.0, 3626.0, 30516.0, 4139513.0, 11702.0, 2651.0, 1190.0, 659.0, 341.0, 249.0, 145.0, 85.0, 69.0, 47.0, 33.0, 25.0, 11.0, 18.0, 6.0, 11.0, 7.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.75, -142.716796875, -137.68359375, -132.650390625, -127.6171875, -122.583984375, -117.55078125, -112.517578125, -107.484375, -102.451171875, -97.41796875, -92.384765625, -87.3515625, -82.318359375, -77.28515625, -72.251953125, -67.21875, -62.185546875, -57.15234375, -52.119140625, -47.0859375, -42.052734375, -37.01953125, -31.986328125, -26.953125, -21.919921875, -16.88671875, -11.853515625, -6.8203125, -1.787109375, 3.24609375, 8.279296875, 13.3125, 18.345703125, 23.37890625, 28.412109375, 33.4453125, 38.478515625, 43.51171875, 48.544921875, 53.578125, 58.611328125, 63.64453125, 68.677734375, 73.7109375, 78.744140625, 83.77734375, 88.810546875, 93.84375, 98.876953125, 103.91015625, 108.943359375, 113.9765625, 119.009765625, 124.04296875, 129.076171875, 134.109375, 139.142578125, 144.17578125, 149.208984375, 154.2421875, 159.275390625, 164.30859375, 169.341796875, 174.375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 5.0, 13.0, 12.0, 13.0, 17.0, 17.0, 26.0, 24.0, 25.0, 44.0, 39.0, 44.0, 58.0, 47.0, 55.0, 54.0, 64.0, 64.0, 46.0, 57.0, 49.0, 41.0, 31.0, 35.0, 30.0, 17.0, 25.0, 15.0, 8.0, 10.0, 10.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.578125, -17.995361328125, -17.41259765625, -16.829833984375, -16.2470703125, -15.664306640625, -15.08154296875, -14.498779296875, -13.916015625, -13.333251953125, -12.75048828125, -12.167724609375, -11.5849609375, -11.002197265625, -10.41943359375, -9.836669921875, -9.25390625, -8.671142578125, -8.08837890625, -7.505615234375, -6.9228515625, -6.340087890625, -5.75732421875, -5.174560546875, -4.591796875, -4.009033203125, -3.42626953125, -2.843505859375, -2.2607421875, -1.677978515625, -1.09521484375, -0.512451171875, 0.0703125, 0.653076171875, 1.23583984375, 1.818603515625, 2.4013671875, 2.984130859375, 3.56689453125, 4.149658203125, 4.732421875, 5.315185546875, 5.89794921875, 6.480712890625, 7.0634765625, 7.646240234375, 8.22900390625, 8.811767578125, 9.39453125, 9.977294921875, 10.56005859375, 11.142822265625, 11.7255859375, 12.308349609375, 12.89111328125, 13.473876953125, 14.056640625, 14.639404296875, 15.22216796875, 15.804931640625, 16.3876953125, 16.970458984375, 17.55322265625, 18.135986328125, 18.71875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 10.0, 10.0, 14.0, 13.0, 25.0, 37.0, 51.0, 72.0, 123.0, 161.0, 234.0, 337.0, 521.0, 823.0, 1289.0, 2543.0, 8109.0, 3904295.0, 262767.0, 6925.0, 2341.0, 1229.0, 822.0, 511.0, 331.0, 223.0, 137.0, 110.0, 74.0, 42.0, 24.0, 28.0, 16.0, 12.0, 6.0, 11.0, 6.0, 5.0, 0.0, 0.0, 2.0], "bins": [-211.25, -206.0908203125, -200.931640625, -195.7724609375, -190.61328125, -185.4541015625, -180.294921875, -175.1357421875, -169.9765625, -164.8173828125, -159.658203125, -154.4990234375, -149.33984375, -144.1806640625, -139.021484375, -133.8623046875, -128.703125, -123.5439453125, -118.384765625, -113.2255859375, -108.06640625, -102.9072265625, -97.748046875, -92.5888671875, -87.4296875, -82.2705078125, -77.111328125, -71.9521484375, -66.79296875, -61.6337890625, -56.474609375, -51.3154296875, -46.15625, -40.9970703125, -35.837890625, -30.6787109375, -25.51953125, -20.3603515625, -15.201171875, -10.0419921875, -4.8828125, 0.2763671875, 5.435546875, 10.5947265625, 15.75390625, 20.9130859375, 26.072265625, 31.2314453125, 36.390625, 41.5498046875, 46.708984375, 51.8681640625, 57.02734375, 62.1865234375, 67.345703125, 72.5048828125, 77.6640625, 82.8232421875, 87.982421875, 93.1416015625, 98.30078125, 103.4599609375, 108.619140625, 113.7783203125, 118.9375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 10.0, 9.0, 39.0, 3201.0, 756.0, 30.0, 8.0, 8.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-51.90625, -50.751708984375, -49.59716796875, -48.442626953125, -47.2880859375, -46.133544921875, -44.97900390625, -43.824462890625, -42.669921875, -41.515380859375, -40.36083984375, -39.206298828125, -38.0517578125, -36.897216796875, -35.74267578125, -34.588134765625, -33.43359375, -32.279052734375, -31.12451171875, -29.969970703125, -28.8154296875, -27.660888671875, -26.50634765625, -25.351806640625, -24.197265625, -23.042724609375, -21.88818359375, -20.733642578125, -19.5791015625, -18.424560546875, -17.27001953125, -16.115478515625, -14.9609375, -13.806396484375, -12.65185546875, -11.497314453125, -10.3427734375, -9.188232421875, -8.03369140625, -6.879150390625, -5.724609375, -4.570068359375, -3.41552734375, -2.260986328125, -1.1064453125, 0.048095703125, 1.20263671875, 2.357177734375, 3.51171875, 4.666259765625, 5.82080078125, 6.975341796875, 8.1298828125, 9.284423828125, 10.43896484375, 11.593505859375, 12.748046875, 13.902587890625, 15.05712890625, 16.211669921875, 17.3662109375, 18.520751953125, 19.67529296875, 20.829833984375, 21.984375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 7.0, 10.0, 11.0, 15.0, 22.0, 54.0, 106.0, 174.0, 231.0, 169.0, 100.0, 43.0, 23.0, 17.0, 8.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.26759338378906, -62.6895637512207, -59.11153793334961, -55.53350830078125, -51.95547866821289, -48.37744903564453, -44.79942321777344, -41.22139358520508, -37.64336395263672, -34.06533432006836, -30.487306594848633, -26.909278869628906, -23.331249237060547, -19.75322151184082, -16.175193786621094, -12.597164154052734, -9.01913833618164, -5.441109657287598, -1.863081455230713, 1.7149467468261719, 5.292975425720215, 8.871004104614258, 12.449031829833984, 16.027061462402344, 19.60508918762207, 23.183116912841797, 26.761146545410156, 30.339174270629883, 33.91720199584961, 37.49523162841797, 41.07325744628906, 44.65129089355469, 48.22931671142578, 51.80734634399414, 55.385372161865234, 58.963401794433594, 62.54143142700195, 66.11946105957031, 69.6974868774414, 73.2755126953125, 76.85354614257812, 80.43157196044922, 84.00960540771484, 87.58763122558594, 91.16565704345703, 94.74369049072266, 98.32171630859375, 101.89974975585938, 105.47776794433594, 109.05579376220703, 112.63382720947266, 116.21185302734375, 119.78987884521484, 123.36791229248047, 126.94593811035156, 130.5239715576172, 134.1020050048828, 137.68003845214844, 141.258056640625, 144.83609008789062, 148.41412353515625, 151.9921417236328, 155.57017517089844, 159.14820861816406, 162.72622680664062]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 6.0, 8.0, 10.0, 7.0, 9.0, 9.0, 13.0, 24.0, 15.0, 22.0, 23.0, 30.0, 27.0, 44.0, 37.0, 36.0, 37.0, 40.0, 51.0, 46.0, 51.0, 40.0, 45.0, 45.0, 37.0, 28.0, 32.0, 36.0, 30.0, 33.0, 19.0, 18.0, 9.0, 17.0, 14.0, 7.0, 11.0, 12.0, 1.0, 2.0, 7.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.705421447753906, -39.30282211303711, -37.90022659301758, -36.49762725830078, -35.09503173828125, -33.69243240356445, -32.289833068847656, -30.887235641479492, -29.484638214111328, -28.082040786743164, -26.679443359375, -25.276844024658203, -23.87424659729004, -22.471649169921875, -21.069049835205078, -19.666452407836914, -18.26385498046875, -16.861257553100586, -15.458659172058105, -14.056060791015625, -12.653463363647461, -11.250865936279297, -9.848267555236816, -8.445669174194336, -7.043071746826172, -5.64047384262085, -4.237875938415527, -2.835278034210205, -1.4326801300048828, -0.030082225799560547, 1.3725156784057617, 2.775114059448242, 4.177715301513672, 5.580313205718994, 6.982911109924316, 8.385509490966797, 9.788106918334961, 11.190704345703125, 12.593302726745605, 13.995901107788086, 15.39849853515625, 16.801095962524414, 18.203693389892578, 19.606292724609375, 21.00889015197754, 22.411487579345703, 23.8140869140625, 25.216684341430664, 26.619281768798828, 28.021879196166992, 29.424476623535156, 30.827075958251953, 32.22967529296875, 33.63227081298828, 35.03487014770508, 36.437469482421875, 37.840065002441406, 39.2426643371582, 40.645259857177734, 42.04785919189453, 43.45045471191406, 44.85305404663086, 46.255653381347656, 47.65824890136719, 49.060848236083984]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 5.0, 15.0, 16.0, 30.0, 35.0, 55.0, 91.0, 154.0, 242.0, 376.0, 608.0, 932.0, 1700.0, 2998.0, 5155.0, 9493.0, 17936.0, 35655.0, 80488.0, 197834.0, 345518.0, 194885.0, 79317.0, 35554.0, 17644.0, 9480.0, 5213.0, 2902.0, 1666.0, 986.0, 552.0, 352.0, 233.0, 138.0, 118.0, 54.0, 40.0, 29.0, 20.0, 10.0, 11.0, 1.0, 1.0, 6.0, 3.0, 0.0, 1.0, 2.0], "bins": [-49.25, -47.900390625, -46.55078125, -45.201171875, -43.8515625, -42.501953125, -41.15234375, -39.802734375, -38.453125, -37.103515625, -35.75390625, -34.404296875, -33.0546875, -31.705078125, -30.35546875, -29.005859375, -27.65625, -26.306640625, -24.95703125, -23.607421875, -22.2578125, -20.908203125, -19.55859375, -18.208984375, -16.859375, -15.509765625, -14.16015625, -12.810546875, -11.4609375, -10.111328125, -8.76171875, -7.412109375, -6.0625, -4.712890625, -3.36328125, -2.013671875, -0.6640625, 0.685546875, 2.03515625, 3.384765625, 4.734375, 6.083984375, 7.43359375, 8.783203125, 10.1328125, 11.482421875, 12.83203125, 14.181640625, 15.53125, 16.880859375, 18.23046875, 19.580078125, 20.9296875, 22.279296875, 23.62890625, 24.978515625, 26.328125, 27.677734375, 29.02734375, 30.376953125, 31.7265625, 33.076171875, 34.42578125, 35.775390625, 37.125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 1.0, 5.0, 4.0, 5.0, 14.0, 11.0, 16.0, 13.0, 21.0, 22.0, 16.0, 31.0, 38.0, 40.0, 36.0, 38.0, 47.0, 54.0, 49.0, 46.0, 39.0, 50.0, 43.0, 53.0, 38.0, 39.0, 30.0, 32.0, 27.0, 16.0, 23.0, 21.0, 16.0, 12.0, 13.0, 11.0, 6.0, 10.0, 7.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.71875, -17.163330078125, -16.60791015625, -16.052490234375, -15.4970703125, -14.941650390625, -14.38623046875, -13.830810546875, -13.275390625, -12.719970703125, -12.16455078125, -11.609130859375, -11.0537109375, -10.498291015625, -9.94287109375, -9.387451171875, -8.83203125, -8.276611328125, -7.72119140625, -7.165771484375, -6.6103515625, -6.054931640625, -5.49951171875, -4.944091796875, -4.388671875, -3.833251953125, -3.27783203125, -2.722412109375, -2.1669921875, -1.611572265625, -1.05615234375, -0.500732421875, 0.0546875, 0.610107421875, 1.16552734375, 1.720947265625, 2.2763671875, 2.831787109375, 3.38720703125, 3.942626953125, 4.498046875, 5.053466796875, 5.60888671875, 6.164306640625, 6.7197265625, 7.275146484375, 7.83056640625, 8.385986328125, 8.94140625, 9.496826171875, 10.05224609375, 10.607666015625, 11.1630859375, 11.718505859375, 12.27392578125, 12.829345703125, 13.384765625, 13.940185546875, 14.49560546875, 15.051025390625, 15.6064453125, 16.161865234375, 16.71728515625, 17.272705078125, 17.828125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 12.0, 7.0, 13.0, 25.0, 34.0, 44.0, 69.0, 90.0, 134.0, 228.0, 342.0, 547.0, 983.0, 2414.0, 11216.0, 117619.0, 802643.0, 97664.0, 9791.0, 2185.0, 963.0, 558.0, 354.0, 213.0, 126.0, 91.0, 55.0, 40.0, 21.0, 19.0, 20.0, 14.0, 5.0, 4.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-128.375, -124.4208984375, -120.466796875, -116.5126953125, -112.55859375, -108.6044921875, -104.650390625, -100.6962890625, -96.7421875, -92.7880859375, -88.833984375, -84.8798828125, -80.92578125, -76.9716796875, -73.017578125, -69.0634765625, -65.109375, -61.1552734375, -57.201171875, -53.2470703125, -49.29296875, -45.3388671875, -41.384765625, -37.4306640625, -33.4765625, -29.5224609375, -25.568359375, -21.6142578125, -17.66015625, -13.7060546875, -9.751953125, -5.7978515625, -1.84375, 2.1103515625, 6.064453125, 10.0185546875, 13.97265625, 17.9267578125, 21.880859375, 25.8349609375, 29.7890625, 33.7431640625, 37.697265625, 41.6513671875, 45.60546875, 49.5595703125, 53.513671875, 57.4677734375, 61.421875, 65.3759765625, 69.330078125, 73.2841796875, 77.23828125, 81.1923828125, 85.146484375, 89.1005859375, 93.0546875, 97.0087890625, 100.962890625, 104.9169921875, 108.87109375, 112.8251953125, 116.779296875, 120.7333984375, 124.6875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 6.0, 2.0, 4.0, 6.0, 11.0, 9.0, 10.0, 11.0, 9.0, 29.0, 31.0, 41.0, 47.0, 31.0, 48.0, 51.0, 50.0, 47.0, 39.0, 52.0, 56.0, 52.0, 52.0, 41.0, 40.0, 40.0, 41.0, 27.0, 31.0, 20.0, 20.0, 9.0, 12.0, 6.0, 11.0, 3.0, 6.0, 1.0, 1.0, 3.0, 6.0, 0.0, 1.0, 0.0, 1.0], "bins": [-109.0625, -106.23046875, -103.3984375, -100.56640625, -97.734375, -94.90234375, -92.0703125, -89.23828125, -86.40625, -83.57421875, -80.7421875, -77.91015625, -75.078125, -72.24609375, -69.4140625, -66.58203125, -63.75, -60.91796875, -58.0859375, -55.25390625, -52.421875, -49.58984375, -46.7578125, -43.92578125, -41.09375, -38.26171875, -35.4296875, -32.59765625, -29.765625, -26.93359375, -24.1015625, -21.26953125, -18.4375, -15.60546875, -12.7734375, -9.94140625, -7.109375, -4.27734375, -1.4453125, 1.38671875, 4.21875, 7.05078125, 9.8828125, 12.71484375, 15.546875, 18.37890625, 21.2109375, 24.04296875, 26.875, 29.70703125, 32.5390625, 35.37109375, 38.203125, 41.03515625, 43.8671875, 46.69921875, 49.53125, 52.36328125, 55.1953125, 58.02734375, 60.859375, 63.69140625, 66.5234375, 69.35546875, 72.1875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 9.0, 19.0, 19.0, 31.0, 42.0, 62.0, 72.0, 104.0, 175.0, 319.0, 657.0, 1509.0, 3627.0, 10140.0, 40062.0, 392409.0, 532181.0, 48203.0, 11517.0, 4011.0, 1616.0, 789.0, 378.0, 203.0, 149.0, 80.0, 50.0, 42.0, 17.0, 20.0, 11.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-63.84375, -62.0224609375, -60.201171875, -58.3798828125, -56.55859375, -54.7373046875, -52.916015625, -51.0947265625, -49.2734375, -47.4521484375, -45.630859375, -43.8095703125, -41.98828125, -40.1669921875, -38.345703125, -36.5244140625, -34.703125, -32.8818359375, -31.060546875, -29.2392578125, -27.41796875, -25.5966796875, -23.775390625, -21.9541015625, -20.1328125, -18.3115234375, -16.490234375, -14.6689453125, -12.84765625, -11.0263671875, -9.205078125, -7.3837890625, -5.5625, -3.7412109375, -1.919921875, -0.0986328125, 1.72265625, 3.5439453125, 5.365234375, 7.1865234375, 9.0078125, 10.8291015625, 12.650390625, 14.4716796875, 16.29296875, 18.1142578125, 19.935546875, 21.7568359375, 23.578125, 25.3994140625, 27.220703125, 29.0419921875, 30.86328125, 32.6845703125, 34.505859375, 36.3271484375, 38.1484375, 39.9697265625, 41.791015625, 43.6123046875, 45.43359375, 47.2548828125, 49.076171875, 50.8974609375, 52.71875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 9.0, 6.0, 8.0, 20.0, 18.0, 19.0, 39.0, 86.0, 153.0, 180.0, 183.0, 96.0, 52.0, 43.0, 28.0, 17.0, 13.0, 12.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01158905029296875, -0.011264681816101074, -0.010940313339233398, -0.010615944862365723, -0.010291576385498047, -0.009967207908630371, -0.009642839431762695, -0.00931847095489502, -0.008994102478027344, -0.008669734001159668, -0.008345365524291992, -0.008020997047424316, -0.007696628570556641, -0.007372260093688965, -0.007047891616821289, -0.006723523139953613, -0.0063991546630859375, -0.006074786186218262, -0.005750417709350586, -0.00542604923248291, -0.005101680755615234, -0.004777312278747559, -0.004452943801879883, -0.004128575325012207, -0.0038042068481445312, -0.0034798383712768555, -0.0031554698944091797, -0.002831101417541504, -0.002506732940673828, -0.0021823644638061523, -0.0018579959869384766, -0.0015336275100708008, -0.001209259033203125, -0.0008848905563354492, -0.0005605220794677734, -0.00023615360260009766, 8.821487426757812e-05, 0.0004125833511352539, 0.0007369518280029297, 0.0010613203048706055, 0.0013856887817382812, 0.001710057258605957, 0.002034425735473633, 0.0023587942123413086, 0.0026831626892089844, 0.00300753116607666, 0.003331899642944336, 0.0036562681198120117, 0.0039806365966796875, 0.004305005073547363, 0.004629373550415039, 0.004953742027282715, 0.005278110504150391, 0.005602478981018066, 0.005926847457885742, 0.006251215934753418, 0.006575584411621094, 0.0068999528884887695, 0.007224321365356445, 0.007548689842224121, 0.007873058319091797, 0.008197426795959473, 0.008521795272827148, 0.008846163749694824, 0.0091705322265625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 9.0, 6.0, 13.0, 12.0, 16.0, 29.0, 44.0, 58.0, 82.0, 138.0, 208.0, 370.0, 791.0, 1874.0, 5882.0, 28738.0, 447572.0, 521165.0, 31599.0, 6153.0, 1983.0, 773.0, 394.0, 223.0, 131.0, 73.0, 53.0, 50.0, 32.0, 20.0, 16.0, 10.0, 7.0, 9.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-62.84375, -60.51806640625, -58.1923828125, -55.86669921875, -53.541015625, -51.21533203125, -48.8896484375, -46.56396484375, -44.23828125, -41.91259765625, -39.5869140625, -37.26123046875, -34.935546875, -32.60986328125, -30.2841796875, -27.95849609375, -25.6328125, -23.30712890625, -20.9814453125, -18.65576171875, -16.330078125, -14.00439453125, -11.6787109375, -9.35302734375, -7.02734375, -4.70166015625, -2.3759765625, -0.05029296875, 2.275390625, 4.60107421875, 6.9267578125, 9.25244140625, 11.578125, 13.90380859375, 16.2294921875, 18.55517578125, 20.880859375, 23.20654296875, 25.5322265625, 27.85791015625, 30.18359375, 32.50927734375, 34.8349609375, 37.16064453125, 39.486328125, 41.81201171875, 44.1376953125, 46.46337890625, 48.7890625, 51.11474609375, 53.4404296875, 55.76611328125, 58.091796875, 60.41748046875, 62.7431640625, 65.06884765625, 67.39453125, 69.72021484375, 72.0458984375, 74.37158203125, 76.697265625, 79.02294921875, 81.3486328125, 83.67431640625, 86.0]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 7.0, 4.0, 6.0, 7.0, 16.0, 6.0, 10.0, 21.0, 20.0, 34.0, 41.0, 42.0, 81.0, 78.0, 114.0, 90.0, 89.0, 74.0, 53.0, 43.0, 35.0, 37.0, 23.0, 14.0, 16.0, 13.0, 9.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-39.15625, -37.7646484375, -36.373046875, -34.9814453125, -33.58984375, -32.1982421875, -30.806640625, -29.4150390625, -28.0234375, -26.6318359375, -25.240234375, -23.8486328125, -22.45703125, -21.0654296875, -19.673828125, -18.2822265625, -16.890625, -15.4990234375, -14.107421875, -12.7158203125, -11.32421875, -9.9326171875, -8.541015625, -7.1494140625, -5.7578125, -4.3662109375, -2.974609375, -1.5830078125, -0.19140625, 1.2001953125, 2.591796875, 3.9833984375, 5.375, 6.7666015625, 8.158203125, 9.5498046875, 10.94140625, 12.3330078125, 13.724609375, 15.1162109375, 16.5078125, 17.8994140625, 19.291015625, 20.6826171875, 22.07421875, 23.4658203125, 24.857421875, 26.2490234375, 27.640625, 29.0322265625, 30.423828125, 31.8154296875, 33.20703125, 34.5986328125, 35.990234375, 37.3818359375, 38.7734375, 40.1650390625, 41.556640625, 42.9482421875, 44.33984375, 45.7314453125, 47.123046875, 48.5146484375, 49.90625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 11.0, 14.0, 55.0, 145.0, 240.0, 284.0, 147.0, 76.0, 14.0, 10.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-710.7371215820312, -669.2864990234375, -627.8358154296875, -586.3851928710938, -544.9345703125, -503.48388671875, -462.03326416015625, -420.5826110839844, -379.1319580078125, -337.6813049316406, -296.23065185546875, -254.780029296875, -213.32937622070312, -171.87872314453125, -130.42808532714844, -88.97744750976562, -47.52679443359375, -6.076148986816406, 35.37449645996094, 76.82514190673828, 118.27578735351562, 159.7264404296875, 201.1770782470703, 242.62771606445312, 284.078369140625, 325.5290222167969, 366.97967529296875, 408.4302978515625, 449.8809509277344, 491.33160400390625, 532.7822265625, 574.23291015625, 615.68359375, 657.1342163085938, 698.5848999023438, 740.0355224609375, 781.4862060546875, 822.9368286132812, 864.387451171875, 905.838134765625, 947.2887573242188, 988.7393798828125, 1030.1900634765625, 1071.6407470703125, 1113.09130859375, 1154.5419921875, 1195.99267578125, 1237.4432373046875, 1278.8939208984375, 1320.3446044921875, 1361.795166015625, 1403.245849609375, 1444.696533203125, 1486.147216796875, 1527.5977783203125, 1569.0484619140625, 1610.4990234375, 1651.94970703125, 1693.4002685546875, 1734.8509521484375, 1776.3016357421875, 1817.752197265625, 1859.202880859375, 1900.653564453125, 1942.104248046875]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 2.0, 4.0, 5.0, 11.0, 6.0, 5.0, 12.0, 10.0, 9.0, 13.0, 21.0, 22.0, 41.0, 36.0, 26.0, 36.0, 46.0, 40.0, 43.0, 44.0, 47.0, 55.0, 48.0, 47.0, 52.0, 34.0, 29.0, 37.0, 31.0, 34.0, 18.0, 26.0, 16.0, 17.0, 15.0, 13.0, 17.0, 5.0, 5.0, 9.0, 5.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-363.6934814453125, -351.2881774902344, -338.8829040527344, -326.47760009765625, -314.07232666015625, -301.6670227050781, -289.2617492675781, -276.8564453125, -264.451171875, -252.04588317871094, -239.64059448242188, -227.2353057861328, -214.83001708984375, -202.4247283935547, -190.01943969726562, -177.6141357421875, -165.20884704589844, -152.80355834960938, -140.3982696533203, -127.99298095703125, -115.58769226074219, -103.18240356445312, -90.77710723876953, -78.37181854248047, -65.9665298461914, -53.561241149902344, -41.15595245361328, -28.750659942626953, -16.34537124633789, -3.940082550048828, 8.4652099609375, 20.870498657226562, 33.275787353515625, 45.68107604980469, 58.08636474609375, 70.49165344238281, 82.89694213867188, 95.30223083496094, 107.70752716064453, 120.1128158569336, 132.51809692382812, 144.9233856201172, 157.32867431640625, 169.7339630126953, 182.13925170898438, 194.54454040527344, 206.9498291015625, 219.35513305664062, 231.7604217529297, 244.16571044921875, 256.5710144042969, 268.9762878417969, 281.381591796875, 293.786865234375, 306.1921691894531, 318.5974426269531, 331.00274658203125, 343.4080505371094, 355.8133239746094, 368.2186279296875, 380.6239013671875, 393.0292053222656, 405.4344787597656, 417.83978271484375, 430.24505615234375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 8.0, 4.0, 14.0, 13.0, 16.0, 12.0, 27.0, 38.0, 63.0, 74.0, 119.0, 141.0, 216.0, 301.0, 452.0, 742.0, 1200.0, 2178.0, 4311.0, 11709.0, 90254.0, 4042182.0, 25638.0, 6947.0, 3046.0, 1655.0, 1009.0, 646.0, 407.0, 260.0, 166.0, 121.0, 100.0, 62.0, 45.0, 33.0, 24.0, 12.0, 11.0, 12.0, 7.0, 3.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-74.4375, -71.978515625, -69.51953125, -67.060546875, -64.6015625, -62.142578125, -59.68359375, -57.224609375, -54.765625, -52.306640625, -49.84765625, -47.388671875, -44.9296875, -42.470703125, -40.01171875, -37.552734375, -35.09375, -32.634765625, -30.17578125, -27.716796875, -25.2578125, -22.798828125, -20.33984375, -17.880859375, -15.421875, -12.962890625, -10.50390625, -8.044921875, -5.5859375, -3.126953125, -0.66796875, 1.791015625, 4.25, 6.708984375, 9.16796875, 11.626953125, 14.0859375, 16.544921875, 19.00390625, 21.462890625, 23.921875, 26.380859375, 28.83984375, 31.298828125, 33.7578125, 36.216796875, 38.67578125, 41.134765625, 43.59375, 46.052734375, 48.51171875, 50.970703125, 53.4296875, 55.888671875, 58.34765625, 60.806640625, 63.265625, 65.724609375, 68.18359375, 70.642578125, 73.1015625, 75.560546875, 78.01953125, 80.478515625, 82.9375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 8.0, 12.0, 9.0, 13.0, 13.0, 19.0, 6.0, 23.0, 37.0, 31.0, 25.0, 35.0, 45.0, 39.0, 55.0, 49.0, 53.0, 47.0, 63.0, 35.0, 51.0, 41.0, 36.0, 36.0, 31.0, 32.0, 23.0, 24.0, 23.0, 18.0, 15.0, 9.0, 14.0, 4.0, 9.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.921875, -15.36328125, -14.8046875, -14.24609375, -13.6875, -13.12890625, -12.5703125, -12.01171875, -11.453125, -10.89453125, -10.3359375, -9.77734375, -9.21875, -8.66015625, -8.1015625, -7.54296875, -6.984375, -6.42578125, -5.8671875, -5.30859375, -4.75, -4.19140625, -3.6328125, -3.07421875, -2.515625, -1.95703125, -1.3984375, -0.83984375, -0.28125, 0.27734375, 0.8359375, 1.39453125, 1.953125, 2.51171875, 3.0703125, 3.62890625, 4.1875, 4.74609375, 5.3046875, 5.86328125, 6.421875, 6.98046875, 7.5390625, 8.09765625, 8.65625, 9.21484375, 9.7734375, 10.33203125, 10.890625, 11.44921875, 12.0078125, 12.56640625, 13.125, 13.68359375, 14.2421875, 14.80078125, 15.359375, 15.91796875, 16.4765625, 17.03515625, 17.59375, 18.15234375, 18.7109375, 19.26953125, 19.828125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 1.0, 6.0, 5.0, 7.0, 7.0, 8.0, 12.0, 12.0, 22.0, 27.0, 52.0, 60.0, 89.0, 146.0, 160.0, 284.0, 356.0, 611.0, 896.0, 1618.0, 2979.0, 7163.0, 21965.0, 3903589.0, 224492.0, 17287.0, 5961.0, 2525.0, 1408.0, 807.0, 488.0, 367.0, 265.0, 170.0, 121.0, 93.0, 54.0, 47.0, 22.0, 29.0, 20.0, 13.0, 17.0, 8.0, 2.0, 5.0, 9.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.1875, -91.1396484375, -88.091796875, -85.0439453125, -81.99609375, -78.9482421875, -75.900390625, -72.8525390625, -69.8046875, -66.7568359375, -63.708984375, -60.6611328125, -57.61328125, -54.5654296875, -51.517578125, -48.4697265625, -45.421875, -42.3740234375, -39.326171875, -36.2783203125, -33.23046875, -30.1826171875, -27.134765625, -24.0869140625, -21.0390625, -17.9912109375, -14.943359375, -11.8955078125, -8.84765625, -5.7998046875, -2.751953125, 0.2958984375, 3.34375, 6.3916015625, 9.439453125, 12.4873046875, 15.53515625, 18.5830078125, 21.630859375, 24.6787109375, 27.7265625, 30.7744140625, 33.822265625, 36.8701171875, 39.91796875, 42.9658203125, 46.013671875, 49.0615234375, 52.109375, 55.1572265625, 58.205078125, 61.2529296875, 64.30078125, 67.3486328125, 70.396484375, 73.4443359375, 76.4921875, 79.5400390625, 82.587890625, 85.6357421875, 88.68359375, 91.7314453125, 94.779296875, 97.8271484375, 100.875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 1.0, 7.0, 12.0, 10.0, 19.0, 23.0, 80.0, 3731.0, 115.0, 32.0, 21.0, 7.0, 5.0, 3.0, 7.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.3125, -31.31982421875, -30.3271484375, -29.33447265625, -28.341796875, -27.34912109375, -26.3564453125, -25.36376953125, -24.37109375, -23.37841796875, -22.3857421875, -21.39306640625, -20.400390625, -19.40771484375, -18.4150390625, -17.42236328125, -16.4296875, -15.43701171875, -14.4443359375, -13.45166015625, -12.458984375, -11.46630859375, -10.4736328125, -9.48095703125, -8.48828125, -7.49560546875, -6.5029296875, -5.51025390625, -4.517578125, -3.52490234375, -2.5322265625, -1.53955078125, -0.546875, 0.44580078125, 1.4384765625, 2.43115234375, 3.423828125, 4.41650390625, 5.4091796875, 6.40185546875, 7.39453125, 8.38720703125, 9.3798828125, 10.37255859375, 11.365234375, 12.35791015625, 13.3505859375, 14.34326171875, 15.3359375, 16.32861328125, 17.3212890625, 18.31396484375, 19.306640625, 20.29931640625, 21.2919921875, 22.28466796875, 23.27734375, 24.27001953125, 25.2626953125, 26.25537109375, 27.248046875, 28.24072265625, 29.2333984375, 30.22607421875, 31.21875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 32.0, 47.0, 152.0, 243.0, 264.0, 126.0, 75.0, 33.0, 11.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-227.29412841796875, -222.01141357421875, -216.7286834716797, -211.4459686279297, -206.16323852539062, -200.88052368164062, -195.59779357910156, -190.31507873535156, -185.0323486328125, -179.7496337890625, -174.46690368652344, -169.18418884277344, -163.90145874023438, -158.61874389648438, -153.3360137939453, -148.0532989501953, -142.77056884765625, -137.48785400390625, -132.2051239013672, -126.92240142822266, -121.63967895507812, -116.3569564819336, -111.07423400878906, -105.79151916503906, -100.50880432128906, -95.22608184814453, -89.943359375, -84.66063690185547, -79.37791442871094, -74.0951919555664, -68.81246948242188, -63.52975082397461, -58.24702453613281, -52.96430206298828, -47.68157958984375, -42.39885711669922, -37.11613464355469, -31.83341407775879, -26.55069351196289, -21.26797103881836, -15.985248565673828, -10.702526092529297, -5.419804573059082, -0.1370830535888672, 5.145639419555664, 10.428361892700195, 15.711082458496094, 20.993804931640625, 26.276527404785156, 31.559249877929688, 36.84197235107422, 42.12469482421875, 47.40741729736328, 52.69013977050781, 57.97285842895508, 63.25558090209961, 68.53829956054688, 73.8210220336914, 79.10374450683594, 84.38646697998047, 89.669189453125, 94.95191192626953, 100.23463439941406, 105.51734924316406, 110.80007934570312]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 6.0, 12.0, 9.0, 9.0, 21.0, 18.0, 16.0, 23.0, 32.0, 26.0, 32.0, 44.0, 43.0, 44.0, 57.0, 54.0, 53.0, 54.0, 60.0, 38.0, 48.0, 33.0, 51.0, 37.0, 28.0, 21.0, 15.0, 21.0, 19.0, 13.0, 14.0, 13.0, 10.0, 6.0, 4.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.94529724121094, -47.49171447753906, -46.03813552856445, -44.58455276489258, -43.13097381591797, -41.677391052246094, -40.22380828857422, -38.770225524902344, -37.316646575927734, -35.86306381225586, -34.40948486328125, -32.955902099609375, -31.502321243286133, -30.04874038696289, -28.595157623291016, -27.141576766967773, -25.68799591064453, -24.23441505432129, -22.780834197998047, -21.327251434326172, -19.87367057800293, -18.420089721679688, -16.966506958007812, -15.51292610168457, -14.059345245361328, -12.605764389038086, -11.152182579040527, -9.698600769042969, -8.245019912719727, -6.791438579559326, -5.337857246398926, -3.884275436401367, -2.430694580078125, -0.9771132469177246, 0.4764680862426758, 1.9300494194030762, 3.3836307525634766, 4.837212085723877, 6.290793418884277, 7.744375228881836, 9.197956085205078, 10.65153694152832, 12.105118751525879, 13.558700561523438, 15.01228141784668, 16.465862274169922, 17.919445037841797, 19.37302589416504, 20.82660675048828, 22.280187606811523, 23.733768463134766, 25.18735122680664, 26.640932083129883, 28.094512939453125, 29.548095703125, 31.001676559448242, 32.455257415771484, 33.90884017944336, 35.36241912841797, 36.816001892089844, 38.26958465576172, 39.72316360473633, 41.1767463684082, 42.63032531738281, 44.08390808105469]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 4.0, 9.0, 8.0, 8.0, 19.0, 21.0, 24.0, 56.0, 81.0, 122.0, 231.0, 330.0, 612.0, 1232.0, 2617.0, 5722.0, 13931.0, 36652.0, 110289.0, 355891.0, 351181.0, 108742.0, 36067.0, 13667.0, 5658.0, 2595.0, 1208.0, 655.0, 345.0, 214.0, 115.0, 84.0, 55.0, 32.0, 16.0, 24.0, 15.0, 3.0, 7.0, 7.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.0625, -46.40478515625, -44.7470703125, -43.08935546875, -41.431640625, -39.77392578125, -38.1162109375, -36.45849609375, -34.80078125, -33.14306640625, -31.4853515625, -29.82763671875, -28.169921875, -26.51220703125, -24.8544921875, -23.19677734375, -21.5390625, -19.88134765625, -18.2236328125, -16.56591796875, -14.908203125, -13.25048828125, -11.5927734375, -9.93505859375, -8.27734375, -6.61962890625, -4.9619140625, -3.30419921875, -1.646484375, 0.01123046875, 1.6689453125, 3.32666015625, 4.984375, 6.64208984375, 8.2998046875, 9.95751953125, 11.615234375, 13.27294921875, 14.9306640625, 16.58837890625, 18.24609375, 19.90380859375, 21.5615234375, 23.21923828125, 24.876953125, 26.53466796875, 28.1923828125, 29.85009765625, 31.5078125, 33.16552734375, 34.8232421875, 36.48095703125, 38.138671875, 39.79638671875, 41.4541015625, 43.11181640625, 44.76953125, 46.42724609375, 48.0849609375, 49.74267578125, 51.400390625, 53.05810546875, 54.7158203125, 56.37353515625, 58.03125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 2.0, 12.0, 8.0, 14.0, 13.0, 17.0, 15.0, 16.0, 13.0, 25.0, 37.0, 34.0, 38.0, 47.0, 46.0, 40.0, 52.0, 47.0, 54.0, 52.0, 46.0, 52.0, 46.0, 35.0, 38.0, 32.0, 30.0, 27.0, 22.0, 18.0, 15.0, 7.0, 14.0, 11.0, 7.0, 7.0, 4.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.59375, -16.007080078125, -15.42041015625, -14.833740234375, -14.2470703125, -13.660400390625, -13.07373046875, -12.487060546875, -11.900390625, -11.313720703125, -10.72705078125, -10.140380859375, -9.5537109375, -8.967041015625, -8.38037109375, -7.793701171875, -7.20703125, -6.620361328125, -6.03369140625, -5.447021484375, -4.8603515625, -4.273681640625, -3.68701171875, -3.100341796875, -2.513671875, -1.927001953125, -1.34033203125, -0.753662109375, -0.1669921875, 0.419677734375, 1.00634765625, 1.593017578125, 2.1796875, 2.766357421875, 3.35302734375, 3.939697265625, 4.5263671875, 5.113037109375, 5.69970703125, 6.286376953125, 6.873046875, 7.459716796875, 8.04638671875, 8.633056640625, 9.2197265625, 9.806396484375, 10.39306640625, 10.979736328125, 11.56640625, 12.153076171875, 12.73974609375, 13.326416015625, 13.9130859375, 14.499755859375, 15.08642578125, 15.673095703125, 16.259765625, 16.846435546875, 17.43310546875, 18.019775390625, 18.6064453125, 19.193115234375, 19.77978515625, 20.366455078125, 20.953125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 3.0, 13.0, 8.0, 11.0, 23.0, 24.0, 29.0, 28.0, 48.0, 69.0, 89.0, 92.0, 145.0, 208.0, 299.0, 379.0, 601.0, 956.0, 1857.0, 5094.0, 19846.0, 127052.0, 692612.0, 163923.0, 23991.0, 5800.0, 2109.0, 1016.0, 645.0, 440.0, 327.0, 201.0, 131.0, 111.0, 82.0, 63.0, 51.0, 30.0, 41.0, 18.0, 14.0, 15.0, 7.0, 11.0, 14.0, 7.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0], "bins": [-86.1875, -83.619140625, -81.05078125, -78.482421875, -75.9140625, -73.345703125, -70.77734375, -68.208984375, -65.640625, -63.072265625, -60.50390625, -57.935546875, -55.3671875, -52.798828125, -50.23046875, -47.662109375, -45.09375, -42.525390625, -39.95703125, -37.388671875, -34.8203125, -32.251953125, -29.68359375, -27.115234375, -24.546875, -21.978515625, -19.41015625, -16.841796875, -14.2734375, -11.705078125, -9.13671875, -6.568359375, -4.0, -1.431640625, 1.13671875, 3.705078125, 6.2734375, 8.841796875, 11.41015625, 13.978515625, 16.546875, 19.115234375, 21.68359375, 24.251953125, 26.8203125, 29.388671875, 31.95703125, 34.525390625, 37.09375, 39.662109375, 42.23046875, 44.798828125, 47.3671875, 49.935546875, 52.50390625, 55.072265625, 57.640625, 60.208984375, 62.77734375, 65.345703125, 67.9140625, 70.482421875, 73.05078125, 75.619140625, 78.1875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 9.0, 8.0, 9.0, 9.0, 8.0, 10.0, 12.0, 14.0, 9.0, 23.0, 26.0, 20.0, 32.0, 33.0, 30.0, 32.0, 33.0, 40.0, 40.0, 40.0, 48.0, 42.0, 37.0, 44.0, 24.0, 43.0, 38.0, 36.0, 34.0, 29.0, 28.0, 30.0, 20.0, 22.0, 17.0, 21.0, 12.0, 10.0, 7.0, 11.0, 6.0, 4.0, 4.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-81.0, -78.7216796875, -76.443359375, -74.1650390625, -71.88671875, -69.6083984375, -67.330078125, -65.0517578125, -62.7734375, -60.4951171875, -58.216796875, -55.9384765625, -53.66015625, -51.3818359375, -49.103515625, -46.8251953125, -44.546875, -42.2685546875, -39.990234375, -37.7119140625, -35.43359375, -33.1552734375, -30.876953125, -28.5986328125, -26.3203125, -24.0419921875, -21.763671875, -19.4853515625, -17.20703125, -14.9287109375, -12.650390625, -10.3720703125, -8.09375, -5.8154296875, -3.537109375, -1.2587890625, 1.01953125, 3.2978515625, 5.576171875, 7.8544921875, 10.1328125, 12.4111328125, 14.689453125, 16.9677734375, 19.24609375, 21.5244140625, 23.802734375, 26.0810546875, 28.359375, 30.6376953125, 32.916015625, 35.1943359375, 37.47265625, 39.7509765625, 42.029296875, 44.3076171875, 46.5859375, 48.8642578125, 51.142578125, 53.4208984375, 55.69921875, 57.9775390625, 60.255859375, 62.5341796875, 64.8125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 5.0, 8.0, 2.0, 4.0, 13.0, 21.0, 16.0, 30.0, 38.0, 45.0, 90.0, 126.0, 278.0, 412.0, 842.0, 1933.0, 5434.0, 21685.0, 135729.0, 658767.0, 184382.0, 27535.0, 6803.0, 2196.0, 935.0, 475.0, 264.0, 162.0, 94.0, 72.0, 57.0, 34.0, 23.0, 16.0, 10.0, 7.0, 7.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.046875, -27.993408203125, -26.93994140625, -25.886474609375, -24.8330078125, -23.779541015625, -22.72607421875, -21.672607421875, -20.619140625, -19.565673828125, -18.51220703125, -17.458740234375, -16.4052734375, -15.351806640625, -14.29833984375, -13.244873046875, -12.19140625, -11.137939453125, -10.08447265625, -9.031005859375, -7.9775390625, -6.924072265625, -5.87060546875, -4.817138671875, -3.763671875, -2.710205078125, -1.65673828125, -0.603271484375, 0.4501953125, 1.503662109375, 2.55712890625, 3.610595703125, 4.6640625, 5.717529296875, 6.77099609375, 7.824462890625, 8.8779296875, 9.931396484375, 10.98486328125, 12.038330078125, 13.091796875, 14.145263671875, 15.19873046875, 16.252197265625, 17.3056640625, 18.359130859375, 19.41259765625, 20.466064453125, 21.51953125, 22.572998046875, 23.62646484375, 24.679931640625, 25.7333984375, 26.786865234375, 27.84033203125, 28.893798828125, 29.947265625, 31.000732421875, 32.05419921875, 33.107666015625, 34.1611328125, 35.214599609375, 36.26806640625, 37.321533203125, 38.375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 8.0, 2.0, 8.0, 7.0, 19.0, 16.0, 21.0, 55.0, 47.0, 66.0, 87.0, 115.0, 126.0, 108.0, 88.0, 74.0, 36.0, 31.0, 30.0, 10.0, 18.0, 8.0, 6.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004543304443359375, -0.004377186298370361, -0.004211068153381348, -0.004044950008392334, -0.0038788318634033203, -0.0037127137184143066, -0.003546595573425293, -0.0033804774284362793, -0.0032143592834472656, -0.003048241138458252, -0.0028821229934692383, -0.0027160048484802246, -0.002549886703491211, -0.0023837685585021973, -0.0022176504135131836, -0.00205153226852417, -0.0018854141235351562, -0.0017192959785461426, -0.001553177833557129, -0.0013870596885681152, -0.0012209415435791016, -0.0010548233985900879, -0.0008887052536010742, -0.0007225871086120605, -0.0005564689636230469, -0.0003903508186340332, -0.00022423267364501953, -5.811452865600586e-05, 0.00010800361633300781, 0.0002741217613220215, 0.00044023990631103516, 0.0006063580513000488, 0.0007724761962890625, 0.0009385943412780762, 0.0011047124862670898, 0.0012708306312561035, 0.0014369487762451172, 0.0016030669212341309, 0.0017691850662231445, 0.0019353032112121582, 0.002101421356201172, 0.0022675395011901855, 0.0024336576461791992, 0.002599775791168213, 0.0027658939361572266, 0.0029320120811462402, 0.003098130226135254, 0.0032642483711242676, 0.0034303665161132812, 0.003596484661102295, 0.0037626028060913086, 0.003928720951080322, 0.004094839096069336, 0.00426095724105835, 0.004427075386047363, 0.004593193531036377, 0.004759311676025391, 0.004925429821014404, 0.005091547966003418, 0.005257666110992432, 0.005423784255981445, 0.005589902400970459, 0.005756020545959473, 0.005922138690948486, 0.0060882568359375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 11.0, 7.0, 14.0, 22.0, 29.0, 53.0, 82.0, 181.0, 359.0, 802.0, 1993.0, 7278.0, 53381.0, 718478.0, 240883.0, 18838.0, 3772.0, 1269.0, 540.0, 265.0, 129.0, 70.0, 37.0, 16.0, 19.0, 8.0, 5.0, 8.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.28125, -46.6591796875, -45.037109375, -43.4150390625, -41.79296875, -40.1708984375, -38.548828125, -36.9267578125, -35.3046875, -33.6826171875, -32.060546875, -30.4384765625, -28.81640625, -27.1943359375, -25.572265625, -23.9501953125, -22.328125, -20.7060546875, -19.083984375, -17.4619140625, -15.83984375, -14.2177734375, -12.595703125, -10.9736328125, -9.3515625, -7.7294921875, -6.107421875, -4.4853515625, -2.86328125, -1.2412109375, 0.380859375, 2.0029296875, 3.625, 5.2470703125, 6.869140625, 8.4912109375, 10.11328125, 11.7353515625, 13.357421875, 14.9794921875, 16.6015625, 18.2236328125, 19.845703125, 21.4677734375, 23.08984375, 24.7119140625, 26.333984375, 27.9560546875, 29.578125, 31.2001953125, 32.822265625, 34.4443359375, 36.06640625, 37.6884765625, 39.310546875, 40.9326171875, 42.5546875, 44.1767578125, 45.798828125, 47.4208984375, 49.04296875, 50.6650390625, 52.287109375, 53.9091796875, 55.53125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 11.0, 8.0, 15.0, 17.0, 19.0, 20.0, 40.0, 45.0, 64.0, 85.0, 82.0, 104.0, 91.0, 93.0, 80.0, 59.0, 35.0, 31.0, 29.0, 26.0, 19.0, 12.0, 6.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.078125, -23.113525390625, -22.14892578125, -21.184326171875, -20.2197265625, -19.255126953125, -18.29052734375, -17.325927734375, -16.361328125, -15.396728515625, -14.43212890625, -13.467529296875, -12.5029296875, -11.538330078125, -10.57373046875, -9.609130859375, -8.64453125, -7.679931640625, -6.71533203125, -5.750732421875, -4.7861328125, -3.821533203125, -2.85693359375, -1.892333984375, -0.927734375, 0.036865234375, 1.00146484375, 1.966064453125, 2.9306640625, 3.895263671875, 4.85986328125, 5.824462890625, 6.7890625, 7.753662109375, 8.71826171875, 9.682861328125, 10.6474609375, 11.612060546875, 12.57666015625, 13.541259765625, 14.505859375, 15.470458984375, 16.43505859375, 17.399658203125, 18.3642578125, 19.328857421875, 20.29345703125, 21.258056640625, 22.22265625, 23.187255859375, 24.15185546875, 25.116455078125, 26.0810546875, 27.045654296875, 28.01025390625, 28.974853515625, 29.939453125, 30.904052734375, 31.86865234375, 32.833251953125, 33.7978515625, 34.762451171875, 35.72705078125, 36.691650390625, 37.65625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 8.0, 18.0, 66.0, 164.0, 291.0, 276.0, 127.0, 39.0, 12.0, 4.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1836.1102294921875, -1799.421630859375, -1762.7330322265625, -1726.04443359375, -1689.355712890625, -1652.6671142578125, -1615.978515625, -1579.2899169921875, -1542.601318359375, -1505.9127197265625, -1469.22412109375, -1432.5355224609375, -1395.846923828125, -1359.158203125, -1322.4696044921875, -1285.781005859375, -1249.0924072265625, -1212.40380859375, -1175.7152099609375, -1139.026611328125, -1102.337890625, -1065.6492919921875, -1028.960693359375, -992.2720947265625, -955.58349609375, -918.8948974609375, -882.206298828125, -845.5176391601562, -808.8290405273438, -772.1404418945312, -735.4517822265625, -698.76318359375, -662.07470703125, -625.3861083984375, -588.697509765625, -552.0088500976562, -515.3202514648438, -478.63165283203125, -441.9430236816406, -405.25439453125, -368.5657958984375, -331.877197265625, -295.1885681152344, -258.49993896484375, -221.81134033203125, -185.1227264404297, -148.43411254882812, -111.7454833984375, -75.056884765625, -38.36827087402344, -1.679656982421875, 35.00895690917969, 71.69757080078125, 108.38618469238281, 145.07479858398438, 181.763427734375, 218.4520263671875, 255.14064025878906, 291.8292541503906, 328.51788330078125, 365.20648193359375, 401.89508056640625, 438.5837097167969, 475.2723388671875, 511.9609375]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 6.0, 14.0, 13.0, 12.0, 13.0, 20.0, 16.0, 24.0, 25.0, 31.0, 32.0, 33.0, 43.0, 37.0, 49.0, 46.0, 46.0, 51.0, 48.0, 45.0, 56.0, 41.0, 38.0, 28.0, 31.0, 25.0, 30.0, 24.0, 24.0, 16.0, 13.0, 13.0, 15.0, 7.0, 8.0, 4.0, 3.0, 7.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-332.44537353515625, -321.09197998046875, -309.7385559082031, -298.3851623535156, -287.0317687988281, -275.6783447265625, -264.324951171875, -252.9715576171875, -241.61814880371094, -230.26473999023438, -218.91134643554688, -207.5579376220703, -196.20452880859375, -184.85113525390625, -173.4977264404297, -162.14431762695312, -150.79092407226562, -139.43751525878906, -128.08412170410156, -116.730712890625, -105.37731170654297, -94.02391052246094, -82.67050170898438, -71.31710052490234, -59.96369934082031, -48.61029815673828, -37.256893157958984, -25.903488159179688, -14.550086975097656, -3.196685791015625, 8.156723022460938, 19.51012420654297, 30.863555908203125, 42.216957092285156, 53.57036209106445, 64.92376708984375, 76.27716827392578, 87.63056945800781, 98.98397827148438, 110.3373794555664, 121.69078063964844, 133.044189453125, 144.3975830078125, 155.75099182128906, 167.10440063476562, 178.45779418945312, 189.8112030029297, 201.16461181640625, 212.51800537109375, 223.8714141845703, 235.2248077392578, 246.57821655273438, 257.9316101074219, 269.2850341796875, 280.638427734375, 291.9918212890625, 303.34521484375, 314.6986083984375, 326.0520324707031, 337.4054260253906, 348.7588195800781, 360.11224365234375, 371.46563720703125, 382.81903076171875, 394.1724548339844]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 6.0, 3.0, 5.0, 14.0, 13.0, 18.0, 23.0, 24.0, 42.0, 41.0, 100.0, 154.0, 223.0, 358.0, 746.0, 1598.0, 4932.0, 51109.0, 4119730.0, 10132.0, 2664.0, 1008.0, 491.0, 318.0, 161.0, 102.0, 84.0, 47.0, 44.0, 44.0, 14.0, 8.0, 9.0, 6.0, 4.0, 3.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.0625, -118.275390625, -114.48828125, -110.701171875, -106.9140625, -103.126953125, -99.33984375, -95.552734375, -91.765625, -87.978515625, -84.19140625, -80.404296875, -76.6171875, -72.830078125, -69.04296875, -65.255859375, -61.46875, -57.681640625, -53.89453125, -50.107421875, -46.3203125, -42.533203125, -38.74609375, -34.958984375, -31.171875, -27.384765625, -23.59765625, -19.810546875, -16.0234375, -12.236328125, -8.44921875, -4.662109375, -0.875, 2.912109375, 6.69921875, 10.486328125, 14.2734375, 18.060546875, 21.84765625, 25.634765625, 29.421875, 33.208984375, 36.99609375, 40.783203125, 44.5703125, 48.357421875, 52.14453125, 55.931640625, 59.71875, 63.505859375, 67.29296875, 71.080078125, 74.8671875, 78.654296875, 82.44140625, 86.228515625, 90.015625, 93.802734375, 97.58984375, 101.376953125, 105.1640625, 108.951171875, 112.73828125, 116.525390625, 120.3125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 4.0, 6.0, 9.0, 12.0, 4.0, 15.0, 12.0, 17.0, 30.0, 26.0, 27.0, 31.0, 37.0, 35.0, 41.0, 45.0, 47.0, 51.0, 43.0, 60.0, 43.0, 38.0, 42.0, 45.0, 40.0, 38.0, 47.0, 26.0, 25.0, 21.0, 20.0, 21.0, 8.0, 11.0, 4.0, 6.0, 2.0, 7.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.359375, -15.777587890625, -15.19580078125, -14.614013671875, -14.0322265625, -13.450439453125, -12.86865234375, -12.286865234375, -11.705078125, -11.123291015625, -10.54150390625, -9.959716796875, -9.3779296875, -8.796142578125, -8.21435546875, -7.632568359375, -7.05078125, -6.468994140625, -5.88720703125, -5.305419921875, -4.7236328125, -4.141845703125, -3.56005859375, -2.978271484375, -2.396484375, -1.814697265625, -1.23291015625, -0.651123046875, -0.0693359375, 0.512451171875, 1.09423828125, 1.676025390625, 2.2578125, 2.839599609375, 3.42138671875, 4.003173828125, 4.5849609375, 5.166748046875, 5.74853515625, 6.330322265625, 6.912109375, 7.493896484375, 8.07568359375, 8.657470703125, 9.2392578125, 9.821044921875, 10.40283203125, 10.984619140625, 11.56640625, 12.148193359375, 12.72998046875, 13.311767578125, 13.8935546875, 14.475341796875, 15.05712890625, 15.638916015625, 16.220703125, 16.802490234375, 17.38427734375, 17.966064453125, 18.5478515625, 19.129638671875, 19.71142578125, 20.293212890625, 20.875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 10.0, 8.0, 8.0, 11.0, 13.0, 17.0, 19.0, 24.0, 43.0, 49.0, 96.0, 124.0, 157.0, 272.0, 452.0, 745.0, 1324.0, 2588.0, 5805.0, 20327.0, 4103245.0, 43947.0, 7759.0, 3163.0, 1637.0, 903.0, 512.0, 311.0, 222.0, 145.0, 112.0, 69.0, 43.0, 24.0, 21.0, 20.0, 11.0, 10.0, 7.0, 5.0, 5.0, 3.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-80.1875, -77.5712890625, -74.955078125, -72.3388671875, -69.72265625, -67.1064453125, -64.490234375, -61.8740234375, -59.2578125, -56.6416015625, -54.025390625, -51.4091796875, -48.79296875, -46.1767578125, -43.560546875, -40.9443359375, -38.328125, -35.7119140625, -33.095703125, -30.4794921875, -27.86328125, -25.2470703125, -22.630859375, -20.0146484375, -17.3984375, -14.7822265625, -12.166015625, -9.5498046875, -6.93359375, -4.3173828125, -1.701171875, 0.9150390625, 3.53125, 6.1474609375, 8.763671875, 11.3798828125, 13.99609375, 16.6123046875, 19.228515625, 21.8447265625, 24.4609375, 27.0771484375, 29.693359375, 32.3095703125, 34.92578125, 37.5419921875, 40.158203125, 42.7744140625, 45.390625, 48.0068359375, 50.623046875, 53.2392578125, 55.85546875, 58.4716796875, 61.087890625, 63.7041015625, 66.3203125, 68.9365234375, 71.552734375, 74.1689453125, 76.78515625, 79.4013671875, 82.017578125, 84.6337890625, 87.25]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 10.0, 9.0, 17.0, 49.0, 3495.0, 416.0, 35.0, 16.0, 7.0, 7.0, 5.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9140625, -11.2491455078125, -10.584228515625, -9.9193115234375, -9.25439453125, -8.5894775390625, -7.924560546875, -7.2596435546875, -6.5947265625, -5.9298095703125, -5.264892578125, -4.5999755859375, -3.93505859375, -3.2701416015625, -2.605224609375, -1.9403076171875, -1.275390625, -0.6104736328125, 0.054443359375, 0.7193603515625, 1.38427734375, 2.0491943359375, 2.714111328125, 3.3790283203125, 4.0439453125, 4.7088623046875, 5.373779296875, 6.0386962890625, 6.70361328125, 7.3685302734375, 8.033447265625, 8.6983642578125, 9.36328125, 10.0281982421875, 10.693115234375, 11.3580322265625, 12.02294921875, 12.6878662109375, 13.352783203125, 14.0177001953125, 14.6826171875, 15.3475341796875, 16.012451171875, 16.6773681640625, 17.34228515625, 18.0072021484375, 18.672119140625, 19.3370361328125, 20.001953125, 20.6668701171875, 21.331787109375, 21.9967041015625, 22.66162109375, 23.3265380859375, 23.991455078125, 24.6563720703125, 25.3212890625, 25.9862060546875, 26.651123046875, 27.3160400390625, 27.98095703125, 28.6458740234375, 29.310791015625, 29.9757080078125, 30.640625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 5.0, 16.0, 42.0, 95.0, 216.0, 271.0, 228.0, 88.0, 29.0, 10.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.78084564208984, -106.04561614990234, -102.31038665771484, -98.57515716552734, -94.83992767333984, -91.10469818115234, -87.36947631835938, -83.63424682617188, -79.89901733398438, -76.16378784179688, -72.42855834960938, -68.69332885742188, -64.95809936523438, -61.222869873046875, -57.48764419555664, -53.75241470336914, -50.017181396484375, -46.281951904296875, -42.546722412109375, -38.811492919921875, -35.076263427734375, -31.341035842895508, -27.60580825805664, -23.87057876586914, -20.13534927368164, -16.40011978149414, -12.664891242980957, -8.929662704467773, -5.194433212280273, -1.4592037200927734, 2.2760238647460938, 6.011253356933594, 9.746475219726562, 13.481704711914062, 17.216934204101562, 20.95216178894043, 24.68739128112793, 28.42262077331543, 32.1578483581543, 35.8930778503418, 39.6283073425293, 43.3635368347168, 47.0987663269043, 50.83399200439453, 54.56922149658203, 58.30445098876953, 62.03968048095703, 65.77490997314453, 69.51013946533203, 73.24536895751953, 76.98059844970703, 80.71582794189453, 84.45105743408203, 88.18628692626953, 91.9215087890625, 95.65673828125, 99.3919677734375, 103.127197265625, 106.8624267578125, 110.59765625, 114.3328857421875, 118.068115234375, 121.8033447265625, 125.53857421875, 129.2738037109375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 4.0, 7.0, 8.0, 15.0, 14.0, 24.0, 32.0, 24.0, 41.0, 42.0, 32.0, 53.0, 72.0, 65.0, 61.0, 50.0, 55.0, 43.0, 54.0, 40.0, 44.0, 33.0, 36.0, 35.0, 28.0, 25.0, 13.0, 16.0, 10.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.82115936279297, -28.777429580688477, -27.733699798583984, -26.689970016479492, -25.646240234375, -24.602508544921875, -23.558778762817383, -22.51504898071289, -21.4713191986084, -20.427589416503906, -19.383859634399414, -18.340129852294922, -17.296398162841797, -16.252670288085938, -15.208938598632812, -14.16520881652832, -13.121479034423828, -12.077749252319336, -11.034019470214844, -9.990288734436035, -8.946558952331543, -7.902829170227051, -6.8590989112854, -5.81536865234375, -4.771638870239258, -3.7279088497161865, -2.6841788291931152, -1.640448808670044, -0.5967187881469727, 0.44701099395751953, 1.49074125289917, 2.5344715118408203, 3.578205108642578, 4.62193489074707, 5.665665149688721, 6.709395408630371, 7.753125190734863, 8.796854972839355, 9.840585708618164, 10.884315490722656, 11.928045272827148, 12.97177505493164, 14.015504837036133, 15.059235572814941, 16.10296630859375, 17.14669418334961, 18.190425872802734, 19.234155654907227, 20.27788543701172, 21.32161521911621, 22.365345001220703, 23.409074783325195, 24.452804565429688, 25.496536254882812, 26.540266036987305, 27.583995819091797, 28.62772560119629, 29.67145538330078, 30.715185165405273, 31.758914947509766, 32.80264663696289, 33.84637451171875, 34.890106201171875, 35.933837890625, 36.97756576538086]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 4.0, 6.0, 13.0, 17.0, 18.0, 39.0, 53.0, 91.0, 137.0, 177.0, 318.0, 524.0, 837.0, 1592.0, 3064.0, 6006.0, 13040.0, 29984.0, 73850.0, 192340.0, 368528.0, 214298.0, 82079.0, 33161.0, 14447.0, 6690.0, 3259.0, 1638.0, 932.0, 532.0, 315.0, 192.0, 114.0, 80.0, 56.0, 38.0, 26.0, 19.0, 12.0, 10.0, 8.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-42.65625, -41.421875, -40.1875, -38.953125, -37.71875, -36.484375, -35.25, -34.015625, -32.78125, -31.546875, -30.3125, -29.078125, -27.84375, -26.609375, -25.375, -24.140625, -22.90625, -21.671875, -20.4375, -19.203125, -17.96875, -16.734375, -15.5, -14.265625, -13.03125, -11.796875, -10.5625, -9.328125, -8.09375, -6.859375, -5.625, -4.390625, -3.15625, -1.921875, -0.6875, 0.546875, 1.78125, 3.015625, 4.25, 5.484375, 6.71875, 7.953125, 9.1875, 10.421875, 11.65625, 12.890625, 14.125, 15.359375, 16.59375, 17.828125, 19.0625, 20.296875, 21.53125, 22.765625, 24.0, 25.234375, 26.46875, 27.703125, 28.9375, 30.171875, 31.40625, 32.640625, 33.875, 35.109375, 36.34375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 6.0, 4.0, 12.0, 13.0, 8.0, 14.0, 17.0, 24.0, 25.0, 29.0, 27.0, 44.0, 31.0, 48.0, 49.0, 41.0, 41.0, 53.0, 57.0, 47.0, 36.0, 50.0, 51.0, 43.0, 35.0, 30.0, 26.0, 34.0, 23.0, 22.0, 13.0, 5.0, 12.0, 8.0, 3.0, 4.0, 4.0, 0.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-18.0625, -17.4609375, -16.859375, -16.2578125, -15.65625, -15.0546875, -14.453125, -13.8515625, -13.25, -12.6484375, -12.046875, -11.4453125, -10.84375, -10.2421875, -9.640625, -9.0390625, -8.4375, -7.8359375, -7.234375, -6.6328125, -6.03125, -5.4296875, -4.828125, -4.2265625, -3.625, -3.0234375, -2.421875, -1.8203125, -1.21875, -0.6171875, -0.015625, 0.5859375, 1.1875, 1.7890625, 2.390625, 2.9921875, 3.59375, 4.1953125, 4.796875, 5.3984375, 6.0, 6.6015625, 7.203125, 7.8046875, 8.40625, 9.0078125, 9.609375, 10.2109375, 10.8125, 11.4140625, 12.015625, 12.6171875, 13.21875, 13.8203125, 14.421875, 15.0234375, 15.625, 16.2265625, 16.828125, 17.4296875, 18.03125, 18.6328125, 19.234375, 19.8359375, 20.4375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 6.0, 7.0, 4.0, 10.0, 16.0, 27.0, 26.0, 42.0, 69.0, 72.0, 114.0, 158.0, 247.0, 330.0, 524.0, 908.0, 1830.0, 5046.0, 20933.0, 145565.0, 711833.0, 132662.0, 19170.0, 4717.0, 1771.0, 873.0, 507.0, 294.0, 233.0, 168.0, 108.0, 73.0, 48.0, 41.0, 23.0, 19.0, 13.0, 18.0, 13.0, 10.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-80.0, -77.6796875, -75.359375, -73.0390625, -70.71875, -68.3984375, -66.078125, -63.7578125, -61.4375, -59.1171875, -56.796875, -54.4765625, -52.15625, -49.8359375, -47.515625, -45.1953125, -42.875, -40.5546875, -38.234375, -35.9140625, -33.59375, -31.2734375, -28.953125, -26.6328125, -24.3125, -21.9921875, -19.671875, -17.3515625, -15.03125, -12.7109375, -10.390625, -8.0703125, -5.75, -3.4296875, -1.109375, 1.2109375, 3.53125, 5.8515625, 8.171875, 10.4921875, 12.8125, 15.1328125, 17.453125, 19.7734375, 22.09375, 24.4140625, 26.734375, 29.0546875, 31.375, 33.6953125, 36.015625, 38.3359375, 40.65625, 42.9765625, 45.296875, 47.6171875, 49.9375, 52.2578125, 54.578125, 56.8984375, 59.21875, 61.5390625, 63.859375, 66.1796875, 68.5]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 1.0, 6.0, 6.0, 7.0, 8.0, 6.0, 15.0, 19.0, 23.0, 24.0, 29.0, 33.0, 27.0, 43.0, 41.0, 37.0, 47.0, 40.0, 53.0, 59.0, 40.0, 48.0, 48.0, 37.0, 56.0, 25.0, 38.0, 34.0, 27.0, 28.0, 23.0, 15.0, 9.0, 15.0, 6.0, 9.0, 4.0, 6.0, 5.0, 0.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-87.4375, -84.8798828125, -82.322265625, -79.7646484375, -77.20703125, -74.6494140625, -72.091796875, -69.5341796875, -66.9765625, -64.4189453125, -61.861328125, -59.3037109375, -56.74609375, -54.1884765625, -51.630859375, -49.0732421875, -46.515625, -43.9580078125, -41.400390625, -38.8427734375, -36.28515625, -33.7275390625, -31.169921875, -28.6123046875, -26.0546875, -23.4970703125, -20.939453125, -18.3818359375, -15.82421875, -13.2666015625, -10.708984375, -8.1513671875, -5.59375, -3.0361328125, -0.478515625, 2.0791015625, 4.63671875, 7.1943359375, 9.751953125, 12.3095703125, 14.8671875, 17.4248046875, 19.982421875, 22.5400390625, 25.09765625, 27.6552734375, 30.212890625, 32.7705078125, 35.328125, 37.8857421875, 40.443359375, 43.0009765625, 45.55859375, 48.1162109375, 50.673828125, 53.2314453125, 55.7890625, 58.3466796875, 60.904296875, 63.4619140625, 66.01953125, 68.5771484375, 71.134765625, 73.6923828125, 76.25]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 12.0, 11.0, 13.0, 14.0, 33.0, 42.0, 81.0, 89.0, 195.0, 366.0, 911.0, 2563.0, 13053.0, 199429.0, 788437.0, 35868.0, 4933.0, 1296.0, 547.0, 243.0, 134.0, 85.0, 56.0, 35.0, 27.0, 20.0, 8.0, 9.0, 5.0, 6.0, 6.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.09375, -52.4150390625, -50.736328125, -49.0576171875, -47.37890625, -45.7001953125, -44.021484375, -42.3427734375, -40.6640625, -38.9853515625, -37.306640625, -35.6279296875, -33.94921875, -32.2705078125, -30.591796875, -28.9130859375, -27.234375, -25.5556640625, -23.876953125, -22.1982421875, -20.51953125, -18.8408203125, -17.162109375, -15.4833984375, -13.8046875, -12.1259765625, -10.447265625, -8.7685546875, -7.08984375, -5.4111328125, -3.732421875, -2.0537109375, -0.375, 1.3037109375, 2.982421875, 4.6611328125, 6.33984375, 8.0185546875, 9.697265625, 11.3759765625, 13.0546875, 14.7333984375, 16.412109375, 18.0908203125, 19.76953125, 21.4482421875, 23.126953125, 24.8056640625, 26.484375, 28.1630859375, 29.841796875, 31.5205078125, 33.19921875, 34.8779296875, 36.556640625, 38.2353515625, 39.9140625, 41.5927734375, 43.271484375, 44.9501953125, 46.62890625, 48.3076171875, 49.986328125, 51.6650390625, 53.34375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 3.0, 8.0, 8.0, 12.0, 12.0, 15.0, 21.0, 34.0, 47.0, 62.0, 77.0, 130.0, 150.0, 112.0, 88.0, 52.0, 37.0, 32.0, 20.0, 15.0, 7.0, 8.0, 9.0, 11.0, 2.0, 2.0, 5.0, 3.0, 2.0, 0.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00540924072265625, -0.005235493183135986, -0.005061745643615723, -0.004887998104095459, -0.004714250564575195, -0.004540503025054932, -0.004366755485534668, -0.004193007946014404, -0.004019260406494141, -0.003845512866973877, -0.0036717653274536133, -0.0034980177879333496, -0.003324270248413086, -0.0031505227088928223, -0.0029767751693725586, -0.002803027629852295, -0.0026292800903320312, -0.0024555325508117676, -0.002281785011291504, -0.0021080374717712402, -0.0019342899322509766, -0.0017605423927307129, -0.0015867948532104492, -0.0014130473136901855, -0.0012392997741699219, -0.0010655522346496582, -0.0008918046951293945, -0.0007180571556091309, -0.0005443096160888672, -0.0003705620765686035, -0.00019681453704833984, -2.3066997528076172e-05, 0.0001506805419921875, 0.00032442808151245117, 0.0004981756210327148, 0.0006719231605529785, 0.0008456707000732422, 0.0010194182395935059, 0.0011931657791137695, 0.0013669133186340332, 0.0015406608581542969, 0.0017144083976745605, 0.0018881559371948242, 0.002061903476715088, 0.0022356510162353516, 0.0024093985557556152, 0.002583146095275879, 0.0027568936347961426, 0.0029306411743164062, 0.00310438871383667, 0.0032781362533569336, 0.0034518837928771973, 0.003625631332397461, 0.0037993788719177246, 0.003973126411437988, 0.004146873950958252, 0.004320621490478516, 0.004494369029998779, 0.004668116569519043, 0.004841864109039307, 0.00501561164855957, 0.005189359188079834, 0.005363106727600098, 0.005536854267120361, 0.005710601806640625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 4.0, 4.0, 6.0, 16.0, 15.0, 12.0, 31.0, 37.0, 43.0, 86.0, 141.0, 200.0, 316.0, 599.0, 1018.0, 2042.0, 4704.0, 13635.0, 64195.0, 599403.0, 308019.0, 37062.0, 9476.0, 3601.0, 1701.0, 861.0, 486.0, 278.0, 188.0, 107.0, 75.0, 49.0, 35.0, 23.0, 22.0, 11.0, 15.0, 9.0, 5.0, 0.0, 4.0, 7.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0], "bins": [-39.375, -38.276611328125, -37.17822265625, -36.079833984375, -34.9814453125, -33.883056640625, -32.78466796875, -31.686279296875, -30.587890625, -29.489501953125, -28.39111328125, -27.292724609375, -26.1943359375, -25.095947265625, -23.99755859375, -22.899169921875, -21.80078125, -20.702392578125, -19.60400390625, -18.505615234375, -17.4072265625, -16.308837890625, -15.21044921875, -14.112060546875, -13.013671875, -11.915283203125, -10.81689453125, -9.718505859375, -8.6201171875, -7.521728515625, -6.42333984375, -5.324951171875, -4.2265625, -3.128173828125, -2.02978515625, -0.931396484375, 0.1669921875, 1.265380859375, 2.36376953125, 3.462158203125, 4.560546875, 5.658935546875, 6.75732421875, 7.855712890625, 8.9541015625, 10.052490234375, 11.15087890625, 12.249267578125, 13.34765625, 14.446044921875, 15.54443359375, 16.642822265625, 17.7412109375, 18.839599609375, 19.93798828125, 21.036376953125, 22.134765625, 23.233154296875, 24.33154296875, 25.429931640625, 26.5283203125, 27.626708984375, 28.72509765625, 29.823486328125, 30.921875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 3.0, 3.0, 5.0, 4.0, 11.0, 13.0, 16.0, 21.0, 17.0, 26.0, 31.0, 30.0, 42.0, 46.0, 60.0, 66.0, 87.0, 92.0, 68.0, 76.0, 74.0, 41.0, 34.0, 35.0, 23.0, 19.0, 17.0, 13.0, 13.0, 6.0, 4.0, 3.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-27.265625, -26.4482421875, -25.630859375, -24.8134765625, -23.99609375, -23.1787109375, -22.361328125, -21.5439453125, -20.7265625, -19.9091796875, -19.091796875, -18.2744140625, -17.45703125, -16.6396484375, -15.822265625, -15.0048828125, -14.1875, -13.3701171875, -12.552734375, -11.7353515625, -10.91796875, -10.1005859375, -9.283203125, -8.4658203125, -7.6484375, -6.8310546875, -6.013671875, -5.1962890625, -4.37890625, -3.5615234375, -2.744140625, -1.9267578125, -1.109375, -0.2919921875, 0.525390625, 1.3427734375, 2.16015625, 2.9775390625, 3.794921875, 4.6123046875, 5.4296875, 6.2470703125, 7.064453125, 7.8818359375, 8.69921875, 9.5166015625, 10.333984375, 11.1513671875, 11.96875, 12.7861328125, 13.603515625, 14.4208984375, 15.23828125, 16.0556640625, 16.873046875, 17.6904296875, 18.5078125, 19.3251953125, 20.142578125, 20.9599609375, 21.77734375, 22.5947265625, 23.412109375, 24.2294921875, 25.046875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 5.0, 5.0, 9.0, 44.0, 79.0, 162.0, 252.0, 235.0, 108.0, 55.0, 25.0, 17.0, 8.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1028.652587890625, -1001.4903564453125, -974.3280639648438, -947.1658325195312, -920.0035400390625, -892.84130859375, -865.6790771484375, -838.5167846679688, -811.3545532226562, -784.1923217773438, -757.030029296875, -729.8677978515625, -702.7055053710938, -675.5432739257812, -648.3809814453125, -621.21875, -594.0565185546875, -566.894287109375, -539.7319946289062, -512.5697631835938, -485.4075012207031, -458.2452392578125, -431.0829772949219, -403.92071533203125, -376.7584228515625, -349.5961608886719, -322.43389892578125, -295.27166748046875, -268.1094055175781, -240.9471435546875, -213.78488159179688, -186.6226348876953, -159.46038818359375, -132.29812622070312, -105.13587951660156, -77.97361755371094, -50.811363220214844, -23.64910888671875, 3.513153076171875, 30.675399780273438, 57.83766174316406, 84.99991607666016, 112.16217041015625, 139.32443237304688, 166.4866943359375, 193.64894104003906, 220.8112030029297, 247.97344970703125, 275.1357116699219, 302.2979736328125, 329.4602355957031, 356.62249755859375, 383.78472900390625, 410.9469909667969, 438.1092529296875, 465.271484375, 492.43377685546875, 519.5960083007812, 546.75830078125, 573.9205322265625, 601.0828247070312, 628.2450561523438, 655.4073486328125, 682.569580078125, 709.7318115234375]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 8.0, 10.0, 13.0, 12.0, 14.0, 16.0, 20.0, 28.0, 26.0, 35.0, 35.0, 35.0, 41.0, 43.0, 50.0, 56.0, 43.0, 61.0, 57.0, 47.0, 49.0, 41.0, 33.0, 40.0, 32.0, 32.0, 18.0, 22.0, 15.0, 14.0, 13.0, 8.0, 5.0, 9.0, 3.0, 5.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-392.20098876953125, -380.6000671386719, -368.9991455078125, -357.3982238769531, -345.79730224609375, -334.1963806152344, -322.595458984375, -310.9945068359375, -299.39361572265625, -287.7926940917969, -276.1917724609375, -264.5908508300781, -252.98992919921875, -241.38900756835938, -229.78807067871094, -218.18714904785156, -206.58621215820312, -194.98529052734375, -183.38436889648438, -171.783447265625, -160.18252563476562, -148.58160400390625, -136.9806671142578, -125.37974548339844, -113.77882385253906, -102.17790222167969, -90.57698059082031, -78.9760513305664, -67.37512969970703, -55.774208068847656, -44.17327880859375, -32.572357177734375, -20.971435546875, -9.370512008666992, 2.2304115295410156, 13.831336975097656, 25.43225860595703, 37.033180236816406, 48.63410949707031, 60.23503112792969, 71.83595275878906, 83.43687438964844, 95.03779602050781, 106.63872528076172, 118.2396469116211, 129.840576171875, 141.44149780273438, 153.04241943359375, 164.64334106445312, 176.2442626953125, 187.84518432617188, 199.44610595703125, 211.04702758789062, 222.64794921875, 234.24888610839844, 245.8498077392578, 257.45074462890625, 269.0516662597656, 280.652587890625, 292.2535095214844, 303.85443115234375, 315.4553527832031, 327.0562744140625, 338.6572265625, 350.25811767578125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 8.0, 8.0, 9.0, 28.0, 24.0, 40.0, 53.0, 95.0, 138.0, 235.0, 400.0, 735.0, 1438.0, 3131.0, 10071.0, 404677.0, 3755139.0, 11247.0, 3428.0, 1517.0, 769.0, 422.0, 237.0, 134.0, 83.0, 55.0, 37.0, 36.0, 27.0, 18.0, 14.0, 5.0, 3.0, 5.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.75, -101.013671875, -97.27734375, -93.541015625, -89.8046875, -86.068359375, -82.33203125, -78.595703125, -74.859375, -71.123046875, -67.38671875, -63.650390625, -59.9140625, -56.177734375, -52.44140625, -48.705078125, -44.96875, -41.232421875, -37.49609375, -33.759765625, -30.0234375, -26.287109375, -22.55078125, -18.814453125, -15.078125, -11.341796875, -7.60546875, -3.869140625, -0.1328125, 3.603515625, 7.33984375, 11.076171875, 14.8125, 18.548828125, 22.28515625, 26.021484375, 29.7578125, 33.494140625, 37.23046875, 40.966796875, 44.703125, 48.439453125, 52.17578125, 55.912109375, 59.6484375, 63.384765625, 67.12109375, 70.857421875, 74.59375, 78.330078125, 82.06640625, 85.802734375, 89.5390625, 93.275390625, 97.01171875, 100.748046875, 104.484375, 108.220703125, 111.95703125, 115.693359375, 119.4296875, 123.166015625, 126.90234375, 130.638671875, 134.375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 5.0, 2.0, 3.0, 5.0, 10.0, 7.0, 5.0, 14.0, 19.0, 16.0, 20.0, 15.0, 36.0, 35.0, 26.0, 35.0, 39.0, 55.0, 45.0, 37.0, 45.0, 59.0, 53.0, 40.0, 41.0, 53.0, 44.0, 33.0, 35.0, 27.0, 34.0, 19.0, 21.0, 18.0, 13.0, 11.0, 8.0, 4.0, 4.0, 3.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.953125, -13.384033203125, -12.81494140625, -12.245849609375, -11.6767578125, -11.107666015625, -10.53857421875, -9.969482421875, -9.400390625, -8.831298828125, -8.26220703125, -7.693115234375, -7.1240234375, -6.554931640625, -5.98583984375, -5.416748046875, -4.84765625, -4.278564453125, -3.70947265625, -3.140380859375, -2.5712890625, -2.002197265625, -1.43310546875, -0.864013671875, -0.294921875, 0.274169921875, 0.84326171875, 1.412353515625, 1.9814453125, 2.550537109375, 3.11962890625, 3.688720703125, 4.2578125, 4.826904296875, 5.39599609375, 5.965087890625, 6.5341796875, 7.103271484375, 7.67236328125, 8.241455078125, 8.810546875, 9.379638671875, 9.94873046875, 10.517822265625, 11.0869140625, 11.656005859375, 12.22509765625, 12.794189453125, 13.36328125, 13.932373046875, 14.50146484375, 15.070556640625, 15.6396484375, 16.208740234375, 16.77783203125, 17.346923828125, 17.916015625, 18.485107421875, 19.05419921875, 19.623291015625, 20.1923828125, 20.761474609375, 21.33056640625, 21.899658203125, 22.46875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 12.0, 15.0, 10.0, 19.0, 22.0, 33.0, 39.0, 53.0, 54.0, 85.0, 108.0, 171.0, 205.0, 249.0, 350.0, 442.0, 707.0, 1100.0, 1535.0, 2637.0, 4871.0, 10154.0, 29770.0, 676855.0, 3407534.0, 33167.0, 10896.0, 5005.0, 2835.0, 1693.0, 1015.0, 680.0, 514.0, 348.0, 293.0, 220.0, 159.0, 100.0, 68.0, 54.0, 59.0, 45.0, 31.0, 25.0, 17.0, 10.0, 13.0, 8.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-48.375, -46.81640625, -45.2578125, -43.69921875, -42.140625, -40.58203125, -39.0234375, -37.46484375, -35.90625, -34.34765625, -32.7890625, -31.23046875, -29.671875, -28.11328125, -26.5546875, -24.99609375, -23.4375, -21.87890625, -20.3203125, -18.76171875, -17.203125, -15.64453125, -14.0859375, -12.52734375, -10.96875, -9.41015625, -7.8515625, -6.29296875, -4.734375, -3.17578125, -1.6171875, -0.05859375, 1.5, 3.05859375, 4.6171875, 6.17578125, 7.734375, 9.29296875, 10.8515625, 12.41015625, 13.96875, 15.52734375, 17.0859375, 18.64453125, 20.203125, 21.76171875, 23.3203125, 24.87890625, 26.4375, 27.99609375, 29.5546875, 31.11328125, 32.671875, 34.23046875, 35.7890625, 37.34765625, 38.90625, 40.46484375, 42.0234375, 43.58203125, 45.140625, 46.69921875, 48.2578125, 49.81640625, 51.375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 6.0, 1.0, 6.0, 5.0, 5.0, 11.0, 15.0, 21.0, 48.0, 119.0, 3215.0, 444.0, 84.0, 29.0, 23.0, 9.0, 12.0, 2.0, 6.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-35.84375, -34.919677734375, -33.99560546875, -33.071533203125, -32.1474609375, -31.223388671875, -30.29931640625, -29.375244140625, -28.451171875, -27.527099609375, -26.60302734375, -25.678955078125, -24.7548828125, -23.830810546875, -22.90673828125, -21.982666015625, -21.05859375, -20.134521484375, -19.21044921875, -18.286376953125, -17.3623046875, -16.438232421875, -15.51416015625, -14.590087890625, -13.666015625, -12.741943359375, -11.81787109375, -10.893798828125, -9.9697265625, -9.045654296875, -8.12158203125, -7.197509765625, -6.2734375, -5.349365234375, -4.42529296875, -3.501220703125, -2.5771484375, -1.653076171875, -0.72900390625, 0.195068359375, 1.119140625, 2.043212890625, 2.96728515625, 3.891357421875, 4.8154296875, 5.739501953125, 6.66357421875, 7.587646484375, 8.51171875, 9.435791015625, 10.35986328125, 11.283935546875, 12.2080078125, 13.132080078125, 14.05615234375, 14.980224609375, 15.904296875, 16.828369140625, 17.75244140625, 18.676513671875, 19.6005859375, 20.524658203125, 21.44873046875, 22.372802734375, 23.296875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 13.0, 13.0, 16.0, 31.0, 74.0, 84.0, 147.0, 157.0, 177.0, 137.0, 66.0, 43.0, 22.0, 7.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-197.0768280029297, -192.12539672851562, -187.17396545410156, -182.22251892089844, -177.27108764648438, -172.3196563720703, -167.36822509765625, -162.4167938232422, -157.46536254882812, -152.51393127441406, -147.5625, -142.61105346679688, -137.6596221923828, -132.70819091796875, -127.75675964355469, -122.80532836914062, -117.8538818359375, -112.90245056152344, -107.95101165771484, -102.99958038330078, -98.04814147949219, -93.09671020507812, -88.14527893066406, -83.19384765625, -78.2424087524414, -73.29097747802734, -68.33953857421875, -63.38810729980469, -58.43667221069336, -53.48523712158203, -48.53380584716797, -43.58237075805664, -38.63092041015625, -33.67948532104492, -28.728052139282227, -23.77661895751953, -18.825183868408203, -13.873748779296875, -8.92231559753418, -3.9708824157714844, 0.9805526733398438, 5.9319868087768555, 10.883420944213867, 15.834855079650879, 20.78628921508789, 25.73772430419922, 30.689157485961914, 35.64059066772461, 40.59202575683594, 45.543460845947266, 50.494895935058594, 55.446327209472656, 60.397762298583984, 65.34919738769531, 70.30062866210938, 75.25205993652344, 80.20349884033203, 85.1549301147461, 90.10636901855469, 95.05780029296875, 100.00923156738281, 104.9606704711914, 109.91210174560547, 114.86354064941406, 119.81497192382812]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 6.0, 11.0, 10.0, 9.0, 14.0, 14.0, 17.0, 33.0, 30.0, 28.0, 34.0, 31.0, 52.0, 57.0, 52.0, 65.0, 56.0, 56.0, 73.0, 60.0, 43.0, 39.0, 43.0, 31.0, 27.0, 29.0, 13.0, 23.0, 13.0, 10.0, 6.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.22349548339844, -70.8622055053711, -68.50091552734375, -66.13963317871094, -63.778343200683594, -61.41705322265625, -59.05576705932617, -56.694480895996094, -54.33319091796875, -51.971900939941406, -49.61061477661133, -47.24932861328125, -44.888038635253906, -42.52674865722656, -40.165462493896484, -37.804176330566406, -35.44288635253906, -33.08159637451172, -30.72031021118164, -28.35902214050293, -25.99773406982422, -23.636445999145508, -21.275157928466797, -18.913869857788086, -16.552581787109375, -14.191293716430664, -11.830005645751953, -9.468717575073242, -7.107429504394531, -4.74614143371582, -2.3848533630371094, -0.023565292358398438, 2.3377151489257812, 4.699003219604492, 7.060291290283203, 9.421579360961914, 11.782867431640625, 14.144155502319336, 16.505443572998047, 18.866731643676758, 21.22801971435547, 23.58930778503418, 25.95059585571289, 28.3118839263916, 30.673171997070312, 33.034461975097656, 35.395748138427734, 37.75703430175781, 40.118324279785156, 42.4796142578125, 44.84090042114258, 47.202186584472656, 49.5634765625, 51.924766540527344, 54.28605270385742, 56.6473388671875, 59.008628845214844, 61.36991882324219, 63.731204986572266, 66.09249114990234, 68.45378112792969, 70.81507110595703, 73.17636108398438, 75.53764343261719, 77.89893341064453]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 1.0, 13.0, 14.0, 12.0, 25.0, 35.0, 39.0, 66.0, 103.0, 146.0, 244.0, 409.0, 734.0, 1492.0, 2884.0, 6509.0, 16192.0, 44116.0, 140465.0, 412158.0, 286171.0, 87257.0, 28874.0, 11107.0, 4807.0, 2132.0, 1091.0, 545.0, 335.0, 188.0, 122.0, 84.0, 47.0, 39.0, 33.0, 23.0, 9.0, 9.0, 13.0, 4.0, 3.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.375, -45.72998046875, -44.0849609375, -42.43994140625, -40.794921875, -39.14990234375, -37.5048828125, -35.85986328125, -34.21484375, -32.56982421875, -30.9248046875, -29.27978515625, -27.634765625, -25.98974609375, -24.3447265625, -22.69970703125, -21.0546875, -19.40966796875, -17.7646484375, -16.11962890625, -14.474609375, -12.82958984375, -11.1845703125, -9.53955078125, -7.89453125, -6.24951171875, -4.6044921875, -2.95947265625, -1.314453125, 0.33056640625, 1.9755859375, 3.62060546875, 5.265625, 6.91064453125, 8.5556640625, 10.20068359375, 11.845703125, 13.49072265625, 15.1357421875, 16.78076171875, 18.42578125, 20.07080078125, 21.7158203125, 23.36083984375, 25.005859375, 26.65087890625, 28.2958984375, 29.94091796875, 31.5859375, 33.23095703125, 34.8759765625, 36.52099609375, 38.166015625, 39.81103515625, 41.4560546875, 43.10107421875, 44.74609375, 46.39111328125, 48.0361328125, 49.68115234375, 51.326171875, 52.97119140625, 54.6162109375, 56.26123046875, 57.90625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 10.0, 9.0, 9.0, 6.0, 15.0, 23.0, 17.0, 21.0, 22.0, 33.0, 42.0, 42.0, 49.0, 44.0, 40.0, 47.0, 61.0, 66.0, 53.0, 46.0, 50.0, 37.0, 44.0, 35.0, 38.0, 27.0, 28.0, 10.0, 14.0, 14.0, 11.0, 3.0, 8.0, 7.0, 4.0, 2.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.265625, -16.628173828125, -15.99072265625, -15.353271484375, -14.7158203125, -14.078369140625, -13.44091796875, -12.803466796875, -12.166015625, -11.528564453125, -10.89111328125, -10.253662109375, -9.6162109375, -8.978759765625, -8.34130859375, -7.703857421875, -7.06640625, -6.428955078125, -5.79150390625, -5.154052734375, -4.5166015625, -3.879150390625, -3.24169921875, -2.604248046875, -1.966796875, -1.329345703125, -0.69189453125, -0.054443359375, 0.5830078125, 1.220458984375, 1.85791015625, 2.495361328125, 3.1328125, 3.770263671875, 4.40771484375, 5.045166015625, 5.6826171875, 6.320068359375, 6.95751953125, 7.594970703125, 8.232421875, 8.869873046875, 9.50732421875, 10.144775390625, 10.7822265625, 11.419677734375, 12.05712890625, 12.694580078125, 13.33203125, 13.969482421875, 14.60693359375, 15.244384765625, 15.8818359375, 16.519287109375, 17.15673828125, 17.794189453125, 18.431640625, 19.069091796875, 19.70654296875, 20.343994140625, 20.9814453125, 21.618896484375, 22.25634765625, 22.893798828125, 23.53125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 6.0, 10.0, 9.0, 11.0, 13.0, 21.0, 23.0, 34.0, 46.0, 60.0, 78.0, 113.0, 180.0, 348.0, 566.0, 1156.0, 2808.0, 10796.0, 84436.0, 767247.0, 157651.0, 16315.0, 3615.0, 1295.0, 646.0, 387.0, 206.0, 137.0, 91.0, 70.0, 38.0, 30.0, 24.0, 21.0, 20.0, 12.0, 9.0, 4.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-96.3125, -93.060546875, -89.80859375, -86.556640625, -83.3046875, -80.052734375, -76.80078125, -73.548828125, -70.296875, -67.044921875, -63.79296875, -60.541015625, -57.2890625, -54.037109375, -50.78515625, -47.533203125, -44.28125, -41.029296875, -37.77734375, -34.525390625, -31.2734375, -28.021484375, -24.76953125, -21.517578125, -18.265625, -15.013671875, -11.76171875, -8.509765625, -5.2578125, -2.005859375, 1.24609375, 4.498046875, 7.75, 11.001953125, 14.25390625, 17.505859375, 20.7578125, 24.009765625, 27.26171875, 30.513671875, 33.765625, 37.017578125, 40.26953125, 43.521484375, 46.7734375, 50.025390625, 53.27734375, 56.529296875, 59.78125, 63.033203125, 66.28515625, 69.537109375, 72.7890625, 76.041015625, 79.29296875, 82.544921875, 85.796875, 89.048828125, 92.30078125, 95.552734375, 98.8046875, 102.056640625, 105.30859375, 108.560546875, 111.8125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 0.0, 7.0, 6.0, 9.0, 11.0, 9.0, 17.0, 15.0, 17.0, 25.0, 36.0, 32.0, 43.0, 34.0, 41.0, 38.0, 39.0, 70.0, 53.0, 59.0, 40.0, 50.0, 43.0, 40.0, 38.0, 35.0, 36.0, 25.0, 24.0, 23.0, 21.0, 11.0, 14.0, 5.0, 7.0, 7.0, 7.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-92.0, -89.2578125, -86.515625, -83.7734375, -81.03125, -78.2890625, -75.546875, -72.8046875, -70.0625, -67.3203125, -64.578125, -61.8359375, -59.09375, -56.3515625, -53.609375, -50.8671875, -48.125, -45.3828125, -42.640625, -39.8984375, -37.15625, -34.4140625, -31.671875, -28.9296875, -26.1875, -23.4453125, -20.703125, -17.9609375, -15.21875, -12.4765625, -9.734375, -6.9921875, -4.25, -1.5078125, 1.234375, 3.9765625, 6.71875, 9.4609375, 12.203125, 14.9453125, 17.6875, 20.4296875, 23.171875, 25.9140625, 28.65625, 31.3984375, 34.140625, 36.8828125, 39.625, 42.3671875, 45.109375, 47.8515625, 50.59375, 53.3359375, 56.078125, 58.8203125, 61.5625, 64.3046875, 67.046875, 69.7890625, 72.53125, 75.2734375, 78.015625, 80.7578125, 83.5]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 4.0, 7.0, 6.0, 12.0, 13.0, 18.0, 30.0, 41.0, 52.0, 91.0, 127.0, 172.0, 280.0, 504.0, 892.0, 1675.0, 4200.0, 12479.0, 51945.0, 309923.0, 544539.0, 91373.0, 19506.0, 5802.0, 2263.0, 1018.0, 560.0, 339.0, 194.0, 142.0, 103.0, 55.0, 56.0, 32.0, 26.0, 22.0, 13.0, 8.0, 8.0, 6.0, 6.0, 6.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.53125, -21.871826171875, -21.21240234375, -20.552978515625, -19.8935546875, -19.234130859375, -18.57470703125, -17.915283203125, -17.255859375, -16.596435546875, -15.93701171875, -15.277587890625, -14.6181640625, -13.958740234375, -13.29931640625, -12.639892578125, -11.98046875, -11.321044921875, -10.66162109375, -10.002197265625, -9.3427734375, -8.683349609375, -8.02392578125, -7.364501953125, -6.705078125, -6.045654296875, -5.38623046875, -4.726806640625, -4.0673828125, -3.407958984375, -2.74853515625, -2.089111328125, -1.4296875, -0.770263671875, -0.11083984375, 0.548583984375, 1.2080078125, 1.867431640625, 2.52685546875, 3.186279296875, 3.845703125, 4.505126953125, 5.16455078125, 5.823974609375, 6.4833984375, 7.142822265625, 7.80224609375, 8.461669921875, 9.12109375, 9.780517578125, 10.43994140625, 11.099365234375, 11.7587890625, 12.418212890625, 13.07763671875, 13.737060546875, 14.396484375, 15.055908203125, 15.71533203125, 16.374755859375, 17.0341796875, 17.693603515625, 18.35302734375, 19.012451171875, 19.671875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 3.0, 5.0, 8.0, 6.0, 9.0, 12.0, 12.0, 11.0, 23.0, 19.0, 20.0, 32.0, 29.0, 37.0, 61.0, 68.0, 80.0, 100.0, 83.0, 79.0, 55.0, 32.0, 31.0, 35.0, 17.0, 27.0, 17.0, 18.0, 14.0, 12.0, 11.0, 5.0, 9.0, 4.0, 2.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.003383636474609375, -0.0032833218574523926, -0.00318300724029541, -0.0030826926231384277, -0.0029823780059814453, -0.002882063388824463, -0.0027817487716674805, -0.002681434154510498, -0.0025811195373535156, -0.002480804920196533, -0.0023804903030395508, -0.0022801756858825684, -0.002179861068725586, -0.0020795464515686035, -0.001979231834411621, -0.0018789172172546387, -0.0017786026000976562, -0.0016782879829406738, -0.0015779733657836914, -0.001477658748626709, -0.0013773441314697266, -0.0012770295143127441, -0.0011767148971557617, -0.0010764002799987793, -0.0009760856628417969, -0.0008757710456848145, -0.000775456428527832, -0.0006751418113708496, -0.0005748271942138672, -0.00047451257705688477, -0.00037419795989990234, -0.0002738833427429199, -0.0001735687255859375, -7.325410842895508e-05, 2.7060508728027344e-05, 0.00012737512588500977, 0.0002276897430419922, 0.0003280043601989746, 0.00042831897735595703, 0.0005286335945129395, 0.0006289482116699219, 0.0007292628288269043, 0.0008295774459838867, 0.0009298920631408691, 0.0010302066802978516, 0.001130521297454834, 0.0012308359146118164, 0.0013311505317687988, 0.0014314651489257812, 0.0015317797660827637, 0.001632094383239746, 0.0017324090003967285, 0.001832723617553711, 0.0019330382347106934, 0.0020333528518676758, 0.002133667469024658, 0.0022339820861816406, 0.002334296703338623, 0.0024346113204956055, 0.002534925937652588, 0.0026352405548095703, 0.0027355551719665527, 0.002835869789123535, 0.0029361844062805176, 0.0030364990234375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 6.0, 22.0, 29.0, 43.0, 104.0, 159.0, 345.0, 817.0, 2680.0, 17654.0, 426778.0, 573118.0, 22032.0, 3114.0, 895.0, 358.0, 178.0, 97.0, 51.0, 24.0, 18.0, 12.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.75, -40.3603515625, -38.970703125, -37.5810546875, -36.19140625, -34.8017578125, -33.412109375, -32.0224609375, -30.6328125, -29.2431640625, -27.853515625, -26.4638671875, -25.07421875, -23.6845703125, -22.294921875, -20.9052734375, -19.515625, -18.1259765625, -16.736328125, -15.3466796875, -13.95703125, -12.5673828125, -11.177734375, -9.7880859375, -8.3984375, -7.0087890625, -5.619140625, -4.2294921875, -2.83984375, -1.4501953125, -0.060546875, 1.3291015625, 2.71875, 4.1083984375, 5.498046875, 6.8876953125, 8.27734375, 9.6669921875, 11.056640625, 12.4462890625, 13.8359375, 15.2255859375, 16.615234375, 18.0048828125, 19.39453125, 20.7841796875, 22.173828125, 23.5634765625, 24.953125, 26.3427734375, 27.732421875, 29.1220703125, 30.51171875, 31.9013671875, 33.291015625, 34.6806640625, 36.0703125, 37.4599609375, 38.849609375, 40.2392578125, 41.62890625, 43.0185546875, 44.408203125, 45.7978515625, 47.1875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 7.0, 1.0, 4.0, 7.0, 11.0, 14.0, 22.0, 22.0, 33.0, 43.0, 53.0, 69.0, 103.0, 103.0, 91.0, 90.0, 78.0, 73.0, 57.0, 34.0, 24.0, 17.0, 16.0, 10.0, 7.0, 5.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.0, -21.16552734375, -20.3310546875, -19.49658203125, -18.662109375, -17.82763671875, -16.9931640625, -16.15869140625, -15.32421875, -14.48974609375, -13.6552734375, -12.82080078125, -11.986328125, -11.15185546875, -10.3173828125, -9.48291015625, -8.6484375, -7.81396484375, -6.9794921875, -6.14501953125, -5.310546875, -4.47607421875, -3.6416015625, -2.80712890625, -1.97265625, -1.13818359375, -0.3037109375, 0.53076171875, 1.365234375, 2.19970703125, 3.0341796875, 3.86865234375, 4.703125, 5.53759765625, 6.3720703125, 7.20654296875, 8.041015625, 8.87548828125, 9.7099609375, 10.54443359375, 11.37890625, 12.21337890625, 13.0478515625, 13.88232421875, 14.716796875, 15.55126953125, 16.3857421875, 17.22021484375, 18.0546875, 18.88916015625, 19.7236328125, 20.55810546875, 21.392578125, 22.22705078125, 23.0615234375, 23.89599609375, 24.73046875, 25.56494140625, 26.3994140625, 27.23388671875, 28.068359375, 28.90283203125, 29.7373046875, 30.57177734375, 31.40625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 15.0, 22.0, 34.0, 53.0, 99.0, 141.0, 179.0, 160.0, 114.0, 92.0, 39.0, 17.0, 14.0, 7.0, 6.0, 2.0, 3.0, 0.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-758.835205078125, -739.2603759765625, -719.6854858398438, -700.1106567382812, -680.5357666015625, -660.9609375, -641.3861083984375, -621.8112182617188, -602.2363891601562, -582.6615600585938, -563.086669921875, -543.5118408203125, -523.9369506835938, -504.36212158203125, -484.7872619628906, -465.21240234375, -445.6375427246094, -426.06268310546875, -406.4878234863281, -386.9129638671875, -367.338134765625, -347.7632751464844, -328.18841552734375, -308.61358642578125, -289.0386962890625, -269.4638366699219, -249.8889923095703, -230.3141326904297, -210.73928833007812, -191.1644287109375, -171.58956909179688, -152.0147247314453, -132.43991088867188, -112.86505889892578, -93.29020690917969, -73.71534729003906, -54.14049530029297, -34.565643310546875, -14.99078369140625, 4.5840606689453125, 24.158920288085938, 43.73377227783203, 63.30862808227539, 82.88348388671875, 102.45833587646484, 122.03318786621094, 141.60804748535156, 161.18289184570312, 180.75775146484375, 200.33261108398438, 219.90745544433594, 239.48231506347656, 259.0571594238281, 278.63201904296875, 298.2068786621094, 317.78173828125, 337.3565673828125, 356.9314270019531, 376.50628662109375, 396.08111572265625, 415.6559753417969, 435.2308349609375, 454.8056945800781, 474.38055419921875, 493.9554138183594]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 0.0, 5.0, 4.0, 6.0, 8.0, 6.0, 10.0, 9.0, 13.0, 10.0, 19.0, 15.0, 18.0, 21.0, 16.0, 26.0, 28.0, 31.0, 26.0, 50.0, 45.0, 46.0, 40.0, 65.0, 54.0, 43.0, 53.0, 42.0, 49.0, 24.0, 33.0, 27.0, 25.0, 23.0, 20.0, 17.0, 10.0, 9.0, 10.0, 14.0, 6.0, 6.0, 6.0, 3.0, 7.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-328.0400390625, -317.5859069824219, -307.1318054199219, -296.67767333984375, -286.2235412597656, -275.7694091796875, -265.3153076171875, -254.86117553710938, -244.40704345703125, -233.9529266357422, -223.49879455566406, -213.044677734375, -202.59054565429688, -192.1364288330078, -181.68231201171875, -171.22817993164062, -160.77406311035156, -150.3199462890625, -139.86581420898438, -129.4116973876953, -118.95756530761719, -108.50344848632812, -98.04932403564453, -87.59519958496094, -77.14107513427734, -66.68695068359375, -56.232826232910156, -45.77870559692383, -35.324581146240234, -24.87045669555664, -14.416336059570312, -3.9622116088867188, 6.491912841796875, 16.94603729248047, 27.40015983581543, 37.85428237915039, 48.308406829833984, 58.76253128051758, 69.2166519165039, 79.6707763671875, 90.1249008178711, 100.57902526855469, 111.03314971923828, 121.48727416992188, 131.94139099121094, 142.39552307128906, 152.84963989257812, 163.30377197265625, 173.7578887939453, 184.21200561523438, 194.6661376953125, 205.12025451660156, 215.5743865966797, 226.02850341796875, 236.48263549804688, 246.93675231933594, 257.390869140625, 267.8450012207031, 278.2991027832031, 288.75323486328125, 299.2073669433594, 309.6614990234375, 320.1156005859375, 330.5697326660156, 341.02386474609375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 5.0, 10.0, 15.0, 21.0, 20.0, 43.0, 38.0, 75.0, 97.0, 146.0, 179.0, 295.0, 464.0, 753.0, 1167.0, 1869.0, 3290.0, 6170.0, 13593.0, 37917.0, 192961.0, 3336565.0, 500434.0, 61321.0, 18622.0, 7903.0, 3989.0, 2275.0, 1365.0, 881.0, 585.0, 399.0, 271.0, 179.0, 148.0, 52.0, 56.0, 32.0, 24.0, 14.0, 8.0, 7.0, 8.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-36.21875, -35.0380859375, -33.857421875, -32.6767578125, -31.49609375, -30.3154296875, -29.134765625, -27.9541015625, -26.7734375, -25.5927734375, -24.412109375, -23.2314453125, -22.05078125, -20.8701171875, -19.689453125, -18.5087890625, -17.328125, -16.1474609375, -14.966796875, -13.7861328125, -12.60546875, -11.4248046875, -10.244140625, -9.0634765625, -7.8828125, -6.7021484375, -5.521484375, -4.3408203125, -3.16015625, -1.9794921875, -0.798828125, 0.3818359375, 1.5625, 2.7431640625, 3.923828125, 5.1044921875, 6.28515625, 7.4658203125, 8.646484375, 9.8271484375, 11.0078125, 12.1884765625, 13.369140625, 14.5498046875, 15.73046875, 16.9111328125, 18.091796875, 19.2724609375, 20.453125, 21.6337890625, 22.814453125, 23.9951171875, 25.17578125, 26.3564453125, 27.537109375, 28.7177734375, 29.8984375, 31.0791015625, 32.259765625, 33.4404296875, 34.62109375, 35.8017578125, 36.982421875, 38.1630859375, 39.34375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 10.0, 8.0, 11.0, 8.0, 13.0, 12.0, 24.0, 33.0, 38.0, 57.0, 52.0, 53.0, 51.0, 75.0, 75.0, 76.0, 72.0, 51.0, 48.0, 45.0, 48.0, 41.0, 31.0, 19.0, 10.0, 7.0, 15.0, 4.0, 7.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.03125, -25.257568359375, -24.48388671875, -23.710205078125, -22.9365234375, -22.162841796875, -21.38916015625, -20.615478515625, -19.841796875, -19.068115234375, -18.29443359375, -17.520751953125, -16.7470703125, -15.973388671875, -15.19970703125, -14.426025390625, -13.65234375, -12.878662109375, -12.10498046875, -11.331298828125, -10.5576171875, -9.783935546875, -9.01025390625, -8.236572265625, -7.462890625, -6.689208984375, -5.91552734375, -5.141845703125, -4.3681640625, -3.594482421875, -2.82080078125, -2.047119140625, -1.2734375, -0.499755859375, 0.27392578125, 1.047607421875, 1.8212890625, 2.594970703125, 3.36865234375, 4.142333984375, 4.916015625, 5.689697265625, 6.46337890625, 7.237060546875, 8.0107421875, 8.784423828125, 9.55810546875, 10.331787109375, 11.10546875, 11.879150390625, 12.65283203125, 13.426513671875, 14.2001953125, 14.973876953125, 15.74755859375, 16.521240234375, 17.294921875, 18.068603515625, 18.84228515625, 19.615966796875, 20.3896484375, 21.163330078125, 21.93701171875, 22.710693359375, 23.484375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 8.0, 9.0, 10.0, 20.0, 15.0, 19.0, 42.0, 58.0, 120.0, 324.0, 850.0, 2909.0, 11460.0, 88355.0, 3960315.0, 111727.0, 13329.0, 3128.0, 946.0, 298.0, 150.0, 60.0, 24.0, 20.0, 13.0, 16.0, 10.0, 11.0, 10.0, 5.0, 1.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-102.125, -98.986328125, -95.84765625, -92.708984375, -89.5703125, -86.431640625, -83.29296875, -80.154296875, -77.015625, -73.876953125, -70.73828125, -67.599609375, -64.4609375, -61.322265625, -58.18359375, -55.044921875, -51.90625, -48.767578125, -45.62890625, -42.490234375, -39.3515625, -36.212890625, -33.07421875, -29.935546875, -26.796875, -23.658203125, -20.51953125, -17.380859375, -14.2421875, -11.103515625, -7.96484375, -4.826171875, -1.6875, 1.451171875, 4.58984375, 7.728515625, 10.8671875, 14.005859375, 17.14453125, 20.283203125, 23.421875, 26.560546875, 29.69921875, 32.837890625, 35.9765625, 39.115234375, 42.25390625, 45.392578125, 48.53125, 51.669921875, 54.80859375, 57.947265625, 61.0859375, 64.224609375, 67.36328125, 70.501953125, 73.640625, 76.779296875, 79.91796875, 83.056640625, 86.1953125, 89.333984375, 92.47265625, 95.611328125, 98.75]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 7.0, 10.0, 9.0, 12.0, 20.0, 29.0, 29.0, 66.0, 104.0, 251.0, 695.0, 1578.0, 661.0, 251.0, 117.0, 70.0, 36.0, 26.0, 18.0, 12.0, 9.0, 10.0, 11.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.53125, -55.7626953125, -53.994140625, -52.2255859375, -50.45703125, -48.6884765625, -46.919921875, -45.1513671875, -43.3828125, -41.6142578125, -39.845703125, -38.0771484375, -36.30859375, -34.5400390625, -32.771484375, -31.0029296875, -29.234375, -27.4658203125, -25.697265625, -23.9287109375, -22.16015625, -20.3916015625, -18.623046875, -16.8544921875, -15.0859375, -13.3173828125, -11.548828125, -9.7802734375, -8.01171875, -6.2431640625, -4.474609375, -2.7060546875, -0.9375, 0.8310546875, 2.599609375, 4.3681640625, 6.13671875, 7.9052734375, 9.673828125, 11.4423828125, 13.2109375, 14.9794921875, 16.748046875, 18.5166015625, 20.28515625, 22.0537109375, 23.822265625, 25.5908203125, 27.359375, 29.1279296875, 30.896484375, 32.6650390625, 34.43359375, 36.2021484375, 37.970703125, 39.7392578125, 41.5078125, 43.2763671875, 45.044921875, 46.8134765625, 48.58203125, 50.3505859375, 52.119140625, 53.8876953125, 55.65625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 10.0, 14.0, 19.0, 39.0, 72.0, 114.0, 197.0, 206.0, 140.0, 95.0, 37.0, 24.0, 13.0, 11.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-268.1231689453125, -251.33702087402344, -234.55087280273438, -217.76473999023438, -200.9785919189453, -184.19244384765625, -167.40631103515625, -150.6201629638672, -133.83401489257812, -117.04786682128906, -100.26172637939453, -83.4755859375, -66.68943786621094, -49.903289794921875, -33.117149353027344, -16.331008911132812, 0.45513916015625, 17.241283416748047, 34.027427673339844, 50.81357192993164, 67.59971618652344, 84.3858642578125, 101.17200469970703, 117.95814514160156, 134.74429321289062, 151.5304412841797, 168.31658935546875, 185.10272216796875, 201.8888702392578, 218.67501831054688, 235.46115112304688, 252.24729919433594, 269.033447265625, 285.819580078125, 302.6057434082031, 319.3918762207031, 336.17803955078125, 352.96417236328125, 369.75030517578125, 386.53643798828125, 403.3226013183594, 420.1087341308594, 436.8948974609375, 453.6810302734375, 470.4671630859375, 487.2533264160156, 504.0394592285156, 520.8256225585938, 537.6117553710938, 554.3978881835938, 571.1840209960938, 587.97021484375, 604.75634765625, 621.54248046875, 638.32861328125, 655.11474609375, 671.90087890625, 688.68701171875, 705.47314453125, 722.2593383789062, 739.0454711914062, 755.8316040039062, 772.6177368164062, 789.4038696289062, 806.1900634765625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 8.0, 9.0, 14.0, 9.0, 14.0, 8.0, 24.0, 25.0, 35.0, 36.0, 35.0, 38.0, 26.0, 39.0, 49.0, 58.0, 60.0, 43.0, 48.0, 38.0, 43.0, 53.0, 47.0, 28.0, 39.0, 29.0, 29.0, 25.0, 15.0, 17.0, 10.0, 3.0, 10.0, 11.0, 5.0, 4.0, 4.0, 4.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-237.68701171875, -230.64279174804688, -223.59857177734375, -216.55435180664062, -209.5101318359375, -202.46591186523438, -195.42169189453125, -188.37745666503906, -181.33323669433594, -174.2890167236328, -167.2447967529297, -160.20057678222656, -153.15635681152344, -146.11212158203125, -139.06790161132812, -132.023681640625, -124.9794692993164, -117.93524932861328, -110.89102935791016, -103.8468017578125, -96.80258178710938, -89.75836181640625, -82.71414184570312, -75.669921875, -68.62570190429688, -61.58148193359375, -54.53725814819336, -47.493038177490234, -40.448814392089844, -33.40459442138672, -26.360374450683594, -19.316150665283203, -12.271926879882812, -5.227705478668213, 1.8165159225463867, 8.860736846923828, 15.904958724975586, 22.949180603027344, 29.99340057373047, 37.03762435913086, 44.081844329833984, 51.12606430053711, 58.1702880859375, 65.21450805664062, 72.25872802734375, 79.30294799804688, 86.34716796875, 93.39139556884766, 100.43561553955078, 107.4798355102539, 114.52405548095703, 121.56828308105469, 128.6125030517578, 135.65672302246094, 142.70094299316406, 149.7451629638672, 156.7893829345703, 163.83360290527344, 170.87782287597656, 177.9220428466797, 184.9662628173828, 192.010498046875, 199.05471801757812, 206.09893798828125, 213.14315795898438]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 12.0, 4.0, 11.0, 8.0, 19.0, 31.0, 34.0, 54.0, 67.0, 110.0, 166.0, 244.0, 387.0, 580.0, 897.0, 1447.0, 2365.0, 4162.0, 7398.0, 14021.0, 28157.0, 60400.0, 141655.0, 326164.0, 259613.0, 105477.0, 46617.0, 22084.0, 11334.0, 6079.0, 3437.0, 2048.0, 1200.0, 773.0, 483.0, 309.0, 229.0, 165.0, 100.0, 65.0, 51.0, 31.0, 25.0, 12.0, 8.0, 11.0, 3.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-33.09375, -32.05419921875, -31.0146484375, -29.97509765625, -28.935546875, -27.89599609375, -26.8564453125, -25.81689453125, -24.77734375, -23.73779296875, -22.6982421875, -21.65869140625, -20.619140625, -19.57958984375, -18.5400390625, -17.50048828125, -16.4609375, -15.42138671875, -14.3818359375, -13.34228515625, -12.302734375, -11.26318359375, -10.2236328125, -9.18408203125, -8.14453125, -7.10498046875, -6.0654296875, -5.02587890625, -3.986328125, -2.94677734375, -1.9072265625, -0.86767578125, 0.171875, 1.21142578125, 2.2509765625, 3.29052734375, 4.330078125, 5.36962890625, 6.4091796875, 7.44873046875, 8.48828125, 9.52783203125, 10.5673828125, 11.60693359375, 12.646484375, 13.68603515625, 14.7255859375, 15.76513671875, 16.8046875, 17.84423828125, 18.8837890625, 19.92333984375, 20.962890625, 22.00244140625, 23.0419921875, 24.08154296875, 25.12109375, 26.16064453125, 27.2001953125, 28.23974609375, 29.279296875, 30.31884765625, 31.3583984375, 32.39794921875, 33.4375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 5.0, 3.0, 7.0, 9.0, 13.0, 16.0, 9.0, 14.0, 21.0, 22.0, 37.0, 43.0, 42.0, 42.0, 52.0, 65.0, 39.0, 40.0, 51.0, 60.0, 60.0, 55.0, 33.0, 44.0, 32.0, 37.0, 22.0, 22.0, 23.0, 21.0, 15.0, 14.0, 7.0, 5.0, 7.0, 2.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-19.203125, -18.605712890625, -18.00830078125, -17.410888671875, -16.8134765625, -16.216064453125, -15.61865234375, -15.021240234375, -14.423828125, -13.826416015625, -13.22900390625, -12.631591796875, -12.0341796875, -11.436767578125, -10.83935546875, -10.241943359375, -9.64453125, -9.047119140625, -8.44970703125, -7.852294921875, -7.2548828125, -6.657470703125, -6.06005859375, -5.462646484375, -4.865234375, -4.267822265625, -3.67041015625, -3.072998046875, -2.4755859375, -1.878173828125, -1.28076171875, -0.683349609375, -0.0859375, 0.511474609375, 1.10888671875, 1.706298828125, 2.3037109375, 2.901123046875, 3.49853515625, 4.095947265625, 4.693359375, 5.290771484375, 5.88818359375, 6.485595703125, 7.0830078125, 7.680419921875, 8.27783203125, 8.875244140625, 9.47265625, 10.070068359375, 10.66748046875, 11.264892578125, 11.8623046875, 12.459716796875, 13.05712890625, 13.654541015625, 14.251953125, 14.849365234375, 15.44677734375, 16.044189453125, 16.6416015625, 17.239013671875, 17.83642578125, 18.433837890625, 19.03125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 5.0, 2.0, 7.0, 9.0, 16.0, 26.0, 38.0, 82.0, 141.0, 206.0, 442.0, 1114.0, 4283.0, 58160.0, 937079.0, 41362.0, 3597.0, 1020.0, 419.0, 224.0, 115.0, 84.0, 48.0, 25.0, 23.0, 10.0, 11.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-179.625, -174.55859375, -169.4921875, -164.42578125, -159.359375, -154.29296875, -149.2265625, -144.16015625, -139.09375, -134.02734375, -128.9609375, -123.89453125, -118.828125, -113.76171875, -108.6953125, -103.62890625, -98.5625, -93.49609375, -88.4296875, -83.36328125, -78.296875, -73.23046875, -68.1640625, -63.09765625, -58.03125, -52.96484375, -47.8984375, -42.83203125, -37.765625, -32.69921875, -27.6328125, -22.56640625, -17.5, -12.43359375, -7.3671875, -2.30078125, 2.765625, 7.83203125, 12.8984375, 17.96484375, 23.03125, 28.09765625, 33.1640625, 38.23046875, 43.296875, 48.36328125, 53.4296875, 58.49609375, 63.5625, 68.62890625, 73.6953125, 78.76171875, 83.828125, 88.89453125, 93.9609375, 99.02734375, 104.09375, 109.16015625, 114.2265625, 119.29296875, 124.359375, 129.42578125, 134.4921875, 139.55859375, 144.625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 2.0, 6.0, 2.0, 3.0, 6.0, 11.0, 14.0, 14.0, 19.0, 21.0, 23.0, 30.0, 40.0, 37.0, 48.0, 37.0, 40.0, 49.0, 54.0, 45.0, 37.0, 49.0, 45.0, 45.0, 42.0, 44.0, 30.0, 43.0, 30.0, 21.0, 28.0, 19.0, 17.0, 13.0, 12.0, 4.0, 6.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-74.125, -71.6484375, -69.171875, -66.6953125, -64.21875, -61.7421875, -59.265625, -56.7890625, -54.3125, -51.8359375, -49.359375, -46.8828125, -44.40625, -41.9296875, -39.453125, -36.9765625, -34.5, -32.0234375, -29.546875, -27.0703125, -24.59375, -22.1171875, -19.640625, -17.1640625, -14.6875, -12.2109375, -9.734375, -7.2578125, -4.78125, -2.3046875, 0.171875, 2.6484375, 5.125, 7.6015625, 10.078125, 12.5546875, 15.03125, 17.5078125, 19.984375, 22.4609375, 24.9375, 27.4140625, 29.890625, 32.3671875, 34.84375, 37.3203125, 39.796875, 42.2734375, 44.75, 47.2265625, 49.703125, 52.1796875, 54.65625, 57.1328125, 59.609375, 62.0859375, 64.5625, 67.0390625, 69.515625, 71.9921875, 74.46875, 76.9453125, 79.421875, 81.8984375, 84.375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 6.0, 7.0, 8.0, 16.0, 10.0, 20.0, 47.0, 72.0, 108.0, 164.0, 297.0, 640.0, 1582.0, 5774.0, 37795.0, 785437.0, 196503.0, 14829.0, 3101.0, 1084.0, 474.0, 210.0, 128.0, 82.0, 36.0, 32.0, 30.0, 6.0, 15.0, 9.0, 9.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0], "bins": [-50.0, -48.77392578125, -47.5478515625, -46.32177734375, -45.095703125, -43.86962890625, -42.6435546875, -41.41748046875, -40.19140625, -38.96533203125, -37.7392578125, -36.51318359375, -35.287109375, -34.06103515625, -32.8349609375, -31.60888671875, -30.3828125, -29.15673828125, -27.9306640625, -26.70458984375, -25.478515625, -24.25244140625, -23.0263671875, -21.80029296875, -20.57421875, -19.34814453125, -18.1220703125, -16.89599609375, -15.669921875, -14.44384765625, -13.2177734375, -11.99169921875, -10.765625, -9.53955078125, -8.3134765625, -7.08740234375, -5.861328125, -4.63525390625, -3.4091796875, -2.18310546875, -0.95703125, 0.26904296875, 1.4951171875, 2.72119140625, 3.947265625, 5.17333984375, 6.3994140625, 7.62548828125, 8.8515625, 10.07763671875, 11.3037109375, 12.52978515625, 13.755859375, 14.98193359375, 16.2080078125, 17.43408203125, 18.66015625, 19.88623046875, 21.1123046875, 22.33837890625, 23.564453125, 24.79052734375, 26.0166015625, 27.24267578125, 28.46875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 3.0, 4.0, 7.0, 5.0, 11.0, 12.0, 38.0, 40.0, 60.0, 109.0, 185.0, 212.0, 121.0, 69.0, 38.0, 23.0, 19.0, 19.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00937652587890625, -0.009130120277404785, -0.00888371467590332, -0.008637309074401855, -0.00839090347290039, -0.008144497871398926, -0.007898092269897461, -0.007651686668395996, -0.007405281066894531, -0.007158875465393066, -0.0069124698638916016, -0.006666064262390137, -0.006419658660888672, -0.006173253059387207, -0.005926847457885742, -0.005680441856384277, -0.0054340362548828125, -0.005187630653381348, -0.004941225051879883, -0.004694819450378418, -0.004448413848876953, -0.004202008247375488, -0.0039556026458740234, -0.0037091970443725586, -0.0034627914428710938, -0.003216385841369629, -0.002969980239868164, -0.0027235746383666992, -0.0024771690368652344, -0.0022307634353637695, -0.0019843578338623047, -0.0017379522323608398, -0.001491546630859375, -0.0012451410293579102, -0.0009987354278564453, -0.0007523298263549805, -0.0005059242248535156, -0.0002595186233520508, -1.3113021850585938e-05, 0.0002332925796508789, 0.00047969818115234375, 0.0007261037826538086, 0.0009725093841552734, 0.0012189149856567383, 0.0014653205871582031, 0.001711726188659668, 0.001958131790161133, 0.0022045373916625977, 0.0024509429931640625, 0.0026973485946655273, 0.002943754196166992, 0.003190159797668457, 0.003436565399169922, 0.0036829710006713867, 0.0039293766021728516, 0.004175782203674316, 0.004422187805175781, 0.004668593406677246, 0.004914999008178711, 0.005161404609680176, 0.005407810211181641, 0.0056542158126831055, 0.00590062141418457, 0.006147027015686035, 0.0063934326171875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 10.0, 7.0, 9.0, 8.0, 9.0, 14.0, 34.0, 46.0, 45.0, 99.0, 146.0, 209.0, 388.0, 646.0, 1402.0, 3415.0, 11236.0, 67401.0, 714217.0, 216060.0, 23340.0, 5550.0, 2067.0, 915.0, 502.0, 261.0, 157.0, 113.0, 78.0, 55.0, 31.0, 32.0, 15.0, 17.0, 8.0, 10.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.421875, -24.470947265625, -23.52001953125, -22.569091796875, -21.6181640625, -20.667236328125, -19.71630859375, -18.765380859375, -17.814453125, -16.863525390625, -15.91259765625, -14.961669921875, -14.0107421875, -13.059814453125, -12.10888671875, -11.157958984375, -10.20703125, -9.256103515625, -8.30517578125, -7.354248046875, -6.4033203125, -5.452392578125, -4.50146484375, -3.550537109375, -2.599609375, -1.648681640625, -0.69775390625, 0.253173828125, 1.2041015625, 2.155029296875, 3.10595703125, 4.056884765625, 5.0078125, 5.958740234375, 6.90966796875, 7.860595703125, 8.8115234375, 9.762451171875, 10.71337890625, 11.664306640625, 12.615234375, 13.566162109375, 14.51708984375, 15.468017578125, 16.4189453125, 17.369873046875, 18.32080078125, 19.271728515625, 20.22265625, 21.173583984375, 22.12451171875, 23.075439453125, 24.0263671875, 24.977294921875, 25.92822265625, 26.879150390625, 27.830078125, 28.781005859375, 29.73193359375, 30.682861328125, 31.6337890625, 32.584716796875, 33.53564453125, 34.486572265625, 35.4375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 7.0, 3.0, 13.0, 8.0, 17.0, 19.0, 29.0, 38.0, 32.0, 37.0, 55.0, 57.0, 82.0, 88.0, 69.0, 68.0, 67.0, 60.0, 38.0, 51.0, 34.0, 28.0, 21.0, 13.0, 13.0, 14.0, 8.0, 5.0, 8.0, 1.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-19.296875, -18.662109375, -18.02734375, -17.392578125, -16.7578125, -16.123046875, -15.48828125, -14.853515625, -14.21875, -13.583984375, -12.94921875, -12.314453125, -11.6796875, -11.044921875, -10.41015625, -9.775390625, -9.140625, -8.505859375, -7.87109375, -7.236328125, -6.6015625, -5.966796875, -5.33203125, -4.697265625, -4.0625, -3.427734375, -2.79296875, -2.158203125, -1.5234375, -0.888671875, -0.25390625, 0.380859375, 1.015625, 1.650390625, 2.28515625, 2.919921875, 3.5546875, 4.189453125, 4.82421875, 5.458984375, 6.09375, 6.728515625, 7.36328125, 7.998046875, 8.6328125, 9.267578125, 9.90234375, 10.537109375, 11.171875, 11.806640625, 12.44140625, 13.076171875, 13.7109375, 14.345703125, 14.98046875, 15.615234375, 16.25, 16.884765625, 17.51953125, 18.154296875, 18.7890625, 19.423828125, 20.05859375, 20.693359375, 21.328125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 3.0, 5.0, 5.0, 10.0, 6.0, 14.0, 19.0, 46.0, 63.0, 78.0, 114.0, 143.0, 168.0, 99.0, 78.0, 67.0, 34.0, 23.0, 13.0, 5.0, 6.0, 2.0, 2.0, 2.0, 3.0, 2.0], "bins": [-665.3333129882812, -652.0772705078125, -638.8211669921875, -625.5651245117188, -612.3090209960938, -599.052978515625, -585.796875, -572.5408325195312, -559.2847900390625, -546.0287475585938, -532.7726440429688, -519.5166015625, -506.260498046875, -493.00445556640625, -479.7483825683594, -466.4923095703125, -453.2362060546875, -439.9801330566406, -426.72406005859375, -413.4679870605469, -400.2119140625, -386.95587158203125, -373.6997985839844, -360.4437255859375, -347.1876525878906, -333.93157958984375, -320.6755065917969, -307.41943359375, -294.16339111328125, -280.90728759765625, -267.6512451171875, -254.39517211914062, -241.1390838623047, -227.8830108642578, -214.626953125, -201.37088012695312, -188.11480712890625, -174.85873413085938, -161.6026611328125, -148.3466033935547, -135.0905303955078, -121.83445739746094, -108.5783920288086, -95.32232666015625, -82.06625366210938, -68.8101806640625, -55.554115295410156, -42.29804992675781, -29.041976928710938, -15.785907745361328, -2.5298385620117188, 10.72623062133789, 23.9822998046875, 37.238372802734375, 50.49443817138672, 63.75050354003906, 77.00657653808594, 90.26264953613281, 103.51871490478516, 116.7747802734375, 130.03085327148438, 143.28692626953125, 156.54299926757812, 169.79905700683594, 183.0551300048828]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 0.0, 2.0, 6.0, 5.0, 8.0, 10.0, 12.0, 12.0, 27.0, 28.0, 29.0, 29.0, 43.0, 51.0, 65.0, 67.0, 91.0, 83.0, 67.0, 60.0, 62.0, 46.0, 47.0, 43.0, 29.0, 18.0, 15.0, 11.0, 14.0, 8.0, 8.0, 3.0, 3.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-373.707275390625, -360.5602111816406, -347.4131774902344, -334.26611328125, -321.11907958984375, -307.9720153808594, -294.824951171875, -281.67791748046875, -268.5308837890625, -255.3838348388672, -242.23678588867188, -229.0897216796875, -215.94268798828125, -202.79562377929688, -189.64857482910156, -176.50152587890625, -163.35446166992188, -150.20741271972656, -137.06036376953125, -123.9133071899414, -110.7662582397461, -97.61920928955078, -84.47215270996094, -71.32510375976562, -58.17805480957031, -45.031005859375, -31.883953094482422, -18.736900329589844, -5.589851379394531, 7.557197570800781, 20.704254150390625, 33.85130310058594, 46.998382568359375, 60.14543151855469, 73.29248046875, 86.43953704833984, 99.58658599853516, 112.73363494873047, 125.88069152832031, 139.02774047851562, 152.17478942871094, 165.32183837890625, 178.46888732910156, 191.61593627929688, 204.76300048828125, 217.9100341796875, 231.05709838867188, 244.2041473388672, 257.3511962890625, 270.4982604980469, 283.6452941894531, 296.7923583984375, 309.93939208984375, 323.0864562988281, 336.2335205078125, 349.38055419921875, 362.527587890625, 375.6746520996094, 388.8216857910156, 401.96875, 415.11578369140625, 428.2628479003906, 441.409912109375, 454.55694580078125, 467.7040100097656]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 7.0, 8.0, 7.0, 11.0, 14.0, 21.0, 44.0, 32.0, 67.0, 101.0, 163.0, 200.0, 381.0, 625.0, 1120.0, 2516.0, 5784.0, 18291.0, 136586.0, 3882624.0, 117913.0, 16971.0, 5705.0, 2402.0, 1130.0, 572.0, 341.0, 207.0, 145.0, 88.0, 57.0, 50.0, 24.0, 18.0, 18.0, 14.0, 8.0, 9.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-68.0, -65.90625, -63.8125, -61.71875, -59.625, -57.53125, -55.4375, -53.34375, -51.25, -49.15625, -47.0625, -44.96875, -42.875, -40.78125, -38.6875, -36.59375, -34.5, -32.40625, -30.3125, -28.21875, -26.125, -24.03125, -21.9375, -19.84375, -17.75, -15.65625, -13.5625, -11.46875, -9.375, -7.28125, -5.1875, -3.09375, -1.0, 1.09375, 3.1875, 5.28125, 7.375, 9.46875, 11.5625, 13.65625, 15.75, 17.84375, 19.9375, 22.03125, 24.125, 26.21875, 28.3125, 30.40625, 32.5, 34.59375, 36.6875, 38.78125, 40.875, 42.96875, 45.0625, 47.15625, 49.25, 51.34375, 53.4375, 55.53125, 57.625, 59.71875, 61.8125, 63.90625, 66.0]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 2.0, 5.0, 10.0, 6.0, 10.0, 27.0, 32.0, 54.0, 49.0, 64.0, 64.0, 89.0, 94.0, 81.0, 85.0, 73.0, 57.0, 65.0, 37.0, 37.0, 30.0, 15.0, 10.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8125, -14.88623046875, -13.9599609375, -13.03369140625, -12.107421875, -11.18115234375, -10.2548828125, -9.32861328125, -8.40234375, -7.47607421875, -6.5498046875, -5.62353515625, -4.697265625, -3.77099609375, -2.8447265625, -1.91845703125, -0.9921875, -0.06591796875, 0.8603515625, 1.78662109375, 2.712890625, 3.63916015625, 4.5654296875, 5.49169921875, 6.41796875, 7.34423828125, 8.2705078125, 9.19677734375, 10.123046875, 11.04931640625, 11.9755859375, 12.90185546875, 13.828125, 14.75439453125, 15.6806640625, 16.60693359375, 17.533203125, 18.45947265625, 19.3857421875, 20.31201171875, 21.23828125, 22.16455078125, 23.0908203125, 24.01708984375, 24.943359375, 25.86962890625, 26.7958984375, 27.72216796875, 28.6484375, 29.57470703125, 30.5009765625, 31.42724609375, 32.353515625, 33.27978515625, 34.2060546875, 35.13232421875, 36.05859375, 36.98486328125, 37.9111328125, 38.83740234375, 39.763671875, 40.68994140625, 41.6162109375, 42.54248046875, 43.46875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 9.0, 14.0, 20.0, 20.0, 51.0, 62.0, 125.0, 235.0, 435.0, 852.0, 1720.0, 3675.0, 9544.0, 32467.0, 288271.0, 3712364.0, 111431.0, 20281.0, 6892.0, 3013.0, 1380.0, 661.0, 315.0, 178.0, 97.0, 52.0, 27.0, 28.0, 13.0, 12.0, 8.0, 7.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-68.625, -66.68310546875, -64.7412109375, -62.79931640625, -60.857421875, -58.91552734375, -56.9736328125, -55.03173828125, -53.08984375, -51.14794921875, -49.2060546875, -47.26416015625, -45.322265625, -43.38037109375, -41.4384765625, -39.49658203125, -37.5546875, -35.61279296875, -33.6708984375, -31.72900390625, -29.787109375, -27.84521484375, -25.9033203125, -23.96142578125, -22.01953125, -20.07763671875, -18.1357421875, -16.19384765625, -14.251953125, -12.31005859375, -10.3681640625, -8.42626953125, -6.484375, -4.54248046875, -2.6005859375, -0.65869140625, 1.283203125, 3.22509765625, 5.1669921875, 7.10888671875, 9.05078125, 10.99267578125, 12.9345703125, 14.87646484375, 16.818359375, 18.76025390625, 20.7021484375, 22.64404296875, 24.5859375, 26.52783203125, 28.4697265625, 30.41162109375, 32.353515625, 34.29541015625, 36.2373046875, 38.17919921875, 40.12109375, 42.06298828125, 44.0048828125, 45.94677734375, 47.888671875, 49.83056640625, 51.7724609375, 53.71435546875, 55.65625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 5.0, 5.0, 11.0, 9.0, 15.0, 16.0, 25.0, 37.0, 44.0, 67.0, 152.0, 341.0, 950.0, 1273.0, 560.0, 228.0, 126.0, 44.0, 39.0, 31.0, 22.0, 11.0, 6.0, 14.0, 4.0, 9.0, 4.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-50.71875, -49.3193359375, -47.919921875, -46.5205078125, -45.12109375, -43.7216796875, -42.322265625, -40.9228515625, -39.5234375, -38.1240234375, -36.724609375, -35.3251953125, -33.92578125, -32.5263671875, -31.126953125, -29.7275390625, -28.328125, -26.9287109375, -25.529296875, -24.1298828125, -22.73046875, -21.3310546875, -19.931640625, -18.5322265625, -17.1328125, -15.7333984375, -14.333984375, -12.9345703125, -11.53515625, -10.1357421875, -8.736328125, -7.3369140625, -5.9375, -4.5380859375, -3.138671875, -1.7392578125, -0.33984375, 1.0595703125, 2.458984375, 3.8583984375, 5.2578125, 6.6572265625, 8.056640625, 9.4560546875, 10.85546875, 12.2548828125, 13.654296875, 15.0537109375, 16.453125, 17.8525390625, 19.251953125, 20.6513671875, 22.05078125, 23.4501953125, 24.849609375, 26.2490234375, 27.6484375, 29.0478515625, 30.447265625, 31.8466796875, 33.24609375, 34.6455078125, 36.044921875, 37.4443359375, 38.84375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 8.0, 13.0, 45.0, 107.0, 228.0, 282.0, 168.0, 75.0, 32.0, 16.0, 14.0, 6.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-711.7965087890625, -693.1132202148438, -674.429931640625, -655.7467041015625, -637.0634155273438, -618.380126953125, -599.6968994140625, -581.0136108398438, -562.330322265625, -543.6470336914062, -524.9637451171875, -506.280517578125, -487.59722900390625, -468.9139404296875, -450.2306823730469, -431.54742431640625, -412.8641357421875, -394.18084716796875, -375.4975891113281, -356.8143310546875, -338.13104248046875, -319.44775390625, -300.7644958496094, -282.08123779296875, -263.39794921875, -244.7146759033203, -226.03140258789062, -207.34812927246094, -188.66485595703125, -169.98158264160156, -151.29830932617188, -132.6150360107422, -113.93170166015625, -95.24842834472656, -76.56515502929688, -57.88188171386719, -39.1986083984375, -20.515335083007812, -1.832061767578125, 16.851211547851562, 35.53448486328125, 54.21775817871094, 72.90103149414062, 91.58430480957031, 110.267578125, 128.9508514404297, 147.63412475585938, 166.31739807128906, 185.00067138671875, 203.68394470214844, 222.36721801757812, 241.0504913330078, 259.7337646484375, 278.41705322265625, 297.1003112792969, 315.7835693359375, 334.46685791015625, 353.150146484375, 371.8334045410156, 390.51666259765625, 409.199951171875, 427.88323974609375, 446.5664978027344, 465.249755859375, 483.93304443359375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 7.0, 4.0, 3.0, 7.0, 11.0, 10.0, 11.0, 18.0, 11.0, 25.0, 23.0, 31.0, 36.0, 33.0, 36.0, 57.0, 56.0, 66.0, 49.0, 45.0, 51.0, 50.0, 53.0, 40.0, 43.0, 30.0, 26.0, 20.0, 20.0, 24.0, 28.0, 20.0, 14.0, 7.0, 11.0, 10.0, 4.0, 7.0, 2.0, 2.0, 1.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-187.21029663085938, -181.7702178955078, -176.3301544189453, -170.89007568359375, -165.45001220703125, -160.0099334716797, -154.56985473632812, -149.12979125976562, -143.68971252441406, -138.2496337890625, -132.8095703125, -127.36949157714844, -121.9294204711914, -116.48934936523438, -111.04927062988281, -105.60919952392578, -100.16912841796875, -94.72905731201172, -89.28898620605469, -83.84890747070312, -78.4088363647461, -72.96876525878906, -67.5286865234375, -62.08861541748047, -56.64854431152344, -51.208473205566406, -45.76839828491211, -40.32832336425781, -34.88825225830078, -29.448179244995117, -24.008106231689453, -18.568031311035156, -13.127975463867188, -7.687902450561523, -2.2478294372558594, 3.1922435760498047, 8.632316589355469, 14.072389602661133, 19.512462615966797, 24.952537536621094, 30.392608642578125, 35.832679748535156, 41.27275466918945, 46.71282958984375, 52.15290069580078, 57.59297180175781, 63.03304672241211, 68.4731216430664, 73.91319274902344, 79.35326385498047, 84.7933349609375, 90.23341369628906, 95.6734848022461, 101.11355590820312, 106.55363464355469, 111.99370574951172, 117.43377685546875, 122.87384796142578, 128.3139190673828, 133.75399780273438, 139.19406127929688, 144.63414001464844, 150.07421875, 155.5142822265625, 160.95436096191406]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 7.0, 10.0, 12.0, 13.0, 19.0, 26.0, 42.0, 54.0, 79.0, 110.0, 195.0, 302.0, 411.0, 675.0, 1124.0, 1892.0, 3228.0, 5680.0, 9985.0, 18599.0, 35902.0, 74062.0, 167679.0, 341219.0, 206963.0, 89044.0, 42232.0, 21708.0, 11586.0, 6475.0, 3608.0, 2118.0, 1278.0, 803.0, 519.0, 296.0, 196.0, 115.0, 91.0, 53.0, 44.0, 29.0, 16.0, 14.0, 19.0, 18.0, 2.0, 8.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-33.46875, -32.501953125, -31.53515625, -30.568359375, -29.6015625, -28.634765625, -27.66796875, -26.701171875, -25.734375, -24.767578125, -23.80078125, -22.833984375, -21.8671875, -20.900390625, -19.93359375, -18.966796875, -18.0, -17.033203125, -16.06640625, -15.099609375, -14.1328125, -13.166015625, -12.19921875, -11.232421875, -10.265625, -9.298828125, -8.33203125, -7.365234375, -6.3984375, -5.431640625, -4.46484375, -3.498046875, -2.53125, -1.564453125, -0.59765625, 0.369140625, 1.3359375, 2.302734375, 3.26953125, 4.236328125, 5.203125, 6.169921875, 7.13671875, 8.103515625, 9.0703125, 10.037109375, 11.00390625, 11.970703125, 12.9375, 13.904296875, 14.87109375, 15.837890625, 16.8046875, 17.771484375, 18.73828125, 19.705078125, 20.671875, 21.638671875, 22.60546875, 23.572265625, 24.5390625, 25.505859375, 26.47265625, 27.439453125, 28.40625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 4.0, 6.0, 6.0, 5.0, 8.0, 16.0, 19.0, 17.0, 39.0, 23.0, 32.0, 46.0, 36.0, 51.0, 63.0, 44.0, 46.0, 79.0, 60.0, 51.0, 48.0, 49.0, 47.0, 37.0, 31.0, 33.0, 29.0, 28.0, 15.0, 11.0, 7.0, 9.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.375, -15.7333984375, -15.091796875, -14.4501953125, -13.80859375, -13.1669921875, -12.525390625, -11.8837890625, -11.2421875, -10.6005859375, -9.958984375, -9.3173828125, -8.67578125, -8.0341796875, -7.392578125, -6.7509765625, -6.109375, -5.4677734375, -4.826171875, -4.1845703125, -3.54296875, -2.9013671875, -2.259765625, -1.6181640625, -0.9765625, -0.3349609375, 0.306640625, 0.9482421875, 1.58984375, 2.2314453125, 2.873046875, 3.5146484375, 4.15625, 4.7978515625, 5.439453125, 6.0810546875, 6.72265625, 7.3642578125, 8.005859375, 8.6474609375, 9.2890625, 9.9306640625, 10.572265625, 11.2138671875, 11.85546875, 12.4970703125, 13.138671875, 13.7802734375, 14.421875, 15.0634765625, 15.705078125, 16.3466796875, 16.98828125, 17.6298828125, 18.271484375, 18.9130859375, 19.5546875, 20.1962890625, 20.837890625, 21.4794921875, 22.12109375, 22.7626953125, 23.404296875, 24.0458984375, 24.6875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 6.0, 7.0, 8.0, 12.0, 11.0, 10.0, 19.0, 23.0, 40.0, 45.0, 67.0, 95.0, 129.0, 186.0, 303.0, 471.0, 888.0, 1954.0, 4995.0, 16671.0, 74117.0, 517653.0, 350284.0, 58502.0, 13934.0, 4362.0, 1676.0, 775.0, 426.0, 262.0, 166.0, 133.0, 83.0, 61.0, 51.0, 31.0, 17.0, 21.0, 10.0, 11.0, 6.0, 6.0, 5.0, 7.0, 6.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-62.78125, -60.9306640625, -59.080078125, -57.2294921875, -55.37890625, -53.5283203125, -51.677734375, -49.8271484375, -47.9765625, -46.1259765625, -44.275390625, -42.4248046875, -40.57421875, -38.7236328125, -36.873046875, -35.0224609375, -33.171875, -31.3212890625, -29.470703125, -27.6201171875, -25.76953125, -23.9189453125, -22.068359375, -20.2177734375, -18.3671875, -16.5166015625, -14.666015625, -12.8154296875, -10.96484375, -9.1142578125, -7.263671875, -5.4130859375, -3.5625, -1.7119140625, 0.138671875, 1.9892578125, 3.83984375, 5.6904296875, 7.541015625, 9.3916015625, 11.2421875, 13.0927734375, 14.943359375, 16.7939453125, 18.64453125, 20.4951171875, 22.345703125, 24.1962890625, 26.046875, 27.8974609375, 29.748046875, 31.5986328125, 33.44921875, 35.2998046875, 37.150390625, 39.0009765625, 40.8515625, 42.7021484375, 44.552734375, 46.4033203125, 48.25390625, 50.1044921875, 51.955078125, 53.8056640625, 55.65625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 6.0, 9.0, 10.0, 12.0, 16.0, 15.0, 23.0, 29.0, 28.0, 41.0, 33.0, 36.0, 48.0, 41.0, 48.0, 68.0, 44.0, 55.0, 54.0, 49.0, 53.0, 41.0, 38.0, 34.0, 30.0, 26.0, 20.0, 20.0, 21.0, 8.0, 8.0, 7.0, 4.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-64.8125, -62.599609375, -60.38671875, -58.173828125, -55.9609375, -53.748046875, -51.53515625, -49.322265625, -47.109375, -44.896484375, -42.68359375, -40.470703125, -38.2578125, -36.044921875, -33.83203125, -31.619140625, -29.40625, -27.193359375, -24.98046875, -22.767578125, -20.5546875, -18.341796875, -16.12890625, -13.916015625, -11.703125, -9.490234375, -7.27734375, -5.064453125, -2.8515625, -0.638671875, 1.57421875, 3.787109375, 6.0, 8.212890625, 10.42578125, 12.638671875, 14.8515625, 17.064453125, 19.27734375, 21.490234375, 23.703125, 25.916015625, 28.12890625, 30.341796875, 32.5546875, 34.767578125, 36.98046875, 39.193359375, 41.40625, 43.619140625, 45.83203125, 48.044921875, 50.2578125, 52.470703125, 54.68359375, 56.896484375, 59.109375, 61.322265625, 63.53515625, 65.748046875, 67.9609375, 70.173828125, 72.38671875, 74.599609375, 76.8125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 1.0, 6.0, 12.0, 5.0, 17.0, 17.0, 15.0, 23.0, 50.0, 57.0, 105.0, 148.0, 275.0, 593.0, 1232.0, 3314.0, 10552.0, 52716.0, 650444.0, 285910.0, 31197.0, 7405.0, 2389.0, 951.0, 471.0, 227.0, 141.0, 88.0, 58.0, 30.0, 25.0, 27.0, 12.0, 11.0, 9.0, 2.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.90625, -31.934326171875, -30.96240234375, -29.990478515625, -29.0185546875, -28.046630859375, -27.07470703125, -26.102783203125, -25.130859375, -24.158935546875, -23.18701171875, -22.215087890625, -21.2431640625, -20.271240234375, -19.29931640625, -18.327392578125, -17.35546875, -16.383544921875, -15.41162109375, -14.439697265625, -13.4677734375, -12.495849609375, -11.52392578125, -10.552001953125, -9.580078125, -8.608154296875, -7.63623046875, -6.664306640625, -5.6923828125, -4.720458984375, -3.74853515625, -2.776611328125, -1.8046875, -0.832763671875, 0.13916015625, 1.111083984375, 2.0830078125, 3.054931640625, 4.02685546875, 4.998779296875, 5.970703125, 6.942626953125, 7.91455078125, 8.886474609375, 9.8583984375, 10.830322265625, 11.80224609375, 12.774169921875, 13.74609375, 14.718017578125, 15.68994140625, 16.661865234375, 17.6337890625, 18.605712890625, 19.57763671875, 20.549560546875, 21.521484375, 22.493408203125, 23.46533203125, 24.437255859375, 25.4091796875, 26.381103515625, 27.35302734375, 28.324951171875, 29.296875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 4.0, 5.0, 8.0, 9.0, 12.0, 35.0, 44.0, 75.0, 151.0, 261.0, 157.0, 78.0, 50.0, 29.0, 25.0, 14.0, 6.0, 3.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00937652587890625, -0.00912022590637207, -0.00886392593383789, -0.008607625961303711, -0.008351325988769531, -0.008095026016235352, -0.007838726043701172, -0.007582426071166992, -0.0073261260986328125, -0.007069826126098633, -0.006813526153564453, -0.0065572261810302734, -0.006300926208496094, -0.006044626235961914, -0.005788326263427734, -0.005532026290893555, -0.005275726318359375, -0.005019426345825195, -0.004763126373291016, -0.004506826400756836, -0.004250526428222656, -0.0039942264556884766, -0.003737926483154297, -0.003481626510620117, -0.0032253265380859375, -0.002969026565551758, -0.002712726593017578, -0.0024564266204833984, -0.0022001266479492188, -0.001943826675415039, -0.0016875267028808594, -0.0014312267303466797, -0.0011749267578125, -0.0009186267852783203, -0.0006623268127441406, -0.00040602684020996094, -0.00014972686767578125, 0.00010657310485839844, 0.0003628730773925781, 0.0006191730499267578, 0.0008754730224609375, 0.0011317729949951172, 0.0013880729675292969, 0.0016443729400634766, 0.0019006729125976562, 0.002156972885131836, 0.0024132728576660156, 0.0026695728302001953, 0.002925872802734375, 0.0031821727752685547, 0.0034384727478027344, 0.003694772720336914, 0.003951072692871094, 0.0042073726654052734, 0.004463672637939453, 0.004719972610473633, 0.0049762725830078125, 0.005232572555541992, 0.005488872528076172, 0.0057451725006103516, 0.006001472473144531, 0.006257772445678711, 0.006514072418212891, 0.00677037239074707, 0.00702667236328125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 1.0, 2.0, 11.0, 9.0, 20.0, 32.0, 52.0, 94.0, 193.0, 404.0, 918.0, 2997.0, 11685.0, 91715.0, 811592.0, 110699.0, 13139.0, 3187.0, 999.0, 400.0, 182.0, 81.0, 58.0, 28.0, 19.0, 19.0, 3.0, 11.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.75, -34.53955078125, -33.3291015625, -32.11865234375, -30.908203125, -29.69775390625, -28.4873046875, -27.27685546875, -26.06640625, -24.85595703125, -23.6455078125, -22.43505859375, -21.224609375, -20.01416015625, -18.8037109375, -17.59326171875, -16.3828125, -15.17236328125, -13.9619140625, -12.75146484375, -11.541015625, -10.33056640625, -9.1201171875, -7.90966796875, -6.69921875, -5.48876953125, -4.2783203125, -3.06787109375, -1.857421875, -0.64697265625, 0.5634765625, 1.77392578125, 2.984375, 4.19482421875, 5.4052734375, 6.61572265625, 7.826171875, 9.03662109375, 10.2470703125, 11.45751953125, 12.66796875, 13.87841796875, 15.0888671875, 16.29931640625, 17.509765625, 18.72021484375, 19.9306640625, 21.14111328125, 22.3515625, 23.56201171875, 24.7724609375, 25.98291015625, 27.193359375, 28.40380859375, 29.6142578125, 30.82470703125, 32.03515625, 33.24560546875, 34.4560546875, 35.66650390625, 36.876953125, 38.08740234375, 39.2978515625, 40.50830078125, 41.71875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 12.0, 12.0, 12.0, 19.0, 24.0, 23.0, 57.0, 67.0, 91.0, 129.0, 123.0, 122.0, 78.0, 72.0, 47.0, 42.0, 18.0, 19.0, 9.0, 12.0, 5.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.6875, -33.759033203125, -32.83056640625, -31.902099609375, -30.9736328125, -30.045166015625, -29.11669921875, -28.188232421875, -27.259765625, -26.331298828125, -25.40283203125, -24.474365234375, -23.5458984375, -22.617431640625, -21.68896484375, -20.760498046875, -19.83203125, -18.903564453125, -17.97509765625, -17.046630859375, -16.1181640625, -15.189697265625, -14.26123046875, -13.332763671875, -12.404296875, -11.475830078125, -10.54736328125, -9.618896484375, -8.6904296875, -7.761962890625, -6.83349609375, -5.905029296875, -4.9765625, -4.048095703125, -3.11962890625, -2.191162109375, -1.2626953125, -0.334228515625, 0.59423828125, 1.522705078125, 2.451171875, 3.379638671875, 4.30810546875, 5.236572265625, 6.1650390625, 7.093505859375, 8.02197265625, 8.950439453125, 9.87890625, 10.807373046875, 11.73583984375, 12.664306640625, 13.5927734375, 14.521240234375, 15.44970703125, 16.378173828125, 17.306640625, 18.235107421875, 19.16357421875, 20.092041015625, 21.0205078125, 21.948974609375, 22.87744140625, 23.805908203125, 24.734375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 14.0, 33.0, 60.0, 107.0, 178.0, 241.0, 170.0, 106.0, 41.0, 19.0, 12.0, 2.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-893.0054321289062, -874.2302856445312, -855.4552001953125, -836.6800537109375, -817.9049072265625, -799.1297607421875, -780.3546142578125, -761.5795288085938, -742.8043823242188, -724.0292358398438, -705.254150390625, -686.47900390625, -667.703857421875, -648.9287109375, -630.153564453125, -611.3784790039062, -592.6033325195312, -573.8281860351562, -555.0531005859375, -536.2779541015625, -517.5028076171875, -498.7276611328125, -479.9525451660156, -461.17742919921875, -442.40228271484375, -423.62713623046875, -404.8520202636719, -386.076904296875, -367.3017578125, -348.526611328125, -329.7514953613281, -310.97637939453125, -292.20123291015625, -273.42608642578125, -254.65097045898438, -235.87583923339844, -217.1007080078125, -198.32557678222656, -179.55044555664062, -160.7753143310547, -142.00018310546875, -123.22505187988281, -104.44992065429688, -85.67478942871094, -66.899658203125, -48.12452697753906, -29.349395751953125, -10.574264526367188, 8.20086669921875, 26.975997924804688, 45.751129150390625, 64.52626037597656, 83.3013916015625, 102.07652282714844, 120.85165405273438, 139.6267852783203, 158.40191650390625, 177.1770477294922, 195.95217895507812, 214.72731018066406, 233.50244140625, 252.27757263183594, 271.0527038574219, 289.82781982421875, 308.60296630859375]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 6.0, 1.0, 5.0, 9.0, 15.0, 17.0, 22.0, 28.0, 37.0, 54.0, 55.0, 49.0, 79.0, 101.0, 104.0, 78.0, 70.0, 50.0, 56.0, 45.0, 40.0, 29.0, 21.0, 12.0, 11.0, 6.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-534.060791015625, -520.0051879882812, -505.9495849609375, -491.89398193359375, -477.83837890625, -463.78277587890625, -449.7271728515625, -435.67156982421875, -421.615966796875, -407.56036376953125, -393.5047607421875, -379.44915771484375, -365.3935546875, -351.33795166015625, -337.2823486328125, -323.22674560546875, -309.1711730957031, -295.1155700683594, -281.0599670410156, -267.0043640136719, -252.94876098632812, -238.89315795898438, -224.8375701904297, -210.78196716308594, -196.7263641357422, -182.67076110839844, -168.6151580810547, -154.5595703125, -140.50396728515625, -126.44835662841797, -112.39276123046875, -98.337158203125, -84.28155517578125, -70.2259521484375, -56.170352935791016, -42.11475372314453, -28.05915069580078, -14.003547668457031, 0.0520477294921875, 14.107650756835938, 28.163253784179688, 42.21885681152344, 56.27445602416992, 70.3300552368164, 84.38565826416016, 98.4412612915039, 112.49685668945312, 126.55245971679688, 140.60806274414062, 154.66366577148438, 168.71926879882812, 182.77487182617188, 196.83047485351562, 210.88607788085938, 224.94166564941406, 238.9972686767578, 253.05287170410156, 267.10845947265625, 281.1640625, 295.21966552734375, 309.2752685546875, 323.33087158203125, 337.386474609375, 351.44207763671875, 365.4976806640625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 6.0, 22.0, 21.0, 42.0, 56.0, 103.0, 128.0, 255.0, 405.0, 852.0, 1738.0, 3746.0, 9186.0, 34342.0, 777698.0, 3272771.0, 69553.0, 14264.0, 4943.0, 2064.0, 1014.0, 473.0, 226.0, 123.0, 81.0, 52.0, 38.0, 20.0, 12.0, 17.0, 11.0, 1.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.9375, -62.7109375, -60.484375, -58.2578125, -56.03125, -53.8046875, -51.578125, -49.3515625, -47.125, -44.8984375, -42.671875, -40.4453125, -38.21875, -35.9921875, -33.765625, -31.5390625, -29.3125, -27.0859375, -24.859375, -22.6328125, -20.40625, -18.1796875, -15.953125, -13.7265625, -11.5, -9.2734375, -7.046875, -4.8203125, -2.59375, -0.3671875, 1.859375, 4.0859375, 6.3125, 8.5390625, 10.765625, 12.9921875, 15.21875, 17.4453125, 19.671875, 21.8984375, 24.125, 26.3515625, 28.578125, 30.8046875, 33.03125, 35.2578125, 37.484375, 39.7109375, 41.9375, 44.1640625, 46.390625, 48.6171875, 50.84375, 53.0703125, 55.296875, 57.5234375, 59.75, 61.9765625, 64.203125, 66.4296875, 68.65625, 70.8828125, 73.109375, 75.3359375, 77.5625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 9.0, 17.0, 21.0, 38.0, 57.0, 77.0, 62.0, 95.0, 98.0, 131.0, 96.0, 88.0, 49.0, 55.0, 49.0, 23.0, 22.0, 11.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-52.15625, -51.0936279296875, -50.031005859375, -48.9683837890625, -47.90576171875, -46.8431396484375, -45.780517578125, -44.7178955078125, -43.6552734375, -42.5926513671875, -41.530029296875, -40.4674072265625, -39.40478515625, -38.3421630859375, -37.279541015625, -36.2169189453125, -35.154296875, -34.0916748046875, -33.029052734375, -31.9664306640625, -30.90380859375, -29.8411865234375, -28.778564453125, -27.7159423828125, -26.6533203125, -25.5906982421875, -24.528076171875, -23.4654541015625, -22.40283203125, -21.3402099609375, -20.277587890625, -19.2149658203125, -18.15234375, -17.0897216796875, -16.027099609375, -14.9644775390625, -13.90185546875, -12.8392333984375, -11.776611328125, -10.7139892578125, -9.6513671875, -8.5887451171875, -7.526123046875, -6.4635009765625, -5.40087890625, -4.3382568359375, -3.275634765625, -2.2130126953125, -1.150390625, -0.0877685546875, 0.974853515625, 2.0374755859375, 3.10009765625, 4.1627197265625, 5.225341796875, 6.2879638671875, 7.3505859375, 8.4132080078125, 9.475830078125, 10.5384521484375, 11.60107421875, 12.6636962890625, 13.726318359375, 14.7889404296875, 15.8515625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 6.0, 7.0, 7.0, 7.0, 20.0, 22.0, 27.0, 75.0, 102.0, 196.0, 348.0, 799.0, 1894.0, 5430.0, 18448.0, 112437.0, 3770185.0, 245979.0, 26813.0, 7158.0, 2444.0, 1010.0, 371.0, 208.0, 123.0, 50.0, 29.0, 22.0, 21.0, 11.0, 6.0, 6.0, 4.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.0, -82.47265625, -79.9453125, -77.41796875, -74.890625, -72.36328125, -69.8359375, -67.30859375, -64.78125, -62.25390625, -59.7265625, -57.19921875, -54.671875, -52.14453125, -49.6171875, -47.08984375, -44.5625, -42.03515625, -39.5078125, -36.98046875, -34.453125, -31.92578125, -29.3984375, -26.87109375, -24.34375, -21.81640625, -19.2890625, -16.76171875, -14.234375, -11.70703125, -9.1796875, -6.65234375, -4.125, -1.59765625, 0.9296875, 3.45703125, 5.984375, 8.51171875, 11.0390625, 13.56640625, 16.09375, 18.62109375, 21.1484375, 23.67578125, 26.203125, 28.73046875, 31.2578125, 33.78515625, 36.3125, 38.83984375, 41.3671875, 43.89453125, 46.421875, 48.94921875, 51.4765625, 54.00390625, 56.53125, 59.05859375, 61.5859375, 64.11328125, 66.640625, 69.16796875, 71.6953125, 74.22265625, 76.75]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 6.0, 8.0, 10.0, 5.0, 16.0, 12.0, 16.0, 29.0, 29.0, 50.0, 65.0, 119.0, 193.0, 512.0, 1056.0, 983.0, 427.0, 202.0, 108.0, 59.0, 35.0, 26.0, 21.0, 23.0, 8.0, 8.0, 9.0, 10.0, 5.0, 2.0, 3.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.0625, -59.2626953125, -57.462890625, -55.6630859375, -53.86328125, -52.0634765625, -50.263671875, -48.4638671875, -46.6640625, -44.8642578125, -43.064453125, -41.2646484375, -39.46484375, -37.6650390625, -35.865234375, -34.0654296875, -32.265625, -30.4658203125, -28.666015625, -26.8662109375, -25.06640625, -23.2666015625, -21.466796875, -19.6669921875, -17.8671875, -16.0673828125, -14.267578125, -12.4677734375, -10.66796875, -8.8681640625, -7.068359375, -5.2685546875, -3.46875, -1.6689453125, 0.130859375, 1.9306640625, 3.73046875, 5.5302734375, 7.330078125, 9.1298828125, 10.9296875, 12.7294921875, 14.529296875, 16.3291015625, 18.12890625, 19.9287109375, 21.728515625, 23.5283203125, 25.328125, 27.1279296875, 28.927734375, 30.7275390625, 32.52734375, 34.3271484375, 36.126953125, 37.9267578125, 39.7265625, 41.5263671875, 43.326171875, 45.1259765625, 46.92578125, 48.7255859375, 50.525390625, 52.3251953125, 54.125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 6.0, 8.0, 14.0, 10.0, 24.0, 35.0, 57.0, 98.0, 120.0, 160.0, 149.0, 98.0, 84.0, 60.0, 30.0, 18.0, 7.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-440.40216064453125, -426.91455078125, -413.42694091796875, -399.9393310546875, -386.45172119140625, -372.964111328125, -359.47650146484375, -345.9888916015625, -332.50128173828125, -319.013671875, -305.52606201171875, -292.0384521484375, -278.55084228515625, -265.063232421875, -251.5756378173828, -238.08802795410156, -224.60043334960938, -211.11282348632812, -197.62521362304688, -184.13760375976562, -170.64999389648438, -157.16238403320312, -143.67478942871094, -130.1871795654297, -116.69956970214844, -103.21195983886719, -89.72434997558594, -76.23674774169922, -62.74913787841797, -49.26152801513672, -35.77392578125, -22.28631591796875, -8.798675537109375, 4.688932418823242, 18.17654037475586, 31.664146423339844, 45.151756286621094, 58.639366149902344, 72.12696838378906, 85.61457824707031, 99.10218811035156, 112.58979797363281, 126.07740783691406, 139.56500244140625, 153.0526123046875, 166.54022216796875, 180.02783203125, 193.51544189453125, 207.0030517578125, 220.49066162109375, 233.978271484375, 247.46588134765625, 260.9534912109375, 274.44110107421875, 287.9287109375, 301.41632080078125, 314.9039306640625, 328.39154052734375, 341.879150390625, 355.36676025390625, 368.8543701171875, 382.34197998046875, 395.82958984375, 409.31719970703125, 422.8047790527344]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 7.0, 9.0, 9.0, 20.0, 21.0, 31.0, 42.0, 48.0, 63.0, 64.0, 79.0, 73.0, 77.0, 74.0, 54.0, 59.0, 59.0, 49.0, 39.0, 31.0, 24.0, 19.0, 13.0, 16.0, 8.0, 5.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-222.71209716796875, -211.03237915039062, -199.3526611328125, -187.6729278564453, -175.9932098388672, -164.31349182128906, -152.63375854492188, -140.95404052734375, -129.27432250976562, -117.5946044921875, -105.91487884521484, -94.23515319824219, -82.55543518066406, -70.87571716308594, -59.19599151611328, -47.516265869140625, -35.8365478515625, -24.15682601928711, -12.477104187011719, -0.7973823547363281, 10.882339477539062, 22.562061309814453, 34.241783142089844, 45.9215087890625, 57.601226806640625, 69.28094482421875, 80.9606704711914, 92.64039611816406, 104.32011413574219, 115.99983215332031, 127.67955780029297, 139.35928344726562, 151.03900146484375, 162.71871948242188, 174.3984375, 186.0781707763672, 197.7578887939453, 209.43760681152344, 221.11734008789062, 232.79705810546875, 244.47677612304688, 256.156494140625, 267.8362121582031, 279.51593017578125, 291.1956787109375, 302.8753967285156, 314.55511474609375, 326.2348327636719, 337.91455078125, 349.5942687988281, 361.27398681640625, 372.9537048339844, 384.6334228515625, 396.31317138671875, 407.9928894042969, 419.672607421875, 431.3523254394531, 443.03204345703125, 454.7117614746094, 466.3914794921875, 478.07122802734375, 489.7509460449219, 501.4306640625, 513.1103515625, 524.7901000976562]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 7.0, 7.0, 12.0, 17.0, 23.0, 35.0, 48.0, 75.0, 130.0, 161.0, 261.0, 427.0, 671.0, 1147.0, 2303.0, 4545.0, 9767.0, 22481.0, 56150.0, 151422.0, 386345.0, 254737.0, 92916.0, 36008.0, 14721.0, 6772.0, 3312.0, 1631.0, 946.0, 540.0, 321.0, 204.0, 134.0, 101.0, 44.0, 34.0, 28.0, 19.0, 18.0, 13.0, 6.0, 7.0, 2.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.84375, -40.56640625, -39.2890625, -38.01171875, -36.734375, -35.45703125, -34.1796875, -32.90234375, -31.625, -30.34765625, -29.0703125, -27.79296875, -26.515625, -25.23828125, -23.9609375, -22.68359375, -21.40625, -20.12890625, -18.8515625, -17.57421875, -16.296875, -15.01953125, -13.7421875, -12.46484375, -11.1875, -9.91015625, -8.6328125, -7.35546875, -6.078125, -4.80078125, -3.5234375, -2.24609375, -0.96875, 0.30859375, 1.5859375, 2.86328125, 4.140625, 5.41796875, 6.6953125, 7.97265625, 9.25, 10.52734375, 11.8046875, 13.08203125, 14.359375, 15.63671875, 16.9140625, 18.19140625, 19.46875, 20.74609375, 22.0234375, 23.30078125, 24.578125, 25.85546875, 27.1328125, 28.41015625, 29.6875, 30.96484375, 32.2421875, 33.51953125, 34.796875, 36.07421875, 37.3515625, 38.62890625, 39.90625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 11.0, 12.0, 20.0, 21.0, 28.0, 25.0, 31.0, 27.0, 31.0, 35.0, 46.0, 48.0, 52.0, 52.0, 67.0, 48.0, 45.0, 53.0, 43.0, 55.0, 30.0, 27.0, 31.0, 28.0, 29.0, 17.0, 17.0, 16.0, 14.0, 12.0, 9.0, 5.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.953125, -19.3983154296875, -18.843505859375, -18.2886962890625, -17.73388671875, -17.1790771484375, -16.624267578125, -16.0694580078125, -15.5146484375, -14.9598388671875, -14.405029296875, -13.8502197265625, -13.29541015625, -12.7406005859375, -12.185791015625, -11.6309814453125, -11.076171875, -10.5213623046875, -9.966552734375, -9.4117431640625, -8.85693359375, -8.3021240234375, -7.747314453125, -7.1925048828125, -6.6376953125, -6.0828857421875, -5.528076171875, -4.9732666015625, -4.41845703125, -3.8636474609375, -3.308837890625, -2.7540283203125, -2.19921875, -1.6444091796875, -1.089599609375, -0.5347900390625, 0.02001953125, 0.5748291015625, 1.129638671875, 1.6844482421875, 2.2392578125, 2.7940673828125, 3.348876953125, 3.9036865234375, 4.45849609375, 5.0133056640625, 5.568115234375, 6.1229248046875, 6.677734375, 7.2325439453125, 7.787353515625, 8.3421630859375, 8.89697265625, 9.4517822265625, 10.006591796875, 10.5614013671875, 11.1162109375, 11.6710205078125, 12.225830078125, 12.7806396484375, 13.33544921875, 13.8902587890625, 14.445068359375, 14.9998779296875, 15.5546875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 3.0, 1.0, 8.0, 7.0, 11.0, 14.0, 21.0, 28.0, 42.0, 63.0, 80.0, 126.0, 190.0, 224.0, 389.0, 533.0, 916.0, 1619.0, 3240.0, 9308.0, 46447.0, 564542.0, 366013.0, 39383.0, 8242.0, 2997.0, 1534.0, 813.0, 547.0, 371.0, 248.0, 179.0, 120.0, 75.0, 62.0, 44.0, 24.0, 29.0, 14.0, 15.0, 7.0, 7.0, 10.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.5, -78.8671875, -76.234375, -73.6015625, -70.96875, -68.3359375, -65.703125, -63.0703125, -60.4375, -57.8046875, -55.171875, -52.5390625, -49.90625, -47.2734375, -44.640625, -42.0078125, -39.375, -36.7421875, -34.109375, -31.4765625, -28.84375, -26.2109375, -23.578125, -20.9453125, -18.3125, -15.6796875, -13.046875, -10.4140625, -7.78125, -5.1484375, -2.515625, 0.1171875, 2.75, 5.3828125, 8.015625, 10.6484375, 13.28125, 15.9140625, 18.546875, 21.1796875, 23.8125, 26.4453125, 29.078125, 31.7109375, 34.34375, 36.9765625, 39.609375, 42.2421875, 44.875, 47.5078125, 50.140625, 52.7734375, 55.40625, 58.0390625, 60.671875, 63.3046875, 65.9375, 68.5703125, 71.203125, 73.8359375, 76.46875, 79.1015625, 81.734375, 84.3671875, 87.0]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 7.0, 1.0, 11.0, 10.0, 12.0, 17.0, 19.0, 22.0, 23.0, 16.0, 28.0, 32.0, 38.0, 39.0, 39.0, 41.0, 30.0, 44.0, 52.0, 61.0, 40.0, 45.0, 40.0, 51.0, 48.0, 41.0, 30.0, 30.0, 25.0, 21.0, 10.0, 12.0, 18.0, 6.0, 20.0, 10.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-65.9375, -63.59375, -61.25, -58.90625, -56.5625, -54.21875, -51.875, -49.53125, -47.1875, -44.84375, -42.5, -40.15625, -37.8125, -35.46875, -33.125, -30.78125, -28.4375, -26.09375, -23.75, -21.40625, -19.0625, -16.71875, -14.375, -12.03125, -9.6875, -7.34375, -5.0, -2.65625, -0.3125, 2.03125, 4.375, 6.71875, 9.0625, 11.40625, 13.75, 16.09375, 18.4375, 20.78125, 23.125, 25.46875, 27.8125, 30.15625, 32.5, 34.84375, 37.1875, 39.53125, 41.875, 44.21875, 46.5625, 48.90625, 51.25, 53.59375, 55.9375, 58.28125, 60.625, 62.96875, 65.3125, 67.65625, 70.0, 72.34375, 74.6875, 77.03125, 79.375, 81.71875, 84.0625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 2.0, 10.0, 5.0, 8.0, 14.0, 20.0, 22.0, 29.0, 35.0, 70.0, 102.0, 167.0, 368.0, 843.0, 2321.0, 8442.0, 57212.0, 855800.0, 105707.0, 12317.0, 3038.0, 988.0, 481.0, 220.0, 129.0, 76.0, 34.0, 30.0, 20.0, 17.0, 12.0, 8.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.9375, -32.79150390625, -31.6455078125, -30.49951171875, -29.353515625, -28.20751953125, -27.0615234375, -25.91552734375, -24.76953125, -23.62353515625, -22.4775390625, -21.33154296875, -20.185546875, -19.03955078125, -17.8935546875, -16.74755859375, -15.6015625, -14.45556640625, -13.3095703125, -12.16357421875, -11.017578125, -9.87158203125, -8.7255859375, -7.57958984375, -6.43359375, -5.28759765625, -4.1416015625, -2.99560546875, -1.849609375, -0.70361328125, 0.4423828125, 1.58837890625, 2.734375, 3.88037109375, 5.0263671875, 6.17236328125, 7.318359375, 8.46435546875, 9.6103515625, 10.75634765625, 11.90234375, 13.04833984375, 14.1943359375, 15.34033203125, 16.486328125, 17.63232421875, 18.7783203125, 19.92431640625, 21.0703125, 22.21630859375, 23.3623046875, 24.50830078125, 25.654296875, 26.80029296875, 27.9462890625, 29.09228515625, 30.23828125, 31.38427734375, 32.5302734375, 33.67626953125, 34.822265625, 35.96826171875, 37.1142578125, 38.26025390625, 39.40625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 3.0, 4.0, 1.0, 4.0, 7.0, 7.0, 12.0, 16.0, 18.0, 31.0, 33.0, 45.0, 49.0, 96.0, 151.0, 172.0, 113.0, 59.0, 41.0, 32.0, 33.0, 17.0, 16.0, 13.0, 11.0, 6.0, 7.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005420684814453125, -0.0052283406257629395, -0.005035996437072754, -0.004843652248382568, -0.004651308059692383, -0.004458963871002197, -0.004266619682312012, -0.004074275493621826, -0.0038819313049316406, -0.003689587116241455, -0.0034972429275512695, -0.003304898738861084, -0.0031125545501708984, -0.002920210361480713, -0.0027278661727905273, -0.002535521984100342, -0.0023431777954101562, -0.0021508336067199707, -0.001958489418029785, -0.0017661452293395996, -0.001573801040649414, -0.0013814568519592285, -0.001189112663269043, -0.0009967684745788574, -0.0008044242858886719, -0.0006120800971984863, -0.0004197359085083008, -0.00022739171981811523, -3.504753112792969e-05, 0.00015729665756225586, 0.0003496408462524414, 0.000541985034942627, 0.0007343292236328125, 0.000926673412322998, 0.0011190176010131836, 0.0013113617897033691, 0.0015037059783935547, 0.0016960501670837402, 0.0018883943557739258, 0.0020807385444641113, 0.002273082733154297, 0.0024654269218444824, 0.002657771110534668, 0.0028501152992248535, 0.003042459487915039, 0.0032348036766052246, 0.00342714786529541, 0.0036194920539855957, 0.0038118362426757812, 0.004004180431365967, 0.004196524620056152, 0.004388868808746338, 0.0045812129974365234, 0.004773557186126709, 0.0049659013748168945, 0.00515824556350708, 0.005350589752197266, 0.005542933940887451, 0.005735278129577637, 0.005927622318267822, 0.006119966506958008, 0.006312310695648193, 0.006504654884338379, 0.0066969990730285645, 0.00688934326171875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 5.0, 9.0, 13.0, 8.0, 13.0, 19.0, 27.0, 49.0, 49.0, 79.0, 141.0, 225.0, 537.0, 1082.0, 2532.0, 6329.0, 21785.0, 198013.0, 755487.0, 45290.0, 10060.0, 3673.0, 1557.0, 662.0, 354.0, 210.0, 98.0, 75.0, 56.0, 35.0, 27.0, 12.0, 16.0, 7.0, 9.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.6875, -31.703369140625, -30.71923828125, -29.735107421875, -28.7509765625, -27.766845703125, -26.78271484375, -25.798583984375, -24.814453125, -23.830322265625, -22.84619140625, -21.862060546875, -20.8779296875, -19.893798828125, -18.90966796875, -17.925537109375, -16.94140625, -15.957275390625, -14.97314453125, -13.989013671875, -13.0048828125, -12.020751953125, -11.03662109375, -10.052490234375, -9.068359375, -8.084228515625, -7.10009765625, -6.115966796875, -5.1318359375, -4.147705078125, -3.16357421875, -2.179443359375, -1.1953125, -0.211181640625, 0.77294921875, 1.757080078125, 2.7412109375, 3.725341796875, 4.70947265625, 5.693603515625, 6.677734375, 7.661865234375, 8.64599609375, 9.630126953125, 10.6142578125, 11.598388671875, 12.58251953125, 13.566650390625, 14.55078125, 15.534912109375, 16.51904296875, 17.503173828125, 18.4873046875, 19.471435546875, 20.45556640625, 21.439697265625, 22.423828125, 23.407958984375, 24.39208984375, 25.376220703125, 26.3603515625, 27.344482421875, 28.32861328125, 29.312744140625, 30.296875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 3.0, 4.0, 2.0, 3.0, 3.0, 9.0, 6.0, 7.0, 10.0, 9.0, 20.0, 22.0, 38.0, 38.0, 55.0, 89.0, 104.0, 138.0, 111.0, 87.0, 59.0, 47.0, 32.0, 26.0, 18.0, 15.0, 7.0, 9.0, 7.0, 5.0, 3.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.875, -21.11328125, -20.3515625, -19.58984375, -18.828125, -18.06640625, -17.3046875, -16.54296875, -15.78125, -15.01953125, -14.2578125, -13.49609375, -12.734375, -11.97265625, -11.2109375, -10.44921875, -9.6875, -8.92578125, -8.1640625, -7.40234375, -6.640625, -5.87890625, -5.1171875, -4.35546875, -3.59375, -2.83203125, -2.0703125, -1.30859375, -0.546875, 0.21484375, 0.9765625, 1.73828125, 2.5, 3.26171875, 4.0234375, 4.78515625, 5.546875, 6.30859375, 7.0703125, 7.83203125, 8.59375, 9.35546875, 10.1171875, 10.87890625, 11.640625, 12.40234375, 13.1640625, 13.92578125, 14.6875, 15.44921875, 16.2109375, 16.97265625, 17.734375, 18.49609375, 19.2578125, 20.01953125, 20.78125, 21.54296875, 22.3046875, 23.06640625, 23.828125, 24.58984375, 25.3515625, 26.11328125, 26.875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 22.0, 46.0, 182.0, 396.0, 242.0, 71.0, 21.0, 9.0, 4.0, 7.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-548.4449462890625, -513.5303955078125, -478.6158752441406, -443.70135498046875, -408.78680419921875, -373.87225341796875, -338.9577331542969, -304.043212890625, -269.128662109375, -234.21412658691406, -199.29959106445312, -164.3850555419922, -129.47052001953125, -94.55598449707031, -59.641448974609375, -24.726913452148438, 10.1876220703125, 45.10215759277344, 80.01669311523438, 114.93122863769531, 149.84576416015625, 184.7602996826172, 219.67483520507812, 254.58937072753906, 289.50390625, 324.41845703125, 359.3329772949219, 394.24749755859375, 429.16204833984375, 464.07659912109375, 498.9911193847656, 533.9056396484375, 568.8201904296875, 603.7347412109375, 638.6492919921875, 673.5637817382812, 708.4783325195312, 743.3928833007812, 778.307373046875, 813.221923828125, 848.136474609375, 883.051025390625, 917.965576171875, 952.8800659179688, 987.7946166992188, 1022.7091674804688, 1057.6236572265625, 1092.5382080078125, 1127.4527587890625, 1162.3673095703125, 1197.2818603515625, 1232.1964111328125, 1267.11083984375, 1302.025390625, 1336.93994140625, 1371.8544921875, 1406.76904296875, 1441.68359375, 1476.59814453125, 1511.5126953125, 1546.42724609375, 1581.3416748046875, 1616.2562255859375, 1651.1707763671875, 1686.0853271484375]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 4.0, 4.0, 4.0, 4.0, 8.0, 15.0, 13.0, 19.0, 16.0, 31.0, 24.0, 26.0, 36.0, 35.0, 47.0, 64.0, 61.0, 67.0, 84.0, 77.0, 63.0, 47.0, 35.0, 42.0, 25.0, 24.0, 32.0, 26.0, 23.0, 12.0, 11.0, 6.0, 7.0, 2.0, 1.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-434.45263671875, -422.6624450683594, -410.8722229003906, -399.08203125, -387.29180908203125, -375.5016174316406, -363.71142578125, -351.92120361328125, -340.1309814453125, -328.3407897949219, -316.5505676269531, -304.7603759765625, -292.97015380859375, -281.1799621582031, -269.3897705078125, -257.59954833984375, -245.80935668945312, -234.01914978027344, -222.22894287109375, -210.43875122070312, -198.64852905273438, -186.85833740234375, -175.06813049316406, -163.27792358398438, -151.4877166748047, -139.697509765625, -127.90730285644531, -116.11710357666016, -104.32689666748047, -92.53668975830078, -80.74649047851562, -68.95628356933594, -57.16607666015625, -45.37586975097656, -33.58566665649414, -21.79546356201172, -10.005256652832031, 1.7849502563476562, 13.575149536132812, 25.3653564453125, 37.15556335449219, 48.945770263671875, 60.7359733581543, 72.52617645263672, 84.3163833618164, 96.1065902709961, 107.89678955078125, 119.68699645996094, 131.47720336914062, 143.2674102783203, 155.0576171875, 166.84780883789062, 178.63803100585938, 190.42822265625, 202.2184295654297, 214.00863647460938, 225.79884338378906, 237.58905029296875, 249.37925720214844, 261.1694641113281, 272.95965576171875, 284.7498779296875, 296.5400695800781, 308.33026123046875, 320.1204833984375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 6.0, 9.0, 16.0, 29.0, 38.0, 66.0, 72.0, 141.0, 218.0, 376.0, 543.0, 929.0, 1553.0, 2813.0, 5453.0, 13730.0, 50789.0, 692571.0, 3211570.0, 169576.0, 25893.0, 8691.0, 4051.0, 2036.0, 1197.0, 698.0, 432.0, 293.0, 180.0, 101.0, 77.0, 47.0, 32.0, 14.0, 13.0, 7.0, 11.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.21875, -36.9130859375, -35.607421875, -34.3017578125, -32.99609375, -31.6904296875, -30.384765625, -29.0791015625, -27.7734375, -26.4677734375, -25.162109375, -23.8564453125, -22.55078125, -21.2451171875, -19.939453125, -18.6337890625, -17.328125, -16.0224609375, -14.716796875, -13.4111328125, -12.10546875, -10.7998046875, -9.494140625, -8.1884765625, -6.8828125, -5.5771484375, -4.271484375, -2.9658203125, -1.66015625, -0.3544921875, 0.951171875, 2.2568359375, 3.5625, 4.8681640625, 6.173828125, 7.4794921875, 8.78515625, 10.0908203125, 11.396484375, 12.7021484375, 14.0078125, 15.3134765625, 16.619140625, 17.9248046875, 19.23046875, 20.5361328125, 21.841796875, 23.1474609375, 24.453125, 25.7587890625, 27.064453125, 28.3701171875, 29.67578125, 30.9814453125, 32.287109375, 33.5927734375, 34.8984375, 36.2041015625, 37.509765625, 38.8154296875, 40.12109375, 41.4267578125, 42.732421875, 44.0380859375, 45.34375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 4.0, 5.0, 1.0, 6.0, 4.0, 12.0, 8.0, 10.0, 13.0, 17.0, 20.0, 23.0, 30.0, 21.0, 39.0, 52.0, 42.0, 51.0, 72.0, 53.0, 64.0, 58.0, 60.0, 43.0, 45.0, 29.0, 32.0, 25.0, 28.0, 27.0, 22.0, 21.0, 21.0, 10.0, 8.0, 7.0, 10.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.09375, -18.537841796875, -17.98193359375, -17.426025390625, -16.8701171875, -16.314208984375, -15.75830078125, -15.202392578125, -14.646484375, -14.090576171875, -13.53466796875, -12.978759765625, -12.4228515625, -11.866943359375, -11.31103515625, -10.755126953125, -10.19921875, -9.643310546875, -9.08740234375, -8.531494140625, -7.9755859375, -7.419677734375, -6.86376953125, -6.307861328125, -5.751953125, -5.196044921875, -4.64013671875, -4.084228515625, -3.5283203125, -2.972412109375, -2.41650390625, -1.860595703125, -1.3046875, -0.748779296875, -0.19287109375, 0.363037109375, 0.9189453125, 1.474853515625, 2.03076171875, 2.586669921875, 3.142578125, 3.698486328125, 4.25439453125, 4.810302734375, 5.3662109375, 5.922119140625, 6.47802734375, 7.033935546875, 7.58984375, 8.145751953125, 8.70166015625, 9.257568359375, 9.8134765625, 10.369384765625, 10.92529296875, 11.481201171875, 12.037109375, 12.593017578125, 13.14892578125, 13.704833984375, 14.2607421875, 14.816650390625, 15.37255859375, 15.928466796875, 16.484375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 8.0, 7.0, 13.0, 14.0, 29.0, 44.0, 83.0, 111.0, 213.0, 397.0, 795.0, 1854.0, 4044.0, 11039.0, 39041.0, 441316.0, 3540235.0, 117612.0, 23410.0, 7689.0, 3147.0, 1409.0, 697.0, 402.0, 248.0, 134.0, 96.0, 74.0, 39.0, 20.0, 21.0, 10.0, 9.0, 9.0, 5.0, 2.0, 1.0, 7.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-54.09375, -52.18115234375, -50.2685546875, -48.35595703125, -46.443359375, -44.53076171875, -42.6181640625, -40.70556640625, -38.79296875, -36.88037109375, -34.9677734375, -33.05517578125, -31.142578125, -29.22998046875, -27.3173828125, -25.40478515625, -23.4921875, -21.57958984375, -19.6669921875, -17.75439453125, -15.841796875, -13.92919921875, -12.0166015625, -10.10400390625, -8.19140625, -6.27880859375, -4.3662109375, -2.45361328125, -0.541015625, 1.37158203125, 3.2841796875, 5.19677734375, 7.109375, 9.02197265625, 10.9345703125, 12.84716796875, 14.759765625, 16.67236328125, 18.5849609375, 20.49755859375, 22.41015625, 24.32275390625, 26.2353515625, 28.14794921875, 30.060546875, 31.97314453125, 33.8857421875, 35.79833984375, 37.7109375, 39.62353515625, 41.5361328125, 43.44873046875, 45.361328125, 47.27392578125, 49.1865234375, 51.09912109375, 53.01171875, 54.92431640625, 56.8369140625, 58.74951171875, 60.662109375, 62.57470703125, 64.4873046875, 66.39990234375, 68.3125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 1.0, 4.0, 5.0, 4.0, 5.0, 5.0, 10.0, 11.0, 14.0, 26.0, 32.0, 50.0, 74.0, 140.0, 223.0, 597.0, 1059.0, 869.0, 402.0, 176.0, 109.0, 59.0, 42.0, 43.0, 33.0, 12.0, 11.0, 12.0, 11.0, 10.0, 3.0, 6.0, 4.0, 2.0, 3.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.78125, -41.1875, -39.59375, -38.0, -36.40625, -34.8125, -33.21875, -31.625, -30.03125, -28.4375, -26.84375, -25.25, -23.65625, -22.0625, -20.46875, -18.875, -17.28125, -15.6875, -14.09375, -12.5, -10.90625, -9.3125, -7.71875, -6.125, -4.53125, -2.9375, -1.34375, 0.25, 1.84375, 3.4375, 5.03125, 6.625, 8.21875, 9.8125, 11.40625, 13.0, 14.59375, 16.1875, 17.78125, 19.375, 20.96875, 22.5625, 24.15625, 25.75, 27.34375, 28.9375, 30.53125, 32.125, 33.71875, 35.3125, 36.90625, 38.5, 40.09375, 41.6875, 43.28125, 44.875, 46.46875, 48.0625, 49.65625, 51.25, 52.84375, 54.4375, 56.03125, 57.625, 59.21875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 7.0, 15.0, 43.0, 104.0, 218.0, 253.0, 195.0, 93.0, 34.0, 21.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-372.90728759765625, -350.035400390625, -327.16351318359375, -304.2915954589844, -281.4197082519531, -258.5478210449219, -235.67591857910156, -212.80401611328125, -189.93212890625, -167.06024169921875, -144.18833923339844, -121.31644439697266, -98.44454956054688, -75.5726547241211, -52.70075988769531, -29.828857421875, -6.95697021484375, 15.914924621582031, 38.78681945800781, 61.658714294433594, 84.53060913085938, 107.40250396728516, 130.27439880371094, 153.14630126953125, 176.0181884765625, 198.89007568359375, 221.76197814941406, 244.63388061523438, 267.5057678222656, 290.3776550292969, 313.24957275390625, 336.1214599609375, 358.993408203125, 381.86529541015625, 404.7371826171875, 427.6091003417969, 450.4809875488281, 473.3528747558594, 496.22479248046875, 519.0966796875, 541.9685668945312, 564.8404541015625, 587.7123413085938, 610.584228515625, 633.4561767578125, 656.3280639648438, 679.199951171875, 702.0718383789062, 724.9437255859375, 747.8156127929688, 770.6875, 793.5593872070312, 816.4312744140625, 839.30322265625, 862.1751098632812, 885.0469970703125, 907.9188842773438, 930.790771484375, 953.6626586914062, 976.5345458984375, 999.406494140625, 1022.2783813476562, 1045.1502685546875, 1068.022216796875, 1090.89404296875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 2.0, 1.0, 4.0, 8.0, 6.0, 11.0, 22.0, 18.0, 19.0, 24.0, 24.0, 41.0, 48.0, 42.0, 57.0, 53.0, 57.0, 60.0, 56.0, 58.0, 64.0, 42.0, 52.0, 39.0, 37.0, 23.0, 25.0, 21.0, 26.0, 13.0, 12.0, 11.0, 12.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-288.9266052246094, -280.7915954589844, -272.65655517578125, -264.52154541015625, -256.3865051269531, -248.25149536132812, -240.11647033691406, -231.9814453125, -223.846435546875, -215.71141052246094, -207.57638549804688, -199.44137573242188, -191.3063507080078, -183.17132568359375, -175.0363006591797, -166.90127563476562, -158.76625061035156, -150.6312255859375, -142.49620056152344, -134.36117553710938, -126.22616577148438, -118.09114074707031, -109.95611572265625, -101.82109069824219, -93.68607330322266, -85.5510482788086, -77.41603088378906, -69.281005859375, -61.1459846496582, -53.010963439941406, -44.875938415527344, -36.74091720581055, -28.605911254882812, -20.470890045166016, -12.335866928100586, -4.200843811035156, 3.9341773986816406, 12.069198608398438, 20.2042236328125, 28.339244842529297, 36.474266052246094, 44.60928726196289, 52.74430847167969, 60.87933349609375, 69.01435852050781, 77.14937591552734, 85.2844009399414, 93.41941833496094, 101.554443359375, 109.68946838378906, 117.8244857788086, 125.95951080322266, 134.0945281982422, 142.22955322265625, 150.3645782470703, 158.49960327148438, 166.63461303710938, 174.76963806152344, 182.9046630859375, 191.0396728515625, 199.17469787597656, 207.30972290039062, 215.4447479248047, 223.57977294921875, 231.7147979736328]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 14.0, 20.0, 24.0, 39.0, 62.0, 100.0, 169.0, 301.0, 496.0, 868.0, 1532.0, 2827.0, 5536.0, 11382.0, 26482.0, 69472.0, 209385.0, 436820.0, 178258.0, 59915.0, 23277.0, 10259.0, 5226.0, 2632.0, 1433.0, 820.0, 483.0, 276.0, 141.0, 114.0, 67.0, 32.0, 27.0, 20.0, 12.0, 12.0, 7.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.03125, -36.8212890625, -35.611328125, -34.4013671875, -33.19140625, -31.9814453125, -30.771484375, -29.5615234375, -28.3515625, -27.1416015625, -25.931640625, -24.7216796875, -23.51171875, -22.3017578125, -21.091796875, -19.8818359375, -18.671875, -17.4619140625, -16.251953125, -15.0419921875, -13.83203125, -12.6220703125, -11.412109375, -10.2021484375, -8.9921875, -7.7822265625, -6.572265625, -5.3623046875, -4.15234375, -2.9423828125, -1.732421875, -0.5224609375, 0.6875, 1.8974609375, 3.107421875, 4.3173828125, 5.52734375, 6.7373046875, 7.947265625, 9.1572265625, 10.3671875, 11.5771484375, 12.787109375, 13.9970703125, 15.20703125, 16.4169921875, 17.626953125, 18.8369140625, 20.046875, 21.2568359375, 22.466796875, 23.6767578125, 24.88671875, 26.0966796875, 27.306640625, 28.5166015625, 29.7265625, 30.9365234375, 32.146484375, 33.3564453125, 34.56640625, 35.7763671875, 36.986328125, 38.1962890625, 39.40625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 8.0, 2.0, 6.0, 7.0, 6.0, 9.0, 18.0, 17.0, 26.0, 23.0, 39.0, 29.0, 41.0, 55.0, 53.0, 45.0, 52.0, 65.0, 65.0, 63.0, 53.0, 48.0, 38.0, 35.0, 41.0, 32.0, 35.0, 19.0, 15.0, 15.0, 7.0, 11.0, 10.0, 9.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.078125, -16.4404296875, -15.802734375, -15.1650390625, -14.52734375, -13.8896484375, -13.251953125, -12.6142578125, -11.9765625, -11.3388671875, -10.701171875, -10.0634765625, -9.42578125, -8.7880859375, -8.150390625, -7.5126953125, -6.875, -6.2373046875, -5.599609375, -4.9619140625, -4.32421875, -3.6865234375, -3.048828125, -2.4111328125, -1.7734375, -1.1357421875, -0.498046875, 0.1396484375, 0.77734375, 1.4150390625, 2.052734375, 2.6904296875, 3.328125, 3.9658203125, 4.603515625, 5.2412109375, 5.87890625, 6.5166015625, 7.154296875, 7.7919921875, 8.4296875, 9.0673828125, 9.705078125, 10.3427734375, 10.98046875, 11.6181640625, 12.255859375, 12.8935546875, 13.53125, 14.1689453125, 14.806640625, 15.4443359375, 16.08203125, 16.7197265625, 17.357421875, 17.9951171875, 18.6328125, 19.2705078125, 19.908203125, 20.5458984375, 21.18359375, 21.8212890625, 22.458984375, 23.0966796875, 23.734375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 4.0, 5.0, 5.0, 11.0, 15.0, 14.0, 28.0, 31.0, 50.0, 88.0, 120.0, 168.0, 258.0, 423.0, 752.0, 1380.0, 3067.0, 8654.0, 38805.0, 369889.0, 563860.0, 44548.0, 9494.0, 3287.0, 1506.0, 794.0, 434.0, 279.0, 175.0, 133.0, 82.0, 62.0, 38.0, 28.0, 27.0, 18.0, 8.0, 3.0, 3.0, 3.0, 6.0, 2.0, 2.0, 1.0, 4.0], "bins": [-94.8125, -92.3837890625, -89.955078125, -87.5263671875, -85.09765625, -82.6689453125, -80.240234375, -77.8115234375, -75.3828125, -72.9541015625, -70.525390625, -68.0966796875, -65.66796875, -63.2392578125, -60.810546875, -58.3818359375, -55.953125, -53.5244140625, -51.095703125, -48.6669921875, -46.23828125, -43.8095703125, -41.380859375, -38.9521484375, -36.5234375, -34.0947265625, -31.666015625, -29.2373046875, -26.80859375, -24.3798828125, -21.951171875, -19.5224609375, -17.09375, -14.6650390625, -12.236328125, -9.8076171875, -7.37890625, -4.9501953125, -2.521484375, -0.0927734375, 2.3359375, 4.7646484375, 7.193359375, 9.6220703125, 12.05078125, 14.4794921875, 16.908203125, 19.3369140625, 21.765625, 24.1943359375, 26.623046875, 29.0517578125, 31.48046875, 33.9091796875, 36.337890625, 38.7666015625, 41.1953125, 43.6240234375, 46.052734375, 48.4814453125, 50.91015625, 53.3388671875, 55.767578125, 58.1962890625, 60.625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 4.0, 3.0, 3.0, 1.0, 4.0, 4.0, 5.0, 3.0, 3.0, 15.0, 6.0, 17.0, 20.0, 30.0, 12.0, 33.0, 30.0, 41.0, 28.0, 46.0, 38.0, 46.0, 46.0, 43.0, 68.0, 47.0, 40.0, 42.0, 53.0, 45.0, 51.0, 28.0, 29.0, 22.0, 29.0, 13.0, 10.0, 13.0, 10.0, 8.0, 2.0, 9.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.5625, -67.2978515625, -65.033203125, -62.7685546875, -60.50390625, -58.2392578125, -55.974609375, -53.7099609375, -51.4453125, -49.1806640625, -46.916015625, -44.6513671875, -42.38671875, -40.1220703125, -37.857421875, -35.5927734375, -33.328125, -31.0634765625, -28.798828125, -26.5341796875, -24.26953125, -22.0048828125, -19.740234375, -17.4755859375, -15.2109375, -12.9462890625, -10.681640625, -8.4169921875, -6.15234375, -3.8876953125, -1.623046875, 0.6416015625, 2.90625, 5.1708984375, 7.435546875, 9.7001953125, 11.96484375, 14.2294921875, 16.494140625, 18.7587890625, 21.0234375, 23.2880859375, 25.552734375, 27.8173828125, 30.08203125, 32.3466796875, 34.611328125, 36.8759765625, 39.140625, 41.4052734375, 43.669921875, 45.9345703125, 48.19921875, 50.4638671875, 52.728515625, 54.9931640625, 57.2578125, 59.5224609375, 61.787109375, 64.0517578125, 66.31640625, 68.5810546875, 70.845703125, 73.1103515625, 75.375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 2.0, 3.0, 1.0, 5.0, 11.0, 7.0, 8.0, 17.0, 23.0, 25.0, 44.0, 60.0, 97.0, 149.0, 265.0, 528.0, 1118.0, 2898.0, 10904.0, 72376.0, 780065.0, 154074.0, 18697.0, 4239.0, 1410.0, 603.0, 335.0, 198.0, 134.0, 82.0, 50.0, 38.0, 19.0, 20.0, 16.0, 13.0, 9.0, 6.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.609375, -23.83203125, -23.0546875, -22.27734375, -21.5, -20.72265625, -19.9453125, -19.16796875, -18.390625, -17.61328125, -16.8359375, -16.05859375, -15.28125, -14.50390625, -13.7265625, -12.94921875, -12.171875, -11.39453125, -10.6171875, -9.83984375, -9.0625, -8.28515625, -7.5078125, -6.73046875, -5.953125, -5.17578125, -4.3984375, -3.62109375, -2.84375, -2.06640625, -1.2890625, -0.51171875, 0.265625, 1.04296875, 1.8203125, 2.59765625, 3.375, 4.15234375, 4.9296875, 5.70703125, 6.484375, 7.26171875, 8.0390625, 8.81640625, 9.59375, 10.37109375, 11.1484375, 11.92578125, 12.703125, 13.48046875, 14.2578125, 15.03515625, 15.8125, 16.58984375, 17.3671875, 18.14453125, 18.921875, 19.69921875, 20.4765625, 21.25390625, 22.03125, 22.80859375, 23.5859375, 24.36328125, 25.140625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 7.0, 9.0, 17.0, 14.0, 19.0, 18.0, 23.0, 36.0, 49.0, 67.0, 167.0, 245.0, 126.0, 55.0, 38.0, 26.0, 21.0, 15.0, 12.0, 11.0, 6.0, 3.0, 7.0, 1.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006988525390625, -0.006778419017791748, -0.006568312644958496, -0.006358206272125244, -0.006148099899291992, -0.00593799352645874, -0.005727887153625488, -0.005517780780792236, -0.005307674407958984, -0.005097568035125732, -0.0048874616622924805, -0.0046773552894592285, -0.0044672489166259766, -0.004257142543792725, -0.004047036170959473, -0.0038369297981262207, -0.0036268234252929688, -0.003416717052459717, -0.003206610679626465, -0.002996504306793213, -0.002786397933959961, -0.002576291561126709, -0.002366185188293457, -0.002156078815460205, -0.0019459724426269531, -0.0017358660697937012, -0.0015257596969604492, -0.0013156533241271973, -0.0011055469512939453, -0.0008954405784606934, -0.0006853342056274414, -0.00047522783279418945, -0.0002651214599609375, -5.501508712768555e-05, 0.0001550912857055664, 0.00036519765853881836, 0.0005753040313720703, 0.0007854104042053223, 0.0009955167770385742, 0.0012056231498718262, 0.0014157295227050781, 0.00162583589553833, 0.001835942268371582, 0.002046048641204834, 0.002256155014038086, 0.002466261386871338, 0.00267636775970459, 0.002886474132537842, 0.0030965805053710938, 0.0033066868782043457, 0.0035167932510375977, 0.0037268996238708496, 0.0039370059967041016, 0.0041471123695373535, 0.0043572187423706055, 0.004567325115203857, 0.004777431488037109, 0.004987537860870361, 0.005197644233703613, 0.005407750606536865, 0.005617856979370117, 0.005827963352203369, 0.006038069725036621, 0.006248176097869873, 0.006458282470703125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 12.0, 5.0, 14.0, 17.0, 26.0, 39.0, 44.0, 64.0, 109.0, 158.0, 236.0, 390.0, 654.0, 1055.0, 1864.0, 3660.0, 8082.0, 22282.0, 82106.0, 547259.0, 288184.0, 60825.0, 17408.0, 6703.0, 3227.0, 1642.0, 897.0, 535.0, 349.0, 228.0, 139.0, 115.0, 61.0, 52.0, 24.0, 25.0, 10.0, 12.0, 9.0, 3.0, 8.0, 5.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.015625, -15.5286865234375, -15.041748046875, -14.5548095703125, -14.06787109375, -13.5809326171875, -13.093994140625, -12.6070556640625, -12.1201171875, -11.6331787109375, -11.146240234375, -10.6593017578125, -10.17236328125, -9.6854248046875, -9.198486328125, -8.7115478515625, -8.224609375, -7.7376708984375, -7.250732421875, -6.7637939453125, -6.27685546875, -5.7899169921875, -5.302978515625, -4.8160400390625, -4.3291015625, -3.8421630859375, -3.355224609375, -2.8682861328125, -2.38134765625, -1.8944091796875, -1.407470703125, -0.9205322265625, -0.43359375, 0.0533447265625, 0.540283203125, 1.0272216796875, 1.51416015625, 2.0010986328125, 2.488037109375, 2.9749755859375, 3.4619140625, 3.9488525390625, 4.435791015625, 4.9227294921875, 5.40966796875, 5.8966064453125, 6.383544921875, 6.8704833984375, 7.357421875, 7.8443603515625, 8.331298828125, 8.8182373046875, 9.30517578125, 9.7921142578125, 10.279052734375, 10.7659912109375, 11.2529296875, 11.7398681640625, 12.226806640625, 12.7137451171875, 13.20068359375, 13.6876220703125, 14.174560546875, 14.6614990234375, 15.1484375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 9.0, 5.0, 10.0, 12.0, 11.0, 16.0, 22.0, 27.0, 27.0, 34.0, 51.0, 46.0, 89.0, 67.0, 90.0, 80.0, 82.0, 66.0, 52.0, 41.0, 37.0, 24.0, 16.0, 13.0, 18.0, 8.0, 8.0, 10.0, 4.0, 4.0, 1.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-17.734375, -17.222412109375, -16.71044921875, -16.198486328125, -15.6865234375, -15.174560546875, -14.66259765625, -14.150634765625, -13.638671875, -13.126708984375, -12.61474609375, -12.102783203125, -11.5908203125, -11.078857421875, -10.56689453125, -10.054931640625, -9.54296875, -9.031005859375, -8.51904296875, -8.007080078125, -7.4951171875, -6.983154296875, -6.47119140625, -5.959228515625, -5.447265625, -4.935302734375, -4.42333984375, -3.911376953125, -3.3994140625, -2.887451171875, -2.37548828125, -1.863525390625, -1.3515625, -0.839599609375, -0.32763671875, 0.184326171875, 0.6962890625, 1.208251953125, 1.72021484375, 2.232177734375, 2.744140625, 3.256103515625, 3.76806640625, 4.280029296875, 4.7919921875, 5.303955078125, 5.81591796875, 6.327880859375, 6.83984375, 7.351806640625, 7.86376953125, 8.375732421875, 8.8876953125, 9.399658203125, 9.91162109375, 10.423583984375, 10.935546875, 11.447509765625, 11.95947265625, 12.471435546875, 12.9833984375, 13.495361328125, 14.00732421875, 14.519287109375, 15.03125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 2.0, 12.0, 4.0, 15.0, 19.0, 40.0, 79.0, 146.0, 250.0, 169.0, 110.0, 67.0, 40.0, 24.0, 8.0, 5.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-589.7750244140625, -574.85107421875, -559.9271240234375, -545.003173828125, -530.0791625976562, -515.1552124023438, -500.23126220703125, -485.30731201171875, -470.38336181640625, -455.45941162109375, -440.5354309082031, -425.6114807128906, -410.6875305175781, -395.7635498046875, -380.839599609375, -365.9156494140625, -350.99169921875, -336.0677490234375, -321.1437683105469, -306.2198181152344, -291.2958679199219, -276.37188720703125, -261.44793701171875, -246.52398681640625, -231.60000610351562, -216.67604064941406, -201.75209045410156, -186.828125, -171.9041748046875, -156.98020935058594, -142.05624389648438, -127.13229370117188, -112.20834350585938, -97.28438568115234, -82.36042785644531, -67.43646240234375, -52.512508392333984, -37.58854675292969, -22.664588928222656, -7.740631103515625, 7.183326721191406, 22.107284545898438, 37.03124237060547, 51.955204010009766, 66.87916564941406, 81.8031234741211, 96.72708129882812, 111.65103912353516, 126.57499694824219, 141.49896240234375, 156.42291259765625, 171.3468780517578, 186.2708282470703, 201.19479370117188, 216.11874389648438, 231.04270935058594, 245.9666748046875, 260.890625, 275.8146057128906, 290.7385559082031, 305.6625061035156, 320.58648681640625, 335.51043701171875, 350.43438720703125, 365.35833740234375]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [4.0, 6.0, 5.0, 3.0, 1.0, 6.0, 4.0, 8.0, 7.0, 6.0, 11.0, 11.0, 9.0, 13.0, 13.0, 14.0, 12.0, 21.0, 26.0, 36.0, 24.0, 34.0, 30.0, 25.0, 53.0, 50.0, 54.0, 67.0, 56.0, 61.0, 44.0, 45.0, 32.0, 22.0, 40.0, 19.0, 15.0, 14.0, 18.0, 13.0, 16.0, 10.0, 15.0, 7.0, 9.0, 11.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-235.69149780273438, -227.13516235351562, -218.57884216308594, -210.02252197265625, -201.4661865234375, -192.90985107421875, -184.35353088378906, -175.79721069335938, -167.24087524414062, -158.68453979492188, -150.1282196044922, -141.5718994140625, -133.01556396484375, -124.45923614501953, -115.90290832519531, -107.3465805053711, -98.79025268554688, -90.23392486572266, -81.67759704589844, -73.12126922607422, -64.56494140625, -56.00861358642578, -47.45228576660156, -38.895957946777344, -30.339630126953125, -21.783302307128906, -13.226974487304688, -4.670646667480469, 3.88568115234375, 12.442008972167969, 20.998336791992188, 29.554664611816406, 38.1109619140625, 46.66728973388672, 55.22361755371094, 63.779945373535156, 72.33627319335938, 80.8926010131836, 89.44892883300781, 98.00525665283203, 106.56158447265625, 115.11791229248047, 123.67424011230469, 132.23056030273438, 140.78689575195312, 149.34323120117188, 157.89955139160156, 166.45587158203125, 175.01220703125, 183.56854248046875, 192.12486267089844, 200.68118286132812, 209.23751831054688, 217.79385375976562, 226.3501739501953, 234.906494140625, 243.46282958984375, 252.0191650390625, 260.57550048828125, 269.1318054199219, 277.6881408691406, 286.2444763183594, 294.80078125, 303.35711669921875, 311.9134521484375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 11.0, 5.0, 12.0, 15.0, 24.0, 41.0, 43.0, 61.0, 70.0, 118.0, 152.0, 183.0, 294.0, 403.0, 502.0, 804.0, 1119.0, 1620.0, 2527.0, 4231.0, 8006.0, 21064.0, 141299.0, 3271810.0, 670810.0, 41736.0, 12005.0, 5626.0, 3002.0, 2017.0, 1366.0, 953.0, 722.0, 465.0, 325.0, 257.0, 152.0, 137.0, 88.0, 62.0, 41.0, 23.0, 25.0, 14.0, 13.0, 6.0, 12.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-39.375, -38.09375, -36.8125, -35.53125, -34.25, -32.96875, -31.6875, -30.40625, -29.125, -27.84375, -26.5625, -25.28125, -24.0, -22.71875, -21.4375, -20.15625, -18.875, -17.59375, -16.3125, -15.03125, -13.75, -12.46875, -11.1875, -9.90625, -8.625, -7.34375, -6.0625, -4.78125, -3.5, -2.21875, -0.9375, 0.34375, 1.625, 2.90625, 4.1875, 5.46875, 6.75, 8.03125, 9.3125, 10.59375, 11.875, 13.15625, 14.4375, 15.71875, 17.0, 18.28125, 19.5625, 20.84375, 22.125, 23.40625, 24.6875, 25.96875, 27.25, 28.53125, 29.8125, 31.09375, 32.375, 33.65625, 34.9375, 36.21875, 37.5, 38.78125, 40.0625, 41.34375, 42.625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 8.0, 7.0, 3.0, 10.0, 12.0, 6.0, 18.0, 29.0, 23.0, 31.0, 43.0, 41.0, 50.0, 34.0, 59.0, 53.0, 45.0, 54.0, 52.0, 41.0, 40.0, 39.0, 52.0, 41.0, 37.0, 28.0, 45.0, 21.0, 16.0, 13.0, 16.0, 10.0, 10.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.1875, -18.632568359375, -18.07763671875, -17.522705078125, -16.9677734375, -16.412841796875, -15.85791015625, -15.302978515625, -14.748046875, -14.193115234375, -13.63818359375, -13.083251953125, -12.5283203125, -11.973388671875, -11.41845703125, -10.863525390625, -10.30859375, -9.753662109375, -9.19873046875, -8.643798828125, -8.0888671875, -7.533935546875, -6.97900390625, -6.424072265625, -5.869140625, -5.314208984375, -4.75927734375, -4.204345703125, -3.6494140625, -3.094482421875, -2.53955078125, -1.984619140625, -1.4296875, -0.874755859375, -0.31982421875, 0.235107421875, 0.7900390625, 1.344970703125, 1.89990234375, 2.454833984375, 3.009765625, 3.564697265625, 4.11962890625, 4.674560546875, 5.2294921875, 5.784423828125, 6.33935546875, 6.894287109375, 7.44921875, 8.004150390625, 8.55908203125, 9.114013671875, 9.6689453125, 10.223876953125, 10.77880859375, 11.333740234375, 11.888671875, 12.443603515625, 12.99853515625, 13.553466796875, 14.1083984375, 14.663330078125, 15.21826171875, 15.773193359375, 16.328125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 8.0, 11.0, 6.0, 9.0, 14.0, 21.0, 25.0, 52.0, 59.0, 107.0, 142.0, 234.0, 467.0, 805.0, 1461.0, 3090.0, 7462.0, 25347.0, 231530.0, 3798287.0, 97563.0, 16998.0, 5565.0, 2325.0, 1138.0, 599.0, 343.0, 215.0, 145.0, 79.0, 43.0, 48.0, 27.0, 18.0, 12.0, 7.0, 7.0, 5.0, 4.0, 3.0, 0.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-74.625, -72.453125, -70.28125, -68.109375, -65.9375, -63.765625, -61.59375, -59.421875, -57.25, -55.078125, -52.90625, -50.734375, -48.5625, -46.390625, -44.21875, -42.046875, -39.875, -37.703125, -35.53125, -33.359375, -31.1875, -29.015625, -26.84375, -24.671875, -22.5, -20.328125, -18.15625, -15.984375, -13.8125, -11.640625, -9.46875, -7.296875, -5.125, -2.953125, -0.78125, 1.390625, 3.5625, 5.734375, 7.90625, 10.078125, 12.25, 14.421875, 16.59375, 18.765625, 20.9375, 23.109375, 25.28125, 27.453125, 29.625, 31.796875, 33.96875, 36.140625, 38.3125, 40.484375, 42.65625, 44.828125, 47.0, 49.171875, 51.34375, 53.515625, 55.6875, 57.859375, 60.03125, 62.203125, 64.375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 3.0, 6.0, 5.0, 4.0, 13.0, 3.0, 5.0, 16.0, 18.0, 31.0, 42.0, 60.0, 130.0, 325.0, 1006.0, 1341.0, 590.0, 203.0, 95.0, 56.0, 37.0, 20.0, 12.0, 14.0, 8.0, 10.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.78125, -53.93603515625, -52.0908203125, -50.24560546875, -48.400390625, -46.55517578125, -44.7099609375, -42.86474609375, -41.01953125, -39.17431640625, -37.3291015625, -35.48388671875, -33.638671875, -31.79345703125, -29.9482421875, -28.10302734375, -26.2578125, -24.41259765625, -22.5673828125, -20.72216796875, -18.876953125, -17.03173828125, -15.1865234375, -13.34130859375, -11.49609375, -9.65087890625, -7.8056640625, -5.96044921875, -4.115234375, -2.27001953125, -0.4248046875, 1.42041015625, 3.265625, 5.11083984375, 6.9560546875, 8.80126953125, 10.646484375, 12.49169921875, 14.3369140625, 16.18212890625, 18.02734375, 19.87255859375, 21.7177734375, 23.56298828125, 25.408203125, 27.25341796875, 29.0986328125, 30.94384765625, 32.7890625, 34.63427734375, 36.4794921875, 38.32470703125, 40.169921875, 42.01513671875, 43.8603515625, 45.70556640625, 47.55078125, 49.39599609375, 51.2412109375, 53.08642578125, 54.931640625, 56.77685546875, 58.6220703125, 60.46728515625, 62.3125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 11.0, 22.0, 52.0, 125.0, 246.0, 295.0, 135.0, 60.0, 22.0, 14.0, 12.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-933.5205078125, -910.7752685546875, -888.0300903320312, -865.2848510742188, -842.5396118164062, -819.79443359375, -797.0491943359375, -774.303955078125, -751.5587158203125, -728.8134765625, -706.0682983398438, -683.3230590820312, -660.5778198242188, -637.8326416015625, -615.08740234375, -592.3421630859375, -569.5969848632812, -546.8517456054688, -524.1065673828125, -501.361328125, -478.6160888671875, -455.8708801269531, -433.12567138671875, -410.38043212890625, -387.6352233886719, -364.8900146484375, -342.144775390625, -319.3995666503906, -296.65435791015625, -273.90911865234375, -251.16390991210938, -228.41868591308594, -205.6734619140625, -182.92823791503906, -160.18301391601562, -137.43780517578125, -114.69258117675781, -91.94735717773438, -69.2021484375, -46.45692443847656, -23.711700439453125, -0.9664802551269531, 21.77873992919922, 44.523956298828125, 67.26918029785156, 90.014404296875, 112.75961303710938, 135.5048370361328, 158.25006103515625, 180.9952850341797, 203.74050903320312, 226.4857177734375, 249.23094177246094, 271.9761657714844, 294.72137451171875, 317.46661376953125, 340.2118225097656, 362.95703125, 385.7022705078125, 408.4474792480469, 431.19268798828125, 453.93792724609375, 476.6831359863281, 499.4283447265625, 522.173583984375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 8.0, 13.0, 8.0, 16.0, 15.0, 20.0, 27.0, 35.0, 44.0, 39.0, 45.0, 46.0, 48.0, 56.0, 74.0, 78.0, 58.0, 57.0, 39.0, 44.0, 38.0, 44.0, 34.0, 21.0, 19.0, 19.0, 8.0, 15.0, 9.0, 6.0, 7.0, 5.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-227.5360565185547, -220.23008728027344, -212.92410278320312, -205.61813354492188, -198.31214904785156, -191.0061798095703, -183.7001953125, -176.39422607421875, -169.08824157714844, -161.7822723388672, -154.47628784179688, -147.17031860351562, -139.8643341064453, -132.55836486816406, -125.25238037109375, -117.9464111328125, -110.64043426513672, -103.33445739746094, -96.02848052978516, -88.72250366210938, -81.4165267944336, -74.11054992675781, -66.80458068847656, -59.498600006103516, -52.192623138427734, -44.88664627075195, -37.58066940307617, -30.274694442749023, -22.968717575073242, -15.662742614746094, -8.356765747070312, -1.0507888793945312, 6.25518798828125, 13.561164855957031, 20.867141723632812, 28.17311668395996, 35.479095458984375, 42.78506851196289, 50.09104537963867, 57.39702224731445, 64.7030029296875, 72.00897979736328, 79.31495666503906, 86.62093353271484, 93.92691040039062, 101.23287963867188, 108.53886413574219, 115.84483337402344, 123.15081024169922, 130.456787109375, 137.76275634765625, 145.06874084472656, 152.3747100830078, 159.68069458007812, 166.98666381835938, 174.2926483154297, 181.59861755371094, 188.9045867919922, 196.2105712890625, 203.51654052734375, 210.82252502441406, 218.1284942626953, 225.43447875976562, 232.74044799804688, 240.0464324951172]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 3.0, 2.0, 10.0, 11.0, 19.0, 31.0, 28.0, 62.0, 80.0, 131.0, 200.0, 303.0, 508.0, 743.0, 1270.0, 2170.0, 4024.0, 7483.0, 15793.0, 37349.0, 101759.0, 291658.0, 358040.0, 137492.0, 48655.0, 20288.0, 9133.0, 4727.0, 2613.0, 1493.0, 923.0, 528.0, 364.0, 223.0, 135.0, 106.0, 59.0, 42.0, 28.0, 21.0, 16.0, 11.0, 13.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.875, -26.9501953125, -26.025390625, -25.1005859375, -24.17578125, -23.2509765625, -22.326171875, -21.4013671875, -20.4765625, -19.5517578125, -18.626953125, -17.7021484375, -16.77734375, -15.8525390625, -14.927734375, -14.0029296875, -13.078125, -12.1533203125, -11.228515625, -10.3037109375, -9.37890625, -8.4541015625, -7.529296875, -6.6044921875, -5.6796875, -4.7548828125, -3.830078125, -2.9052734375, -1.98046875, -1.0556640625, -0.130859375, 0.7939453125, 1.71875, 2.6435546875, 3.568359375, 4.4931640625, 5.41796875, 6.3427734375, 7.267578125, 8.1923828125, 9.1171875, 10.0419921875, 10.966796875, 11.8916015625, 12.81640625, 13.7412109375, 14.666015625, 15.5908203125, 16.515625, 17.4404296875, 18.365234375, 19.2900390625, 20.21484375, 21.1396484375, 22.064453125, 22.9892578125, 23.9140625, 24.8388671875, 25.763671875, 26.6884765625, 27.61328125, 28.5380859375, 29.462890625, 30.3876953125, 31.3125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 9.0, 13.0, 14.0, 8.0, 16.0, 25.0, 31.0, 32.0, 36.0, 41.0, 42.0, 46.0, 47.0, 48.0, 46.0, 44.0, 50.0, 42.0, 55.0, 37.0, 46.0, 36.0, 41.0, 32.0, 22.0, 26.0, 24.0, 20.0, 19.0, 13.0, 10.0, 9.0, 3.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.984375, -19.42236328125, -18.8603515625, -18.29833984375, -17.736328125, -17.17431640625, -16.6123046875, -16.05029296875, -15.48828125, -14.92626953125, -14.3642578125, -13.80224609375, -13.240234375, -12.67822265625, -12.1162109375, -11.55419921875, -10.9921875, -10.43017578125, -9.8681640625, -9.30615234375, -8.744140625, -8.18212890625, -7.6201171875, -7.05810546875, -6.49609375, -5.93408203125, -5.3720703125, -4.81005859375, -4.248046875, -3.68603515625, -3.1240234375, -2.56201171875, -2.0, -1.43798828125, -0.8759765625, -0.31396484375, 0.248046875, 0.81005859375, 1.3720703125, 1.93408203125, 2.49609375, 3.05810546875, 3.6201171875, 4.18212890625, 4.744140625, 5.30615234375, 5.8681640625, 6.43017578125, 6.9921875, 7.55419921875, 8.1162109375, 8.67822265625, 9.240234375, 9.80224609375, 10.3642578125, 10.92626953125, 11.48828125, 12.05029296875, 12.6123046875, 13.17431640625, 13.736328125, 14.29833984375, 14.8603515625, 15.42236328125, 15.984375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 6.0, 11.0, 21.0, 23.0, 38.0, 47.0, 88.0, 177.0, 294.0, 625.0, 1495.0, 4300.0, 15803.0, 90249.0, 725715.0, 174624.0, 25229.0, 6083.0, 2024.0, 836.0, 407.0, 187.0, 107.0, 47.0, 40.0, 19.0, 16.0, 9.0, 13.0, 5.0, 5.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.4375, -58.58642578125, -56.7353515625, -54.88427734375, -53.033203125, -51.18212890625, -49.3310546875, -47.47998046875, -45.62890625, -43.77783203125, -41.9267578125, -40.07568359375, -38.224609375, -36.37353515625, -34.5224609375, -32.67138671875, -30.8203125, -28.96923828125, -27.1181640625, -25.26708984375, -23.416015625, -21.56494140625, -19.7138671875, -17.86279296875, -16.01171875, -14.16064453125, -12.3095703125, -10.45849609375, -8.607421875, -6.75634765625, -4.9052734375, -3.05419921875, -1.203125, 0.64794921875, 2.4990234375, 4.35009765625, 6.201171875, 8.05224609375, 9.9033203125, 11.75439453125, 13.60546875, 15.45654296875, 17.3076171875, 19.15869140625, 21.009765625, 22.86083984375, 24.7119140625, 26.56298828125, 28.4140625, 30.26513671875, 32.1162109375, 33.96728515625, 35.818359375, 37.66943359375, 39.5205078125, 41.37158203125, 43.22265625, 45.07373046875, 46.9248046875, 48.77587890625, 50.626953125, 52.47802734375, 54.3291015625, 56.18017578125, 58.03125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 7.0, 7.0, 5.0, 9.0, 3.0, 18.0, 20.0, 22.0, 17.0, 31.0, 36.0, 28.0, 42.0, 53.0, 48.0, 46.0, 40.0, 42.0, 48.0, 51.0, 64.0, 56.0, 42.0, 43.0, 38.0, 33.0, 31.0, 29.0, 20.0, 15.0, 15.0, 9.0, 12.0, 5.0, 4.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.75, -69.7421875, -67.734375, -65.7265625, -63.71875, -61.7109375, -59.703125, -57.6953125, -55.6875, -53.6796875, -51.671875, -49.6640625, -47.65625, -45.6484375, -43.640625, -41.6328125, -39.625, -37.6171875, -35.609375, -33.6015625, -31.59375, -29.5859375, -27.578125, -25.5703125, -23.5625, -21.5546875, -19.546875, -17.5390625, -15.53125, -13.5234375, -11.515625, -9.5078125, -7.5, -5.4921875, -3.484375, -1.4765625, 0.53125, 2.5390625, 4.546875, 6.5546875, 8.5625, 10.5703125, 12.578125, 14.5859375, 16.59375, 18.6015625, 20.609375, 22.6171875, 24.625, 26.6328125, 28.640625, 30.6484375, 32.65625, 34.6640625, 36.671875, 38.6796875, 40.6875, 42.6953125, 44.703125, 46.7109375, 48.71875, 50.7265625, 52.734375, 54.7421875, 56.75]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 1.0, 8.0, 5.0, 10.0, 14.0, 19.0, 16.0, 22.0, 35.0, 62.0, 89.0, 108.0, 161.0, 267.0, 301.0, 484.0, 703.0, 1047.0, 1684.0, 2886.0, 5505.0, 13662.0, 52094.0, 535490.0, 358952.0, 48651.0, 12911.0, 5562.0, 2910.0, 1623.0, 1006.0, 650.0, 478.0, 362.0, 222.0, 158.0, 99.0, 84.0, 63.0, 42.0, 18.0, 14.0, 19.0, 12.0, 13.0, 7.0, 8.0, 2.0, 5.0, 6.0, 1.0, 1.0, 2.0, 3.0], "bins": [-16.09375, -15.6201171875, -15.146484375, -14.6728515625, -14.19921875, -13.7255859375, -13.251953125, -12.7783203125, -12.3046875, -11.8310546875, -11.357421875, -10.8837890625, -10.41015625, -9.9365234375, -9.462890625, -8.9892578125, -8.515625, -8.0419921875, -7.568359375, -7.0947265625, -6.62109375, -6.1474609375, -5.673828125, -5.2001953125, -4.7265625, -4.2529296875, -3.779296875, -3.3056640625, -2.83203125, -2.3583984375, -1.884765625, -1.4111328125, -0.9375, -0.4638671875, 0.009765625, 0.4833984375, 0.95703125, 1.4306640625, 1.904296875, 2.3779296875, 2.8515625, 3.3251953125, 3.798828125, 4.2724609375, 4.74609375, 5.2197265625, 5.693359375, 6.1669921875, 6.640625, 7.1142578125, 7.587890625, 8.0615234375, 8.53515625, 9.0087890625, 9.482421875, 9.9560546875, 10.4296875, 10.9033203125, 11.376953125, 11.8505859375, 12.32421875, 12.7978515625, 13.271484375, 13.7451171875, 14.21875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 2.0, 0.0, 1.0, 2.0, 7.0, 7.0, 10.0, 12.0, 25.0, 30.0, 47.0, 89.0, 143.0, 180.0, 143.0, 100.0, 74.0, 39.0, 23.0, 20.0, 8.0, 5.0, 1.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.005313873291015625, -0.005145668983459473, -0.00497746467590332, -0.004809260368347168, -0.004641056060791016, -0.004472851753234863, -0.004304647445678711, -0.004136443138122559, -0.003968238830566406, -0.003800034523010254, -0.0036318302154541016, -0.0034636259078979492, -0.003295421600341797, -0.0031272172927856445, -0.002959012985229492, -0.00279080867767334, -0.0026226043701171875, -0.002454400062561035, -0.002286195755004883, -0.0021179914474487305, -0.0019497871398925781, -0.0017815828323364258, -0.0016133785247802734, -0.001445174217224121, -0.0012769699096679688, -0.0011087656021118164, -0.0009405612945556641, -0.0007723569869995117, -0.0006041526794433594, -0.00043594837188720703, -0.0002677440643310547, -9.953975677490234e-05, 6.866455078125e-05, 0.00023686885833740234, 0.0004050731658935547, 0.000573277473449707, 0.0007414817810058594, 0.0009096860885620117, 0.001077890396118164, 0.0012460947036743164, 0.0014142990112304688, 0.001582503318786621, 0.0017507076263427734, 0.0019189119338989258, 0.002087116241455078, 0.0022553205490112305, 0.002423524856567383, 0.002591729164123535, 0.0027599334716796875, 0.00292813777923584, 0.003096342086791992, 0.0032645463943481445, 0.003432750701904297, 0.0036009550094604492, 0.0037691593170166016, 0.003937363624572754, 0.004105567932128906, 0.004273772239685059, 0.004441976547241211, 0.004610180854797363, 0.004778385162353516, 0.004946589469909668, 0.00511479377746582, 0.005282998085021973, 0.005451202392578125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 7.0, 11.0, 15.0, 12.0, 26.0, 29.0, 34.0, 72.0, 117.0, 193.0, 321.0, 458.0, 956.0, 1599.0, 3088.0, 6714.0, 17319.0, 56668.0, 265750.0, 569301.0, 84634.0, 23747.0, 8937.0, 4029.0, 1925.0, 1057.0, 603.0, 345.0, 212.0, 130.0, 71.0, 53.0, 40.0, 30.0, 17.0, 7.0, 13.0, 7.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.5703125, -12.1390380859375, -11.707763671875, -11.2764892578125, -10.84521484375, -10.4139404296875, -9.982666015625, -9.5513916015625, -9.1201171875, -8.6888427734375, -8.257568359375, -7.8262939453125, -7.39501953125, -6.9637451171875, -6.532470703125, -6.1011962890625, -5.669921875, -5.2386474609375, -4.807373046875, -4.3760986328125, -3.94482421875, -3.5135498046875, -3.082275390625, -2.6510009765625, -2.2197265625, -1.7884521484375, -1.357177734375, -0.9259033203125, -0.49462890625, -0.0633544921875, 0.367919921875, 0.7991943359375, 1.23046875, 1.6617431640625, 2.093017578125, 2.5242919921875, 2.95556640625, 3.3868408203125, 3.818115234375, 4.2493896484375, 4.6806640625, 5.1119384765625, 5.543212890625, 5.9744873046875, 6.40576171875, 6.8370361328125, 7.268310546875, 7.6995849609375, 8.130859375, 8.5621337890625, 8.993408203125, 9.4246826171875, 9.85595703125, 10.2872314453125, 10.718505859375, 11.1497802734375, 11.5810546875, 12.0123291015625, 12.443603515625, 12.8748779296875, 13.30615234375, 13.7374267578125, 14.168701171875, 14.5999755859375, 15.03125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 4.0, 8.0, 14.0, 16.0, 9.0, 19.0, 17.0, 23.0, 41.0, 56.0, 54.0, 62.0, 104.0, 96.0, 79.0, 79.0, 62.0, 58.0, 37.0, 32.0, 24.0, 13.0, 15.0, 14.0, 11.0, 9.0, 5.0, 5.0, 5.0, 2.0, 4.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.0234375, -11.61474609375, -11.2060546875, -10.79736328125, -10.388671875, -9.97998046875, -9.5712890625, -9.16259765625, -8.75390625, -8.34521484375, -7.9365234375, -7.52783203125, -7.119140625, -6.71044921875, -6.3017578125, -5.89306640625, -5.484375, -5.07568359375, -4.6669921875, -4.25830078125, -3.849609375, -3.44091796875, -3.0322265625, -2.62353515625, -2.21484375, -1.80615234375, -1.3974609375, -0.98876953125, -0.580078125, -0.17138671875, 0.2373046875, 0.64599609375, 1.0546875, 1.46337890625, 1.8720703125, 2.28076171875, 2.689453125, 3.09814453125, 3.5068359375, 3.91552734375, 4.32421875, 4.73291015625, 5.1416015625, 5.55029296875, 5.958984375, 6.36767578125, 6.7763671875, 7.18505859375, 7.59375, 8.00244140625, 8.4111328125, 8.81982421875, 9.228515625, 9.63720703125, 10.0458984375, 10.45458984375, 10.86328125, 11.27197265625, 11.6806640625, 12.08935546875, 12.498046875, 12.90673828125, 13.3154296875, 13.72412109375, 14.1328125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 8.0, 4.0, 7.0, 6.0, 17.0, 52.0, 83.0, 126.0, 287.0, 212.0, 97.0, 65.0, 15.0, 14.0, 6.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-467.85528564453125, -452.68414306640625, -437.5130310058594, -422.3418884277344, -407.1707458496094, -391.9996337890625, -376.8284912109375, -361.6573486328125, -346.4862060546875, -331.3150634765625, -316.1439514160156, -300.9728088378906, -285.8016662597656, -270.63055419921875, -255.45941162109375, -240.28826904296875, -225.11715698242188, -209.94602966308594, -194.77488708496094, -179.603759765625, -164.4326171875, -149.26148986816406, -134.09036254882812, -118.91922760009766, -103.74809265136719, -88.57695770263672, -73.40582275390625, -58.23469543457031, -43.063560485839844, -27.892425537109375, -12.721298217773438, 2.4498367309570312, 17.620941162109375, 32.792076110839844, 47.96320724487305, 63.13433837890625, 78.30547332763672, 93.47660827636719, 108.64773559570312, 123.8188705444336, 138.99000549316406, 154.1611328125, 169.332275390625, 184.50340270996094, 199.67453002929688, 214.84567260742188, 230.0167999267578, 245.18792724609375, 260.35906982421875, 275.53021240234375, 290.7013244628906, 305.8724670410156, 321.0436096191406, 336.2147216796875, 351.3858642578125, 366.5570068359375, 381.7281494140625, 396.8992919921875, 412.0704040527344, 427.2415466308594, 442.4126892089844, 457.58380126953125, 472.75494384765625, 487.92608642578125, 503.0971984863281]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 8.0, 2.0, 3.0, 6.0, 7.0, 12.0, 8.0, 16.0, 15.0, 22.0, 26.0, 24.0, 24.0, 37.0, 34.0, 41.0, 50.0, 55.0, 67.0, 105.0, 75.0, 60.0, 46.0, 39.0, 44.0, 27.0, 25.0, 18.0, 18.0, 21.0, 12.0, 13.0, 14.0, 7.0, 8.0, 6.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-244.37013244628906, -235.69248962402344, -227.01486206054688, -218.33721923828125, -209.65957641601562, -200.98193359375, -192.30429077148438, -183.6266632080078, -174.9490203857422, -166.27137756347656, -157.59375, -148.91610717773438, -140.23846435546875, -131.56082153320312, -122.88318634033203, -114.20555114746094, -105.52790832519531, -96.85026550292969, -88.1726303100586, -79.4949951171875, -70.81735229492188, -62.139713287353516, -53.462074279785156, -44.7844352722168, -36.10679626464844, -27.429157257080078, -18.75151824951172, -10.07387924194336, -1.396240234375, 7.281398773193359, 15.959037780761719, 24.636676788330078, 33.3143310546875, 41.99197006225586, 50.66960906982422, 59.34724807739258, 68.02488708496094, 76.70252990722656, 85.38016510009766, 94.05780029296875, 102.73544311523438, 111.4130859375, 120.0907211303711, 128.7683563232422, 137.4459991455078, 146.12364196777344, 154.80126953125, 163.47891235351562, 172.15655517578125, 180.83419799804688, 189.5118408203125, 198.18946838378906, 206.8671112060547, 215.5447540283203, 224.22238159179688, 232.9000244140625, 241.57766723632812, 250.25531005859375, 258.9329528808594, 267.610595703125, 276.2882080078125, 284.9658508300781, 293.64349365234375, 302.3211364746094, 310.998779296875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 5.0, 6.0, 21.0, 22.0, 34.0, 42.0, 49.0, 110.0, 113.0, 157.0, 246.0, 400.0, 579.0, 973.0, 1602.0, 2951.0, 6391.0, 18890.0, 216897.0, 3675276.0, 235769.0, 20055.0, 6406.0, 2920.0, 1639.0, 963.0, 584.0, 371.0, 251.0, 166.0, 128.0, 82.0, 43.0, 40.0, 29.0, 22.0, 14.0, 9.0, 6.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.65625, -42.1767578125, -40.697265625, -39.2177734375, -37.73828125, -36.2587890625, -34.779296875, -33.2998046875, -31.8203125, -30.3408203125, -28.861328125, -27.3818359375, -25.90234375, -24.4228515625, -22.943359375, -21.4638671875, -19.984375, -18.5048828125, -17.025390625, -15.5458984375, -14.06640625, -12.5869140625, -11.107421875, -9.6279296875, -8.1484375, -6.6689453125, -5.189453125, -3.7099609375, -2.23046875, -0.7509765625, 0.728515625, 2.2080078125, 3.6875, 5.1669921875, 6.646484375, 8.1259765625, 9.60546875, 11.0849609375, 12.564453125, 14.0439453125, 15.5234375, 17.0029296875, 18.482421875, 19.9619140625, 21.44140625, 22.9208984375, 24.400390625, 25.8798828125, 27.359375, 28.8388671875, 30.318359375, 31.7978515625, 33.27734375, 34.7568359375, 36.236328125, 37.7158203125, 39.1953125, 40.6748046875, 42.154296875, 43.6337890625, 45.11328125, 46.5927734375, 48.072265625, 49.5517578125, 51.03125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 9.0, 6.0, 9.0, 5.0, 13.0, 5.0, 13.0, 10.0, 20.0, 24.0, 26.0, 29.0, 35.0, 33.0, 35.0, 33.0, 44.0, 44.0, 43.0, 56.0, 44.0, 33.0, 52.0, 44.0, 33.0, 39.0, 45.0, 26.0, 44.0, 27.0, 16.0, 15.0, 18.0, 15.0, 12.0, 14.0, 9.0, 5.0, 11.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.34375, -16.849609375, -16.35546875, -15.861328125, -15.3671875, -14.873046875, -14.37890625, -13.884765625, -13.390625, -12.896484375, -12.40234375, -11.908203125, -11.4140625, -10.919921875, -10.42578125, -9.931640625, -9.4375, -8.943359375, -8.44921875, -7.955078125, -7.4609375, -6.966796875, -6.47265625, -5.978515625, -5.484375, -4.990234375, -4.49609375, -4.001953125, -3.5078125, -3.013671875, -2.51953125, -2.025390625, -1.53125, -1.037109375, -0.54296875, -0.048828125, 0.4453125, 0.939453125, 1.43359375, 1.927734375, 2.421875, 2.916015625, 3.41015625, 3.904296875, 4.3984375, 4.892578125, 5.38671875, 5.880859375, 6.375, 6.869140625, 7.36328125, 7.857421875, 8.3515625, 8.845703125, 9.33984375, 9.833984375, 10.328125, 10.822265625, 11.31640625, 11.810546875, 12.3046875, 12.798828125, 13.29296875, 13.787109375, 14.28125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 3.0, 12.0, 14.0, 24.0, 27.0, 62.0, 112.0, 238.0, 481.0, 1207.0, 3453.0, 15079.0, 328552.0, 3802348.0, 33963.0, 5662.0, 1754.0, 671.0, 307.0, 119.0, 62.0, 36.0, 21.0, 17.0, 11.0, 4.0, 6.0, 3.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-85.3125, -82.4873046875, -79.662109375, -76.8369140625, -74.01171875, -71.1865234375, -68.361328125, -65.5361328125, -62.7109375, -59.8857421875, -57.060546875, -54.2353515625, -51.41015625, -48.5849609375, -45.759765625, -42.9345703125, -40.109375, -37.2841796875, -34.458984375, -31.6337890625, -28.80859375, -25.9833984375, -23.158203125, -20.3330078125, -17.5078125, -14.6826171875, -11.857421875, -9.0322265625, -6.20703125, -3.3818359375, -0.556640625, 2.2685546875, 5.09375, 7.9189453125, 10.744140625, 13.5693359375, 16.39453125, 19.2197265625, 22.044921875, 24.8701171875, 27.6953125, 30.5205078125, 33.345703125, 36.1708984375, 38.99609375, 41.8212890625, 44.646484375, 47.4716796875, 50.296875, 53.1220703125, 55.947265625, 58.7724609375, 61.59765625, 64.4228515625, 67.248046875, 70.0732421875, 72.8984375, 75.7236328125, 78.548828125, 81.3740234375, 84.19921875, 87.0244140625, 89.849609375, 92.6748046875, 95.5]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 6.0, 4.0, 4.0, 7.0, 5.0, 11.0, 11.0, 20.0, 41.0, 60.0, 97.0, 197.0, 588.0, 1329.0, 957.0, 356.0, 148.0, 74.0, 46.0, 35.0, 20.0, 20.0, 6.0, 6.0, 11.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.0625, -49.45458984375, -47.8466796875, -46.23876953125, -44.630859375, -43.02294921875, -41.4150390625, -39.80712890625, -38.19921875, -36.59130859375, -34.9833984375, -33.37548828125, -31.767578125, -30.15966796875, -28.5517578125, -26.94384765625, -25.3359375, -23.72802734375, -22.1201171875, -20.51220703125, -18.904296875, -17.29638671875, -15.6884765625, -14.08056640625, -12.47265625, -10.86474609375, -9.2568359375, -7.64892578125, -6.041015625, -4.43310546875, -2.8251953125, -1.21728515625, 0.390625, 1.99853515625, 3.6064453125, 5.21435546875, 6.822265625, 8.43017578125, 10.0380859375, 11.64599609375, 13.25390625, 14.86181640625, 16.4697265625, 18.07763671875, 19.685546875, 21.29345703125, 22.9013671875, 24.50927734375, 26.1171875, 27.72509765625, 29.3330078125, 30.94091796875, 32.548828125, 34.15673828125, 35.7646484375, 37.37255859375, 38.98046875, 40.58837890625, 42.1962890625, 43.80419921875, 45.412109375, 47.02001953125, 48.6279296875, 50.23583984375, 51.84375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 7.0, 11.0, 9.0, 12.0, 29.0, 58.0, 79.0, 125.0, 181.0, 191.0, 116.0, 80.0, 53.0, 24.0, 12.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-399.2503967285156, -387.8344421386719, -376.41845703125, -365.00250244140625, -353.5865173339844, -342.1705627441406, -330.75457763671875, -319.338623046875, -307.92266845703125, -296.5067138671875, -285.0907287597656, -273.6747741699219, -262.2587890625, -250.84283447265625, -239.42686462402344, -228.01089477539062, -216.59490966796875, -205.17893981933594, -193.76296997070312, -182.34701538085938, -170.9310302734375, -159.51507568359375, -148.09910583496094, -136.68313598632812, -125.26716613769531, -113.8511962890625, -102.43522644042969, -91.0192642211914, -79.6032943725586, -68.18732452392578, -56.7713623046875, -45.35539245605469, -33.939453125, -22.52348518371582, -11.10751724243164, 0.30844879150390625, 11.724418640136719, 23.14038848876953, 34.55635070800781, 45.972320556640625, 57.38829040527344, 68.80426025390625, 80.22023010253906, 91.63619232177734, 103.05216217041016, 114.46813201904297, 125.88409423828125, 137.30006408691406, 148.71603393554688, 160.1320037841797, 171.5479736328125, 182.96392822265625, 194.37991333007812, 205.79586791992188, 217.2118377685547, 228.6278076171875, 240.0437774658203, 251.45974731445312, 262.8757019042969, 274.29168701171875, 285.7076416015625, 297.1236267089844, 308.5395812988281, 319.95556640625, 331.37152099609375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 6.0, 4.0, 4.0, 6.0, 9.0, 17.0, 16.0, 19.0, 20.0, 16.0, 21.0, 22.0, 30.0, 36.0, 37.0, 45.0, 50.0, 47.0, 70.0, 46.0, 48.0, 64.0, 46.0, 41.0, 48.0, 37.0, 27.0, 31.0, 24.0, 25.0, 21.0, 14.0, 14.0, 15.0, 2.0, 6.0, 5.0, 6.0, 4.0, 1.0, 7.0, 1.0, 0.0, 1.0], "bins": [-212.7361602783203, -207.28536987304688, -201.83456420898438, -196.38377380371094, -190.93296813964844, -185.482177734375, -180.0313720703125, -174.58058166503906, -169.12977600097656, -163.67898559570312, -158.22817993164062, -152.7773895263672, -147.3265838623047, -141.87579345703125, -136.42498779296875, -130.9741973876953, -125.52339935302734, -120.07260131835938, -114.6218032836914, -109.17100524902344, -103.72020721435547, -98.2694091796875, -92.81861877441406, -87.36781311035156, -81.91702270507812, -76.46622467041016, -71.01542663574219, -65.56462860107422, -60.11383056640625, -54.66303253173828, -49.21223831176758, -43.76144027709961, -38.310638427734375, -32.859840393066406, -27.409042358398438, -21.9582462310791, -16.507448196411133, -11.056650161743164, -5.605854034423828, -0.15505599975585938, 5.295742034912109, 10.746540069580078, 16.197338104248047, 21.648134231567383, 27.09893226623535, 32.54972839355469, 38.000526428222656, 43.451324462890625, 48.902122497558594, 54.35292053222656, 59.80371856689453, 65.2545166015625, 70.70531463623047, 76.15611267089844, 81.60690307617188, 87.05770874023438, 92.50849914550781, 97.95929718017578, 103.41009521484375, 108.86089324951172, 114.31169128417969, 119.76248931884766, 125.21328735351562, 130.66407775878906, 136.11488342285156]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 5.0, 10.0, 12.0, 12.0, 24.0, 41.0, 57.0, 106.0, 202.0, 320.0, 708.0, 1571.0, 3680.0, 9629.0, 27023.0, 88331.0, 340403.0, 412279.0, 112084.0, 32726.0, 11317.0, 4416.0, 1858.0, 824.0, 368.0, 211.0, 106.0, 82.0, 52.0, 32.0, 14.0, 11.0, 10.0, 9.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.9375, -29.9423828125, -28.947265625, -27.9521484375, -26.95703125, -25.9619140625, -24.966796875, -23.9716796875, -22.9765625, -21.9814453125, -20.986328125, -19.9912109375, -18.99609375, -18.0009765625, -17.005859375, -16.0107421875, -15.015625, -14.0205078125, -13.025390625, -12.0302734375, -11.03515625, -10.0400390625, -9.044921875, -8.0498046875, -7.0546875, -6.0595703125, -5.064453125, -4.0693359375, -3.07421875, -2.0791015625, -1.083984375, -0.0888671875, 0.90625, 1.9013671875, 2.896484375, 3.8916015625, 4.88671875, 5.8818359375, 6.876953125, 7.8720703125, 8.8671875, 9.8623046875, 10.857421875, 11.8525390625, 12.84765625, 13.8427734375, 14.837890625, 15.8330078125, 16.828125, 17.8232421875, 18.818359375, 19.8134765625, 20.80859375, 21.8037109375, 22.798828125, 23.7939453125, 24.7890625, 25.7841796875, 26.779296875, 27.7744140625, 28.76953125, 29.7646484375, 30.759765625, 31.7548828125, 32.75]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 4.0, 2.0, 4.0, 10.0, 9.0, 10.0, 11.0, 15.0, 27.0, 23.0, 22.0, 34.0, 28.0, 33.0, 29.0, 40.0, 40.0, 39.0, 43.0, 41.0, 53.0, 47.0, 50.0, 44.0, 32.0, 44.0, 44.0, 39.0, 30.0, 23.0, 20.0, 17.0, 16.0, 16.0, 16.0, 9.0, 11.0, 3.0, 5.0, 3.0, 5.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.515625, -16.989013671875, -16.46240234375, -15.935791015625, -15.4091796875, -14.882568359375, -14.35595703125, -13.829345703125, -13.302734375, -12.776123046875, -12.24951171875, -11.722900390625, -11.1962890625, -10.669677734375, -10.14306640625, -9.616455078125, -9.08984375, -8.563232421875, -8.03662109375, -7.510009765625, -6.9833984375, -6.456787109375, -5.93017578125, -5.403564453125, -4.876953125, -4.350341796875, -3.82373046875, -3.297119140625, -2.7705078125, -2.243896484375, -1.71728515625, -1.190673828125, -0.6640625, -0.137451171875, 0.38916015625, 0.915771484375, 1.4423828125, 1.968994140625, 2.49560546875, 3.022216796875, 3.548828125, 4.075439453125, 4.60205078125, 5.128662109375, 5.6552734375, 6.181884765625, 6.70849609375, 7.235107421875, 7.76171875, 8.288330078125, 8.81494140625, 9.341552734375, 9.8681640625, 10.394775390625, 10.92138671875, 11.447998046875, 11.974609375, 12.501220703125, 13.02783203125, 13.554443359375, 14.0810546875, 14.607666015625, 15.13427734375, 15.660888671875, 16.1875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 3.0, 4.0, 9.0, 18.0, 14.0, 22.0, 18.0, 30.0, 51.0, 70.0, 87.0, 129.0, 186.0, 290.0, 405.0, 689.0, 1250.0, 2615.0, 6412.0, 19645.0, 81202.0, 636985.0, 234091.0, 43446.0, 12002.0, 4385.0, 1892.0, 947.0, 548.0, 337.0, 215.0, 147.0, 92.0, 67.0, 68.0, 45.0, 26.0, 19.0, 18.0, 19.0, 15.0, 8.0, 10.0, 3.0, 6.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-36.53125, -35.30517578125, -34.0791015625, -32.85302734375, -31.626953125, -30.40087890625, -29.1748046875, -27.94873046875, -26.72265625, -25.49658203125, -24.2705078125, -23.04443359375, -21.818359375, -20.59228515625, -19.3662109375, -18.14013671875, -16.9140625, -15.68798828125, -14.4619140625, -13.23583984375, -12.009765625, -10.78369140625, -9.5576171875, -8.33154296875, -7.10546875, -5.87939453125, -4.6533203125, -3.42724609375, -2.201171875, -0.97509765625, 0.2509765625, 1.47705078125, 2.703125, 3.92919921875, 5.1552734375, 6.38134765625, 7.607421875, 8.83349609375, 10.0595703125, 11.28564453125, 12.51171875, 13.73779296875, 14.9638671875, 16.18994140625, 17.416015625, 18.64208984375, 19.8681640625, 21.09423828125, 22.3203125, 23.54638671875, 24.7724609375, 25.99853515625, 27.224609375, 28.45068359375, 29.6767578125, 30.90283203125, 32.12890625, 33.35498046875, 34.5810546875, 35.80712890625, 37.033203125, 38.25927734375, 39.4853515625, 40.71142578125, 41.9375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 5.0, 6.0, 6.0, 1.0, 9.0, 11.0, 13.0, 13.0, 11.0, 13.0, 26.0, 37.0, 35.0, 33.0, 36.0, 51.0, 58.0, 42.0, 64.0, 62.0, 53.0, 40.0, 39.0, 50.0, 43.0, 31.0, 42.0, 24.0, 24.0, 26.0, 20.0, 6.0, 17.0, 11.0, 12.0, 8.0, 4.0, 3.0, 3.0, 4.0, 8.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.1875, -68.17919921875, -66.1708984375, -64.16259765625, -62.154296875, -60.14599609375, -58.1376953125, -56.12939453125, -54.12109375, -52.11279296875, -50.1044921875, -48.09619140625, -46.087890625, -44.07958984375, -42.0712890625, -40.06298828125, -38.0546875, -36.04638671875, -34.0380859375, -32.02978515625, -30.021484375, -28.01318359375, -26.0048828125, -23.99658203125, -21.98828125, -19.97998046875, -17.9716796875, -15.96337890625, -13.955078125, -11.94677734375, -9.9384765625, -7.93017578125, -5.921875, -3.91357421875, -1.9052734375, 0.10302734375, 2.111328125, 4.11962890625, 6.1279296875, 8.13623046875, 10.14453125, 12.15283203125, 14.1611328125, 16.16943359375, 18.177734375, 20.18603515625, 22.1943359375, 24.20263671875, 26.2109375, 28.21923828125, 30.2275390625, 32.23583984375, 34.244140625, 36.25244140625, 38.2607421875, 40.26904296875, 42.27734375, 44.28564453125, 46.2939453125, 48.30224609375, 50.310546875, 52.31884765625, 54.3271484375, 56.33544921875, 58.34375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 4.0, 3.0, 3.0, 9.0, 6.0, 8.0, 15.0, 30.0, 25.0, 40.0, 56.0, 103.0, 172.0, 264.0, 493.0, 869.0, 1950.0, 4661.0, 13666.0, 51330.0, 572143.0, 334785.0, 47041.0, 12563.0, 4414.0, 1834.0, 876.0, 485.0, 256.0, 140.0, 113.0, 54.0, 40.0, 24.0, 15.0, 12.0, 12.0, 14.0, 6.0, 4.0, 4.0, 5.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.578125, -10.236572265625, -9.89501953125, -9.553466796875, -9.2119140625, -8.870361328125, -8.52880859375, -8.187255859375, -7.845703125, -7.504150390625, -7.16259765625, -6.821044921875, -6.4794921875, -6.137939453125, -5.79638671875, -5.454833984375, -5.11328125, -4.771728515625, -4.43017578125, -4.088623046875, -3.7470703125, -3.405517578125, -3.06396484375, -2.722412109375, -2.380859375, -2.039306640625, -1.69775390625, -1.356201171875, -1.0146484375, -0.673095703125, -0.33154296875, 0.010009765625, 0.3515625, 0.693115234375, 1.03466796875, 1.376220703125, 1.7177734375, 2.059326171875, 2.40087890625, 2.742431640625, 3.083984375, 3.425537109375, 3.76708984375, 4.108642578125, 4.4501953125, 4.791748046875, 5.13330078125, 5.474853515625, 5.81640625, 6.157958984375, 6.49951171875, 6.841064453125, 7.1826171875, 7.524169921875, 7.86572265625, 8.207275390625, 8.548828125, 8.890380859375, 9.23193359375, 9.573486328125, 9.9150390625, 10.256591796875, 10.59814453125, 10.939697265625, 11.28125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 4.0, 5.0, 6.0, 10.0, 6.0, 6.0, 10.0, 25.0, 19.0, 28.0, 39.0, 77.0, 123.0, 171.0, 139.0, 93.0, 56.0, 44.0, 24.0, 25.0, 15.0, 12.0, 18.0, 8.0, 7.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00240325927734375, -0.0023134350776672363, -0.0022236108779907227, -0.002133786678314209, -0.0020439624786376953, -0.0019541382789611816, -0.001864314079284668, -0.0017744898796081543, -0.0016846656799316406, -0.001594841480255127, -0.0015050172805786133, -0.0014151930809020996, -0.001325368881225586, -0.0012355446815490723, -0.0011457204818725586, -0.001055896282196045, -0.0009660720825195312, -0.0008762478828430176, -0.0007864236831665039, -0.0006965994834899902, -0.0006067752838134766, -0.0005169510841369629, -0.0004271268844604492, -0.00033730268478393555, -0.0002474784851074219, -0.0001576542854309082, -6.783008575439453e-05, 2.199411392211914e-05, 0.00011181831359863281, 0.00020164251327514648, 0.00029146671295166016, 0.00038129091262817383, 0.0004711151123046875, 0.0005609393119812012, 0.0006507635116577148, 0.0007405877113342285, 0.0008304119110107422, 0.0009202361106872559, 0.0010100603103637695, 0.0010998845100402832, 0.0011897087097167969, 0.0012795329093933105, 0.0013693571090698242, 0.0014591813087463379, 0.0015490055084228516, 0.0016388297080993652, 0.001728653907775879, 0.0018184781074523926, 0.0019083023071289062, 0.00199812650680542, 0.0020879507064819336, 0.0021777749061584473, 0.002267599105834961, 0.0023574233055114746, 0.0024472475051879883, 0.002537071704864502, 0.0026268959045410156, 0.0027167201042175293, 0.002806544303894043, 0.0028963685035705566, 0.0029861927032470703, 0.003076016902923584, 0.0031658411026000977, 0.0032556653022766113, 0.003345489501953125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 11.0, 8.0, 11.0, 11.0, 16.0, 18.0, 40.0, 73.0, 97.0, 151.0, 281.0, 536.0, 1109.0, 2346.0, 5674.0, 17507.0, 75170.0, 719393.0, 178600.0, 31527.0, 9461.0, 3416.0, 1500.0, 659.0, 380.0, 223.0, 118.0, 76.0, 47.0, 25.0, 16.0, 13.0, 17.0, 5.0, 8.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.3359375, -11.9208984375, -11.505859375, -11.0908203125, -10.67578125, -10.2607421875, -9.845703125, -9.4306640625, -9.015625, -8.6005859375, -8.185546875, -7.7705078125, -7.35546875, -6.9404296875, -6.525390625, -6.1103515625, -5.6953125, -5.2802734375, -4.865234375, -4.4501953125, -4.03515625, -3.6201171875, -3.205078125, -2.7900390625, -2.375, -1.9599609375, -1.544921875, -1.1298828125, -0.71484375, -0.2998046875, 0.115234375, 0.5302734375, 0.9453125, 1.3603515625, 1.775390625, 2.1904296875, 2.60546875, 3.0205078125, 3.435546875, 3.8505859375, 4.265625, 4.6806640625, 5.095703125, 5.5107421875, 5.92578125, 6.3408203125, 6.755859375, 7.1708984375, 7.5859375, 8.0009765625, 8.416015625, 8.8310546875, 9.24609375, 9.6611328125, 10.076171875, 10.4912109375, 10.90625, 11.3212890625, 11.736328125, 12.1513671875, 12.56640625, 12.9814453125, 13.396484375, 13.8115234375, 14.2265625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 5.0, 4.0, 6.0, 6.0, 7.0, 14.0, 10.0, 13.0, 18.0, 18.0, 23.0, 33.0, 41.0, 58.0, 75.0, 95.0, 120.0, 105.0, 86.0, 73.0, 47.0, 38.0, 28.0, 26.0, 9.0, 12.0, 4.0, 4.0, 6.0, 4.0, 6.0, 1.0, 0.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.75, -8.3936767578125, -8.037353515625, -7.6810302734375, -7.32470703125, -6.9683837890625, -6.612060546875, -6.2557373046875, -5.8994140625, -5.5430908203125, -5.186767578125, -4.8304443359375, -4.47412109375, -4.1177978515625, -3.761474609375, -3.4051513671875, -3.048828125, -2.6925048828125, -2.336181640625, -1.9798583984375, -1.62353515625, -1.2672119140625, -0.910888671875, -0.5545654296875, -0.1982421875, 0.1580810546875, 0.514404296875, 0.8707275390625, 1.22705078125, 1.5833740234375, 1.939697265625, 2.2960205078125, 2.65234375, 3.0086669921875, 3.364990234375, 3.7213134765625, 4.07763671875, 4.4339599609375, 4.790283203125, 5.1466064453125, 5.5029296875, 5.8592529296875, 6.215576171875, 6.5718994140625, 6.92822265625, 7.2845458984375, 7.640869140625, 7.9971923828125, 8.353515625, 8.7098388671875, 9.066162109375, 9.4224853515625, 9.77880859375, 10.1351318359375, 10.491455078125, 10.8477783203125, 11.2041015625, 11.5604248046875, 11.916748046875, 12.2730712890625, 12.62939453125, 12.9857177734375, 13.342041015625, 13.6983642578125, 14.0546875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 4.0, 10.0, 7.0, 29.0, 44.0, 105.0, 187.0, 340.0, 148.0, 66.0, 37.0, 11.0, 9.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-558.8031005859375, -546.2099609375, -533.6168823242188, -521.0237426757812, -508.4306335449219, -495.8375244140625, -483.244384765625, -470.6512756347656, -458.05816650390625, -445.4650573730469, -432.8719482421875, -420.27880859375, -407.6856994628906, -395.09259033203125, -382.49945068359375, -369.9063415527344, -357.313232421875, -344.7201232910156, -332.12701416015625, -319.53387451171875, -306.9407653808594, -294.34765625, -281.7545166015625, -269.1614074707031, -256.56829833984375, -243.97518920898438, -231.38206481933594, -218.7889404296875, -206.19583129882812, -193.60272216796875, -181.0095977783203, -168.41647338867188, -155.8233642578125, -143.23025512695312, -130.6371307373047, -118.04401397705078, -105.45089721679688, -92.85778045654297, -80.26466369628906, -67.67154693603516, -55.07843017578125, -42.485313415527344, -29.892196655273438, -17.29907989501953, -4.705963134765625, 7.887153625488281, 20.480270385742188, 33.073387145996094, 45.66650390625, 58.259620666503906, 70.85273742675781, 83.44585418701172, 96.03897094726562, 108.63208770751953, 121.22520446777344, 133.81832885742188, 146.41143798828125, 159.00454711914062, 171.59767150878906, 184.1907958984375, 196.78390502929688, 209.37701416015625, 221.9701385498047, 234.56326293945312, 247.1563720703125]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 0.0, 7.0, 5.0, 2.0, 7.0, 11.0, 9.0, 12.0, 11.0, 11.0, 15.0, 17.0, 26.0, 25.0, 28.0, 26.0, 30.0, 32.0, 52.0, 51.0, 105.0, 106.0, 75.0, 41.0, 47.0, 36.0, 25.0, 23.0, 24.0, 19.0, 19.0, 20.0, 15.0, 12.0, 10.0, 11.0, 10.0, 7.0, 4.0, 4.0, 6.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-241.28353881835938, -234.0697479248047, -226.85594177246094, -219.64215087890625, -212.4283447265625, -205.2145538330078, -198.00076293945312, -190.78695678710938, -183.57315063476562, -176.35935974121094, -169.1455535888672, -161.9317626953125, -154.71795654296875, -147.50416564941406, -140.29037475585938, -133.07656860351562, -125.86277770996094, -118.64897918701172, -111.4351806640625, -104.22138977050781, -97.00758361816406, -89.79379272460938, -82.57999420166016, -75.36619567871094, -68.15239715576172, -60.9385986328125, -53.72480010986328, -46.51100540161133, -39.29720687866211, -32.08340835571289, -24.869613647460938, -17.65581512451172, -10.4420166015625, -3.2282190322875977, 3.9855785369873047, 11.19937515258789, 18.41317367553711, 25.626972198486328, 32.84076690673828, 40.0545654296875, 47.26836395263672, 54.48216247558594, 61.695960998535156, 68.90975952148438, 76.12355041503906, 83.33735656738281, 90.5511474609375, 97.76494598388672, 104.97874450683594, 112.19254302978516, 119.40634155273438, 126.62013244628906, 133.8339385986328, 141.0477294921875, 148.26153564453125, 155.47532653808594, 162.68911743164062, 169.9029083251953, 177.11671447753906, 184.33050537109375, 191.5443115234375, 198.7581024169922, 205.97189331054688, 213.18569946289062, 220.39950561523438]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 5.0, 5.0, 7.0, 9.0, 13.0, 21.0, 34.0, 38.0, 58.0, 59.0, 102.0, 147.0, 199.0, 300.0, 459.0, 702.0, 1241.0, 2172.0, 4817.0, 18742.0, 460945.0, 3590127.0, 96152.0, 10056.0, 3450.0, 1677.0, 942.0, 629.0, 358.0, 252.0, 155.0, 116.0, 89.0, 55.0, 50.0, 35.0, 20.0, 12.0, 12.0, 7.0, 4.0, 7.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.28125, -47.599609375, -45.91796875, -44.236328125, -42.5546875, -40.873046875, -39.19140625, -37.509765625, -35.828125, -34.146484375, -32.46484375, -30.783203125, -29.1015625, -27.419921875, -25.73828125, -24.056640625, -22.375, -20.693359375, -19.01171875, -17.330078125, -15.6484375, -13.966796875, -12.28515625, -10.603515625, -8.921875, -7.240234375, -5.55859375, -3.876953125, -2.1953125, -0.513671875, 1.16796875, 2.849609375, 4.53125, 6.212890625, 7.89453125, 9.576171875, 11.2578125, 12.939453125, 14.62109375, 16.302734375, 17.984375, 19.666015625, 21.34765625, 23.029296875, 24.7109375, 26.392578125, 28.07421875, 29.755859375, 31.4375, 33.119140625, 34.80078125, 36.482421875, 38.1640625, 39.845703125, 41.52734375, 43.208984375, 44.890625, 46.572265625, 48.25390625, 49.935546875, 51.6171875, 53.298828125, 54.98046875, 56.662109375, 58.34375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 9.0, 8.0, 5.0, 6.0, 17.0, 18.0, 16.0, 24.0, 21.0, 40.0, 31.0, 40.0, 38.0, 39.0, 47.0, 44.0, 49.0, 42.0, 50.0, 43.0, 50.0, 48.0, 25.0, 47.0, 42.0, 26.0, 29.0, 25.0, 15.0, 23.0, 19.0, 12.0, 12.0, 6.0, 9.0, 3.0, 2.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-18.0625, -17.556396484375, -17.05029296875, -16.544189453125, -16.0380859375, -15.531982421875, -15.02587890625, -14.519775390625, -14.013671875, -13.507568359375, -13.00146484375, -12.495361328125, -11.9892578125, -11.483154296875, -10.97705078125, -10.470947265625, -9.96484375, -9.458740234375, -8.95263671875, -8.446533203125, -7.9404296875, -7.434326171875, -6.92822265625, -6.422119140625, -5.916015625, -5.409912109375, -4.90380859375, -4.397705078125, -3.8916015625, -3.385498046875, -2.87939453125, -2.373291015625, -1.8671875, -1.361083984375, -0.85498046875, -0.348876953125, 0.1572265625, 0.663330078125, 1.16943359375, 1.675537109375, 2.181640625, 2.687744140625, 3.19384765625, 3.699951171875, 4.2060546875, 4.712158203125, 5.21826171875, 5.724365234375, 6.23046875, 6.736572265625, 7.24267578125, 7.748779296875, 8.2548828125, 8.760986328125, 9.26708984375, 9.773193359375, 10.279296875, 10.785400390625, 11.29150390625, 11.797607421875, 12.3037109375, 12.809814453125, 13.31591796875, 13.822021484375, 14.328125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 7.0, 1.0, 3.0, 10.0, 10.0, 6.0, 20.0, 25.0, 38.0, 49.0, 100.0, 151.0, 361.0, 885.0, 2497.0, 8814.0, 53062.0, 3801220.0, 301656.0, 18450.0, 4380.0, 1422.0, 520.0, 252.0, 133.0, 69.0, 36.0, 30.0, 19.0, 14.0, 13.0, 10.0, 7.0, 3.0, 3.0, 2.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-75.3125, -73.14453125, -70.9765625, -68.80859375, -66.640625, -64.47265625, -62.3046875, -60.13671875, -57.96875, -55.80078125, -53.6328125, -51.46484375, -49.296875, -47.12890625, -44.9609375, -42.79296875, -40.625, -38.45703125, -36.2890625, -34.12109375, -31.953125, -29.78515625, -27.6171875, -25.44921875, -23.28125, -21.11328125, -18.9453125, -16.77734375, -14.609375, -12.44140625, -10.2734375, -8.10546875, -5.9375, -3.76953125, -1.6015625, 0.56640625, 2.734375, 4.90234375, 7.0703125, 9.23828125, 11.40625, 13.57421875, 15.7421875, 17.91015625, 20.078125, 22.24609375, 24.4140625, 26.58203125, 28.75, 30.91796875, 33.0859375, 35.25390625, 37.421875, 39.58984375, 41.7578125, 43.92578125, 46.09375, 48.26171875, 50.4296875, 52.59765625, 54.765625, 56.93359375, 59.1015625, 61.26953125, 63.4375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 4.0, 4.0, 5.0, 7.0, 6.0, 7.0, 10.0, 18.0, 23.0, 51.0, 70.0, 166.0, 475.0, 1245.0, 1153.0, 459.0, 167.0, 84.0, 36.0, 26.0, 19.0, 12.0, 9.0, 8.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.0, -42.1669921875, -40.333984375, -38.5009765625, -36.66796875, -34.8349609375, -33.001953125, -31.1689453125, -29.3359375, -27.5029296875, -25.669921875, -23.8369140625, -22.00390625, -20.1708984375, -18.337890625, -16.5048828125, -14.671875, -12.8388671875, -11.005859375, -9.1728515625, -7.33984375, -5.5068359375, -3.673828125, -1.8408203125, -0.0078125, 1.8251953125, 3.658203125, 5.4912109375, 7.32421875, 9.1572265625, 10.990234375, 12.8232421875, 14.65625, 16.4892578125, 18.322265625, 20.1552734375, 21.98828125, 23.8212890625, 25.654296875, 27.4873046875, 29.3203125, 31.1533203125, 32.986328125, 34.8193359375, 36.65234375, 38.4853515625, 40.318359375, 42.1513671875, 43.984375, 45.8173828125, 47.650390625, 49.4833984375, 51.31640625, 53.1494140625, 54.982421875, 56.8154296875, 58.6484375, 60.4814453125, 62.314453125, 64.1474609375, 65.98046875, 67.8134765625, 69.646484375, 71.4794921875, 73.3125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 8.0, 11.0, 16.0, 17.0, 35.0, 57.0, 71.0, 130.0, 170.0, 146.0, 126.0, 91.0, 56.0, 19.0, 9.0, 12.0, 6.0, 11.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-277.5888977050781, -268.89727783203125, -260.20562744140625, -251.5139923095703, -242.82235717773438, -234.1307373046875, -225.43910217285156, -216.74746704101562, -208.0558319091797, -199.36419677734375, -190.6725616455078, -181.98092651367188, -173.289306640625, -164.59765625, -155.90603637695312, -147.2144012451172, -138.52276611328125, -129.8311309814453, -121.13949584960938, -112.44786834716797, -103.75623321533203, -95.0645980834961, -86.37297058105469, -77.68133544921875, -68.98970031738281, -60.298065185546875, -51.6064338684082, -42.91480255126953, -34.223167419433594, -25.531532287597656, -16.839900970458984, -8.148269653320312, 0.54339599609375, 9.235029220581055, 17.92666244506836, 26.618295669555664, 35.30992889404297, 44.001564025878906, 52.69319534301758, 61.38482666015625, 70.07646179199219, 78.76809692382812, 87.45973205566406, 96.15135955810547, 104.8429946899414, 113.53462982177734, 122.22625732421875, 130.9178924560547, 139.60952758789062, 148.30116271972656, 156.9927978515625, 165.68443298339844, 174.37606811523438, 183.06768798828125, 191.7593231201172, 200.45095825195312, 209.14259338378906, 217.834228515625, 226.52586364746094, 235.21749877929688, 243.90911865234375, 252.60076904296875, 261.2923889160156, 269.9840087890625, 278.6756591796875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 5.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 5.0, 12.0, 17.0, 15.0, 14.0, 26.0, 27.0, 22.0, 30.0, 39.0, 37.0, 45.0, 43.0, 55.0, 49.0, 48.0, 57.0, 49.0, 50.0, 45.0, 42.0, 36.0, 34.0, 25.0, 30.0, 24.0, 22.0, 13.0, 18.0, 15.0, 9.0, 9.0, 9.0, 6.0, 6.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.28927612304688, -120.28993225097656, -115.29058074951172, -110.29122924804688, -105.29188537597656, -100.29254150390625, -95.2931900024414, -90.29383850097656, -85.29449462890625, -80.29515075683594, -75.2957992553711, -70.29644775390625, -65.29710388183594, -60.29775619506836, -55.29840850830078, -50.2990608215332, -45.299713134765625, -40.30036544799805, -35.30101776123047, -30.30167007446289, -25.302322387695312, -20.302974700927734, -15.303627014160156, -10.304279327392578, -5.304931640625, -0.3055839538574219, 4.693763732910156, 9.693111419677734, 14.692459106445312, 19.69180679321289, 24.69115447998047, 29.690502166748047, 34.689849853515625, 39.6891975402832, 44.68854522705078, 49.68789291381836, 54.68724060058594, 59.686588287353516, 64.6859359741211, 69.68528747558594, 74.68463134765625, 79.68397521972656, 84.6833267211914, 89.68267822265625, 94.68202209472656, 99.68136596679688, 104.68071746826172, 109.68006896972656, 114.67941284179688, 119.67875671386719, 124.67810821533203, 129.67745971679688, 134.6768035888672, 139.6761474609375, 144.67550659179688, 149.6748504638672, 154.6741943359375, 159.6735382080078, 164.67288208007812, 169.6722412109375, 174.6715850830078, 179.67092895507812, 184.6702880859375, 189.6696319580078, 194.66897583007812]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 6.0, 7.0, 10.0, 13.0, 17.0, 34.0, 47.0, 93.0, 155.0, 262.0, 382.0, 679.0, 1226.0, 2145.0, 3984.0, 8080.0, 17688.0, 40932.0, 106968.0, 315821.0, 347416.0, 119748.0, 45137.0, 19169.0, 8736.0, 4387.0, 2235.0, 1342.0, 749.0, 439.0, 255.0, 147.0, 104.0, 54.0, 44.0, 11.0, 16.0, 6.0, 10.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.734375, -23.911376953125, -23.08837890625, -22.265380859375, -21.4423828125, -20.619384765625, -19.79638671875, -18.973388671875, -18.150390625, -17.327392578125, -16.50439453125, -15.681396484375, -14.8583984375, -14.035400390625, -13.21240234375, -12.389404296875, -11.56640625, -10.743408203125, -9.92041015625, -9.097412109375, -8.2744140625, -7.451416015625, -6.62841796875, -5.805419921875, -4.982421875, -4.159423828125, -3.33642578125, -2.513427734375, -1.6904296875, -0.867431640625, -0.04443359375, 0.778564453125, 1.6015625, 2.424560546875, 3.24755859375, 4.070556640625, 4.8935546875, 5.716552734375, 6.53955078125, 7.362548828125, 8.185546875, 9.008544921875, 9.83154296875, 10.654541015625, 11.4775390625, 12.300537109375, 13.12353515625, 13.946533203125, 14.76953125, 15.592529296875, 16.41552734375, 17.238525390625, 18.0615234375, 18.884521484375, 19.70751953125, 20.530517578125, 21.353515625, 22.176513671875, 22.99951171875, 23.822509765625, 24.6455078125, 25.468505859375, 26.29150390625, 27.114501953125, 27.9375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 3.0, 7.0, 6.0, 5.0, 9.0, 10.0, 10.0, 15.0, 10.0, 12.0, 14.0, 33.0, 35.0, 31.0, 34.0, 49.0, 47.0, 45.0, 46.0, 55.0, 50.0, 53.0, 41.0, 52.0, 30.0, 28.0, 41.0, 29.0, 31.0, 31.0, 30.0, 21.0, 13.0, 9.0, 14.0, 6.0, 6.0, 11.0, 8.0, 7.0, 5.0, 4.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.890625, -17.359619140625, -16.82861328125, -16.297607421875, -15.7666015625, -15.235595703125, -14.70458984375, -14.173583984375, -13.642578125, -13.111572265625, -12.58056640625, -12.049560546875, -11.5185546875, -10.987548828125, -10.45654296875, -9.925537109375, -9.39453125, -8.863525390625, -8.33251953125, -7.801513671875, -7.2705078125, -6.739501953125, -6.20849609375, -5.677490234375, -5.146484375, -4.615478515625, -4.08447265625, -3.553466796875, -3.0224609375, -2.491455078125, -1.96044921875, -1.429443359375, -0.8984375, -0.367431640625, 0.16357421875, 0.694580078125, 1.2255859375, 1.756591796875, 2.28759765625, 2.818603515625, 3.349609375, 3.880615234375, 4.41162109375, 4.942626953125, 5.4736328125, 6.004638671875, 6.53564453125, 7.066650390625, 7.59765625, 8.128662109375, 8.65966796875, 9.190673828125, 9.7216796875, 10.252685546875, 10.78369140625, 11.314697265625, 11.845703125, 12.376708984375, 12.90771484375, 13.438720703125, 13.9697265625, 14.500732421875, 15.03173828125, 15.562744140625, 16.09375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 4.0, 4.0, 10.0, 8.0, 13.0, 15.0, 19.0, 34.0, 43.0, 69.0, 70.0, 110.0, 153.0, 276.0, 374.0, 621.0, 1147.0, 2483.0, 7217.0, 34347.0, 649679.0, 311639.0, 28629.0, 6385.0, 2345.0, 1096.0, 634.0, 376.0, 223.0, 147.0, 117.0, 78.0, 51.0, 32.0, 26.0, 17.0, 14.0, 22.0, 8.0, 8.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0], "bins": [-58.875, -57.2373046875, -55.599609375, -53.9619140625, -52.32421875, -50.6865234375, -49.048828125, -47.4111328125, -45.7734375, -44.1357421875, -42.498046875, -40.8603515625, -39.22265625, -37.5849609375, -35.947265625, -34.3095703125, -32.671875, -31.0341796875, -29.396484375, -27.7587890625, -26.12109375, -24.4833984375, -22.845703125, -21.2080078125, -19.5703125, -17.9326171875, -16.294921875, -14.6572265625, -13.01953125, -11.3818359375, -9.744140625, -8.1064453125, -6.46875, -4.8310546875, -3.193359375, -1.5556640625, 0.08203125, 1.7197265625, 3.357421875, 4.9951171875, 6.6328125, 8.2705078125, 9.908203125, 11.5458984375, 13.18359375, 14.8212890625, 16.458984375, 18.0966796875, 19.734375, 21.3720703125, 23.009765625, 24.6474609375, 26.28515625, 27.9228515625, 29.560546875, 31.1982421875, 32.8359375, 34.4736328125, 36.111328125, 37.7490234375, 39.38671875, 41.0244140625, 42.662109375, 44.2998046875, 45.9375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 7.0, 9.0, 7.0, 10.0, 11.0, 17.0, 17.0, 21.0, 30.0, 26.0, 44.0, 49.0, 38.0, 57.0, 44.0, 55.0, 47.0, 62.0, 56.0, 54.0, 57.0, 43.0, 41.0, 29.0, 28.0, 23.0, 19.0, 14.0, 18.0, 15.0, 12.0, 8.0, 11.0, 3.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-59.9375, -57.923828125, -55.91015625, -53.896484375, -51.8828125, -49.869140625, -47.85546875, -45.841796875, -43.828125, -41.814453125, -39.80078125, -37.787109375, -35.7734375, -33.759765625, -31.74609375, -29.732421875, -27.71875, -25.705078125, -23.69140625, -21.677734375, -19.6640625, -17.650390625, -15.63671875, -13.623046875, -11.609375, -9.595703125, -7.58203125, -5.568359375, -3.5546875, -1.541015625, 0.47265625, 2.486328125, 4.5, 6.513671875, 8.52734375, 10.541015625, 12.5546875, 14.568359375, 16.58203125, 18.595703125, 20.609375, 22.623046875, 24.63671875, 26.650390625, 28.6640625, 30.677734375, 32.69140625, 34.705078125, 36.71875, 38.732421875, 40.74609375, 42.759765625, 44.7734375, 46.787109375, 48.80078125, 50.814453125, 52.828125, 54.841796875, 56.85546875, 58.869140625, 60.8828125, 62.896484375, 64.91015625, 66.923828125, 68.9375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 1.0, 4.0, 12.0, 8.0, 12.0, 21.0, 25.0, 25.0, 35.0, 56.0, 65.0, 104.0, 175.0, 322.0, 668.0, 1514.0, 3893.0, 14356.0, 91441.0, 819410.0, 94407.0, 15101.0, 3942.0, 1460.0, 584.0, 327.0, 183.0, 110.0, 73.0, 48.0, 46.0, 24.0, 28.0, 18.0, 13.0, 13.0, 7.0, 5.0, 4.0, 2.0, 3.0, 9.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.75, -10.4088134765625, -10.067626953125, -9.7264404296875, -9.38525390625, -9.0440673828125, -8.702880859375, -8.3616943359375, -8.0205078125, -7.6793212890625, -7.338134765625, -6.9969482421875, -6.65576171875, -6.3145751953125, -5.973388671875, -5.6322021484375, -5.291015625, -4.9498291015625, -4.608642578125, -4.2674560546875, -3.92626953125, -3.5850830078125, -3.243896484375, -2.9027099609375, -2.5615234375, -2.2203369140625, -1.879150390625, -1.5379638671875, -1.19677734375, -0.8555908203125, -0.514404296875, -0.1732177734375, 0.16796875, 0.5091552734375, 0.850341796875, 1.1915283203125, 1.53271484375, 1.8739013671875, 2.215087890625, 2.5562744140625, 2.8974609375, 3.2386474609375, 3.579833984375, 3.9210205078125, 4.26220703125, 4.6033935546875, 4.944580078125, 5.2857666015625, 5.626953125, 5.9681396484375, 6.309326171875, 6.6505126953125, 6.99169921875, 7.3328857421875, 7.674072265625, 8.0152587890625, 8.3564453125, 8.6976318359375, 9.038818359375, 9.3800048828125, 9.72119140625, 10.0623779296875, 10.403564453125, 10.7447509765625, 11.0859375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 3.0, 7.0, 5.0, 6.0, 6.0, 8.0, 17.0, 12.0, 21.0, 29.0, 34.0, 53.0, 66.0, 100.0, 133.0, 146.0, 84.0, 57.0, 44.0, 31.0, 32.0, 29.0, 16.0, 6.0, 10.0, 7.0, 3.0, 6.0, 7.0, 7.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.003231048583984375, -0.0031434595584869385, -0.003055870532989502, -0.0029682815074920654, -0.002880692481994629, -0.0027931034564971924, -0.002705514430999756, -0.0026179254055023193, -0.002530336380004883, -0.0024427473545074463, -0.0023551583290100098, -0.0022675693035125732, -0.0021799802780151367, -0.0020923912525177, -0.0020048022270202637, -0.0019172132015228271, -0.0018296241760253906, -0.001742035150527954, -0.0016544461250305176, -0.001566857099533081, -0.0014792680740356445, -0.001391679048538208, -0.0013040900230407715, -0.001216500997543335, -0.0011289119720458984, -0.001041322946548462, -0.0009537339210510254, -0.0008661448955535889, -0.0007785558700561523, -0.0006909668445587158, -0.0006033778190612793, -0.0005157887935638428, -0.00042819976806640625, -0.0003406107425689697, -0.0002530217170715332, -0.00016543269157409668, -7.784366607666016e-05, 9.745359420776367e-06, 9.733438491821289e-05, 0.00018492341041564941, 0.00027251243591308594, 0.00036010146141052246, 0.000447690486907959, 0.0005352795124053955, 0.000622868537902832, 0.0007104575634002686, 0.0007980465888977051, 0.0008856356143951416, 0.0009732246398925781, 0.0010608136653900146, 0.0011484026908874512, 0.0012359917163848877, 0.0013235807418823242, 0.0014111697673797607, 0.0014987587928771973, 0.0015863478183746338, 0.0016739368438720703, 0.0017615258693695068, 0.0018491148948669434, 0.0019367039203643799, 0.0020242929458618164, 0.002111881971359253, 0.0021994709968566895, 0.002287060022354126, 0.0023746490478515625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 10.0, 7.0, 12.0, 15.0, 20.0, 30.0, 35.0, 50.0, 88.0, 116.0, 192.0, 321.0, 624.0, 1101.0, 2301.0, 5173.0, 14162.0, 48595.0, 248756.0, 625894.0, 69898.0, 18725.0, 6683.0, 2792.0, 1285.0, 680.0, 348.0, 194.0, 134.0, 85.0, 49.0, 51.0, 32.0, 27.0, 13.0, 13.0, 13.0, 6.0, 4.0, 3.0, 1.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1328125, -8.86517333984375, -8.5975341796875, -8.32989501953125, -8.062255859375, -7.79461669921875, -7.5269775390625, -7.25933837890625, -6.99169921875, -6.72406005859375, -6.4564208984375, -6.18878173828125, -5.921142578125, -5.65350341796875, -5.3858642578125, -5.11822509765625, -4.8505859375, -4.58294677734375, -4.3153076171875, -4.04766845703125, -3.780029296875, -3.51239013671875, -3.2447509765625, -2.97711181640625, -2.70947265625, -2.44183349609375, -2.1741943359375, -1.90655517578125, -1.638916015625, -1.37127685546875, -1.1036376953125, -0.83599853515625, -0.568359375, -0.30072021484375, -0.0330810546875, 0.23455810546875, 0.502197265625, 0.76983642578125, 1.0374755859375, 1.30511474609375, 1.57275390625, 1.84039306640625, 2.1080322265625, 2.37567138671875, 2.643310546875, 2.91094970703125, 3.1785888671875, 3.44622802734375, 3.7138671875, 3.98150634765625, 4.2491455078125, 4.51678466796875, 4.784423828125, 5.05206298828125, 5.3197021484375, 5.58734130859375, 5.85498046875, 6.12261962890625, 6.3902587890625, 6.65789794921875, 6.925537109375, 7.19317626953125, 7.4608154296875, 7.72845458984375, 7.99609375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 6.0, 4.0, 7.0, 5.0, 8.0, 20.0, 17.0, 30.0, 27.0, 23.0, 48.0, 67.0, 79.0, 70.0, 61.0, 64.0, 72.0, 64.0, 82.0, 52.0, 37.0, 34.0, 37.0, 15.0, 12.0, 13.0, 11.0, 6.0, 3.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.421875, -8.16943359375, -7.9169921875, -7.66455078125, -7.412109375, -7.15966796875, -6.9072265625, -6.65478515625, -6.40234375, -6.14990234375, -5.8974609375, -5.64501953125, -5.392578125, -5.14013671875, -4.8876953125, -4.63525390625, -4.3828125, -4.13037109375, -3.8779296875, -3.62548828125, -3.373046875, -3.12060546875, -2.8681640625, -2.61572265625, -2.36328125, -2.11083984375, -1.8583984375, -1.60595703125, -1.353515625, -1.10107421875, -0.8486328125, -0.59619140625, -0.34375, -0.09130859375, 0.1611328125, 0.41357421875, 0.666015625, 0.91845703125, 1.1708984375, 1.42333984375, 1.67578125, 1.92822265625, 2.1806640625, 2.43310546875, 2.685546875, 2.93798828125, 3.1904296875, 3.44287109375, 3.6953125, 3.94775390625, 4.2001953125, 4.45263671875, 4.705078125, 4.95751953125, 5.2099609375, 5.46240234375, 5.71484375, 5.96728515625, 6.2197265625, 6.47216796875, 6.724609375, 6.97705078125, 7.2294921875, 7.48193359375, 7.734375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 9.0, 9.0, 25.0, 54.0, 162.0, 455.0, 171.0, 73.0, 21.0, 11.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-602.2530517578125, -587.0902709960938, -571.927490234375, -556.7647094726562, -541.6019287109375, -526.4391479492188, -511.2763671875, -496.1135559082031, -480.9507751464844, -465.7879943847656, -450.6252136230469, -435.4624328613281, -420.2996520996094, -405.1368408203125, -389.97406005859375, -374.811279296875, -359.64849853515625, -344.4857177734375, -329.32293701171875, -314.16015625, -298.99737548828125, -283.8345947265625, -268.67181396484375, -253.50900268554688, -238.34625244140625, -223.1834716796875, -208.02069091796875, -192.85791015625, -177.6951141357422, -162.53233337402344, -147.3695526123047, -132.20675659179688, -117.04397583007812, -101.88119506835938, -86.7184066772461, -71.55562591552734, -56.39284133911133, -41.23005676269531, -26.067276000976562, -10.904487609863281, 4.258293151855469, 19.421077728271484, 34.5838623046875, 49.74664306640625, 64.909423828125, 80.07221221923828, 95.23499298095703, 110.39778137207031, 125.56056213378906, 140.7233428955078, 155.88612365722656, 171.04891967773438, 186.21170043945312, 201.37448120117188, 216.53726196289062, 231.70004272460938, 246.86282348632812, 262.0256042480469, 277.1883850097656, 292.3511657714844, 307.5139465332031, 322.6767578125, 337.83953857421875, 353.0023193359375, 368.16510009765625]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 3.0, 6.0, 5.0, 12.0, 15.0, 11.0, 11.0, 13.0, 16.0, 14.0, 22.0, 18.0, 21.0, 26.0, 14.0, 31.0, 42.0, 63.0, 111.0, 108.0, 77.0, 51.0, 32.0, 27.0, 32.0, 23.0, 27.0, 24.0, 22.0, 13.0, 15.0, 17.0, 6.0, 19.0, 14.0, 4.0, 7.0, 3.0, 6.0, 5.0, 5.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-211.69078063964844, -205.30520629882812, -198.91964721679688, -192.53407287597656, -186.1485137939453, -179.762939453125, -173.37738037109375, -166.99180603027344, -160.60623168945312, -154.2206573486328, -147.83509826660156, -141.44952392578125, -135.06396484375, -128.6783905029297, -122.2928237915039, -115.90725708007812, -109.52169799804688, -103.1361312866211, -96.75056457519531, -90.364990234375, -83.97943115234375, -77.59385681152344, -71.20829010009766, -64.82272338867188, -58.437156677246094, -52.05158996582031, -45.66602325439453, -39.280452728271484, -32.8948860168457, -26.509319305419922, -20.123748779296875, -13.738182067871094, -7.35260009765625, -0.9670324325561523, 5.418535232543945, 11.80410385131836, 18.18967056274414, 24.575237274169922, 30.96080780029297, 37.34637451171875, 43.73194122314453, 50.11750793457031, 56.503074645996094, 62.88864517211914, 69.27421569824219, 75.65977478027344, 82.04534912109375, 88.43091583251953, 94.81648254394531, 101.2020492553711, 107.58761596679688, 113.97319030761719, 120.35874938964844, 126.74432373046875, 133.1298828125, 139.5154571533203, 145.90103149414062, 152.28660583496094, 158.6721649169922, 165.0577392578125, 171.44329833984375, 177.82887268066406, 184.21444702148438, 190.60000610351562, 196.98556518554688]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 5.0, 2.0, 13.0, 5.0, 12.0, 16.0, 29.0, 35.0, 52.0, 83.0, 112.0, 191.0, 257.0, 345.0, 608.0, 924.0, 1509.0, 2595.0, 4744.0, 10237.0, 29314.0, 193420.0, 2216173.0, 1551184.0, 137940.0, 25300.0, 8983.0, 4302.0, 2244.0, 1313.0, 805.0, 491.0, 339.0, 230.0, 144.0, 99.0, 65.0, 55.0, 38.0, 18.0, 16.0, 10.0, 9.0, 9.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.4375, -39.208984375, -37.98046875, -36.751953125, -35.5234375, -34.294921875, -33.06640625, -31.837890625, -30.609375, -29.380859375, -28.15234375, -26.923828125, -25.6953125, -24.466796875, -23.23828125, -22.009765625, -20.78125, -19.552734375, -18.32421875, -17.095703125, -15.8671875, -14.638671875, -13.41015625, -12.181640625, -10.953125, -9.724609375, -8.49609375, -7.267578125, -6.0390625, -4.810546875, -3.58203125, -2.353515625, -1.125, 0.103515625, 1.33203125, 2.560546875, 3.7890625, 5.017578125, 6.24609375, 7.474609375, 8.703125, 9.931640625, 11.16015625, 12.388671875, 13.6171875, 14.845703125, 16.07421875, 17.302734375, 18.53125, 19.759765625, 20.98828125, 22.216796875, 23.4453125, 24.673828125, 25.90234375, 27.130859375, 28.359375, 29.587890625, 30.81640625, 32.044921875, 33.2734375, 34.501953125, 35.73046875, 36.958984375, 38.1875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 6.0, 4.0, 7.0, 4.0, 10.0, 9.0, 7.0, 25.0, 29.0, 24.0, 36.0, 25.0, 41.0, 47.0, 38.0, 50.0, 56.0, 54.0, 51.0, 54.0, 56.0, 40.0, 47.0, 38.0, 35.0, 36.0, 23.0, 28.0, 33.0, 22.0, 15.0, 10.0, 12.0, 4.0, 6.0, 6.0, 2.0, 3.0, 6.0, 2.0, 2.0], "bins": [-22.078125, -21.54345703125, -21.0087890625, -20.47412109375, -19.939453125, -19.40478515625, -18.8701171875, -18.33544921875, -17.80078125, -17.26611328125, -16.7314453125, -16.19677734375, -15.662109375, -15.12744140625, -14.5927734375, -14.05810546875, -13.5234375, -12.98876953125, -12.4541015625, -11.91943359375, -11.384765625, -10.85009765625, -10.3154296875, -9.78076171875, -9.24609375, -8.71142578125, -8.1767578125, -7.64208984375, -7.107421875, -6.57275390625, -6.0380859375, -5.50341796875, -4.96875, -4.43408203125, -3.8994140625, -3.36474609375, -2.830078125, -2.29541015625, -1.7607421875, -1.22607421875, -0.69140625, -0.15673828125, 0.3779296875, 0.91259765625, 1.447265625, 1.98193359375, 2.5166015625, 3.05126953125, 3.5859375, 4.12060546875, 4.6552734375, 5.18994140625, 5.724609375, 6.25927734375, 6.7939453125, 7.32861328125, 7.86328125, 8.39794921875, 8.9326171875, 9.46728515625, 10.001953125, 10.53662109375, 11.0712890625, 11.60595703125, 12.140625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 7.0, 20.0, 25.0, 60.0, 138.0, 297.0, 886.0, 3908.0, 90328.0, 4080923.0, 14889.0, 1858.0, 522.0, 206.0, 93.0, 51.0, 29.0, 14.0, 5.0, 7.0, 3.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-202.75, -196.8359375, -190.921875, -185.0078125, -179.09375, -173.1796875, -167.265625, -161.3515625, -155.4375, -149.5234375, -143.609375, -137.6953125, -131.78125, -125.8671875, -119.953125, -114.0390625, -108.125, -102.2109375, -96.296875, -90.3828125, -84.46875, -78.5546875, -72.640625, -66.7265625, -60.8125, -54.8984375, -48.984375, -43.0703125, -37.15625, -31.2421875, -25.328125, -19.4140625, -13.5, -7.5859375, -1.671875, 4.2421875, 10.15625, 16.0703125, 21.984375, 27.8984375, 33.8125, 39.7265625, 45.640625, 51.5546875, 57.46875, 63.3828125, 69.296875, 75.2109375, 81.125, 87.0390625, 92.953125, 98.8671875, 104.78125, 110.6953125, 116.609375, 122.5234375, 128.4375, 134.3515625, 140.265625, 146.1796875, 152.09375, 158.0078125, 163.921875, 169.8359375, 175.75]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 9.0, 7.0, 21.0, 26.0, 30.0, 54.0, 111.0, 214.0, 465.0, 1135.0, 1116.0, 427.0, 213.0, 117.0, 47.0, 27.0, 20.0, 15.0, 10.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.78125, -53.78466796875, -50.7880859375, -47.79150390625, -44.794921875, -41.79833984375, -38.8017578125, -35.80517578125, -32.80859375, -29.81201171875, -26.8154296875, -23.81884765625, -20.822265625, -17.82568359375, -14.8291015625, -11.83251953125, -8.8359375, -5.83935546875, -2.8427734375, 0.15380859375, 3.150390625, 6.14697265625, 9.1435546875, 12.14013671875, 15.13671875, 18.13330078125, 21.1298828125, 24.12646484375, 27.123046875, 30.11962890625, 33.1162109375, 36.11279296875, 39.109375, 42.10595703125, 45.1025390625, 48.09912109375, 51.095703125, 54.09228515625, 57.0888671875, 60.08544921875, 63.08203125, 66.07861328125, 69.0751953125, 72.07177734375, 75.068359375, 78.06494140625, 81.0615234375, 84.05810546875, 87.0546875, 90.05126953125, 93.0478515625, 96.04443359375, 99.041015625, 102.03759765625, 105.0341796875, 108.03076171875, 111.02734375, 114.02392578125, 117.0205078125, 120.01708984375, 123.013671875, 126.01025390625, 129.0068359375, 132.00341796875, 135.0]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 7.0, 14.0, 11.0, 30.0, 52.0, 92.0, 212.0, 254.0, 142.0, 79.0, 39.0, 26.0, 9.0, 7.0, 7.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-951.506591796875, -925.99169921875, -900.476806640625, -874.9619140625, -849.447021484375, -823.93212890625, -798.417236328125, -772.9022827148438, -747.3873901367188, -721.8724975585938, -696.3576049804688, -670.8427124023438, -645.3278198242188, -619.8128662109375, -594.2979736328125, -568.7830810546875, -543.2681884765625, -517.7532958984375, -492.2384033203125, -466.7235107421875, -441.2085876464844, -415.6936950683594, -390.1788024902344, -364.66387939453125, -339.1490478515625, -313.6341552734375, -288.1192626953125, -262.6043701171875, -237.08944702148438, -211.57455444335938, -186.05966186523438, -160.5447540283203, -135.02984619140625, -109.51494598388672, -84.00004577636719, -58.48515319824219, -32.970252990722656, -7.455352783203125, 18.059539794921875, 43.57444763183594, 69.08934020996094, 94.60424041748047, 120.119140625, 145.634033203125, 171.14892578125, 196.66383361816406, 222.17872619628906, 247.69363403320312, 273.2085266113281, 298.7234191894531, 324.2383117675781, 349.75323486328125, 375.26812744140625, 400.78302001953125, 426.29791259765625, 451.81280517578125, 477.32769775390625, 502.84259033203125, 528.3574829101562, 553.8723754882812, 579.3872680664062, 604.9022216796875, 630.4171142578125, 655.9320068359375, 681.4468994140625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 4.0, 8.0, 11.0, 11.0, 16.0, 14.0, 28.0, 32.0, 35.0, 45.0, 45.0, 49.0, 44.0, 75.0, 68.0, 93.0, 68.0, 41.0, 57.0, 44.0, 29.0, 46.0, 34.0, 21.0, 23.0, 22.0, 9.0, 5.0, 10.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-360.6197204589844, -347.94769287109375, -335.275634765625, -322.6036071777344, -309.93157958984375, -297.259521484375, -284.5874938964844, -271.91546630859375, -259.243408203125, -246.5713653564453, -233.8993377685547, -221.227294921875, -208.55526733398438, -195.8832244873047, -183.211181640625, -170.53915405273438, -157.86712646484375, -145.19508361816406, -132.52305603027344, -119.85101318359375, -107.1789779663086, -94.50694274902344, -81.83489990234375, -69.1628646850586, -56.49082946777344, -43.81879425048828, -31.14675521850586, -18.474716186523438, -5.802680969238281, 6.869354248046875, 19.541397094726562, 32.21343231201172, 44.88543701171875, 57.557472229003906, 70.22950744628906, 82.90155029296875, 95.5735855102539, 108.24562072753906, 120.91766357421875, 133.58969116210938, 146.26173400878906, 158.93377685546875, 171.60580444335938, 184.27784729003906, 196.94989013671875, 209.62191772460938, 222.29396057128906, 234.96600341796875, 247.63803100585938, 260.31005859375, 272.98211669921875, 285.6541442871094, 298.326171875, 310.99822998046875, 323.6702575683594, 336.34228515625, 349.01434326171875, 361.6863708496094, 374.3584289550781, 387.03045654296875, 399.7024841308594, 412.37451171875, 425.04656982421875, 437.7185974121094, 450.390625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 7.0, 4.0, 7.0, 10.0, 13.0, 15.0, 24.0, 39.0, 38.0, 63.0, 81.0, 131.0, 167.0, 232.0, 318.0, 540.0, 787.0, 1406.0, 2322.0, 4733.0, 9212.0, 21403.0, 60688.0, 255311.0, 530039.0, 102093.0, 32114.0, 12787.0, 6045.0, 3149.0, 1688.0, 1049.0, 628.0, 441.0, 284.0, 193.0, 120.0, 94.0, 85.0, 53.0, 43.0, 23.0, 25.0, 8.0, 9.0, 9.0, 7.0, 3.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 3.0], "bins": [-26.625, -25.8232421875, -25.021484375, -24.2197265625, -23.41796875, -22.6162109375, -21.814453125, -21.0126953125, -20.2109375, -19.4091796875, -18.607421875, -17.8056640625, -17.00390625, -16.2021484375, -15.400390625, -14.5986328125, -13.796875, -12.9951171875, -12.193359375, -11.3916015625, -10.58984375, -9.7880859375, -8.986328125, -8.1845703125, -7.3828125, -6.5810546875, -5.779296875, -4.9775390625, -4.17578125, -3.3740234375, -2.572265625, -1.7705078125, -0.96875, -0.1669921875, 0.634765625, 1.4365234375, 2.23828125, 3.0400390625, 3.841796875, 4.6435546875, 5.4453125, 6.2470703125, 7.048828125, 7.8505859375, 8.65234375, 9.4541015625, 10.255859375, 11.0576171875, 11.859375, 12.6611328125, 13.462890625, 14.2646484375, 15.06640625, 15.8681640625, 16.669921875, 17.4716796875, 18.2734375, 19.0751953125, 19.876953125, 20.6787109375, 21.48046875, 22.2822265625, 23.083984375, 23.8857421875, 24.6875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 5.0, 8.0, 10.0, 10.0, 6.0, 12.0, 18.0, 12.0, 23.0, 31.0, 25.0, 44.0, 30.0, 39.0, 46.0, 48.0, 51.0, 60.0, 52.0, 47.0, 43.0, 41.0, 34.0, 50.0, 42.0, 30.0, 23.0, 30.0, 24.0, 18.0, 19.0, 11.0, 5.0, 11.0, 10.0, 7.0, 9.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-23.3125, -22.70166015625, -22.0908203125, -21.47998046875, -20.869140625, -20.25830078125, -19.6474609375, -19.03662109375, -18.42578125, -17.81494140625, -17.2041015625, -16.59326171875, -15.982421875, -15.37158203125, -14.7607421875, -14.14990234375, -13.5390625, -12.92822265625, -12.3173828125, -11.70654296875, -11.095703125, -10.48486328125, -9.8740234375, -9.26318359375, -8.65234375, -8.04150390625, -7.4306640625, -6.81982421875, -6.208984375, -5.59814453125, -4.9873046875, -4.37646484375, -3.765625, -3.15478515625, -2.5439453125, -1.93310546875, -1.322265625, -0.71142578125, -0.1005859375, 0.51025390625, 1.12109375, 1.73193359375, 2.3427734375, 2.95361328125, 3.564453125, 4.17529296875, 4.7861328125, 5.39697265625, 6.0078125, 6.61865234375, 7.2294921875, 7.84033203125, 8.451171875, 9.06201171875, 9.6728515625, 10.28369140625, 10.89453125, 11.50537109375, 12.1162109375, 12.72705078125, 13.337890625, 13.94873046875, 14.5595703125, 15.17041015625, 15.78125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 7.0, 11.0, 14.0, 15.0, 18.0, 36.0, 58.0, 106.0, 116.0, 228.0, 397.0, 720.0, 2231.0, 14311.0, 845836.0, 173129.0, 8196.0, 1701.0, 628.0, 287.0, 194.0, 94.0, 66.0, 54.0, 38.0, 22.0, 14.0, 11.0, 10.0, 2.0, 2.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-83.0625, -80.92578125, -78.7890625, -76.65234375, -74.515625, -72.37890625, -70.2421875, -68.10546875, -65.96875, -63.83203125, -61.6953125, -59.55859375, -57.421875, -55.28515625, -53.1484375, -51.01171875, -48.875, -46.73828125, -44.6015625, -42.46484375, -40.328125, -38.19140625, -36.0546875, -33.91796875, -31.78125, -29.64453125, -27.5078125, -25.37109375, -23.234375, -21.09765625, -18.9609375, -16.82421875, -14.6875, -12.55078125, -10.4140625, -8.27734375, -6.140625, -4.00390625, -1.8671875, 0.26953125, 2.40625, 4.54296875, 6.6796875, 8.81640625, 10.953125, 13.08984375, 15.2265625, 17.36328125, 19.5, 21.63671875, 23.7734375, 25.91015625, 28.046875, 30.18359375, 32.3203125, 34.45703125, 36.59375, 38.73046875, 40.8671875, 43.00390625, 45.140625, 47.27734375, 49.4140625, 51.55078125, 53.6875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 1.0, 5.0, 3.0, 4.0, 3.0, 14.0, 9.0, 10.0, 8.0, 16.0, 17.0, 6.0, 27.0, 27.0, 21.0, 28.0, 27.0, 41.0, 40.0, 51.0, 76.0, 68.0, 69.0, 69.0, 59.0, 47.0, 28.0, 30.0, 38.0, 31.0, 18.0, 22.0, 10.0, 17.0, 7.0, 18.0, 9.0, 4.0, 4.0, 6.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-79.625, -77.0439453125, -74.462890625, -71.8818359375, -69.30078125, -66.7197265625, -64.138671875, -61.5576171875, -58.9765625, -56.3955078125, -53.814453125, -51.2333984375, -48.65234375, -46.0712890625, -43.490234375, -40.9091796875, -38.328125, -35.7470703125, -33.166015625, -30.5849609375, -28.00390625, -25.4228515625, -22.841796875, -20.2607421875, -17.6796875, -15.0986328125, -12.517578125, -9.9365234375, -7.35546875, -4.7744140625, -2.193359375, 0.3876953125, 2.96875, 5.5498046875, 8.130859375, 10.7119140625, 13.29296875, 15.8740234375, 18.455078125, 21.0361328125, 23.6171875, 26.1982421875, 28.779296875, 31.3603515625, 33.94140625, 36.5224609375, 39.103515625, 41.6845703125, 44.265625, 46.8466796875, 49.427734375, 52.0087890625, 54.58984375, 57.1708984375, 59.751953125, 62.3330078125, 64.9140625, 67.4951171875, 70.076171875, 72.6572265625, 75.23828125, 77.8193359375, 80.400390625, 82.9814453125, 85.5625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 4.0, 7.0, 10.0, 6.0, 12.0, 16.0, 22.0, 22.0, 48.0, 43.0, 72.0, 128.0, 204.0, 406.0, 866.0, 2369.0, 9633.0, 100628.0, 906092.0, 21305.0, 4026.0, 1336.0, 538.0, 264.0, 159.0, 82.0, 69.0, 56.0, 37.0, 17.0, 15.0, 14.0, 9.0, 6.0, 5.0, 7.0, 3.0, 3.0, 1.0, 4.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-10.0390625, -9.7274169921875, -9.415771484375, -9.1041259765625, -8.79248046875, -8.4808349609375, -8.169189453125, -7.8575439453125, -7.5458984375, -7.2342529296875, -6.922607421875, -6.6109619140625, -6.29931640625, -5.9876708984375, -5.676025390625, -5.3643798828125, -5.052734375, -4.7410888671875, -4.429443359375, -4.1177978515625, -3.80615234375, -3.4945068359375, -3.182861328125, -2.8712158203125, -2.5595703125, -2.2479248046875, -1.936279296875, -1.6246337890625, -1.31298828125, -1.0013427734375, -0.689697265625, -0.3780517578125, -0.06640625, 0.2452392578125, 0.556884765625, 0.8685302734375, 1.18017578125, 1.4918212890625, 1.803466796875, 2.1151123046875, 2.4267578125, 2.7384033203125, 3.050048828125, 3.3616943359375, 3.67333984375, 3.9849853515625, 4.296630859375, 4.6082763671875, 4.919921875, 5.2315673828125, 5.543212890625, 5.8548583984375, 6.16650390625, 6.4781494140625, 6.789794921875, 7.1014404296875, 7.4130859375, 7.7247314453125, 8.036376953125, 8.3480224609375, 8.65966796875, 8.9713134765625, 9.282958984375, 9.5946044921875, 9.90625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 2.0, 6.0, 5.0, 10.0, 16.0, 32.0, 40.0, 80.0, 189.0, 300.0, 149.0, 61.0, 36.0, 25.0, 16.0, 10.0, 9.0, 4.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025463104248046875, -0.0024143755435943604, -0.002282440662384033, -0.002150505781173706, -0.002018570899963379, -0.0018866360187530518, -0.0017547011375427246, -0.0016227662563323975, -0.0014908313751220703, -0.0013588964939117432, -0.001226961612701416, -0.0010950267314910889, -0.0009630918502807617, -0.0008311569690704346, -0.0006992220878601074, -0.0005672872066497803, -0.0004353523254394531, -0.000303417444229126, -0.00017148256301879883, -3.954768180847168e-05, 9.238719940185547e-05, 0.00022432208061218262, 0.00035625696182250977, 0.0004881918430328369, 0.0006201267242431641, 0.0007520616054534912, 0.0008839964866638184, 0.0010159313678741455, 0.0011478662490844727, 0.0012798011302947998, 0.001411736011505127, 0.001543670892715454, 0.0016756057739257812, 0.0018075406551361084, 0.0019394755363464355, 0.0020714104175567627, 0.00220334529876709, 0.002335280179977417, 0.002467215061187744, 0.0025991499423980713, 0.0027310848236083984, 0.0028630197048187256, 0.0029949545860290527, 0.00312688946723938, 0.003258824348449707, 0.003390759229660034, 0.0035226941108703613, 0.0036546289920806885, 0.0037865638732910156, 0.003918498754501343, 0.00405043363571167, 0.004182368516921997, 0.004314303398132324, 0.004446238279342651, 0.0045781731605529785, 0.004710108041763306, 0.004842042922973633, 0.00497397780418396, 0.005105912685394287, 0.005237847566604614, 0.005369782447814941, 0.0055017173290252686, 0.005633652210235596, 0.005765587091445923, 0.00589752197265625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 12.0, 11.0, 19.0, 13.0, 23.0, 47.0, 65.0, 92.0, 139.0, 230.0, 403.0, 736.0, 1436.0, 3024.0, 7341.0, 21921.0, 106700.0, 818487.0, 61705.0, 15508.0, 5495.0, 2496.0, 1137.0, 552.0, 383.0, 212.0, 103.0, 84.0, 60.0, 31.0, 23.0, 13.0, 15.0, 6.0, 5.0, 6.0, 6.0, 2.0, 1.0, 2.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.6640625, -5.4942626953125, -5.324462890625, -5.1546630859375, -4.98486328125, -4.8150634765625, -4.645263671875, -4.4754638671875, -4.3056640625, -4.1358642578125, -3.966064453125, -3.7962646484375, -3.62646484375, -3.4566650390625, -3.286865234375, -3.1170654296875, -2.947265625, -2.7774658203125, -2.607666015625, -2.4378662109375, -2.26806640625, -2.0982666015625, -1.928466796875, -1.7586669921875, -1.5888671875, -1.4190673828125, -1.249267578125, -1.0794677734375, -0.90966796875, -0.7398681640625, -0.570068359375, -0.4002685546875, -0.23046875, -0.0606689453125, 0.109130859375, 0.2789306640625, 0.44873046875, 0.6185302734375, 0.788330078125, 0.9581298828125, 1.1279296875, 1.2977294921875, 1.467529296875, 1.6373291015625, 1.80712890625, 1.9769287109375, 2.146728515625, 2.3165283203125, 2.486328125, 2.6561279296875, 2.825927734375, 2.9957275390625, 3.16552734375, 3.3353271484375, 3.505126953125, 3.6749267578125, 3.8447265625, 4.0145263671875, 4.184326171875, 4.3541259765625, 4.52392578125, 4.6937255859375, 4.863525390625, 5.0333251953125, 5.203125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 3.0, 3.0, 4.0, 3.0, 10.0, 12.0, 10.0, 11.0, 13.0, 18.0, 25.0, 31.0, 39.0, 50.0, 93.0, 130.0, 163.0, 111.0, 67.0, 50.0, 31.0, 29.0, 16.0, 17.0, 10.0, 12.0, 13.0, 6.0, 1.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 7.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.5625, -8.31304931640625, -8.0635986328125, -7.81414794921875, -7.564697265625, -7.31524658203125, -7.0657958984375, -6.81634521484375, -6.56689453125, -6.31744384765625, -6.0679931640625, -5.81854248046875, -5.569091796875, -5.31964111328125, -5.0701904296875, -4.82073974609375, -4.5712890625, -4.32183837890625, -4.0723876953125, -3.82293701171875, -3.573486328125, -3.32403564453125, -3.0745849609375, -2.82513427734375, -2.57568359375, -2.32623291015625, -2.0767822265625, -1.82733154296875, -1.577880859375, -1.32843017578125, -1.0789794921875, -0.82952880859375, -0.580078125, -0.33062744140625, -0.0811767578125, 0.16827392578125, 0.417724609375, 0.66717529296875, 0.9166259765625, 1.16607666015625, 1.41552734375, 1.66497802734375, 1.9144287109375, 2.16387939453125, 2.413330078125, 2.66278076171875, 2.9122314453125, 3.16168212890625, 3.4111328125, 3.66058349609375, 3.9100341796875, 4.15948486328125, 4.408935546875, 4.65838623046875, 4.9078369140625, 5.15728759765625, 5.40673828125, 5.65618896484375, 5.9056396484375, 6.15509033203125, 6.404541015625, 6.65399169921875, 6.9034423828125, 7.15289306640625, 7.40234375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 14.0, 21.0, 39.0, 84.0, 454.0, 216.0, 59.0, 43.0, 21.0, 16.0, 16.0, 6.0, 6.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-218.70700073242188, -206.44189453125, -194.17677307128906, -181.9116668701172, -169.64654541015625, -157.38143920898438, -145.1163330078125, -132.85122680664062, -120.58610534667969, -108.32099151611328, -96.05587768554688, -83.790771484375, -71.5256576538086, -59.26054382324219, -46.99543762207031, -34.730323791503906, -22.4652099609375, -10.200098037719727, 2.065013885498047, 14.330123901367188, 26.595237731933594, 38.8603515625, 51.125457763671875, 63.39057159423828, 75.65568542480469, 87.9207992553711, 100.1859130859375, 112.45101928710938, 124.71613311767578, 136.9812469482422, 149.24635314941406, 161.511474609375, 173.776611328125, 186.04171752929688, 198.3068389892578, 210.5719451904297, 222.83706665039062, 235.1021728515625, 247.36727905273438, 259.63238525390625, 271.89752197265625, 284.1626281738281, 296.427734375, 308.69287109375, 320.9579772949219, 333.22308349609375, 345.4881896972656, 357.7532958984375, 370.0184020996094, 382.28350830078125, 394.5486145019531, 406.813720703125, 419.078857421875, 431.3439636230469, 443.60906982421875, 455.8741760253906, 468.1392822265625, 480.4043884277344, 492.66949462890625, 504.93463134765625, 517.19970703125, 529.46484375, 541.72998046875, 553.9950561523438, 566.2601928710938]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 2.0, 2.0, 5.0, 14.0, 8.0, 14.0, 7.0, 15.0, 24.0, 23.0, 35.0, 43.0, 27.0, 163.0, 311.0, 76.0, 38.0, 35.0, 27.0, 22.0, 28.0, 17.0, 10.0, 13.0, 19.0, 4.0, 5.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-424.27703857421875, -413.479248046875, -402.6814270019531, -391.8836364746094, -381.0858459472656, -370.28802490234375, -359.490234375, -348.69244384765625, -337.8946533203125, -327.09686279296875, -316.2990417480469, -305.5012512207031, -294.7034606933594, -283.9056396484375, -273.10784912109375, -262.31005859375, -251.51223754882812, -240.7144317626953, -229.91664123535156, -219.11883544921875, -208.321044921875, -197.5232391357422, -186.72543334960938, -175.92764282226562, -165.1298370361328, -154.33203125, -143.53424072265625, -132.73643493652344, -121.93863677978516, -111.14083862304688, -100.34303283691406, -89.54523468017578, -78.7474365234375, -67.94963836669922, -57.15183639526367, -46.354034423828125, -35.556236267089844, -24.758438110351562, -13.96063232421875, -3.1628341674804688, 7.6349639892578125, 18.432764053344727, 29.23056411743164, 40.02836608886719, 50.82616424560547, 61.62396240234375, 72.42176818847656, 83.21956634521484, 94.01736450195312, 104.8151626586914, 115.61296081542969, 126.4107666015625, 137.20855712890625, 148.00636291503906, 158.80416870117188, 169.60195922851562, 180.39976501464844, 191.19757080078125, 201.995361328125, 212.7931671142578, 223.59097290039062, 234.38876342773438, 245.1865692138672, 255.984375, 266.78216552734375]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 6.0, 10.0, 6.0, 12.0, 10.0, 18.0, 18.0, 20.0, 26.0, 21.0, 27.0, 36.0, 42.0, 64.0, 219.0, 160.0, 59.0, 39.0, 33.0, 18.0, 13.0, 22.0, 16.0, 21.0, 16.0, 9.0, 7.0, 5.0, 7.0, 4.0, 9.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.0, -20.381591796875, -19.76318359375, -19.144775390625, -18.5263671875, -17.907958984375, -17.28955078125, -16.671142578125, -16.052734375, -15.434326171875, -14.81591796875, -14.197509765625, -13.5791015625, -12.960693359375, -12.34228515625, -11.723876953125, -11.10546875, -10.487060546875, -9.86865234375, -9.250244140625, -8.6318359375, -8.013427734375, -7.39501953125, -6.776611328125, -6.158203125, -5.539794921875, -4.92138671875, -4.302978515625, -3.6845703125, -3.066162109375, -2.44775390625, -1.829345703125, -1.2109375, -0.592529296875, 0.02587890625, 0.644287109375, 1.2626953125, 1.881103515625, 2.49951171875, 3.117919921875, 3.736328125, 4.354736328125, 4.97314453125, 5.591552734375, 6.2099609375, 6.828369140625, 7.44677734375, 8.065185546875, 8.68359375, 9.302001953125, 9.92041015625, 10.538818359375, 11.1572265625, 11.775634765625, 12.39404296875, 13.012451171875, 13.630859375, 14.249267578125, 14.86767578125, 15.486083984375, 16.1044921875, 16.722900390625, 17.34130859375, 17.959716796875, 18.578125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 9.0, 13.0, 6.0, 28.0, 30.0, 70.0, 146.0, 336.0, 1123.0, 8057.0, 8363413.0, 13015.0, 1546.0, 421.0, 166.0, 82.0, 47.0, 22.0, 18.0, 9.0, 2.0, 3.0, 6.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-355.33447265625, -343.3227233886719, -331.31097412109375, -319.29925537109375, -307.2875061035156, -295.2757568359375, -283.2640380859375, -271.2522888183594, -259.24053955078125, -247.22879028320312, -235.21705627441406, -223.205322265625, -211.19357299804688, -199.18182373046875, -187.1700897216797, -175.15835571289062, -163.1466064453125, -151.13485717773438, -139.1231231689453, -127.11138153076172, -115.09963989257812, -103.08789825439453, -91.07615661621094, -79.06441497802734, -67.05267333984375, -55.040931701660156, -43.02919006347656, -31.01744842529297, -19.005706787109375, -6.993965148925781, 5.0177764892578125, 17.029518127441406, 29.041290283203125, 41.05303192138672, 53.06477355957031, 65.0765151977539, 77.0882568359375, 89.0999984741211, 101.11174011230469, 113.12348175048828, 125.13522338867188, 137.14697265625, 149.15870666503906, 161.17044067382812, 173.18218994140625, 185.19393920898438, 197.20567321777344, 209.2174072265625, 221.22915649414062, 233.24090576171875, 245.2526397705078, 257.2643737792969, 269.276123046875, 281.2878723144531, 293.29962158203125, 305.31134033203125, 317.3230895996094, 329.3348388671875, 341.3465576171875, 353.3583068847656, 365.37005615234375, 377.3818054199219, 389.3935546875, 401.4052734375, 413.4170227050781]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 2.0, 3.0, 3.0, 4.0, 3.0, 7.0, 9.0, 9.0, 4.0, 4.0, 7.0, 4.0, 4.0, 4.0, 0.0, 6.0, 2.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-434.44000244140625, -422.5452880859375, -410.6506042480469, -398.7558898925781, -386.8612060546875, -374.96649169921875, -363.07177734375, -351.17706298828125, -339.2823791503906, -327.3876647949219, -315.49298095703125, -303.5982666015625, -291.70355224609375, -279.8088684082031, -267.9141540527344, -256.01947021484375, -244.124755859375, -232.2300567626953, -220.33535766601562, -208.44064331054688, -196.5459442138672, -184.6512451171875, -172.75653076171875, -160.86183166503906, -148.96713256835938, -137.0724334716797, -125.17772674560547, -113.28302001953125, -101.38832092285156, -89.49362182617188, -77.59891510009766, -65.70420837402344, -53.809478759765625, -41.91477584838867, -30.02007293701172, -18.125370025634766, -6.2306671142578125, 5.664035797119141, 17.558738708496094, 29.453445434570312, 41.34814453125, 53.24284744262695, 65.1375503540039, 77.03225708007812, 88.92695617675781, 100.8216552734375, 112.71636199951172, 124.61106872558594, 136.50576782226562, 148.4004669189453, 160.295166015625, 172.18988037109375, 184.08457946777344, 195.97927856445312, 207.87399291992188, 219.76869201660156, 231.66339111328125, 243.55809020996094, 255.45278930664062, 267.3475036621094, 279.2421875, 291.13690185546875, 303.0316162109375, 314.92633056640625, 326.8210144042969]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 11.0, 15.0, 17.0, 8.0, 20.0, 24.0, 36.0, 63.0, 75.0, 115.0, 151.0, 240.0, 384.0, 635.0, 1043.0, 1876.0, 3492.0, 6913.0, 14705.0, 32820.0, 74380.0, 145635.0, 128143.0, 60574.0, 27001.0, 12453.0, 6093.0, 3024.0, 1626.0, 976.0, 600.0, 361.0, 231.0, 148.0, 101.0, 69.0, 56.0, 40.0, 28.0, 22.0, 23.0, 6.0, 11.0, 7.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-125.0, -121.416015625, -117.83203125, -114.248046875, -110.6640625, -107.080078125, -103.49609375, -99.912109375, -96.328125, -92.744140625, -89.16015625, -85.576171875, -81.9921875, -78.408203125, -74.82421875, -71.240234375, -67.65625, -64.072265625, -60.48828125, -56.904296875, -53.3203125, -49.736328125, -46.15234375, -42.568359375, -38.984375, -35.400390625, -31.81640625, -28.232421875, -24.6484375, -21.064453125, -17.48046875, -13.896484375, -10.3125, -6.728515625, -3.14453125, 0.439453125, 4.0234375, 7.607421875, 11.19140625, 14.775390625, 18.359375, 21.943359375, 25.52734375, 29.111328125, 32.6953125, 36.279296875, 39.86328125, 43.447265625, 47.03125, 50.615234375, 54.19921875, 57.783203125, 61.3671875, 64.951171875, 68.53515625, 72.119140625, 75.703125, 79.287109375, 82.87109375, 86.455078125, 90.0390625, 93.623046875, 97.20703125, 100.791015625, 104.375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 5.0, 4.0, 13.0, 10.0, 16.0, 13.0, 28.0, 24.0, 37.0, 36.0, 52.0, 71.0, 72.0, 85.0, 96.0, 80.0, 73.0, 67.0, 54.0, 38.0, 25.0, 20.0, 23.0, 12.0, 11.0, 7.0, 8.0, 4.0, 6.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.0625, -31.219970703125, -30.37744140625, -29.534912109375, -28.6923828125, -27.849853515625, -27.00732421875, -26.164794921875, -25.322265625, -24.479736328125, -23.63720703125, -22.794677734375, -21.9521484375, -21.109619140625, -20.26708984375, -19.424560546875, -18.58203125, -17.739501953125, -16.89697265625, -16.054443359375, -15.2119140625, -14.369384765625, -13.52685546875, -12.684326171875, -11.841796875, -10.999267578125, -10.15673828125, -9.314208984375, -8.4716796875, -7.629150390625, -6.78662109375, -5.944091796875, -5.1015625, -4.259033203125, -3.41650390625, -2.573974609375, -1.7314453125, -0.888916015625, -0.04638671875, 0.796142578125, 1.638671875, 2.481201171875, 3.32373046875, 4.166259765625, 5.0087890625, 5.851318359375, 6.69384765625, 7.536376953125, 8.37890625, 9.221435546875, 10.06396484375, 10.906494140625, 11.7490234375, 12.591552734375, 13.43408203125, 14.276611328125, 15.119140625, 15.961669921875, 16.80419921875, 17.646728515625, 18.4892578125, 19.331787109375, 20.17431640625, 21.016845703125, 21.859375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 7.0, 11.0, 21.0, 38.0, 105.0, 127.0, 93.0, 35.0, 15.0, 10.0, 9.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-300.0721130371094, -292.0474853515625, -284.02288818359375, -275.9982604980469, -267.9736328125, -259.9490051269531, -251.92440795898438, -243.8997802734375, -235.87515258789062, -227.8505401611328, -219.82591247558594, -211.80130004882812, -203.77667236328125, -195.75205993652344, -187.72744750976562, -179.70281982421875, -171.67820739746094, -163.65359497070312, -155.62896728515625, -147.60435485839844, -139.57972717285156, -131.55511474609375, -123.5304946899414, -115.50587463378906, -107.48125457763672, -99.45663452148438, -91.43201446533203, -83.40739440917969, -75.38278198242188, -67.358154296875, -59.33354187011719, -51.308921813964844, -43.28428649902344, -35.259666442871094, -27.235048294067383, -19.210430145263672, -11.185810089111328, -3.1611900329589844, 4.863426208496094, 12.888046264648438, 20.91266632080078, 28.937286376953125, 36.96190643310547, 44.98652267456055, 53.01114273071289, 61.035762786865234, 69.06037902832031, 77.08499908447266, 85.109619140625, 93.13423919677734, 101.15885925292969, 109.1834716796875, 117.20809936523438, 125.23271179199219, 133.25732421875, 141.28195190429688, 149.30657958984375, 157.33119201660156, 165.35581970214844, 173.38043212890625, 181.40505981445312, 189.42967224121094, 197.45428466796875, 205.47891235351562, 213.50352478027344]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 5.0, 4.0, 4.0, 6.0, 7.0, 4.0, 17.0, 38.0, 89.0, 102.0, 75.0, 49.0, 29.0, 15.0, 4.0, 6.0, 5.0, 6.0, 0.0, 2.0, 2.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-138.60195922851562, -134.61439514160156, -130.62684631347656, -126.6392822265625, -122.65171813964844, -118.6641616821289, -114.67660522460938, -110.68904113769531, -106.70147705078125, -102.71392059326172, -98.72635650634766, -94.73880004882812, -90.75123596191406, -86.76367950439453, -82.776123046875, -78.78855895996094, -74.8010025024414, -70.81344604492188, -66.82588195800781, -62.83832550048828, -58.85076141357422, -54.86320495605469, -50.87564468383789, -46.888084411621094, -42.9005241394043, -38.9129638671875, -34.9254035949707, -30.93784523010254, -26.950284957885742, -22.962724685668945, -18.97516632080078, -14.987606048583984, -11.000045776367188, -7.012485980987549, -3.02492618560791, 0.9626331329345703, 4.950193405151367, 8.937753677368164, 12.925312042236328, 16.912872314453125, 20.900432586669922, 24.88799285888672, 28.875553131103516, 32.86311340332031, 36.850669860839844, 40.838233947753906, 44.82579040527344, 48.813350677490234, 52.80091094970703, 56.78847122192383, 60.776031494140625, 64.76358795166016, 68.75115203857422, 72.73870849609375, 76.72627258300781, 80.71382904052734, 84.70138549804688, 88.6889419555664, 92.67650604248047, 96.6640625, 100.65162658691406, 104.6391830444336, 108.62673950195312, 112.61430358886719, 116.60186767578125]}, "eval/loss": 4.626309871673584, "eval/wer": 0.8567830226100753, "eval/runtime": 668.3691, "eval/samples_per_second": 3.953, "eval/steps_per_second": 0.495, "train/train_runtime": 105887.1553, "train/train_samples_per_second": 5.39, "train/train_steps_per_second": 0.168, "train/total_flos": 0.0, "train/train_loss": 2.9837629611785585} \ No newline at end of file