diff --git "a/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" "b/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" --- "a/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" +++ "b/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.2609, "train/learning_rate": 3.953521126760564e-06, "train/epoch": 21.86, "train/global_step": 19500, "_runtime": 118007, "_timestamp": 1648259351, "_step": 19512, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 5.0, 5.0, 2.0, 0.0, 4.0, 10.0, 9.0, 6.0, 9.0, 9.0, 13.0, 14.0, 13.0, 16.0, 14.0, 26.0, 28.0, 32.0, 36.0, 42.0, 40.0, 39.0, 44.0, 41.0, 43.0, 45.0, 40.0, 41.0, 34.0, 44.0, 43.0, 38.0, 30.0, 25.0, 23.0, 30.0, 20.0, 19.0, 13.0, 16.0, 10.0, 6.0, 8.0, 6.0, 4.0, 4.0, 3.0, 5.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.773677825927734, -20.236312866210938, -19.69894790649414, -19.161582946777344, -18.624216079711914, -18.086851119995117, -17.54948616027832, -17.012121200561523, -16.474756240844727, -15.93739128112793, -15.400025367736816, -14.86266040802002, -14.325295448303223, -13.78792953491211, -13.250564575195312, -12.713199615478516, -12.175833702087402, -11.638468742370605, -11.101102828979492, -10.563737869262695, -10.026372909545898, -9.489007949829102, -8.951642036437988, -8.414277076721191, -7.876911640167236, -7.339546203613281, -6.802181243896484, -6.264815807342529, -5.727450370788574, -5.190085411071777, -4.652719974517822, -4.115354537963867, -3.577988624572754, -3.040623426437378, -2.503258228302002, -1.9658927917480469, -1.428527593612671, -0.8911623954772949, -0.35379695892333984, 0.18356823921203613, 0.7209334373474121, 1.258298635482788, 1.7956639528274536, 2.333029270172119, 2.870394468307495, 3.407759666442871, 3.945125102996826, 4.482490539550781, 5.019855499267578, 5.557220935821533, 6.09458589553833, 6.631951332092285, 7.169316291809082, 7.706681728363037, 8.244047164916992, 8.781412124633789, 9.318777084350586, 9.856142044067383, 10.393507957458496, 10.930872917175293, 11.46823787689209, 12.005603790283203, 12.54296875, 13.080333709716797, 13.61769962310791]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 4.0, 4.0, 9.0, 5.0, 12.0, 10.0, 7.0, 9.0, 22.0, 13.0, 22.0, 19.0, 12.0, 21.0, 21.0, 20.0, 36.0, 32.0, 29.0, 30.0, 43.0, 49.0, 44.0, 44.0, 34.0, 46.0, 47.0, 34.0, 41.0, 32.0, 33.0, 27.0, 23.0, 18.0, 32.0, 10.0, 16.0, 21.0, 13.0, 14.0, 8.0, 3.0, 9.0, 6.0, 8.0, 7.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-15.525087356567383, -15.04666805267334, -14.568248748779297, -14.089829444885254, -13.611410140991211, -13.132989883422852, -12.654570579528809, -12.176151275634766, -11.697731971740723, -11.21931266784668, -10.740893363952637, -10.262474060058594, -9.784053802490234, -9.305635452270508, -8.827215194702148, -8.348795890808105, -7.8703765869140625, -7.3919572830200195, -6.913537979125977, -6.435118198394775, -5.956698894500732, -5.4782795906066895, -4.999859809875488, -4.521440505981445, -4.043021202087402, -3.5646018981933594, -3.0861823558807373, -2.6077628135681152, -2.1293435096740723, -1.6509242057800293, -1.1725046634674072, -0.6940851211547852, -0.2156658172607422, 0.26275360584259033, 0.7411730289459229, 1.2195924520492554, 1.698011875152588, 2.176431179046631, 2.654850721359253, 3.133270263671875, 3.611689567565918, 4.090108871459961, 4.568528175354004, 5.046947956085205, 5.525367259979248, 6.003786563873291, 6.482206344604492, 6.960625648498535, 7.439044952392578, 7.917464256286621, 8.395883560180664, 8.874302864074707, 9.35272216796875, 9.83114242553711, 10.309561729431152, 10.787981033325195, 11.266400337219238, 11.744819641113281, 12.223238945007324, 12.701658248901367, 13.180078506469727, 13.658496856689453, 14.136917114257812, 14.615336418151855, 15.093755722045898]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 6.0, 8.0, 9.0, 29.0, 38.0, 82.0, 105.0, 204.0, 374.0, 613.0, 1049.0, 1868.0, 3197.0, 5767.0, 10291.0, 18625.0, 33443.0, 59118.0, 106599.0, 191991.0, 338871.0, 561121.0, 780596.0, 773383.0, 551120.0, 330416.0, 187334.0, 104899.0, 58312.0, 32589.0, 18124.0, 10396.0, 5809.0, 3354.0, 1854.0, 1069.0, 646.0, 422.0, 223.0, 130.0, 71.0, 44.0, 31.0, 20.0, 11.0, 10.0, 11.0, 5.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.5625, -26.70068359375, -25.8388671875, -24.97705078125, -24.115234375, -23.25341796875, -22.3916015625, -21.52978515625, -20.66796875, -19.80615234375, -18.9443359375, -18.08251953125, -17.220703125, -16.35888671875, -15.4970703125, -14.63525390625, -13.7734375, -12.91162109375, -12.0498046875, -11.18798828125, -10.326171875, -9.46435546875, -8.6025390625, -7.74072265625, -6.87890625, -6.01708984375, -5.1552734375, -4.29345703125, -3.431640625, -2.56982421875, -1.7080078125, -0.84619140625, 0.015625, 0.87744140625, 1.7392578125, 2.60107421875, 3.462890625, 4.32470703125, 5.1865234375, 6.04833984375, 6.91015625, 7.77197265625, 8.6337890625, 9.49560546875, 10.357421875, 11.21923828125, 12.0810546875, 12.94287109375, 13.8046875, 14.66650390625, 15.5283203125, 16.39013671875, 17.251953125, 18.11376953125, 18.9755859375, 19.83740234375, 20.69921875, 21.56103515625, 22.4228515625, 23.28466796875, 24.146484375, 25.00830078125, 25.8701171875, 26.73193359375, 27.59375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 8.0, 7.0, 4.0, 8.0, 9.0, 6.0, 5.0, 11.0, 13.0, 21.0, 8.0, 17.0, 23.0, 13.0, 23.0, 26.0, 26.0, 32.0, 27.0, 41.0, 29.0, 44.0, 43.0, 27.0, 43.0, 37.0, 38.0, 44.0, 51.0, 37.0, 31.0, 28.0, 30.0, 26.0, 18.0, 23.0, 25.0, 15.0, 16.0, 11.0, 12.0, 8.0, 7.0, 10.0, 3.0, 2.0, 4.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-16.390625, -15.8968505859375, -15.403076171875, -14.9093017578125, -14.41552734375, -13.9217529296875, -13.427978515625, -12.9342041015625, -12.4404296875, -11.9466552734375, -11.452880859375, -10.9591064453125, -10.46533203125, -9.9715576171875, -9.477783203125, -8.9840087890625, -8.490234375, -7.9964599609375, -7.502685546875, -7.0089111328125, -6.51513671875, -6.0213623046875, -5.527587890625, -5.0338134765625, -4.5400390625, -4.0462646484375, -3.552490234375, -3.0587158203125, -2.56494140625, -2.0711669921875, -1.577392578125, -1.0836181640625, -0.58984375, -0.0960693359375, 0.397705078125, 0.8914794921875, 1.38525390625, 1.8790283203125, 2.372802734375, 2.8665771484375, 3.3603515625, 3.8541259765625, 4.347900390625, 4.8416748046875, 5.33544921875, 5.8292236328125, 6.322998046875, 6.8167724609375, 7.310546875, 7.8043212890625, 8.298095703125, 8.7918701171875, 9.28564453125, 9.7794189453125, 10.273193359375, 10.7669677734375, 11.2607421875, 11.7545166015625, 12.248291015625, 12.7420654296875, 13.23583984375, 13.7296142578125, 14.223388671875, 14.7171630859375, 15.2109375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 9.0, 14.0, 21.0, 45.0, 56.0, 95.0, 167.0, 285.0, 411.0, 747.0, 1296.0, 2053.0, 3510.0, 6276.0, 10517.0, 18531.0, 31791.0, 54954.0, 92458.0, 154517.0, 251333.0, 388724.0, 549180.0, 659820.0, 631417.0, 487430.0, 330940.0, 208451.0, 126714.0, 76304.0, 44387.0, 25942.0, 14904.0, 8909.0, 5034.0, 2949.0, 1694.0, 964.0, 594.0, 334.0, 185.0, 111.0, 79.0, 48.0, 30.0, 20.0, 15.0, 9.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.171875, -19.51708984375, -18.8623046875, -18.20751953125, -17.552734375, -16.89794921875, -16.2431640625, -15.58837890625, -14.93359375, -14.27880859375, -13.6240234375, -12.96923828125, -12.314453125, -11.65966796875, -11.0048828125, -10.35009765625, -9.6953125, -9.04052734375, -8.3857421875, -7.73095703125, -7.076171875, -6.42138671875, -5.7666015625, -5.11181640625, -4.45703125, -3.80224609375, -3.1474609375, -2.49267578125, -1.837890625, -1.18310546875, -0.5283203125, 0.12646484375, 0.78125, 1.43603515625, 2.0908203125, 2.74560546875, 3.400390625, 4.05517578125, 4.7099609375, 5.36474609375, 6.01953125, 6.67431640625, 7.3291015625, 7.98388671875, 8.638671875, 9.29345703125, 9.9482421875, 10.60302734375, 11.2578125, 11.91259765625, 12.5673828125, 13.22216796875, 13.876953125, 14.53173828125, 15.1865234375, 15.84130859375, 16.49609375, 17.15087890625, 17.8056640625, 18.46044921875, 19.115234375, 19.77001953125, 20.4248046875, 21.07958984375, 21.734375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 8.0, 8.0, 12.0, 18.0, 24.0, 32.0, 43.0, 46.0, 70.0, 79.0, 124.0, 129.0, 172.0, 155.0, 206.0, 255.0, 282.0, 298.0, 297.0, 283.0, 238.0, 264.0, 203.0, 135.0, 158.0, 122.0, 108.0, 68.0, 60.0, 46.0, 36.0, 26.0, 24.0, 12.0, 11.0, 9.0, 7.0, 0.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4921875, -8.177734375, -7.86328125, -7.548828125, -7.234375, -6.919921875, -6.60546875, -6.291015625, -5.9765625, -5.662109375, -5.34765625, -5.033203125, -4.71875, -4.404296875, -4.08984375, -3.775390625, -3.4609375, -3.146484375, -2.83203125, -2.517578125, -2.203125, -1.888671875, -1.57421875, -1.259765625, -0.9453125, -0.630859375, -0.31640625, -0.001953125, 0.3125, 0.626953125, 0.94140625, 1.255859375, 1.5703125, 1.884765625, 2.19921875, 2.513671875, 2.828125, 3.142578125, 3.45703125, 3.771484375, 4.0859375, 4.400390625, 4.71484375, 5.029296875, 5.34375, 5.658203125, 5.97265625, 6.287109375, 6.6015625, 6.916015625, 7.23046875, 7.544921875, 7.859375, 8.173828125, 8.48828125, 8.802734375, 9.1171875, 9.431640625, 9.74609375, 10.060546875, 10.375, 10.689453125, 11.00390625, 11.318359375, 11.6328125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 1.0, 9.0, 8.0, 17.0, 19.0, 16.0, 14.0, 24.0, 28.0, 36.0, 21.0, 35.0, 33.0, 47.0, 46.0, 51.0, 48.0, 42.0, 52.0, 56.0, 42.0, 45.0, 41.0, 36.0, 26.0, 31.0, 38.0, 26.0, 20.0, 16.0, 16.0, 13.0, 13.0, 10.0, 10.0, 10.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.74880599975586, -17.044118881225586, -16.339431762695312, -15.634745597839355, -14.930058479309082, -14.225371360778809, -13.520685195922852, -12.815998077392578, -12.111310958862305, -11.406623840332031, -10.701936721801758, -9.9972505569458, -9.292563438415527, -8.587876319885254, -7.883189678192139, -7.178503036499023, -6.47381591796875, -5.769128799438477, -5.064442157745361, -4.359755516052246, -3.6550683975219727, -2.9503815174102783, -2.245694637298584, -1.5410079956054688, -0.8363208770751953, -0.13163399696350098, 0.5730528831481934, 1.2777397632598877, 1.982426643371582, 2.6871135234832764, 3.3918004035949707, 4.096487045288086, 4.801172256469727, 5.505859375, 6.210546016693115, 6.9152326583862305, 7.619919776916504, 8.324606895446777, 9.029293060302734, 9.733980178833008, 10.438667297363281, 11.143354415893555, 11.848041534423828, 12.552727699279785, 13.257414817810059, 13.962101936340332, 14.666788101196289, 15.371475219726562, 16.076162338256836, 16.78084945678711, 17.485536575317383, 18.190223693847656, 18.894908905029297, 19.59959602355957, 20.304283142089844, 21.008970260620117, 21.71365737915039, 22.418344497680664, 23.123031616210938, 23.82771873474121, 24.532405853271484, 25.237091064453125, 25.9417781829834, 26.646465301513672, 27.351152420043945]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 15.0, 6.0, 17.0, 9.0, 12.0, 16.0, 12.0, 13.0, 16.0, 19.0, 33.0, 34.0, 25.0, 32.0, 35.0, 40.0, 42.0, 36.0, 41.0, 57.0, 41.0, 45.0, 38.0, 39.0, 32.0, 32.0, 32.0, 37.0, 32.0, 24.0, 17.0, 23.0, 14.0, 17.0, 14.0, 16.0, 11.0, 9.0, 4.0, 2.0, 8.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.06359100341797, -19.425167083740234, -18.7867431640625, -18.148319244384766, -17.50989532470703, -16.871471405029297, -16.233047485351562, -15.594623565673828, -14.956199645996094, -14.31777572631836, -13.679351806640625, -13.04092788696289, -12.402503967285156, -11.764080047607422, -11.125656127929688, -10.487232208251953, -9.848808288574219, -9.210384368896484, -8.57196044921875, -7.933536529541016, -7.295112609863281, -6.656688690185547, -6.0182647705078125, -5.379840850830078, -4.741416931152344, -4.102993011474609, -3.464569091796875, -2.8261451721191406, -2.1877212524414062, -1.5492973327636719, -0.9108734130859375, -0.2724494934082031, 0.36597251892089844, 1.0043964385986328, 1.6428203582763672, 2.2812442779541016, 2.919668197631836, 3.5580921173095703, 4.196516036987305, 4.834939956665039, 5.473363876342773, 6.111787796020508, 6.750211715698242, 7.388635635375977, 8.027059555053711, 8.665483474731445, 9.30390739440918, 9.942331314086914, 10.580755233764648, 11.219179153442383, 11.857603073120117, 12.496026992797852, 13.134450912475586, 13.77287483215332, 14.411298751831055, 15.049722671508789, 15.688146591186523, 16.326570510864258, 16.964994430541992, 17.603418350219727, 18.24184226989746, 18.880266189575195, 19.51869010925293, 20.157114028930664, 20.7955379486084]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 6.0, 5.0, 13.0, 13.0, 27.0, 60.0, 68.0, 112.0, 145.0, 240.0, 390.0, 542.0, 822.0, 1240.0, 1955.0, 2982.0, 4479.0, 6747.0, 10498.0, 16177.0, 23978.0, 35520.0, 50978.0, 71072.0, 92667.0, 113005.0, 122672.0, 119214.0, 103050.0, 81382.0, 59310.0, 42465.0, 28989.0, 19668.0, 13094.0, 8630.0, 5722.0, 3691.0, 2322.0, 1593.0, 1004.0, 701.0, 432.0, 307.0, 177.0, 138.0, 94.0, 61.0, 35.0, 20.0, 20.0, 11.0, 10.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.53125, -17.908203125, -17.28515625, -16.662109375, -16.0390625, -15.416015625, -14.79296875, -14.169921875, -13.546875, -12.923828125, -12.30078125, -11.677734375, -11.0546875, -10.431640625, -9.80859375, -9.185546875, -8.5625, -7.939453125, -7.31640625, -6.693359375, -6.0703125, -5.447265625, -4.82421875, -4.201171875, -3.578125, -2.955078125, -2.33203125, -1.708984375, -1.0859375, -0.462890625, 0.16015625, 0.783203125, 1.40625, 2.029296875, 2.65234375, 3.275390625, 3.8984375, 4.521484375, 5.14453125, 5.767578125, 6.390625, 7.013671875, 7.63671875, 8.259765625, 8.8828125, 9.505859375, 10.12890625, 10.751953125, 11.375, 11.998046875, 12.62109375, 13.244140625, 13.8671875, 14.490234375, 15.11328125, 15.736328125, 16.359375, 16.982421875, 17.60546875, 18.228515625, 18.8515625, 19.474609375, 20.09765625, 20.720703125, 21.34375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 5.0, 9.0, 8.0, 6.0, 11.0, 13.0, 17.0, 8.0, 20.0, 22.0, 32.0, 26.0, 27.0, 31.0, 42.0, 45.0, 27.0, 48.0, 38.0, 51.0, 51.0, 51.0, 52.0, 36.0, 37.0, 28.0, 44.0, 31.0, 29.0, 17.0, 26.0, 24.0, 18.0, 24.0, 10.0, 16.0, 8.0, 11.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.890625, -19.232666015625, -18.57470703125, -17.916748046875, -17.2587890625, -16.600830078125, -15.94287109375, -15.284912109375, -14.626953125, -13.968994140625, -13.31103515625, -12.653076171875, -11.9951171875, -11.337158203125, -10.67919921875, -10.021240234375, -9.36328125, -8.705322265625, -8.04736328125, -7.389404296875, -6.7314453125, -6.073486328125, -5.41552734375, -4.757568359375, -4.099609375, -3.441650390625, -2.78369140625, -2.125732421875, -1.4677734375, -0.809814453125, -0.15185546875, 0.506103515625, 1.1640625, 1.822021484375, 2.47998046875, 3.137939453125, 3.7958984375, 4.453857421875, 5.11181640625, 5.769775390625, 6.427734375, 7.085693359375, 7.74365234375, 8.401611328125, 9.0595703125, 9.717529296875, 10.37548828125, 11.033447265625, 11.69140625, 12.349365234375, 13.00732421875, 13.665283203125, 14.3232421875, 14.981201171875, 15.63916015625, 16.297119140625, 16.955078125, 17.613037109375, 18.27099609375, 18.928955078125, 19.5869140625, 20.244873046875, 20.90283203125, 21.560791015625, 22.21875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 11.0, 4.0, 15.0, 18.0, 31.0, 41.0, 60.0, 73.0, 113.0, 168.0, 233.0, 369.0, 594.0, 937.0, 1551.0, 2559.0, 4266.0, 7319.0, 12488.0, 22510.0, 39596.0, 71021.0, 120886.0, 182403.0, 203363.0, 155244.0, 96099.0, 54402.0, 30514.0, 17177.0, 9839.0, 5768.0, 3366.0, 2044.0, 1229.0, 781.0, 525.0, 297.0, 199.0, 125.0, 97.0, 65.0, 46.0, 24.0, 25.0, 19.0, 13.0, 9.0, 11.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-32.375, -31.3056640625, -30.236328125, -29.1669921875, -28.09765625, -27.0283203125, -25.958984375, -24.8896484375, -23.8203125, -22.7509765625, -21.681640625, -20.6123046875, -19.54296875, -18.4736328125, -17.404296875, -16.3349609375, -15.265625, -14.1962890625, -13.126953125, -12.0576171875, -10.98828125, -9.9189453125, -8.849609375, -7.7802734375, -6.7109375, -5.6416015625, -4.572265625, -3.5029296875, -2.43359375, -1.3642578125, -0.294921875, 0.7744140625, 1.84375, 2.9130859375, 3.982421875, 5.0517578125, 6.12109375, 7.1904296875, 8.259765625, 9.3291015625, 10.3984375, 11.4677734375, 12.537109375, 13.6064453125, 14.67578125, 15.7451171875, 16.814453125, 17.8837890625, 18.953125, 20.0224609375, 21.091796875, 22.1611328125, 23.23046875, 24.2998046875, 25.369140625, 26.4384765625, 27.5078125, 28.5771484375, 29.646484375, 30.7158203125, 31.78515625, 32.8544921875, 33.923828125, 34.9931640625, 36.0625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 1.0, 3.0, 3.0, 4.0, 7.0, 5.0, 10.0, 5.0, 13.0, 15.0, 11.0, 10.0, 16.0, 23.0, 14.0, 15.0, 28.0, 32.0, 25.0, 33.0, 29.0, 34.0, 33.0, 43.0, 48.0, 37.0, 29.0, 35.0, 38.0, 35.0, 23.0, 40.0, 25.0, 33.0, 38.0, 32.0, 25.0, 16.0, 13.0, 21.0, 15.0, 16.0, 5.0, 10.0, 10.0, 14.0, 6.0, 13.0, 6.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-12.578125, -12.19189453125, -11.8056640625, -11.41943359375, -11.033203125, -10.64697265625, -10.2607421875, -9.87451171875, -9.48828125, -9.10205078125, -8.7158203125, -8.32958984375, -7.943359375, -7.55712890625, -7.1708984375, -6.78466796875, -6.3984375, -6.01220703125, -5.6259765625, -5.23974609375, -4.853515625, -4.46728515625, -4.0810546875, -3.69482421875, -3.30859375, -2.92236328125, -2.5361328125, -2.14990234375, -1.763671875, -1.37744140625, -0.9912109375, -0.60498046875, -0.21875, 0.16748046875, 0.5537109375, 0.93994140625, 1.326171875, 1.71240234375, 2.0986328125, 2.48486328125, 2.87109375, 3.25732421875, 3.6435546875, 4.02978515625, 4.416015625, 4.80224609375, 5.1884765625, 5.57470703125, 5.9609375, 6.34716796875, 6.7333984375, 7.11962890625, 7.505859375, 7.89208984375, 8.2783203125, 8.66455078125, 9.05078125, 9.43701171875, 9.8232421875, 10.20947265625, 10.595703125, 10.98193359375, 11.3681640625, 11.75439453125, 12.140625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 7.0, 16.0, 13.0, 12.0, 18.0, 16.0, 50.0, 50.0, 70.0, 86.0, 120.0, 200.0, 305.0, 443.0, 786.0, 1495.0, 3192.0, 9027.0, 32540.0, 149322.0, 474376.0, 287787.0, 63340.0, 15507.0, 4959.0, 2098.0, 1020.0, 568.0, 354.0, 245.0, 164.0, 107.0, 68.0, 55.0, 50.0, 19.0, 29.0, 14.0, 3.0, 11.0, 1.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.65625, -30.59130859375, -29.5263671875, -28.46142578125, -27.396484375, -26.33154296875, -25.2666015625, -24.20166015625, -23.13671875, -22.07177734375, -21.0068359375, -19.94189453125, -18.876953125, -17.81201171875, -16.7470703125, -15.68212890625, -14.6171875, -13.55224609375, -12.4873046875, -11.42236328125, -10.357421875, -9.29248046875, -8.2275390625, -7.16259765625, -6.09765625, -5.03271484375, -3.9677734375, -2.90283203125, -1.837890625, -0.77294921875, 0.2919921875, 1.35693359375, 2.421875, 3.48681640625, 4.5517578125, 5.61669921875, 6.681640625, 7.74658203125, 8.8115234375, 9.87646484375, 10.94140625, 12.00634765625, 13.0712890625, 14.13623046875, 15.201171875, 16.26611328125, 17.3310546875, 18.39599609375, 19.4609375, 20.52587890625, 21.5908203125, 22.65576171875, 23.720703125, 24.78564453125, 25.8505859375, 26.91552734375, 27.98046875, 29.04541015625, 30.1103515625, 31.17529296875, 32.240234375, 33.30517578125, 34.3701171875, 35.43505859375, 36.5]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 8.0, 12.0, 11.0, 30.0, 29.0, 46.0, 63.0, 96.0, 105.0, 114.0, 106.0, 103.0, 73.0, 48.0, 54.0, 35.0, 25.0, 18.0, 7.0, 9.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021266937255859375, -0.002052873373031616, -0.001979053020477295, -0.0019052326679229736, -0.0018314123153686523, -0.001757591962814331, -0.0016837716102600098, -0.0016099512577056885, -0.0015361309051513672, -0.001462310552597046, -0.0013884902000427246, -0.0013146698474884033, -0.001240849494934082, -0.0011670291423797607, -0.0010932087898254395, -0.0010193884372711182, -0.0009455680847167969, -0.0008717477321624756, -0.0007979273796081543, -0.000724107027053833, -0.0006502866744995117, -0.0005764663219451904, -0.0005026459693908691, -0.00042882561683654785, -0.00035500526428222656, -0.0002811849117279053, -0.00020736455917358398, -0.0001335442066192627, -5.9723854064941406e-05, 1.4096498489379883e-05, 8.791685104370117e-05, 0.00016173720359802246, 0.00023555755615234375, 0.00030937790870666504, 0.00038319826126098633, 0.0004570186138153076, 0.0005308389663696289, 0.0006046593189239502, 0.0006784796714782715, 0.0007523000240325928, 0.0008261203765869141, 0.0008999407291412354, 0.0009737610816955566, 0.001047581434249878, 0.0011214017868041992, 0.0011952221393585205, 0.0012690424919128418, 0.001342862844467163, 0.0014166831970214844, 0.0014905035495758057, 0.001564323902130127, 0.0016381442546844482, 0.0017119646072387695, 0.0017857849597930908, 0.0018596053123474121, 0.0019334256649017334, 0.0020072460174560547, 0.002081066370010376, 0.0021548867225646973, 0.0022287070751190186, 0.00230252742767334, 0.002376347780227661, 0.0024501681327819824, 0.0025239884853363037, 0.002597808837890625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 8.0, 8.0, 11.0, 14.0, 34.0, 28.0, 55.0, 53.0, 90.0, 148.0, 186.0, 228.0, 310.0, 393.0, 606.0, 859.0, 1297.0, 2338.0, 5096.0, 14594.0, 48106.0, 161153.0, 359158.0, 295291.0, 108203.0, 31128.0, 9731.0, 3706.0, 1807.0, 1151.0, 768.0, 551.0, 395.0, 298.0, 229.0, 131.0, 114.0, 72.0, 55.0, 43.0, 31.0, 19.0, 27.0, 6.0, 12.0, 4.0, 2.0, 5.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.78125, -31.7177734375, -30.654296875, -29.5908203125, -28.52734375, -27.4638671875, -26.400390625, -25.3369140625, -24.2734375, -23.2099609375, -22.146484375, -21.0830078125, -20.01953125, -18.9560546875, -17.892578125, -16.8291015625, -15.765625, -14.7021484375, -13.638671875, -12.5751953125, -11.51171875, -10.4482421875, -9.384765625, -8.3212890625, -7.2578125, -6.1943359375, -5.130859375, -4.0673828125, -3.00390625, -1.9404296875, -0.876953125, 0.1865234375, 1.25, 2.3134765625, 3.376953125, 4.4404296875, 5.50390625, 6.5673828125, 7.630859375, 8.6943359375, 9.7578125, 10.8212890625, 11.884765625, 12.9482421875, 14.01171875, 15.0751953125, 16.138671875, 17.2021484375, 18.265625, 19.3291015625, 20.392578125, 21.4560546875, 22.51953125, 23.5830078125, 24.646484375, 25.7099609375, 26.7734375, 27.8369140625, 28.900390625, 29.9638671875, 31.02734375, 32.0908203125, 33.154296875, 34.2177734375, 35.28125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 9.0, 10.0, 23.0, 29.0, 40.0, 59.0, 73.0, 87.0, 95.0, 98.0, 107.0, 97.0, 73.0, 54.0, 50.0, 30.0, 17.0, 11.0, 8.0, 6.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.59375, -10.2774658203125, -9.961181640625, -9.6448974609375, -9.32861328125, -9.0123291015625, -8.696044921875, -8.3797607421875, -8.0634765625, -7.7471923828125, -7.430908203125, -7.1146240234375, -6.79833984375, -6.4820556640625, -6.165771484375, -5.8494873046875, -5.533203125, -5.2169189453125, -4.900634765625, -4.5843505859375, -4.26806640625, -3.9517822265625, -3.635498046875, -3.3192138671875, -3.0029296875, -2.6866455078125, -2.370361328125, -2.0540771484375, -1.73779296875, -1.4215087890625, -1.105224609375, -0.7889404296875, -0.47265625, -0.1563720703125, 0.159912109375, 0.4761962890625, 0.79248046875, 1.1087646484375, 1.425048828125, 1.7413330078125, 2.0576171875, 2.3739013671875, 2.690185546875, 3.0064697265625, 3.32275390625, 3.6390380859375, 3.955322265625, 4.2716064453125, 4.587890625, 4.9041748046875, 5.220458984375, 5.5367431640625, 5.85302734375, 6.1693115234375, 6.485595703125, 6.8018798828125, 7.1181640625, 7.4344482421875, 7.750732421875, 8.0670166015625, 8.38330078125, 8.6995849609375, 9.015869140625, 9.3321533203125, 9.6484375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 11.0, 8.0, 8.0, 12.0, 15.0, 22.0, 16.0, 20.0, 29.0, 35.0, 34.0, 43.0, 31.0, 45.0, 53.0, 46.0, 48.0, 62.0, 57.0, 37.0, 67.0, 45.0, 43.0, 44.0, 27.0, 18.0, 22.0, 19.0, 15.0, 24.0, 13.0, 8.0, 8.0, 7.0, 8.0, 8.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.716394424438477, -20.0308780670166, -19.345359802246094, -18.65984344482422, -17.974327087402344, -17.28881072998047, -16.603294372558594, -15.917776107788086, -15.232259750366211, -14.546743392944336, -13.861226081848145, -13.175708770751953, -12.490192413330078, -11.804676055908203, -11.119158744812012, -10.43364143371582, -9.748125076293945, -9.06260871887207, -8.377091407775879, -7.691574573516846, -7.0060577392578125, -6.320540904998779, -5.635024070739746, -4.949507236480713, -4.26399040222168, -3.5784735679626465, -2.8929567337036133, -2.20743989944458, -1.5219230651855469, -0.8364062309265137, -0.15088939666748047, 0.5346274375915527, 1.2201423645019531, 1.9056591987609863, 2.5911760330200195, 3.2766928672790527, 3.962209701538086, 4.647726535797119, 5.333243370056152, 6.0187602043151855, 6.704277038574219, 7.389793872833252, 8.075310707092285, 8.760828018188477, 9.446344375610352, 10.131860733032227, 10.817378044128418, 11.50289535522461, 12.188411712646484, 12.87392807006836, 13.55944538116455, 14.244962692260742, 14.930479049682617, 15.615995407104492, 16.301513671875, 16.987030029296875, 17.67254638671875, 18.358062744140625, 19.0435791015625, 19.729097366333008, 20.414613723754883, 21.100130081176758, 21.785648345947266, 22.47116470336914, 23.156681060791016]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 1.0, 3.0, 4.0, 6.0, 11.0, 14.0, 14.0, 15.0, 11.0, 9.0, 9.0, 14.0, 21.0, 12.0, 25.0, 26.0, 31.0, 36.0, 33.0, 41.0, 30.0, 40.0, 45.0, 40.0, 36.0, 56.0, 31.0, 34.0, 36.0, 31.0, 34.0, 29.0, 32.0, 25.0, 22.0, 23.0, 23.0, 15.0, 18.0, 17.0, 9.0, 13.0, 13.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-19.24850845336914, -18.684755325317383, -18.121004104614258, -17.5572509765625, -16.993497848510742, -16.429744720458984, -15.86599349975586, -15.302240371704102, -14.738487243652344, -14.174735069274902, -13.610981941223145, -13.047229766845703, -12.483476638793945, -11.919724464416504, -11.355972290039062, -10.792219161987305, -10.228466987609863, -9.664714813232422, -9.100961685180664, -8.537209510803223, -7.973456382751465, -7.409704208374023, -6.845951557159424, -6.282198905944824, -5.718446254730225, -5.154693603515625, -4.590940952301025, -4.027188301086426, -3.4634358882904053, -2.8996832370758057, -2.335930824279785, -1.7721781730651855, -1.208425521850586, -0.6446729302406311, -0.08092033863067627, 0.4828321933746338, 1.0465848445892334, 1.610337495803833, 2.1740899085998535, 2.737842559814453, 3.3015952110290527, 3.8653478622436523, 4.429100513458252, 4.992853164672852, 5.556605339050293, 6.120358467102051, 6.684110641479492, 7.247863292694092, 7.811615943908691, 8.375368118286133, 8.93912124633789, 9.502873420715332, 10.06662654876709, 10.630378723144531, 11.194131851196289, 11.75788402557373, 12.321636199951172, 12.885388374328613, 13.449141502380371, 14.012893676757812, 14.57664680480957, 15.140398979187012, 15.704151153564453, 16.26790428161621, 16.83165740966797]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 11.0, 10.0, 15.0, 30.0, 55.0, 86.0, 155.0, 239.0, 367.0, 593.0, 971.0, 1674.0, 2690.0, 4404.0, 7331.0, 11718.0, 18836.0, 28795.0, 42796.0, 60646.0, 81256.0, 101449.0, 116136.0, 120584.0, 113253.0, 96249.0, 75464.0, 55550.0, 38420.0, 25482.0, 16513.0, 10461.0, 6384.0, 3919.0, 2363.0, 1446.0, 871.0, 559.0, 306.0, 173.0, 114.0, 68.0, 38.0, 21.0, 9.0, 11.0, 12.0, 7.0, 6.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-16.515625, -15.989013671875, -15.46240234375, -14.935791015625, -14.4091796875, -13.882568359375, -13.35595703125, -12.829345703125, -12.302734375, -11.776123046875, -11.24951171875, -10.722900390625, -10.1962890625, -9.669677734375, -9.14306640625, -8.616455078125, -8.08984375, -7.563232421875, -7.03662109375, -6.510009765625, -5.9833984375, -5.456787109375, -4.93017578125, -4.403564453125, -3.876953125, -3.350341796875, -2.82373046875, -2.297119140625, -1.7705078125, -1.243896484375, -0.71728515625, -0.190673828125, 0.3359375, 0.862548828125, 1.38916015625, 1.915771484375, 2.4423828125, 2.968994140625, 3.49560546875, 4.022216796875, 4.548828125, 5.075439453125, 5.60205078125, 6.128662109375, 6.6552734375, 7.181884765625, 7.70849609375, 8.235107421875, 8.76171875, 9.288330078125, 9.81494140625, 10.341552734375, 10.8681640625, 11.394775390625, 11.92138671875, 12.447998046875, 12.974609375, 13.501220703125, 14.02783203125, 14.554443359375, 15.0810546875, 15.607666015625, 16.13427734375, 16.660888671875, 17.1875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 5.0, 7.0, 8.0, 6.0, 7.0, 14.0, 20.0, 14.0, 9.0, 8.0, 28.0, 13.0, 23.0, 25.0, 27.0, 32.0, 34.0, 33.0, 38.0, 38.0, 53.0, 48.0, 36.0, 35.0, 32.0, 33.0, 38.0, 36.0, 39.0, 37.0, 27.0, 31.0, 18.0, 21.0, 17.0, 14.0, 27.0, 13.0, 12.0, 7.0, 8.0, 13.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-18.5, -17.928955078125, -17.35791015625, -16.786865234375, -16.2158203125, -15.644775390625, -15.07373046875, -14.502685546875, -13.931640625, -13.360595703125, -12.78955078125, -12.218505859375, -11.6474609375, -11.076416015625, -10.50537109375, -9.934326171875, -9.36328125, -8.792236328125, -8.22119140625, -7.650146484375, -7.0791015625, -6.508056640625, -5.93701171875, -5.365966796875, -4.794921875, -4.223876953125, -3.65283203125, -3.081787109375, -2.5107421875, -1.939697265625, -1.36865234375, -0.797607421875, -0.2265625, 0.344482421875, 0.91552734375, 1.486572265625, 2.0576171875, 2.628662109375, 3.19970703125, 3.770751953125, 4.341796875, 4.912841796875, 5.48388671875, 6.054931640625, 6.6259765625, 7.197021484375, 7.76806640625, 8.339111328125, 8.91015625, 9.481201171875, 10.05224609375, 10.623291015625, 11.1943359375, 11.765380859375, 12.33642578125, 12.907470703125, 13.478515625, 14.049560546875, 14.62060546875, 15.191650390625, 15.7626953125, 16.333740234375, 16.90478515625, 17.475830078125, 18.046875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 7.0, 10.0, 15.0, 26.0, 28.0, 38.0, 73.0, 127.0, 174.0, 294.0, 466.0, 624.0, 1042.0, 1459.0, 2182.0, 3258.0, 4820.0, 7042.0, 10307.0, 15299.0, 21782.0, 30118.0, 40813.0, 53693.0, 68012.0, 80947.0, 91998.0, 97118.0, 96851.0, 90657.0, 79517.0, 65573.0, 51155.0, 39555.0, 28498.0, 20472.0, 14040.0, 10043.0, 6712.0, 4517.0, 3138.0, 1990.0, 1332.0, 927.0, 669.0, 406.0, 267.0, 191.0, 86.0, 82.0, 44.0, 25.0, 17.0, 15.0, 7.0, 10.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-15.7890625, -15.2784423828125, -14.767822265625, -14.2572021484375, -13.74658203125, -13.2359619140625, -12.725341796875, -12.2147216796875, -11.7041015625, -11.1934814453125, -10.682861328125, -10.1722412109375, -9.66162109375, -9.1510009765625, -8.640380859375, -8.1297607421875, -7.619140625, -7.1085205078125, -6.597900390625, -6.0872802734375, -5.57666015625, -5.0660400390625, -4.555419921875, -4.0447998046875, -3.5341796875, -3.0235595703125, -2.512939453125, -2.0023193359375, -1.49169921875, -0.9810791015625, -0.470458984375, 0.0401611328125, 0.55078125, 1.0614013671875, 1.572021484375, 2.0826416015625, 2.59326171875, 3.1038818359375, 3.614501953125, 4.1251220703125, 4.6357421875, 5.1463623046875, 5.656982421875, 6.1676025390625, 6.67822265625, 7.1888427734375, 7.699462890625, 8.2100830078125, 8.720703125, 9.2313232421875, 9.741943359375, 10.2525634765625, 10.76318359375, 11.2738037109375, 11.784423828125, 12.2950439453125, 12.8056640625, 13.3162841796875, 13.826904296875, 14.3375244140625, 14.84814453125, 15.3587646484375, 15.869384765625, 16.3800048828125, 16.890625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 3.0, 4.0, 3.0, 5.0, 10.0, 8.0, 8.0, 11.0, 7.0, 13.0, 17.0, 17.0, 18.0, 30.0, 28.0, 29.0, 32.0, 34.0, 34.0, 35.0, 35.0, 38.0, 33.0, 39.0, 44.0, 35.0, 36.0, 34.0, 38.0, 42.0, 36.0, 32.0, 24.0, 24.0, 33.0, 22.0, 16.0, 20.0, 15.0, 14.0, 11.0, 13.0, 5.0, 6.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0], "bins": [-13.90625, -13.512939453125, -13.11962890625, -12.726318359375, -12.3330078125, -11.939697265625, -11.54638671875, -11.153076171875, -10.759765625, -10.366455078125, -9.97314453125, -9.579833984375, -9.1865234375, -8.793212890625, -8.39990234375, -8.006591796875, -7.61328125, -7.219970703125, -6.82666015625, -6.433349609375, -6.0400390625, -5.646728515625, -5.25341796875, -4.860107421875, -4.466796875, -4.073486328125, -3.68017578125, -3.286865234375, -2.8935546875, -2.500244140625, -2.10693359375, -1.713623046875, -1.3203125, -0.927001953125, -0.53369140625, -0.140380859375, 0.2529296875, 0.646240234375, 1.03955078125, 1.432861328125, 1.826171875, 2.219482421875, 2.61279296875, 3.006103515625, 3.3994140625, 3.792724609375, 4.18603515625, 4.579345703125, 4.97265625, 5.365966796875, 5.75927734375, 6.152587890625, 6.5458984375, 6.939208984375, 7.33251953125, 7.725830078125, 8.119140625, 8.512451171875, 8.90576171875, 9.299072265625, 9.6923828125, 10.085693359375, 10.47900390625, 10.872314453125, 11.265625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 0.0, 4.0, 10.0, 6.0, 14.0, 17.0, 31.0, 36.0, 48.0, 68.0, 116.0, 172.0, 231.0, 372.0, 593.0, 1000.0, 1586.0, 2601.0, 4297.0, 7387.0, 12716.0, 21366.0, 34549.0, 55233.0, 81881.0, 112320.0, 136326.0, 144092.0, 130486.0, 103973.0, 73735.0, 48400.0, 29882.0, 18209.0, 10862.0, 6281.0, 3758.0, 2215.0, 1387.0, 817.0, 509.0, 318.0, 214.0, 141.0, 88.0, 59.0, 48.0, 31.0, 24.0, 20.0, 12.0, 8.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.71484375, -6.50067138671875, -6.2864990234375, -6.07232666015625, -5.858154296875, -5.64398193359375, -5.4298095703125, -5.21563720703125, -5.00146484375, -4.78729248046875, -4.5731201171875, -4.35894775390625, -4.144775390625, -3.93060302734375, -3.7164306640625, -3.50225830078125, -3.2880859375, -3.07391357421875, -2.8597412109375, -2.64556884765625, -2.431396484375, -2.21722412109375, -2.0030517578125, -1.78887939453125, -1.57470703125, -1.36053466796875, -1.1463623046875, -0.93218994140625, -0.718017578125, -0.50384521484375, -0.2896728515625, -0.07550048828125, 0.138671875, 0.35284423828125, 0.5670166015625, 0.78118896484375, 0.995361328125, 1.20953369140625, 1.4237060546875, 1.63787841796875, 1.85205078125, 2.06622314453125, 2.2803955078125, 2.49456787109375, 2.708740234375, 2.92291259765625, 3.1370849609375, 3.35125732421875, 3.5654296875, 3.77960205078125, 3.9937744140625, 4.20794677734375, 4.422119140625, 4.63629150390625, 4.8504638671875, 5.06463623046875, 5.27880859375, 5.49298095703125, 5.7071533203125, 5.92132568359375, 6.135498046875, 6.34967041015625, 6.5638427734375, 6.77801513671875, 6.9921875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 7.0, 4.0, 6.0, 13.0, 10.0, 16.0, 30.0, 22.0, 42.0, 38.0, 40.0, 44.0, 48.0, 59.0, 50.0, 55.0, 70.0, 59.0, 75.0, 49.0, 43.0, 41.0, 37.0, 42.0, 18.0, 19.0, 16.0, 5.0, 10.0, 4.0, 4.0, 5.0, 2.0, 1.0, 3.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0], "bins": [-0.001148223876953125, -0.001118585467338562, -0.001088947057723999, -0.001059308648109436, -0.001029670238494873, -0.00100003182888031, -0.0009703934192657471, -0.0009407550096511841, -0.0009111166000366211, -0.0008814781904220581, -0.0008518397808074951, -0.0008222013711929321, -0.0007925629615783691, -0.0007629245519638062, -0.0007332861423492432, -0.0007036477327346802, -0.0006740093231201172, -0.0006443709135055542, -0.0006147325038909912, -0.0005850940942764282, -0.0005554556846618652, -0.0005258172750473022, -0.0004961788654327393, -0.00046654045581817627, -0.0004369020462036133, -0.0004072636365890503, -0.0003776252269744873, -0.0003479868173599243, -0.00031834840774536133, -0.00028870999813079834, -0.00025907158851623535, -0.00022943317890167236, -0.00019979476928710938, -0.0001701563596725464, -0.0001405179500579834, -0.00011087954044342041, -8.124113082885742e-05, -5.1602721214294434e-05, -2.1964311599731445e-05, 7.674098014831543e-06, 3.731250762939453e-05, 6.695091724395752e-05, 9.658932685852051e-05, 0.0001262277364730835, 0.00015586614608764648, 0.00018550455570220947, 0.00021514296531677246, 0.00024478137493133545, 0.00027441978454589844, 0.0003040581941604614, 0.0003336966037750244, 0.0003633350133895874, 0.0003929734230041504, 0.0004226118326187134, 0.00045225024223327637, 0.00048188865184783936, 0.0005115270614624023, 0.0005411654710769653, 0.0005708038806915283, 0.0006004422903060913, 0.0006300806999206543, 0.0006597191095352173, 0.0006893575191497803, 0.0007189959287643433, 0.0007486343383789062]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 6.0, 4.0, 6.0, 12.0, 7.0, 7.0, 22.0, 38.0, 37.0, 80.0, 94.0, 144.0, 273.0, 450.0, 710.0, 1216.0, 1957.0, 3494.0, 6121.0, 10480.0, 18771.0, 32422.0, 53738.0, 84763.0, 119102.0, 146564.0, 155415.0, 136580.0, 103453.0, 69798.0, 43231.0, 25057.0, 14672.0, 8264.0, 4801.0, 2680.0, 1576.0, 999.0, 563.0, 327.0, 222.0, 140.0, 77.0, 64.0, 41.0, 30.0, 22.0, 10.0, 7.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-7.5234375, -7.29034423828125, -7.0572509765625, -6.82415771484375, -6.591064453125, -6.35797119140625, -6.1248779296875, -5.89178466796875, -5.65869140625, -5.42559814453125, -5.1925048828125, -4.95941162109375, -4.726318359375, -4.49322509765625, -4.2601318359375, -4.02703857421875, -3.7939453125, -3.56085205078125, -3.3277587890625, -3.09466552734375, -2.861572265625, -2.62847900390625, -2.3953857421875, -2.16229248046875, -1.92919921875, -1.69610595703125, -1.4630126953125, -1.22991943359375, -0.996826171875, -0.76373291015625, -0.5306396484375, -0.29754638671875, -0.064453125, 0.16864013671875, 0.4017333984375, 0.63482666015625, 0.867919921875, 1.10101318359375, 1.3341064453125, 1.56719970703125, 1.80029296875, 2.03338623046875, 2.2664794921875, 2.49957275390625, 2.732666015625, 2.96575927734375, 3.1988525390625, 3.43194580078125, 3.6650390625, 3.89813232421875, 4.1312255859375, 4.36431884765625, 4.597412109375, 4.83050537109375, 5.0635986328125, 5.29669189453125, 5.52978515625, 5.76287841796875, 5.9959716796875, 6.22906494140625, 6.462158203125, 6.69525146484375, 6.9283447265625, 7.16143798828125, 7.39453125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 4.0, 9.0, 11.0, 7.0, 11.0, 21.0, 19.0, 28.0, 46.0, 35.0, 41.0, 58.0, 53.0, 57.0, 62.0, 68.0, 54.0, 61.0, 59.0, 52.0, 51.0, 44.0, 32.0, 21.0, 18.0, 13.0, 14.0, 8.0, 17.0, 7.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9375, -2.838714599609375, -2.73992919921875, -2.641143798828125, -2.5423583984375, -2.443572998046875, -2.34478759765625, -2.246002197265625, -2.147216796875, -2.048431396484375, -1.94964599609375, -1.850860595703125, -1.7520751953125, -1.653289794921875, -1.55450439453125, -1.455718994140625, -1.35693359375, -1.258148193359375, -1.15936279296875, -1.060577392578125, -0.9617919921875, -0.863006591796875, -0.76422119140625, -0.665435791015625, -0.566650390625, -0.467864990234375, -0.36907958984375, -0.270294189453125, -0.1715087890625, -0.072723388671875, 0.02606201171875, 0.124847412109375, 0.2236328125, 0.322418212890625, 0.42120361328125, 0.519989013671875, 0.6187744140625, 0.717559814453125, 0.81634521484375, 0.915130615234375, 1.013916015625, 1.112701416015625, 1.21148681640625, 1.310272216796875, 1.4090576171875, 1.507843017578125, 1.60662841796875, 1.705413818359375, 1.80419921875, 1.902984619140625, 2.00177001953125, 2.100555419921875, 2.1993408203125, 2.298126220703125, 2.39691162109375, 2.495697021484375, 2.594482421875, 2.693267822265625, 2.79205322265625, 2.890838623046875, 2.9896240234375, 3.088409423828125, 3.18719482421875, 3.285980224609375, 3.384765625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 8.0, 5.0, 14.0, 18.0, 18.0, 17.0, 19.0, 25.0, 42.0, 35.0, 34.0, 34.0, 39.0, 53.0, 49.0, 57.0, 61.0, 54.0, 49.0, 54.0, 52.0, 35.0, 37.0, 30.0, 28.0, 26.0, 15.0, 18.0, 9.0, 17.0, 13.0, 14.0, 7.0, 13.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.32432746887207, -19.636077880859375, -18.947826385498047, -18.25957679748535, -17.571327209472656, -16.88307762145996, -16.194828033447266, -15.506576538085938, -14.818326950073242, -14.130077362060547, -13.441826820373535, -12.753576278686523, -12.065326690673828, -11.377077102661133, -10.688826560974121, -10.00057601928711, -9.312326431274414, -8.624076843261719, -7.935826301574707, -7.2475762367248535, -6.559326171875, -5.8710761070251465, -5.182826042175293, -4.4945759773254395, -3.806325912475586, -3.1180758476257324, -2.429825782775879, -1.7415757179260254, -1.0533256530761719, -0.36507558822631836, 0.32317447662353516, 1.0114245414733887, 1.6996726989746094, 2.387922763824463, 3.0761728286743164, 3.76442289352417, 4.452672958374023, 5.140923023223877, 5.8291730880737305, 6.517423152923584, 7.2056732177734375, 7.893923282623291, 8.582173347473145, 9.270423889160156, 9.958673477172852, 10.646923065185547, 11.335173606872559, 12.02342414855957, 12.711673736572266, 13.399923324584961, 14.088173866271973, 14.776424407958984, 15.46467399597168, 16.152923583984375, 16.841175079345703, 17.5294246673584, 18.217674255371094, 18.90592384338379, 19.594173431396484, 20.282424926757812, 20.970674514770508, 21.658924102783203, 22.34717559814453, 23.035425186157227, 23.723674774169922]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 4.0, 8.0, 4.0, 16.0, 16.0, 12.0, 15.0, 12.0, 15.0, 24.0, 17.0, 21.0, 25.0, 35.0, 36.0, 33.0, 36.0, 45.0, 33.0, 42.0, 34.0, 37.0, 39.0, 39.0, 38.0, 42.0, 25.0, 23.0, 37.0, 25.0, 26.0, 29.0, 14.0, 17.0, 17.0, 17.0, 16.0, 15.0, 19.0, 8.0, 6.0, 4.0, 9.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-18.89996337890625, -18.314741134643555, -17.729520797729492, -17.144298553466797, -16.559078216552734, -15.973855972290039, -15.38863468170166, -14.803413391113281, -14.218192100524902, -13.632970809936523, -13.047749519348145, -12.462528228759766, -11.87730598449707, -11.292085647583008, -10.706863403320312, -10.121642112731934, -9.536420822143555, -8.951199531555176, -8.365978240966797, -7.78075647354126, -7.195535182952881, -6.610313892364502, -6.025092124938965, -5.439870834350586, -4.854649543762207, -4.269428253173828, -3.68420672416687, -3.098985195159912, -2.513763904571533, -1.9285426139831543, -1.3433210849761963, -0.7580995559692383, -0.17287635803222656, 0.4123450517654419, 0.9975664615631104, 1.5827878713607788, 2.1680092811584473, 2.753230571746826, 3.338452100753784, 3.923673629760742, 4.508894920349121, 5.0941162109375, 5.679337501525879, 6.264559268951416, 6.849780559539795, 7.435001850128174, 8.020223617553711, 8.60544490814209, 9.190666198730469, 9.775887489318848, 10.361108779907227, 10.946330070495605, 11.531551361083984, 12.11677360534668, 12.701994895935059, 13.287216186523438, 13.872437477111816, 14.457658767700195, 15.042880058288574, 15.628101348876953, 16.21332359313965, 16.79854393005371, 17.383766174316406, 17.96898651123047, 18.554208755493164]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 8.0, 7.0, 10.0, 25.0, 55.0, 71.0, 86.0, 155.0, 251.0, 397.0, 662.0, 1110.0, 1736.0, 2838.0, 4573.0, 7474.0, 12383.0, 20919.0, 35206.0, 59539.0, 100183.0, 170675.0, 283082.0, 445579.0, 619145.0, 696907.0, 611887.0, 437287.0, 274901.0, 165528.0, 97694.0, 57818.0, 34462.0, 20601.0, 12250.0, 7373.0, 4614.0, 2699.0, 1596.0, 969.0, 610.0, 369.0, 220.0, 139.0, 87.0, 49.0, 26.0, 14.0, 6.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.109375, -18.52099609375, -17.9326171875, -17.34423828125, -16.755859375, -16.16748046875, -15.5791015625, -14.99072265625, -14.40234375, -13.81396484375, -13.2255859375, -12.63720703125, -12.048828125, -11.46044921875, -10.8720703125, -10.28369140625, -9.6953125, -9.10693359375, -8.5185546875, -7.93017578125, -7.341796875, -6.75341796875, -6.1650390625, -5.57666015625, -4.98828125, -4.39990234375, -3.8115234375, -3.22314453125, -2.634765625, -2.04638671875, -1.4580078125, -0.86962890625, -0.28125, 0.30712890625, 0.8955078125, 1.48388671875, 2.072265625, 2.66064453125, 3.2490234375, 3.83740234375, 4.42578125, 5.01416015625, 5.6025390625, 6.19091796875, 6.779296875, 7.36767578125, 7.9560546875, 8.54443359375, 9.1328125, 9.72119140625, 10.3095703125, 10.89794921875, 11.486328125, 12.07470703125, 12.6630859375, 13.25146484375, 13.83984375, 14.42822265625, 15.0166015625, 15.60498046875, 16.193359375, 16.78173828125, 17.3701171875, 17.95849609375, 18.546875]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 4.0, 6.0, 5.0, 3.0, 9.0, 13.0, 15.0, 17.0, 10.0, 15.0, 11.0, 26.0, 21.0, 34.0, 31.0, 28.0, 24.0, 32.0, 33.0, 39.0, 44.0, 46.0, 38.0, 28.0, 38.0, 40.0, 43.0, 31.0, 34.0, 36.0, 28.0, 20.0, 14.0, 27.0, 25.0, 13.0, 20.0, 18.0, 19.0, 11.0, 9.0, 11.0, 8.0, 6.0, 3.0, 6.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-15.0859375, -14.6158447265625, -14.145751953125, -13.6756591796875, -13.20556640625, -12.7354736328125, -12.265380859375, -11.7952880859375, -11.3251953125, -10.8551025390625, -10.385009765625, -9.9149169921875, -9.44482421875, -8.9747314453125, -8.504638671875, -8.0345458984375, -7.564453125, -7.0943603515625, -6.624267578125, -6.1541748046875, -5.68408203125, -5.2139892578125, -4.743896484375, -4.2738037109375, -3.8037109375, -3.3336181640625, -2.863525390625, -2.3934326171875, -1.92333984375, -1.4532470703125, -0.983154296875, -0.5130615234375, -0.04296875, 0.4271240234375, 0.897216796875, 1.3673095703125, 1.83740234375, 2.3074951171875, 2.777587890625, 3.2476806640625, 3.7177734375, 4.1878662109375, 4.657958984375, 5.1280517578125, 5.59814453125, 6.0682373046875, 6.538330078125, 7.0084228515625, 7.478515625, 7.9486083984375, 8.418701171875, 8.8887939453125, 9.35888671875, 9.8289794921875, 10.299072265625, 10.7691650390625, 11.2392578125, 11.7093505859375, 12.179443359375, 12.6495361328125, 13.11962890625, 13.5897216796875, 14.059814453125, 14.5299072265625, 15.0]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 8.0, 20.0, 24.0, 34.0, 59.0, 73.0, 128.0, 171.0, 278.0, 422.0, 573.0, 945.0, 1440.0, 2305.0, 3591.0, 5606.0, 8694.0, 13855.0, 22372.0, 36357.0, 58471.0, 93750.0, 149300.0, 232063.0, 345221.0, 475348.0, 578396.0, 592371.0, 501788.0, 374573.0, 254182.0, 165496.0, 104468.0, 64737.0, 40060.0, 24898.0, 15522.0, 9627.0, 6068.0, 3861.0, 2562.0, 1625.0, 986.0, 655.0, 444.0, 298.0, 221.0, 105.0, 76.0, 60.0, 31.0, 17.0, 15.0, 15.0, 11.0, 5.0, 2.0], "bins": [-16.984375, -16.4864501953125, -15.988525390625, -15.4906005859375, -14.99267578125, -14.4947509765625, -13.996826171875, -13.4989013671875, -13.0009765625, -12.5030517578125, -12.005126953125, -11.5072021484375, -11.00927734375, -10.5113525390625, -10.013427734375, -9.5155029296875, -9.017578125, -8.5196533203125, -8.021728515625, -7.5238037109375, -7.02587890625, -6.5279541015625, -6.030029296875, -5.5321044921875, -5.0341796875, -4.5362548828125, -4.038330078125, -3.5404052734375, -3.04248046875, -2.5445556640625, -2.046630859375, -1.5487060546875, -1.05078125, -0.5528564453125, -0.054931640625, 0.4429931640625, 0.94091796875, 1.4388427734375, 1.936767578125, 2.4346923828125, 2.9326171875, 3.4305419921875, 3.928466796875, 4.4263916015625, 4.92431640625, 5.4222412109375, 5.920166015625, 6.4180908203125, 6.916015625, 7.4139404296875, 7.911865234375, 8.4097900390625, 8.90771484375, 9.4056396484375, 9.903564453125, 10.4014892578125, 10.8994140625, 11.3973388671875, 11.895263671875, 12.3931884765625, 12.89111328125, 13.3890380859375, 13.886962890625, 14.3848876953125, 14.8828125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 3.0, 4.0, 9.0, 5.0, 11.0, 12.0, 19.0, 33.0, 43.0, 41.0, 53.0, 72.0, 83.0, 99.0, 125.0, 141.0, 164.0, 184.0, 209.0, 181.0, 239.0, 257.0, 236.0, 210.0, 205.0, 222.0, 180.0, 171.0, 146.0, 115.0, 111.0, 91.0, 70.0, 72.0, 47.0, 48.0, 38.0, 25.0, 25.0, 17.0, 10.0, 16.0, 6.0, 8.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.828125, -6.60186767578125, -6.3756103515625, -6.14935302734375, -5.923095703125, -5.69683837890625, -5.4705810546875, -5.24432373046875, -5.01806640625, -4.79180908203125, -4.5655517578125, -4.33929443359375, -4.113037109375, -3.88677978515625, -3.6605224609375, -3.43426513671875, -3.2080078125, -2.98175048828125, -2.7554931640625, -2.52923583984375, -2.302978515625, -2.07672119140625, -1.8504638671875, -1.62420654296875, -1.39794921875, -1.17169189453125, -0.9454345703125, -0.71917724609375, -0.492919921875, -0.26666259765625, -0.0404052734375, 0.18585205078125, 0.412109375, 0.63836669921875, 0.8646240234375, 1.09088134765625, 1.317138671875, 1.54339599609375, 1.7696533203125, 1.99591064453125, 2.22216796875, 2.44842529296875, 2.6746826171875, 2.90093994140625, 3.127197265625, 3.35345458984375, 3.5797119140625, 3.80596923828125, 4.0322265625, 4.25848388671875, 4.4847412109375, 4.71099853515625, 4.937255859375, 5.16351318359375, 5.3897705078125, 5.61602783203125, 5.84228515625, 6.06854248046875, 6.2947998046875, 6.52105712890625, 6.747314453125, 6.97357177734375, 7.1998291015625, 7.42608642578125, 7.65234375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 9.0, 6.0, 12.0, 15.0, 10.0, 18.0, 23.0, 25.0, 34.0, 29.0, 29.0, 41.0, 31.0, 35.0, 47.0, 65.0, 41.0, 46.0, 52.0, 39.0, 36.0, 33.0, 46.0, 37.0, 36.0, 24.0, 22.0, 24.0, 25.0, 21.0, 22.0, 7.0, 12.0, 5.0, 11.0, 3.0, 4.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.0733642578125, -17.490182876586914, -16.907001495361328, -16.323822021484375, -15.740640640258789, -15.157459259033203, -14.574277877807617, -13.991097450256348, -13.407917022705078, -12.824735641479492, -12.241555213928223, -11.658373832702637, -11.075193405151367, -10.492012023925781, -9.908830642700195, -9.325650215148926, -8.74246883392334, -8.159287452697754, -7.576107025146484, -6.992925643920898, -6.409745216369629, -5.826563835144043, -5.243382930755615, -4.6602020263671875, -4.07702112197876, -3.493840217590332, -2.9106593132019043, -2.3274781703948975, -1.7442972660064697, -1.161116361618042, -0.5779352188110352, 0.005245685577392578, 0.5884265899658203, 1.171607494354248, 1.7547885179519653, 2.3379695415496826, 2.9211504459381104, 3.504331350326538, 4.087512493133545, 4.670693397521973, 5.2538743019104, 5.837055206298828, 6.420236110687256, 7.003417015075684, 7.5865983963012695, 8.169778823852539, 8.752960205078125, 9.336141586303711, 9.91932201385498, 10.502503395080566, 11.085683822631836, 11.668865203857422, 12.252045631408691, 12.835227012634277, 13.418407440185547, 14.001588821411133, 14.584770202636719, 15.167951583862305, 15.751132011413574, 16.334312438964844, 16.91749382019043, 17.500675201416016, 18.0838565826416, 18.667037963867188, 19.25021743774414]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 8.0, 2.0, 6.0, 5.0, 11.0, 10.0, 13.0, 17.0, 13.0, 18.0, 23.0, 22.0, 22.0, 28.0, 24.0, 34.0, 38.0, 35.0, 34.0, 49.0, 43.0, 43.0, 34.0, 27.0, 32.0, 30.0, 32.0, 37.0, 36.0, 35.0, 25.0, 28.0, 23.0, 22.0, 21.0, 21.0, 14.0, 19.0, 9.0, 11.0, 11.0, 14.0, 7.0, 3.0, 1.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-17.57736587524414, -17.02031898498535, -16.463272094726562, -15.906224250793457, -15.349177360534668, -14.792129516601562, -14.235082626342773, -13.678035736083984, -13.120988845825195, -12.563941955566406, -12.0068941116333, -11.449847221374512, -10.892800331115723, -10.335752487182617, -9.778705596923828, -9.221658706665039, -8.664610862731934, -8.107563972473145, -7.550516605377197, -6.99346923828125, -6.436422348022461, -5.879374980926514, -5.322327613830566, -4.765280723571777, -4.20823335647583, -3.651186227798462, -3.0941390991210938, -2.5370917320251465, -1.9800446033477783, -1.4229974746704102, -0.8659501075744629, -0.3089029788970947, 0.24814414978027344, 0.8051913380622864, 1.3622385263442993, 1.919285774230957, 2.476332902908325, 3.0333800315856934, 3.5904273986816406, 4.14747428894043, 4.704521656036377, 5.261569023132324, 5.818615913391113, 6.3756632804870605, 6.932710647583008, 7.489757537841797, 8.046804428100586, 8.603852272033691, 9.16089916229248, 9.71794605255127, 10.274993896484375, 10.832040786743164, 11.389087677001953, 11.946134567260742, 12.503182411193848, 13.060229301452637, 13.617277145385742, 14.174324035644531, 14.731371879577637, 15.288418769836426, 15.845465660095215, 16.40251350402832, 16.95956039428711, 17.5166072845459, 18.073654174804688]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 10.0, 8.0, 12.0, 18.0, 38.0, 60.0, 66.0, 107.0, 205.0, 317.0, 445.0, 688.0, 1101.0, 1583.0, 2395.0, 3514.0, 5385.0, 7930.0, 11475.0, 16505.0, 23473.0, 33537.0, 45768.0, 61740.0, 80276.0, 98271.0, 111247.0, 113128.0, 102871.0, 85922.0, 67678.0, 50867.0, 36984.0, 26197.0, 18695.0, 12980.0, 8850.0, 6121.0, 4066.0, 2712.0, 1827.0, 1207.0, 789.0, 521.0, 352.0, 219.0, 129.0, 86.0, 73.0, 43.0, 24.0, 12.0, 16.0, 15.0, 4.0, 4.0, 4.0, 1.0], "bins": [-21.890625, -21.23046875, -20.5703125, -19.91015625, -19.25, -18.58984375, -17.9296875, -17.26953125, -16.609375, -15.94921875, -15.2890625, -14.62890625, -13.96875, -13.30859375, -12.6484375, -11.98828125, -11.328125, -10.66796875, -10.0078125, -9.34765625, -8.6875, -8.02734375, -7.3671875, -6.70703125, -6.046875, -5.38671875, -4.7265625, -4.06640625, -3.40625, -2.74609375, -2.0859375, -1.42578125, -0.765625, -0.10546875, 0.5546875, 1.21484375, 1.875, 2.53515625, 3.1953125, 3.85546875, 4.515625, 5.17578125, 5.8359375, 6.49609375, 7.15625, 7.81640625, 8.4765625, 9.13671875, 9.796875, 10.45703125, 11.1171875, 11.77734375, 12.4375, 13.09765625, 13.7578125, 14.41796875, 15.078125, 15.73828125, 16.3984375, 17.05859375, 17.71875, 18.37890625, 19.0390625, 19.69921875, 20.359375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 0.0, 1.0, 4.0, 4.0, 5.0, 6.0, 2.0, 7.0, 14.0, 10.0, 9.0, 16.0, 12.0, 20.0, 17.0, 28.0, 25.0, 32.0, 27.0, 34.0, 39.0, 29.0, 42.0, 42.0, 27.0, 44.0, 36.0, 29.0, 29.0, 35.0, 21.0, 32.0, 39.0, 34.0, 34.0, 29.0, 27.0, 30.0, 11.0, 20.0, 10.0, 20.0, 16.0, 9.0, 12.0, 3.0, 7.0, 4.0, 7.0, 11.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-13.3359375, -12.94921875, -12.5625, -12.17578125, -11.7890625, -11.40234375, -11.015625, -10.62890625, -10.2421875, -9.85546875, -9.46875, -9.08203125, -8.6953125, -8.30859375, -7.921875, -7.53515625, -7.1484375, -6.76171875, -6.375, -5.98828125, -5.6015625, -5.21484375, -4.828125, -4.44140625, -4.0546875, -3.66796875, -3.28125, -2.89453125, -2.5078125, -2.12109375, -1.734375, -1.34765625, -0.9609375, -0.57421875, -0.1875, 0.19921875, 0.5859375, 0.97265625, 1.359375, 1.74609375, 2.1328125, 2.51953125, 2.90625, 3.29296875, 3.6796875, 4.06640625, 4.453125, 4.83984375, 5.2265625, 5.61328125, 6.0, 6.38671875, 6.7734375, 7.16015625, 7.546875, 7.93359375, 8.3203125, 8.70703125, 9.09375, 9.48046875, 9.8671875, 10.25390625, 10.640625, 11.02734375, 11.4140625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 14.0, 24.0, 17.0, 60.0, 57.0, 112.0, 158.0, 280.0, 413.0, 713.0, 1202.0, 2157.0, 3771.0, 6820.0, 12036.0, 22042.0, 40751.0, 75614.0, 137072.0, 215294.0, 218507.0, 140145.0, 78070.0, 41944.0, 22671.0, 12357.0, 6925.0, 3855.0, 2220.0, 1315.0, 724.0, 431.0, 299.0, 168.0, 132.0, 71.0, 46.0, 23.0, 15.0, 12.0, 10.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.8125, -45.3505859375, -43.888671875, -42.4267578125, -40.96484375, -39.5029296875, -38.041015625, -36.5791015625, -35.1171875, -33.6552734375, -32.193359375, -30.7314453125, -29.26953125, -27.8076171875, -26.345703125, -24.8837890625, -23.421875, -21.9599609375, -20.498046875, -19.0361328125, -17.57421875, -16.1123046875, -14.650390625, -13.1884765625, -11.7265625, -10.2646484375, -8.802734375, -7.3408203125, -5.87890625, -4.4169921875, -2.955078125, -1.4931640625, -0.03125, 1.4306640625, 2.892578125, 4.3544921875, 5.81640625, 7.2783203125, 8.740234375, 10.2021484375, 11.6640625, 13.1259765625, 14.587890625, 16.0498046875, 17.51171875, 18.9736328125, 20.435546875, 21.8974609375, 23.359375, 24.8212890625, 26.283203125, 27.7451171875, 29.20703125, 30.6689453125, 32.130859375, 33.5927734375, 35.0546875, 36.5166015625, 37.978515625, 39.4404296875, 40.90234375, 42.3642578125, 43.826171875, 45.2880859375, 46.75]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 7.0, 11.0, 17.0, 14.0, 15.0, 22.0, 8.0, 24.0, 27.0, 31.0, 29.0, 24.0, 53.0, 42.0, 61.0, 53.0, 52.0, 50.0, 54.0, 36.0, 42.0, 40.0, 41.0, 37.0, 30.0, 28.0, 35.0, 23.0, 16.0, 13.0, 11.0, 7.0, 7.0, 6.0, 7.0, 7.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.5390625, -14.103759765625, -13.66845703125, -13.233154296875, -12.7978515625, -12.362548828125, -11.92724609375, -11.491943359375, -11.056640625, -10.621337890625, -10.18603515625, -9.750732421875, -9.3154296875, -8.880126953125, -8.44482421875, -8.009521484375, -7.57421875, -7.138916015625, -6.70361328125, -6.268310546875, -5.8330078125, -5.397705078125, -4.96240234375, -4.527099609375, -4.091796875, -3.656494140625, -3.22119140625, -2.785888671875, -2.3505859375, -1.915283203125, -1.47998046875, -1.044677734375, -0.609375, -0.174072265625, 0.26123046875, 0.696533203125, 1.1318359375, 1.567138671875, 2.00244140625, 2.437744140625, 2.873046875, 3.308349609375, 3.74365234375, 4.178955078125, 4.6142578125, 5.049560546875, 5.48486328125, 5.920166015625, 6.35546875, 6.790771484375, 7.22607421875, 7.661376953125, 8.0966796875, 8.531982421875, 8.96728515625, 9.402587890625, 9.837890625, 10.273193359375, 10.70849609375, 11.143798828125, 11.5791015625, 12.014404296875, 12.44970703125, 12.885009765625, 13.3203125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 6.0, 17.0, 16.0, 25.0, 38.0, 32.0, 54.0, 81.0, 98.0, 126.0, 223.0, 313.0, 495.0, 753.0, 1230.0, 2167.0, 4318.0, 8899.0, 21336.0, 59754.0, 197683.0, 425913.0, 217296.0, 65191.0, 22705.0, 9443.0, 4424.0, 2233.0, 1273.0, 844.0, 501.0, 346.0, 216.0, 150.0, 93.0, 57.0, 60.0, 30.0, 30.0, 19.0, 18.0, 10.0, 7.0, 8.0, 2.0, 5.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-28.34375, -27.445068359375, -26.54638671875, -25.647705078125, -24.7490234375, -23.850341796875, -22.95166015625, -22.052978515625, -21.154296875, -20.255615234375, -19.35693359375, -18.458251953125, -17.5595703125, -16.660888671875, -15.76220703125, -14.863525390625, -13.96484375, -13.066162109375, -12.16748046875, -11.268798828125, -10.3701171875, -9.471435546875, -8.57275390625, -7.674072265625, -6.775390625, -5.876708984375, -4.97802734375, -4.079345703125, -3.1806640625, -2.281982421875, -1.38330078125, -0.484619140625, 0.4140625, 1.312744140625, 2.21142578125, 3.110107421875, 4.0087890625, 4.907470703125, 5.80615234375, 6.704833984375, 7.603515625, 8.502197265625, 9.40087890625, 10.299560546875, 11.1982421875, 12.096923828125, 12.99560546875, 13.894287109375, 14.79296875, 15.691650390625, 16.59033203125, 17.489013671875, 18.3876953125, 19.286376953125, 20.18505859375, 21.083740234375, 21.982421875, 22.881103515625, 23.77978515625, 24.678466796875, 25.5771484375, 26.475830078125, 27.37451171875, 28.273193359375, 29.171875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 5.0, 7.0, 11.0, 16.0, 21.0, 22.0, 25.0, 36.0, 52.0, 63.0, 95.0, 126.0, 120.0, 94.0, 77.0, 62.0, 48.0, 30.0, 25.0, 14.0, 11.0, 12.0, 8.0, 3.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0026645660400390625, -0.002589315176010132, -0.002514064311981201, -0.0024388134479522705, -0.00236356258392334, -0.002288311719894409, -0.0022130608558654785, -0.002137809991836548, -0.002062559127807617, -0.0019873082637786865, -0.0019120573997497559, -0.0018368065357208252, -0.0017615556716918945, -0.0016863048076629639, -0.0016110539436340332, -0.0015358030796051025, -0.0014605522155761719, -0.0013853013515472412, -0.0013100504875183105, -0.0012347996234893799, -0.0011595487594604492, -0.0010842978954315186, -0.0010090470314025879, -0.0009337961673736572, -0.0008585453033447266, -0.0007832944393157959, -0.0007080435752868652, -0.0006327927112579346, -0.0005575418472290039, -0.00048229098320007324, -0.0004070401191711426, -0.0003317892551422119, -0.00025653839111328125, -0.00018128752708435059, -0.00010603666305541992, -3.078579902648926e-05, 4.4465065002441406e-05, 0.00011971592903137207, 0.00019496679306030273, 0.0002702176570892334, 0.00034546852111816406, 0.0004207193851470947, 0.0004959702491760254, 0.0005712211132049561, 0.0006464719772338867, 0.0007217228412628174, 0.000796973705291748, 0.0008722245693206787, 0.0009474754333496094, 0.00102272629737854, 0.0010979771614074707, 0.0011732280254364014, 0.001248478889465332, 0.0013237297534942627, 0.0013989806175231934, 0.001474231481552124, 0.0015494823455810547, 0.0016247332096099854, 0.001699984073638916, 0.0017752349376678467, 0.0018504858016967773, 0.001925736665725708, 0.0020009875297546387, 0.0020762383937835693, 0.0021514892578125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 6.0, 12.0, 17.0, 17.0, 19.0, 30.0, 37.0, 44.0, 67.0, 102.0, 153.0, 198.0, 282.0, 411.0, 547.0, 881.0, 1456.0, 2524.0, 4694.0, 8717.0, 17338.0, 36902.0, 78026.0, 153175.0, 236175.0, 227049.0, 141639.0, 70967.0, 32848.0, 15812.0, 7856.0, 4035.0, 2322.0, 1371.0, 858.0, 575.0, 376.0, 297.0, 215.0, 137.0, 89.0, 76.0, 56.0, 37.0, 18.0, 27.0, 14.0, 13.0, 8.0, 10.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0], "bins": [-16.859375, -16.347412109375, -15.83544921875, -15.323486328125, -14.8115234375, -14.299560546875, -13.78759765625, -13.275634765625, -12.763671875, -12.251708984375, -11.73974609375, -11.227783203125, -10.7158203125, -10.203857421875, -9.69189453125, -9.179931640625, -8.66796875, -8.156005859375, -7.64404296875, -7.132080078125, -6.6201171875, -6.108154296875, -5.59619140625, -5.084228515625, -4.572265625, -4.060302734375, -3.54833984375, -3.036376953125, -2.5244140625, -2.012451171875, -1.50048828125, -0.988525390625, -0.4765625, 0.035400390625, 0.54736328125, 1.059326171875, 1.5712890625, 2.083251953125, 2.59521484375, 3.107177734375, 3.619140625, 4.131103515625, 4.64306640625, 5.155029296875, 5.6669921875, 6.178955078125, 6.69091796875, 7.202880859375, 7.71484375, 8.226806640625, 8.73876953125, 9.250732421875, 9.7626953125, 10.274658203125, 10.78662109375, 11.298583984375, 11.810546875, 12.322509765625, 12.83447265625, 13.346435546875, 13.8583984375, 14.370361328125, 14.88232421875, 15.394287109375, 15.90625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 18.0, 13.0, 16.0, 17.0, 29.0, 43.0, 49.0, 63.0, 65.0, 74.0, 83.0, 93.0, 88.0, 72.0, 59.0, 57.0, 45.0, 21.0, 23.0, 17.0, 16.0, 10.0, 11.0, 6.0, 7.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.796875, -7.58685302734375, -7.3768310546875, -7.16680908203125, -6.956787109375, -6.74676513671875, -6.5367431640625, -6.32672119140625, -6.11669921875, -5.90667724609375, -5.6966552734375, -5.48663330078125, -5.276611328125, -5.06658935546875, -4.8565673828125, -4.64654541015625, -4.4365234375, -4.22650146484375, -4.0164794921875, -3.80645751953125, -3.596435546875, -3.38641357421875, -3.1763916015625, -2.96636962890625, -2.75634765625, -2.54632568359375, -2.3363037109375, -2.12628173828125, -1.916259765625, -1.70623779296875, -1.4962158203125, -1.28619384765625, -1.076171875, -0.86614990234375, -0.6561279296875, -0.44610595703125, -0.236083984375, -0.02606201171875, 0.1839599609375, 0.39398193359375, 0.60400390625, 0.81402587890625, 1.0240478515625, 1.23406982421875, 1.444091796875, 1.65411376953125, 1.8641357421875, 2.07415771484375, 2.2841796875, 2.49420166015625, 2.7042236328125, 2.91424560546875, 3.124267578125, 3.33428955078125, 3.5443115234375, 3.75433349609375, 3.96435546875, 4.17437744140625, 4.3843994140625, 4.59442138671875, 4.804443359375, 5.01446533203125, 5.2244873046875, 5.43450927734375, 5.64453125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 6.0, 9.0, 5.0, 10.0, 13.0, 8.0, 16.0, 12.0, 18.0, 29.0, 26.0, 28.0, 32.0, 44.0, 34.0, 35.0, 37.0, 33.0, 51.0, 40.0, 39.0, 43.0, 40.0, 41.0, 33.0, 47.0, 31.0, 26.0, 28.0, 26.0, 28.0, 13.0, 13.0, 15.0, 16.0, 12.0, 7.0, 7.0, 8.0, 8.0, 4.0, 6.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-11.777668952941895, -11.38436222076416, -10.991055488586426, -10.597749710083008, -10.204442977905273, -9.811136245727539, -9.417829513549805, -9.02452278137207, -8.631216049194336, -8.237909317016602, -7.844603061676025, -7.451296329498291, -7.057990074157715, -6.6646833419799805, -6.271376609802246, -5.878069877624512, -5.484764099121094, -5.091457366943359, -4.698151111602783, -4.304844379425049, -3.9115378856658936, -3.5182313919067383, -3.124924659729004, -2.7316181659698486, -2.3383116722106934, -1.945005178451538, -1.5516985654830933, -1.1583919525146484, -0.7650854587554932, -0.3717789649963379, 0.021527767181396484, 0.41483426094055176, 0.8081417083740234, 1.2014482021331787, 1.5947548151016235, 1.9880614280700684, 2.3813679218292236, 2.774674415588379, 3.1679811477661133, 3.5612876415252686, 3.954594135284424, 4.347900867462158, 4.741207122802734, 5.134513854980469, 5.527820587158203, 5.921126842498779, 6.314433574676514, 6.70773983001709, 7.101046562194824, 7.494353294372559, 7.887659549713135, 8.280965805053711, 8.674272537231445, 9.06757926940918, 9.460886001586914, 9.854192733764648, 10.247499465942383, 10.640806198120117, 11.034112930297852, 11.427419662475586, 11.820725440979004, 12.214032173156738, 12.607338905334473, 13.000645637512207, 13.393951416015625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 8.0, 11.0, 10.0, 8.0, 9.0, 13.0, 13.0, 15.0, 17.0, 21.0, 18.0, 28.0, 23.0, 27.0, 32.0, 26.0, 35.0, 29.0, 39.0, 34.0, 35.0, 33.0, 35.0, 36.0, 38.0, 32.0, 21.0, 32.0, 25.0, 22.0, 28.0, 34.0, 25.0, 33.0, 22.0, 13.0, 19.0, 16.0, 16.0, 12.0, 6.0, 8.0, 5.0, 10.0, 6.0, 5.0, 1.0, 2.0, 2.0, 7.0, 2.0, 3.0], "bins": [-12.982728958129883, -12.602767944335938, -12.222805976867676, -11.84284496307373, -11.462882995605469, -11.082921981811523, -10.702960968017578, -10.322999954223633, -9.943037986755371, -9.563076972961426, -9.183115005493164, -8.803153991699219, -8.423192977905273, -8.043231010437012, -7.663269996643066, -7.283308506011963, -6.903347015380859, -6.523385524749756, -6.143424034118652, -5.763463020324707, -5.3835015296936035, -5.0035400390625, -4.623579025268555, -4.243617534637451, -3.8636560440063477, -3.483694553375244, -3.1037333011627197, -2.7237720489501953, -2.343810558319092, -1.9638491868972778, -1.5838878154754639, -1.2039265632629395, -0.8239660263061523, -0.4440046548843384, -0.06404328346252441, 0.31591808795928955, 0.6958794593811035, 1.0758408308029175, 1.4558022022247314, 1.8357634544372559, 2.2157249450683594, 2.595686435699463, 2.9756476879119873, 3.3556089401245117, 3.7355704307556152, 4.115531921386719, 4.495492935180664, 4.875454425811768, 5.255415916442871, 5.635377407073975, 6.015338897705078, 6.395299911499023, 6.775261402130127, 7.1552228927612305, 7.535183906555176, 7.915145397186279, 8.295106887817383, 8.675067901611328, 9.05502986907959, 9.434990882873535, 9.814952850341797, 10.194913864135742, 10.574874877929688, 10.954835891723633, 11.334797859191895]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 8.0, 7.0, 20.0, 20.0, 38.0, 40.0, 109.0, 139.0, 212.0, 346.0, 581.0, 993.0, 1559.0, 2709.0, 4490.0, 7481.0, 12446.0, 20506.0, 32965.0, 50519.0, 74672.0, 101066.0, 124299.0, 135564.0, 129282.0, 109704.0, 82452.0, 57587.0, 38035.0, 23805.0, 14735.0, 8876.0, 5354.0, 3160.0, 1942.0, 1109.0, 690.0, 380.0, 261.0, 149.0, 104.0, 53.0, 32.0, 26.0, 15.0, 8.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.109375, -9.7900390625, -9.470703125, -9.1513671875, -8.83203125, -8.5126953125, -8.193359375, -7.8740234375, -7.5546875, -7.2353515625, -6.916015625, -6.5966796875, -6.27734375, -5.9580078125, -5.638671875, -5.3193359375, -5.0, -4.6806640625, -4.361328125, -4.0419921875, -3.72265625, -3.4033203125, -3.083984375, -2.7646484375, -2.4453125, -2.1259765625, -1.806640625, -1.4873046875, -1.16796875, -0.8486328125, -0.529296875, -0.2099609375, 0.109375, 0.4287109375, 0.748046875, 1.0673828125, 1.38671875, 1.7060546875, 2.025390625, 2.3447265625, 2.6640625, 2.9833984375, 3.302734375, 3.6220703125, 3.94140625, 4.2607421875, 4.580078125, 4.8994140625, 5.21875, 5.5380859375, 5.857421875, 6.1767578125, 6.49609375, 6.8154296875, 7.134765625, 7.4541015625, 7.7734375, 8.0927734375, 8.412109375, 8.7314453125, 9.05078125, 9.3701171875, 9.689453125, 10.0087890625, 10.328125]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 6.0, 7.0, 7.0, 10.0, 11.0, 10.0, 13.0, 20.0, 19.0, 13.0, 27.0, 27.0, 24.0, 24.0, 27.0, 30.0, 44.0, 42.0, 32.0, 33.0, 42.0, 29.0, 35.0, 37.0, 32.0, 32.0, 35.0, 31.0, 40.0, 36.0, 28.0, 26.0, 25.0, 22.0, 21.0, 16.0, 14.0, 14.0, 13.0, 5.0, 8.0, 8.0, 7.0, 4.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0], "bins": [-14.625, -14.215087890625, -13.80517578125, -13.395263671875, -12.9853515625, -12.575439453125, -12.16552734375, -11.755615234375, -11.345703125, -10.935791015625, -10.52587890625, -10.115966796875, -9.7060546875, -9.296142578125, -8.88623046875, -8.476318359375, -8.06640625, -7.656494140625, -7.24658203125, -6.836669921875, -6.4267578125, -6.016845703125, -5.60693359375, -5.197021484375, -4.787109375, -4.377197265625, -3.96728515625, -3.557373046875, -3.1474609375, -2.737548828125, -2.32763671875, -1.917724609375, -1.5078125, -1.097900390625, -0.68798828125, -0.278076171875, 0.1318359375, 0.541748046875, 0.95166015625, 1.361572265625, 1.771484375, 2.181396484375, 2.59130859375, 3.001220703125, 3.4111328125, 3.821044921875, 4.23095703125, 4.640869140625, 5.05078125, 5.460693359375, 5.87060546875, 6.280517578125, 6.6904296875, 7.100341796875, 7.51025390625, 7.920166015625, 8.330078125, 8.739990234375, 9.14990234375, 9.559814453125, 9.9697265625, 10.379638671875, 10.78955078125, 11.199462890625, 11.609375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 9.0, 15.0, 20.0, 22.0, 34.0, 65.0, 79.0, 114.0, 179.0, 314.0, 473.0, 760.0, 1100.0, 1817.0, 2936.0, 4741.0, 7326.0, 11553.0, 18384.0, 28087.0, 42205.0, 62294.0, 85804.0, 110040.0, 126134.0, 127988.0, 115815.0, 93354.0, 69562.0, 48006.0, 32053.0, 20723.0, 13328.0, 8476.0, 5478.0, 3341.0, 2115.0, 1419.0, 871.0, 554.0, 323.0, 212.0, 128.0, 104.0, 73.0, 43.0, 28.0, 19.0, 12.0, 8.0, 9.0, 3.0, 5.0, 4.0, 2.0, 3.0], "bins": [-12.109375, -11.744140625, -11.37890625, -11.013671875, -10.6484375, -10.283203125, -9.91796875, -9.552734375, -9.1875, -8.822265625, -8.45703125, -8.091796875, -7.7265625, -7.361328125, -6.99609375, -6.630859375, -6.265625, -5.900390625, -5.53515625, -5.169921875, -4.8046875, -4.439453125, -4.07421875, -3.708984375, -3.34375, -2.978515625, -2.61328125, -2.248046875, -1.8828125, -1.517578125, -1.15234375, -0.787109375, -0.421875, -0.056640625, 0.30859375, 0.673828125, 1.0390625, 1.404296875, 1.76953125, 2.134765625, 2.5, 2.865234375, 3.23046875, 3.595703125, 3.9609375, 4.326171875, 4.69140625, 5.056640625, 5.421875, 5.787109375, 6.15234375, 6.517578125, 6.8828125, 7.248046875, 7.61328125, 7.978515625, 8.34375, 8.708984375, 9.07421875, 9.439453125, 9.8046875, 10.169921875, 10.53515625, 10.900390625, 11.265625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 8.0, 12.0, 3.0, 9.0, 12.0, 14.0, 19.0, 15.0, 25.0, 20.0, 37.0, 32.0, 37.0, 40.0, 39.0, 48.0, 43.0, 55.0, 47.0, 56.0, 54.0, 39.0, 34.0, 43.0, 42.0, 35.0, 20.0, 36.0, 28.0, 15.0, 14.0, 17.0, 11.0, 13.0, 8.0, 11.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7734375, -9.411376953125, -9.04931640625, -8.687255859375, -8.3251953125, -7.963134765625, -7.60107421875, -7.239013671875, -6.876953125, -6.514892578125, -6.15283203125, -5.790771484375, -5.4287109375, -5.066650390625, -4.70458984375, -4.342529296875, -3.98046875, -3.618408203125, -3.25634765625, -2.894287109375, -2.5322265625, -2.170166015625, -1.80810546875, -1.446044921875, -1.083984375, -0.721923828125, -0.35986328125, 0.002197265625, 0.3642578125, 0.726318359375, 1.08837890625, 1.450439453125, 1.8125, 2.174560546875, 2.53662109375, 2.898681640625, 3.2607421875, 3.622802734375, 3.98486328125, 4.346923828125, 4.708984375, 5.071044921875, 5.43310546875, 5.795166015625, 6.1572265625, 6.519287109375, 6.88134765625, 7.243408203125, 7.60546875, 7.967529296875, 8.32958984375, 8.691650390625, 9.0537109375, 9.415771484375, 9.77783203125, 10.139892578125, 10.501953125, 10.864013671875, 11.22607421875, 11.588134765625, 11.9501953125, 12.312255859375, 12.67431640625, 13.036376953125, 13.3984375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 4.0, 4.0, 8.0, 18.0, 26.0, 41.0, 45.0, 69.0, 84.0, 112.0, 169.0, 244.0, 319.0, 511.0, 705.0, 1009.0, 1539.0, 2204.0, 3326.0, 5063.0, 8099.0, 12746.0, 20326.0, 32562.0, 50612.0, 76168.0, 105686.0, 133006.0, 143540.0, 131592.0, 104900.0, 75226.0, 49943.0, 31853.0, 20484.0, 12621.0, 8087.0, 5233.0, 3405.0, 2160.0, 1449.0, 998.0, 757.0, 458.0, 326.0, 224.0, 201.0, 114.0, 84.0, 61.0, 41.0, 36.0, 26.0, 12.0, 10.0, 5.0, 9.0, 5.0, 2.0, 0.0, 2.0], "bins": [-4.6953125, -4.54620361328125, -4.3970947265625, -4.24798583984375, -4.098876953125, -3.94976806640625, -3.8006591796875, -3.65155029296875, -3.50244140625, -3.35333251953125, -3.2042236328125, -3.05511474609375, -2.906005859375, -2.75689697265625, -2.6077880859375, -2.45867919921875, -2.3095703125, -2.16046142578125, -2.0113525390625, -1.86224365234375, -1.713134765625, -1.56402587890625, -1.4149169921875, -1.26580810546875, -1.11669921875, -0.96759033203125, -0.8184814453125, -0.66937255859375, -0.520263671875, -0.37115478515625, -0.2220458984375, -0.07293701171875, 0.076171875, 0.22528076171875, 0.3743896484375, 0.52349853515625, 0.672607421875, 0.82171630859375, 0.9708251953125, 1.11993408203125, 1.26904296875, 1.41815185546875, 1.5672607421875, 1.71636962890625, 1.865478515625, 2.01458740234375, 2.1636962890625, 2.31280517578125, 2.4619140625, 2.61102294921875, 2.7601318359375, 2.90924072265625, 3.058349609375, 3.20745849609375, 3.3565673828125, 3.50567626953125, 3.65478515625, 3.80389404296875, 3.9530029296875, 4.10211181640625, 4.251220703125, 4.40032958984375, 4.5494384765625, 4.69854736328125, 4.84765625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 8.0, 8.0, 21.0, 22.0, 21.0, 42.0, 41.0, 42.0, 55.0, 60.0, 50.0, 86.0, 77.0, 63.0, 63.0, 70.0, 58.0, 47.0, 39.0, 28.0, 32.0, 22.0, 11.0, 14.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0007843971252441406, -0.000762157142162323, -0.0007399171590805054, -0.0007176771759986877, -0.0006954371929168701, -0.0006731972098350525, -0.0006509572267532349, -0.0006287172436714172, -0.0006064772605895996, -0.000584237277507782, -0.0005619972944259644, -0.0005397573113441467, -0.0005175173282623291, -0.0004952773451805115, -0.00047303736209869385, -0.0004507973790168762, -0.0004285573959350586, -0.00040631741285324097, -0.00038407742977142334, -0.0003618374466896057, -0.0003395974636077881, -0.00031735748052597046, -0.00029511749744415283, -0.0002728775143623352, -0.0002506375312805176, -0.00022839754819869995, -0.00020615756511688232, -0.0001839175820350647, -0.00016167759895324707, -0.00013943761587142944, -0.00011719763278961182, -9.495764970779419e-05, -7.271766662597656e-05, -5.0477683544158936e-05, -2.823770046234131e-05, -5.997717380523682e-06, 1.6242265701293945e-05, 3.848224878311157e-05, 6.07222318649292e-05, 8.296221494674683e-05, 0.00010520219802856445, 0.00012744218111038208, 0.0001496821641921997, 0.00017192214727401733, 0.00019416213035583496, 0.0002164021134376526, 0.00023864209651947021, 0.00026088207960128784, 0.00028312206268310547, 0.0003053620457649231, 0.0003276020288467407, 0.00034984201192855835, 0.000372081995010376, 0.0003943219780921936, 0.00041656196117401123, 0.00043880194425582886, 0.0004610419273376465, 0.0004832819104194641, 0.0005055218935012817, 0.0005277618765830994, 0.000550001859664917, 0.0005722418427467346, 0.0005944818258285522, 0.0006167218089103699, 0.0006389617919921875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 3.0, 14.0, 17.0, 22.0, 31.0, 54.0, 80.0, 108.0, 147.0, 198.0, 326.0, 536.0, 804.0, 1270.0, 2027.0, 3233.0, 5152.0, 8598.0, 14437.0, 23984.0, 39311.0, 62143.0, 93133.0, 126154.0, 148638.0, 148084.0, 122841.0, 90033.0, 60447.0, 37913.0, 23249.0, 13700.0, 8241.0, 5090.0, 3082.0, 1960.0, 1202.0, 798.0, 515.0, 348.0, 216.0, 150.0, 101.0, 54.0, 35.0, 28.0, 11.0, 14.0, 13.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-4.796875, -4.64678955078125, -4.4967041015625, -4.34661865234375, -4.196533203125, -4.04644775390625, -3.8963623046875, -3.74627685546875, -3.59619140625, -3.44610595703125, -3.2960205078125, -3.14593505859375, -2.995849609375, -2.84576416015625, -2.6956787109375, -2.54559326171875, -2.3955078125, -2.24542236328125, -2.0953369140625, -1.94525146484375, -1.795166015625, -1.64508056640625, -1.4949951171875, -1.34490966796875, -1.19482421875, -1.04473876953125, -0.8946533203125, -0.74456787109375, -0.594482421875, -0.44439697265625, -0.2943115234375, -0.14422607421875, 0.005859375, 0.15594482421875, 0.3060302734375, 0.45611572265625, 0.606201171875, 0.75628662109375, 0.9063720703125, 1.05645751953125, 1.20654296875, 1.35662841796875, 1.5067138671875, 1.65679931640625, 1.806884765625, 1.95697021484375, 2.1070556640625, 2.25714111328125, 2.4072265625, 2.55731201171875, 2.7073974609375, 2.85748291015625, 3.007568359375, 3.15765380859375, 3.3077392578125, 3.45782470703125, 3.60791015625, 3.75799560546875, 3.9080810546875, 4.05816650390625, 4.208251953125, 4.35833740234375, 4.5084228515625, 4.65850830078125, 4.80859375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 6.0, 6.0, 6.0, 11.0, 6.0, 8.0, 22.0, 17.0, 20.0, 29.0, 30.0, 27.0, 40.0, 47.0, 40.0, 38.0, 53.0, 50.0, 54.0, 54.0, 59.0, 36.0, 46.0, 42.0, 41.0, 25.0, 44.0, 26.0, 22.0, 16.0, 18.0, 13.0, 17.0, 7.0, 9.0, 8.0, 5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.23828125, -2.1700439453125, -2.101806640625, -2.0335693359375, -1.96533203125, -1.8970947265625, -1.828857421875, -1.7606201171875, -1.6923828125, -1.6241455078125, -1.555908203125, -1.4876708984375, -1.41943359375, -1.3511962890625, -1.282958984375, -1.2147216796875, -1.146484375, -1.0782470703125, -1.010009765625, -0.9417724609375, -0.87353515625, -0.8052978515625, -0.737060546875, -0.6688232421875, -0.6005859375, -0.5323486328125, -0.464111328125, -0.3958740234375, -0.32763671875, -0.2593994140625, -0.191162109375, -0.1229248046875, -0.0546875, 0.0135498046875, 0.081787109375, 0.1500244140625, 0.21826171875, 0.2864990234375, 0.354736328125, 0.4229736328125, 0.4912109375, 0.5594482421875, 0.627685546875, 0.6959228515625, 0.76416015625, 0.8323974609375, 0.900634765625, 0.9688720703125, 1.037109375, 1.1053466796875, 1.173583984375, 1.2418212890625, 1.31005859375, 1.3782958984375, 1.446533203125, 1.5147705078125, 1.5830078125, 1.6512451171875, 1.719482421875, 1.7877197265625, 1.85595703125, 1.9241943359375, 1.992431640625, 2.0606689453125, 2.12890625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 6.0, 3.0, 10.0, 10.0, 8.0, 10.0, 11.0, 19.0, 16.0, 26.0, 21.0, 31.0, 33.0, 41.0, 29.0, 41.0, 44.0, 45.0, 49.0, 44.0, 51.0, 45.0, 43.0, 41.0, 41.0, 36.0, 31.0, 31.0, 28.0, 21.0, 27.0, 11.0, 16.0, 14.0, 11.0, 10.0, 16.0, 4.0, 11.0, 6.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.864256858825684, -11.450348854064941, -11.0364408493042, -10.622532844543457, -10.208624839782715, -9.794716835021973, -9.38080883026123, -8.966900825500488, -8.552992820739746, -8.139084815979004, -7.725176811218262, -7.3112688064575195, -6.897360801696777, -6.483452796936035, -6.069544792175293, -5.655636787414551, -5.24172830581665, -4.827820301055908, -4.413912296295166, -4.000004291534424, -3.5860962867736816, -3.1721880435943604, -2.758280038833618, -2.344372034072876, -1.9304640293121338, -1.5165560245513916, -1.1026480197906494, -0.6887398958206177, -0.2748318910598755, 0.13907623291015625, 0.5529842376708984, 0.9668922424316406, 1.3808002471923828, 1.794708251953125, 2.208616256713867, 2.6225242614746094, 3.0364322662353516, 3.450340509414673, 3.864248514175415, 4.278156280517578, 4.69206428527832, 5.1059722900390625, 5.519880294799805, 5.933788299560547, 6.347696304321289, 6.761604309082031, 7.175512313842773, 7.589420318603516, 8.003328323364258, 8.417236328125, 8.831144332885742, 9.245052337646484, 9.658960342407227, 10.072868347167969, 10.486776351928711, 10.900684356689453, 11.314593315124512, 11.728501319885254, 12.142409324645996, 12.556317329406738, 12.97022533416748, 13.384133338928223, 13.798041343688965, 14.211949348449707, 14.62585735321045]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 6.0, 5.0, 6.0, 10.0, 12.0, 5.0, 20.0, 19.0, 25.0, 10.0, 26.0, 22.0, 25.0, 37.0, 39.0, 47.0, 27.0, 41.0, 44.0, 35.0, 37.0, 41.0, 38.0, 37.0, 43.0, 44.0, 40.0, 32.0, 25.0, 20.0, 26.0, 26.0, 22.0, 9.0, 16.0, 13.0, 10.0, 11.0, 13.0, 8.0, 9.0, 4.0, 5.0, 3.0, 4.0, 2.0, 1.0, 3.0, 3.0], "bins": [-16.73340606689453, -16.26563835144043, -15.797870635986328, -15.330102920532227, -14.862335205078125, -14.394567489624023, -13.926798820495605, -13.459031105041504, -12.991263389587402, -12.5234956741333, -12.0557279586792, -11.587960243225098, -11.12019157409668, -10.652423858642578, -10.184656143188477, -9.716888427734375, -9.249120712280273, -8.781352996826172, -8.31358528137207, -7.8458170890808105, -7.378049373626709, -6.910281658172607, -6.442513465881348, -5.974745750427246, -5.5069780349731445, -5.039210319519043, -4.571442604064941, -4.103674411773682, -3.63590669631958, -3.1681389808654785, -2.700371026992798, -2.232603073120117, -1.7648353576660156, -1.2970675230026245, -0.8292996883392334, -0.3615318536758423, 0.10623598098754883, 0.5740036964416504, 1.041771650314331, 1.5095396041870117, 1.9773073196411133, 2.445075035095215, 2.9128429889678955, 3.380610942840576, 3.8483786582946777, 4.316146373748779, 4.783914566040039, 5.251682281494141, 5.719449996948242, 6.187217712402344, 6.654985427856445, 7.122753620147705, 7.590521335601807, 8.05828857421875, 8.526057243347168, 8.99382495880127, 9.461592674255371, 9.929360389709473, 10.397128105163574, 10.864895820617676, 11.332664489746094, 11.800432205200195, 12.268199920654297, 12.735967636108398, 13.2037353515625]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 10.0, 19.0, 33.0, 44.0, 68.0, 124.0, 164.0, 257.0, 453.0, 696.0, 1094.0, 1690.0, 2681.0, 4279.0, 6795.0, 11133.0, 18292.0, 30463.0, 51355.0, 87454.0, 151748.0, 259781.0, 419933.0, 594224.0, 689236.0, 636043.0, 477717.0, 307464.0, 183157.0, 105298.0, 61875.0, 35637.0, 21473.0, 12825.0, 7848.0, 4857.0, 3069.0, 1893.0, 1164.0, 739.0, 451.0, 263.0, 172.0, 119.0, 87.0, 42.0, 29.0, 16.0, 11.0, 8.0, 2.0, 1.0, 1.0, 1.0], "bins": [-11.75, -11.4110107421875, -11.072021484375, -10.7330322265625, -10.39404296875, -10.0550537109375, -9.716064453125, -9.3770751953125, -9.0380859375, -8.6990966796875, -8.360107421875, -8.0211181640625, -7.68212890625, -7.3431396484375, -7.004150390625, -6.6651611328125, -6.326171875, -5.9871826171875, -5.648193359375, -5.3092041015625, -4.97021484375, -4.6312255859375, -4.292236328125, -3.9532470703125, -3.6142578125, -3.2752685546875, -2.936279296875, -2.5972900390625, -2.25830078125, -1.9193115234375, -1.580322265625, -1.2413330078125, -0.90234375, -0.5633544921875, -0.224365234375, 0.1146240234375, 0.45361328125, 0.7926025390625, 1.131591796875, 1.4705810546875, 1.8095703125, 2.1485595703125, 2.487548828125, 2.8265380859375, 3.16552734375, 3.5045166015625, 3.843505859375, 4.1824951171875, 4.521484375, 4.8604736328125, 5.199462890625, 5.5384521484375, 5.87744140625, 6.2164306640625, 6.555419921875, 6.8944091796875, 7.2333984375, 7.5723876953125, 7.911376953125, 8.2503662109375, 8.58935546875, 8.9283447265625, 9.267333984375, 9.6063232421875, 9.9453125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 6.0, 3.0, 11.0, 6.0, 8.0, 11.0, 9.0, 19.0, 19.0, 19.0, 22.0, 17.0, 22.0, 30.0, 34.0, 28.0, 24.0, 44.0, 37.0, 41.0, 40.0, 39.0, 48.0, 30.0, 42.0, 49.0, 44.0, 26.0, 27.0, 19.0, 27.0, 18.0, 28.0, 18.0, 24.0, 19.0, 12.0, 14.0, 14.0, 7.0, 5.0, 10.0, 8.0, 6.0, 2.0, 8.0, 3.0, 3.0, 2.0, 3.0, 3.0], "bins": [-13.0078125, -12.6378173828125, -12.267822265625, -11.8978271484375, -11.52783203125, -11.1578369140625, -10.787841796875, -10.4178466796875, -10.0478515625, -9.6778564453125, -9.307861328125, -8.9378662109375, -8.56787109375, -8.1978759765625, -7.827880859375, -7.4578857421875, -7.087890625, -6.7178955078125, -6.347900390625, -5.9779052734375, -5.60791015625, -5.2379150390625, -4.867919921875, -4.4979248046875, -4.1279296875, -3.7579345703125, -3.387939453125, -3.0179443359375, -2.64794921875, -2.2779541015625, -1.907958984375, -1.5379638671875, -1.16796875, -0.7979736328125, -0.427978515625, -0.0579833984375, 0.31201171875, 0.6820068359375, 1.052001953125, 1.4219970703125, 1.7919921875, 2.1619873046875, 2.531982421875, 2.9019775390625, 3.27197265625, 3.6419677734375, 4.011962890625, 4.3819580078125, 4.751953125, 5.1219482421875, 5.491943359375, 5.8619384765625, 6.23193359375, 6.6019287109375, 6.971923828125, 7.3419189453125, 7.7119140625, 8.0819091796875, 8.451904296875, 8.8218994140625, 9.19189453125, 9.5618896484375, 9.931884765625, 10.3018798828125, 10.671875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 10.0, 6.0, 14.0, 24.0, 51.0, 86.0, 127.0, 224.0, 325.0, 579.0, 864.0, 1421.0, 2383.0, 3955.0, 6628.0, 11096.0, 18720.0, 31690.0, 54096.0, 91301.0, 154053.0, 252126.0, 394447.0, 555933.0, 662299.0, 629043.0, 487180.0, 328097.0, 205545.0, 123212.0, 73107.0, 43092.0, 25245.0, 14867.0, 8955.0, 5292.0, 3171.0, 1940.0, 1161.0, 761.0, 416.0, 321.0, 167.0, 98.0, 62.0, 39.0, 23.0, 13.0, 10.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0], "bins": [-13.15625, -12.766845703125, -12.37744140625, -11.988037109375, -11.5986328125, -11.209228515625, -10.81982421875, -10.430419921875, -10.041015625, -9.651611328125, -9.26220703125, -8.872802734375, -8.4833984375, -8.093994140625, -7.70458984375, -7.315185546875, -6.92578125, -6.536376953125, -6.14697265625, -5.757568359375, -5.3681640625, -4.978759765625, -4.58935546875, -4.199951171875, -3.810546875, -3.421142578125, -3.03173828125, -2.642333984375, -2.2529296875, -1.863525390625, -1.47412109375, -1.084716796875, -0.6953125, -0.305908203125, 0.08349609375, 0.472900390625, 0.8623046875, 1.251708984375, 1.64111328125, 2.030517578125, 2.419921875, 2.809326171875, 3.19873046875, 3.588134765625, 3.9775390625, 4.366943359375, 4.75634765625, 5.145751953125, 5.53515625, 5.924560546875, 6.31396484375, 6.703369140625, 7.0927734375, 7.482177734375, 7.87158203125, 8.260986328125, 8.650390625, 9.039794921875, 9.42919921875, 9.818603515625, 10.2080078125, 10.597412109375, 10.98681640625, 11.376220703125, 11.765625]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 6.0, 5.0, 3.0, 8.0, 9.0, 19.0, 18.0, 24.0, 26.0, 28.0, 48.0, 53.0, 81.0, 98.0, 113.0, 90.0, 142.0, 144.0, 199.0, 163.0, 177.0, 213.0, 208.0, 209.0, 223.0, 190.0, 219.0, 179.0, 161.0, 155.0, 145.0, 136.0, 100.0, 83.0, 71.0, 64.0, 47.0, 39.0, 41.0, 30.0, 23.0, 22.0, 17.0, 7.0, 11.0, 8.0, 4.0, 4.0, 3.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.62890625, -4.47735595703125, -4.3258056640625, -4.17425537109375, -4.022705078125, -3.87115478515625, -3.7196044921875, -3.56805419921875, -3.41650390625, -3.26495361328125, -3.1134033203125, -2.96185302734375, -2.810302734375, -2.65875244140625, -2.5072021484375, -2.35565185546875, -2.2041015625, -2.05255126953125, -1.9010009765625, -1.74945068359375, -1.597900390625, -1.44635009765625, -1.2947998046875, -1.14324951171875, -0.99169921875, -0.84014892578125, -0.6885986328125, -0.53704833984375, -0.385498046875, -0.23394775390625, -0.0823974609375, 0.06915283203125, 0.220703125, 0.37225341796875, 0.5238037109375, 0.67535400390625, 0.826904296875, 0.97845458984375, 1.1300048828125, 1.28155517578125, 1.43310546875, 1.58465576171875, 1.7362060546875, 1.88775634765625, 2.039306640625, 2.19085693359375, 2.3424072265625, 2.49395751953125, 2.6455078125, 2.79705810546875, 2.9486083984375, 3.10015869140625, 3.251708984375, 3.40325927734375, 3.5548095703125, 3.70635986328125, 3.85791015625, 4.00946044921875, 4.1610107421875, 4.31256103515625, 4.464111328125, 4.61566162109375, 4.7672119140625, 4.91876220703125, 5.0703125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 7.0, 5.0, 4.0, 8.0, 5.0, 2.0, 10.0, 12.0, 16.0, 22.0, 17.0, 23.0, 27.0, 17.0, 35.0, 42.0, 44.0, 57.0, 47.0, 46.0, 58.0, 44.0, 67.0, 42.0, 40.0, 63.0, 28.0, 38.0, 25.0, 34.0, 26.0, 14.0, 12.0, 14.0, 14.0, 8.0, 11.0, 8.0, 3.0, 5.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.058917045593262, -12.617138862609863, -12.175360679626465, -11.73358154296875, -11.291803359985352, -10.850025177001953, -10.408246994018555, -9.966468811035156, -9.524690628051758, -9.08291244506836, -8.641134262084961, -8.199356079101562, -7.757576942443848, -7.315798759460449, -6.874020576477051, -6.432242393493652, -5.9904632568359375, -5.548685073852539, -5.106906414031982, -4.665128231048584, -4.223349571228027, -3.781571388244629, -3.3397932052612305, -2.898014783859253, -2.4562363624572754, -2.014457941055298, -1.5726796388626099, -1.1309013366699219, -0.6891229152679443, -0.2473444938659668, 0.19443368911743164, 0.6362121105194092, 1.0779895782470703, 1.5197679996490479, 1.9615463018417358, 2.403324604034424, 2.8451030254364014, 3.286881446838379, 3.7286596298217773, 4.170437812805176, 4.612216472625732, 5.053994655609131, 5.4957733154296875, 5.937551498413086, 6.379329681396484, 6.821108341217041, 7.2628865242004395, 7.704665184020996, 8.146443367004395, 8.588221549987793, 9.029999732971191, 9.471778869628906, 9.913557052612305, 10.355335235595703, 10.797113418579102, 11.2388916015625, 11.680669784545898, 12.122447967529297, 12.564226150512695, 13.006004333496094, 13.447783470153809, 13.889561653137207, 14.331339836120605, 14.773118019104004, 15.214897155761719]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 6.0, 7.0, 8.0, 14.0, 9.0, 16.0, 21.0, 21.0, 21.0, 26.0, 26.0, 30.0, 26.0, 36.0, 40.0, 34.0, 28.0, 41.0, 34.0, 37.0, 41.0, 42.0, 41.0, 44.0, 46.0, 36.0, 26.0, 30.0, 30.0, 28.0, 29.0, 17.0, 11.0, 23.0, 9.0, 15.0, 11.0, 9.0, 7.0, 7.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.620450973510742, -13.18293571472168, -12.745421409606934, -12.307907104492188, -11.870391845703125, -11.432876586914062, -10.995362281799316, -10.55784797668457, -10.120332717895508, -9.682817459106445, -9.2453031539917, -8.807788848876953, -8.37027359008789, -7.932758808135986, -7.495244026184082, -7.057729244232178, -6.620214462280273, -6.182699680328369, -5.745184898376465, -5.3076701164245605, -4.870155334472656, -4.432640552520752, -3.9951257705688477, -3.5576109886169434, -3.120096206665039, -2.6825814247131348, -2.2450666427612305, -1.8075518608093262, -1.3700370788574219, -0.9325222969055176, -0.4950075149536133, -0.057492733001708984, 0.3800220489501953, 0.8175368309020996, 1.255051612854004, 1.6925663948059082, 2.1300811767578125, 2.567595958709717, 3.005110740661621, 3.4426255226135254, 3.8801403045654297, 4.317655086517334, 4.755169868469238, 5.192684650421143, 5.630199432373047, 6.067714214324951, 6.5052289962768555, 6.94274377822876, 7.380258560180664, 7.817773342132568, 8.255288124084473, 8.692802429199219, 9.130317687988281, 9.567832946777344, 10.00534725189209, 10.442861557006836, 10.880376815795898, 11.317892074584961, 11.755406379699707, 12.192920684814453, 12.630435943603516, 13.067951202392578, 13.505465507507324, 13.94297981262207, 14.380495071411133]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 8.0, 4.0, 6.0, 4.0, 23.0, 27.0, 35.0, 39.0, 78.0, 108.0, 173.0, 226.0, 346.0, 513.0, 716.0, 1027.0, 1544.0, 2251.0, 3213.0, 4477.0, 6704.0, 9751.0, 14340.0, 22133.0, 34738.0, 56566.0, 92762.0, 146761.0, 188959.0, 165363.0, 109959.0, 66935.0, 40524.0, 25800.0, 16652.0, 11295.0, 7564.0, 5205.0, 3642.0, 2578.0, 1739.0, 1192.0, 812.0, 590.0, 393.0, 255.0, 159.0, 121.0, 102.0, 50.0, 39.0, 20.0, 12.0, 10.0, 4.0, 9.0, 5.0, 1.0, 4.0, 4.0, 1.0, 0.0, 2.0], "bins": [-18.515625, -17.8916015625, -17.267578125, -16.6435546875, -16.01953125, -15.3955078125, -14.771484375, -14.1474609375, -13.5234375, -12.8994140625, -12.275390625, -11.6513671875, -11.02734375, -10.4033203125, -9.779296875, -9.1552734375, -8.53125, -7.9072265625, -7.283203125, -6.6591796875, -6.03515625, -5.4111328125, -4.787109375, -4.1630859375, -3.5390625, -2.9150390625, -2.291015625, -1.6669921875, -1.04296875, -0.4189453125, 0.205078125, 0.8291015625, 1.453125, 2.0771484375, 2.701171875, 3.3251953125, 3.94921875, 4.5732421875, 5.197265625, 5.8212890625, 6.4453125, 7.0693359375, 7.693359375, 8.3173828125, 8.94140625, 9.5654296875, 10.189453125, 10.8134765625, 11.4375, 12.0615234375, 12.685546875, 13.3095703125, 13.93359375, 14.5576171875, 15.181640625, 15.8056640625, 16.4296875, 17.0537109375, 17.677734375, 18.3017578125, 18.92578125, 19.5498046875, 20.173828125, 20.7978515625, 21.421875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 3.0, 9.0, 4.0, 5.0, 6.0, 12.0, 11.0, 15.0, 27.0, 25.0, 12.0, 17.0, 29.0, 28.0, 36.0, 36.0, 37.0, 36.0, 38.0, 44.0, 37.0, 34.0, 41.0, 40.0, 40.0, 43.0, 42.0, 35.0, 43.0, 28.0, 24.0, 25.0, 25.0, 21.0, 19.0, 13.0, 13.0, 8.0, 12.0, 8.0, 7.0, 8.0, 3.0, 0.0, 4.0, 0.0, 0.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-12.9453125, -12.5506591796875, -12.156005859375, -11.7613525390625, -11.36669921875, -10.9720458984375, -10.577392578125, -10.1827392578125, -9.7880859375, -9.3934326171875, -8.998779296875, -8.6041259765625, -8.20947265625, -7.8148193359375, -7.420166015625, -7.0255126953125, -6.630859375, -6.2362060546875, -5.841552734375, -5.4468994140625, -5.05224609375, -4.6575927734375, -4.262939453125, -3.8682861328125, -3.4736328125, -3.0789794921875, -2.684326171875, -2.2896728515625, -1.89501953125, -1.5003662109375, -1.105712890625, -0.7110595703125, -0.31640625, 0.0782470703125, 0.472900390625, 0.8675537109375, 1.26220703125, 1.6568603515625, 2.051513671875, 2.4461669921875, 2.8408203125, 3.2354736328125, 3.630126953125, 4.0247802734375, 4.41943359375, 4.8140869140625, 5.208740234375, 5.6033935546875, 5.998046875, 6.3927001953125, 6.787353515625, 7.1820068359375, 7.57666015625, 7.9713134765625, 8.365966796875, 8.7606201171875, 9.1552734375, 9.5499267578125, 9.944580078125, 10.3392333984375, 10.73388671875, 11.1285400390625, 11.523193359375, 11.9178466796875, 12.3125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [5.0, 3.0, 3.0, 7.0, 12.0, 12.0, 17.0, 23.0, 49.0, 58.0, 81.0, 77.0, 134.0, 182.0, 234.0, 364.0, 554.0, 728.0, 1130.0, 1558.0, 2225.0, 3327.0, 5130.0, 7618.0, 12132.0, 19230.0, 33027.0, 61150.0, 123501.0, 236990.0, 248508.0, 132776.0, 65324.0, 34798.0, 20529.0, 12536.0, 8029.0, 5257.0, 3454.0, 2376.0, 1664.0, 1118.0, 786.0, 527.0, 349.0, 278.0, 189.0, 140.0, 111.0, 95.0, 52.0, 39.0, 29.0, 17.0, 11.0, 4.0, 8.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-27.78125, -26.85693359375, -25.9326171875, -25.00830078125, -24.083984375, -23.15966796875, -22.2353515625, -21.31103515625, -20.38671875, -19.46240234375, -18.5380859375, -17.61376953125, -16.689453125, -15.76513671875, -14.8408203125, -13.91650390625, -12.9921875, -12.06787109375, -11.1435546875, -10.21923828125, -9.294921875, -8.37060546875, -7.4462890625, -6.52197265625, -5.59765625, -4.67333984375, -3.7490234375, -2.82470703125, -1.900390625, -0.97607421875, -0.0517578125, 0.87255859375, 1.796875, 2.72119140625, 3.6455078125, 4.56982421875, 5.494140625, 6.41845703125, 7.3427734375, 8.26708984375, 9.19140625, 10.11572265625, 11.0400390625, 11.96435546875, 12.888671875, 13.81298828125, 14.7373046875, 15.66162109375, 16.5859375, 17.51025390625, 18.4345703125, 19.35888671875, 20.283203125, 21.20751953125, 22.1318359375, 23.05615234375, 23.98046875, 24.90478515625, 25.8291015625, 26.75341796875, 27.677734375, 28.60205078125, 29.5263671875, 30.45068359375, 31.375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 9.0, 13.0, 10.0, 7.0, 13.0, 19.0, 17.0, 27.0, 39.0, 37.0, 35.0, 27.0, 39.0, 48.0, 49.0, 65.0, 53.0, 62.0, 43.0, 54.0, 44.0, 50.0, 35.0, 40.0, 28.0, 18.0, 25.0, 17.0, 22.0, 13.0, 15.0, 6.0, 9.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.40625, -13.01220703125, -12.6181640625, -12.22412109375, -11.830078125, -11.43603515625, -11.0419921875, -10.64794921875, -10.25390625, -9.85986328125, -9.4658203125, -9.07177734375, -8.677734375, -8.28369140625, -7.8896484375, -7.49560546875, -7.1015625, -6.70751953125, -6.3134765625, -5.91943359375, -5.525390625, -5.13134765625, -4.7373046875, -4.34326171875, -3.94921875, -3.55517578125, -3.1611328125, -2.76708984375, -2.373046875, -1.97900390625, -1.5849609375, -1.19091796875, -0.796875, -0.40283203125, -0.0087890625, 0.38525390625, 0.779296875, 1.17333984375, 1.5673828125, 1.96142578125, 2.35546875, 2.74951171875, 3.1435546875, 3.53759765625, 3.931640625, 4.32568359375, 4.7197265625, 5.11376953125, 5.5078125, 5.90185546875, 6.2958984375, 6.68994140625, 7.083984375, 7.47802734375, 7.8720703125, 8.26611328125, 8.66015625, 9.05419921875, 9.4482421875, 9.84228515625, 10.236328125, 10.63037109375, 11.0244140625, 11.41845703125, 11.8125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 12.0, 15.0, 11.0, 26.0, 27.0, 42.0, 67.0, 103.0, 152.0, 226.0, 345.0, 519.0, 819.0, 1275.0, 2051.0, 3412.0, 5634.0, 9773.0, 18282.0, 37255.0, 89652.0, 231217.0, 343497.0, 173425.0, 66281.0, 28925.0, 14861.0, 8204.0, 4692.0, 2748.0, 1731.0, 1105.0, 718.0, 474.0, 321.0, 213.0, 146.0, 88.0, 64.0, 50.0, 31.0, 21.0, 14.0, 12.0, 4.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.84375, -15.321533203125, -14.79931640625, -14.277099609375, -13.7548828125, -13.232666015625, -12.71044921875, -12.188232421875, -11.666015625, -11.143798828125, -10.62158203125, -10.099365234375, -9.5771484375, -9.054931640625, -8.53271484375, -8.010498046875, -7.48828125, -6.966064453125, -6.44384765625, -5.921630859375, -5.3994140625, -4.877197265625, -4.35498046875, -3.832763671875, -3.310546875, -2.788330078125, -2.26611328125, -1.743896484375, -1.2216796875, -0.699462890625, -0.17724609375, 0.344970703125, 0.8671875, 1.389404296875, 1.91162109375, 2.433837890625, 2.9560546875, 3.478271484375, 4.00048828125, 4.522705078125, 5.044921875, 5.567138671875, 6.08935546875, 6.611572265625, 7.1337890625, 7.656005859375, 8.17822265625, 8.700439453125, 9.22265625, 9.744873046875, 10.26708984375, 10.789306640625, 11.3115234375, 11.833740234375, 12.35595703125, 12.878173828125, 13.400390625, 13.922607421875, 14.44482421875, 14.967041015625, 15.4892578125, 16.011474609375, 16.53369140625, 17.055908203125, 17.578125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 5.0, 9.0, 13.0, 10.0, 14.0, 22.0, 26.0, 55.0, 99.0, 165.0, 174.0, 144.0, 84.0, 53.0, 31.0, 20.0, 18.0, 12.0, 9.0, 3.0, 9.0, 4.0, 1.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002483367919921875, -0.002415284514427185, -0.002347201108932495, -0.002279117703437805, -0.0022110342979431152, -0.0021429508924484253, -0.0020748674869537354, -0.0020067840814590454, -0.0019387006759643555, -0.0018706172704696655, -0.0018025338649749756, -0.0017344504594802856, -0.0016663670539855957, -0.0015982836484909058, -0.0015302002429962158, -0.0014621168375015259, -0.001394033432006836, -0.001325950026512146, -0.001257866621017456, -0.0011897832155227661, -0.0011216998100280762, -0.0010536164045333862, -0.0009855329990386963, -0.0009174495935440063, -0.0008493661880493164, -0.0007812827825546265, -0.0007131993770599365, -0.0006451159715652466, -0.0005770325660705566, -0.0005089491605758667, -0.00044086575508117676, -0.0003727823495864868, -0.0003046989440917969, -0.00023661553859710693, -0.000168532133102417, -0.00010044872760772705, -3.236532211303711e-05, 3.571808338165283e-05, 0.00010380148887634277, 0.00017188489437103271, 0.00023996829986572266, 0.0003080517053604126, 0.00037613511085510254, 0.0004442185163497925, 0.0005123019218444824, 0.0005803853273391724, 0.0006484687328338623, 0.0007165521383285522, 0.0007846355438232422, 0.0008527189493179321, 0.0009208023548126221, 0.000988885760307312, 0.001056969165802002, 0.001125052571296692, 0.0011931359767913818, 0.0012612193822860718, 0.0013293027877807617, 0.0013973861932754517, 0.0014654695987701416, 0.0015335530042648315, 0.0016016364097595215, 0.0016697198152542114, 0.0017378032207489014, 0.0018058866262435913, 0.0018739700317382812]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 7.0, 18.0, 31.0, 52.0, 76.0, 131.0, 171.0, 264.0, 428.0, 646.0, 924.0, 1430.0, 2242.0, 3460.0, 5499.0, 8839.0, 14814.0, 25694.0, 44547.0, 78791.0, 129913.0, 182233.0, 190581.0, 143183.0, 89842.0, 51559.0, 29080.0, 16870.0, 10025.0, 6168.0, 3927.0, 2466.0, 1586.0, 1077.0, 670.0, 439.0, 307.0, 194.0, 132.0, 91.0, 54.0, 34.0, 19.0, 16.0, 7.0, 10.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.625, -10.30419921875, -9.9833984375, -9.66259765625, -9.341796875, -9.02099609375, -8.7001953125, -8.37939453125, -8.05859375, -7.73779296875, -7.4169921875, -7.09619140625, -6.775390625, -6.45458984375, -6.1337890625, -5.81298828125, -5.4921875, -5.17138671875, -4.8505859375, -4.52978515625, -4.208984375, -3.88818359375, -3.5673828125, -3.24658203125, -2.92578125, -2.60498046875, -2.2841796875, -1.96337890625, -1.642578125, -1.32177734375, -1.0009765625, -0.68017578125, -0.359375, -0.03857421875, 0.2822265625, 0.60302734375, 0.923828125, 1.24462890625, 1.5654296875, 1.88623046875, 2.20703125, 2.52783203125, 2.8486328125, 3.16943359375, 3.490234375, 3.81103515625, 4.1318359375, 4.45263671875, 4.7734375, 5.09423828125, 5.4150390625, 5.73583984375, 6.056640625, 6.37744140625, 6.6982421875, 7.01904296875, 7.33984375, 7.66064453125, 7.9814453125, 8.30224609375, 8.623046875, 8.94384765625, 9.2646484375, 9.58544921875, 9.90625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 1.0, 3.0, 2.0, 3.0, 3.0, 0.0, 4.0, 5.0, 9.0, 10.0, 12.0, 18.0, 16.0, 17.0, 16.0, 22.0, 25.0, 44.0, 44.0, 34.0, 59.0, 41.0, 62.0, 67.0, 55.0, 61.0, 56.0, 52.0, 48.0, 43.0, 30.0, 23.0, 32.0, 24.0, 19.0, 8.0, 10.0, 2.0, 7.0, 6.0, 3.0, 3.0, 3.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.1015625, -3.9761962890625, -3.850830078125, -3.7254638671875, -3.60009765625, -3.4747314453125, -3.349365234375, -3.2239990234375, -3.0986328125, -2.9732666015625, -2.847900390625, -2.7225341796875, -2.59716796875, -2.4718017578125, -2.346435546875, -2.2210693359375, -2.095703125, -1.9703369140625, -1.844970703125, -1.7196044921875, -1.59423828125, -1.4688720703125, -1.343505859375, -1.2181396484375, -1.0927734375, -0.9674072265625, -0.842041015625, -0.7166748046875, -0.59130859375, -0.4659423828125, -0.340576171875, -0.2152099609375, -0.08984375, 0.0355224609375, 0.160888671875, 0.2862548828125, 0.41162109375, 0.5369873046875, 0.662353515625, 0.7877197265625, 0.9130859375, 1.0384521484375, 1.163818359375, 1.2891845703125, 1.41455078125, 1.5399169921875, 1.665283203125, 1.7906494140625, 1.916015625, 2.0413818359375, 2.166748046875, 2.2921142578125, 2.41748046875, 2.5428466796875, 2.668212890625, 2.7935791015625, 2.9189453125, 3.0443115234375, 3.169677734375, 3.2950439453125, 3.42041015625, 3.5457763671875, 3.671142578125, 3.7965087890625, 3.921875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 1.0, 2.0, 4.0, 4.0, 8.0, 7.0, 11.0, 9.0, 21.0, 13.0, 20.0, 22.0, 24.0, 24.0, 23.0, 46.0, 33.0, 38.0, 45.0, 37.0, 48.0, 58.0, 56.0, 46.0, 44.0, 40.0, 30.0, 30.0, 35.0, 28.0, 31.0, 23.0, 21.0, 25.0, 9.0, 24.0, 9.0, 11.0, 9.0, 12.0, 2.0, 4.0, 4.0, 4.0, 4.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.692245483398438, -11.324390411376953, -10.956535339355469, -10.588680267333984, -10.2208251953125, -9.852971076965332, -9.485116004943848, -9.117260932922363, -8.749405860900879, -8.381550788879395, -8.01369571685791, -7.645841121673584, -7.2779860496521, -6.910130977630615, -6.542276382446289, -6.174421310424805, -5.80656623840332, -5.438711166381836, -5.070856094360352, -4.703001499176025, -4.335146427154541, -3.9672913551330566, -3.5994365215301514, -3.231581687927246, -2.8637266159057617, -2.4958715438842773, -2.128016710281372, -1.7601617574691772, -1.3923068046569824, -1.0244518518447876, -0.6565968990325928, -0.2887420654296875, 0.07911396026611328, 0.4469689130783081, 0.8148238658905029, 1.1826788187026978, 1.5505337715148926, 1.9183887243270874, 2.2862436771392822, 2.6540985107421875, 3.021953582763672, 3.3898086547851562, 3.7576634883880615, 4.125518321990967, 4.493373394012451, 4.8612284660339355, 5.229083061218262, 5.596938133239746, 5.9647932052612305, 6.332648277282715, 6.700503349304199, 7.068357944488525, 7.43621301651001, 7.804068088531494, 8.17192268371582, 8.539777755737305, 8.907632827758789, 9.275487899780273, 9.643342971801758, 10.011198043823242, 10.379053115844727, 10.746907234191895, 11.114762306213379, 11.482617378234863, 11.850472450256348]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 5.0, 0.0, 4.0, 8.0, 4.0, 8.0, 6.0, 19.0, 13.0, 21.0, 22.0, 16.0, 17.0, 24.0, 25.0, 27.0, 29.0, 25.0, 33.0, 36.0, 37.0, 37.0, 31.0, 38.0, 34.0, 37.0, 49.0, 42.0, 32.0, 35.0, 34.0, 25.0, 35.0, 18.0, 30.0, 20.0, 24.0, 10.0, 12.0, 15.0, 11.0, 13.0, 11.0, 9.0, 4.0, 6.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-11.09140682220459, -10.72424030303955, -10.357072830200195, -9.989906311035156, -9.622739791870117, -9.255573272705078, -8.888405799865723, -8.521239280700684, -8.154072761535645, -7.786905765533447, -7.419739246368408, -7.052572250366211, -6.685405731201172, -6.318238735198975, -5.951071739196777, -5.583905220031738, -5.216738224029541, -4.849571228027344, -4.482404708862305, -4.115237712860107, -3.7480711936950684, -3.380904197692871, -3.013737440109253, -2.6465706825256348, -2.2794039249420166, -1.9122371673583984, -1.5450704097747803, -1.1779035329818726, -0.8107367753982544, -0.44357001781463623, -0.07640314102172852, 0.29076361656188965, 0.6579303741455078, 1.025097131729126, 1.3922638893127441, 1.7594307661056519, 2.1265974044799805, 2.4937644004821777, 2.860931158065796, 3.228097915649414, 3.5952646732330322, 3.9624314308166504, 4.329598426818848, 4.696764945983887, 5.063931941986084, 5.431098461151123, 5.79826545715332, 6.165431976318359, 6.532598972320557, 6.899765968322754, 7.266932487487793, 7.63409948348999, 8.001266479492188, 8.368432998657227, 8.735599517822266, 9.102766036987305, 9.46993350982666, 9.8371000289917, 10.204267501831055, 10.571434020996094, 10.938600540161133, 11.305767059326172, 11.672934532165527, 12.040101051330566, 12.407267570495605]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 16.0, 19.0, 23.0, 30.0, 62.0, 87.0, 147.0, 227.0, 316.0, 503.0, 771.0, 1232.0, 1896.0, 3014.0, 4557.0, 7366.0, 11665.0, 18885.0, 28989.0, 44722.0, 66271.0, 92371.0, 116700.0, 131683.0, 131027.0, 114281.0, 88808.0, 63820.0, 43070.0, 27829.0, 17759.0, 11052.0, 7119.0, 4332.0, 2869.0, 1761.0, 1078.0, 741.0, 473.0, 326.0, 214.0, 157.0, 104.0, 61.0, 41.0, 24.0, 19.0, 17.0, 8.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.28125, -8.9813232421875, -8.681396484375, -8.3814697265625, -8.08154296875, -7.7816162109375, -7.481689453125, -7.1817626953125, -6.8818359375, -6.5819091796875, -6.281982421875, -5.9820556640625, -5.68212890625, -5.3822021484375, -5.082275390625, -4.7823486328125, -4.482421875, -4.1824951171875, -3.882568359375, -3.5826416015625, -3.28271484375, -2.9827880859375, -2.682861328125, -2.3829345703125, -2.0830078125, -1.7830810546875, -1.483154296875, -1.1832275390625, -0.88330078125, -0.5833740234375, -0.283447265625, 0.0164794921875, 0.31640625, 0.6163330078125, 0.916259765625, 1.2161865234375, 1.51611328125, 1.8160400390625, 2.115966796875, 2.4158935546875, 2.7158203125, 3.0157470703125, 3.315673828125, 3.6156005859375, 3.91552734375, 4.2154541015625, 4.515380859375, 4.8153076171875, 5.115234375, 5.4151611328125, 5.715087890625, 6.0150146484375, 6.31494140625, 6.6148681640625, 6.914794921875, 7.2147216796875, 7.5146484375, 7.8145751953125, 8.114501953125, 8.4144287109375, 8.71435546875, 9.0142822265625, 9.314208984375, 9.6141357421875, 9.9140625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 2.0, 2.0, 3.0, 6.0, 5.0, 9.0, 11.0, 13.0, 21.0, 13.0, 8.0, 26.0, 24.0, 24.0, 27.0, 30.0, 27.0, 29.0, 29.0, 31.0, 53.0, 29.0, 42.0, 31.0, 31.0, 37.0, 33.0, 46.0, 43.0, 31.0, 36.0, 22.0, 22.0, 16.0, 29.0, 24.0, 20.0, 18.0, 14.0, 15.0, 8.0, 9.0, 9.0, 8.0, 6.0, 8.0, 6.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0], "bins": [-11.328125, -10.9727783203125, -10.617431640625, -10.2620849609375, -9.90673828125, -9.5513916015625, -9.196044921875, -8.8406982421875, -8.4853515625, -8.1300048828125, -7.774658203125, -7.4193115234375, -7.06396484375, -6.7086181640625, -6.353271484375, -5.9979248046875, -5.642578125, -5.2872314453125, -4.931884765625, -4.5765380859375, -4.22119140625, -3.8658447265625, -3.510498046875, -3.1551513671875, -2.7998046875, -2.4444580078125, -2.089111328125, -1.7337646484375, -1.37841796875, -1.0230712890625, -0.667724609375, -0.3123779296875, 0.04296875, 0.3983154296875, 0.753662109375, 1.1090087890625, 1.46435546875, 1.8197021484375, 2.175048828125, 2.5303955078125, 2.8857421875, 3.2410888671875, 3.596435546875, 3.9517822265625, 4.30712890625, 4.6624755859375, 5.017822265625, 5.3731689453125, 5.728515625, 6.0838623046875, 6.439208984375, 6.7945556640625, 7.14990234375, 7.5052490234375, 7.860595703125, 8.2159423828125, 8.5712890625, 8.9266357421875, 9.281982421875, 9.6373291015625, 9.99267578125, 10.3480224609375, 10.703369140625, 11.0587158203125, 11.4140625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 6.0, 9.0, 12.0, 9.0, 28.0, 36.0, 46.0, 76.0, 123.0, 195.0, 272.0, 400.0, 750.0, 1078.0, 1763.0, 2826.0, 4565.0, 7569.0, 12191.0, 19654.0, 31140.0, 47658.0, 70838.0, 98266.0, 122902.0, 137400.0, 131911.0, 111315.0, 83227.0, 58524.0, 38655.0, 24691.0, 15171.0, 9637.0, 5896.0, 3779.0, 2241.0, 1342.0, 819.0, 522.0, 352.0, 220.0, 151.0, 109.0, 62.0, 53.0, 19.0, 18.0, 17.0, 13.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6796875, -11.322998046875, -10.96630859375, -10.609619140625, -10.2529296875, -9.896240234375, -9.53955078125, -9.182861328125, -8.826171875, -8.469482421875, -8.11279296875, -7.756103515625, -7.3994140625, -7.042724609375, -6.68603515625, -6.329345703125, -5.97265625, -5.615966796875, -5.25927734375, -4.902587890625, -4.5458984375, -4.189208984375, -3.83251953125, -3.475830078125, -3.119140625, -2.762451171875, -2.40576171875, -2.049072265625, -1.6923828125, -1.335693359375, -0.97900390625, -0.622314453125, -0.265625, 0.091064453125, 0.44775390625, 0.804443359375, 1.1611328125, 1.517822265625, 1.87451171875, 2.231201171875, 2.587890625, 2.944580078125, 3.30126953125, 3.657958984375, 4.0146484375, 4.371337890625, 4.72802734375, 5.084716796875, 5.44140625, 5.798095703125, 6.15478515625, 6.511474609375, 6.8681640625, 7.224853515625, 7.58154296875, 7.938232421875, 8.294921875, 8.651611328125, 9.00830078125, 9.364990234375, 9.7216796875, 10.078369140625, 10.43505859375, 10.791748046875, 11.1484375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 5.0, 5.0, 6.0, 8.0, 8.0, 10.0, 16.0, 14.0, 16.0, 20.0, 28.0, 30.0, 28.0, 30.0, 31.0, 25.0, 50.0, 39.0, 41.0, 33.0, 32.0, 45.0, 43.0, 37.0, 41.0, 39.0, 37.0, 40.0, 35.0, 31.0, 24.0, 23.0, 16.0, 8.0, 18.0, 17.0, 11.0, 15.0, 7.0, 9.0, 11.0, 4.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.6484375, -8.3824462890625, -8.116455078125, -7.8504638671875, -7.58447265625, -7.3184814453125, -7.052490234375, -6.7864990234375, -6.5205078125, -6.2545166015625, -5.988525390625, -5.7225341796875, -5.45654296875, -5.1905517578125, -4.924560546875, -4.6585693359375, -4.392578125, -4.1265869140625, -3.860595703125, -3.5946044921875, -3.32861328125, -3.0626220703125, -2.796630859375, -2.5306396484375, -2.2646484375, -1.9986572265625, -1.732666015625, -1.4666748046875, -1.20068359375, -0.9346923828125, -0.668701171875, -0.4027099609375, -0.13671875, 0.1292724609375, 0.395263671875, 0.6612548828125, 0.92724609375, 1.1932373046875, 1.459228515625, 1.7252197265625, 1.9912109375, 2.2572021484375, 2.523193359375, 2.7891845703125, 3.05517578125, 3.3211669921875, 3.587158203125, 3.8531494140625, 4.119140625, 4.3851318359375, 4.651123046875, 4.9171142578125, 5.18310546875, 5.4490966796875, 5.715087890625, 5.9810791015625, 6.2470703125, 6.5130615234375, 6.779052734375, 7.0450439453125, 7.31103515625, 7.5770263671875, 7.843017578125, 8.1090087890625, 8.375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 13.0, 13.0, 23.0, 30.0, 39.0, 43.0, 58.0, 60.0, 87.0, 166.0, 195.0, 289.0, 352.0, 569.0, 837.0, 1284.0, 2085.0, 3559.0, 6792.0, 14435.0, 33993.0, 84221.0, 189962.0, 287151.0, 228669.0, 110864.0, 44533.0, 18687.0, 8351.0, 4236.0, 2384.0, 1485.0, 911.0, 622.0, 441.0, 310.0, 225.0, 142.0, 115.0, 77.0, 54.0, 58.0, 41.0, 28.0, 18.0, 13.0, 6.0, 13.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-10.3203125, -9.9942626953125, -9.668212890625, -9.3421630859375, -9.01611328125, -8.6900634765625, -8.364013671875, -8.0379638671875, -7.7119140625, -7.3858642578125, -7.059814453125, -6.7337646484375, -6.40771484375, -6.0816650390625, -5.755615234375, -5.4295654296875, -5.103515625, -4.7774658203125, -4.451416015625, -4.1253662109375, -3.79931640625, -3.4732666015625, -3.147216796875, -2.8211669921875, -2.4951171875, -2.1690673828125, -1.843017578125, -1.5169677734375, -1.19091796875, -0.8648681640625, -0.538818359375, -0.2127685546875, 0.11328125, 0.4393310546875, 0.765380859375, 1.0914306640625, 1.41748046875, 1.7435302734375, 2.069580078125, 2.3956298828125, 2.7216796875, 3.0477294921875, 3.373779296875, 3.6998291015625, 4.02587890625, 4.3519287109375, 4.677978515625, 5.0040283203125, 5.330078125, 5.6561279296875, 5.982177734375, 6.3082275390625, 6.63427734375, 6.9603271484375, 7.286376953125, 7.6124267578125, 7.9384765625, 8.2645263671875, 8.590576171875, 8.9166259765625, 9.24267578125, 9.5687255859375, 9.894775390625, 10.2208251953125, 10.546875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 7.0, 0.0, 5.0, 10.0, 6.0, 13.0, 13.0, 18.0, 32.0, 27.0, 28.0, 46.0, 53.0, 59.0, 81.0, 103.0, 70.0, 76.0, 55.0, 57.0, 50.0, 46.0, 26.0, 21.0, 25.0, 16.0, 9.0, 7.0, 3.0, 9.0, 7.0, 5.0, 3.0, 3.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0007796287536621094, -0.0007524192333221436, -0.0007252097129821777, -0.0006980001926422119, -0.0006707906723022461, -0.0006435811519622803, -0.0006163716316223145, -0.0005891621112823486, -0.0005619525909423828, -0.000534743070602417, -0.0005075335502624512, -0.00048032402992248535, -0.00045311450958251953, -0.0004259049892425537, -0.0003986954689025879, -0.00037148594856262207, -0.00034427642822265625, -0.00031706690788269043, -0.0002898573875427246, -0.0002626478672027588, -0.00023543834686279297, -0.00020822882652282715, -0.00018101930618286133, -0.0001538097858428955, -0.0001266002655029297, -9.939074516296387e-05, -7.218122482299805e-05, -4.4971704483032227e-05, -1.7762184143066406e-05, 9.447336196899414e-06, 3.6656856536865234e-05, 6.386637687683105e-05, 9.107589721679688e-05, 0.0001182854175567627, 0.00014549493789672852, 0.00017270445823669434, 0.00019991397857666016, 0.00022712349891662598, 0.0002543330192565918, 0.0002815425395965576, 0.00030875205993652344, 0.00033596158027648926, 0.0003631711006164551, 0.0003903806209564209, 0.0004175901412963867, 0.00044479966163635254, 0.00047200918197631836, 0.0004992187023162842, 0.00052642822265625, 0.0005536377429962158, 0.0005808472633361816, 0.0006080567836761475, 0.0006352663040161133, 0.0006624758243560791, 0.0006896853446960449, 0.0007168948650360107, 0.0007441043853759766, 0.0007713139057159424, 0.0007985234260559082, 0.000825732946395874, 0.0008529424667358398, 0.0008801519870758057, 0.0009073615074157715, 0.0009345710277557373, 0.0009617805480957031]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 10.0, 11.0, 23.0, 23.0, 38.0, 59.0, 91.0, 158.0, 192.0, 283.0, 429.0, 659.0, 1122.0, 1805.0, 3184.0, 5658.0, 11151.0, 22563.0, 45806.0, 89870.0, 153621.0, 206230.0, 200273.0, 141688.0, 80446.0, 40785.0, 19722.0, 10031.0, 5205.0, 2883.0, 1692.0, 997.0, 637.0, 414.0, 265.0, 166.0, 117.0, 81.0, 54.0, 42.0, 28.0, 12.0, 9.0, 9.0, 6.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2421875, -7.02215576171875, -6.8021240234375, -6.58209228515625, -6.362060546875, -6.14202880859375, -5.9219970703125, -5.70196533203125, -5.48193359375, -5.26190185546875, -5.0418701171875, -4.82183837890625, -4.601806640625, -4.38177490234375, -4.1617431640625, -3.94171142578125, -3.7216796875, -3.50164794921875, -3.2816162109375, -3.06158447265625, -2.841552734375, -2.62152099609375, -2.4014892578125, -2.18145751953125, -1.96142578125, -1.74139404296875, -1.5213623046875, -1.30133056640625, -1.081298828125, -0.86126708984375, -0.6412353515625, -0.42120361328125, -0.201171875, 0.01885986328125, 0.2388916015625, 0.45892333984375, 0.678955078125, 0.89898681640625, 1.1190185546875, 1.33905029296875, 1.55908203125, 1.77911376953125, 1.9991455078125, 2.21917724609375, 2.439208984375, 2.65924072265625, 2.8792724609375, 3.09930419921875, 3.3193359375, 3.53936767578125, 3.7593994140625, 3.97943115234375, 4.199462890625, 4.41949462890625, 4.6395263671875, 4.85955810546875, 5.07958984375, 5.29962158203125, 5.5196533203125, 5.73968505859375, 5.959716796875, 6.17974853515625, 6.3997802734375, 6.61981201171875, 6.83984375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 4.0, 0.0, 2.0, 3.0, 5.0, 9.0, 15.0, 14.0, 6.0, 5.0, 12.0, 16.0, 21.0, 22.0, 35.0, 27.0, 31.0, 41.0, 46.0, 35.0, 44.0, 47.0, 47.0, 59.0, 44.0, 42.0, 39.0, 46.0, 40.0, 30.0, 33.0, 28.0, 14.0, 14.0, 20.0, 19.0, 19.0, 11.0, 13.0, 9.0, 7.0, 7.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5537109375, -1.503753662109375, -1.45379638671875, -1.403839111328125, -1.3538818359375, -1.303924560546875, -1.25396728515625, -1.204010009765625, -1.154052734375, -1.104095458984375, -1.05413818359375, -1.004180908203125, -0.9542236328125, -0.904266357421875, -0.85430908203125, -0.804351806640625, -0.75439453125, -0.704437255859375, -0.65447998046875, -0.604522705078125, -0.5545654296875, -0.504608154296875, -0.45465087890625, -0.404693603515625, -0.354736328125, -0.304779052734375, -0.25482177734375, -0.204864501953125, -0.1549072265625, -0.104949951171875, -0.05499267578125, -0.005035400390625, 0.044921875, 0.094879150390625, 0.14483642578125, 0.194793701171875, 0.2447509765625, 0.294708251953125, 0.34466552734375, 0.394622802734375, 0.444580078125, 0.494537353515625, 0.54449462890625, 0.594451904296875, 0.6444091796875, 0.694366455078125, 0.74432373046875, 0.794281005859375, 0.84423828125, 0.894195556640625, 0.94415283203125, 0.994110107421875, 1.0440673828125, 1.094024658203125, 1.14398193359375, 1.193939208984375, 1.243896484375, 1.293853759765625, 1.34381103515625, 1.393768310546875, 1.4437255859375, 1.493682861328125, 1.54364013671875, 1.593597412109375, 1.6435546875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 5.0, 4.0, 5.0, 8.0, 8.0, 6.0, 10.0, 13.0, 8.0, 19.0, 15.0, 22.0, 20.0, 37.0, 30.0, 37.0, 41.0, 50.0, 50.0, 38.0, 43.0, 57.0, 46.0, 41.0, 53.0, 42.0, 30.0, 32.0, 27.0, 38.0, 31.0, 24.0, 26.0, 20.0, 18.0, 13.0, 8.0, 8.0, 7.0, 4.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.746591567993164, -11.363208770751953, -10.979825973510742, -10.596443176269531, -10.21306037902832, -9.829678535461426, -9.446295738220215, -9.062912940979004, -8.679530143737793, -8.296147346496582, -7.912764549255371, -7.529382228851318, -7.145999431610107, -6.7626166343688965, -6.379234313964844, -5.995851516723633, -5.612468719482422, -5.229085922241211, -4.845703125, -4.462320804595947, -4.078938007354736, -3.6955552101135254, -3.3121726512908936, -2.9287900924682617, -2.545407295227051, -2.16202449798584, -1.778641939163208, -1.3952592611312866, -1.0118765830993652, -0.6284939050674438, -0.24511122703552246, 0.13827133178710938, 0.5216541290283203, 0.9050368070602417, 1.288419485092163, 1.6718021631240845, 2.055184841156006, 2.438567638397217, 2.8219501972198486, 3.2053327560424805, 3.5887155532836914, 3.9720983505249023, 4.355481147766113, 4.738863468170166, 5.122246265411377, 5.505629062652588, 5.889011383056641, 6.272394180297852, 6.6557769775390625, 7.039159774780273, 7.422542572021484, 7.805924892425537, 8.189308166503906, 8.5726900100708, 8.956072807312012, 9.339455604553223, 9.722838401794434, 10.106221199035645, 10.489603996276855, 10.872986793518066, 11.256368637084961, 11.639751434326172, 12.023134231567383, 12.406517028808594, 12.789899826049805]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 4.0, 4.0, 4.0, 9.0, 4.0, 7.0, 6.0, 14.0, 7.0, 18.0, 16.0, 24.0, 20.0, 26.0, 24.0, 23.0, 31.0, 39.0, 35.0, 28.0, 44.0, 39.0, 29.0, 41.0, 36.0, 47.0, 34.0, 35.0, 46.0, 43.0, 27.0, 29.0, 27.0, 22.0, 27.0, 22.0, 10.0, 13.0, 19.0, 10.0, 11.0, 12.0, 9.0, 1.0, 4.0, 4.0, 5.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0], "bins": [-12.811087608337402, -12.423457145690918, -12.035826683044434, -11.64819622039795, -11.260565757751465, -10.87293529510498, -10.485305786132812, -10.097675323486328, -9.710044860839844, -9.32241439819336, -8.934783935546875, -8.54715347290039, -8.159523010253906, -7.771892547607422, -7.384262561798096, -6.996632099151611, -6.609001159667969, -6.221370697021484, -5.833740234375, -5.446109771728516, -5.058479309082031, -4.670848846435547, -4.283218860626221, -3.8955883979797363, -3.507957935333252, -3.1203274726867676, -2.732697010040283, -2.345066785812378, -1.9574363231658936, -1.5698058605194092, -1.182175636291504, -0.7945451736450195, -0.40691566467285156, -0.019285261631011963, 0.36834514141082764, 0.7559754848480225, 1.1436059474945068, 1.5312364101409912, 1.9188666343688965, 2.306497097015381, 2.6941275596618652, 3.0817580223083496, 3.469388484954834, 3.8570187091827393, 4.2446489334106445, 4.632279396057129, 5.019909858703613, 5.407540321350098, 5.795170783996582, 6.182801246643066, 6.570431709289551, 6.958062171936035, 7.3456926345825195, 7.733323097229004, 8.120952606201172, 8.508583068847656, 8.89621353149414, 9.283843994140625, 9.67147445678711, 10.059104919433594, 10.446735382080078, 10.834365844726562, 11.221996307373047, 11.609626770019531, 11.997257232666016]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [5.0, 2.0, 5.0, 2.0, 7.0, 5.0, 19.0, 15.0, 39.0, 59.0, 87.0, 111.0, 208.0, 303.0, 473.0, 730.0, 1138.0, 1736.0, 2776.0, 4328.0, 6820.0, 11157.0, 17680.0, 28842.0, 48235.0, 81401.0, 140457.0, 239505.0, 384767.0, 550945.0, 659126.0, 642301.0, 511662.0, 345460.0, 210472.0, 122775.0, 71249.0, 41940.0, 25460.0, 15640.0, 9670.0, 6058.0, 3800.0, 2422.0, 1540.0, 1077.0, 625.0, 432.0, 271.0, 152.0, 111.0, 70.0, 37.0, 31.0, 28.0, 13.0, 8.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-8.5625, -8.28515625, -8.0078125, -7.73046875, -7.453125, -7.17578125, -6.8984375, -6.62109375, -6.34375, -6.06640625, -5.7890625, -5.51171875, -5.234375, -4.95703125, -4.6796875, -4.40234375, -4.125, -3.84765625, -3.5703125, -3.29296875, -3.015625, -2.73828125, -2.4609375, -2.18359375, -1.90625, -1.62890625, -1.3515625, -1.07421875, -0.796875, -0.51953125, -0.2421875, 0.03515625, 0.3125, 0.58984375, 0.8671875, 1.14453125, 1.421875, 1.69921875, 1.9765625, 2.25390625, 2.53125, 2.80859375, 3.0859375, 3.36328125, 3.640625, 3.91796875, 4.1953125, 4.47265625, 4.75, 5.02734375, 5.3046875, 5.58203125, 5.859375, 6.13671875, 6.4140625, 6.69140625, 6.96875, 7.24609375, 7.5234375, 7.80078125, 8.078125, 8.35546875, 8.6328125, 8.91015625, 9.1875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 10.0, 6.0, 6.0, 12.0, 12.0, 14.0, 16.0, 24.0, 23.0, 21.0, 25.0, 22.0, 30.0, 35.0, 38.0, 38.0, 40.0, 32.0, 39.0, 44.0, 41.0, 39.0, 49.0, 40.0, 35.0, 33.0, 29.0, 38.0, 31.0, 23.0, 27.0, 17.0, 13.0, 11.0, 16.0, 15.0, 8.0, 8.0, 11.0, 4.0, 3.0, 10.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-11.296875, -10.954345703125, -10.61181640625, -10.269287109375, -9.9267578125, -9.584228515625, -9.24169921875, -8.899169921875, -8.556640625, -8.214111328125, -7.87158203125, -7.529052734375, -7.1865234375, -6.843994140625, -6.50146484375, -6.158935546875, -5.81640625, -5.473876953125, -5.13134765625, -4.788818359375, -4.4462890625, -4.103759765625, -3.76123046875, -3.418701171875, -3.076171875, -2.733642578125, -2.39111328125, -2.048583984375, -1.7060546875, -1.363525390625, -1.02099609375, -0.678466796875, -0.3359375, 0.006591796875, 0.34912109375, 0.691650390625, 1.0341796875, 1.376708984375, 1.71923828125, 2.061767578125, 2.404296875, 2.746826171875, 3.08935546875, 3.431884765625, 3.7744140625, 4.116943359375, 4.45947265625, 4.802001953125, 5.14453125, 5.487060546875, 5.82958984375, 6.172119140625, 6.5146484375, 6.857177734375, 7.19970703125, 7.542236328125, 7.884765625, 8.227294921875, 8.56982421875, 8.912353515625, 9.2548828125, 9.597412109375, 9.93994140625, 10.282470703125, 10.625]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 1.0, 8.0, 7.0, 14.0, 23.0, 38.0, 59.0, 89.0, 145.0, 224.0, 347.0, 583.0, 857.0, 1479.0, 2576.0, 4255.0, 7161.0, 12094.0, 21733.0, 36778.0, 64410.0, 110851.0, 190757.0, 314517.0, 485665.0, 652635.0, 698561.0, 581800.0, 401931.0, 250982.0, 149202.0, 86146.0, 50151.0, 28180.0, 16645.0, 9598.0, 5374.0, 3359.0, 1950.0, 1214.0, 701.0, 431.0, 276.0, 168.0, 118.0, 72.0, 41.0, 39.0, 14.0, 15.0, 5.0, 2.0, 8.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-11.3203125, -10.969482421875, -10.61865234375, -10.267822265625, -9.9169921875, -9.566162109375, -9.21533203125, -8.864501953125, -8.513671875, -8.162841796875, -7.81201171875, -7.461181640625, -7.1103515625, -6.759521484375, -6.40869140625, -6.057861328125, -5.70703125, -5.356201171875, -5.00537109375, -4.654541015625, -4.3037109375, -3.952880859375, -3.60205078125, -3.251220703125, -2.900390625, -2.549560546875, -2.19873046875, -1.847900390625, -1.4970703125, -1.146240234375, -0.79541015625, -0.444580078125, -0.09375, 0.257080078125, 0.60791015625, 0.958740234375, 1.3095703125, 1.660400390625, 2.01123046875, 2.362060546875, 2.712890625, 3.063720703125, 3.41455078125, 3.765380859375, 4.1162109375, 4.467041015625, 4.81787109375, 5.168701171875, 5.51953125, 5.870361328125, 6.22119140625, 6.572021484375, 6.9228515625, 7.273681640625, 7.62451171875, 7.975341796875, 8.326171875, 8.677001953125, 9.02783203125, 9.378662109375, 9.7294921875, 10.080322265625, 10.43115234375, 10.781982421875, 11.1328125]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 7.0, 9.0, 11.0, 8.0, 17.0, 24.0, 19.0, 27.0, 33.0, 59.0, 64.0, 71.0, 99.0, 110.0, 149.0, 162.0, 163.0, 196.0, 213.0, 206.0, 245.0, 232.0, 237.0, 217.0, 212.0, 185.0, 173.0, 176.0, 121.0, 134.0, 104.0, 82.0, 70.0, 48.0, 47.0, 31.0, 27.0, 22.0, 15.0, 10.0, 16.0, 7.0, 6.0, 3.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.19921875, -4.0537109375, -3.908203125, -3.7626953125, -3.6171875, -3.4716796875, -3.326171875, -3.1806640625, -3.03515625, -2.8896484375, -2.744140625, -2.5986328125, -2.453125, -2.3076171875, -2.162109375, -2.0166015625, -1.87109375, -1.7255859375, -1.580078125, -1.4345703125, -1.2890625, -1.1435546875, -0.998046875, -0.8525390625, -0.70703125, -0.5615234375, -0.416015625, -0.2705078125, -0.125, 0.0205078125, 0.166015625, 0.3115234375, 0.45703125, 0.6025390625, 0.748046875, 0.8935546875, 1.0390625, 1.1845703125, 1.330078125, 1.4755859375, 1.62109375, 1.7666015625, 1.912109375, 2.0576171875, 2.203125, 2.3486328125, 2.494140625, 2.6396484375, 2.78515625, 2.9306640625, 3.076171875, 3.2216796875, 3.3671875, 3.5126953125, 3.658203125, 3.8037109375, 3.94921875, 4.0947265625, 4.240234375, 4.3857421875, 4.53125, 4.6767578125, 4.822265625, 4.9677734375, 5.11328125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 4.0, 3.0, 6.0, 6.0, 11.0, 5.0, 12.0, 7.0, 8.0, 14.0, 14.0, 12.0, 23.0, 23.0, 27.0, 32.0, 30.0, 34.0, 52.0, 39.0, 42.0, 39.0, 46.0, 48.0, 37.0, 51.0, 39.0, 45.0, 31.0, 27.0, 37.0, 40.0, 32.0, 19.0, 12.0, 15.0, 13.0, 8.0, 14.0, 17.0, 4.0, 4.0, 6.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0], "bins": [-12.323286056518555, -11.973710060119629, -11.624134063720703, -11.274559020996094, -10.924983024597168, -10.575407028198242, -10.225831031799316, -9.87625503540039, -9.526679039001465, -9.177103042602539, -8.827527046203613, -8.477951049804688, -8.128376007080078, -7.778800010681152, -7.429224014282227, -7.079648017883301, -6.730072498321533, -6.380496501922607, -6.03092098236084, -5.681344985961914, -5.331768989562988, -4.9821929931640625, -4.632617473602295, -4.283041477203369, -3.9334657192230225, -3.583889961242676, -3.23431396484375, -2.8847382068634033, -2.5351624488830566, -2.185586452484131, -1.8360106945037842, -1.4864346981048584, -1.1368589401245117, -0.7872830629348755, -0.43770724534988403, -0.08813142776489258, 0.26144444942474365, 0.6110203266143799, 0.9605960845947266, 1.3101720809936523, 1.659747838973999, 2.0093235969543457, 2.3588995933532715, 2.708475351333618, 3.058051109313965, 3.4076271057128906, 3.7572028636932373, 4.106779098510742, 4.45635461807251, 4.8059306144714355, 5.155506134033203, 5.505082130432129, 5.854658126831055, 6.2042341232299805, 6.553809642791748, 6.903385639190674, 7.252961158752441, 7.602537155151367, 7.952112674713135, 8.301689147949219, 8.651264190673828, 9.000840187072754, 9.35041618347168, 9.699992179870605, 10.049568176269531]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 4.0, 4.0, 4.0, 7.0, 6.0, 9.0, 12.0, 15.0, 17.0, 10.0, 16.0, 28.0, 33.0, 21.0, 38.0, 33.0, 39.0, 30.0, 40.0, 42.0, 35.0, 32.0, 45.0, 41.0, 37.0, 34.0, 47.0, 40.0, 33.0, 28.0, 25.0, 30.0, 19.0, 23.0, 14.0, 17.0, 19.0, 12.0, 12.0, 9.0, 10.0, 12.0, 5.0, 5.0, 2.0, 0.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.490553855895996, -11.114930152893066, -10.739306449890137, -10.363682746887207, -9.988059043884277, -9.612435340881348, -9.236811637878418, -8.861187934875488, -8.485564231872559, -8.109940528869629, -7.734316825866699, -7.3586931228637695, -6.98306941986084, -6.60744571685791, -6.2318220138549805, -5.856198310852051, -5.480574607849121, -5.104950904846191, -4.729327201843262, -4.353703498840332, -3.9780797958374023, -3.6024560928344727, -3.226832389831543, -2.8512086868286133, -2.4755849838256836, -2.099961280822754, -1.7243375778198242, -1.3487138748168945, -0.9730901718139648, -0.5974664688110352, -0.22184276580810547, 0.15378093719482422, 0.5294036865234375, 0.9050273895263672, 1.2806510925292969, 1.6562747955322266, 2.0318984985351562, 2.407522201538086, 2.7831459045410156, 3.1587696075439453, 3.534393310546875, 3.9100170135498047, 4.285640716552734, 4.661264419555664, 5.036888122558594, 5.412511825561523, 5.788135528564453, 6.163759231567383, 6.5393829345703125, 6.915006637573242, 7.290630340576172, 7.666254043579102, 8.041877746582031, 8.417501449584961, 8.79312515258789, 9.16874885559082, 9.54437255859375, 9.91999626159668, 10.29561996459961, 10.671243667602539, 11.046867370605469, 11.422491073608398, 11.798114776611328, 12.173738479614258, 12.549362182617188]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 6.0, 7.0, 12.0, 11.0, 20.0, 26.0, 37.0, 54.0, 68.0, 104.0, 147.0, 232.0, 274.0, 367.0, 593.0, 826.0, 1143.0, 1763.0, 2565.0, 3853.0, 5729.0, 8589.0, 13126.0, 21309.0, 35879.0, 64820.0, 120472.0, 194813.0, 216769.0, 151693.0, 84292.0, 45684.0, 26377.0, 16118.0, 10131.0, 6640.0, 4386.0, 3046.0, 1981.0, 1354.0, 949.0, 691.0, 426.0, 351.0, 231.0, 166.0, 138.0, 80.0, 52.0, 50.0, 36.0, 30.0, 13.0, 10.0, 10.0, 6.0, 4.0, 3.0, 4.0, 3.0], "bins": [-18.109375, -17.547119140625, -16.98486328125, -16.422607421875, -15.8603515625, -15.298095703125, -14.73583984375, -14.173583984375, -13.611328125, -13.049072265625, -12.48681640625, -11.924560546875, -11.3623046875, -10.800048828125, -10.23779296875, -9.675537109375, -9.11328125, -8.551025390625, -7.98876953125, -7.426513671875, -6.8642578125, -6.302001953125, -5.73974609375, -5.177490234375, -4.615234375, -4.052978515625, -3.49072265625, -2.928466796875, -2.3662109375, -1.803955078125, -1.24169921875, -0.679443359375, -0.1171875, 0.445068359375, 1.00732421875, 1.569580078125, 2.1318359375, 2.694091796875, 3.25634765625, 3.818603515625, 4.380859375, 4.943115234375, 5.50537109375, 6.067626953125, 6.6298828125, 7.192138671875, 7.75439453125, 8.316650390625, 8.87890625, 9.441162109375, 10.00341796875, 10.565673828125, 11.1279296875, 11.690185546875, 12.25244140625, 12.814697265625, 13.376953125, 13.939208984375, 14.50146484375, 15.063720703125, 15.6259765625, 16.188232421875, 16.75048828125, 17.312744140625, 17.875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 5.0, 10.0, 13.0, 11.0, 9.0, 10.0, 12.0, 10.0, 19.0, 21.0, 33.0, 26.0, 34.0, 42.0, 34.0, 35.0, 39.0, 40.0, 36.0, 37.0, 44.0, 39.0, 37.0, 53.0, 43.0, 44.0, 25.0, 36.0, 16.0, 24.0, 24.0, 15.0, 17.0, 19.0, 19.0, 15.0, 9.0, 10.0, 8.0, 7.0, 5.0, 4.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.390625, -12.0181884765625, -11.645751953125, -11.2733154296875, -10.90087890625, -10.5284423828125, -10.156005859375, -9.7835693359375, -9.4111328125, -9.0386962890625, -8.666259765625, -8.2938232421875, -7.92138671875, -7.5489501953125, -7.176513671875, -6.8040771484375, -6.431640625, -6.0592041015625, -5.686767578125, -5.3143310546875, -4.94189453125, -4.5694580078125, -4.197021484375, -3.8245849609375, -3.4521484375, -3.0797119140625, -2.707275390625, -2.3348388671875, -1.96240234375, -1.5899658203125, -1.217529296875, -0.8450927734375, -0.47265625, -0.1002197265625, 0.272216796875, 0.6446533203125, 1.01708984375, 1.3895263671875, 1.761962890625, 2.1343994140625, 2.5068359375, 2.8792724609375, 3.251708984375, 3.6241455078125, 3.99658203125, 4.3690185546875, 4.741455078125, 5.1138916015625, 5.486328125, 5.8587646484375, 6.231201171875, 6.6036376953125, 6.97607421875, 7.3485107421875, 7.720947265625, 8.0933837890625, 8.4658203125, 8.8382568359375, 9.210693359375, 9.5831298828125, 9.95556640625, 10.3280029296875, 10.700439453125, 11.0728759765625, 11.4453125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [6.0, 3.0, 1.0, 3.0, 4.0, 6.0, 5.0, 14.0, 17.0, 19.0, 38.0, 46.0, 91.0, 147.0, 235.0, 348.0, 549.0, 830.0, 1265.0, 1803.0, 2704.0, 4203.0, 6644.0, 10390.0, 16800.0, 27508.0, 48559.0, 93090.0, 179249.0, 251383.0, 183098.0, 94692.0, 50011.0, 28304.0, 16886.0, 10556.0, 6574.0, 4189.0, 2850.0, 1773.0, 1274.0, 801.0, 564.0, 325.0, 231.0, 167.0, 121.0, 73.0, 33.0, 35.0, 12.0, 19.0, 6.0, 4.0, 8.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.203125, -18.552490234375, -17.90185546875, -17.251220703125, -16.6005859375, -15.949951171875, -15.29931640625, -14.648681640625, -13.998046875, -13.347412109375, -12.69677734375, -12.046142578125, -11.3955078125, -10.744873046875, -10.09423828125, -9.443603515625, -8.79296875, -8.142333984375, -7.49169921875, -6.841064453125, -6.1904296875, -5.539794921875, -4.88916015625, -4.238525390625, -3.587890625, -2.937255859375, -2.28662109375, -1.635986328125, -0.9853515625, -0.334716796875, 0.31591796875, 0.966552734375, 1.6171875, 2.267822265625, 2.91845703125, 3.569091796875, 4.2197265625, 4.870361328125, 5.52099609375, 6.171630859375, 6.822265625, 7.472900390625, 8.12353515625, 8.774169921875, 9.4248046875, 10.075439453125, 10.72607421875, 11.376708984375, 12.02734375, 12.677978515625, 13.32861328125, 13.979248046875, 14.6298828125, 15.280517578125, 15.93115234375, 16.581787109375, 17.232421875, 17.883056640625, 18.53369140625, 19.184326171875, 19.8349609375, 20.485595703125, 21.13623046875, 21.786865234375, 22.4375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 3.0, 5.0, 5.0, 3.0, 15.0, 15.0, 12.0, 14.0, 19.0, 13.0, 22.0, 28.0, 28.0, 22.0, 31.0, 39.0, 42.0, 34.0, 50.0, 38.0, 48.0, 38.0, 41.0, 53.0, 46.0, 42.0, 34.0, 40.0, 36.0, 26.0, 28.0, 22.0, 21.0, 12.0, 13.0, 12.0, 16.0, 15.0, 9.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-9.265625, -8.99603271484375, -8.7264404296875, -8.45684814453125, -8.187255859375, -7.91766357421875, -7.6480712890625, -7.37847900390625, -7.10888671875, -6.83929443359375, -6.5697021484375, -6.30010986328125, -6.030517578125, -5.76092529296875, -5.4913330078125, -5.22174072265625, -4.9521484375, -4.68255615234375, -4.4129638671875, -4.14337158203125, -3.873779296875, -3.60418701171875, -3.3345947265625, -3.06500244140625, -2.79541015625, -2.52581787109375, -2.2562255859375, -1.98663330078125, -1.717041015625, -1.44744873046875, -1.1778564453125, -0.90826416015625, -0.638671875, -0.36907958984375, -0.0994873046875, 0.17010498046875, 0.439697265625, 0.70928955078125, 0.9788818359375, 1.24847412109375, 1.51806640625, 1.78765869140625, 2.0572509765625, 2.32684326171875, 2.596435546875, 2.86602783203125, 3.1356201171875, 3.40521240234375, 3.6748046875, 3.94439697265625, 4.2139892578125, 4.48358154296875, 4.753173828125, 5.02276611328125, 5.2923583984375, 5.56195068359375, 5.83154296875, 6.10113525390625, 6.3707275390625, 6.64031982421875, 6.909912109375, 7.17950439453125, 7.4490966796875, 7.71868896484375, 7.98828125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 7.0, 6.0, 11.0, 25.0, 29.0, 42.0, 58.0, 127.0, 191.0, 312.0, 427.0, 729.0, 1151.0, 1999.0, 3343.0, 5638.0, 10154.0, 18546.0, 35063.0, 68659.0, 135015.0, 228783.0, 236478.0, 144867.0, 73560.0, 37391.0, 19908.0, 10945.0, 6120.0, 3485.0, 2066.0, 1278.0, 835.0, 468.0, 289.0, 187.0, 134.0, 80.0, 58.0, 34.0, 27.0, 15.0, 6.0, 6.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-8.546875, -8.30303955078125, -8.0592041015625, -7.81536865234375, -7.571533203125, -7.32769775390625, -7.0838623046875, -6.84002685546875, -6.59619140625, -6.35235595703125, -6.1085205078125, -5.86468505859375, -5.620849609375, -5.37701416015625, -5.1331787109375, -4.88934326171875, -4.6455078125, -4.40167236328125, -4.1578369140625, -3.91400146484375, -3.670166015625, -3.42633056640625, -3.1824951171875, -2.93865966796875, -2.69482421875, -2.45098876953125, -2.2071533203125, -1.96331787109375, -1.719482421875, -1.47564697265625, -1.2318115234375, -0.98797607421875, -0.744140625, -0.50030517578125, -0.2564697265625, -0.01263427734375, 0.231201171875, 0.47503662109375, 0.7188720703125, 0.96270751953125, 1.20654296875, 1.45037841796875, 1.6942138671875, 1.93804931640625, 2.181884765625, 2.42572021484375, 2.6695556640625, 2.91339111328125, 3.1572265625, 3.40106201171875, 3.6448974609375, 3.88873291015625, 4.132568359375, 4.37640380859375, 4.6202392578125, 4.86407470703125, 5.10791015625, 5.35174560546875, 5.5955810546875, 5.83941650390625, 6.083251953125, 6.32708740234375, 6.5709228515625, 6.81475830078125, 7.05859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 5.0, 9.0, 11.0, 11.0, 9.0, 10.0, 12.0, 22.0, 31.0, 50.0, 66.0, 83.0, 121.0, 100.0, 114.0, 77.0, 56.0, 58.0, 31.0, 33.0, 25.0, 8.0, 15.0, 7.0, 3.0, 5.0, 7.0, 6.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008149147033691406, -0.0007890611886978149, -0.0007632076740264893, -0.0007373541593551636, -0.0007115006446838379, -0.0006856471300125122, -0.0006597936153411865, -0.0006339401006698608, -0.0006080865859985352, -0.0005822330713272095, -0.0005563795566558838, -0.0005305260419845581, -0.0005046725273132324, -0.00047881901264190674, -0.00045296549797058105, -0.00042711198329925537, -0.0004012584686279297, -0.000375404953956604, -0.0003495514392852783, -0.00032369792461395264, -0.00029784440994262695, -0.00027199089527130127, -0.0002461373805999756, -0.0002202838659286499, -0.00019443035125732422, -0.00016857683658599854, -0.00014272332191467285, -0.00011686980724334717, -9.101629257202148e-05, -6.51627779006958e-05, -3.930926322937012e-05, -1.3455748558044434e-05, 1.239776611328125e-05, 3.8251280784606934e-05, 6.410479545593262e-05, 8.99583101272583e-05, 0.00011581182479858398, 0.00014166533946990967, 0.00016751885414123535, 0.00019337236881256104, 0.00021922588348388672, 0.0002450793981552124, 0.0002709329128265381, 0.00029678642749786377, 0.00032263994216918945, 0.00034849345684051514, 0.0003743469715118408, 0.0004002004861831665, 0.0004260540008544922, 0.00045190751552581787, 0.00047776103019714355, 0.0005036145448684692, 0.0005294680595397949, 0.0005553215742111206, 0.0005811750888824463, 0.000607028603553772, 0.0006328821182250977, 0.0006587356328964233, 0.000684589147567749, 0.0007104426622390747, 0.0007362961769104004, 0.0007621496915817261, 0.0007880032062530518, 0.0008138567209243774, 0.0008397102355957031]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 5.0, 15.0, 23.0, 32.0, 47.0, 54.0, 102.0, 144.0, 260.0, 366.0, 508.0, 857.0, 1219.0, 1867.0, 2912.0, 4706.0, 7399.0, 11533.0, 18055.0, 27949.0, 42981.0, 64342.0, 91109.0, 117361.0, 135753.0, 134734.0, 116039.0, 88830.0, 62726.0, 41574.0, 26904.0, 17407.0, 10988.0, 7036.0, 4471.0, 2939.0, 1818.0, 1237.0, 769.0, 492.0, 328.0, 233.0, 140.0, 94.0, 69.0, 40.0, 31.0, 16.0, 17.0, 7.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0], "bins": [-4.671875, -4.52569580078125, -4.3795166015625, -4.23333740234375, -4.087158203125, -3.94097900390625, -3.7947998046875, -3.64862060546875, -3.50244140625, -3.35626220703125, -3.2100830078125, -3.06390380859375, -2.917724609375, -2.77154541015625, -2.6253662109375, -2.47918701171875, -2.3330078125, -2.18682861328125, -2.0406494140625, -1.89447021484375, -1.748291015625, -1.60211181640625, -1.4559326171875, -1.30975341796875, -1.16357421875, -1.01739501953125, -0.8712158203125, -0.72503662109375, -0.578857421875, -0.43267822265625, -0.2864990234375, -0.14031982421875, 0.005859375, 0.15203857421875, 0.2982177734375, 0.44439697265625, 0.590576171875, 0.73675537109375, 0.8829345703125, 1.02911376953125, 1.17529296875, 1.32147216796875, 1.4676513671875, 1.61383056640625, 1.760009765625, 1.90618896484375, 2.0523681640625, 2.19854736328125, 2.3447265625, 2.49090576171875, 2.6370849609375, 2.78326416015625, 2.929443359375, 3.07562255859375, 3.2218017578125, 3.36798095703125, 3.51416015625, 3.66033935546875, 3.8065185546875, 3.95269775390625, 4.098876953125, 4.24505615234375, 4.3912353515625, 4.53741455078125, 4.68359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 5.0, 8.0, 5.0, 10.0, 17.0, 18.0, 23.0, 17.0, 17.0, 25.0, 38.0, 42.0, 36.0, 53.0, 46.0, 61.0, 52.0, 59.0, 59.0, 58.0, 55.0, 52.0, 42.0, 44.0, 28.0, 23.0, 23.0, 24.0, 13.0, 16.0, 4.0, 8.0, 8.0, 4.0, 6.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.330078125, -2.26031494140625, -2.1905517578125, -2.12078857421875, -2.051025390625, -1.98126220703125, -1.9114990234375, -1.84173583984375, -1.77197265625, -1.70220947265625, -1.6324462890625, -1.56268310546875, -1.492919921875, -1.42315673828125, -1.3533935546875, -1.28363037109375, -1.2138671875, -1.14410400390625, -1.0743408203125, -1.00457763671875, -0.934814453125, -0.86505126953125, -0.7952880859375, -0.72552490234375, -0.65576171875, -0.58599853515625, -0.5162353515625, -0.44647216796875, -0.376708984375, -0.30694580078125, -0.2371826171875, -0.16741943359375, -0.09765625, -0.02789306640625, 0.0418701171875, 0.11163330078125, 0.181396484375, 0.25115966796875, 0.3209228515625, 0.39068603515625, 0.46044921875, 0.53021240234375, 0.5999755859375, 0.66973876953125, 0.739501953125, 0.80926513671875, 0.8790283203125, 0.94879150390625, 1.0185546875, 1.08831787109375, 1.1580810546875, 1.22784423828125, 1.297607421875, 1.36737060546875, 1.4371337890625, 1.50689697265625, 1.57666015625, 1.64642333984375, 1.7161865234375, 1.78594970703125, 1.855712890625, 1.92547607421875, 1.9952392578125, 2.06500244140625, 2.134765625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 2.0, 5.0, 7.0, 6.0, 11.0, 11.0, 15.0, 13.0, 11.0, 14.0, 10.0, 17.0, 28.0, 24.0, 30.0, 39.0, 39.0, 33.0, 35.0, 35.0, 33.0, 36.0, 35.0, 45.0, 50.0, 40.0, 34.0, 34.0, 28.0, 37.0, 32.0, 25.0, 25.0, 27.0, 17.0, 16.0, 15.0, 17.0, 14.0, 6.0, 8.0, 6.0, 8.0, 3.0, 7.0, 4.0, 5.0, 1.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0], "bins": [-9.889148712158203, -9.5872220993042, -9.285295486450195, -8.983369827270508, -8.681443214416504, -8.3795166015625, -8.077590942382812, -7.775664329528809, -7.473737716674805, -7.171811103820801, -6.869884967803955, -6.567958831787109, -6.2660322189331055, -5.964105606079102, -5.662179470062256, -5.36025333404541, -5.058326721191406, -4.756400108337402, -4.454473972320557, -4.152547836303711, -3.850621223449707, -3.5486948490142822, -3.2467684745788574, -2.9448421001434326, -2.642915725708008, -2.340989351272583, -2.039062976837158, -1.7371366024017334, -1.4352102279663086, -1.1332838535308838, -0.831357479095459, -0.5294311046600342, -0.22750568389892578, 0.07442069053649902, 0.37634706497192383, 0.6782734394073486, 0.9801998138427734, 1.2821261882781982, 1.584052562713623, 1.8859789371490479, 2.1879053115844727, 2.4898316860198975, 2.7917580604553223, 3.093684434890747, 3.395610809326172, 3.6975371837615967, 3.9994635581970215, 4.301389694213867, 4.603316307067871, 4.905242919921875, 5.207169055938721, 5.509095191955566, 5.81102180480957, 6.112948417663574, 6.41487455368042, 6.716800689697266, 7.0187273025512695, 7.320653915405273, 7.622580051422119, 7.924506187438965, 8.226432800292969, 8.528359413146973, 8.830286026000977, 9.132211685180664, 9.434138298034668]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 0.0, 7.0, 3.0, 5.0, 6.0, 9.0, 6.0, 9.0, 18.0, 12.0, 12.0, 23.0, 24.0, 27.0, 30.0, 29.0, 27.0, 36.0, 33.0, 44.0, 39.0, 36.0, 47.0, 26.0, 35.0, 47.0, 45.0, 38.0, 38.0, 35.0, 27.0, 25.0, 28.0, 19.0, 18.0, 24.0, 23.0, 15.0, 13.0, 9.0, 14.0, 9.0, 11.0, 6.0, 3.0, 4.0, 2.0, 2.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.72310733795166, -10.374978065490723, -10.026848793029785, -9.678719520568848, -9.33059024810791, -8.982460975646973, -8.634331703186035, -8.286202430725098, -7.93807315826416, -7.589943885803223, -7.241814613342285, -6.893685340881348, -6.54555606842041, -6.197426795959473, -5.849297523498535, -5.501168251037598, -5.15303897857666, -4.804909706115723, -4.456780433654785, -4.108651161193848, -3.76052188873291, -3.4123926162719727, -3.064263343811035, -2.7161340713500977, -2.36800479888916, -2.0198755264282227, -1.6717462539672852, -1.3236169815063477, -0.9754877090454102, -0.6273584365844727, -0.27922916412353516, 0.06890010833740234, 0.41702842712402344, 0.7651576995849609, 1.1132869720458984, 1.461416244506836, 1.8095455169677734, 2.157674789428711, 2.5058040618896484, 2.853933334350586, 3.2020626068115234, 3.550191879272461, 3.8983211517333984, 4.246450424194336, 4.594579696655273, 4.942708969116211, 5.290838241577148, 5.638967514038086, 5.987096786499023, 6.335226058959961, 6.683355331420898, 7.031484603881836, 7.379613876342773, 7.727743148803711, 8.075872421264648, 8.424001693725586, 8.772130966186523, 9.120260238647461, 9.468389511108398, 9.816518783569336, 10.164648056030273, 10.512777328491211, 10.860906600952148, 11.209035873413086, 11.557165145874023]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 10.0, 11.0, 25.0, 25.0, 70.0, 82.0, 139.0, 246.0, 430.0, 729.0, 1156.0, 1976.0, 3402.0, 5764.0, 9977.0, 16939.0, 28143.0, 44760.0, 69548.0, 98724.0, 127424.0, 143008.0, 138539.0, 116841.0, 87128.0, 59374.0, 37864.0, 23004.0, 13838.0, 7948.0, 4664.0, 2722.0, 1630.0, 987.0, 517.0, 368.0, 207.0, 132.0, 90.0, 50.0, 20.0, 21.0, 13.0, 4.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3046875, -9.980712890625, -9.65673828125, -9.332763671875, -9.0087890625, -8.684814453125, -8.36083984375, -8.036865234375, -7.712890625, -7.388916015625, -7.06494140625, -6.740966796875, -6.4169921875, -6.093017578125, -5.76904296875, -5.445068359375, -5.12109375, -4.797119140625, -4.47314453125, -4.149169921875, -3.8251953125, -3.501220703125, -3.17724609375, -2.853271484375, -2.529296875, -2.205322265625, -1.88134765625, -1.557373046875, -1.2333984375, -0.909423828125, -0.58544921875, -0.261474609375, 0.0625, 0.386474609375, 0.71044921875, 1.034423828125, 1.3583984375, 1.682373046875, 2.00634765625, 2.330322265625, 2.654296875, 2.978271484375, 3.30224609375, 3.626220703125, 3.9501953125, 4.274169921875, 4.59814453125, 4.922119140625, 5.24609375, 5.570068359375, 5.89404296875, 6.218017578125, 6.5419921875, 6.865966796875, 7.18994140625, 7.513916015625, 7.837890625, 8.161865234375, 8.48583984375, 8.809814453125, 9.1337890625, 9.457763671875, 9.78173828125, 10.105712890625, 10.4296875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 9.0, 5.0, 4.0, 4.0, 7.0, 9.0, 12.0, 12.0, 18.0, 13.0, 26.0, 21.0, 31.0, 32.0, 26.0, 26.0, 32.0, 44.0, 42.0, 55.0, 37.0, 40.0, 32.0, 42.0, 40.0, 55.0, 37.0, 38.0, 33.0, 26.0, 24.0, 22.0, 12.0, 27.0, 16.0, 12.0, 16.0, 18.0, 8.0, 10.0, 6.0, 7.0, 7.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.125, -9.767333984375, -9.40966796875, -9.052001953125, -8.6943359375, -8.336669921875, -7.97900390625, -7.621337890625, -7.263671875, -6.906005859375, -6.54833984375, -6.190673828125, -5.8330078125, -5.475341796875, -5.11767578125, -4.760009765625, -4.40234375, -4.044677734375, -3.68701171875, -3.329345703125, -2.9716796875, -2.614013671875, -2.25634765625, -1.898681640625, -1.541015625, -1.183349609375, -0.82568359375, -0.468017578125, -0.1103515625, 0.247314453125, 0.60498046875, 0.962646484375, 1.3203125, 1.677978515625, 2.03564453125, 2.393310546875, 2.7509765625, 3.108642578125, 3.46630859375, 3.823974609375, 4.181640625, 4.539306640625, 4.89697265625, 5.254638671875, 5.6123046875, 5.969970703125, 6.32763671875, 6.685302734375, 7.04296875, 7.400634765625, 7.75830078125, 8.115966796875, 8.4736328125, 8.831298828125, 9.18896484375, 9.546630859375, 9.904296875, 10.261962890625, 10.61962890625, 10.977294921875, 11.3349609375, 11.692626953125, 12.05029296875, 12.407958984375, 12.765625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 1.0, 4.0, 5.0, 5.0, 5.0, 5.0, 10.0, 20.0, 29.0, 33.0, 81.0, 119.0, 187.0, 322.0, 514.0, 906.0, 1424.0, 2667.0, 4744.0, 8845.0, 15747.0, 28386.0, 49181.0, 81465.0, 119992.0, 154818.0, 164649.0, 144596.0, 106749.0, 69155.0, 41041.0, 23348.0, 12893.0, 7243.0, 4030.0, 2308.0, 1227.0, 726.0, 389.0, 260.0, 150.0, 90.0, 72.0, 41.0, 23.0, 16.0, 13.0, 12.0, 7.0, 3.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.8828125, -13.46630859375, -13.0498046875, -12.63330078125, -12.216796875, -11.80029296875, -11.3837890625, -10.96728515625, -10.55078125, -10.13427734375, -9.7177734375, -9.30126953125, -8.884765625, -8.46826171875, -8.0517578125, -7.63525390625, -7.21875, -6.80224609375, -6.3857421875, -5.96923828125, -5.552734375, -5.13623046875, -4.7197265625, -4.30322265625, -3.88671875, -3.47021484375, -3.0537109375, -2.63720703125, -2.220703125, -1.80419921875, -1.3876953125, -0.97119140625, -0.5546875, -0.13818359375, 0.2783203125, 0.69482421875, 1.111328125, 1.52783203125, 1.9443359375, 2.36083984375, 2.77734375, 3.19384765625, 3.6103515625, 4.02685546875, 4.443359375, 4.85986328125, 5.2763671875, 5.69287109375, 6.109375, 6.52587890625, 6.9423828125, 7.35888671875, 7.775390625, 8.19189453125, 8.6083984375, 9.02490234375, 9.44140625, 9.85791015625, 10.2744140625, 10.69091796875, 11.107421875, 11.52392578125, 11.9404296875, 12.35693359375, 12.7734375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 6.0, 3.0, 5.0, 9.0, 8.0, 7.0, 15.0, 16.0, 10.0, 17.0, 10.0, 27.0, 26.0, 25.0, 33.0, 31.0, 34.0, 31.0, 35.0, 52.0, 43.0, 40.0, 45.0, 47.0, 37.0, 38.0, 32.0, 36.0, 38.0, 39.0, 29.0, 27.0, 22.0, 25.0, 18.0, 11.0, 18.0, 10.0, 17.0, 7.0, 4.0, 11.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.0078125, -6.77557373046875, -6.5433349609375, -6.31109619140625, -6.078857421875, -5.84661865234375, -5.6143798828125, -5.38214111328125, -5.14990234375, -4.91766357421875, -4.6854248046875, -4.45318603515625, -4.220947265625, -3.98870849609375, -3.7564697265625, -3.52423095703125, -3.2919921875, -3.05975341796875, -2.8275146484375, -2.59527587890625, -2.363037109375, -2.13079833984375, -1.8985595703125, -1.66632080078125, -1.43408203125, -1.20184326171875, -0.9696044921875, -0.73736572265625, -0.505126953125, -0.27288818359375, -0.0406494140625, 0.19158935546875, 0.423828125, 0.65606689453125, 0.8883056640625, 1.12054443359375, 1.352783203125, 1.58502197265625, 1.8172607421875, 2.04949951171875, 2.28173828125, 2.51397705078125, 2.7462158203125, 2.97845458984375, 3.210693359375, 3.44293212890625, 3.6751708984375, 3.90740966796875, 4.1396484375, 4.37188720703125, 4.6041259765625, 4.83636474609375, 5.068603515625, 5.30084228515625, 5.5330810546875, 5.76531982421875, 5.99755859375, 6.22979736328125, 6.4620361328125, 6.69427490234375, 6.926513671875, 7.15875244140625, 7.3909912109375, 7.62322998046875, 7.85546875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 9.0, 8.0, 11.0, 21.0, 24.0, 41.0, 75.0, 104.0, 193.0, 296.0, 458.0, 765.0, 1238.0, 2207.0, 3856.0, 6693.0, 12129.0, 21736.0, 38777.0, 67440.0, 108976.0, 155010.0, 179601.0, 161482.0, 116992.0, 73091.0, 42726.0, 23835.0, 13373.0, 7482.0, 4154.0, 2286.0, 1374.0, 769.0, 532.0, 313.0, 167.0, 93.0, 78.0, 46.0, 29.0, 22.0, 9.0, 12.0, 13.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.484375, -5.3160400390625, -5.147705078125, -4.9793701171875, -4.81103515625, -4.6427001953125, -4.474365234375, -4.3060302734375, -4.1376953125, -3.9693603515625, -3.801025390625, -3.6326904296875, -3.46435546875, -3.2960205078125, -3.127685546875, -2.9593505859375, -2.791015625, -2.6226806640625, -2.454345703125, -2.2860107421875, -2.11767578125, -1.9493408203125, -1.781005859375, -1.6126708984375, -1.4443359375, -1.2760009765625, -1.107666015625, -0.9393310546875, -0.77099609375, -0.6026611328125, -0.434326171875, -0.2659912109375, -0.09765625, 0.0706787109375, 0.239013671875, 0.4073486328125, 0.57568359375, 0.7440185546875, 0.912353515625, 1.0806884765625, 1.2490234375, 1.4173583984375, 1.585693359375, 1.7540283203125, 1.92236328125, 2.0906982421875, 2.259033203125, 2.4273681640625, 2.595703125, 2.7640380859375, 2.932373046875, 3.1007080078125, 3.26904296875, 3.4373779296875, 3.605712890625, 3.7740478515625, 3.9423828125, 4.1107177734375, 4.279052734375, 4.4473876953125, 4.61572265625, 4.7840576171875, 4.952392578125, 5.1207275390625, 5.2890625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 8.0, 6.0, 11.0, 10.0, 15.0, 24.0, 35.0, 42.0, 45.0, 44.0, 50.0, 57.0, 63.0, 66.0, 79.0, 73.0, 59.0, 52.0, 43.0, 38.0, 26.0, 20.0, 25.0, 29.0, 16.0, 10.0, 19.0, 10.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006122589111328125, -0.0005932524800300598, -0.0005742460489273071, -0.0005552396178245544, -0.0005362331867218018, -0.0005172267556190491, -0.0004982203245162964, -0.0004792138934135437, -0.000460207462310791, -0.00044120103120803833, -0.00042219460010528564, -0.00040318816900253296, -0.0003841817378997803, -0.0003651753067970276, -0.0003461688756942749, -0.0003271624445915222, -0.00030815601348876953, -0.00028914958238601685, -0.00027014315128326416, -0.0002511367201805115, -0.0002321302890777588, -0.0002131238579750061, -0.00019411742687225342, -0.00017511099576950073, -0.00015610456466674805, -0.00013709813356399536, -0.00011809170246124268, -9.908527135848999e-05, -8.00788402557373e-05, -6.107240915298462e-05, -4.2065978050231934e-05, -2.3059546947479248e-05, -4.0531158447265625e-06, 1.4953315258026123e-05, 3.395974636077881e-05, 5.2966177463531494e-05, 7.197260856628418e-05, 9.097903966903687e-05, 0.00010998547077178955, 0.00012899190187454224, 0.00014799833297729492, 0.0001670047640800476, 0.0001860111951828003, 0.00020501762628555298, 0.00022402405738830566, 0.00024303048849105835, 0.00026203691959381104, 0.0002810433506965637, 0.0003000497817993164, 0.0003190562129020691, 0.0003380626440048218, 0.00035706907510757446, 0.00037607550621032715, 0.00039508193731307983, 0.0004140883684158325, 0.0004330947995185852, 0.0004521012306213379, 0.0004711076617240906, 0.0004901140928268433, 0.000509120523929596, 0.0005281269550323486, 0.0005471333861351013, 0.000566139817237854, 0.0005851462483406067, 0.0006041526794433594]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 2.0, 5.0, 14.0, 19.0, 18.0, 37.0, 62.0, 90.0, 109.0, 182.0, 358.0, 511.0, 963.0, 1600.0, 2744.0, 4600.0, 7876.0, 13792.0, 23596.0, 38565.0, 60909.0, 89527.0, 119654.0, 141211.0, 143479.0, 126563.0, 96983.0, 67930.0, 43044.0, 26368.0, 15666.0, 9131.0, 5373.0, 3095.0, 1790.0, 1038.0, 664.0, 379.0, 222.0, 155.0, 82.0, 53.0, 30.0, 28.0, 17.0, 8.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-4.58203125, -4.451568603515625, -4.32110595703125, -4.190643310546875, -4.0601806640625, -3.929718017578125, -3.79925537109375, -3.668792724609375, -3.538330078125, -3.407867431640625, -3.27740478515625, -3.146942138671875, -3.0164794921875, -2.886016845703125, -2.75555419921875, -2.625091552734375, -2.49462890625, -2.364166259765625, -2.23370361328125, -2.103240966796875, -1.9727783203125, -1.842315673828125, -1.71185302734375, -1.581390380859375, -1.450927734375, -1.320465087890625, -1.19000244140625, -1.059539794921875, -0.9290771484375, -0.798614501953125, -0.66815185546875, -0.537689208984375, -0.4072265625, -0.276763916015625, -0.14630126953125, -0.015838623046875, 0.1146240234375, 0.245086669921875, 0.37554931640625, 0.506011962890625, 0.636474609375, 0.766937255859375, 0.89739990234375, 1.027862548828125, 1.1583251953125, 1.288787841796875, 1.41925048828125, 1.549713134765625, 1.68017578125, 1.810638427734375, 1.94110107421875, 2.071563720703125, 2.2020263671875, 2.332489013671875, 2.46295166015625, 2.593414306640625, 2.723876953125, 2.854339599609375, 2.98480224609375, 3.115264892578125, 3.2457275390625, 3.376190185546875, 3.50665283203125, 3.637115478515625, 3.767578125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 6.0, 9.0, 7.0, 13.0, 7.0, 15.0, 17.0, 26.0, 23.0, 25.0, 32.0, 30.0, 39.0, 37.0, 36.0, 37.0, 55.0, 57.0, 52.0, 69.0, 32.0, 59.0, 33.0, 50.0, 41.0, 28.0, 34.0, 27.0, 24.0, 11.0, 14.0, 14.0, 11.0, 11.0, 5.0, 4.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4208984375, -1.373779296875, -1.32666015625, -1.279541015625, -1.232421875, -1.185302734375, -1.13818359375, -1.091064453125, -1.0439453125, -0.996826171875, -0.94970703125, -0.902587890625, -0.85546875, -0.808349609375, -0.76123046875, -0.714111328125, -0.6669921875, -0.619873046875, -0.57275390625, -0.525634765625, -0.478515625, -0.431396484375, -0.38427734375, -0.337158203125, -0.2900390625, -0.242919921875, -0.19580078125, -0.148681640625, -0.1015625, -0.054443359375, -0.00732421875, 0.039794921875, 0.0869140625, 0.134033203125, 0.18115234375, 0.228271484375, 0.275390625, 0.322509765625, 0.36962890625, 0.416748046875, 0.4638671875, 0.510986328125, 0.55810546875, 0.605224609375, 0.65234375, 0.699462890625, 0.74658203125, 0.793701171875, 0.8408203125, 0.887939453125, 0.93505859375, 0.982177734375, 1.029296875, 1.076416015625, 1.12353515625, 1.170654296875, 1.2177734375, 1.264892578125, 1.31201171875, 1.359130859375, 1.40625, 1.453369140625, 1.50048828125, 1.547607421875, 1.5947265625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 1.0, 3.0, 4.0, 2.0, 9.0, 7.0, 6.0, 10.0, 10.0, 6.0, 14.0, 20.0, 17.0, 24.0, 35.0, 37.0, 31.0, 24.0, 33.0, 37.0, 37.0, 36.0, 48.0, 38.0, 40.0, 45.0, 44.0, 46.0, 35.0, 33.0, 25.0, 35.0, 23.0, 37.0, 29.0, 19.0, 22.0, 15.0, 15.0, 8.0, 8.0, 11.0, 9.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-10.26678466796875, -9.94711685180664, -9.627449989318848, -9.307782173156738, -8.988115310668945, -8.668447494506836, -8.348780632019043, -8.029112815856934, -7.709445476531982, -7.389778137207031, -7.07011079788208, -6.750443458557129, -6.4307756423950195, -6.111108779907227, -5.791440963745117, -5.471773624420166, -5.152106285095215, -4.832438945770264, -4.5127716064453125, -4.193104267120361, -3.873436689376831, -3.55376935005188, -3.2341017723083496, -2.9144344329833984, -2.5947670936584473, -2.275099754333496, -1.9554322957992554, -1.6357648372650146, -1.3160974979400635, -0.9964301586151123, -0.6767627000808716, -0.35709524154663086, -0.037428855895996094, 0.28223854303359985, 0.6019059419631958, 0.9215733408927917, 1.2412407398223877, 1.5609080791473389, 1.8805755376815796, 2.2002429962158203, 2.5199103355407715, 2.8395776748657227, 3.159245014190674, 3.478912591934204, 3.7985799312591553, 4.118247032165527, 4.437914848327637, 4.757582187652588, 5.077249526977539, 5.39691686630249, 5.716584205627441, 6.036251544952393, 6.355918884277344, 6.675586700439453, 6.995254039764404, 7.3149213790893555, 7.634588718414307, 7.954256057739258, 8.273923873901367, 8.59359073638916, 8.91325855255127, 9.232925415039062, 9.552593231201172, 9.872261047363281, 10.191927909851074]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 2.0, 5.0, 3.0, 8.0, 13.0, 12.0, 7.0, 15.0, 17.0, 21.0, 13.0, 11.0, 35.0, 24.0, 34.0, 32.0, 24.0, 35.0, 31.0, 31.0, 38.0, 41.0, 49.0, 39.0, 36.0, 42.0, 38.0, 29.0, 33.0, 33.0, 27.0, 26.0, 21.0, 24.0, 23.0, 22.0, 15.0, 17.0, 10.0, 13.0, 13.0, 5.0, 8.0, 2.0, 5.0, 10.0, 3.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0], "bins": [-11.122969627380371, -10.776812553405762, -10.430655479431152, -10.084498405456543, -9.738340377807617, -9.392183303833008, -9.046026229858398, -8.699869155883789, -8.35371208190918, -8.00755500793457, -7.661397933959961, -7.315240383148193, -6.969083309173584, -6.622926235198975, -6.276768684387207, -5.930611610412598, -5.584454536437988, -5.238297462463379, -4.8921403884887695, -4.545982837677002, -4.199825763702393, -3.853668689727783, -3.5075113773345947, -3.1613540649414062, -2.815196990966797, -2.4690399169921875, -2.122882604598999, -1.7767254114151, -1.4305682182312012, -1.0844110250473022, -0.7382538318634033, -0.39209651947021484, -0.04593849182128906, 0.30021870136260986, 0.6463758945465088, 0.9925330877304077, 1.3386902809143066, 1.6848474740982056, 2.0310046672821045, 2.377161979675293, 2.7233190536499023, 3.0694761276245117, 3.4156334400177, 3.7617907524108887, 4.107947826385498, 4.454104900360107, 4.800262451171875, 5.146419525146484, 5.492576599121094, 5.838733673095703, 6.1848907470703125, 6.53104829788208, 6.8772053718566895, 7.223362445831299, 7.569519996643066, 7.915677070617676, 8.261834144592285, 8.607991218566895, 8.954148292541504, 9.300305366516113, 9.646463394165039, 9.992620468139648, 10.338777542114258, 10.684934616088867, 11.031091690063477]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 2.0, 10.0, 15.0, 28.0, 46.0, 62.0, 106.0, 182.0, 275.0, 393.0, 641.0, 1007.0, 1615.0, 2480.0, 4078.0, 6440.0, 10431.0, 16563.0, 26920.0, 44244.0, 74767.0, 125473.0, 212894.0, 342067.0, 498090.0, 621110.0, 642031.0, 546499.0, 391745.0, 249810.0, 148901.0, 88229.0, 52266.0, 31698.0, 19676.0, 12041.0, 7562.0, 4839.0, 3170.0, 2076.0, 1437.0, 794.0, 543.0, 370.0, 227.0, 141.0, 103.0, 67.0, 43.0, 28.0, 20.0, 12.0, 12.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.453125, -7.2060546875, -6.958984375, -6.7119140625, -6.46484375, -6.2177734375, -5.970703125, -5.7236328125, -5.4765625, -5.2294921875, -4.982421875, -4.7353515625, -4.48828125, -4.2412109375, -3.994140625, -3.7470703125, -3.5, -3.2529296875, -3.005859375, -2.7587890625, -2.51171875, -2.2646484375, -2.017578125, -1.7705078125, -1.5234375, -1.2763671875, -1.029296875, -0.7822265625, -0.53515625, -0.2880859375, -0.041015625, 0.2060546875, 0.453125, 0.7001953125, 0.947265625, 1.1943359375, 1.44140625, 1.6884765625, 1.935546875, 2.1826171875, 2.4296875, 2.6767578125, 2.923828125, 3.1708984375, 3.41796875, 3.6650390625, 3.912109375, 4.1591796875, 4.40625, 4.6533203125, 4.900390625, 5.1474609375, 5.39453125, 5.6416015625, 5.888671875, 6.1357421875, 6.3828125, 6.6298828125, 6.876953125, 7.1240234375, 7.37109375, 7.6181640625, 7.865234375, 8.1123046875, 8.359375]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 10.0, 17.0, 8.0, 12.0, 15.0, 13.0, 15.0, 24.0, 24.0, 26.0, 15.0, 22.0, 37.0, 31.0, 31.0, 40.0, 37.0, 35.0, 44.0, 31.0, 39.0, 38.0, 43.0, 31.0, 45.0, 38.0, 24.0, 22.0, 28.0, 27.0, 15.0, 24.0, 17.0, 22.0, 23.0, 6.0, 13.0, 11.0, 16.0, 4.0, 7.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0], "bins": [-9.4921875, -9.1973876953125, -8.902587890625, -8.6077880859375, -8.31298828125, -8.0181884765625, -7.723388671875, -7.4285888671875, -7.1337890625, -6.8389892578125, -6.544189453125, -6.2493896484375, -5.95458984375, -5.6597900390625, -5.364990234375, -5.0701904296875, -4.775390625, -4.4805908203125, -4.185791015625, -3.8909912109375, -3.59619140625, -3.3013916015625, -3.006591796875, -2.7117919921875, -2.4169921875, -2.1221923828125, -1.827392578125, -1.5325927734375, -1.23779296875, -0.9429931640625, -0.648193359375, -0.3533935546875, -0.05859375, 0.2362060546875, 0.531005859375, 0.8258056640625, 1.12060546875, 1.4154052734375, 1.710205078125, 2.0050048828125, 2.2998046875, 2.5946044921875, 2.889404296875, 3.1842041015625, 3.47900390625, 3.7738037109375, 4.068603515625, 4.3634033203125, 4.658203125, 4.9530029296875, 5.247802734375, 5.5426025390625, 5.83740234375, 6.1322021484375, 6.427001953125, 6.7218017578125, 7.0166015625, 7.3114013671875, 7.606201171875, 7.9010009765625, 8.19580078125, 8.4906005859375, 8.785400390625, 9.0802001953125, 9.375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 10.0, 8.0, 10.0, 28.0, 50.0, 103.0, 157.0, 237.0, 449.0, 826.0, 1496.0, 2669.0, 4891.0, 9133.0, 16885.0, 31720.0, 59583.0, 111555.0, 207140.0, 367960.0, 594569.0, 783113.0, 752757.0, 538178.0, 323706.0, 179963.0, 96298.0, 51694.0, 27393.0, 14371.0, 7871.0, 4230.0, 2301.0, 1227.0, 743.0, 378.0, 244.0, 131.0, 93.0, 37.0, 30.0, 12.0, 10.0, 3.0, 10.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.4453125, -12.0780029296875, -11.710693359375, -11.3433837890625, -10.97607421875, -10.6087646484375, -10.241455078125, -9.8741455078125, -9.5068359375, -9.1395263671875, -8.772216796875, -8.4049072265625, -8.03759765625, -7.6702880859375, -7.302978515625, -6.9356689453125, -6.568359375, -6.2010498046875, -5.833740234375, -5.4664306640625, -5.09912109375, -4.7318115234375, -4.364501953125, -3.9971923828125, -3.6298828125, -3.2625732421875, -2.895263671875, -2.5279541015625, -2.16064453125, -1.7933349609375, -1.426025390625, -1.0587158203125, -0.69140625, -0.3240966796875, 0.043212890625, 0.4105224609375, 0.77783203125, 1.1451416015625, 1.512451171875, 1.8797607421875, 2.2470703125, 2.6143798828125, 2.981689453125, 3.3489990234375, 3.71630859375, 4.0836181640625, 4.450927734375, 4.8182373046875, 5.185546875, 5.5528564453125, 5.920166015625, 6.2874755859375, 6.65478515625, 7.0220947265625, 7.389404296875, 7.7567138671875, 8.1240234375, 8.4913330078125, 8.858642578125, 9.2259521484375, 9.59326171875, 9.9605712890625, 10.327880859375, 10.6951904296875, 11.0625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 6.0, 8.0, 4.0, 11.0, 13.0, 17.0, 39.0, 32.0, 35.0, 61.0, 52.0, 47.0, 77.0, 84.0, 85.0, 123.0, 135.0, 151.0, 169.0, 161.0, 198.0, 182.0, 192.0, 212.0, 215.0, 206.0, 190.0, 189.0, 151.0, 137.0, 143.0, 110.0, 103.0, 101.0, 82.0, 70.0, 52.0, 43.0, 42.0, 30.0, 35.0, 17.0, 12.0, 15.0, 8.0, 10.0, 7.0, 3.0, 2.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.53515625, -3.419219970703125, -3.30328369140625, -3.187347412109375, -3.0714111328125, -2.955474853515625, -2.83953857421875, -2.723602294921875, -2.607666015625, -2.491729736328125, -2.37579345703125, -2.259857177734375, -2.1439208984375, -2.027984619140625, -1.91204833984375, -1.796112060546875, -1.68017578125, -1.564239501953125, -1.44830322265625, -1.332366943359375, -1.2164306640625, -1.100494384765625, -0.98455810546875, -0.868621826171875, -0.752685546875, -0.636749267578125, -0.52081298828125, -0.404876708984375, -0.2889404296875, -0.173004150390625, -0.05706787109375, 0.058868408203125, 0.1748046875, 0.290740966796875, 0.40667724609375, 0.522613525390625, 0.6385498046875, 0.754486083984375, 0.87042236328125, 0.986358642578125, 1.102294921875, 1.218231201171875, 1.33416748046875, 1.450103759765625, 1.5660400390625, 1.681976318359375, 1.79791259765625, 1.913848876953125, 2.02978515625, 2.145721435546875, 2.26165771484375, 2.377593994140625, 2.4935302734375, 2.609466552734375, 2.72540283203125, 2.841339111328125, 2.957275390625, 3.073211669921875, 3.18914794921875, 3.305084228515625, 3.4210205078125, 3.536956787109375, 3.65289306640625, 3.768829345703125, 3.884765625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 8.0, 2.0, 4.0, 4.0, 7.0, 12.0, 6.0, 16.0, 17.0, 12.0, 18.0, 31.0, 24.0, 42.0, 36.0, 42.0, 31.0, 37.0, 50.0, 51.0, 47.0, 36.0, 49.0, 46.0, 43.0, 45.0, 39.0, 31.0, 20.0, 22.0, 35.0, 27.0, 22.0, 17.0, 17.0, 6.0, 11.0, 8.0, 4.0, 9.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.670071601867676, -10.343198776245117, -10.016325950622559, -9.689452171325684, -9.362579345703125, -9.035706520080566, -8.708833694458008, -8.38196086883545, -8.05508804321289, -7.728215217590332, -7.401341915130615, -7.074469089508057, -6.74759578704834, -6.420722961425781, -6.093850135803223, -5.766977310180664, -5.440103530883789, -5.1132307052612305, -4.786357402801514, -4.459484577178955, -4.132611274719238, -3.8057384490966797, -3.478865623474121, -3.1519925594329834, -2.8251194953918457, -2.498246431350708, -2.1713733673095703, -1.8445005416870117, -1.517627477645874, -1.1907544136047363, -0.8638814687728882, -0.53700852394104, -0.21013641357421875, 0.11673659086227417, 0.4436095952987671, 0.77048259973526, 1.097355604171753, 1.4242286682128906, 1.7511016130447388, 2.077974557876587, 2.4048476219177246, 2.7317206859588623, 3.05859375, 3.3854665756225586, 3.7123396396636963, 4.039212703704834, 4.366085529327393, 4.692958831787109, 5.019831657409668, 5.346704483032227, 5.673577785491943, 6.000450611114502, 6.327323913574219, 6.654196739196777, 6.981069564819336, 7.3079423904418945, 7.634815692901611, 7.96168851852417, 8.288561820983887, 8.615434646606445, 8.942307472229004, 9.269180297851562, 9.596054077148438, 9.922926902770996, 10.249799728393555]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 7.0, 6.0, 6.0, 5.0, 8.0, 11.0, 16.0, 17.0, 25.0, 13.0, 25.0, 39.0, 34.0, 32.0, 35.0, 46.0, 39.0, 40.0, 50.0, 43.0, 43.0, 42.0, 41.0, 30.0, 33.0, 39.0, 31.0, 32.0, 28.0, 22.0, 23.0, 23.0, 12.0, 16.0, 19.0, 9.0, 15.0, 13.0, 8.0, 8.0, 9.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-11.519853591918945, -11.165569305419922, -10.811284065246582, -10.456999778747559, -10.102714538574219, -9.748430252075195, -9.394145965576172, -9.039860725402832, -8.685576438903809, -8.331292152404785, -7.977006912231445, -7.622722625732422, -7.26843786239624, -6.914153099060059, -6.559868335723877, -6.205583572387695, -5.851298809051514, -5.497014045715332, -5.14272928237915, -4.788444519042969, -4.434160232543945, -4.079875469207764, -3.725590705871582, -3.3713061809539795, -3.017021417617798, -2.662736654281616, -2.3084521293640137, -1.954167366027832, -1.59988272190094, -1.2455980777740479, -0.8913133144378662, -0.5370287895202637, -0.18274402618408203, 0.17154064774513245, 0.5258253216743469, 0.8801100254058838, 1.2343946695327759, 1.588679313659668, 1.9429640769958496, 2.297248601913452, 2.651533365249634, 3.0058181285858154, 3.360102653503418, 3.7143874168395996, 4.068672180175781, 4.422956466674805, 4.7772417068481445, 5.131525993347168, 5.48581075668335, 5.840095520019531, 6.194380283355713, 6.5486650466918945, 6.902949333190918, 7.2572340965271, 7.611518859863281, 7.965803146362305, 8.320088386535645, 8.674372673034668, 9.028657913208008, 9.382942199707031, 9.737227439880371, 10.091511726379395, 10.445796966552734, 10.800081253051758, 11.154365539550781]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 6.0, 6.0, 15.0, 30.0, 51.0, 76.0, 83.0, 141.0, 186.0, 233.0, 428.0, 612.0, 884.0, 1221.0, 1708.0, 2373.0, 3258.0, 4577.0, 6188.0, 8848.0, 13646.0, 23409.0, 48106.0, 106587.0, 209769.0, 260276.0, 176303.0, 83177.0, 37656.0, 19302.0, 11601.0, 7929.0, 5670.0, 4066.0, 2896.0, 2093.0, 1531.0, 1091.0, 781.0, 578.0, 353.0, 255.0, 163.0, 127.0, 98.0, 57.0, 39.0, 26.0, 16.0, 13.0, 9.0, 7.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-15.7734375, -15.2857666015625, -14.798095703125, -14.3104248046875, -13.82275390625, -13.3350830078125, -12.847412109375, -12.3597412109375, -11.8720703125, -11.3843994140625, -10.896728515625, -10.4090576171875, -9.92138671875, -9.4337158203125, -8.946044921875, -8.4583740234375, -7.970703125, -7.4830322265625, -6.995361328125, -6.5076904296875, -6.02001953125, -5.5323486328125, -5.044677734375, -4.5570068359375, -4.0693359375, -3.5816650390625, -3.093994140625, -2.6063232421875, -2.11865234375, -1.6309814453125, -1.143310546875, -0.6556396484375, -0.16796875, 0.3197021484375, 0.807373046875, 1.2950439453125, 1.78271484375, 2.2703857421875, 2.758056640625, 3.2457275390625, 3.7333984375, 4.2210693359375, 4.708740234375, 5.1964111328125, 5.68408203125, 6.1717529296875, 6.659423828125, 7.1470947265625, 7.634765625, 8.1224365234375, 8.610107421875, 9.0977783203125, 9.58544921875, 10.0731201171875, 10.560791015625, 11.0484619140625, 11.5361328125, 12.0238037109375, 12.511474609375, 12.9991455078125, 13.48681640625, 13.9744873046875, 14.462158203125, 14.9498291015625, 15.4375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 8.0, 2.0, 5.0, 12.0, 7.0, 12.0, 16.0, 14.0, 18.0, 19.0, 22.0, 33.0, 31.0, 41.0, 53.0, 46.0, 42.0, 39.0, 53.0, 50.0, 53.0, 36.0, 43.0, 31.0, 41.0, 32.0, 29.0, 25.0, 27.0, 22.0, 17.0, 19.0, 18.0, 13.0, 20.0, 15.0, 11.0, 6.0, 5.0, 3.0, 5.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.6171875, -11.253662109375, -10.89013671875, -10.526611328125, -10.1630859375, -9.799560546875, -9.43603515625, -9.072509765625, -8.708984375, -8.345458984375, -7.98193359375, -7.618408203125, -7.2548828125, -6.891357421875, -6.52783203125, -6.164306640625, -5.80078125, -5.437255859375, -5.07373046875, -4.710205078125, -4.3466796875, -3.983154296875, -3.61962890625, -3.256103515625, -2.892578125, -2.529052734375, -2.16552734375, -1.802001953125, -1.4384765625, -1.074951171875, -0.71142578125, -0.347900390625, 0.015625, 0.379150390625, 0.74267578125, 1.106201171875, 1.4697265625, 1.833251953125, 2.19677734375, 2.560302734375, 2.923828125, 3.287353515625, 3.65087890625, 4.014404296875, 4.3779296875, 4.741455078125, 5.10498046875, 5.468505859375, 5.83203125, 6.195556640625, 6.55908203125, 6.922607421875, 7.2861328125, 7.649658203125, 8.01318359375, 8.376708984375, 8.740234375, 9.103759765625, 9.46728515625, 9.830810546875, 10.1943359375, 10.557861328125, 10.92138671875, 11.284912109375, 11.6484375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 3.0, 6.0, 5.0, 9.0, 14.0, 19.0, 22.0, 52.0, 67.0, 78.0, 133.0, 219.0, 276.0, 454.0, 703.0, 1007.0, 1464.0, 2179.0, 3170.0, 4834.0, 7235.0, 11229.0, 18206.0, 32778.0, 66677.0, 145753.0, 259794.0, 238315.0, 122673.0, 56236.0, 28547.0, 16209.0, 10196.0, 6703.0, 4358.0, 2906.0, 1963.0, 1377.0, 904.0, 570.0, 403.0, 255.0, 187.0, 119.0, 92.0, 59.0, 38.0, 22.0, 10.0, 13.0, 14.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.3125, -15.784423828125, -15.25634765625, -14.728271484375, -14.2001953125, -13.672119140625, -13.14404296875, -12.615966796875, -12.087890625, -11.559814453125, -11.03173828125, -10.503662109375, -9.9755859375, -9.447509765625, -8.91943359375, -8.391357421875, -7.86328125, -7.335205078125, -6.80712890625, -6.279052734375, -5.7509765625, -5.222900390625, -4.69482421875, -4.166748046875, -3.638671875, -3.110595703125, -2.58251953125, -2.054443359375, -1.5263671875, -0.998291015625, -0.47021484375, 0.057861328125, 0.5859375, 1.114013671875, 1.64208984375, 2.170166015625, 2.6982421875, 3.226318359375, 3.75439453125, 4.282470703125, 4.810546875, 5.338623046875, 5.86669921875, 6.394775390625, 6.9228515625, 7.450927734375, 7.97900390625, 8.507080078125, 9.03515625, 9.563232421875, 10.09130859375, 10.619384765625, 11.1474609375, 11.675537109375, 12.20361328125, 12.731689453125, 13.259765625, 13.787841796875, 14.31591796875, 14.843994140625, 15.3720703125, 15.900146484375, 16.42822265625, 16.956298828125, 17.484375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 2.0, 7.0, 12.0, 10.0, 11.0, 10.0, 10.0, 18.0, 19.0, 21.0, 23.0, 24.0, 25.0, 29.0, 29.0, 48.0, 28.0, 32.0, 24.0, 30.0, 43.0, 41.0, 38.0, 44.0, 44.0, 32.0, 34.0, 29.0, 28.0, 29.0, 29.0, 22.0, 25.0, 16.0, 18.0, 20.0, 12.0, 15.0, 14.0, 7.0, 14.0, 4.0, 4.0, 2.0, 2.0, 7.0, 4.0, 1.0, 0.0, 4.0, 5.0, 1.0, 2.0, 1.0], "bins": [-6.5390625, -6.33349609375, -6.1279296875, -5.92236328125, -5.716796875, -5.51123046875, -5.3056640625, -5.10009765625, -4.89453125, -4.68896484375, -4.4833984375, -4.27783203125, -4.072265625, -3.86669921875, -3.6611328125, -3.45556640625, -3.25, -3.04443359375, -2.8388671875, -2.63330078125, -2.427734375, -2.22216796875, -2.0166015625, -1.81103515625, -1.60546875, -1.39990234375, -1.1943359375, -0.98876953125, -0.783203125, -0.57763671875, -0.3720703125, -0.16650390625, 0.0390625, 0.24462890625, 0.4501953125, 0.65576171875, 0.861328125, 1.06689453125, 1.2724609375, 1.47802734375, 1.68359375, 1.88916015625, 2.0947265625, 2.30029296875, 2.505859375, 2.71142578125, 2.9169921875, 3.12255859375, 3.328125, 3.53369140625, 3.7392578125, 3.94482421875, 4.150390625, 4.35595703125, 4.5615234375, 4.76708984375, 4.97265625, 5.17822265625, 5.3837890625, 5.58935546875, 5.794921875, 6.00048828125, 6.2060546875, 6.41162109375, 6.6171875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 12.0, 18.0, 19.0, 23.0, 48.0, 56.0, 103.0, 127.0, 159.0, 250.0, 371.0, 557.0, 846.0, 1264.0, 1979.0, 3105.0, 5024.0, 8072.0, 14110.0, 26048.0, 50513.0, 101672.0, 188069.0, 245928.0, 186546.0, 101325.0, 50344.0, 25838.0, 14231.0, 8206.0, 4884.0, 3011.0, 1937.0, 1259.0, 818.0, 539.0, 380.0, 248.0, 196.0, 123.0, 98.0, 65.0, 41.0, 36.0, 16.0, 19.0, 14.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-6.61328125, -6.41583251953125, -6.2183837890625, -6.02093505859375, -5.823486328125, -5.62603759765625, -5.4285888671875, -5.23114013671875, -5.03369140625, -4.83624267578125, -4.6387939453125, -4.44134521484375, -4.243896484375, -4.04644775390625, -3.8489990234375, -3.65155029296875, -3.4541015625, -3.25665283203125, -3.0592041015625, -2.86175537109375, -2.664306640625, -2.46685791015625, -2.2694091796875, -2.07196044921875, -1.87451171875, -1.67706298828125, -1.4796142578125, -1.28216552734375, -1.084716796875, -0.88726806640625, -0.6898193359375, -0.49237060546875, -0.294921875, -0.09747314453125, 0.0999755859375, 0.29742431640625, 0.494873046875, 0.69232177734375, 0.8897705078125, 1.08721923828125, 1.28466796875, 1.48211669921875, 1.6795654296875, 1.87701416015625, 2.074462890625, 2.27191162109375, 2.4693603515625, 2.66680908203125, 2.8642578125, 3.06170654296875, 3.2591552734375, 3.45660400390625, 3.654052734375, 3.85150146484375, 4.0489501953125, 4.24639892578125, 4.44384765625, 4.64129638671875, 4.8387451171875, 5.03619384765625, 5.233642578125, 5.43109130859375, 5.6285400390625, 5.82598876953125, 6.0234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 4.0, 6.0, 4.0, 6.0, 12.0, 12.0, 12.0, 19.0, 29.0, 33.0, 46.0, 71.0, 89.0, 102.0, 110.0, 108.0, 72.0, 64.0, 50.0, 37.0, 22.0, 13.0, 16.0, 12.0, 11.0, 6.0, 6.0, 6.0, 3.0, 0.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.000728607177734375, -0.0007091313600540161, -0.0006896555423736572, -0.0006701797246932983, -0.0006507039070129395, -0.0006312280893325806, -0.0006117522716522217, -0.0005922764539718628, -0.0005728006362915039, -0.000553324818611145, -0.0005338490009307861, -0.0005143731832504272, -0.0004948973655700684, -0.00047542154788970947, -0.0004559457302093506, -0.0004364699125289917, -0.0004169940948486328, -0.0003975182771682739, -0.00037804245948791504, -0.00035856664180755615, -0.00033909082412719727, -0.0003196150064468384, -0.0003001391887664795, -0.0002806633710861206, -0.0002611875534057617, -0.00024171173572540283, -0.00022223591804504395, -0.00020276010036468506, -0.00018328428268432617, -0.00016380846500396729, -0.0001443326473236084, -0.0001248568296432495, -0.00010538101196289062, -8.590519428253174e-05, -6.642937660217285e-05, -4.6953558921813965e-05, -2.7477741241455078e-05, -8.001923561096191e-06, 1.1473894119262695e-05, 3.094971179962158e-05, 5.042552947998047e-05, 6.990134716033936e-05, 8.937716484069824e-05, 0.00010885298252105713, 0.00012832880020141602, 0.0001478046178817749, 0.0001672804355621338, 0.00018675625324249268, 0.00020623207092285156, 0.00022570788860321045, 0.00024518370628356934, 0.0002646595239639282, 0.0002841353416442871, 0.000303611159324646, 0.0003230869770050049, 0.00034256279468536377, 0.00036203861236572266, 0.00038151443004608154, 0.00040099024772644043, 0.0004204660654067993, 0.0004399418830871582, 0.0004594177007675171, 0.000478893518447876, 0.0004983693361282349, 0.0005178451538085938]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 10.0, 6.0, 10.0, 15.0, 18.0, 32.0, 32.0, 54.0, 67.0, 94.0, 152.0, 236.0, 353.0, 455.0, 707.0, 1100.0, 1645.0, 2469.0, 3807.0, 6255.0, 10295.0, 17157.0, 29005.0, 48956.0, 79172.0, 119533.0, 155340.0, 165537.0, 141706.0, 101106.0, 64439.0, 39080.0, 23333.0, 13848.0, 8271.0, 4991.0, 3152.0, 2015.0, 1325.0, 873.0, 625.0, 422.0, 236.0, 203.0, 124.0, 109.0, 70.0, 42.0, 32.0, 18.0, 12.0, 11.0, 8.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.9375, -4.7845458984375, -4.631591796875, -4.4786376953125, -4.32568359375, -4.1727294921875, -4.019775390625, -3.8668212890625, -3.7138671875, -3.5609130859375, -3.407958984375, -3.2550048828125, -3.10205078125, -2.9490966796875, -2.796142578125, -2.6431884765625, -2.490234375, -2.3372802734375, -2.184326171875, -2.0313720703125, -1.87841796875, -1.7254638671875, -1.572509765625, -1.4195556640625, -1.2666015625, -1.1136474609375, -0.960693359375, -0.8077392578125, -0.65478515625, -0.5018310546875, -0.348876953125, -0.1959228515625, -0.04296875, 0.1099853515625, 0.262939453125, 0.4158935546875, 0.56884765625, 0.7218017578125, 0.874755859375, 1.0277099609375, 1.1806640625, 1.3336181640625, 1.486572265625, 1.6395263671875, 1.79248046875, 1.9454345703125, 2.098388671875, 2.2513427734375, 2.404296875, 2.5572509765625, 2.710205078125, 2.8631591796875, 3.01611328125, 3.1690673828125, 3.322021484375, 3.4749755859375, 3.6279296875, 3.7808837890625, 3.933837890625, 4.0867919921875, 4.23974609375, 4.3927001953125, 4.545654296875, 4.6986083984375, 4.8515625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 0.0, 0.0, 5.0, 1.0, 4.0, 7.0, 4.0, 10.0, 9.0, 9.0, 10.0, 14.0, 12.0, 20.0, 35.0, 34.0, 45.0, 51.0, 59.0, 53.0, 67.0, 51.0, 79.0, 62.0, 62.0, 53.0, 41.0, 43.0, 32.0, 31.0, 19.0, 13.0, 16.0, 9.0, 10.0, 8.0, 5.0, 4.0, 6.0, 5.0, 0.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.900390625, -1.8343505859375, -1.768310546875, -1.7022705078125, -1.63623046875, -1.5701904296875, -1.504150390625, -1.4381103515625, -1.3720703125, -1.3060302734375, -1.239990234375, -1.1739501953125, -1.10791015625, -1.0418701171875, -0.975830078125, -0.9097900390625, -0.84375, -0.7777099609375, -0.711669921875, -0.6456298828125, -0.57958984375, -0.5135498046875, -0.447509765625, -0.3814697265625, -0.3154296875, -0.2493896484375, -0.183349609375, -0.1173095703125, -0.05126953125, 0.0147705078125, 0.080810546875, 0.1468505859375, 0.212890625, 0.2789306640625, 0.344970703125, 0.4110107421875, 0.47705078125, 0.5430908203125, 0.609130859375, 0.6751708984375, 0.7412109375, 0.8072509765625, 0.873291015625, 0.9393310546875, 1.00537109375, 1.0714111328125, 1.137451171875, 1.2034912109375, 1.26953125, 1.3355712890625, 1.401611328125, 1.4676513671875, 1.53369140625, 1.5997314453125, 1.665771484375, 1.7318115234375, 1.7978515625, 1.8638916015625, 1.929931640625, 1.9959716796875, 2.06201171875, 2.1280517578125, 2.194091796875, 2.2601318359375, 2.326171875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 8.0, 6.0, 2.0, 3.0, 4.0, 8.0, 7.0, 13.0, 5.0, 21.0, 16.0, 22.0, 31.0, 24.0, 24.0, 46.0, 38.0, 41.0, 43.0, 41.0, 41.0, 41.0, 51.0, 39.0, 39.0, 34.0, 43.0, 47.0, 40.0, 30.0, 33.0, 19.0, 20.0, 18.0, 18.0, 12.0, 18.0, 13.0, 11.0, 10.0, 5.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.107765197753906, -9.804533004760742, -9.501300811767578, -9.19806957244873, -8.894837379455566, -8.591605186462402, -8.288373947143555, -7.985141754150391, -7.681909561157227, -7.3786773681640625, -7.075445652008057, -6.772213935852051, -6.468981742858887, -6.165749549865723, -5.862517833709717, -5.559286117553711, -5.256053924560547, -4.952821731567383, -4.649590015411377, -4.346358299255371, -4.043126106262207, -3.739894151687622, -3.436662197113037, -3.133430242538452, -2.830198287963867, -2.5269663333892822, -2.2237343788146973, -1.9205024242401123, -1.6172704696655273, -1.3140385150909424, -1.0108065605163574, -0.7075746059417725, -0.4043426513671875, -0.10111069679260254, 0.20212125778198242, 0.5053532123565674, 0.8085851669311523, 1.1118171215057373, 1.4150490760803223, 1.7182810306549072, 2.021512985229492, 2.324744939804077, 2.627976894378662, 2.931208848953247, 3.234440803527832, 3.537672758102417, 3.840904712677002, 4.144136428833008, 4.447368621826172, 4.750600814819336, 5.053832530975342, 5.357064247131348, 5.660296440124512, 5.963528633117676, 6.266760349273682, 6.5699920654296875, 6.873224258422852, 7.176456451416016, 7.4796881675720215, 7.782919883728027, 8.086152076721191, 8.389384269714355, 8.692615509033203, 8.995847702026367, 9.299079895019531]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 4.0, 7.0, 5.0, 7.0, 5.0, 9.0, 11.0, 16.0, 19.0, 23.0, 20.0, 22.0, 35.0, 20.0, 42.0, 42.0, 45.0, 29.0, 41.0, 47.0, 47.0, 38.0, 40.0, 36.0, 44.0, 34.0, 28.0, 40.0, 21.0, 34.0, 25.0, 20.0, 22.0, 13.0, 12.0, 22.0, 14.0, 15.0, 7.0, 10.0, 10.0, 8.0, 6.0, 2.0, 1.0, 2.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-10.586897850036621, -10.261792182922363, -9.936685562133789, -9.611579895019531, -9.286473274230957, -8.9613676071167, -8.636260986328125, -8.311155319213867, -7.986049652099609, -7.660943508148193, -7.335837364196777, -7.0107316970825195, -6.6856255531311035, -6.3605194091796875, -6.0354132652282715, -5.7103071212768555, -5.3852009773254395, -5.060094833374023, -4.734988689422607, -4.409882545471191, -4.084776878356934, -3.7596707344055176, -3.4345645904541016, -3.1094586849212646, -2.7843525409698486, -2.4592463970184326, -2.1341404914855957, -1.8090343475341797, -1.4839283227920532, -1.1588222980499268, -0.8337161540985107, -0.5086102485656738, -0.1835041046142578, 0.14160194993019104, 0.4667080044746399, 0.7918140888214111, 1.1169201135635376, 1.442026138305664, 1.76713228225708, 2.092238187789917, 2.417344331741333, 2.742450475692749, 3.067556381225586, 3.392662525177002, 3.717768669128418, 4.042874336242676, 4.36798095703125, 4.693086624145508, 5.018192768096924, 5.34329891204834, 5.668405055999756, 5.993511199951172, 6.31861686706543, 6.643723011016846, 6.968829154968262, 7.2939348220825195, 7.619041442871094, 7.94414758682251, 8.269253730773926, 8.594359397888184, 8.919466018676758, 9.244571685791016, 9.569677352905273, 9.894783973693848, 10.219889640808105]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 9.0, 10.0, 14.0, 26.0, 37.0, 77.0, 117.0, 192.0, 332.0, 674.0, 1023.0, 1731.0, 3213.0, 5285.0, 9223.0, 15442.0, 24696.0, 38503.0, 57663.0, 80653.0, 104231.0, 122756.0, 128808.0, 121297.0, 101690.0, 78763.0, 55598.0, 37393.0, 23484.0, 14601.0, 8760.0, 5259.0, 3046.0, 1702.0, 993.0, 522.0, 293.0, 189.0, 108.0, 68.0, 33.0, 20.0, 17.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.953125, -6.717041015625, -6.48095703125, -6.244873046875, -6.0087890625, -5.772705078125, -5.53662109375, -5.300537109375, -5.064453125, -4.828369140625, -4.59228515625, -4.356201171875, -4.1201171875, -3.884033203125, -3.64794921875, -3.411865234375, -3.17578125, -2.939697265625, -2.70361328125, -2.467529296875, -2.2314453125, -1.995361328125, -1.75927734375, -1.523193359375, -1.287109375, -1.051025390625, -0.81494140625, -0.578857421875, -0.3427734375, -0.106689453125, 0.12939453125, 0.365478515625, 0.6015625, 0.837646484375, 1.07373046875, 1.309814453125, 1.5458984375, 1.781982421875, 2.01806640625, 2.254150390625, 2.490234375, 2.726318359375, 2.96240234375, 3.198486328125, 3.4345703125, 3.670654296875, 3.90673828125, 4.142822265625, 4.37890625, 4.614990234375, 4.85107421875, 5.087158203125, 5.3232421875, 5.559326171875, 5.79541015625, 6.031494140625, 6.267578125, 6.503662109375, 6.73974609375, 6.975830078125, 7.2119140625, 7.447998046875, 7.68408203125, 7.920166015625, 8.15625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 6.0, 5.0, 1.0, 5.0, 13.0, 10.0, 10.0, 17.0, 22.0, 19.0, 26.0, 19.0, 30.0, 26.0, 29.0, 32.0, 46.0, 48.0, 49.0, 46.0, 31.0, 56.0, 51.0, 39.0, 43.0, 33.0, 33.0, 39.0, 21.0, 35.0, 31.0, 14.0, 15.0, 16.0, 21.0, 13.0, 9.0, 13.0, 9.0, 8.0, 8.0, 0.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.4765625, -11.1312255859375, -10.785888671875, -10.4405517578125, -10.09521484375, -9.7498779296875, -9.404541015625, -9.0592041015625, -8.7138671875, -8.3685302734375, -8.023193359375, -7.6778564453125, -7.33251953125, -6.9871826171875, -6.641845703125, -6.2965087890625, -5.951171875, -5.6058349609375, -5.260498046875, -4.9151611328125, -4.56982421875, -4.2244873046875, -3.879150390625, -3.5338134765625, -3.1884765625, -2.8431396484375, -2.497802734375, -2.1524658203125, -1.80712890625, -1.4617919921875, -1.116455078125, -0.7711181640625, -0.42578125, -0.0804443359375, 0.264892578125, 0.6102294921875, 0.95556640625, 1.3009033203125, 1.646240234375, 1.9915771484375, 2.3369140625, 2.6822509765625, 3.027587890625, 3.3729248046875, 3.71826171875, 4.0635986328125, 4.408935546875, 4.7542724609375, 5.099609375, 5.4449462890625, 5.790283203125, 6.1356201171875, 6.48095703125, 6.8262939453125, 7.171630859375, 7.5169677734375, 7.8623046875, 8.2076416015625, 8.552978515625, 8.8983154296875, 9.24365234375, 9.5889892578125, 9.934326171875, 10.2796630859375, 10.625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 14.0, 10.0, 19.0, 32.0, 56.0, 80.0, 150.0, 241.0, 361.0, 619.0, 1045.0, 1780.0, 3196.0, 5444.0, 9576.0, 16554.0, 28326.0, 47115.0, 74249.0, 107878.0, 138618.0, 152187.0, 142734.0, 113461.0, 79553.0, 51493.0, 30889.0, 18041.0, 10290.0, 6096.0, 3560.0, 1953.0, 1172.0, 685.0, 407.0, 274.0, 149.0, 87.0, 55.0, 34.0, 18.0, 14.0, 18.0, 9.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1171875, -8.819091796875, -8.52099609375, -8.222900390625, -7.9248046875, -7.626708984375, -7.32861328125, -7.030517578125, -6.732421875, -6.434326171875, -6.13623046875, -5.838134765625, -5.5400390625, -5.241943359375, -4.94384765625, -4.645751953125, -4.34765625, -4.049560546875, -3.75146484375, -3.453369140625, -3.1552734375, -2.857177734375, -2.55908203125, -2.260986328125, -1.962890625, -1.664794921875, -1.36669921875, -1.068603515625, -0.7705078125, -0.472412109375, -0.17431640625, 0.123779296875, 0.421875, 0.719970703125, 1.01806640625, 1.316162109375, 1.6142578125, 1.912353515625, 2.21044921875, 2.508544921875, 2.806640625, 3.104736328125, 3.40283203125, 3.700927734375, 3.9990234375, 4.297119140625, 4.59521484375, 4.893310546875, 5.19140625, 5.489501953125, 5.78759765625, 6.085693359375, 6.3837890625, 6.681884765625, 6.97998046875, 7.278076171875, 7.576171875, 7.874267578125, 8.17236328125, 8.470458984375, 8.7685546875, 9.066650390625, 9.36474609375, 9.662841796875, 9.9609375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 10.0, 13.0, 12.0, 6.0, 11.0, 21.0, 23.0, 25.0, 24.0, 24.0, 38.0, 29.0, 42.0, 44.0, 42.0, 49.0, 43.0, 50.0, 45.0, 39.0, 44.0, 36.0, 40.0, 59.0, 40.0, 28.0, 26.0, 27.0, 19.0, 19.0, 17.0, 15.0, 10.0, 9.0, 5.0, 6.0, 8.0, 2.0, 2.0, 0.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.69140625, -7.45263671875, -7.2138671875, -6.97509765625, -6.736328125, -6.49755859375, -6.2587890625, -6.02001953125, -5.78125, -5.54248046875, -5.3037109375, -5.06494140625, -4.826171875, -4.58740234375, -4.3486328125, -4.10986328125, -3.87109375, -3.63232421875, -3.3935546875, -3.15478515625, -2.916015625, -2.67724609375, -2.4384765625, -2.19970703125, -1.9609375, -1.72216796875, -1.4833984375, -1.24462890625, -1.005859375, -0.76708984375, -0.5283203125, -0.28955078125, -0.05078125, 0.18798828125, 0.4267578125, 0.66552734375, 0.904296875, 1.14306640625, 1.3818359375, 1.62060546875, 1.859375, 2.09814453125, 2.3369140625, 2.57568359375, 2.814453125, 3.05322265625, 3.2919921875, 3.53076171875, 3.76953125, 4.00830078125, 4.2470703125, 4.48583984375, 4.724609375, 4.96337890625, 5.2021484375, 5.44091796875, 5.6796875, 5.91845703125, 6.1572265625, 6.39599609375, 6.634765625, 6.87353515625, 7.1123046875, 7.35107421875, 7.58984375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 1.0, 7.0, 6.0, 7.0, 16.0, 21.0, 29.0, 51.0, 90.0, 167.0, 336.0, 505.0, 1054.0, 2183.0, 4504.0, 9948.0, 22851.0, 51562.0, 107650.0, 187164.0, 237765.0, 199397.0, 118404.0, 57495.0, 25902.0, 11325.0, 5148.0, 2360.0, 1189.0, 609.0, 365.0, 158.0, 98.0, 80.0, 39.0, 30.0, 18.0, 8.0, 9.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.68359375, -6.5008544921875, -6.318115234375, -6.1353759765625, -5.95263671875, -5.7698974609375, -5.587158203125, -5.4044189453125, -5.2216796875, -5.0389404296875, -4.856201171875, -4.6734619140625, -4.49072265625, -4.3079833984375, -4.125244140625, -3.9425048828125, -3.759765625, -3.5770263671875, -3.394287109375, -3.2115478515625, -3.02880859375, -2.8460693359375, -2.663330078125, -2.4805908203125, -2.2978515625, -2.1151123046875, -1.932373046875, -1.7496337890625, -1.56689453125, -1.3841552734375, -1.201416015625, -1.0186767578125, -0.8359375, -0.6531982421875, -0.470458984375, -0.2877197265625, -0.10498046875, 0.0777587890625, 0.260498046875, 0.4432373046875, 0.6259765625, 0.8087158203125, 0.991455078125, 1.1741943359375, 1.35693359375, 1.5396728515625, 1.722412109375, 1.9051513671875, 2.087890625, 2.2706298828125, 2.453369140625, 2.6361083984375, 2.81884765625, 3.0015869140625, 3.184326171875, 3.3670654296875, 3.5498046875, 3.7325439453125, 3.915283203125, 4.0980224609375, 4.28076171875, 4.4635009765625, 4.646240234375, 4.8289794921875, 5.01171875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 8.0, 8.0, 12.0, 13.0, 17.0, 14.0, 22.0, 23.0, 42.0, 37.0, 30.0, 57.0, 51.0, 61.0, 78.0, 53.0, 71.0, 52.0, 54.0, 50.0, 46.0, 32.0, 38.0, 29.0, 28.0, 23.0, 9.0, 11.0, 11.0, 4.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004935264587402344, -0.00047822296619415283, -0.0004629194736480713, -0.00044761598110198975, -0.0004323124885559082, -0.00041700899600982666, -0.0004017055034637451, -0.0003864020109176636, -0.00037109851837158203, -0.0003557950258255005, -0.00034049153327941895, -0.0003251880407333374, -0.00030988454818725586, -0.0002945810556411743, -0.0002792775630950928, -0.00026397407054901123, -0.0002486705780029297, -0.00023336708545684814, -0.0002180635929107666, -0.00020276010036468506, -0.00018745660781860352, -0.00017215311527252197, -0.00015684962272644043, -0.0001415461301803589, -0.00012624263763427734, -0.0001109391450881958, -9.563565254211426e-05, -8.033215999603271e-05, -6.502866744995117e-05, -4.972517490386963e-05, -3.4421682357788086e-05, -1.9118189811706543e-05, -3.814697265625e-06, 1.1488795280456543e-05, 2.6792287826538086e-05, 4.209578037261963e-05, 5.739927291870117e-05, 7.270276546478271e-05, 8.800625801086426e-05, 0.0001033097505569458, 0.00011861324310302734, 0.0001339167356491089, 0.00014922022819519043, 0.00016452372074127197, 0.00017982721328735352, 0.00019513070583343506, 0.0002104341983795166, 0.00022573769092559814, 0.0002410411834716797, 0.00025634467601776123, 0.0002716481685638428, 0.0002869516611099243, 0.00030225515365600586, 0.0003175586462020874, 0.00033286213874816895, 0.0003481656312942505, 0.00036346912384033203, 0.0003787726163864136, 0.0003940761089324951, 0.00040937960147857666, 0.0004246830940246582, 0.00043998658657073975, 0.0004552900791168213, 0.00047059357166290283, 0.0004858970642089844]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 9.0, 10.0, 18.0, 29.0, 37.0, 64.0, 110.0, 149.0, 236.0, 354.0, 558.0, 1003.0, 1552.0, 2826.0, 4550.0, 7733.0, 13516.0, 22788.0, 37254.0, 59868.0, 90428.0, 122881.0, 145866.0, 147779.0, 128221.0, 95641.0, 64187.0, 40572.0, 24726.0, 14550.0, 8596.0, 4994.0, 2957.0, 1761.0, 1030.0, 694.0, 394.0, 223.0, 147.0, 103.0, 36.0, 28.0, 35.0, 21.0, 8.0, 8.0, 6.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.767578125, -3.6536865234375, -3.539794921875, -3.4259033203125, -3.31201171875, -3.1981201171875, -3.084228515625, -2.9703369140625, -2.8564453125, -2.7425537109375, -2.628662109375, -2.5147705078125, -2.40087890625, -2.2869873046875, -2.173095703125, -2.0592041015625, -1.9453125, -1.8314208984375, -1.717529296875, -1.6036376953125, -1.48974609375, -1.3758544921875, -1.261962890625, -1.1480712890625, -1.0341796875, -0.9202880859375, -0.806396484375, -0.6925048828125, -0.57861328125, -0.4647216796875, -0.350830078125, -0.2369384765625, -0.123046875, -0.0091552734375, 0.104736328125, 0.2186279296875, 0.33251953125, 0.4464111328125, 0.560302734375, 0.6741943359375, 0.7880859375, 0.9019775390625, 1.015869140625, 1.1297607421875, 1.24365234375, 1.3575439453125, 1.471435546875, 1.5853271484375, 1.69921875, 1.8131103515625, 1.927001953125, 2.0408935546875, 2.15478515625, 2.2686767578125, 2.382568359375, 2.4964599609375, 2.6103515625, 2.7242431640625, 2.838134765625, 2.9520263671875, 3.06591796875, 3.1798095703125, 3.293701171875, 3.4075927734375, 3.521484375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 6.0, 7.0, 5.0, 10.0, 8.0, 11.0, 13.0, 15.0, 22.0, 28.0, 27.0, 23.0, 27.0, 35.0, 45.0, 27.0, 47.0, 51.0, 40.0, 49.0, 44.0, 46.0, 41.0, 38.0, 41.0, 32.0, 30.0, 32.0, 26.0, 28.0, 25.0, 23.0, 15.0, 16.0, 19.0, 8.0, 8.0, 5.0, 3.0, 5.0, 4.0, 3.0, 4.0, 5.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.1640625, -1.1301116943359375, -1.096160888671875, -1.0622100830078125, -1.02825927734375, -0.9943084716796875, -0.960357666015625, -0.9264068603515625, -0.8924560546875, -0.8585052490234375, -0.824554443359375, -0.7906036376953125, -0.75665283203125, -0.7227020263671875, -0.688751220703125, -0.6548004150390625, -0.620849609375, -0.5868988037109375, -0.552947998046875, -0.5189971923828125, -0.48504638671875, -0.4510955810546875, -0.417144775390625, -0.3831939697265625, -0.3492431640625, -0.3152923583984375, -0.281341552734375, -0.2473907470703125, -0.21343994140625, -0.1794891357421875, -0.145538330078125, -0.1115875244140625, -0.07763671875, -0.0436859130859375, -0.009735107421875, 0.0242156982421875, 0.05816650390625, 0.0921173095703125, 0.126068115234375, 0.1600189208984375, 0.1939697265625, 0.2279205322265625, 0.261871337890625, 0.2958221435546875, 0.32977294921875, 0.3637237548828125, 0.397674560546875, 0.4316253662109375, 0.465576171875, 0.4995269775390625, 0.533477783203125, 0.5674285888671875, 0.60137939453125, 0.6353302001953125, 0.669281005859375, 0.7032318115234375, 0.7371826171875, 0.7711334228515625, 0.805084228515625, 0.8390350341796875, 0.87298583984375, 0.9069366455078125, 0.940887451171875, 0.9748382568359375, 1.0087890625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 2.0, 7.0, 4.0, 6.0, 2.0, 8.0, 8.0, 10.0, 15.0, 13.0, 18.0, 19.0, 23.0, 27.0, 25.0, 35.0, 28.0, 42.0, 46.0, 53.0, 42.0, 36.0, 49.0, 51.0, 43.0, 43.0, 41.0, 42.0, 33.0, 38.0, 29.0, 25.0, 24.0, 20.0, 24.0, 16.0, 11.0, 12.0, 5.0, 10.0, 6.0, 3.0, 4.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.13676643371582, -9.825839042663574, -9.514912605285645, -9.203985214233398, -8.893057823181152, -8.582130432128906, -8.271203994750977, -7.9602766036987305, -7.649349689483643, -7.338422775268555, -7.027495384216309, -6.716568470001221, -6.405641555786133, -6.094714164733887, -5.783787250518799, -5.472860336303711, -5.161932945251465, -4.851006031036377, -4.540078639984131, -4.229151725769043, -3.918224573135376, -3.607297420501709, -3.296370506286621, -2.985443353652954, -2.674516201019287, -2.36358904838562, -2.052661895751953, -1.7417349815368652, -1.4308078289031982, -1.1198806762695312, -0.8089536428451538, -0.49802660942077637, -0.18709850311279297, 0.12382858991622925, 0.43475568294525146, 0.7456827759742737, 1.056609869003296, 1.367537021636963, 1.6784640550613403, 1.9893910884857178, 2.3003182411193848, 2.6112453937530518, 2.9221725463867188, 3.2330994606018066, 3.5440266132354736, 3.8549537658691406, 4.1658806800842285, 4.476807594299316, 4.7877349853515625, 5.09866189956665, 5.4095892906188965, 5.720516204833984, 6.0314435958862305, 6.342370510101318, 6.653297424316406, 6.964224815368652, 7.27515172958374, 7.586078643798828, 7.897006034851074, 8.20793342590332, 8.51885986328125, 8.829787254333496, 9.140714645385742, 9.451641082763672, 9.762568473815918]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 2.0, 4.0, 6.0, 10.0, 9.0, 13.0, 11.0, 15.0, 21.0, 22.0, 26.0, 25.0, 24.0, 43.0, 38.0, 36.0, 42.0, 47.0, 38.0, 46.0, 49.0, 31.0, 49.0, 48.0, 45.0, 39.0, 30.0, 30.0, 23.0, 28.0, 16.0, 18.0, 13.0, 17.0, 15.0, 10.0, 9.0, 17.0, 14.0, 3.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.968842506408691, -9.619991302490234, -9.271141052246094, -8.922289848327637, -8.57343864440918, -8.224588394165039, -7.875737190246582, -7.526886463165283, -7.178035736083984, -6.8291850090026855, -6.480334281921387, -6.13148307800293, -5.782632350921631, -5.433781623840332, -5.084930419921875, -4.736079692840576, -4.387228965759277, -4.0383782386779785, -3.6895272731781006, -3.3406763076782227, -2.991825580596924, -2.642974853515625, -2.294123888015747, -1.9452729225158691, -1.5964221954345703, -1.247571349143982, -0.8987205028533936, -0.5498696565628052, -0.2010188102722168, 0.14783203601837158, 0.49668288230895996, 0.8455338478088379, 1.1943845748901367, 1.543235421180725, 1.8920862674713135, 2.2409372329711914, 2.5897879600524902, 2.938638687133789, 3.287489652633667, 3.636340618133545, 3.9851913452148438, 4.334042072296143, 4.682892799377441, 5.031744003295898, 5.380594730377197, 5.729445457458496, 6.078296661376953, 6.427147388458252, 6.775998115539551, 7.12484884262085, 7.473699569702148, 7.8225507736206055, 8.171401977539062, 8.520252227783203, 8.86910343170166, 9.217954635620117, 9.566804885864258, 9.915656089782715, 10.264506340026855, 10.613357543945312, 10.962207794189453, 11.31105899810791, 11.659910202026367, 12.008760452270508, 12.357611656188965]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 7.0, 8.0, 16.0, 29.0, 38.0, 73.0, 113.0, 200.0, 295.0, 469.0, 712.0, 1119.0, 1794.0, 2678.0, 4239.0, 6736.0, 10418.0, 16480.0, 25853.0, 41913.0, 67370.0, 110829.0, 180355.0, 286312.0, 419400.0, 547881.0, 610568.0, 571933.0, 453369.0, 314218.0, 199344.0, 121591.0, 74013.0, 45439.0, 27903.0, 17778.0, 11328.0, 7288.0, 4824.0, 3102.0, 2082.0, 1447.0, 955.0, 629.0, 390.0, 260.0, 175.0, 132.0, 56.0, 43.0, 26.0, 21.0, 10.0, 10.0, 11.0, 3.0, 4.0, 3.0], "bins": [-6.91015625, -6.6982421875, -6.486328125, -6.2744140625, -6.0625, -5.8505859375, -5.638671875, -5.4267578125, -5.21484375, -5.0029296875, -4.791015625, -4.5791015625, -4.3671875, -4.1552734375, -3.943359375, -3.7314453125, -3.51953125, -3.3076171875, -3.095703125, -2.8837890625, -2.671875, -2.4599609375, -2.248046875, -2.0361328125, -1.82421875, -1.6123046875, -1.400390625, -1.1884765625, -0.9765625, -0.7646484375, -0.552734375, -0.3408203125, -0.12890625, 0.0830078125, 0.294921875, 0.5068359375, 0.71875, 0.9306640625, 1.142578125, 1.3544921875, 1.56640625, 1.7783203125, 1.990234375, 2.2021484375, 2.4140625, 2.6259765625, 2.837890625, 3.0498046875, 3.26171875, 3.4736328125, 3.685546875, 3.8974609375, 4.109375, 4.3212890625, 4.533203125, 4.7451171875, 4.95703125, 5.1689453125, 5.380859375, 5.5927734375, 5.8046875, 6.0166015625, 6.228515625, 6.4404296875, 6.65234375]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 11.0, 5.0, 12.0, 14.0, 11.0, 13.0, 23.0, 24.0, 27.0, 31.0, 31.0, 42.0, 44.0, 42.0, 43.0, 55.0, 40.0, 43.0, 48.0, 42.0, 49.0, 39.0, 53.0, 35.0, 33.0, 28.0, 22.0, 23.0, 17.0, 15.0, 17.0, 14.0, 17.0, 12.0, 5.0, 8.0, 7.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7421875, -9.42822265625, -9.1142578125, -8.80029296875, -8.486328125, -8.17236328125, -7.8583984375, -7.54443359375, -7.23046875, -6.91650390625, -6.6025390625, -6.28857421875, -5.974609375, -5.66064453125, -5.3466796875, -5.03271484375, -4.71875, -4.40478515625, -4.0908203125, -3.77685546875, -3.462890625, -3.14892578125, -2.8349609375, -2.52099609375, -2.20703125, -1.89306640625, -1.5791015625, -1.26513671875, -0.951171875, -0.63720703125, -0.3232421875, -0.00927734375, 0.3046875, 0.61865234375, 0.9326171875, 1.24658203125, 1.560546875, 1.87451171875, 2.1884765625, 2.50244140625, 2.81640625, 3.13037109375, 3.4443359375, 3.75830078125, 4.072265625, 4.38623046875, 4.7001953125, 5.01416015625, 5.328125, 5.64208984375, 5.9560546875, 6.27001953125, 6.583984375, 6.89794921875, 7.2119140625, 7.52587890625, 7.83984375, 8.15380859375, 8.4677734375, 8.78173828125, 9.095703125, 9.40966796875, 9.7236328125, 10.03759765625, 10.3515625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 11.0, 22.0, 14.0, 23.0, 51.0, 91.0, 109.0, 171.0, 285.0, 474.0, 723.0, 1142.0, 1753.0, 2851.0, 4522.0, 7388.0, 12164.0, 20057.0, 32703.0, 53753.0, 87728.0, 142997.0, 229806.0, 353513.0, 503164.0, 621722.0, 625910.0, 511948.0, 362126.0, 236510.0, 148549.0, 90327.0, 55029.0, 33227.0, 20599.0, 12395.0, 7761.0, 4717.0, 2911.0, 1870.0, 1146.0, 755.0, 466.0, 294.0, 178.0, 137.0, 71.0, 36.0, 33.0, 20.0, 15.0, 10.0, 7.0, 6.0, 0.0, 1.0, 1.0, 3.0], "bins": [-8.4453125, -8.181640625, -7.91796875, -7.654296875, -7.390625, -7.126953125, -6.86328125, -6.599609375, -6.3359375, -6.072265625, -5.80859375, -5.544921875, -5.28125, -5.017578125, -4.75390625, -4.490234375, -4.2265625, -3.962890625, -3.69921875, -3.435546875, -3.171875, -2.908203125, -2.64453125, -2.380859375, -2.1171875, -1.853515625, -1.58984375, -1.326171875, -1.0625, -0.798828125, -0.53515625, -0.271484375, -0.0078125, 0.255859375, 0.51953125, 0.783203125, 1.046875, 1.310546875, 1.57421875, 1.837890625, 2.1015625, 2.365234375, 2.62890625, 2.892578125, 3.15625, 3.419921875, 3.68359375, 3.947265625, 4.2109375, 4.474609375, 4.73828125, 5.001953125, 5.265625, 5.529296875, 5.79296875, 6.056640625, 6.3203125, 6.583984375, 6.84765625, 7.111328125, 7.375, 7.638671875, 7.90234375, 8.166015625, 8.4296875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 8.0, 5.0, 7.0, 14.0, 11.0, 20.0, 30.0, 23.0, 39.0, 46.0, 66.0, 58.0, 93.0, 90.0, 105.0, 136.0, 145.0, 140.0, 172.0, 222.0, 222.0, 221.0, 228.0, 213.0, 204.0, 206.0, 196.0, 161.0, 162.0, 130.0, 127.0, 119.0, 98.0, 76.0, 56.0, 51.0, 30.0, 23.0, 27.0, 16.0, 16.0, 14.0, 10.0, 9.0, 10.0, 6.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.48828125, -3.3790283203125, -3.269775390625, -3.1605224609375, -3.05126953125, -2.9420166015625, -2.832763671875, -2.7235107421875, -2.6142578125, -2.5050048828125, -2.395751953125, -2.2864990234375, -2.17724609375, -2.0679931640625, -1.958740234375, -1.8494873046875, -1.740234375, -1.6309814453125, -1.521728515625, -1.4124755859375, -1.30322265625, -1.1939697265625, -1.084716796875, -0.9754638671875, -0.8662109375, -0.7569580078125, -0.647705078125, -0.5384521484375, -0.42919921875, -0.3199462890625, -0.210693359375, -0.1014404296875, 0.0078125, 0.1170654296875, 0.226318359375, 0.3355712890625, 0.44482421875, 0.5540771484375, 0.663330078125, 0.7725830078125, 0.8818359375, 0.9910888671875, 1.100341796875, 1.2095947265625, 1.31884765625, 1.4281005859375, 1.537353515625, 1.6466064453125, 1.755859375, 1.8651123046875, 1.974365234375, 2.0836181640625, 2.19287109375, 2.3021240234375, 2.411376953125, 2.5206298828125, 2.6298828125, 2.7391357421875, 2.848388671875, 2.9576416015625, 3.06689453125, 3.1761474609375, 3.285400390625, 3.3946533203125, 3.50390625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 6.0, 6.0, 6.0, 4.0, 11.0, 13.0, 7.0, 16.0, 17.0, 20.0, 30.0, 33.0, 39.0, 36.0, 32.0, 42.0, 50.0, 53.0, 38.0, 47.0, 45.0, 43.0, 46.0, 56.0, 48.0, 33.0, 39.0, 32.0, 25.0, 16.0, 18.0, 12.0, 14.0, 17.0, 8.0, 12.0, 5.0, 5.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.56261920928955, -9.249836921691895, -8.937055587768555, -8.624273300170898, -8.311491012573242, -7.998709201812744, -7.685927391052246, -7.37314510345459, -7.060363292694092, -6.747581481933594, -6.4347991943359375, -6.1220173835754395, -5.809235572814941, -5.496453285217285, -5.183671474456787, -4.870889663696289, -4.558107376098633, -4.245325565338135, -3.9325432777404785, -3.6197614669799805, -3.3069794178009033, -2.994197368621826, -2.681415557861328, -2.368633508682251, -2.055851459503174, -1.7430694103240967, -1.430287480354309, -1.1175055503845215, -0.8047235012054443, -0.4919414520263672, -0.1791595220565796, 0.133622407913208, 0.44640445709228516, 0.7591864466667175, 1.07196843624115, 1.3847503662109375, 1.6975324153900146, 2.010314464569092, 2.32309627532959, 2.635878324508667, 2.948660373687744, 3.2614424228668213, 3.5742244720458984, 3.8870062828063965, 4.1997880935668945, 4.512570381164551, 4.825352191925049, 5.138134002685547, 5.450916290283203, 5.763698101043701, 6.076480388641357, 6.3892621994018555, 6.702044486999512, 7.01482629776001, 7.327608108520508, 7.640390396118164, 7.953172206878662, 8.26595401763916, 8.578736305236816, 8.891518592834473, 9.204299926757812, 9.517082214355469, 9.829864501953125, 10.142645835876465, 10.455428123474121]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 7.0, 6.0, 10.0, 7.0, 5.0, 9.0, 11.0, 20.0, 17.0, 19.0, 27.0, 41.0, 33.0, 45.0, 33.0, 35.0, 37.0, 52.0, 49.0, 47.0, 47.0, 54.0, 51.0, 31.0, 31.0, 39.0, 34.0, 28.0, 28.0, 21.0, 28.0, 13.0, 18.0, 13.0, 14.0, 10.0, 7.0, 10.0, 7.0, 5.0, 1.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.06818962097168, -9.72366714477539, -9.379143714904785, -9.034621238708496, -8.69009780883789, -8.345575332641602, -8.001052856445312, -7.656529426574707, -7.31200647354126, -6.9674835205078125, -6.622960567474365, -6.278437614440918, -5.933915138244629, -5.589391708374023, -5.244869232177734, -4.900346279144287, -4.55582332611084, -4.211300373077393, -3.8667774200439453, -3.522254705429077, -3.17773175239563, -2.8332087993621826, -2.4886860847473145, -2.144163131713867, -1.79964017868042, -1.4551172256469727, -1.110594391822815, -0.7660715579986572, -0.42154860496520996, -0.0770256519317627, 0.26749706268310547, 0.6120200157165527, 0.95654296875, 1.3010659217834473, 1.645588755607605, 1.9901115894317627, 2.33463454246521, 2.6791574954986572, 3.0236802101135254, 3.3682031631469727, 3.71272611618042, 4.057249069213867, 4.4017720222473145, 4.746294975280762, 5.090817451477051, 5.435340881347656, 5.779863357543945, 6.124386310577393, 6.46890926361084, 6.813432216644287, 7.157955169677734, 7.502477645874023, 7.847001075744629, 8.191523551940918, 8.536046981811523, 8.880569458007812, 9.225091934204102, 9.56961441040039, 9.914137840270996, 10.258660316467285, 10.60318374633789, 10.94770622253418, 11.292228698730469, 11.636752128601074, 11.98127555847168]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [5.0, 2.0, 7.0, 4.0, 13.0, 12.0, 16.0, 34.0, 54.0, 63.0, 103.0, 125.0, 214.0, 301.0, 478.0, 675.0, 1078.0, 1665.0, 2460.0, 3676.0, 5703.0, 8702.0, 13527.0, 20553.0, 30856.0, 45071.0, 64265.0, 86820.0, 109468.0, 124633.0, 124213.0, 111034.0, 88662.0, 65332.0, 46180.0, 31465.0, 20917.0, 13895.0, 9027.0, 5972.0, 3834.0, 2461.0, 1753.0, 1109.0, 731.0, 445.0, 307.0, 202.0, 136.0, 95.0, 74.0, 47.0, 27.0, 25.0, 17.0, 12.0, 7.0, 8.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.546875, -5.3621826171875, -5.177490234375, -4.9927978515625, -4.80810546875, -4.6234130859375, -4.438720703125, -4.2540283203125, -4.0693359375, -3.8846435546875, -3.699951171875, -3.5152587890625, -3.33056640625, -3.1458740234375, -2.961181640625, -2.7764892578125, -2.591796875, -2.4071044921875, -2.222412109375, -2.0377197265625, -1.85302734375, -1.6683349609375, -1.483642578125, -1.2989501953125, -1.1142578125, -0.9295654296875, -0.744873046875, -0.5601806640625, -0.37548828125, -0.1907958984375, -0.006103515625, 0.1785888671875, 0.36328125, 0.5479736328125, 0.732666015625, 0.9173583984375, 1.10205078125, 1.2867431640625, 1.471435546875, 1.6561279296875, 1.8408203125, 2.0255126953125, 2.210205078125, 2.3948974609375, 2.57958984375, 2.7642822265625, 2.948974609375, 3.1336669921875, 3.318359375, 3.5030517578125, 3.687744140625, 3.8724365234375, 4.05712890625, 4.2418212890625, 4.426513671875, 4.6112060546875, 4.7958984375, 4.9805908203125, 5.165283203125, 5.3499755859375, 5.53466796875, 5.7193603515625, 5.904052734375, 6.0887451171875, 6.2734375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 6.0, 6.0, 7.0, 5.0, 13.0, 11.0, 18.0, 21.0, 18.0, 21.0, 33.0, 32.0, 34.0, 50.0, 51.0, 40.0, 39.0, 47.0, 43.0, 47.0, 47.0, 42.0, 41.0, 36.0, 45.0, 34.0, 34.0, 23.0, 27.0, 13.0, 24.0, 12.0, 14.0, 12.0, 14.0, 8.0, 8.0, 5.0, 5.0, 7.0, 2.0, 0.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0078125, -10.6561279296875, -10.304443359375, -9.9527587890625, -9.60107421875, -9.2493896484375, -8.897705078125, -8.5460205078125, -8.1943359375, -7.8426513671875, -7.490966796875, -7.1392822265625, -6.78759765625, -6.4359130859375, -6.084228515625, -5.7325439453125, -5.380859375, -5.0291748046875, -4.677490234375, -4.3258056640625, -3.97412109375, -3.6224365234375, -3.270751953125, -2.9190673828125, -2.5673828125, -2.2156982421875, -1.864013671875, -1.5123291015625, -1.16064453125, -0.8089599609375, -0.457275390625, -0.1055908203125, 0.24609375, 0.5977783203125, 0.949462890625, 1.3011474609375, 1.65283203125, 2.0045166015625, 2.356201171875, 2.7078857421875, 3.0595703125, 3.4112548828125, 3.762939453125, 4.1146240234375, 4.46630859375, 4.8179931640625, 5.169677734375, 5.5213623046875, 5.873046875, 6.2247314453125, 6.576416015625, 6.9281005859375, 7.27978515625, 7.6314697265625, 7.983154296875, 8.3348388671875, 8.6865234375, 9.0382080078125, 9.389892578125, 9.7415771484375, 10.09326171875, 10.4449462890625, 10.796630859375, 11.1483154296875, 11.5]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 3.0, 7.0, 2.0, 15.0, 10.0, 18.0, 23.0, 42.0, 56.0, 81.0, 145.0, 167.0, 298.0, 458.0, 762.0, 1222.0, 2107.0, 3805.0, 6748.0, 13074.0, 26869.0, 56468.0, 117195.0, 211994.0, 253921.0, 176494.0, 89579.0, 43040.0, 20733.0, 10184.0, 5458.0, 2986.0, 1725.0, 1001.0, 671.0, 365.0, 265.0, 156.0, 138.0, 82.0, 56.0, 37.0, 24.0, 25.0, 9.0, 11.0, 11.0, 5.0, 3.0, 2.0, 5.0, 5.0], "bins": [-15.1015625, -14.6856689453125, -14.269775390625, -13.8538818359375, -13.43798828125, -13.0220947265625, -12.606201171875, -12.1903076171875, -11.7744140625, -11.3585205078125, -10.942626953125, -10.5267333984375, -10.11083984375, -9.6949462890625, -9.279052734375, -8.8631591796875, -8.447265625, -8.0313720703125, -7.615478515625, -7.1995849609375, -6.78369140625, -6.3677978515625, -5.951904296875, -5.5360107421875, -5.1201171875, -4.7042236328125, -4.288330078125, -3.8724365234375, -3.45654296875, -3.0406494140625, -2.624755859375, -2.2088623046875, -1.79296875, -1.3770751953125, -0.961181640625, -0.5452880859375, -0.12939453125, 0.2864990234375, 0.702392578125, 1.1182861328125, 1.5341796875, 1.9500732421875, 2.365966796875, 2.7818603515625, 3.19775390625, 3.6136474609375, 4.029541015625, 4.4454345703125, 4.861328125, 5.2772216796875, 5.693115234375, 6.1090087890625, 6.52490234375, 6.9407958984375, 7.356689453125, 7.7725830078125, 8.1884765625, 8.6043701171875, 9.020263671875, 9.4361572265625, 9.85205078125, 10.2679443359375, 10.683837890625, 11.0997314453125, 11.515625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 7.0, 4.0, 4.0, 9.0, 7.0, 13.0, 11.0, 10.0, 14.0, 20.0, 20.0, 17.0, 28.0, 29.0, 29.0, 33.0, 29.0, 38.0, 40.0, 46.0, 48.0, 50.0, 47.0, 42.0, 38.0, 38.0, 44.0, 33.0, 31.0, 26.0, 23.0, 28.0, 24.0, 21.0, 14.0, 17.0, 11.0, 10.0, 10.0, 11.0, 13.0, 8.0, 2.0, 2.0, 4.0, 5.0, 1.0, 6.0], "bins": [-7.93359375, -7.72357177734375, -7.5135498046875, -7.30352783203125, -7.093505859375, -6.88348388671875, -6.6734619140625, -6.46343994140625, -6.25341796875, -6.04339599609375, -5.8333740234375, -5.62335205078125, -5.413330078125, -5.20330810546875, -4.9932861328125, -4.78326416015625, -4.5732421875, -4.36322021484375, -4.1531982421875, -3.94317626953125, -3.733154296875, -3.52313232421875, -3.3131103515625, -3.10308837890625, -2.89306640625, -2.68304443359375, -2.4730224609375, -2.26300048828125, -2.052978515625, -1.84295654296875, -1.6329345703125, -1.42291259765625, -1.212890625, -1.00286865234375, -0.7928466796875, -0.58282470703125, -0.372802734375, -0.16278076171875, 0.0472412109375, 0.25726318359375, 0.46728515625, 0.67730712890625, 0.8873291015625, 1.09735107421875, 1.307373046875, 1.51739501953125, 1.7274169921875, 1.93743896484375, 2.1474609375, 2.35748291015625, 2.5675048828125, 2.77752685546875, 2.987548828125, 3.19757080078125, 3.4075927734375, 3.61761474609375, 3.82763671875, 4.03765869140625, 4.2476806640625, 4.45770263671875, 4.667724609375, 4.87774658203125, 5.0877685546875, 5.29779052734375, 5.5078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 8.0, 11.0, 17.0, 12.0, 17.0, 45.0, 57.0, 70.0, 140.0, 181.0, 286.0, 424.0, 649.0, 1111.0, 1902.0, 3289.0, 5776.0, 10223.0, 19155.0, 36225.0, 69509.0, 127857.0, 200064.0, 218853.0, 158321.0, 90984.0, 47811.0, 24956.0, 13118.0, 7301.0, 4073.0, 2382.0, 1411.0, 844.0, 523.0, 318.0, 193.0, 130.0, 98.0, 62.0, 37.0, 34.0, 19.0, 22.0, 12.0, 3.0, 10.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.18359375, -5.02264404296875, -4.8616943359375, -4.70074462890625, -4.539794921875, -4.37884521484375, -4.2178955078125, -4.05694580078125, -3.89599609375, -3.73504638671875, -3.5740966796875, -3.41314697265625, -3.252197265625, -3.09124755859375, -2.9302978515625, -2.76934814453125, -2.6083984375, -2.44744873046875, -2.2864990234375, -2.12554931640625, -1.964599609375, -1.80364990234375, -1.6427001953125, -1.48175048828125, -1.32080078125, -1.15985107421875, -0.9989013671875, -0.83795166015625, -0.677001953125, -0.51605224609375, -0.3551025390625, -0.19415283203125, -0.033203125, 0.12774658203125, 0.2886962890625, 0.44964599609375, 0.610595703125, 0.77154541015625, 0.9324951171875, 1.09344482421875, 1.25439453125, 1.41534423828125, 1.5762939453125, 1.73724365234375, 1.898193359375, 2.05914306640625, 2.2200927734375, 2.38104248046875, 2.5419921875, 2.70294189453125, 2.8638916015625, 3.02484130859375, 3.185791015625, 3.34674072265625, 3.5076904296875, 3.66864013671875, 3.82958984375, 3.99053955078125, 4.1514892578125, 4.31243896484375, 4.473388671875, 4.63433837890625, 4.7952880859375, 4.95623779296875, 5.1171875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 0.0, 1.0, 6.0, 4.0, 2.0, 3.0, 6.0, 1.0, 10.0, 13.0, 14.0, 17.0, 15.0, 17.0, 31.0, 34.0, 35.0, 36.0, 50.0, 52.0, 63.0, 64.0, 52.0, 49.0, 63.0, 60.0, 60.0, 40.0, 29.0, 27.0, 32.0, 23.0, 18.0, 14.0, 11.0, 11.0, 8.0, 8.0, 2.0, 10.0, 5.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00027298927307128906, -0.0002635084092617035, -0.0002540275454521179, -0.00024454668164253235, -0.00023506581783294678, -0.0002255849540233612, -0.00021610409021377563, -0.00020662322640419006, -0.0001971423625946045, -0.00018766149878501892, -0.00017818063497543335, -0.00016869977116584778, -0.0001592189073562622, -0.00014973804354667664, -0.00014025717973709106, -0.0001307763159275055, -0.00012129545211791992, -0.00011181458830833435, -0.00010233372449874878, -9.285286068916321e-05, -8.337199687957764e-05, -7.389113306999207e-05, -6.44102692604065e-05, -5.492940545082092e-05, -4.544854164123535e-05, -3.596767783164978e-05, -2.648681402206421e-05, -1.7005950212478638e-05, -7.525086402893066e-06, 1.955777406692505e-06, 1.1436641216278076e-05, 2.0917505025863647e-05, 3.039836883544922e-05, 3.987923264503479e-05, 4.936009645462036e-05, 5.884096026420593e-05, 6.83218240737915e-05, 7.780268788337708e-05, 8.728355169296265e-05, 9.676441550254822e-05, 0.00010624527931213379, 0.00011572614312171936, 0.00012520700693130493, 0.0001346878707408905, 0.00014416873455047607, 0.00015364959836006165, 0.00016313046216964722, 0.0001726113259792328, 0.00018209218978881836, 0.00019157305359840393, 0.0002010539174079895, 0.00021053478121757507, 0.00022001564502716064, 0.00022949650883674622, 0.0002389773726463318, 0.00024845823645591736, 0.00025793910026550293, 0.0002674199640750885, 0.00027690082788467407, 0.00028638169169425964, 0.0002958625555038452, 0.0003053434193134308, 0.00031482428312301636, 0.00032430514693260193, 0.0003337860107421875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 6.0, 19.0, 15.0, 17.0, 33.0, 46.0, 74.0, 112.0, 157.0, 253.0, 356.0, 577.0, 850.0, 1353.0, 2063.0, 3205.0, 4843.0, 7553.0, 11964.0, 18091.0, 28209.0, 43142.0, 65661.0, 93533.0, 122494.0, 140212.0, 136872.0, 114918.0, 84719.0, 58230.0, 38472.0, 24995.0, 15908.0, 10548.0, 6635.0, 4293.0, 2787.0, 1837.0, 1214.0, 783.0, 504.0, 313.0, 243.0, 158.0, 95.0, 69.0, 40.0, 31.0, 16.0, 13.0, 14.0, 4.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0], "bins": [-3.908203125, -3.7855224609375, -3.662841796875, -3.5401611328125, -3.41748046875, -3.2947998046875, -3.172119140625, -3.0494384765625, -2.9267578125, -2.8040771484375, -2.681396484375, -2.5587158203125, -2.43603515625, -2.3133544921875, -2.190673828125, -2.0679931640625, -1.9453125, -1.8226318359375, -1.699951171875, -1.5772705078125, -1.45458984375, -1.3319091796875, -1.209228515625, -1.0865478515625, -0.9638671875, -0.8411865234375, -0.718505859375, -0.5958251953125, -0.47314453125, -0.3504638671875, -0.227783203125, -0.1051025390625, 0.017578125, 0.1402587890625, 0.262939453125, 0.3856201171875, 0.50830078125, 0.6309814453125, 0.753662109375, 0.8763427734375, 0.9990234375, 1.1217041015625, 1.244384765625, 1.3670654296875, 1.48974609375, 1.6124267578125, 1.735107421875, 1.8577880859375, 1.98046875, 2.1031494140625, 2.225830078125, 2.3485107421875, 2.47119140625, 2.5938720703125, 2.716552734375, 2.8392333984375, 2.9619140625, 3.0845947265625, 3.207275390625, 3.3299560546875, 3.45263671875, 3.5753173828125, 3.697998046875, 3.8206787109375, 3.943359375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 7.0, 9.0, 6.0, 9.0, 11.0, 15.0, 17.0, 30.0, 29.0, 28.0, 31.0, 35.0, 33.0, 58.0, 48.0, 58.0, 52.0, 57.0, 59.0, 50.0, 53.0, 38.0, 36.0, 41.0, 29.0, 31.0, 28.0, 12.0, 12.0, 17.0, 17.0, 10.0, 8.0, 5.0, 6.0, 3.0, 0.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.634765625, -1.58538818359375, -1.5360107421875, -1.48663330078125, -1.437255859375, -1.38787841796875, -1.3385009765625, -1.28912353515625, -1.23974609375, -1.19036865234375, -1.1409912109375, -1.09161376953125, -1.042236328125, -0.99285888671875, -0.9434814453125, -0.89410400390625, -0.8447265625, -0.79534912109375, -0.7459716796875, -0.69659423828125, -0.647216796875, -0.59783935546875, -0.5484619140625, -0.49908447265625, -0.44970703125, -0.40032958984375, -0.3509521484375, -0.30157470703125, -0.252197265625, -0.20281982421875, -0.1534423828125, -0.10406494140625, -0.0546875, -0.00531005859375, 0.0440673828125, 0.09344482421875, 0.142822265625, 0.19219970703125, 0.2415771484375, 0.29095458984375, 0.34033203125, 0.38970947265625, 0.4390869140625, 0.48846435546875, 0.537841796875, 0.58721923828125, 0.6365966796875, 0.68597412109375, 0.7353515625, 0.78472900390625, 0.8341064453125, 0.88348388671875, 0.932861328125, 0.98223876953125, 1.0316162109375, 1.08099365234375, 1.13037109375, 1.17974853515625, 1.2291259765625, 1.27850341796875, 1.327880859375, 1.37725830078125, 1.4266357421875, 1.47601318359375, 1.525390625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 8.0, 1.0, 6.0, 5.0, 7.0, 12.0, 10.0, 13.0, 15.0, 23.0, 25.0, 29.0, 34.0, 40.0, 31.0, 51.0, 38.0, 43.0, 43.0, 45.0, 46.0, 49.0, 57.0, 50.0, 43.0, 41.0, 41.0, 42.0, 28.0, 16.0, 17.0, 15.0, 18.0, 8.0, 14.0, 7.0, 6.0, 10.0, 3.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.186450958251953, -9.86924934387207, -9.552048683166504, -9.234847068786621, -8.917645454406738, -8.600444793701172, -8.283243179321289, -7.966041564941406, -7.648840427398682, -7.331639289855957, -7.014437675476074, -6.69723653793335, -6.380035400390625, -6.062833786010742, -5.745632648468018, -5.428431510925293, -5.11122989654541, -4.7940287590026855, -4.476827144622803, -4.159626007080078, -3.8424246311187744, -3.5252232551574707, -3.208022117614746, -2.8908207416534424, -2.5736193656921387, -2.256417989730835, -1.9392167329788208, -1.6220154762268066, -1.304814100265503, -0.9876127243041992, -0.6704114675521851, -0.3532102108001709, -0.03600788116455078, 0.28119343519210815, 0.5983947515487671, 0.915596067905426, 1.232797384262085, 1.5499987602233887, 1.8672000169754028, 2.184401273727417, 2.5016026496887207, 2.8188040256500244, 3.136005401611328, 3.4532065391540527, 3.7704079151153564, 4.08760929107666, 4.404810428619385, 4.722011566162109, 5.039213180541992, 5.356414318084717, 5.6736159324646, 5.990817070007324, 6.308018684387207, 6.625219821929932, 6.942420959472656, 7.259622573852539, 7.576823711395264, 7.894024848937988, 8.211226463317871, 8.528428077697754, 8.84562873840332, 9.162830352783203, 9.480031967163086, 9.797232627868652, 10.114434242248535]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 10.0, 3.0, 5.0, 10.0, 15.0, 5.0, 6.0, 13.0, 22.0, 22.0, 27.0, 35.0, 31.0, 46.0, 40.0, 37.0, 42.0, 46.0, 51.0, 37.0, 52.0, 60.0, 42.0, 34.0, 36.0, 33.0, 36.0, 32.0, 28.0, 26.0, 19.0, 18.0, 15.0, 15.0, 18.0, 9.0, 4.0, 9.0, 4.0, 5.0, 4.0, 2.0, 3.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.89285659790039, -9.553511619567871, -9.214167594909668, -8.874822616577148, -8.535477638244629, -8.19613265991211, -7.856788635253906, -7.517443656921387, -7.178098678588867, -6.838754177093506, -6.499409198760986, -6.160064697265625, -5.8207197189331055, -5.481375217437744, -5.142030715942383, -4.802685737609863, -4.463341236114502, -4.123996734619141, -3.784651756286621, -3.4453072547912598, -3.1059622764587402, -2.766617774963379, -2.4272730350494385, -2.087928295135498, -1.7485835552215576, -1.4092388153076172, -1.0698940753936768, -0.7305494546890259, -0.39120471477508545, -0.05185997486114502, 0.28748464584350586, 0.6268293857574463, 0.9661741256713867, 1.3055188655853271, 1.6448636054992676, 1.9842082262039185, 2.3235530853271484, 2.6628975868225098, 3.00224232673645, 3.3415870666503906, 3.680931806564331, 4.0202765464782715, 4.359621047973633, 4.698966026306152, 5.038310527801514, 5.377655506134033, 5.7170000076293945, 6.056344985961914, 6.395689487457275, 6.735033988952637, 7.074378967285156, 7.413723468780518, 7.753068447113037, 8.092412948608398, 8.431757926940918, 8.771102905273438, 9.11044692993164, 9.44979190826416, 9.789135932922363, 10.128480911254883, 10.467825889587402, 10.807170867919922, 11.146514892578125, 11.485859870910645, 11.825204849243164]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 11.0, 11.0, 24.0, 23.0, 35.0, 65.0, 103.0, 184.0, 273.0, 491.0, 804.0, 1386.0, 2330.0, 3957.0, 6659.0, 11144.0, 17943.0, 28223.0, 43781.0, 62918.0, 85150.0, 105630.0, 120937.0, 124341.0, 115018.0, 96272.0, 73705.0, 52588.0, 35564.0, 23330.0, 14555.0, 8461.0, 5142.0, 3055.0, 1821.0, 1044.0, 603.0, 400.0, 240.0, 135.0, 75.0, 46.0, 36.0, 16.0, 16.0, 13.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.609375, -6.40447998046875, -6.1995849609375, -5.99468994140625, -5.789794921875, -5.58489990234375, -5.3800048828125, -5.17510986328125, -4.97021484375, -4.76531982421875, -4.5604248046875, -4.35552978515625, -4.150634765625, -3.94573974609375, -3.7408447265625, -3.53594970703125, -3.3310546875, -3.12615966796875, -2.9212646484375, -2.71636962890625, -2.511474609375, -2.30657958984375, -2.1016845703125, -1.89678955078125, -1.69189453125, -1.48699951171875, -1.2821044921875, -1.07720947265625, -0.872314453125, -0.66741943359375, -0.4625244140625, -0.25762939453125, -0.052734375, 0.15216064453125, 0.3570556640625, 0.56195068359375, 0.766845703125, 0.97174072265625, 1.1766357421875, 1.38153076171875, 1.58642578125, 1.79132080078125, 1.9962158203125, 2.20111083984375, 2.406005859375, 2.61090087890625, 2.8157958984375, 3.02069091796875, 3.2255859375, 3.43048095703125, 3.6353759765625, 3.84027099609375, 4.045166015625, 4.25006103515625, 4.4549560546875, 4.65985107421875, 4.86474609375, 5.06964111328125, 5.2745361328125, 5.47943115234375, 5.684326171875, 5.88922119140625, 6.0941162109375, 6.29901123046875, 6.50390625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 9.0, 3.0, 8.0, 13.0, 7.0, 8.0, 9.0, 15.0, 17.0, 20.0, 21.0, 25.0, 43.0, 41.0, 28.0, 40.0, 39.0, 60.0, 40.0, 52.0, 47.0, 49.0, 40.0, 32.0, 34.0, 32.0, 41.0, 32.0, 36.0, 26.0, 15.0, 31.0, 14.0, 8.0, 15.0, 8.0, 11.0, 17.0, 5.0, 7.0, 3.0, 4.0, 2.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.625, -10.288818359375, -9.95263671875, -9.616455078125, -9.2802734375, -8.944091796875, -8.60791015625, -8.271728515625, -7.935546875, -7.599365234375, -7.26318359375, -6.927001953125, -6.5908203125, -6.254638671875, -5.91845703125, -5.582275390625, -5.24609375, -4.909912109375, -4.57373046875, -4.237548828125, -3.9013671875, -3.565185546875, -3.22900390625, -2.892822265625, -2.556640625, -2.220458984375, -1.88427734375, -1.548095703125, -1.2119140625, -0.875732421875, -0.53955078125, -0.203369140625, 0.1328125, 0.468994140625, 0.80517578125, 1.141357421875, 1.4775390625, 1.813720703125, 2.14990234375, 2.486083984375, 2.822265625, 3.158447265625, 3.49462890625, 3.830810546875, 4.1669921875, 4.503173828125, 4.83935546875, 5.175537109375, 5.51171875, 5.847900390625, 6.18408203125, 6.520263671875, 6.8564453125, 7.192626953125, 7.52880859375, 7.864990234375, 8.201171875, 8.537353515625, 8.87353515625, 9.209716796875, 9.5458984375, 9.882080078125, 10.21826171875, 10.554443359375, 10.890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 9.0, 16.0, 20.0, 28.0, 50.0, 55.0, 124.0, 161.0, 280.0, 390.0, 634.0, 1081.0, 1721.0, 2849.0, 4567.0, 7520.0, 12584.0, 19624.0, 31644.0, 47296.0, 68145.0, 91333.0, 113727.0, 126842.0, 126095.0, 112108.0, 89363.0, 65801.0, 45248.0, 30024.0, 18876.0, 11821.0, 7327.0, 4333.0, 2576.0, 1620.0, 980.0, 605.0, 397.0, 243.0, 160.0, 87.0, 61.0, 60.0, 21.0, 16.0, 17.0, 5.0, 9.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.04296875, -6.822509765625, -6.60205078125, -6.381591796875, -6.1611328125, -5.940673828125, -5.72021484375, -5.499755859375, -5.279296875, -5.058837890625, -4.83837890625, -4.617919921875, -4.3974609375, -4.177001953125, -3.95654296875, -3.736083984375, -3.515625, -3.295166015625, -3.07470703125, -2.854248046875, -2.6337890625, -2.413330078125, -2.19287109375, -1.972412109375, -1.751953125, -1.531494140625, -1.31103515625, -1.090576171875, -0.8701171875, -0.649658203125, -0.42919921875, -0.208740234375, 0.01171875, 0.232177734375, 0.45263671875, 0.673095703125, 0.8935546875, 1.114013671875, 1.33447265625, 1.554931640625, 1.775390625, 1.995849609375, 2.21630859375, 2.436767578125, 2.6572265625, 2.877685546875, 3.09814453125, 3.318603515625, 3.5390625, 3.759521484375, 3.97998046875, 4.200439453125, 4.4208984375, 4.641357421875, 4.86181640625, 5.082275390625, 5.302734375, 5.523193359375, 5.74365234375, 5.964111328125, 6.1845703125, 6.405029296875, 6.62548828125, 6.845947265625, 7.06640625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 1.0, 6.0, 6.0, 2.0, 8.0, 18.0, 16.0, 11.0, 19.0, 19.0, 16.0, 23.0, 23.0, 22.0, 26.0, 31.0, 34.0, 30.0, 36.0, 42.0, 36.0, 43.0, 25.0, 34.0, 42.0, 31.0, 42.0, 36.0, 50.0, 32.0, 30.0, 27.0, 23.0, 29.0, 25.0, 22.0, 22.0, 12.0, 9.0, 5.0, 9.0, 8.0, 5.0, 7.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.9453125, -5.7535400390625, -5.561767578125, -5.3699951171875, -5.17822265625, -4.9864501953125, -4.794677734375, -4.6029052734375, -4.4111328125, -4.2193603515625, -4.027587890625, -3.8358154296875, -3.64404296875, -3.4522705078125, -3.260498046875, -3.0687255859375, -2.876953125, -2.6851806640625, -2.493408203125, -2.3016357421875, -2.10986328125, -1.9180908203125, -1.726318359375, -1.5345458984375, -1.3427734375, -1.1510009765625, -0.959228515625, -0.7674560546875, -0.57568359375, -0.3839111328125, -0.192138671875, -0.0003662109375, 0.19140625, 0.3831787109375, 0.574951171875, 0.7667236328125, 0.95849609375, 1.1502685546875, 1.342041015625, 1.5338134765625, 1.7255859375, 1.9173583984375, 2.109130859375, 2.3009033203125, 2.49267578125, 2.6844482421875, 2.876220703125, 3.0679931640625, 3.259765625, 3.4515380859375, 3.643310546875, 3.8350830078125, 4.02685546875, 4.2186279296875, 4.410400390625, 4.6021728515625, 4.7939453125, 4.9857177734375, 5.177490234375, 5.3692626953125, 5.56103515625, 5.7528076171875, 5.944580078125, 6.1363525390625, 6.328125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 4.0, 7.0, 14.0, 15.0, 19.0, 47.0, 49.0, 91.0, 128.0, 166.0, 272.0, 396.0, 640.0, 949.0, 1379.0, 2097.0, 3059.0, 4694.0, 7235.0, 10476.0, 15702.0, 22572.0, 32709.0, 44951.0, 60577.0, 76678.0, 93857.0, 104555.0, 107824.0, 102507.0, 89835.0, 73008.0, 56380.0, 41965.0, 30023.0, 20774.0, 14114.0, 9555.0, 6501.0, 4225.0, 2929.0, 1910.0, 1231.0, 807.0, 559.0, 364.0, 242.0, 151.0, 112.0, 72.0, 43.0, 37.0, 20.0, 12.0, 13.0, 5.0, 7.0, 2.0, 2.0, 3.0], "bins": [-2.171875, -2.10479736328125, -2.0377197265625, -1.97064208984375, -1.903564453125, -1.83648681640625, -1.7694091796875, -1.70233154296875, -1.63525390625, -1.56817626953125, -1.5010986328125, -1.43402099609375, -1.366943359375, -1.29986572265625, -1.2327880859375, -1.16571044921875, -1.0986328125, -1.03155517578125, -0.9644775390625, -0.89739990234375, -0.830322265625, -0.76324462890625, -0.6961669921875, -0.62908935546875, -0.56201171875, -0.49493408203125, -0.4278564453125, -0.36077880859375, -0.293701171875, -0.22662353515625, -0.1595458984375, -0.09246826171875, -0.025390625, 0.04168701171875, 0.1087646484375, 0.17584228515625, 0.242919921875, 0.30999755859375, 0.3770751953125, 0.44415283203125, 0.51123046875, 0.57830810546875, 0.6453857421875, 0.71246337890625, 0.779541015625, 0.84661865234375, 0.9136962890625, 0.98077392578125, 1.0478515625, 1.11492919921875, 1.1820068359375, 1.24908447265625, 1.316162109375, 1.38323974609375, 1.4503173828125, 1.51739501953125, 1.58447265625, 1.65155029296875, 1.7186279296875, 1.78570556640625, 1.852783203125, 1.91986083984375, 1.9869384765625, 2.05401611328125, 2.12109375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 3.0, 4.0, 6.0, 10.0, 10.0, 16.0, 16.0, 21.0, 26.0, 40.0, 33.0, 44.0, 38.0, 54.0, 76.0, 44.0, 61.0, 52.0, 47.0, 59.0, 42.0, 56.0, 33.0, 34.0, 31.0, 27.0, 24.0, 25.0, 21.0, 8.0, 12.0, 7.0, 7.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0003502368927001953, -0.0003388449549674988, -0.00032745301723480225, -0.0003160610795021057, -0.0003046691417694092, -0.00029327720403671265, -0.0002818852663040161, -0.0002704933285713196, -0.00025910139083862305, -0.0002477094531059265, -0.00023631751537322998, -0.00022492557764053345, -0.00021353363990783691, -0.00020214170217514038, -0.00019074976444244385, -0.00017935782670974731, -0.00016796588897705078, -0.00015657395124435425, -0.00014518201351165771, -0.00013379007577896118, -0.00012239813804626465, -0.00011100620031356812, -9.961426258087158e-05, -8.822232484817505e-05, -7.683038711547852e-05, -6.543844938278198e-05, -5.404651165008545e-05, -4.2654573917388916e-05, -3.126263618469238e-05, -1.987069845199585e-05, -8.478760719299316e-06, 2.913177013397217e-06, 1.430511474609375e-05, 2.5697052478790283e-05, 3.7088990211486816e-05, 4.848092794418335e-05, 5.987286567687988e-05, 7.126480340957642e-05, 8.265674114227295e-05, 9.404867887496948e-05, 0.00010544061660766602, 0.00011683255434036255, 0.00012822449207305908, 0.00013961642980575562, 0.00015100836753845215, 0.00016240030527114868, 0.00017379224300384521, 0.00018518418073654175, 0.00019657611846923828, 0.00020796805620193481, 0.00021935999393463135, 0.00023075193166732788, 0.00024214386940002441, 0.00025353580713272095, 0.0002649277448654175, 0.000276319682598114, 0.00028771162033081055, 0.0002991035580635071, 0.0003104954957962036, 0.00032188743352890015, 0.0003332793712615967, 0.0003446713089942932, 0.00035606324672698975, 0.0003674551844596863, 0.0003788471221923828]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 12.0, 15.0, 27.0, 51.0, 74.0, 124.0, 204.0, 373.0, 622.0, 897.0, 1557.0, 2597.0, 4319.0, 7147.0, 11376.0, 18518.0, 29464.0, 44405.0, 64853.0, 88094.0, 110894.0, 125774.0, 127221.0, 114710.0, 92965.0, 69108.0, 48165.0, 32038.0, 20370.0, 12655.0, 7800.0, 4816.0, 2901.0, 1784.0, 1034.0, 631.0, 348.0, 239.0, 154.0, 87.0, 59.0, 30.0, 20.0, 12.0, 9.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.443359375, -2.3621826171875, -2.281005859375, -2.1998291015625, -2.11865234375, -2.0374755859375, -1.956298828125, -1.8751220703125, -1.7939453125, -1.7127685546875, -1.631591796875, -1.5504150390625, -1.46923828125, -1.3880615234375, -1.306884765625, -1.2257080078125, -1.14453125, -1.0633544921875, -0.982177734375, -0.9010009765625, -0.81982421875, -0.7386474609375, -0.657470703125, -0.5762939453125, -0.4951171875, -0.4139404296875, -0.332763671875, -0.2515869140625, -0.17041015625, -0.0892333984375, -0.008056640625, 0.0731201171875, 0.154296875, 0.2354736328125, 0.316650390625, 0.3978271484375, 0.47900390625, 0.5601806640625, 0.641357421875, 0.7225341796875, 0.8037109375, 0.8848876953125, 0.966064453125, 1.0472412109375, 1.12841796875, 1.2095947265625, 1.290771484375, 1.3719482421875, 1.453125, 1.5343017578125, 1.615478515625, 1.6966552734375, 1.77783203125, 1.8590087890625, 1.940185546875, 2.0213623046875, 2.1025390625, 2.1837158203125, 2.264892578125, 2.3460693359375, 2.42724609375, 2.5084228515625, 2.589599609375, 2.6707763671875, 2.751953125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 0.0, 4.0, 1.0, 3.0, 6.0, 4.0, 6.0, 6.0, 12.0, 10.0, 21.0, 16.0, 26.0, 22.0, 36.0, 33.0, 26.0, 31.0, 43.0, 33.0, 45.0, 30.0, 52.0, 38.0, 46.0, 39.0, 36.0, 46.0, 40.0, 53.0, 28.0, 32.0, 27.0, 28.0, 24.0, 15.0, 19.0, 13.0, 11.0, 6.0, 4.0, 12.0, 10.0, 6.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0302734375, -0.999847412109375, -0.96942138671875, -0.938995361328125, -0.9085693359375, -0.878143310546875, -0.84771728515625, -0.817291259765625, -0.786865234375, -0.756439208984375, -0.72601318359375, -0.695587158203125, -0.6651611328125, -0.634735107421875, -0.60430908203125, -0.573883056640625, -0.54345703125, -0.513031005859375, -0.48260498046875, -0.452178955078125, -0.4217529296875, -0.391326904296875, -0.36090087890625, -0.330474853515625, -0.300048828125, -0.269622802734375, -0.23919677734375, -0.208770751953125, -0.1783447265625, -0.147918701171875, -0.11749267578125, -0.087066650390625, -0.056640625, -0.026214599609375, 0.00421142578125, 0.034637451171875, 0.0650634765625, 0.095489501953125, 0.12591552734375, 0.156341552734375, 0.186767578125, 0.217193603515625, 0.24761962890625, 0.278045654296875, 0.3084716796875, 0.338897705078125, 0.36932373046875, 0.399749755859375, 0.43017578125, 0.460601806640625, 0.49102783203125, 0.521453857421875, 0.5518798828125, 0.582305908203125, 0.61273193359375, 0.643157958984375, 0.673583984375, 0.704010009765625, 0.73443603515625, 0.764862060546875, 0.7952880859375, 0.825714111328125, 0.85614013671875, 0.886566162109375, 0.9169921875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 7.0, 4.0, 7.0, 6.0, 7.0, 10.0, 9.0, 9.0, 12.0, 24.0, 16.0, 26.0, 33.0, 41.0, 35.0, 38.0, 40.0, 31.0, 53.0, 47.0, 49.0, 57.0, 42.0, 45.0, 43.0, 55.0, 29.0, 30.0, 30.0, 22.0, 24.0, 26.0, 22.0, 7.0, 8.0, 10.0, 7.0, 5.0, 10.0, 9.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-9.721860885620117, -9.4244384765625, -9.127016067504883, -8.829593658447266, -8.532171249389648, -8.234748840332031, -7.937326431274414, -7.639904022216797, -7.34248161315918, -7.0450592041015625, -6.747636795043945, -6.450214385986328, -6.152791976928711, -5.855369567871094, -5.557947158813477, -5.260524749755859, -4.963102340698242, -4.665679931640625, -4.368257522583008, -4.070835113525391, -3.7734127044677734, -3.4759902954101562, -3.178567886352539, -2.881145477294922, -2.5837230682373047, -2.2863006591796875, -1.9888782501220703, -1.6914558410644531, -1.394033432006836, -1.0966110229492188, -0.7991886138916016, -0.5017662048339844, -0.2043447494506836, 0.0930776596069336, 0.3905000686645508, 0.687922477722168, 0.9853448867797852, 1.2827672958374023, 1.5801897048950195, 1.8776121139526367, 2.175034523010254, 2.472456932067871, 2.7698793411254883, 3.0673017501831055, 3.3647241592407227, 3.66214656829834, 3.959568977355957, 4.256991386413574, 4.554413795471191, 4.851836204528809, 5.149258613586426, 5.446681022644043, 5.74410343170166, 6.041525840759277, 6.3389482498168945, 6.636370658874512, 6.933793067932129, 7.231215476989746, 7.528637886047363, 7.8260602951049805, 8.123482704162598, 8.420905113220215, 8.718327522277832, 9.01574993133545, 9.313172340393066]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 6.0, 3.0, 3.0, 3.0, 5.0, 9.0, 5.0, 9.0, 11.0, 23.0, 16.0, 17.0, 28.0, 31.0, 30.0, 39.0, 34.0, 41.0, 43.0, 48.0, 57.0, 50.0, 61.0, 41.0, 33.0, 38.0, 36.0, 36.0, 28.0, 33.0, 30.0, 24.0, 29.0, 24.0, 17.0, 15.0, 9.0, 13.0, 4.0, 11.0, 6.0, 3.0, 3.0, 1.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.233407020568848, -8.8818359375, -8.530264854431152, -8.178693771362305, -7.827122688293457, -7.475551605224609, -7.123980522155762, -6.772409439086914, -6.420838356018066, -6.069267272949219, -5.717696189880371, -5.366125106811523, -5.014554023742676, -4.662982940673828, -4.3114118576049805, -3.9598405361175537, -3.608269214630127, -3.2566981315612793, -2.9051270484924316, -2.553555965423584, -2.2019848823547363, -1.8504136800765991, -1.498842477798462, -1.1472713947296143, -0.7957003116607666, -0.44412919878959656, -0.09255808591842651, 0.2590130567550659, 0.6105841398239136, 0.9621552228927612, 1.3137264251708984, 1.665297508239746, 2.0168685913085938, 2.3684396743774414, 2.720010757446289, 3.0715818405151367, 3.4231529235839844, 3.774724006652832, 4.12629508972168, 4.477866172790527, 4.829437255859375, 5.181008338928223, 5.53257942199707, 5.884150505065918, 6.235721588134766, 6.587292671203613, 6.938863754272461, 7.290434837341309, 7.6420063972473145, 7.993577480316162, 8.345149040222168, 8.696720123291016, 9.048291206359863, 9.399862289428711, 9.751433372497559, 10.103004455566406, 10.454575538635254, 10.806146621704102, 11.15771770477295, 11.509288787841797, 11.860859870910645, 12.212430953979492, 12.56400203704834, 12.915573120117188, 13.267144203186035]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [3.0, 3.0, 6.0, 1.0, 21.0, 20.0, 29.0, 39.0, 65.0, 127.0, 173.0, 292.0, 446.0, 737.0, 1248.0, 1988.0, 3207.0, 5192.0, 8705.0, 14511.0, 24421.0, 41533.0, 71396.0, 126968.0, 222762.0, 371777.0, 552287.0, 682900.0, 676545.0, 534846.0, 353007.0, 210029.0, 119748.0, 68670.0, 39641.0, 23479.0, 14265.0, 8682.0, 5388.0, 3325.0, 2157.0, 1327.0, 860.0, 523.0, 316.0, 217.0, 163.0, 103.0, 48.0, 33.0, 22.0, 15.0, 11.0, 11.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.70703125, -6.46710205078125, -6.2271728515625, -5.98724365234375, -5.747314453125, -5.50738525390625, -5.2674560546875, -5.02752685546875, -4.78759765625, -4.54766845703125, -4.3077392578125, -4.06781005859375, -3.827880859375, -3.58795166015625, -3.3480224609375, -3.10809326171875, -2.8681640625, -2.62823486328125, -2.3883056640625, -2.14837646484375, -1.908447265625, -1.66851806640625, -1.4285888671875, -1.18865966796875, -0.94873046875, -0.70880126953125, -0.4688720703125, -0.22894287109375, 0.010986328125, 0.25091552734375, 0.4908447265625, 0.73077392578125, 0.970703125, 1.21063232421875, 1.4505615234375, 1.69049072265625, 1.930419921875, 2.17034912109375, 2.4102783203125, 2.65020751953125, 2.89013671875, 3.13006591796875, 3.3699951171875, 3.60992431640625, 3.849853515625, 4.08978271484375, 4.3297119140625, 4.56964111328125, 4.8095703125, 5.04949951171875, 5.2894287109375, 5.52935791015625, 5.769287109375, 6.00921630859375, 6.2491455078125, 6.48907470703125, 6.72900390625, 6.96893310546875, 7.2088623046875, 7.44879150390625, 7.688720703125, 7.92864990234375, 8.1685791015625, 8.40850830078125, 8.6484375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 2.0, 2.0, 3.0, 4.0, 5.0, 12.0, 8.0, 11.0, 18.0, 27.0, 22.0, 17.0, 21.0, 34.0, 29.0, 35.0, 40.0, 41.0, 50.0, 49.0, 52.0, 53.0, 35.0, 48.0, 32.0, 39.0, 32.0, 25.0, 34.0, 44.0, 23.0, 24.0, 22.0, 20.0, 16.0, 12.0, 12.0, 12.0, 8.0, 8.0, 5.0, 11.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.2734375, -7.98681640625, -7.7001953125, -7.41357421875, -7.126953125, -6.84033203125, -6.5537109375, -6.26708984375, -5.98046875, -5.69384765625, -5.4072265625, -5.12060546875, -4.833984375, -4.54736328125, -4.2607421875, -3.97412109375, -3.6875, -3.40087890625, -3.1142578125, -2.82763671875, -2.541015625, -2.25439453125, -1.9677734375, -1.68115234375, -1.39453125, -1.10791015625, -0.8212890625, -0.53466796875, -0.248046875, 0.03857421875, 0.3251953125, 0.61181640625, 0.8984375, 1.18505859375, 1.4716796875, 1.75830078125, 2.044921875, 2.33154296875, 2.6181640625, 2.90478515625, 3.19140625, 3.47802734375, 3.7646484375, 4.05126953125, 4.337890625, 4.62451171875, 4.9111328125, 5.19775390625, 5.484375, 5.77099609375, 6.0576171875, 6.34423828125, 6.630859375, 6.91748046875, 7.2041015625, 7.49072265625, 7.77734375, 8.06396484375, 8.3505859375, 8.63720703125, 8.923828125, 9.21044921875, 9.4970703125, 9.78369140625, 10.0703125]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 11.0, 10.0, 11.0, 23.0, 30.0, 50.0, 74.0, 137.0, 191.0, 328.0, 513.0, 842.0, 1378.0, 2331.0, 3809.0, 6332.0, 10825.0, 18152.0, 31011.0, 52304.0, 88808.0, 149815.0, 245848.0, 385585.0, 552555.0, 665216.0, 638572.0, 495376.0, 333051.0, 206800.0, 124292.0, 73244.0, 43371.0, 25608.0, 15074.0, 9087.0, 5375.0, 3144.0, 2018.0, 1211.0, 676.0, 408.0, 281.0, 195.0, 107.0, 78.0, 39.0, 32.0, 19.0, 18.0, 10.0, 5.0, 4.0, 2.0, 1.0, 1.0], "bins": [-9.2734375, -8.999267578125, -8.72509765625, -8.450927734375, -8.1767578125, -7.902587890625, -7.62841796875, -7.354248046875, -7.080078125, -6.805908203125, -6.53173828125, -6.257568359375, -5.9833984375, -5.709228515625, -5.43505859375, -5.160888671875, -4.88671875, -4.612548828125, -4.33837890625, -4.064208984375, -3.7900390625, -3.515869140625, -3.24169921875, -2.967529296875, -2.693359375, -2.419189453125, -2.14501953125, -1.870849609375, -1.5966796875, -1.322509765625, -1.04833984375, -0.774169921875, -0.5, -0.225830078125, 0.04833984375, 0.322509765625, 0.5966796875, 0.870849609375, 1.14501953125, 1.419189453125, 1.693359375, 1.967529296875, 2.24169921875, 2.515869140625, 2.7900390625, 3.064208984375, 3.33837890625, 3.612548828125, 3.88671875, 4.160888671875, 4.43505859375, 4.709228515625, 4.9833984375, 5.257568359375, 5.53173828125, 5.805908203125, 6.080078125, 6.354248046875, 6.62841796875, 6.902587890625, 7.1767578125, 7.450927734375, 7.72509765625, 7.999267578125, 8.2734375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 13.0, 13.0, 17.0, 12.0, 15.0, 25.0, 39.0, 45.0, 63.0, 63.0, 83.0, 80.0, 96.0, 127.0, 121.0, 127.0, 169.0, 198.0, 196.0, 210.0, 248.0, 227.0, 226.0, 200.0, 198.0, 176.0, 166.0, 145.0, 116.0, 112.0, 95.0, 86.0, 65.0, 61.0, 43.0, 43.0, 26.0, 30.0, 19.0, 13.0, 12.0, 7.0, 11.0, 5.0, 5.0, 7.0, 2.0, 5.0, 0.0, 3.0, 0.0, 3.0], "bins": [-3.517578125, -3.411407470703125, -3.30523681640625, -3.199066162109375, -3.0928955078125, -2.986724853515625, -2.88055419921875, -2.774383544921875, -2.668212890625, -2.562042236328125, -2.45587158203125, -2.349700927734375, -2.2435302734375, -2.137359619140625, -2.03118896484375, -1.925018310546875, -1.81884765625, -1.712677001953125, -1.60650634765625, -1.500335693359375, -1.3941650390625, -1.287994384765625, -1.18182373046875, -1.075653076171875, -0.969482421875, -0.863311767578125, -0.75714111328125, -0.650970458984375, -0.5447998046875, -0.438629150390625, -0.33245849609375, -0.226287841796875, -0.1201171875, -0.013946533203125, 0.09222412109375, 0.198394775390625, 0.3045654296875, 0.410736083984375, 0.51690673828125, 0.623077392578125, 0.729248046875, 0.835418701171875, 0.94158935546875, 1.047760009765625, 1.1539306640625, 1.260101318359375, 1.36627197265625, 1.472442626953125, 1.57861328125, 1.684783935546875, 1.79095458984375, 1.897125244140625, 2.0032958984375, 2.109466552734375, 2.21563720703125, 2.321807861328125, 2.427978515625, 2.534149169921875, 2.64031982421875, 2.746490478515625, 2.8526611328125, 2.958831787109375, 3.06500244140625, 3.171173095703125, 3.27734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 4.0, 5.0, 9.0, 8.0, 10.0, 7.0, 3.0, 10.0, 17.0, 23.0, 28.0, 34.0, 31.0, 45.0, 43.0, 40.0, 50.0, 51.0, 44.0, 62.0, 41.0, 41.0, 36.0, 53.0, 33.0, 43.0, 27.0, 17.0, 28.0, 25.0, 25.0, 11.0, 20.0, 13.0, 5.0, 13.0, 7.0, 4.0, 5.0, 7.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.101362228393555, -9.80017375946045, -9.498985290527344, -9.197795867919922, -8.896607398986816, -8.595418930053711, -8.294230461120605, -7.9930419921875, -7.6918535232543945, -7.390665054321289, -7.089476108551025, -6.78828763961792, -6.4870991706848145, -6.185910224914551, -5.884721755981445, -5.58353328704834, -5.282344341278076, -4.981155872344971, -4.679966926574707, -4.378778457641602, -4.077589988708496, -3.7764012813568115, -3.475212574005127, -3.1740241050720215, -2.872835397720337, -2.5716466903686523, -2.270458221435547, -1.9692695140838623, -1.6680809259414673, -1.3668923377990723, -1.0657036304473877, -0.7645151615142822, -0.46332645416259766, -0.16213783621788025, 0.13905078172683716, 0.44023942947387695, 0.741428017616272, 1.042616605758667, 1.3438053131103516, 1.644993782043457, 1.9461824893951416, 2.247371196746826, 2.5485596656799316, 2.849748373031616, 3.150937080383301, 3.4521255493164062, 3.753314256668091, 4.054502487182617, 4.355691432952881, 4.656879901885986, 4.95806884765625, 5.2592573165893555, 5.560445785522461, 5.861634254455566, 6.16282320022583, 6.4640116691589355, 6.765200614929199, 7.066389083862305, 7.367578029632568, 7.668766498565674, 7.969954967498779, 8.271143913269043, 8.572332382202148, 8.873520851135254, 9.17470932006836]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 8.0, 2.0, 3.0, 5.0, 10.0, 9.0, 9.0, 17.0, 19.0, 19.0, 30.0, 29.0, 33.0, 30.0, 31.0, 35.0, 33.0, 38.0, 33.0, 25.0, 47.0, 44.0, 42.0, 42.0, 31.0, 37.0, 43.0, 25.0, 29.0, 35.0, 30.0, 25.0, 25.0, 21.0, 15.0, 22.0, 12.0, 6.0, 10.0, 10.0, 5.0, 9.0, 5.0, 3.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.25527572631836, -7.960122108459473, -7.664968490600586, -7.369814872741699, -7.0746612548828125, -6.779507637023926, -6.484354496002197, -6.1892008781433105, -5.894047260284424, -5.598893642425537, -5.30374002456665, -5.008586406707764, -4.713433265686035, -4.418279647827148, -4.123126029968262, -3.827972412109375, -3.5328187942504883, -3.2376651763916016, -2.942511558532715, -2.6473581790924072, -2.3522045612335205, -2.057050943374634, -1.7618974447250366, -1.4667439460754395, -1.1715903282165527, -0.8764367699623108, -0.5812832117080688, -0.2861296534538269, 0.009023904800415039, 0.30417752265930176, 0.5993310213088989, 0.8944845199584961, 1.1896371841430664, 1.4847908020019531, 1.7799443006515503, 2.0750977993011475, 2.370251417160034, 2.665405035018921, 2.9605584144592285, 3.2557120323181152, 3.550865650177002, 3.8460192680358887, 4.141172885894775, 4.436326503753662, 4.731479644775391, 5.026633262634277, 5.321786880493164, 5.616940498352051, 5.9120941162109375, 6.207247734069824, 6.502401351928711, 6.797554969787598, 7.092708587646484, 7.387862205505371, 7.6830153465271, 7.978168964385986, 8.273323059082031, 8.568476676940918, 8.863630294799805, 9.158783912658691, 9.453937530517578, 9.749091148376465, 10.044244766235352, 10.339397430419922, 10.634551048278809]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 8.0, 15.0, 29.0, 32.0, 74.0, 100.0, 161.0, 216.0, 353.0, 576.0, 886.0, 1340.0, 2240.0, 3530.0, 5905.0, 9640.0, 15287.0, 24911.0, 39278.0, 61452.0, 89130.0, 118941.0, 139772.0, 141271.0, 122707.0, 93750.0, 65093.0, 42219.0, 26642.0, 16221.0, 10120.0, 6158.0, 3864.0, 2435.0, 1461.0, 1012.0, 602.0, 392.0, 236.0, 154.0, 108.0, 83.0, 51.0, 29.0, 27.0, 10.0, 9.0, 9.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-5.296875, -5.1207275390625, -4.944580078125, -4.7684326171875, -4.59228515625, -4.4161376953125, -4.239990234375, -4.0638427734375, -3.8876953125, -3.7115478515625, -3.535400390625, -3.3592529296875, -3.18310546875, -3.0069580078125, -2.830810546875, -2.6546630859375, -2.478515625, -2.3023681640625, -2.126220703125, -1.9500732421875, -1.77392578125, -1.5977783203125, -1.421630859375, -1.2454833984375, -1.0693359375, -0.8931884765625, -0.717041015625, -0.5408935546875, -0.36474609375, -0.1885986328125, -0.012451171875, 0.1636962890625, 0.33984375, 0.5159912109375, 0.692138671875, 0.8682861328125, 1.04443359375, 1.2205810546875, 1.396728515625, 1.5728759765625, 1.7490234375, 1.9251708984375, 2.101318359375, 2.2774658203125, 2.45361328125, 2.6297607421875, 2.805908203125, 2.9820556640625, 3.158203125, 3.3343505859375, 3.510498046875, 3.6866455078125, 3.86279296875, 4.0389404296875, 4.215087890625, 4.3912353515625, 4.5673828125, 4.7435302734375, 4.919677734375, 5.0958251953125, 5.27197265625, 5.4481201171875, 5.624267578125, 5.8004150390625, 5.9765625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 5.0, 9.0, 5.0, 8.0, 9.0, 8.0, 11.0, 17.0, 24.0, 21.0, 24.0, 30.0, 29.0, 27.0, 39.0, 30.0, 35.0, 44.0, 37.0, 48.0, 49.0, 25.0, 33.0, 34.0, 32.0, 38.0, 38.0, 37.0, 32.0, 27.0, 22.0, 22.0, 28.0, 17.0, 17.0, 13.0, 11.0, 12.0, 8.0, 5.0, 11.0, 4.0, 6.0, 2.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-8.5546875, -8.2623291015625, -7.969970703125, -7.6776123046875, -7.38525390625, -7.0928955078125, -6.800537109375, -6.5081787109375, -6.2158203125, -5.9234619140625, -5.631103515625, -5.3387451171875, -5.04638671875, -4.7540283203125, -4.461669921875, -4.1693115234375, -3.876953125, -3.5845947265625, -3.292236328125, -2.9998779296875, -2.70751953125, -2.4151611328125, -2.122802734375, -1.8304443359375, -1.5380859375, -1.2457275390625, -0.953369140625, -0.6610107421875, -0.36865234375, -0.0762939453125, 0.216064453125, 0.5084228515625, 0.80078125, 1.0931396484375, 1.385498046875, 1.6778564453125, 1.97021484375, 2.2625732421875, 2.554931640625, 2.8472900390625, 3.1396484375, 3.4320068359375, 3.724365234375, 4.0167236328125, 4.30908203125, 4.6014404296875, 4.893798828125, 5.1861572265625, 5.478515625, 5.7708740234375, 6.063232421875, 6.3555908203125, 6.64794921875, 6.9403076171875, 7.232666015625, 7.5250244140625, 7.8173828125, 8.1097412109375, 8.402099609375, 8.6944580078125, 8.98681640625, 9.2791748046875, 9.571533203125, 9.8638916015625, 10.15625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 8.0, 6.0, 8.0, 11.0, 18.0, 25.0, 35.0, 60.0, 70.0, 117.0, 154.0, 204.0, 325.0, 479.0, 651.0, 1130.0, 1638.0, 2556.0, 4182.0, 6802.0, 11184.0, 18816.0, 32056.0, 53783.0, 87551.0, 132535.0, 170543.0, 171470.0, 131628.0, 87049.0, 53642.0, 31872.0, 18598.0, 11107.0, 6765.0, 4123.0, 2480.0, 1646.0, 1080.0, 665.0, 495.0, 291.0, 189.0, 155.0, 98.0, 84.0, 56.0, 30.0, 34.0, 12.0, 20.0, 8.0, 5.0, 4.0, 3.0, 4.0, 4.0, 1.0], "bins": [-8.1015625, -7.85601806640625, -7.6104736328125, -7.36492919921875, -7.119384765625, -6.87384033203125, -6.6282958984375, -6.38275146484375, -6.13720703125, -5.89166259765625, -5.6461181640625, -5.40057373046875, -5.155029296875, -4.90948486328125, -4.6639404296875, -4.41839599609375, -4.1728515625, -3.92730712890625, -3.6817626953125, -3.43621826171875, -3.190673828125, -2.94512939453125, -2.6995849609375, -2.45404052734375, -2.20849609375, -1.96295166015625, -1.7174072265625, -1.47186279296875, -1.226318359375, -0.98077392578125, -0.7352294921875, -0.48968505859375, -0.244140625, 0.00140380859375, 0.2469482421875, 0.49249267578125, 0.738037109375, 0.98358154296875, 1.2291259765625, 1.47467041015625, 1.72021484375, 1.96575927734375, 2.2113037109375, 2.45684814453125, 2.702392578125, 2.94793701171875, 3.1934814453125, 3.43902587890625, 3.6845703125, 3.93011474609375, 4.1756591796875, 4.42120361328125, 4.666748046875, 4.91229248046875, 5.1578369140625, 5.40338134765625, 5.64892578125, 5.89447021484375, 6.1400146484375, 6.38555908203125, 6.631103515625, 6.87664794921875, 7.1221923828125, 7.36773681640625, 7.61328125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 7.0, 6.0, 5.0, 8.0, 6.0, 9.0, 9.0, 14.0, 16.0, 17.0, 19.0, 28.0, 16.0, 30.0, 32.0, 30.0, 29.0, 34.0, 21.0, 28.0, 49.0, 35.0, 45.0, 33.0, 32.0, 39.0, 27.0, 31.0, 31.0, 36.0, 30.0, 36.0, 26.0, 30.0, 17.0, 14.0, 17.0, 21.0, 12.0, 12.0, 13.0, 12.0, 6.0, 5.0, 6.0, 5.0, 3.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.4140625, -5.24462890625, -5.0751953125, -4.90576171875, -4.736328125, -4.56689453125, -4.3974609375, -4.22802734375, -4.05859375, -3.88916015625, -3.7197265625, -3.55029296875, -3.380859375, -3.21142578125, -3.0419921875, -2.87255859375, -2.703125, -2.53369140625, -2.3642578125, -2.19482421875, -2.025390625, -1.85595703125, -1.6865234375, -1.51708984375, -1.34765625, -1.17822265625, -1.0087890625, -0.83935546875, -0.669921875, -0.50048828125, -0.3310546875, -0.16162109375, 0.0078125, 0.17724609375, 0.3466796875, 0.51611328125, 0.685546875, 0.85498046875, 1.0244140625, 1.19384765625, 1.36328125, 1.53271484375, 1.7021484375, 1.87158203125, 2.041015625, 2.21044921875, 2.3798828125, 2.54931640625, 2.71875, 2.88818359375, 3.0576171875, 3.22705078125, 3.396484375, 3.56591796875, 3.7353515625, 3.90478515625, 4.07421875, 4.24365234375, 4.4130859375, 4.58251953125, 4.751953125, 4.92138671875, 5.0908203125, 5.26025390625, 5.4296875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 12.0, 20.0, 15.0, 30.0, 43.0, 61.0, 85.0, 129.0, 179.0, 270.0, 408.0, 575.0, 911.0, 1561.0, 2329.0, 3912.0, 6711.0, 11033.0, 18996.0, 32358.0, 55021.0, 91190.0, 138718.0, 177440.0, 172676.0, 128858.0, 82941.0, 50320.0, 29368.0, 17062.0, 9848.0, 5973.0, 3571.0, 2110.0, 1347.0, 839.0, 546.0, 332.0, 256.0, 173.0, 101.0, 80.0, 61.0, 26.0, 26.0, 15.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.4140625, -3.299896240234375, -3.18572998046875, -3.071563720703125, -2.9573974609375, -2.843231201171875, -2.72906494140625, -2.614898681640625, -2.500732421875, -2.386566162109375, -2.27239990234375, -2.158233642578125, -2.0440673828125, -1.929901123046875, -1.81573486328125, -1.701568603515625, -1.58740234375, -1.473236083984375, -1.35906982421875, -1.244903564453125, -1.1307373046875, -1.016571044921875, -0.90240478515625, -0.788238525390625, -0.674072265625, -0.559906005859375, -0.44573974609375, -0.331573486328125, -0.2174072265625, -0.103240966796875, 0.01092529296875, 0.125091552734375, 0.2392578125, 0.353424072265625, 0.46759033203125, 0.581756591796875, 0.6959228515625, 0.810089111328125, 0.92425537109375, 1.038421630859375, 1.152587890625, 1.266754150390625, 1.38092041015625, 1.495086669921875, 1.6092529296875, 1.723419189453125, 1.83758544921875, 1.951751708984375, 2.06591796875, 2.180084228515625, 2.29425048828125, 2.408416748046875, 2.5225830078125, 2.636749267578125, 2.75091552734375, 2.865081787109375, 2.979248046875, 3.093414306640625, 3.20758056640625, 3.321746826171875, 3.4359130859375, 3.550079345703125, 3.66424560546875, 3.778411865234375, 3.892578125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 9.0, 12.0, 13.0, 15.0, 19.0, 25.0, 29.0, 39.0, 36.0, 49.0, 56.0, 66.0, 70.0, 68.0, 78.0, 67.0, 58.0, 63.0, 53.0, 38.0, 27.0, 27.0, 23.0, 15.0, 10.0, 7.0, 9.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00023353099822998047, -0.00022476352751255035, -0.00021599605679512024, -0.00020722858607769012, -0.00019846111536026, -0.0001896936446428299, -0.00018092617392539978, -0.00017215870320796967, -0.00016339123249053955, -0.00015462376177310944, -0.00014585629105567932, -0.0001370888203382492, -0.0001283213496208191, -0.00011955387890338898, -0.00011078640818595886, -0.00010201893746852875, -9.325146675109863e-05, -8.448399603366852e-05, -7.57165253162384e-05, -6.694905459880829e-05, -5.8181583881378174e-05, -4.941411316394806e-05, -4.0646642446517944e-05, -3.187917172908783e-05, -2.3111701011657715e-05, -1.43442302942276e-05, -5.576759576797485e-06, 3.1907111406326294e-06, 1.1958181858062744e-05, 2.072565257549286e-05, 2.9493123292922974e-05, 3.826059401035309e-05, 4.70280647277832e-05, 5.579553544521332e-05, 6.456300616264343e-05, 7.333047688007355e-05, 8.209794759750366e-05, 9.086541831493378e-05, 9.963288903236389e-05, 0.000108400359749794, 0.00011716783046722412, 0.00012593530118465424, 0.00013470277190208435, 0.00014347024261951447, 0.00015223771333694458, 0.0001610051840543747, 0.0001697726547718048, 0.00017854012548923492, 0.00018730759620666504, 0.00019607506692409515, 0.00020484253764152527, 0.00021361000835895538, 0.0002223774790763855, 0.0002311449497938156, 0.00023991242051124573, 0.00024867989122867584, 0.00025744736194610596, 0.00026621483266353607, 0.0002749823033809662, 0.0002837497740983963, 0.0002925172448158264, 0.00030128471553325653, 0.00031005218625068665, 0.00031881965696811676, 0.0003275871276855469]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 12.0, 11.0, 22.0, 36.0, 61.0, 107.0, 162.0, 238.0, 412.0, 598.0, 1027.0, 1557.0, 2530.0, 4073.0, 6654.0, 10763.0, 17222.0, 27597.0, 43927.0, 67645.0, 98575.0, 130848.0, 149068.0, 141713.0, 115372.0, 81681.0, 54457.0, 34654.0, 21915.0, 13578.0, 8314.0, 5175.0, 3198.0, 1968.0, 1275.0, 808.0, 511.0, 295.0, 184.0, 125.0, 80.0, 46.0, 26.0, 14.0, 11.0, 11.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.09375, -3.975921630859375, -3.85809326171875, -3.740264892578125, -3.6224365234375, -3.504608154296875, -3.38677978515625, -3.268951416015625, -3.151123046875, -3.033294677734375, -2.91546630859375, -2.797637939453125, -2.6798095703125, -2.561981201171875, -2.44415283203125, -2.326324462890625, -2.20849609375, -2.090667724609375, -1.97283935546875, -1.855010986328125, -1.7371826171875, -1.619354248046875, -1.50152587890625, -1.383697509765625, -1.265869140625, -1.148040771484375, -1.03021240234375, -0.912384033203125, -0.7945556640625, -0.676727294921875, -0.55889892578125, -0.441070556640625, -0.3232421875, -0.205413818359375, -0.08758544921875, 0.030242919921875, 0.1480712890625, 0.265899658203125, 0.38372802734375, 0.501556396484375, 0.619384765625, 0.737213134765625, 0.85504150390625, 0.972869873046875, 1.0906982421875, 1.208526611328125, 1.32635498046875, 1.444183349609375, 1.56201171875, 1.679840087890625, 1.79766845703125, 1.915496826171875, 2.0333251953125, 2.151153564453125, 2.26898193359375, 2.386810302734375, 2.504638671875, 2.622467041015625, 2.74029541015625, 2.858123779296875, 2.9759521484375, 3.093780517578125, 3.21160888671875, 3.329437255859375, 3.447265625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 6.0, 9.0, 3.0, 9.0, 11.0, 13.0, 16.0, 12.0, 21.0, 18.0, 25.0, 27.0, 31.0, 39.0, 37.0, 54.0, 45.0, 55.0, 67.0, 48.0, 46.0, 50.0, 37.0, 36.0, 41.0, 44.0, 29.0, 29.0, 37.0, 22.0, 17.0, 16.0, 14.0, 8.0, 12.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.439453125, -1.393280029296875, -1.34710693359375, -1.300933837890625, -1.2547607421875, -1.208587646484375, -1.16241455078125, -1.116241455078125, -1.070068359375, -1.023895263671875, -0.97772216796875, -0.931549072265625, -0.8853759765625, -0.839202880859375, -0.79302978515625, -0.746856689453125, -0.70068359375, -0.654510498046875, -0.60833740234375, -0.562164306640625, -0.5159912109375, -0.469818115234375, -0.42364501953125, -0.377471923828125, -0.331298828125, -0.285125732421875, -0.23895263671875, -0.192779541015625, -0.1466064453125, -0.100433349609375, -0.05426025390625, -0.008087158203125, 0.0380859375, 0.084259033203125, 0.13043212890625, 0.176605224609375, 0.2227783203125, 0.268951416015625, 0.31512451171875, 0.361297607421875, 0.407470703125, 0.453643798828125, 0.49981689453125, 0.545989990234375, 0.5921630859375, 0.638336181640625, 0.68450927734375, 0.730682373046875, 0.77685546875, 0.823028564453125, 0.86920166015625, 0.915374755859375, 0.9615478515625, 1.007720947265625, 1.05389404296875, 1.100067138671875, 1.146240234375, 1.192413330078125, 1.23858642578125, 1.284759521484375, 1.3309326171875, 1.377105712890625, 1.42327880859375, 1.469451904296875, 1.515625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 1.0, 5.0, 10.0, 9.0, 12.0, 8.0, 9.0, 8.0, 16.0, 21.0, 31.0, 37.0, 45.0, 48.0, 51.0, 52.0, 39.0, 54.0, 48.0, 56.0, 38.0, 50.0, 45.0, 43.0, 34.0, 27.0, 29.0, 22.0, 23.0, 23.0, 24.0, 18.0, 13.0, 5.0, 6.0, 8.0, 5.0, 6.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.853266716003418, -10.541560173034668, -10.229853630065918, -9.918148040771484, -9.606441497802734, -9.294734954833984, -8.983028411865234, -8.671321868896484, -8.35961627960205, -8.0479097366333, -7.736203670501709, -7.424497127532959, -7.112791061401367, -6.801084518432617, -6.489377975463867, -6.177671909332275, -5.865965366363525, -5.554258823394775, -5.242552757263184, -4.930846214294434, -4.619140148162842, -4.307433605194092, -3.995727300643921, -3.68402099609375, -3.372314691543579, -3.060608386993408, -2.7489020824432373, -2.4371957778930664, -2.1254892349243164, -1.813783049583435, -1.5020766258239746, -1.1903703212738037, -0.8786640167236328, -0.5669577121734619, -0.25525134801864624, 0.056455016136169434, 0.36816132068634033, 0.6798676252365112, 0.9915740489959717, 1.3032803535461426, 1.6149866580963135, 1.9266929626464844, 2.2383992671966553, 2.550105571746826, 2.861812114715576, 3.173518180847168, 3.485224723815918, 3.796931028366089, 4.10863733291626, 4.42034387588501, 4.732049942016602, 5.043756484985352, 5.355462551116943, 5.667169094085693, 5.978875160217285, 6.290581703186035, 6.602288246154785, 6.913994789123535, 7.225700855255127, 7.537407398223877, 7.849113464355469, 8.160820007324219, 8.472526550292969, 8.784233093261719, 9.095938682556152]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 3.0, 7.0, 4.0, 2.0, 7.0, 8.0, 5.0, 8.0, 9.0, 19.0, 21.0, 17.0, 29.0, 33.0, 22.0, 34.0, 43.0, 28.0, 31.0, 40.0, 29.0, 34.0, 43.0, 44.0, 39.0, 43.0, 32.0, 36.0, 35.0, 32.0, 29.0, 34.0, 31.0, 26.0, 21.0, 23.0, 14.0, 22.0, 9.0, 11.0, 11.0, 6.0, 4.0, 10.0, 4.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.970574855804443, -7.683684349060059, -7.396793842315674, -7.109903335571289, -6.8230133056640625, -6.5361223220825195, -6.249232292175293, -5.962341785430908, -5.675451278686523, -5.388560771942139, -5.101670265197754, -4.814779758453369, -4.527889251708984, -4.240999221801758, -3.954108715057373, -3.6672182083129883, -3.3803277015686035, -3.0934371948242188, -2.806546688079834, -2.5196564197540283, -2.2327659130096436, -1.9458754062652588, -1.6589850187301636, -1.3720946311950684, -1.0852041244506836, -0.7983136773109436, -0.5114232301712036, -0.22453278303146362, 0.06235766410827637, 0.34924817085266113, 0.6361385583877563, 0.9230289459228516, 1.2099199295043945, 1.4968104362487793, 1.7837008237838745, 2.0705912113189697, 2.3574817180633545, 2.6443722248077393, 2.931262493133545, 3.2181529998779297, 3.5050435066223145, 3.791934013366699, 4.078824520111084, 4.365715026855469, 4.652605056762695, 4.939496040344238, 5.226386070251465, 5.51327657699585, 5.800167083740234, 6.087057590484619, 6.373948097229004, 6.660838603973389, 6.947729110717773, 7.234619140625, 7.521509647369385, 7.8084001541137695, 8.095291137695312, 8.382181167602539, 8.669072151184082, 8.955962181091309, 9.242853164672852, 9.529743194580078, 9.816634178161621, 10.103524208068848, 10.390414237976074]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 14.0, 21.0, 43.0, 49.0, 96.0, 131.0, 224.0, 338.0, 557.0, 875.0, 1418.0, 2190.0, 3273.0, 5287.0, 7741.0, 11979.0, 17360.0, 25018.0, 35525.0, 48260.0, 62627.0, 77383.0, 90562.0, 98216.0, 101336.0, 97166.0, 86261.0, 72617.0, 57651.0, 44115.0, 32128.0, 22553.0, 15542.0, 10477.0, 6899.0, 4583.0, 3030.0, 1871.0, 1142.0, 733.0, 452.0, 326.0, 190.0, 129.0, 76.0, 39.0, 26.0, 14.0, 13.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.3125, -5.14825439453125, -4.9840087890625, -4.81976318359375, -4.655517578125, -4.49127197265625, -4.3270263671875, -4.16278076171875, -3.99853515625, -3.83428955078125, -3.6700439453125, -3.50579833984375, -3.341552734375, -3.17730712890625, -3.0130615234375, -2.84881591796875, -2.6845703125, -2.52032470703125, -2.3560791015625, -2.19183349609375, -2.027587890625, -1.86334228515625, -1.6990966796875, -1.53485107421875, -1.37060546875, -1.20635986328125, -1.0421142578125, -0.87786865234375, -0.713623046875, -0.54937744140625, -0.3851318359375, -0.22088623046875, -0.056640625, 0.10760498046875, 0.2718505859375, 0.43609619140625, 0.600341796875, 0.76458740234375, 0.9288330078125, 1.09307861328125, 1.25732421875, 1.42156982421875, 1.5858154296875, 1.75006103515625, 1.914306640625, 2.07855224609375, 2.2427978515625, 2.40704345703125, 2.5712890625, 2.73553466796875, 2.8997802734375, 3.06402587890625, 3.228271484375, 3.39251708984375, 3.5567626953125, 3.72100830078125, 3.88525390625, 4.04949951171875, 4.2137451171875, 4.37799072265625, 4.542236328125, 4.70648193359375, 4.8707275390625, 5.03497314453125, 5.19921875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 8.0, 8.0, 4.0, 5.0, 12.0, 16.0, 15.0, 18.0, 23.0, 24.0, 34.0, 20.0, 34.0, 30.0, 30.0, 36.0, 41.0, 31.0, 34.0, 45.0, 42.0, 45.0, 38.0, 30.0, 32.0, 31.0, 33.0, 38.0, 27.0, 26.0, 24.0, 24.0, 19.0, 19.0, 13.0, 9.0, 11.0, 9.0, 13.0, 8.0, 7.0, 7.0, 8.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-8.9296875, -8.6497802734375, -8.369873046875, -8.0899658203125, -7.81005859375, -7.5301513671875, -7.250244140625, -6.9703369140625, -6.6904296875, -6.4105224609375, -6.130615234375, -5.8507080078125, -5.57080078125, -5.2908935546875, -5.010986328125, -4.7310791015625, -4.451171875, -4.1712646484375, -3.891357421875, -3.6114501953125, -3.33154296875, -3.0516357421875, -2.771728515625, -2.4918212890625, -2.2119140625, -1.9320068359375, -1.652099609375, -1.3721923828125, -1.09228515625, -0.8123779296875, -0.532470703125, -0.2525634765625, 0.02734375, 0.3072509765625, 0.587158203125, 0.8670654296875, 1.14697265625, 1.4268798828125, 1.706787109375, 1.9866943359375, 2.2666015625, 2.5465087890625, 2.826416015625, 3.1063232421875, 3.38623046875, 3.6661376953125, 3.946044921875, 4.2259521484375, 4.505859375, 4.7857666015625, 5.065673828125, 5.3455810546875, 5.62548828125, 5.9053955078125, 6.185302734375, 6.4652099609375, 6.7451171875, 7.0250244140625, 7.304931640625, 7.5848388671875, 7.86474609375, 8.1446533203125, 8.424560546875, 8.7044677734375, 8.984375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 1.0, 12.0, 18.0, 36.0, 48.0, 89.0, 152.0, 224.0, 333.0, 466.0, 744.0, 1162.0, 1795.0, 2752.0, 4272.0, 6381.0, 9584.0, 14410.0, 21251.0, 30295.0, 41737.0, 55782.0, 72144.0, 87360.0, 99547.0, 104187.0, 102171.0, 93410.0, 78736.0, 62852.0, 47530.0, 34600.0, 24442.0, 16600.0, 11339.0, 7624.0, 4959.0, 3371.0, 2165.0, 1433.0, 900.0, 563.0, 389.0, 239.0, 154.0, 97.0, 54.0, 40.0, 46.0, 25.0, 14.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-5.4765625, -5.3038330078125, -5.131103515625, -4.9583740234375, -4.78564453125, -4.6129150390625, -4.440185546875, -4.2674560546875, -4.0947265625, -3.9219970703125, -3.749267578125, -3.5765380859375, -3.40380859375, -3.2310791015625, -3.058349609375, -2.8856201171875, -2.712890625, -2.5401611328125, -2.367431640625, -2.1947021484375, -2.02197265625, -1.8492431640625, -1.676513671875, -1.5037841796875, -1.3310546875, -1.1583251953125, -0.985595703125, -0.8128662109375, -0.64013671875, -0.4674072265625, -0.294677734375, -0.1219482421875, 0.05078125, 0.2235107421875, 0.396240234375, 0.5689697265625, 0.74169921875, 0.9144287109375, 1.087158203125, 1.2598876953125, 1.4326171875, 1.6053466796875, 1.778076171875, 1.9508056640625, 2.12353515625, 2.2962646484375, 2.468994140625, 2.6417236328125, 2.814453125, 2.9871826171875, 3.159912109375, 3.3326416015625, 3.50537109375, 3.6781005859375, 3.850830078125, 4.0235595703125, 4.1962890625, 4.3690185546875, 4.541748046875, 4.7144775390625, 4.88720703125, 5.0599365234375, 5.232666015625, 5.4053955078125, 5.578125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 5.0, 4.0, 9.0, 6.0, 11.0, 6.0, 10.0, 9.0, 14.0, 16.0, 16.0, 22.0, 24.0, 27.0, 33.0, 28.0, 34.0, 36.0, 29.0, 37.0, 52.0, 34.0, 46.0, 41.0, 40.0, 37.0, 36.0, 33.0, 25.0, 30.0, 30.0, 28.0, 26.0, 12.0, 22.0, 26.0, 25.0, 14.0, 13.0, 16.0, 11.0, 8.0, 7.0, 6.0, 1.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.796875, -5.61627197265625, -5.4356689453125, -5.25506591796875, -5.074462890625, -4.89385986328125, -4.7132568359375, -4.53265380859375, -4.35205078125, -4.17144775390625, -3.9908447265625, -3.81024169921875, -3.629638671875, -3.44903564453125, -3.2684326171875, -3.08782958984375, -2.9072265625, -2.72662353515625, -2.5460205078125, -2.36541748046875, -2.184814453125, -2.00421142578125, -1.8236083984375, -1.64300537109375, -1.46240234375, -1.28179931640625, -1.1011962890625, -0.92059326171875, -0.739990234375, -0.55938720703125, -0.3787841796875, -0.19818115234375, -0.017578125, 0.16302490234375, 0.3436279296875, 0.52423095703125, 0.704833984375, 0.88543701171875, 1.0660400390625, 1.24664306640625, 1.42724609375, 1.60784912109375, 1.7884521484375, 1.96905517578125, 2.149658203125, 2.33026123046875, 2.5108642578125, 2.69146728515625, 2.8720703125, 3.05267333984375, 3.2332763671875, 3.41387939453125, 3.594482421875, 3.77508544921875, 3.9556884765625, 4.13629150390625, 4.31689453125, 4.49749755859375, 4.6781005859375, 4.85870361328125, 5.039306640625, 5.21990966796875, 5.4005126953125, 5.58111572265625, 5.76171875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 7.0, 9.0, 25.0, 29.0, 46.0, 72.0, 113.0, 151.0, 239.0, 396.0, 613.0, 1006.0, 1752.0, 2646.0, 4624.0, 7560.0, 11856.0, 19686.0, 30820.0, 47048.0, 68678.0, 92504.0, 114254.0, 128583.0, 126791.0, 112202.0, 89538.0, 65361.0, 44699.0, 29363.0, 18560.0, 11536.0, 6844.0, 4142.0, 2573.0, 1573.0, 968.0, 592.0, 390.0, 260.0, 152.0, 92.0, 78.0, 53.0, 22.0, 17.0, 14.0, 6.0, 0.0, 6.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.486328125, -2.408477783203125, -2.33062744140625, -2.252777099609375, -2.1749267578125, -2.097076416015625, -2.01922607421875, -1.941375732421875, -1.863525390625, -1.785675048828125, -1.70782470703125, -1.629974365234375, -1.5521240234375, -1.474273681640625, -1.39642333984375, -1.318572998046875, -1.24072265625, -1.162872314453125, -1.08502197265625, -1.007171630859375, -0.9293212890625, -0.851470947265625, -0.77362060546875, -0.695770263671875, -0.617919921875, -0.540069580078125, -0.46221923828125, -0.384368896484375, -0.3065185546875, -0.228668212890625, -0.15081787109375, -0.072967529296875, 0.0048828125, 0.082733154296875, 0.16058349609375, 0.238433837890625, 0.3162841796875, 0.394134521484375, 0.47198486328125, 0.549835205078125, 0.627685546875, 0.705535888671875, 0.78338623046875, 0.861236572265625, 0.9390869140625, 1.016937255859375, 1.09478759765625, 1.172637939453125, 1.25048828125, 1.328338623046875, 1.40618896484375, 1.484039306640625, 1.5618896484375, 1.639739990234375, 1.71759033203125, 1.795440673828125, 1.873291015625, 1.951141357421875, 2.02899169921875, 2.106842041015625, 2.1846923828125, 2.262542724609375, 2.34039306640625, 2.418243408203125, 2.49609375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 9.0, 1.0, 9.0, 9.0, 7.0, 11.0, 11.0, 16.0, 20.0, 29.0, 30.0, 28.0, 36.0, 40.0, 53.0, 46.0, 46.0, 49.0, 52.0, 60.0, 53.0, 54.0, 56.0, 48.0, 41.0, 27.0, 33.0, 24.0, 27.0, 15.0, 11.0, 12.0, 5.0, 3.0, 8.0, 7.0, 4.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0003371238708496094, -0.0003274008631706238, -0.0003176778554916382, -0.0003079548478126526, -0.000298231840133667, -0.0002885088324546814, -0.0002787858247756958, -0.0002690628170967102, -0.0002593398094177246, -0.000249616801738739, -0.00023989379405975342, -0.00023017078638076782, -0.00022044777870178223, -0.00021072477102279663, -0.00020100176334381104, -0.00019127875566482544, -0.00018155574798583984, -0.00017183274030685425, -0.00016210973262786865, -0.00015238672494888306, -0.00014266371726989746, -0.00013294070959091187, -0.00012321770191192627, -0.00011349469423294067, -0.00010377168655395508, -9.404867887496948e-05, -8.432567119598389e-05, -7.460266351699829e-05, -6.48796558380127e-05, -5.51566481590271e-05, -4.5433640480041504e-05, -3.571063280105591e-05, -2.5987625122070312e-05, -1.6264617443084717e-05, -6.541609764099121e-06, 3.1813979148864746e-06, 1.290440559387207e-05, 2.2627413272857666e-05, 3.235042095184326e-05, 4.207342863082886e-05, 5.179643630981445e-05, 6.151944398880005e-05, 7.124245166778564e-05, 8.096545934677124e-05, 9.068846702575684e-05, 0.00010041147470474243, 0.00011013448238372803, 0.00011985749006271362, 0.00012958049774169922, 0.00013930350542068481, 0.0001490265130996704, 0.000158749520778656, 0.0001684725284576416, 0.0001781955361366272, 0.0001879185438156128, 0.0001976415514945984, 0.00020736455917358398, 0.00021708756685256958, 0.00022681057453155518, 0.00023653358221054077, 0.00024625658988952637, 0.00025597959756851196, 0.00026570260524749756, 0.00027542561292648315, 0.00028514862060546875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 10.0, 11.0, 17.0, 24.0, 41.0, 60.0, 92.0, 156.0, 212.0, 416.0, 627.0, 1026.0, 1772.0, 3046.0, 5305.0, 9071.0, 15755.0, 26528.0, 43006.0, 65564.0, 93440.0, 119803.0, 137158.0, 137387.0, 120335.0, 93412.0, 66452.0, 42934.0, 26863.0, 15894.0, 9209.0, 5313.0, 3051.0, 1814.0, 1059.0, 597.0, 372.0, 271.0, 164.0, 91.0, 62.0, 45.0, 32.0, 17.0, 17.0, 7.0, 5.0, 3.0, 5.0, 4.0, 2.0, 2.0], "bins": [-3.0234375, -2.93707275390625, -2.8507080078125, -2.76434326171875, -2.677978515625, -2.59161376953125, -2.5052490234375, -2.41888427734375, -2.33251953125, -2.24615478515625, -2.1597900390625, -2.07342529296875, -1.987060546875, -1.90069580078125, -1.8143310546875, -1.72796630859375, -1.6416015625, -1.55523681640625, -1.4688720703125, -1.38250732421875, -1.296142578125, -1.20977783203125, -1.1234130859375, -1.03704833984375, -0.95068359375, -0.86431884765625, -0.7779541015625, -0.69158935546875, -0.605224609375, -0.51885986328125, -0.4324951171875, -0.34613037109375, -0.259765625, -0.17340087890625, -0.0870361328125, -0.00067138671875, 0.085693359375, 0.17205810546875, 0.2584228515625, 0.34478759765625, 0.43115234375, 0.51751708984375, 0.6038818359375, 0.69024658203125, 0.776611328125, 0.86297607421875, 0.9493408203125, 1.03570556640625, 1.1220703125, 1.20843505859375, 1.2947998046875, 1.38116455078125, 1.467529296875, 1.55389404296875, 1.6402587890625, 1.72662353515625, 1.81298828125, 1.89935302734375, 1.9857177734375, 2.07208251953125, 2.158447265625, 2.24481201171875, 2.3311767578125, 2.41754150390625, 2.50390625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 9.0, 3.0, 13.0, 10.0, 10.0, 14.0, 18.0, 24.0, 27.0, 32.0, 28.0, 37.0, 37.0, 53.0, 52.0, 58.0, 49.0, 44.0, 55.0, 48.0, 47.0, 54.0, 36.0, 32.0, 37.0, 37.0, 25.0, 23.0, 16.0, 13.0, 13.0, 11.0, 14.0, 7.0, 6.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.3388671875, -1.3030166625976562, -1.2671661376953125, -1.2313156127929688, -1.195465087890625, -1.1596145629882812, -1.1237640380859375, -1.0879135131835938, -1.05206298828125, -1.0162124633789062, -0.9803619384765625, -0.9445114135742188, -0.908660888671875, -0.8728103637695312, -0.8369598388671875, -0.8011093139648438, -0.7652587890625, -0.7294082641601562, -0.6935577392578125, -0.6577072143554688, -0.621856689453125, -0.5860061645507812, -0.5501556396484375, -0.5143051147460938, -0.47845458984375, -0.44260406494140625, -0.4067535400390625, -0.37090301513671875, -0.335052490234375, -0.29920196533203125, -0.2633514404296875, -0.22750091552734375, -0.191650390625, -0.15579986572265625, -0.1199493408203125, -0.08409881591796875, -0.048248291015625, -0.01239776611328125, 0.0234527587890625, 0.05930328369140625, 0.09515380859375, 0.13100433349609375, 0.1668548583984375, 0.20270538330078125, 0.238555908203125, 0.27440643310546875, 0.3102569580078125, 0.34610748291015625, 0.3819580078125, 0.41780853271484375, 0.4536590576171875, 0.48950958251953125, 0.525360107421875, 0.5612106323242188, 0.5970611572265625, 0.6329116821289062, 0.66876220703125, 0.7046127319335938, 0.7404632568359375, 0.7763137817382812, 0.812164306640625, 0.8480148315429688, 0.8838653564453125, 0.9197158813476562, 0.95556640625]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 5.0, 8.0, 8.0, 8.0, 6.0, 10.0, 9.0, 10.0, 25.0, 14.0, 29.0, 33.0, 39.0, 60.0, 46.0, 49.0, 51.0, 47.0, 40.0, 35.0, 51.0, 46.0, 42.0, 40.0, 34.0, 38.0, 26.0, 29.0, 25.0, 28.0, 21.0, 16.0, 10.0, 15.0, 14.0, 5.0, 4.0, 6.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.233351707458496, -9.934505462646484, -9.635658264160156, -9.336811065673828, -9.037964820861816, -8.739118576049805, -8.440271377563477, -8.141424179077148, -7.842577934265137, -7.543731212615967, -7.244884490966797, -6.946037769317627, -6.647191047668457, -6.348344326019287, -6.049497604370117, -5.750650882720947, -5.451804161071777, -5.152957439422607, -4.8541107177734375, -4.555263996124268, -4.256417274475098, -3.9575705528259277, -3.658723831176758, -3.359877109527588, -3.061030387878418, -2.762183666229248, -2.463336944580078, -2.164490222930908, -1.8656435012817383, -1.5667967796325684, -1.2679500579833984, -0.9691033363342285, -0.6702556610107422, -0.37140893936157227, -0.07256221771240234, 0.22628450393676758, 0.5251312255859375, 0.8239779472351074, 1.1228246688842773, 1.4216713905334473, 1.7205181121826172, 2.019364833831787, 2.318211555480957, 2.617058277130127, 2.915904998779297, 3.214751720428467, 3.5135984420776367, 3.8124451637268066, 4.111291885375977, 4.4101386070251465, 4.708985328674316, 5.007832050323486, 5.306678771972656, 5.605525493621826, 5.904372215270996, 6.203218936920166, 6.502065658569336, 6.800912380218506, 7.099759101867676, 7.398605823516846, 7.697452545166016, 7.9962992668151855, 8.295145988464355, 8.593992233276367, 8.892839431762695]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 4.0, 2.0, 6.0, 8.0, 9.0, 10.0, 9.0, 14.0, 13.0, 18.0, 21.0, 30.0, 20.0, 30.0, 30.0, 28.0, 35.0, 33.0, 45.0, 36.0, 40.0, 35.0, 33.0, 43.0, 43.0, 44.0, 40.0, 34.0, 45.0, 28.0, 35.0, 26.0, 16.0, 26.0, 17.0, 17.0, 9.0, 16.0, 16.0, 16.0, 5.0, 8.0, 3.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.006915092468262, -7.6960978507995605, -7.385280609130859, -7.074462890625, -6.763645648956299, -6.452828407287598, -6.1420111656188965, -5.831193923950195, -5.520376205444336, -5.209558963775635, -4.898741722106934, -4.587924003601074, -4.277106761932373, -3.966289520263672, -3.6554722785949707, -3.3446547985076904, -3.0338377952575684, -2.723020553588867, -2.412203073501587, -2.1013858318328857, -1.790568470954895, -1.4797511100769043, -1.1689338684082031, -0.8581163883209229, -0.5472991466522217, -0.23648181557655334, 0.07433551549911499, 0.38515281677246094, 0.6959701776504517, 1.0067875385284424, 1.3176047801971436, 1.6284222602844238, 1.939239501953125, 2.250056743621826, 2.5608742237091064, 2.8716914653778076, 3.182508945465088, 3.493326187133789, 3.8041434288024902, 4.114960670471191, 4.425778388977051, 4.736595630645752, 5.047412872314453, 5.3582305908203125, 5.669047832489014, 5.979865074157715, 6.290682315826416, 6.601499557495117, 6.912316799163818, 7.2231340408325195, 7.533951282501221, 7.844768524169922, 8.155586242675781, 8.46640396118164, 8.777220726013184, 9.088038444519043, 9.398855209350586, 9.709672927856445, 10.020489692687988, 10.331307411193848, 10.64212417602539, 10.95294189453125, 11.26375961303711, 11.574576377868652, 11.885394096374512]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 2.0, 12.0, 19.0, 30.0, 59.0, 81.0, 132.0, 221.0, 386.0, 616.0, 1001.0, 1692.0, 2773.0, 4630.0, 8123.0, 14060.0, 24538.0, 43974.0, 80749.0, 149900.0, 273977.0, 466945.0, 675012.0, 762091.0, 657606.0, 446685.0, 259342.0, 141920.0, 76707.0, 42516.0, 24101.0, 13802.0, 8038.0, 4864.0, 2956.0, 1725.0, 1089.0, 690.0, 447.0, 269.0, 182.0, 133.0, 75.0, 44.0, 24.0, 19.0, 10.0, 7.0, 7.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-8.5, -8.2381591796875, -7.976318359375, -7.7144775390625, -7.45263671875, -7.1907958984375, -6.928955078125, -6.6671142578125, -6.4052734375, -6.1434326171875, -5.881591796875, -5.6197509765625, -5.35791015625, -5.0960693359375, -4.834228515625, -4.5723876953125, -4.310546875, -4.0487060546875, -3.786865234375, -3.5250244140625, -3.26318359375, -3.0013427734375, -2.739501953125, -2.4776611328125, -2.2158203125, -1.9539794921875, -1.692138671875, -1.4302978515625, -1.16845703125, -0.9066162109375, -0.644775390625, -0.3829345703125, -0.12109375, 0.1407470703125, 0.402587890625, 0.6644287109375, 0.92626953125, 1.1881103515625, 1.449951171875, 1.7117919921875, 1.9736328125, 2.2354736328125, 2.497314453125, 2.7591552734375, 3.02099609375, 3.2828369140625, 3.544677734375, 3.8065185546875, 4.068359375, 4.3302001953125, 4.592041015625, 4.8538818359375, 5.11572265625, 5.3775634765625, 5.639404296875, 5.9012451171875, 6.1630859375, 6.4249267578125, 6.686767578125, 6.9486083984375, 7.21044921875, 7.4722900390625, 7.734130859375, 7.9959716796875, 8.2578125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 9.0, 3.0, 12.0, 11.0, 10.0, 14.0, 10.0, 22.0, 21.0, 22.0, 22.0, 29.0, 22.0, 33.0, 20.0, 40.0, 34.0, 33.0, 40.0, 38.0, 44.0, 34.0, 35.0, 39.0, 50.0, 36.0, 36.0, 36.0, 36.0, 19.0, 38.0, 20.0, 18.0, 21.0, 15.0, 10.0, 11.0, 13.0, 6.0, 6.0, 8.0, 6.0, 6.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.51953125, -7.26263427734375, -7.0057373046875, -6.74884033203125, -6.491943359375, -6.23504638671875, -5.9781494140625, -5.72125244140625, -5.46435546875, -5.20745849609375, -4.9505615234375, -4.69366455078125, -4.436767578125, -4.17987060546875, -3.9229736328125, -3.66607666015625, -3.4091796875, -3.15228271484375, -2.8953857421875, -2.63848876953125, -2.381591796875, -2.12469482421875, -1.8677978515625, -1.61090087890625, -1.35400390625, -1.09710693359375, -0.8402099609375, -0.58331298828125, -0.326416015625, -0.06951904296875, 0.1873779296875, 0.44427490234375, 0.701171875, 0.95806884765625, 1.2149658203125, 1.47186279296875, 1.728759765625, 1.98565673828125, 2.2425537109375, 2.49945068359375, 2.75634765625, 3.01324462890625, 3.2701416015625, 3.52703857421875, 3.783935546875, 4.04083251953125, 4.2977294921875, 4.55462646484375, 4.8115234375, 5.06842041015625, 5.3253173828125, 5.58221435546875, 5.839111328125, 6.09600830078125, 6.3529052734375, 6.60980224609375, 6.86669921875, 7.12359619140625, 7.3804931640625, 7.63739013671875, 7.894287109375, 8.15118408203125, 8.4080810546875, 8.66497802734375, 8.921875]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 6.0, 2.0, 4.0, 5.0, 10.0, 34.0, 46.0, 55.0, 98.0, 153.0, 236.0, 308.0, 500.0, 787.0, 1223.0, 1991.0, 3234.0, 5067.0, 8168.0, 12923.0, 20561.0, 34311.0, 54860.0, 88796.0, 143116.0, 226637.0, 342793.0, 482698.0, 592650.0, 606053.0, 514631.0, 375822.0, 253334.0, 160834.0, 99987.0, 62127.0, 37969.0, 23320.0, 14557.0, 8940.0, 5577.0, 3687.0, 2248.0, 1438.0, 908.0, 564.0, 360.0, 244.0, 165.0, 81.0, 62.0, 51.0, 26.0, 23.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0], "bins": [-8.203125, -7.94775390625, -7.6923828125, -7.43701171875, -7.181640625, -6.92626953125, -6.6708984375, -6.41552734375, -6.16015625, -5.90478515625, -5.6494140625, -5.39404296875, -5.138671875, -4.88330078125, -4.6279296875, -4.37255859375, -4.1171875, -3.86181640625, -3.6064453125, -3.35107421875, -3.095703125, -2.84033203125, -2.5849609375, -2.32958984375, -2.07421875, -1.81884765625, -1.5634765625, -1.30810546875, -1.052734375, -0.79736328125, -0.5419921875, -0.28662109375, -0.03125, 0.22412109375, 0.4794921875, 0.73486328125, 0.990234375, 1.24560546875, 1.5009765625, 1.75634765625, 2.01171875, 2.26708984375, 2.5224609375, 2.77783203125, 3.033203125, 3.28857421875, 3.5439453125, 3.79931640625, 4.0546875, 4.31005859375, 4.5654296875, 4.82080078125, 5.076171875, 5.33154296875, 5.5869140625, 5.84228515625, 6.09765625, 6.35302734375, 6.6083984375, 6.86376953125, 7.119140625, 7.37451171875, 7.6298828125, 7.88525390625, 8.140625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 4.0, 12.0, 3.0, 11.0, 12.0, 11.0, 37.0, 35.0, 50.0, 59.0, 78.0, 82.0, 109.0, 106.0, 160.0, 145.0, 193.0, 209.0, 237.0, 208.0, 239.0, 237.0, 254.0, 235.0, 218.0, 171.0, 174.0, 138.0, 119.0, 113.0, 103.0, 78.0, 65.0, 50.0, 32.0, 20.0, 16.0, 17.0, 16.0, 11.0, 6.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9140625, -3.787841796875, -3.66162109375, -3.535400390625, -3.4091796875, -3.282958984375, -3.15673828125, -3.030517578125, -2.904296875, -2.778076171875, -2.65185546875, -2.525634765625, -2.3994140625, -2.273193359375, -2.14697265625, -2.020751953125, -1.89453125, -1.768310546875, -1.64208984375, -1.515869140625, -1.3896484375, -1.263427734375, -1.13720703125, -1.010986328125, -0.884765625, -0.758544921875, -0.63232421875, -0.506103515625, -0.3798828125, -0.253662109375, -0.12744140625, -0.001220703125, 0.125, 0.251220703125, 0.37744140625, 0.503662109375, 0.6298828125, 0.756103515625, 0.88232421875, 1.008544921875, 1.134765625, 1.260986328125, 1.38720703125, 1.513427734375, 1.6396484375, 1.765869140625, 1.89208984375, 2.018310546875, 2.14453125, 2.270751953125, 2.39697265625, 2.523193359375, 2.6494140625, 2.775634765625, 2.90185546875, 3.028076171875, 3.154296875, 3.280517578125, 3.40673828125, 3.532958984375, 3.6591796875, 3.785400390625, 3.91162109375, 4.037841796875, 4.1640625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 8.0, 4.0, 10.0, 8.0, 6.0, 7.0, 16.0, 17.0, 27.0, 31.0, 36.0, 39.0, 43.0, 46.0, 50.0, 44.0, 49.0, 60.0, 53.0, 53.0, 42.0, 44.0, 38.0, 45.0, 33.0, 54.0, 25.0, 30.0, 15.0, 8.0, 17.0, 16.0, 9.0, 11.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.51759147644043, -12.170232772827148, -11.822874069213867, -11.475516319274902, -11.128157615661621, -10.78079891204834, -10.433440208435059, -10.086082458496094, -9.738723754882812, -9.391365051269531, -9.04400634765625, -8.696648597717285, -8.349289894104004, -8.001931190490723, -7.654572486877441, -7.307214260101318, -6.959855556488037, -6.612496852874756, -6.265138626098633, -5.917779922485352, -5.5704216957092285, -5.223062992095947, -4.875704765319824, -4.528346061706543, -4.180987358093262, -3.8336288928985596, -3.4862704277038574, -3.138911724090576, -2.791553497314453, -2.444194793701172, -2.0968363285064697, -1.7494778633117676, -1.4021196365356445, -1.0547611713409424, -0.7074026465415955, -0.36004412174224854, -0.012685656547546387, 0.33467280864715576, 0.6820313930511475, 1.0293898582458496, 1.3767483234405518, 1.724106788635254, 2.071465253829956, 2.418823719024658, 2.7661824226379395, 3.1135406494140625, 3.4608993530273438, 3.808257818222046, 4.155616283416748, 4.502974987030029, 4.850333213806152, 5.197691917419434, 5.545050144195557, 5.892408847808838, 6.239767074584961, 6.587125778198242, 6.934484481811523, 7.281843185424805, 7.629201412200928, 7.976560115814209, 8.323918342590332, 8.671277046203613, 9.018635749816895, 9.36599349975586, 9.71335220336914]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 9.0, 11.0, 14.0, 9.0, 13.0, 13.0, 15.0, 18.0, 26.0, 29.0, 31.0, 30.0, 32.0, 35.0, 33.0, 53.0, 34.0, 31.0, 34.0, 47.0, 58.0, 43.0, 33.0, 29.0, 30.0, 38.0, 23.0, 31.0, 26.0, 27.0, 23.0, 20.0, 21.0, 12.0, 15.0, 11.0, 13.0, 11.0, 3.0, 3.0, 0.0, 2.0, 6.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.340636253356934, -8.03688907623291, -7.73314094543457, -7.429393291473389, -7.125645637512207, -6.821898460388184, -6.518150806427002, -6.21440315246582, -5.910655498504639, -5.606907844543457, -5.303160190582275, -4.999412536621094, -4.69566535949707, -4.3919172286987305, -4.088170051574707, -3.7844223976135254, -3.4806747436523438, -3.176927089691162, -2.8731794357299805, -2.569432020187378, -2.2656843662261963, -1.9619367122650146, -1.6581891775131226, -1.3544416427612305, -1.0506939888000488, -0.746946394443512, -0.4431988000869751, -0.13945120573043823, 0.16429638862609863, 0.4680440425872803, 0.7717915773391724, 1.0755391120910645, 1.3792877197265625, 1.6830353736877441, 1.9867829084396362, 2.2905304431915283, 2.59427809715271, 2.8980257511138916, 3.201773166656494, 3.505520820617676, 3.8092684745788574, 4.113016128540039, 4.416763782501221, 4.720511436462402, 5.024258613586426, 5.328006744384766, 5.631753921508789, 5.935501575469971, 6.239249229431152, 6.542996883392334, 6.846744537353516, 7.150492191314697, 7.454239845275879, 7.757987022399902, 8.061735153198242, 8.365482330322266, 8.669229507446289, 8.972976684570312, 9.276724815368652, 9.580471992492676, 9.884220123291016, 10.187967300415039, 10.491715431213379, 10.795462608337402, 11.099210739135742]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 7.0, 9.0, 9.0, 18.0, 16.0, 22.0, 33.0, 62.0, 81.0, 113.0, 185.0, 249.0, 415.0, 546.0, 864.0, 1289.0, 1959.0, 3172.0, 4877.0, 7745.0, 12048.0, 18785.0, 29227.0, 43946.0, 63695.0, 87243.0, 110125.0, 126034.0, 127399.0, 113777.0, 91801.0, 67920.0, 46630.0, 31546.0, 20419.0, 12908.0, 8373.0, 5122.0, 3403.0, 2185.0, 1460.0, 967.0, 646.0, 410.0, 271.0, 164.0, 121.0, 94.0, 51.0, 43.0, 28.0, 17.0, 5.0, 9.0, 9.0, 7.0, 5.0, 1.0, 2.0, 1.0, 2.0], "bins": [-4.859375, -4.70306396484375, -4.5467529296875, -4.39044189453125, -4.234130859375, -4.07781982421875, -3.9215087890625, -3.76519775390625, -3.60888671875, -3.45257568359375, -3.2962646484375, -3.13995361328125, -2.983642578125, -2.82733154296875, -2.6710205078125, -2.51470947265625, -2.3583984375, -2.20208740234375, -2.0457763671875, -1.88946533203125, -1.733154296875, -1.57684326171875, -1.4205322265625, -1.26422119140625, -1.10791015625, -0.95159912109375, -0.7952880859375, -0.63897705078125, -0.482666015625, -0.32635498046875, -0.1700439453125, -0.01373291015625, 0.142578125, 0.29888916015625, 0.4552001953125, 0.61151123046875, 0.767822265625, 0.92413330078125, 1.0804443359375, 1.23675537109375, 1.39306640625, 1.54937744140625, 1.7056884765625, 1.86199951171875, 2.018310546875, 2.17462158203125, 2.3309326171875, 2.48724365234375, 2.6435546875, 2.79986572265625, 2.9561767578125, 3.11248779296875, 3.268798828125, 3.42510986328125, 3.5814208984375, 3.73773193359375, 3.89404296875, 4.05035400390625, 4.2066650390625, 4.36297607421875, 4.519287109375, 4.67559814453125, 4.8319091796875, 4.98822021484375, 5.14453125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 8.0, 13.0, 11.0, 9.0, 11.0, 17.0, 17.0, 19.0, 22.0, 19.0, 40.0, 30.0, 24.0, 44.0, 40.0, 35.0, 37.0, 39.0, 35.0, 43.0, 42.0, 31.0, 42.0, 47.0, 36.0, 34.0, 34.0, 29.0, 23.0, 21.0, 22.0, 20.0, 20.0, 15.0, 14.0, 8.0, 9.0, 8.0, 12.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.15625, -7.851806640625, -7.54736328125, -7.242919921875, -6.9384765625, -6.634033203125, -6.32958984375, -6.025146484375, -5.720703125, -5.416259765625, -5.11181640625, -4.807373046875, -4.5029296875, -4.198486328125, -3.89404296875, -3.589599609375, -3.28515625, -2.980712890625, -2.67626953125, -2.371826171875, -2.0673828125, -1.762939453125, -1.45849609375, -1.154052734375, -0.849609375, -0.545166015625, -0.24072265625, 0.063720703125, 0.3681640625, 0.672607421875, 0.97705078125, 1.281494140625, 1.5859375, 1.890380859375, 2.19482421875, 2.499267578125, 2.8037109375, 3.108154296875, 3.41259765625, 3.717041015625, 4.021484375, 4.325927734375, 4.63037109375, 4.934814453125, 5.2392578125, 5.543701171875, 5.84814453125, 6.152587890625, 6.45703125, 6.761474609375, 7.06591796875, 7.370361328125, 7.6748046875, 7.979248046875, 8.28369140625, 8.588134765625, 8.892578125, 9.197021484375, 9.50146484375, 9.805908203125, 10.1103515625, 10.414794921875, 10.71923828125, 11.023681640625, 11.328125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 6.0, 4.0, 11.0, 9.0, 27.0, 21.0, 36.0, 65.0, 75.0, 117.0, 156.0, 267.0, 394.0, 616.0, 1047.0, 1717.0, 2886.0, 5151.0, 8953.0, 16479.0, 30078.0, 54155.0, 94906.0, 149249.0, 193000.0, 181505.0, 129465.0, 78459.0, 44093.0, 24107.0, 13462.0, 7490.0, 4178.0, 2476.0, 1449.0, 887.0, 558.0, 326.0, 219.0, 146.0, 86.0, 82.0, 42.0, 35.0, 22.0, 18.0, 10.0, 13.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.53125, -8.2545166015625, -7.977783203125, -7.7010498046875, -7.42431640625, -7.1475830078125, -6.870849609375, -6.5941162109375, -6.3173828125, -6.0406494140625, -5.763916015625, -5.4871826171875, -5.21044921875, -4.9337158203125, -4.656982421875, -4.3802490234375, -4.103515625, -3.8267822265625, -3.550048828125, -3.2733154296875, -2.99658203125, -2.7198486328125, -2.443115234375, -2.1663818359375, -1.8896484375, -1.6129150390625, -1.336181640625, -1.0594482421875, -0.78271484375, -0.5059814453125, -0.229248046875, 0.0474853515625, 0.32421875, 0.6009521484375, 0.877685546875, 1.1544189453125, 1.43115234375, 1.7078857421875, 1.984619140625, 2.2613525390625, 2.5380859375, 2.8148193359375, 3.091552734375, 3.3682861328125, 3.64501953125, 3.9217529296875, 4.198486328125, 4.4752197265625, 4.751953125, 5.0286865234375, 5.305419921875, 5.5821533203125, 5.85888671875, 6.1356201171875, 6.412353515625, 6.6890869140625, 6.9658203125, 7.2425537109375, 7.519287109375, 7.7960205078125, 8.07275390625, 8.3494873046875, 8.626220703125, 8.9029541015625, 9.1796875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 4.0, 2.0, 9.0, 5.0, 11.0, 14.0, 15.0, 10.0, 14.0, 17.0, 29.0, 27.0, 22.0, 22.0, 34.0, 30.0, 47.0, 48.0, 49.0, 35.0, 41.0, 39.0, 47.0, 57.0, 42.0, 40.0, 34.0, 32.0, 37.0, 23.0, 25.0, 25.0, 20.0, 21.0, 15.0, 11.0, 11.0, 7.0, 7.0, 8.0, 6.0, 5.0, 2.0, 0.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.93359375, -6.72735595703125, -6.5211181640625, -6.31488037109375, -6.108642578125, -5.90240478515625, -5.6961669921875, -5.48992919921875, -5.28369140625, -5.07745361328125, -4.8712158203125, -4.66497802734375, -4.458740234375, -4.25250244140625, -4.0462646484375, -3.84002685546875, -3.6337890625, -3.42755126953125, -3.2213134765625, -3.01507568359375, -2.808837890625, -2.60260009765625, -2.3963623046875, -2.19012451171875, -1.98388671875, -1.77764892578125, -1.5714111328125, -1.36517333984375, -1.158935546875, -0.95269775390625, -0.7464599609375, -0.54022216796875, -0.333984375, -0.12774658203125, 0.0784912109375, 0.28472900390625, 0.490966796875, 0.69720458984375, 0.9034423828125, 1.10968017578125, 1.31591796875, 1.52215576171875, 1.7283935546875, 1.93463134765625, 2.140869140625, 2.34710693359375, 2.5533447265625, 2.75958251953125, 2.9658203125, 3.17205810546875, 3.3782958984375, 3.58453369140625, 3.790771484375, 3.99700927734375, 4.2032470703125, 4.40948486328125, 4.61572265625, 4.82196044921875, 5.0281982421875, 5.23443603515625, 5.440673828125, 5.64691162109375, 5.8531494140625, 6.05938720703125, 6.265625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 16.0, 25.0, 39.0, 47.0, 85.0, 123.0, 189.0, 296.0, 499.0, 748.0, 1204.0, 1899.0, 3108.0, 5033.0, 8208.0, 13391.0, 21844.0, 36857.0, 59994.0, 94969.0, 136882.0, 167466.0, 160024.0, 122801.0, 82210.0, 51248.0, 31007.0, 18843.0, 11264.0, 6830.0, 4275.0, 2636.0, 1627.0, 1063.0, 649.0, 415.0, 298.0, 173.0, 93.0, 68.0, 42.0, 24.0, 16.0, 8.0, 9.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.607421875, -3.50079345703125, -3.3941650390625, -3.28753662109375, -3.180908203125, -3.07427978515625, -2.9676513671875, -2.86102294921875, -2.75439453125, -2.64776611328125, -2.5411376953125, -2.43450927734375, -2.327880859375, -2.22125244140625, -2.1146240234375, -2.00799560546875, -1.9013671875, -1.79473876953125, -1.6881103515625, -1.58148193359375, -1.474853515625, -1.36822509765625, -1.2615966796875, -1.15496826171875, -1.04833984375, -0.94171142578125, -0.8350830078125, -0.72845458984375, -0.621826171875, -0.51519775390625, -0.4085693359375, -0.30194091796875, -0.1953125, -0.08868408203125, 0.0179443359375, 0.12457275390625, 0.231201171875, 0.33782958984375, 0.4444580078125, 0.55108642578125, 0.65771484375, 0.76434326171875, 0.8709716796875, 0.97760009765625, 1.084228515625, 1.19085693359375, 1.2974853515625, 1.40411376953125, 1.5107421875, 1.61737060546875, 1.7239990234375, 1.83062744140625, 1.937255859375, 2.04388427734375, 2.1505126953125, 2.25714111328125, 2.36376953125, 2.47039794921875, 2.5770263671875, 2.68365478515625, 2.790283203125, 2.89691162109375, 3.0035400390625, 3.11016845703125, 3.216796875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 11.0, 10.0, 12.0, 27.0, 28.0, 36.0, 42.0, 72.0, 81.0, 64.0, 93.0, 84.0, 81.0, 86.0, 76.0, 48.0, 26.0, 32.0, 19.0, 15.0, 9.0, 11.0, 5.0, 6.0, 4.0, 1.0, 5.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00027251243591308594, -0.0002617053687572479, -0.0002508983016014099, -0.0002400912344455719, -0.0002292841672897339, -0.00021847710013389587, -0.00020767003297805786, -0.00019686296582221985, -0.00018605589866638184, -0.00017524883151054382, -0.0001644417643547058, -0.0001536346971988678, -0.00014282763004302979, -0.00013202056288719177, -0.00012121349573135376, -0.00011040642857551575, -9.959936141967773e-05, -8.879229426383972e-05, -7.798522710800171e-05, -6.71781599521637e-05, -5.6371092796325684e-05, -4.556402564048767e-05, -3.475695848464966e-05, -2.3949891328811646e-05, -1.3142824172973633e-05, -2.33575701713562e-06, 8.471310138702393e-06, 1.9278377294540405e-05, 3.0085444450378418e-05, 4.089251160621643e-05, 5.169957876205444e-05, 6.250664591789246e-05, 7.331371307373047e-05, 8.412078022956848e-05, 9.49278473854065e-05, 0.00010573491454124451, 0.00011654198169708252, 0.00012734904885292053, 0.00013815611600875854, 0.00014896318316459656, 0.00015977025032043457, 0.00017057731747627258, 0.0001813843846321106, 0.0001921914517879486, 0.00020299851894378662, 0.00021380558609962463, 0.00022461265325546265, 0.00023541972041130066, 0.00024622678756713867, 0.0002570338547229767, 0.0002678409218788147, 0.0002786479890346527, 0.0002894550561904907, 0.00030026212334632874, 0.00031106919050216675, 0.00032187625765800476, 0.0003326833248138428, 0.0003434903919696808, 0.0003542974591255188, 0.0003651045262813568, 0.0003759115934371948, 0.00038671866059303284, 0.00039752572774887085, 0.00040833279490470886, 0.0004191398620605469]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 7.0, 12.0, 14.0, 18.0, 42.0, 45.0, 67.0, 93.0, 132.0, 186.0, 280.0, 386.0, 564.0, 840.0, 1290.0, 1896.0, 2727.0, 4317.0, 6715.0, 10074.0, 15713.0, 23913.0, 36104.0, 53526.0, 75592.0, 99922.0, 119874.0, 128849.0, 120882.0, 101704.0, 77567.0, 55341.0, 37632.0, 24897.0, 16536.0, 10384.0, 6829.0, 4487.0, 3104.0, 1961.0, 1291.0, 852.0, 596.0, 378.0, 293.0, 194.0, 137.0, 91.0, 64.0, 44.0, 41.0, 24.0, 7.0, 11.0, 5.0, 7.0, 5.0, 3.0, 2.0, 2.0], "bins": [-3.1875, -3.086456298828125, -2.98541259765625, -2.884368896484375, -2.7833251953125, -2.682281494140625, -2.58123779296875, -2.480194091796875, -2.379150390625, -2.278106689453125, -2.17706298828125, -2.076019287109375, -1.9749755859375, -1.873931884765625, -1.77288818359375, -1.671844482421875, -1.57080078125, -1.469757080078125, -1.36871337890625, -1.267669677734375, -1.1666259765625, -1.065582275390625, -0.96453857421875, -0.863494873046875, -0.762451171875, -0.661407470703125, -0.56036376953125, -0.459320068359375, -0.3582763671875, -0.257232666015625, -0.15618896484375, -0.055145263671875, 0.0458984375, 0.146942138671875, 0.24798583984375, 0.349029541015625, 0.4500732421875, 0.551116943359375, 0.65216064453125, 0.753204345703125, 0.854248046875, 0.955291748046875, 1.05633544921875, 1.157379150390625, 1.2584228515625, 1.359466552734375, 1.46051025390625, 1.561553955078125, 1.66259765625, 1.763641357421875, 1.86468505859375, 1.965728759765625, 2.0667724609375, 2.167816162109375, 2.26885986328125, 2.369903564453125, 2.470947265625, 2.571990966796875, 2.67303466796875, 2.774078369140625, 2.8751220703125, 2.976165771484375, 3.07720947265625, 3.178253173828125, 3.279296875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 5.0, 3.0, 2.0, 5.0, 6.0, 9.0, 12.0, 12.0, 11.0, 18.0, 15.0, 25.0, 32.0, 35.0, 40.0, 32.0, 39.0, 40.0, 38.0, 41.0, 42.0, 52.0, 45.0, 38.0, 40.0, 39.0, 22.0, 31.0, 40.0, 27.0, 32.0, 26.0, 28.0, 13.0, 17.0, 13.0, 17.0, 12.0, 9.0, 9.0, 6.0, 6.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.115234375, -1.07635498046875, -1.0374755859375, -0.99859619140625, -0.959716796875, -0.92083740234375, -0.8819580078125, -0.84307861328125, -0.80419921875, -0.76531982421875, -0.7264404296875, -0.68756103515625, -0.648681640625, -0.60980224609375, -0.5709228515625, -0.53204345703125, -0.4931640625, -0.45428466796875, -0.4154052734375, -0.37652587890625, -0.337646484375, -0.29876708984375, -0.2598876953125, -0.22100830078125, -0.18212890625, -0.14324951171875, -0.1043701171875, -0.06549072265625, -0.026611328125, 0.01226806640625, 0.0511474609375, 0.09002685546875, 0.12890625, 0.16778564453125, 0.2066650390625, 0.24554443359375, 0.284423828125, 0.32330322265625, 0.3621826171875, 0.40106201171875, 0.43994140625, 0.47882080078125, 0.5177001953125, 0.55657958984375, 0.595458984375, 0.63433837890625, 0.6732177734375, 0.71209716796875, 0.7509765625, 0.78985595703125, 0.8287353515625, 0.86761474609375, 0.906494140625, 0.94537353515625, 0.9842529296875, 1.02313232421875, 1.06201171875, 1.10089111328125, 1.1397705078125, 1.17864990234375, 1.217529296875, 1.25640869140625, 1.2952880859375, 1.33416748046875, 1.373046875]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 8.0, 7.0, 0.0, 7.0, 12.0, 12.0, 8.0, 18.0, 24.0, 25.0, 35.0, 41.0, 42.0, 53.0, 45.0, 54.0, 44.0, 61.0, 44.0, 59.0, 46.0, 61.0, 48.0, 43.0, 47.0, 28.0, 25.0, 28.0, 20.0, 21.0, 7.0, 12.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.344079971313477, -12.984573364257812, -12.625065803527832, -12.265558242797852, -11.906051635742188, -11.546545028686523, -11.187037467956543, -10.827529907226562, -10.468023300170898, -10.108516693115234, -9.749009132385254, -9.389501571655273, -9.02999496459961, -8.670488357543945, -8.310980796813965, -7.951473712921143, -7.59196662902832, -7.232459545135498, -6.872952461242676, -6.5134453773498535, -6.153938293457031, -5.794431209564209, -5.434924125671387, -5.0754170417785645, -4.715909957885742, -4.35640287399292, -3.9968957901000977, -3.6373887062072754, -3.277881622314453, -2.918374538421631, -2.5588674545288086, -2.1993603706359863, -1.8398542404174805, -1.4803471565246582, -1.120840072631836, -0.7613329887390137, -0.4018259048461914, -0.04231882095336914, 0.3171882629394531, 0.6766953468322754, 1.0362024307250977, 1.39570951461792, 1.7552165985107422, 2.1147236824035645, 2.4742307662963867, 2.833737850189209, 3.1932449340820312, 3.5527520179748535, 3.912259101867676, 4.271766185760498, 4.63127326965332, 4.990780353546143, 5.350287437438965, 5.709794521331787, 6.069301605224609, 6.428808689117432, 6.788315773010254, 7.147822856903076, 7.507329940795898, 7.866837024688721, 8.226344108581543, 8.585851669311523, 8.945358276367188, 9.304864883422852, 9.664372444152832]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 12.0, 6.0, 12.0, 12.0, 10.0, 17.0, 18.0, 24.0, 18.0, 28.0, 34.0, 29.0, 34.0, 41.0, 29.0, 30.0, 40.0, 45.0, 40.0, 47.0, 42.0, 44.0, 44.0, 33.0, 30.0, 28.0, 34.0, 24.0, 30.0, 24.0, 21.0, 20.0, 15.0, 20.0, 11.0, 16.0, 9.0, 9.0, 3.0, 1.0, 4.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.287129402160645, -7.985505104064941, -7.683880805969238, -7.382256507873535, -7.080632209777832, -6.779007911682129, -6.477383136749268, -6.1757588386535645, -5.874134540557861, -5.572510242462158, -5.270885944366455, -4.969261646270752, -4.667636871337891, -4.3660125732421875, -4.064388275146484, -3.7627639770507812, -3.461139678955078, -3.159515380859375, -2.857891082763672, -2.5562665462493896, -2.2546422481536865, -1.9530179500579834, -1.6513935327529907, -1.349769115447998, -1.048144817352295, -0.746520459651947, -0.4448961019515991, -0.14327174425125122, 0.15835261344909668, 0.4599769115447998, 0.7616013288497925, 1.0632257461547852, 1.3648490905761719, 1.666473388671875, 1.9680978059768677, 2.2697222232818604, 2.5713465213775635, 2.8729708194732666, 3.174595355987549, 3.476219654083252, 3.777843952178955, 4.079468250274658, 4.381092548370361, 4.6827168464660645, 4.984341621398926, 5.285965919494629, 5.587590217590332, 5.889214515686035, 6.190838813781738, 6.492463111877441, 6.7940874099731445, 7.095711708068848, 7.397336006164551, 7.698960304260254, 8.000584602355957, 8.302209854125977, 8.60383415222168, 8.905458450317383, 9.207082748413086, 9.508707046508789, 9.810331344604492, 10.111955642700195, 10.413579940795898, 10.715204238891602, 11.016828536987305]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 9.0, 11.0, 11.0, 18.0, 34.0, 31.0, 45.0, 85.0, 137.0, 199.0, 308.0, 465.0, 638.0, 977.0, 1486.0, 2371.0, 3539.0, 5379.0, 7993.0, 11940.0, 17788.0, 25194.0, 35307.0, 47545.0, 61088.0, 75383.0, 87983.0, 97542.0, 100148.0, 95769.0, 86736.0, 73090.0, 58662.0, 44850.0, 32963.0, 23583.0, 16302.0, 10964.0, 7553.0, 4995.0, 3205.0, 2104.0, 1436.0, 938.0, 602.0, 414.0, 257.0, 173.0, 118.0, 76.0, 43.0, 20.0, 20.0, 14.0, 8.0, 6.0, 11.0, 3.0, 0.0, 1.0], "bins": [-5.17578125, -5.01605224609375, -4.8563232421875, -4.69659423828125, -4.536865234375, -4.37713623046875, -4.2174072265625, -4.05767822265625, -3.89794921875, -3.73822021484375, -3.5784912109375, -3.41876220703125, -3.259033203125, -3.09930419921875, -2.9395751953125, -2.77984619140625, -2.6201171875, -2.46038818359375, -2.3006591796875, -2.14093017578125, -1.981201171875, -1.82147216796875, -1.6617431640625, -1.50201416015625, -1.34228515625, -1.18255615234375, -1.0228271484375, -0.86309814453125, -0.703369140625, -0.54364013671875, -0.3839111328125, -0.22418212890625, -0.064453125, 0.09527587890625, 0.2550048828125, 0.41473388671875, 0.574462890625, 0.73419189453125, 0.8939208984375, 1.05364990234375, 1.21337890625, 1.37310791015625, 1.5328369140625, 1.69256591796875, 1.852294921875, 2.01202392578125, 2.1717529296875, 2.33148193359375, 2.4912109375, 2.65093994140625, 2.8106689453125, 2.97039794921875, 3.130126953125, 3.28985595703125, 3.4495849609375, 3.60931396484375, 3.76904296875, 3.92877197265625, 4.0885009765625, 4.24822998046875, 4.407958984375, 4.56768798828125, 4.7274169921875, 4.88714599609375, 5.046875]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 1.0, 4.0, 7.0, 8.0, 7.0, 8.0, 10.0, 11.0, 14.0, 18.0, 15.0, 21.0, 19.0, 34.0, 37.0, 25.0, 30.0, 36.0, 37.0, 39.0, 39.0, 38.0, 42.0, 49.0, 51.0, 28.0, 39.0, 35.0, 44.0, 23.0, 34.0, 20.0, 23.0, 18.0, 26.0, 20.0, 20.0, 17.0, 8.0, 14.0, 8.0, 8.0, 8.0, 3.0, 3.0, 4.0, 1.0, 0.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.92578125, -7.62225341796875, -7.3187255859375, -7.01519775390625, -6.711669921875, -6.40814208984375, -6.1046142578125, -5.80108642578125, -5.49755859375, -5.19403076171875, -4.8905029296875, -4.58697509765625, -4.283447265625, -3.97991943359375, -3.6763916015625, -3.37286376953125, -3.0693359375, -2.76580810546875, -2.4622802734375, -2.15875244140625, -1.855224609375, -1.55169677734375, -1.2481689453125, -0.94464111328125, -0.64111328125, -0.33758544921875, -0.0340576171875, 0.26947021484375, 0.572998046875, 0.87652587890625, 1.1800537109375, 1.48358154296875, 1.787109375, 2.09063720703125, 2.3941650390625, 2.69769287109375, 3.001220703125, 3.30474853515625, 3.6082763671875, 3.91180419921875, 4.21533203125, 4.51885986328125, 4.8223876953125, 5.12591552734375, 5.429443359375, 5.73297119140625, 6.0364990234375, 6.34002685546875, 6.6435546875, 6.94708251953125, 7.2506103515625, 7.55413818359375, 7.857666015625, 8.16119384765625, 8.4647216796875, 8.76824951171875, 9.07177734375, 9.37530517578125, 9.6788330078125, 9.98236083984375, 10.285888671875, 10.58941650390625, 10.8929443359375, 11.19647216796875, 11.5]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 12.0, 26.0, 41.0, 35.0, 86.0, 111.0, 154.0, 297.0, 400.0, 637.0, 1064.0, 1620.0, 2515.0, 3788.0, 5821.0, 9036.0, 13247.0, 19471.0, 28397.0, 39895.0, 53843.0, 70006.0, 84839.0, 98268.0, 104346.0, 103522.0, 94733.0, 81679.0, 65285.0, 49942.0, 36609.0, 26091.0, 17582.0, 12064.0, 7961.0, 5255.0, 3491.0, 2250.0, 1452.0, 974.0, 631.0, 399.0, 251.0, 152.0, 104.0, 67.0, 41.0, 28.0, 18.0, 9.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.453125, -5.2764892578125, -5.099853515625, -4.9232177734375, -4.74658203125, -4.5699462890625, -4.393310546875, -4.2166748046875, -4.0400390625, -3.8634033203125, -3.686767578125, -3.5101318359375, -3.33349609375, -3.1568603515625, -2.980224609375, -2.8035888671875, -2.626953125, -2.4503173828125, -2.273681640625, -2.0970458984375, -1.92041015625, -1.7437744140625, -1.567138671875, -1.3905029296875, -1.2138671875, -1.0372314453125, -0.860595703125, -0.6839599609375, -0.50732421875, -0.3306884765625, -0.154052734375, 0.0225830078125, 0.19921875, 0.3758544921875, 0.552490234375, 0.7291259765625, 0.90576171875, 1.0823974609375, 1.259033203125, 1.4356689453125, 1.6123046875, 1.7889404296875, 1.965576171875, 2.1422119140625, 2.31884765625, 2.4954833984375, 2.672119140625, 2.8487548828125, 3.025390625, 3.2020263671875, 3.378662109375, 3.5552978515625, 3.73193359375, 3.9085693359375, 4.085205078125, 4.2618408203125, 4.4384765625, 4.6151123046875, 4.791748046875, 4.9683837890625, 5.14501953125, 5.3216552734375, 5.498291015625, 5.6749267578125, 5.8515625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 6.0, 4.0, 8.0, 5.0, 15.0, 13.0, 10.0, 18.0, 14.0, 13.0, 17.0, 26.0, 41.0, 20.0, 32.0, 38.0, 35.0, 36.0, 44.0, 44.0, 44.0, 35.0, 53.0, 35.0, 34.0, 29.0, 36.0, 27.0, 32.0, 35.0, 19.0, 27.0, 20.0, 20.0, 17.0, 12.0, 13.0, 13.0, 10.0, 11.0, 9.0, 10.0, 9.0, 5.0, 5.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.9453125, -5.76177978515625, -5.5782470703125, -5.39471435546875, -5.211181640625, -5.02764892578125, -4.8441162109375, -4.66058349609375, -4.47705078125, -4.29351806640625, -4.1099853515625, -3.92645263671875, -3.742919921875, -3.55938720703125, -3.3758544921875, -3.19232177734375, -3.0087890625, -2.82525634765625, -2.6417236328125, -2.45819091796875, -2.274658203125, -2.09112548828125, -1.9075927734375, -1.72406005859375, -1.54052734375, -1.35699462890625, -1.1734619140625, -0.98992919921875, -0.806396484375, -0.62286376953125, -0.4393310546875, -0.25579833984375, -0.072265625, 0.11126708984375, 0.2947998046875, 0.47833251953125, 0.661865234375, 0.84539794921875, 1.0289306640625, 1.21246337890625, 1.39599609375, 1.57952880859375, 1.7630615234375, 1.94659423828125, 2.130126953125, 2.31365966796875, 2.4971923828125, 2.68072509765625, 2.8642578125, 3.04779052734375, 3.2313232421875, 3.41485595703125, 3.598388671875, 3.78192138671875, 3.9654541015625, 4.14898681640625, 4.33251953125, 4.51605224609375, 4.6995849609375, 4.88311767578125, 5.066650390625, 5.25018310546875, 5.4337158203125, 5.61724853515625, 5.80078125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 12.0, 10.0, 19.0, 26.0, 40.0, 64.0, 98.0, 162.0, 287.0, 393.0, 607.0, 1069.0, 1745.0, 2942.0, 4684.0, 7636.0, 12458.0, 19677.0, 30847.0, 46949.0, 67300.0, 89578.0, 111518.0, 124770.0, 124769.0, 111967.0, 90933.0, 67614.0, 46475.0, 31414.0, 20062.0, 12654.0, 7555.0, 4776.0, 2906.0, 1766.0, 1074.0, 638.0, 379.0, 269.0, 150.0, 98.0, 62.0, 38.0, 33.0, 13.0, 11.0, 5.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.322265625, -2.24737548828125, -2.1724853515625, -2.09759521484375, -2.022705078125, -1.94781494140625, -1.8729248046875, -1.79803466796875, -1.72314453125, -1.64825439453125, -1.5733642578125, -1.49847412109375, -1.423583984375, -1.34869384765625, -1.2738037109375, -1.19891357421875, -1.1240234375, -1.04913330078125, -0.9742431640625, -0.89935302734375, -0.824462890625, -0.74957275390625, -0.6746826171875, -0.59979248046875, -0.52490234375, -0.45001220703125, -0.3751220703125, -0.30023193359375, -0.225341796875, -0.15045166015625, -0.0755615234375, -0.00067138671875, 0.07421875, 0.14910888671875, 0.2239990234375, 0.29888916015625, 0.373779296875, 0.44866943359375, 0.5235595703125, 0.59844970703125, 0.67333984375, 0.74822998046875, 0.8231201171875, 0.89801025390625, 0.972900390625, 1.04779052734375, 1.1226806640625, 1.19757080078125, 1.2724609375, 1.34735107421875, 1.4222412109375, 1.49713134765625, 1.572021484375, 1.64691162109375, 1.7218017578125, 1.79669189453125, 1.87158203125, 1.94647216796875, 2.0213623046875, 2.09625244140625, 2.171142578125, 2.24603271484375, 2.3209228515625, 2.39581298828125, 2.470703125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 9.0, 6.0, 6.0, 8.0, 12.0, 27.0, 21.0, 24.0, 29.0, 32.0, 24.0, 34.0, 32.0, 56.0, 53.0, 64.0, 41.0, 59.0, 49.0, 49.0, 55.0, 47.0, 50.0, 39.0, 28.0, 29.0, 26.0, 16.0, 10.0, 20.0, 11.0, 9.0, 3.0, 8.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002574920654296875, -0.0002483353018760681, -0.00023917853832244873, -0.00023002177476882935, -0.00022086501121520996, -0.00021170824766159058, -0.0002025514841079712, -0.0001933947205543518, -0.00018423795700073242, -0.00017508119344711304, -0.00016592442989349365, -0.00015676766633987427, -0.00014761090278625488, -0.0001384541392326355, -0.0001292973756790161, -0.00012014061212539673, -0.00011098384857177734, -0.00010182708501815796, -9.267032146453857e-05, -8.351355791091919e-05, -7.43567943572998e-05, -6.520003080368042e-05, -5.6043267250061035e-05, -4.688650369644165e-05, -3.7729740142822266e-05, -2.857297658920288e-05, -1.9416213035583496e-05, -1.0259449481964111e-05, -1.1026859283447266e-06, 8.054077625274658e-06, 1.7210841178894043e-05, 2.6367604732513428e-05, 3.552436828613281e-05, 4.46811318397522e-05, 5.383789539337158e-05, 6.299465894699097e-05, 7.215142250061035e-05, 8.130818605422974e-05, 9.046494960784912e-05, 9.96217131614685e-05, 0.00010877847671508789, 0.00011793524026870728, 0.00012709200382232666, 0.00013624876737594604, 0.00014540553092956543, 0.00015456229448318481, 0.0001637190580368042, 0.00017287582159042358, 0.00018203258514404297, 0.00019118934869766235, 0.00020034611225128174, 0.00020950287580490112, 0.0002186596393585205, 0.0002278164029121399, 0.00023697316646575928, 0.00024612993001937866, 0.00025528669357299805, 0.00026444345712661743, 0.0002736002206802368, 0.0002827569842338562, 0.0002919137477874756, 0.00030107051134109497, 0.00031022727489471436, 0.00031938403844833374, 0.0003285408020019531]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 5.0, 9.0, 12.0, 17.0, 24.0, 43.0, 56.0, 108.0, 121.0, 194.0, 316.0, 470.0, 732.0, 1134.0, 1702.0, 2613.0, 3898.0, 6017.0, 8942.0, 13391.0, 19847.0, 28486.0, 40472.0, 55163.0, 70768.0, 86797.0, 99823.0, 105935.0, 104007.0, 95337.0, 80170.0, 63915.0, 48213.0, 35034.0, 24659.0, 16590.0, 11308.0, 7537.0, 5076.0, 3336.0, 2169.0, 1412.0, 933.0, 614.0, 403.0, 267.0, 170.0, 107.0, 76.0, 57.0, 20.0, 25.0, 19.0, 9.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.029296875, -1.96337890625, -1.8974609375, -1.83154296875, -1.765625, -1.69970703125, -1.6337890625, -1.56787109375, -1.501953125, -1.43603515625, -1.3701171875, -1.30419921875, -1.23828125, -1.17236328125, -1.1064453125, -1.04052734375, -0.974609375, -0.90869140625, -0.8427734375, -0.77685546875, -0.7109375, -0.64501953125, -0.5791015625, -0.51318359375, -0.447265625, -0.38134765625, -0.3154296875, -0.24951171875, -0.18359375, -0.11767578125, -0.0517578125, 0.01416015625, 0.080078125, 0.14599609375, 0.2119140625, 0.27783203125, 0.34375, 0.40966796875, 0.4755859375, 0.54150390625, 0.607421875, 0.67333984375, 0.7392578125, 0.80517578125, 0.87109375, 0.93701171875, 1.0029296875, 1.06884765625, 1.134765625, 1.20068359375, 1.2666015625, 1.33251953125, 1.3984375, 1.46435546875, 1.5302734375, 1.59619140625, 1.662109375, 1.72802734375, 1.7939453125, 1.85986328125, 1.92578125, 1.99169921875, 2.0576171875, 2.12353515625, 2.189453125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 9.0, 6.0, 10.0, 7.0, 12.0, 19.0, 9.0, 13.0, 22.0, 30.0, 21.0, 27.0, 28.0, 34.0, 48.0, 33.0, 36.0, 38.0, 50.0, 34.0, 49.0, 38.0, 42.0, 35.0, 29.0, 27.0, 33.0, 26.0, 36.0, 37.0, 20.0, 26.0, 16.0, 16.0, 14.0, 13.0, 8.0, 6.0, 7.0, 12.0, 8.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.99169921875, -0.9619293212890625, -0.932159423828125, -0.9023895263671875, -0.87261962890625, -0.8428497314453125, -0.813079833984375, -0.7833099365234375, -0.7535400390625, -0.7237701416015625, -0.694000244140625, -0.6642303466796875, -0.63446044921875, -0.6046905517578125, -0.574920654296875, -0.5451507568359375, -0.515380859375, -0.4856109619140625, -0.455841064453125, -0.4260711669921875, -0.39630126953125, -0.3665313720703125, -0.336761474609375, -0.3069915771484375, -0.2772216796875, -0.2474517822265625, -0.217681884765625, -0.1879119873046875, -0.15814208984375, -0.1283721923828125, -0.098602294921875, -0.0688323974609375, -0.0390625, -0.0092926025390625, 0.020477294921875, 0.0502471923828125, 0.08001708984375, 0.1097869873046875, 0.139556884765625, 0.1693267822265625, 0.1990966796875, 0.2288665771484375, 0.258636474609375, 0.2884063720703125, 0.31817626953125, 0.3479461669921875, 0.377716064453125, 0.4074859619140625, 0.437255859375, 0.4670257568359375, 0.496795654296875, 0.5265655517578125, 0.55633544921875, 0.5861053466796875, 0.615875244140625, 0.6456451416015625, 0.6754150390625, 0.7051849365234375, 0.734954833984375, 0.7647247314453125, 0.79449462890625, 0.8242645263671875, 0.854034423828125, 0.8838043212890625, 0.91357421875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 6.0, 3.0, 5.0, 9.0, 13.0, 10.0, 12.0, 9.0, 18.0, 25.0, 26.0, 38.0, 52.0, 42.0, 51.0, 48.0, 52.0, 52.0, 48.0, 69.0, 59.0, 49.0, 52.0, 42.0, 41.0, 30.0, 35.0, 29.0, 22.0, 14.0, 10.0, 12.0, 6.0, 9.0, 4.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.93912410736084, -13.576814651489258, -13.214505195617676, -12.852195739746094, -12.489886283874512, -12.12757682800293, -11.765267372131348, -11.402957916259766, -11.040648460388184, -10.678339004516602, -10.31602954864502, -9.953720092773438, -9.591410636901855, -9.229101181030273, -8.866791725158691, -8.50448226928711, -8.142172813415527, -7.779863357543945, -7.417553901672363, -7.055244445800781, -6.692934989929199, -6.330625534057617, -5.968316078186035, -5.606006622314453, -5.243697166442871, -4.881387710571289, -4.519078254699707, -4.156768798828125, -3.794459342956543, -3.432149887084961, -3.069840431213379, -2.707530975341797, -2.3452205657958984, -1.9829111099243164, -1.6206016540527344, -1.2582921981811523, -0.8959827423095703, -0.5336732864379883, -0.17136383056640625, 0.19094562530517578, 0.5532550811767578, 0.9155645370483398, 1.2778739929199219, 1.640183448791504, 2.002492904663086, 2.364802360534668, 2.72711181640625, 3.089421272277832, 3.451730728149414, 3.814040184020996, 4.176349639892578, 4.53865909576416, 4.900968551635742, 5.263278007507324, 5.625587463378906, 5.987896919250488, 6.35020637512207, 6.712515830993652, 7.074825286865234, 7.437134742736816, 7.799444198608398, 8.16175365447998, 8.524063110351562, 8.886372566223145, 9.248682022094727]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 3.0, 0.0, 1.0, 6.0, 5.0, 9.0, 6.0, 9.0, 9.0, 10.0, 21.0, 18.0, 22.0, 22.0, 17.0, 32.0, 27.0, 33.0, 30.0, 43.0, 41.0, 38.0, 32.0, 50.0, 56.0, 51.0, 46.0, 32.0, 41.0, 41.0, 37.0, 33.0, 31.0, 25.0, 16.0, 23.0, 19.0, 17.0, 14.0, 9.0, 10.0, 6.0, 3.0, 4.0, 4.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.019362449645996, -8.685686111450195, -8.352008819580078, -8.018332481384277, -7.684655666351318, -7.350978851318359, -7.0173020362854, -6.683625221252441, -6.349948883056641, -6.016272068023682, -5.682595252990723, -5.348918914794922, -5.015242099761963, -4.681565284729004, -4.347888469696045, -4.014211654663086, -3.680534839630127, -3.346858024597168, -3.013181447982788, -2.679504632949829, -2.345828056335449, -2.0121512413024902, -1.6784744262695312, -1.3447978496551514, -1.0111210346221924, -0.677444338798523, -0.34376758337020874, -0.010090827941894531, 0.3235858678817749, 0.6572625637054443, 0.9909393787384033, 1.3246159553527832, 1.6582927703857422, 1.9919694662094116, 2.325646162033081, 2.65932297706604, 2.99299955368042, 3.326676368713379, 3.660353183746338, 3.9940297603607178, 4.327706336975098, 4.661383152008057, 4.995059967041016, 5.328736305236816, 5.662413120269775, 5.996089935302734, 6.329766750335693, 6.663443565368652, 6.997120380401611, 7.33079719543457, 7.664474010467529, 7.998150825500488, 8.331827163696289, 8.665504455566406, 8.999180793762207, 9.332857131958008, 9.666534423828125, 10.000210762023926, 10.333888053894043, 10.667564392089844, 11.001241683959961, 11.334918022155762, 11.668594360351562, 12.00227165222168, 12.33594799041748]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 21.0, 13.0, 13.0, 25.0, 42.0, 66.0, 104.0, 171.0, 259.0, 391.0, 727.0, 1071.0, 1822.0, 2915.0, 4716.0, 8300.0, 14038.0, 24339.0, 44085.0, 80100.0, 149873.0, 273257.0, 463075.0, 661445.0, 749556.0, 655513.0, 454451.0, 268059.0, 147508.0, 80671.0, 44797.0, 25647.0, 14879.0, 8704.0, 5149.0, 3206.0, 1952.0, 1269.0, 750.0, 460.0, 323.0, 189.0, 120.0, 66.0, 48.0, 37.0, 18.0, 10.0, 9.0, 11.0, 6.0, 1.0, 3.0, 2.0], "bins": [-8.9375, -8.67840576171875, -8.4193115234375, -8.16021728515625, -7.901123046875, -7.64202880859375, -7.3829345703125, -7.12384033203125, -6.86474609375, -6.60565185546875, -6.3465576171875, -6.08746337890625, -5.828369140625, -5.56927490234375, -5.3101806640625, -5.05108642578125, -4.7919921875, -4.53289794921875, -4.2738037109375, -4.01470947265625, -3.755615234375, -3.49652099609375, -3.2374267578125, -2.97833251953125, -2.71923828125, -2.46014404296875, -2.2010498046875, -1.94195556640625, -1.682861328125, -1.42376708984375, -1.1646728515625, -0.90557861328125, -0.646484375, -0.38739013671875, -0.1282958984375, 0.13079833984375, 0.389892578125, 0.64898681640625, 0.9080810546875, 1.16717529296875, 1.42626953125, 1.68536376953125, 1.9444580078125, 2.20355224609375, 2.462646484375, 2.72174072265625, 2.9808349609375, 3.23992919921875, 3.4990234375, 3.75811767578125, 4.0172119140625, 4.27630615234375, 4.535400390625, 4.79449462890625, 5.0535888671875, 5.31268310546875, 5.57177734375, 5.83087158203125, 6.0899658203125, 6.34906005859375, 6.608154296875, 6.86724853515625, 7.1263427734375, 7.38543701171875, 7.64453125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 6.0, 3.0, 4.0, 5.0, 9.0, 6.0, 8.0, 10.0, 16.0, 16.0, 15.0, 26.0, 23.0, 25.0, 19.0, 28.0, 42.0, 44.0, 30.0, 50.0, 39.0, 43.0, 57.0, 41.0, 54.0, 39.0, 40.0, 45.0, 41.0, 26.0, 25.0, 38.0, 18.0, 22.0, 17.0, 24.0, 11.0, 11.0, 4.0, 10.0, 1.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.0546875, -8.75634765625, -8.4580078125, -8.15966796875, -7.861328125, -7.56298828125, -7.2646484375, -6.96630859375, -6.66796875, -6.36962890625, -6.0712890625, -5.77294921875, -5.474609375, -5.17626953125, -4.8779296875, -4.57958984375, -4.28125, -3.98291015625, -3.6845703125, -3.38623046875, -3.087890625, -2.78955078125, -2.4912109375, -2.19287109375, -1.89453125, -1.59619140625, -1.2978515625, -0.99951171875, -0.701171875, -0.40283203125, -0.1044921875, 0.19384765625, 0.4921875, 0.79052734375, 1.0888671875, 1.38720703125, 1.685546875, 1.98388671875, 2.2822265625, 2.58056640625, 2.87890625, 3.17724609375, 3.4755859375, 3.77392578125, 4.072265625, 4.37060546875, 4.6689453125, 4.96728515625, 5.265625, 5.56396484375, 5.8623046875, 6.16064453125, 6.458984375, 6.75732421875, 7.0556640625, 7.35400390625, 7.65234375, 7.95068359375, 8.2490234375, 8.54736328125, 8.845703125, 9.14404296875, 9.4423828125, 9.74072265625, 10.0390625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 8.0, 12.0, 27.0, 36.0, 58.0, 100.0, 145.0, 259.0, 418.0, 636.0, 1132.0, 1785.0, 3008.0, 5171.0, 8430.0, 14664.0, 24583.0, 41808.0, 70937.0, 120120.0, 199059.0, 316739.0, 469944.0, 613059.0, 654800.0, 565696.0, 409816.0, 267652.0, 164099.0, 97627.0, 57973.0, 34771.0, 20055.0, 12068.0, 7064.0, 4258.0, 2525.0, 1522.0, 881.0, 553.0, 303.0, 188.0, 109.0, 66.0, 42.0, 29.0, 18.0, 19.0, 6.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-8.546875, -8.264892578125, -7.98291015625, -7.700927734375, -7.4189453125, -7.136962890625, -6.85498046875, -6.572998046875, -6.291015625, -6.009033203125, -5.72705078125, -5.445068359375, -5.1630859375, -4.881103515625, -4.59912109375, -4.317138671875, -4.03515625, -3.753173828125, -3.47119140625, -3.189208984375, -2.9072265625, -2.625244140625, -2.34326171875, -2.061279296875, -1.779296875, -1.497314453125, -1.21533203125, -0.933349609375, -0.6513671875, -0.369384765625, -0.08740234375, 0.194580078125, 0.4765625, 0.758544921875, 1.04052734375, 1.322509765625, 1.6044921875, 1.886474609375, 2.16845703125, 2.450439453125, 2.732421875, 3.014404296875, 3.29638671875, 3.578369140625, 3.8603515625, 4.142333984375, 4.42431640625, 4.706298828125, 4.98828125, 5.270263671875, 5.55224609375, 5.834228515625, 6.1162109375, 6.398193359375, 6.68017578125, 6.962158203125, 7.244140625, 7.526123046875, 7.80810546875, 8.090087890625, 8.3720703125, 8.654052734375, 8.93603515625, 9.218017578125, 9.5]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 7.0, 5.0, 8.0, 8.0, 11.0, 17.0, 14.0, 22.0, 34.0, 25.0, 40.0, 43.0, 59.0, 62.0, 76.0, 89.0, 107.0, 130.0, 147.0, 142.0, 149.0, 154.0, 181.0, 201.0, 188.0, 202.0, 172.0, 211.0, 173.0, 180.0, 154.0, 156.0, 117.0, 119.0, 117.0, 101.0, 82.0, 61.0, 59.0, 52.0, 38.0, 30.0, 39.0, 19.0, 25.0, 14.0, 6.0, 11.0, 2.0, 5.0, 4.0, 7.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-3.35546875, -3.252532958984375, -3.14959716796875, -3.046661376953125, -2.9437255859375, -2.840789794921875, -2.73785400390625, -2.634918212890625, -2.531982421875, -2.429046630859375, -2.32611083984375, -2.223175048828125, -2.1202392578125, -2.017303466796875, -1.91436767578125, -1.811431884765625, -1.70849609375, -1.605560302734375, -1.50262451171875, -1.399688720703125, -1.2967529296875, -1.193817138671875, -1.09088134765625, -0.987945556640625, -0.885009765625, -0.782073974609375, -0.67913818359375, -0.576202392578125, -0.4732666015625, -0.370330810546875, -0.26739501953125, -0.164459228515625, -0.0615234375, 0.041412353515625, 0.14434814453125, 0.247283935546875, 0.3502197265625, 0.453155517578125, 0.55609130859375, 0.659027099609375, 0.761962890625, 0.864898681640625, 0.96783447265625, 1.070770263671875, 1.1737060546875, 1.276641845703125, 1.37957763671875, 1.482513427734375, 1.58544921875, 1.688385009765625, 1.79132080078125, 1.894256591796875, 1.9971923828125, 2.100128173828125, 2.20306396484375, 2.305999755859375, 2.408935546875, 2.511871337890625, 2.61480712890625, 2.717742919921875, 2.8206787109375, 2.923614501953125, 3.02655029296875, 3.129486083984375, 3.232421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 6.0, 2.0, 9.0, 6.0, 9.0, 7.0, 12.0, 15.0, 12.0, 25.0, 26.0, 27.0, 31.0, 37.0, 44.0, 35.0, 48.0, 49.0, 48.0, 45.0, 64.0, 39.0, 46.0, 38.0, 45.0, 34.0, 38.0, 31.0, 29.0, 24.0, 26.0, 11.0, 19.0, 20.0, 7.0, 9.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.034927368164062, -9.720091819763184, -9.405256271362305, -9.090420722961426, -8.775585174560547, -8.460749626159668, -8.145914077758789, -7.83107852935791, -7.516242980957031, -7.201407432556152, -6.886571884155273, -6.5717363357543945, -6.256900787353516, -5.942065238952637, -5.627229690551758, -5.312394142150879, -4.997559070587158, -4.682723522186279, -4.3678879737854, -4.0530524253845215, -3.7382168769836426, -3.4233813285827637, -3.108546018600464, -2.793710470199585, -2.478874921798706, -2.164039373397827, -1.8492038249969482, -1.5343683958053589, -1.21953284740448, -0.9046972990036011, -0.5898618698120117, -0.2750263214111328, 0.039809226989746094, 0.3546447455883026, 0.6694802641868591, 0.9843157529830933, 1.2991513013839722, 1.613986849784851, 1.9288222789764404, 2.2436578273773193, 2.5584933757781982, 2.873328924179077, 3.188164472579956, 3.502999782562256, 3.8178353309631348, 4.132670879364014, 4.447506427764893, 4.7623419761657715, 5.07717752456665, 5.392013072967529, 5.706848621368408, 6.021684169769287, 6.336519718170166, 6.651355266571045, 6.966190338134766, 7.2810258865356445, 7.595861434936523, 7.910696983337402, 8.225532531738281, 8.54036808013916, 8.855203628540039, 9.170039176940918, 9.484874725341797, 9.799710273742676, 10.114545822143555]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 7.0, 5.0, 6.0, 8.0, 13.0, 9.0, 12.0, 22.0, 14.0, 19.0, 31.0, 17.0, 30.0, 28.0, 33.0, 38.0, 38.0, 44.0, 39.0, 40.0, 50.0, 38.0, 41.0, 42.0, 35.0, 37.0, 35.0, 31.0, 39.0, 31.0, 20.0, 21.0, 19.0, 18.0, 17.0, 15.0, 11.0, 10.0, 6.0, 5.0, 4.0, 4.0, 2.0, 3.0, 6.0, 2.0, 0.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0], "bins": [-9.960723876953125, -9.648113250732422, -9.335502624511719, -9.022891998291016, -8.710280418395996, -8.397669792175293, -8.08505916595459, -7.772448539733887, -7.459837913513184, -7.1472272872924805, -6.834616184234619, -6.522005558013916, -6.209394931793213, -5.896783828735352, -5.584173202514648, -5.271562576293945, -4.958951473236084, -4.646340847015381, -4.3337297439575195, -4.021119117736816, -3.7085084915161133, -3.395897626876831, -3.083286762237549, -2.7706761360168457, -2.4580652713775635, -2.1454544067382812, -1.8328437805175781, -1.520232915878296, -1.2076221704483032, -0.8950114250183105, -0.5824005603790283, -0.2697899341583252, 0.04282093048095703, 0.3554317057132721, 0.6680424809455872, 0.9806532859802246, 1.2932640314102173, 1.60587477684021, 1.9184856414794922, 2.2310962677001953, 2.5437071323394775, 2.8563179969787598, 3.168928623199463, 3.481539487838745, 3.7941503524780273, 4.1067609786987305, 4.419371604919434, 4.731982231140137, 5.044593334197998, 5.357203960418701, 5.6698150634765625, 5.982425689697266, 6.295036315917969, 6.607646942138672, 6.920258045196533, 7.232868671417236, 7.545479774475098, 7.858090400695801, 8.170701026916504, 8.483312606811523, 8.795923233032227, 9.10853385925293, 9.421144485473633, 9.733755111694336, 10.046365737915039]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 9.0, 9.0, 20.0, 21.0, 28.0, 49.0, 51.0, 62.0, 111.0, 167.0, 222.0, 344.0, 478.0, 740.0, 1146.0, 1742.0, 2794.0, 4569.0, 7806.0, 12957.0, 21828.0, 36344.0, 58810.0, 88996.0, 122964.0, 147611.0, 149836.0, 128263.0, 95162.0, 64131.0, 40029.0, 24401.0, 14190.0, 8703.0, 5112.0, 3182.0, 1895.0, 1266.0, 788.0, 553.0, 371.0, 223.0, 175.0, 125.0, 74.0, 70.0, 44.0, 29.0, 15.0, 14.0, 12.0, 6.0, 8.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.8515625, -5.66339111328125, -5.4752197265625, -5.28704833984375, -5.098876953125, -4.91070556640625, -4.7225341796875, -4.53436279296875, -4.34619140625, -4.15802001953125, -3.9698486328125, -3.78167724609375, -3.593505859375, -3.40533447265625, -3.2171630859375, -3.02899169921875, -2.8408203125, -2.65264892578125, -2.4644775390625, -2.27630615234375, -2.088134765625, -1.89996337890625, -1.7117919921875, -1.52362060546875, -1.33544921875, -1.14727783203125, -0.9591064453125, -0.77093505859375, -0.582763671875, -0.39459228515625, -0.2064208984375, -0.01824951171875, 0.169921875, 0.35809326171875, 0.5462646484375, 0.73443603515625, 0.922607421875, 1.11077880859375, 1.2989501953125, 1.48712158203125, 1.67529296875, 1.86346435546875, 2.0516357421875, 2.23980712890625, 2.427978515625, 2.61614990234375, 2.8043212890625, 2.99249267578125, 3.1806640625, 3.36883544921875, 3.5570068359375, 3.74517822265625, 3.933349609375, 4.12152099609375, 4.3096923828125, 4.49786376953125, 4.68603515625, 4.87420654296875, 5.0623779296875, 5.25054931640625, 5.438720703125, 5.62689208984375, 5.8150634765625, 6.00323486328125, 6.19140625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 2.0, 3.0, 5.0, 9.0, 7.0, 16.0, 13.0, 9.0, 11.0, 15.0, 15.0, 24.0, 21.0, 26.0, 34.0, 29.0, 35.0, 43.0, 39.0, 38.0, 45.0, 33.0, 43.0, 43.0, 48.0, 35.0, 37.0, 39.0, 33.0, 20.0, 32.0, 26.0, 25.0, 24.0, 12.0, 16.0, 14.0, 13.0, 17.0, 9.0, 10.0, 2.0, 1.0, 10.0, 5.0, 2.0, 5.0, 0.0, 1.0, 0.0, 5.0, 0.0, 4.0, 2.0, 1.0], "bins": [-9.78125, -9.4715576171875, -9.161865234375, -8.8521728515625, -8.54248046875, -8.2327880859375, -7.923095703125, -7.6134033203125, -7.3037109375, -6.9940185546875, -6.684326171875, -6.3746337890625, -6.06494140625, -5.7552490234375, -5.445556640625, -5.1358642578125, -4.826171875, -4.5164794921875, -4.206787109375, -3.8970947265625, -3.58740234375, -3.2777099609375, -2.968017578125, -2.6583251953125, -2.3486328125, -2.0389404296875, -1.729248046875, -1.4195556640625, -1.10986328125, -0.8001708984375, -0.490478515625, -0.1807861328125, 0.12890625, 0.4385986328125, 0.748291015625, 1.0579833984375, 1.36767578125, 1.6773681640625, 1.987060546875, 2.2967529296875, 2.6064453125, 2.9161376953125, 3.225830078125, 3.5355224609375, 3.84521484375, 4.1549072265625, 4.464599609375, 4.7742919921875, 5.083984375, 5.3936767578125, 5.703369140625, 6.0130615234375, 6.32275390625, 6.6324462890625, 6.942138671875, 7.2518310546875, 7.5615234375, 7.8712158203125, 8.180908203125, 8.4906005859375, 8.80029296875, 9.1099853515625, 9.419677734375, 9.7293701171875, 10.0390625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 5.0, 12.0, 6.0, 5.0, 20.0, 16.0, 29.0, 44.0, 51.0, 78.0, 121.0, 186.0, 238.0, 382.0, 619.0, 1007.0, 1714.0, 2760.0, 5058.0, 9043.0, 17133.0, 32658.0, 61529.0, 111495.0, 179056.0, 212293.0, 175111.0, 109436.0, 59455.0, 31219.0, 16551.0, 8994.0, 5062.0, 2786.0, 1680.0, 954.0, 648.0, 344.0, 213.0, 157.0, 106.0, 82.0, 56.0, 46.0, 30.0, 18.0, 13.0, 11.0, 12.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 5.0], "bins": [-9.921875, -9.6163330078125, -9.310791015625, -9.0052490234375, -8.69970703125, -8.3941650390625, -8.088623046875, -7.7830810546875, -7.4775390625, -7.1719970703125, -6.866455078125, -6.5609130859375, -6.25537109375, -5.9498291015625, -5.644287109375, -5.3387451171875, -5.033203125, -4.7276611328125, -4.422119140625, -4.1165771484375, -3.81103515625, -3.5054931640625, -3.199951171875, -2.8944091796875, -2.5888671875, -2.2833251953125, -1.977783203125, -1.6722412109375, -1.36669921875, -1.0611572265625, -0.755615234375, -0.4500732421875, -0.14453125, 0.1610107421875, 0.466552734375, 0.7720947265625, 1.07763671875, 1.3831787109375, 1.688720703125, 1.9942626953125, 2.2998046875, 2.6053466796875, 2.910888671875, 3.2164306640625, 3.52197265625, 3.8275146484375, 4.133056640625, 4.4385986328125, 4.744140625, 5.0496826171875, 5.355224609375, 5.6607666015625, 5.96630859375, 6.2718505859375, 6.577392578125, 6.8829345703125, 7.1884765625, 7.4940185546875, 7.799560546875, 8.1051025390625, 8.41064453125, 8.7161865234375, 9.021728515625, 9.3272705078125, 9.6328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 5.0, 5.0, 7.0, 8.0, 10.0, 15.0, 17.0, 17.0, 14.0, 25.0, 25.0, 22.0, 26.0, 23.0, 30.0, 30.0, 29.0, 32.0, 49.0, 36.0, 39.0, 47.0, 50.0, 43.0, 30.0, 37.0, 37.0, 32.0, 33.0, 38.0, 17.0, 31.0, 25.0, 24.0, 17.0, 11.0, 10.0, 8.0, 7.0, 10.0, 9.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.58203125, -5.38409423828125, -5.1861572265625, -4.98822021484375, -4.790283203125, -4.59234619140625, -4.3944091796875, -4.19647216796875, -3.99853515625, -3.80059814453125, -3.6026611328125, -3.40472412109375, -3.206787109375, -3.00885009765625, -2.8109130859375, -2.61297607421875, -2.4150390625, -2.21710205078125, -2.0191650390625, -1.82122802734375, -1.623291015625, -1.42535400390625, -1.2274169921875, -1.02947998046875, -0.83154296875, -0.63360595703125, -0.4356689453125, -0.23773193359375, -0.039794921875, 0.15814208984375, 0.3560791015625, 0.55401611328125, 0.751953125, 0.94989013671875, 1.1478271484375, 1.34576416015625, 1.543701171875, 1.74163818359375, 1.9395751953125, 2.13751220703125, 2.33544921875, 2.53338623046875, 2.7313232421875, 2.92926025390625, 3.127197265625, 3.32513427734375, 3.5230712890625, 3.72100830078125, 3.9189453125, 4.11688232421875, 4.3148193359375, 4.51275634765625, 4.710693359375, 4.90863037109375, 5.1065673828125, 5.30450439453125, 5.50244140625, 5.70037841796875, 5.8983154296875, 6.09625244140625, 6.294189453125, 6.49212646484375, 6.6900634765625, 6.88800048828125, 7.0859375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 6.0, 13.0, 15.0, 23.0, 45.0, 60.0, 98.0, 146.0, 227.0, 340.0, 572.0, 1033.0, 1674.0, 2809.0, 4918.0, 8272.0, 14858.0, 25181.0, 43862.0, 72756.0, 113568.0, 156527.0, 175079.0, 151935.0, 108693.0, 68492.0, 40879.0, 23713.0, 13762.0, 7894.0, 4569.0, 2591.0, 1517.0, 898.0, 596.0, 320.0, 222.0, 161.0, 98.0, 52.0, 31.0, 18.0, 12.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0], "bins": [-3.525390625, -3.416717529296875, -3.30804443359375, -3.199371337890625, -3.0906982421875, -2.982025146484375, -2.87335205078125, -2.764678955078125, -2.656005859375, -2.547332763671875, -2.43865966796875, -2.329986572265625, -2.2213134765625, -2.112640380859375, -2.00396728515625, -1.895294189453125, -1.78662109375, -1.677947998046875, -1.56927490234375, -1.460601806640625, -1.3519287109375, -1.243255615234375, -1.13458251953125, -1.025909423828125, -0.917236328125, -0.808563232421875, -0.69989013671875, -0.591217041015625, -0.4825439453125, -0.373870849609375, -0.26519775390625, -0.156524658203125, -0.0478515625, 0.060821533203125, 0.16949462890625, 0.278167724609375, 0.3868408203125, 0.495513916015625, 0.60418701171875, 0.712860107421875, 0.821533203125, 0.930206298828125, 1.03887939453125, 1.147552490234375, 1.2562255859375, 1.364898681640625, 1.47357177734375, 1.582244873046875, 1.69091796875, 1.799591064453125, 1.90826416015625, 2.016937255859375, 2.1256103515625, 2.234283447265625, 2.34295654296875, 2.451629638671875, 2.560302734375, 2.668975830078125, 2.77764892578125, 2.886322021484375, 2.9949951171875, 3.103668212890625, 3.21234130859375, 3.321014404296875, 3.4296875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 4.0, 1.0, 10.0, 16.0, 19.0, 16.0, 10.0, 21.0, 23.0, 34.0, 32.0, 55.0, 53.0, 46.0, 64.0, 35.0, 63.0, 55.0, 60.0, 44.0, 40.0, 40.0, 45.0, 32.0, 39.0, 24.0, 26.0, 15.0, 17.0, 17.0, 13.0, 6.0, 5.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020647048950195312, -0.0002001747488975525, -0.00019387900829315186, -0.00018758326768875122, -0.00018128752708435059, -0.00017499178647994995, -0.00016869604587554932, -0.00016240030527114868, -0.00015610456466674805, -0.0001498088240623474, -0.00014351308345794678, -0.00013721734285354614, -0.0001309216022491455, -0.00012462586164474487, -0.00011833012104034424, -0.0001120343804359436, -0.00010573863983154297, -9.944289922714233e-05, -9.31471586227417e-05, -8.685141801834106e-05, -8.055567741394043e-05, -7.42599368095398e-05, -6.796419620513916e-05, -6.166845560073853e-05, -5.537271499633789e-05, -4.9076974391937256e-05, -4.278123378753662e-05, -3.6485493183135986e-05, -3.018975257873535e-05, -2.3894011974334717e-05, -1.7598271369934082e-05, -1.1302530765533447e-05, -5.0067901611328125e-06, 1.2889504432678223e-06, 7.584691047668457e-06, 1.3880431652069092e-05, 2.0176172256469727e-05, 2.647191286087036e-05, 3.2767653465270996e-05, 3.906339406967163e-05, 4.5359134674072266e-05, 5.16548752784729e-05, 5.7950615882873535e-05, 6.424635648727417e-05, 7.05420970916748e-05, 7.683783769607544e-05, 8.313357830047607e-05, 8.942931890487671e-05, 9.572505950927734e-05, 0.00010202080011367798, 0.00010831654071807861, 0.00011461228132247925, 0.00012090802192687988, 0.00012720376253128052, 0.00013349950313568115, 0.0001397952437400818, 0.00014609098434448242, 0.00015238672494888306, 0.0001586824655532837, 0.00016497820615768433, 0.00017127394676208496, 0.0001775696873664856, 0.00018386542797088623, 0.00019016116857528687, 0.0001964569091796875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 9.0, 9.0, 7.0, 20.0, 22.0, 36.0, 60.0, 87.0, 145.0, 191.0, 309.0, 548.0, 793.0, 1259.0, 1922.0, 3165.0, 5172.0, 8117.0, 13048.0, 20951.0, 32959.0, 49974.0, 72438.0, 99171.0, 123471.0, 135347.0, 129035.0, 108053.0, 81353.0, 56952.0, 38130.0, 24328.0, 15617.0, 9886.0, 5885.0, 3717.0, 2263.0, 1454.0, 950.0, 613.0, 417.0, 248.0, 156.0, 90.0, 67.0, 32.0, 29.0, 22.0, 8.0, 10.0, 5.0, 5.0, 6.0, 3.0, 1.0, 0.0, 3.0], "bins": [-3.46484375, -3.358795166015625, -3.25274658203125, -3.146697998046875, -3.0406494140625, -2.934600830078125, -2.82855224609375, -2.722503662109375, -2.616455078125, -2.510406494140625, -2.40435791015625, -2.298309326171875, -2.1922607421875, -2.086212158203125, -1.98016357421875, -1.874114990234375, -1.76806640625, -1.662017822265625, -1.55596923828125, -1.449920654296875, -1.3438720703125, -1.237823486328125, -1.13177490234375, -1.025726318359375, -0.919677734375, -0.813629150390625, -0.70758056640625, -0.601531982421875, -0.4954833984375, -0.389434814453125, -0.28338623046875, -0.177337646484375, -0.0712890625, 0.034759521484375, 0.14080810546875, 0.246856689453125, 0.3529052734375, 0.458953857421875, 0.56500244140625, 0.671051025390625, 0.777099609375, 0.883148193359375, 0.98919677734375, 1.095245361328125, 1.2012939453125, 1.307342529296875, 1.41339111328125, 1.519439697265625, 1.62548828125, 1.731536865234375, 1.83758544921875, 1.943634033203125, 2.0496826171875, 2.155731201171875, 2.26177978515625, 2.367828369140625, 2.473876953125, 2.579925537109375, 2.68597412109375, 2.792022705078125, 2.8980712890625, 3.004119873046875, 3.11016845703125, 3.216217041015625, 3.322265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 8.0, 4.0, 5.0, 6.0, 9.0, 6.0, 27.0, 16.0, 10.0, 28.0, 23.0, 28.0, 28.0, 30.0, 36.0, 36.0, 44.0, 55.0, 56.0, 65.0, 41.0, 45.0, 59.0, 41.0, 32.0, 38.0, 44.0, 38.0, 19.0, 31.0, 23.0, 14.0, 10.0, 9.0, 6.0, 9.0, 9.0, 4.0, 4.0, 5.0, 1.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5947265625, -1.546905517578125, -1.49908447265625, -1.451263427734375, -1.4034423828125, -1.355621337890625, -1.30780029296875, -1.259979248046875, -1.212158203125, -1.164337158203125, -1.11651611328125, -1.068695068359375, -1.0208740234375, -0.973052978515625, -0.92523193359375, -0.877410888671875, -0.82958984375, -0.781768798828125, -0.73394775390625, -0.686126708984375, -0.6383056640625, -0.590484619140625, -0.54266357421875, -0.494842529296875, -0.447021484375, -0.399200439453125, -0.35137939453125, -0.303558349609375, -0.2557373046875, -0.207916259765625, -0.16009521484375, -0.112274169921875, -0.064453125, -0.016632080078125, 0.03118896484375, 0.079010009765625, 0.1268310546875, 0.174652099609375, 0.22247314453125, 0.270294189453125, 0.318115234375, 0.365936279296875, 0.41375732421875, 0.461578369140625, 0.5093994140625, 0.557220458984375, 0.60504150390625, 0.652862548828125, 0.70068359375, 0.748504638671875, 0.79632568359375, 0.844146728515625, 0.8919677734375, 0.939788818359375, 0.98760986328125, 1.035430908203125, 1.083251953125, 1.131072998046875, 1.17889404296875, 1.226715087890625, 1.2745361328125, 1.322357177734375, 1.37017822265625, 1.417999267578125, 1.4658203125]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 7.0, 4.0, 6.0, 4.0, 7.0, 5.0, 10.0, 8.0, 13.0, 10.0, 20.0, 23.0, 37.0, 22.0, 32.0, 39.0, 36.0, 40.0, 41.0, 45.0, 43.0, 42.0, 51.0, 46.0, 38.0, 43.0, 40.0, 36.0, 35.0, 27.0, 35.0, 24.0, 27.0, 11.0, 20.0, 19.0, 14.0, 7.0, 8.0, 6.0, 3.0, 2.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-8.912544250488281, -8.624547958374023, -8.336551666259766, -8.048555374145508, -7.76055908203125, -7.472562789916992, -7.184566974639893, -6.896570682525635, -6.608574390411377, -6.320578098297119, -6.032581806182861, -5.7445855140686035, -5.456589698791504, -5.168593406677246, -4.880597114562988, -4.5926008224487305, -4.304604530334473, -4.016608238220215, -3.728611946105957, -3.4406158924102783, -3.1526196002960205, -2.8646233081817627, -2.576627254486084, -2.288630962371826, -2.0006346702575684, -1.7126383781433105, -1.4246422052383423, -1.136646032333374, -0.8486497402191162, -0.5606534481048584, -0.27265727519989014, 0.015338897705078125, 0.30333518981933594, 0.591331422328949, 0.879327654838562, 1.1673238277435303, 1.455320119857788, 1.743316411972046, 2.0313124656677246, 2.3193087577819824, 2.6073050498962402, 2.895301342010498, 3.183297634124756, 3.4712936878204346, 3.7592899799346924, 4.047286033630371, 4.335282325744629, 4.623278617858887, 4.9112749099731445, 5.199271202087402, 5.48726749420166, 5.775263786315918, 6.063260078430176, 6.351256370544434, 6.639252185821533, 6.927248477935791, 7.215244770050049, 7.503241062164307, 7.7912373542785645, 8.079233169555664, 8.367229461669922, 8.65522575378418, 8.943222045898438, 9.231218338012695, 9.519214630126953]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 8.0, 4.0, 5.0, 8.0, 11.0, 12.0, 11.0, 16.0, 15.0, 12.0, 16.0, 21.0, 31.0, 34.0, 27.0, 27.0, 26.0, 45.0, 45.0, 37.0, 45.0, 49.0, 34.0, 47.0, 36.0, 35.0, 36.0, 35.0, 32.0, 32.0, 28.0, 26.0, 19.0, 20.0, 22.0, 18.0, 12.0, 15.0, 8.0, 7.0, 5.0, 6.0, 3.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 4.0, 3.0, 0.0, 0.0, 2.0], "bins": [-9.609414100646973, -9.308955192565918, -9.008496284484863, -8.708036422729492, -8.407577514648438, -8.107118606567383, -7.806659698486328, -7.506200313568115, -7.205740928649902, -6.905282020568848, -6.604822635650635, -6.30436372756958, -6.003904342651367, -5.7034454345703125, -5.402986526489258, -5.102527141571045, -4.80206823348999, -4.5016093254089355, -4.201149940490723, -3.900691032409668, -3.600231647491455, -3.2997727394104004, -2.9993135929107666, -2.698854446411133, -2.398395299911499, -2.0979361534118652, -1.7974770069122314, -1.4970179796218872, -1.1965588331222534, -0.8960996866226196, -0.5956406593322754, -0.2951815128326416, 0.0052776336669921875, 0.3057367503643036, 0.606195867061615, 0.906654953956604, 1.2071141004562378, 1.5075732469558716, 1.8080322742462158, 2.1084914207458496, 2.4089505672454834, 2.709409713745117, 3.009868860244751, 3.3103280067443848, 3.6107869148254395, 3.9112462997436523, 4.211705207824707, 4.512164115905762, 4.812623500823975, 5.113082408905029, 5.413541793823242, 5.714000701904297, 6.01446008682251, 6.3149189949035645, 6.615378379821777, 6.915837287902832, 7.216296195983887, 7.516755104064941, 7.817214488983154, 8.117673873901367, 8.418132781982422, 8.718591690063477, 9.019050598144531, 9.319509506225586, 9.619969367980957]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 7.0, 11.0, 15.0, 13.0, 44.0, 59.0, 87.0, 110.0, 179.0, 339.0, 502.0, 733.0, 1113.0, 1673.0, 2590.0, 4006.0, 5864.0, 8880.0, 12954.0, 18686.0, 26661.0, 36980.0, 49272.0, 63524.0, 78656.0, 91103.0, 99750.0, 100116.0, 95174.0, 84091.0, 69857.0, 55550.0, 41760.0, 30764.0, 21559.0, 15097.0, 10376.0, 6929.0, 4614.0, 3018.0, 2084.0, 1326.0, 854.0, 568.0, 357.0, 241.0, 139.0, 104.0, 72.0, 40.0, 24.0, 16.0, 16.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-4.984375, -4.82464599609375, -4.6649169921875, -4.50518798828125, -4.345458984375, -4.18572998046875, -4.0260009765625, -3.86627197265625, -3.70654296875, -3.54681396484375, -3.3870849609375, -3.22735595703125, -3.067626953125, -2.90789794921875, -2.7481689453125, -2.58843994140625, -2.4287109375, -2.26898193359375, -2.1092529296875, -1.94952392578125, -1.789794921875, -1.63006591796875, -1.4703369140625, -1.31060791015625, -1.15087890625, -0.99114990234375, -0.8314208984375, -0.67169189453125, -0.511962890625, -0.35223388671875, -0.1925048828125, -0.03277587890625, 0.126953125, 0.28668212890625, 0.4464111328125, 0.60614013671875, 0.765869140625, 0.92559814453125, 1.0853271484375, 1.24505615234375, 1.40478515625, 1.56451416015625, 1.7242431640625, 1.88397216796875, 2.043701171875, 2.20343017578125, 2.3631591796875, 2.52288818359375, 2.6826171875, 2.84234619140625, 3.0020751953125, 3.16180419921875, 3.321533203125, 3.48126220703125, 3.6409912109375, 3.80072021484375, 3.96044921875, 4.12017822265625, 4.2799072265625, 4.43963623046875, 4.599365234375, 4.75909423828125, 4.9188232421875, 5.07855224609375, 5.23828125]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 7.0, 7.0, 2.0, 4.0, 7.0, 11.0, 9.0, 13.0, 18.0, 14.0, 15.0, 16.0, 27.0, 24.0, 31.0, 33.0, 35.0, 30.0, 31.0, 32.0, 47.0, 30.0, 39.0, 41.0, 45.0, 48.0, 27.0, 32.0, 32.0, 40.0, 36.0, 26.0, 20.0, 23.0, 22.0, 18.0, 19.0, 13.0, 13.0, 13.0, 9.0, 10.0, 4.0, 1.0, 6.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 0.0, 1.0], "bins": [-9.2109375, -8.9163818359375, -8.621826171875, -8.3272705078125, -8.03271484375, -7.7381591796875, -7.443603515625, -7.1490478515625, -6.8544921875, -6.5599365234375, -6.265380859375, -5.9708251953125, -5.67626953125, -5.3817138671875, -5.087158203125, -4.7926025390625, -4.498046875, -4.2034912109375, -3.908935546875, -3.6143798828125, -3.31982421875, -3.0252685546875, -2.730712890625, -2.4361572265625, -2.1416015625, -1.8470458984375, -1.552490234375, -1.2579345703125, -0.96337890625, -0.6688232421875, -0.374267578125, -0.0797119140625, 0.21484375, 0.5093994140625, 0.803955078125, 1.0985107421875, 1.39306640625, 1.6876220703125, 1.982177734375, 2.2767333984375, 2.5712890625, 2.8658447265625, 3.160400390625, 3.4549560546875, 3.74951171875, 4.0440673828125, 4.338623046875, 4.6331787109375, 4.927734375, 5.2222900390625, 5.516845703125, 5.8114013671875, 6.10595703125, 6.4005126953125, 6.695068359375, 6.9896240234375, 7.2841796875, 7.5787353515625, 7.873291015625, 8.1678466796875, 8.46240234375, 8.7569580078125, 9.051513671875, 9.3460693359375, 9.640625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 8.0, 16.0, 20.0, 24.0, 53.0, 70.0, 135.0, 192.0, 299.0, 525.0, 892.0, 1470.0, 2518.0, 4271.0, 7204.0, 12128.0, 20189.0, 32352.0, 49621.0, 72006.0, 96663.0, 117493.0, 129101.0, 127132.0, 111232.0, 87058.0, 63731.0, 42646.0, 27661.0, 17007.0, 10203.0, 6039.0, 3495.0, 2049.0, 1227.0, 716.0, 431.0, 271.0, 158.0, 84.0, 53.0, 42.0, 24.0, 20.0, 10.0, 3.0, 7.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.66015625, -6.43682861328125, -6.2135009765625, -5.99017333984375, -5.766845703125, -5.54351806640625, -5.3201904296875, -5.09686279296875, -4.87353515625, -4.65020751953125, -4.4268798828125, -4.20355224609375, -3.980224609375, -3.75689697265625, -3.5335693359375, -3.31024169921875, -3.0869140625, -2.86358642578125, -2.6402587890625, -2.41693115234375, -2.193603515625, -1.97027587890625, -1.7469482421875, -1.52362060546875, -1.30029296875, -1.07696533203125, -0.8536376953125, -0.63031005859375, -0.406982421875, -0.18365478515625, 0.0396728515625, 0.26300048828125, 0.486328125, 0.70965576171875, 0.9329833984375, 1.15631103515625, 1.379638671875, 1.60296630859375, 1.8262939453125, 2.04962158203125, 2.27294921875, 2.49627685546875, 2.7196044921875, 2.94293212890625, 3.166259765625, 3.38958740234375, 3.6129150390625, 3.83624267578125, 4.0595703125, 4.28289794921875, 4.5062255859375, 4.72955322265625, 4.952880859375, 5.17620849609375, 5.3995361328125, 5.62286376953125, 5.84619140625, 6.06951904296875, 6.2928466796875, 6.51617431640625, 6.739501953125, 6.96282958984375, 7.1861572265625, 7.40948486328125, 7.6328125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 4.0, 5.0, 3.0, 13.0, 6.0, 10.0, 9.0, 20.0, 16.0, 14.0, 23.0, 19.0, 24.0, 32.0, 26.0, 41.0, 33.0, 38.0, 35.0, 42.0, 43.0, 31.0, 42.0, 41.0, 44.0, 45.0, 34.0, 40.0, 34.0, 28.0, 22.0, 28.0, 21.0, 15.0, 20.0, 17.0, 12.0, 11.0, 9.0, 15.0, 12.0, 9.0, 5.0, 4.0, 5.0, 1.0, 4.0, 1.0, 1.0, 2.0], "bins": [-7.1015625, -6.90380859375, -6.7060546875, -6.50830078125, -6.310546875, -6.11279296875, -5.9150390625, -5.71728515625, -5.51953125, -5.32177734375, -5.1240234375, -4.92626953125, -4.728515625, -4.53076171875, -4.3330078125, -4.13525390625, -3.9375, -3.73974609375, -3.5419921875, -3.34423828125, -3.146484375, -2.94873046875, -2.7509765625, -2.55322265625, -2.35546875, -2.15771484375, -1.9599609375, -1.76220703125, -1.564453125, -1.36669921875, -1.1689453125, -0.97119140625, -0.7734375, -0.57568359375, -0.3779296875, -0.18017578125, 0.017578125, 0.21533203125, 0.4130859375, 0.61083984375, 0.80859375, 1.00634765625, 1.2041015625, 1.40185546875, 1.599609375, 1.79736328125, 1.9951171875, 2.19287109375, 2.390625, 2.58837890625, 2.7861328125, 2.98388671875, 3.181640625, 3.37939453125, 3.5771484375, 3.77490234375, 3.97265625, 4.17041015625, 4.3681640625, 4.56591796875, 4.763671875, 4.96142578125, 5.1591796875, 5.35693359375, 5.5546875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 13.0, 28.0, 38.0, 39.0, 115.0, 149.0, 239.0, 371.0, 652.0, 1198.0, 1928.0, 3307.0, 5925.0, 9751.0, 16420.0, 27125.0, 43344.0, 65214.0, 91753.0, 117914.0, 134914.0, 136130.0, 119562.0, 93735.0, 66168.0, 43708.0, 27730.0, 16912.0, 10021.0, 5862.0, 3435.0, 1957.0, 1149.0, 669.0, 424.0, 248.0, 141.0, 81.0, 74.0, 39.0, 33.0, 5.0, 16.0, 8.0, 5.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.556640625, -2.479217529296875, -2.40179443359375, -2.324371337890625, -2.2469482421875, -2.169525146484375, -2.09210205078125, -2.014678955078125, -1.937255859375, -1.859832763671875, -1.78240966796875, -1.704986572265625, -1.6275634765625, -1.550140380859375, -1.47271728515625, -1.395294189453125, -1.31787109375, -1.240447998046875, -1.16302490234375, -1.085601806640625, -1.0081787109375, -0.930755615234375, -0.85333251953125, -0.775909423828125, -0.698486328125, -0.621063232421875, -0.54364013671875, -0.466217041015625, -0.3887939453125, -0.311370849609375, -0.23394775390625, -0.156524658203125, -0.0791015625, -0.001678466796875, 0.07574462890625, 0.153167724609375, 0.2305908203125, 0.308013916015625, 0.38543701171875, 0.462860107421875, 0.540283203125, 0.617706298828125, 0.69512939453125, 0.772552490234375, 0.8499755859375, 0.927398681640625, 1.00482177734375, 1.082244873046875, 1.15966796875, 1.237091064453125, 1.31451416015625, 1.391937255859375, 1.4693603515625, 1.546783447265625, 1.62420654296875, 1.701629638671875, 1.779052734375, 1.856475830078125, 1.93389892578125, 2.011322021484375, 2.0887451171875, 2.166168212890625, 2.24359130859375, 2.321014404296875, 2.3984375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 4.0, 5.0, 1.0, 6.0, 15.0, 6.0, 13.0, 11.0, 14.0, 18.0, 19.0, 16.0, 19.0, 35.0, 29.0, 46.0, 45.0, 42.0, 51.0, 57.0, 41.0, 57.0, 51.0, 35.0, 41.0, 38.0, 44.0, 35.0, 35.0, 30.0, 24.0, 20.0, 19.0, 14.0, 13.0, 11.0, 9.0, 7.0, 7.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00024366378784179688, -0.00023605301976203918, -0.0002284422516822815, -0.0002208314836025238, -0.0002132207155227661, -0.00020560994744300842, -0.00019799917936325073, -0.00019038841128349304, -0.00018277764320373535, -0.00017516687512397766, -0.00016755610704421997, -0.00015994533896446228, -0.0001523345708847046, -0.0001447238028049469, -0.0001371130347251892, -0.00012950226664543152, -0.00012189149856567383, -0.00011428073048591614, -0.00010666996240615845, -9.905919432640076e-05, -9.144842624664307e-05, -8.383765816688538e-05, -7.622689008712769e-05, -6.861612200737e-05, -6.1005353927612305e-05, -5.3394585847854614e-05, -4.5783817768096924e-05, -3.8173049688339233e-05, -3.056228160858154e-05, -2.2951513528823853e-05, -1.5340745449066162e-05, -7.729977369308472e-06, -1.1920928955078125e-07, 7.491558790206909e-06, 1.51023268699646e-05, 2.271309494972229e-05, 3.032386302947998e-05, 3.793463110923767e-05, 4.554539918899536e-05, 5.315616726875305e-05, 6.076693534851074e-05, 6.837770342826843e-05, 7.598847150802612e-05, 8.359923958778381e-05, 9.12100076675415e-05, 9.88207757472992e-05, 0.00010643154382705688, 0.00011404231190681458, 0.00012165307998657227, 0.00012926384806632996, 0.00013687461614608765, 0.00014448538422584534, 0.00015209615230560303, 0.00015970692038536072, 0.0001673176884651184, 0.0001749284565448761, 0.0001825392246246338, 0.00019014999270439148, 0.00019776076078414917, 0.00020537152886390686, 0.00021298229694366455, 0.00022059306502342224, 0.00022820383310317993, 0.00023581460118293762, 0.0002434253692626953]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 7.0, 2.0, 7.0, 13.0, 14.0, 22.0, 33.0, 48.0, 85.0, 138.0, 196.0, 252.0, 463.0, 735.0, 1255.0, 2060.0, 3302.0, 5330.0, 8701.0, 13992.0, 22608.0, 35249.0, 51986.0, 74638.0, 98170.0, 117523.0, 127089.0, 123327.0, 106109.0, 83234.0, 59816.0, 41041.0, 26753.0, 16932.0, 10700.0, 6439.0, 4075.0, 2385.0, 1442.0, 869.0, 576.0, 318.0, 202.0, 154.0, 104.0, 56.0, 37.0, 23.0, 15.0, 11.0, 12.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0], "bins": [-2.421875, -2.34295654296875, -2.2640380859375, -2.18511962890625, -2.106201171875, -2.02728271484375, -1.9483642578125, -1.86944580078125, -1.79052734375, -1.71160888671875, -1.6326904296875, -1.55377197265625, -1.474853515625, -1.39593505859375, -1.3170166015625, -1.23809814453125, -1.1591796875, -1.08026123046875, -1.0013427734375, -0.92242431640625, -0.843505859375, -0.76458740234375, -0.6856689453125, -0.60675048828125, -0.52783203125, -0.44891357421875, -0.3699951171875, -0.29107666015625, -0.212158203125, -0.13323974609375, -0.0543212890625, 0.02459716796875, 0.103515625, 0.18243408203125, 0.2613525390625, 0.34027099609375, 0.419189453125, 0.49810791015625, 0.5770263671875, 0.65594482421875, 0.73486328125, 0.81378173828125, 0.8927001953125, 0.97161865234375, 1.050537109375, 1.12945556640625, 1.2083740234375, 1.28729248046875, 1.3662109375, 1.44512939453125, 1.5240478515625, 1.60296630859375, 1.681884765625, 1.76080322265625, 1.8397216796875, 1.91864013671875, 1.99755859375, 2.07647705078125, 2.1553955078125, 2.23431396484375, 2.313232421875, 2.39215087890625, 2.4710693359375, 2.54998779296875, 2.62890625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 3.0, 6.0, 13.0, 10.0, 11.0, 10.0, 27.0, 22.0, 26.0, 25.0, 37.0, 38.0, 32.0, 42.0, 44.0, 41.0, 43.0, 43.0, 50.0, 49.0, 41.0, 41.0, 51.0, 36.0, 26.0, 26.0, 35.0, 28.0, 22.0, 20.0, 15.0, 16.0, 7.0, 12.0, 8.0, 6.0, 4.0, 6.0, 6.0, 2.0, 6.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.0126953125, -0.9803619384765625, -0.948028564453125, -0.9156951904296875, -0.88336181640625, -0.8510284423828125, -0.818695068359375, -0.7863616943359375, -0.7540283203125, -0.7216949462890625, -0.689361572265625, -0.6570281982421875, -0.62469482421875, -0.5923614501953125, -0.560028076171875, -0.5276947021484375, -0.495361328125, -0.4630279541015625, -0.430694580078125, -0.3983612060546875, -0.36602783203125, -0.3336944580078125, -0.301361083984375, -0.2690277099609375, -0.2366943359375, -0.2043609619140625, -0.172027587890625, -0.1396942138671875, -0.10736083984375, -0.0750274658203125, -0.042694091796875, -0.0103607177734375, 0.02197265625, 0.0543060302734375, 0.086639404296875, 0.1189727783203125, 0.15130615234375, 0.1836395263671875, 0.215972900390625, 0.2483062744140625, 0.2806396484375, 0.3129730224609375, 0.345306396484375, 0.3776397705078125, 0.40997314453125, 0.4423065185546875, 0.474639892578125, 0.5069732666015625, 0.539306640625, 0.5716400146484375, 0.603973388671875, 0.6363067626953125, 0.66864013671875, 0.7009735107421875, 0.733306884765625, 0.7656402587890625, 0.7979736328125, 0.8303070068359375, 0.862640380859375, 0.8949737548828125, 0.92730712890625, 0.9596405029296875, 0.991973876953125, 1.0243072509765625, 1.056640625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 6.0, 6.0, 4.0, 18.0, 6.0, 15.0, 19.0, 21.0, 34.0, 27.0, 32.0, 29.0, 48.0, 35.0, 55.0, 47.0, 47.0, 48.0, 54.0, 41.0, 42.0, 53.0, 50.0, 44.0, 30.0, 24.0, 24.0, 17.0, 25.0, 21.0, 12.0, 12.0, 11.0, 6.0, 8.0, 5.0, 7.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.399574279785156, -9.093140602111816, -8.786706924438477, -8.480274200439453, -8.173840522766113, -7.867406845092773, -7.560973644256592, -7.25454044342041, -6.94810676574707, -6.6416730880737305, -6.335239887237549, -6.028806686401367, -5.722373008728027, -5.4159393310546875, -5.109506130218506, -4.803072929382324, -4.496639251708984, -4.1902055740356445, -3.883772373199463, -3.577338933944702, -3.2709054946899414, -2.9644720554351807, -2.65803861618042, -2.351605176925659, -2.0451717376708984, -1.7387382984161377, -1.432304859161377, -1.1258714199066162, -0.8194379806518555, -0.5130045413970947, -0.20657110214233398, 0.09986233711242676, 0.4062967300415039, 0.7127301692962646, 1.0191636085510254, 1.3255970478057861, 1.6320304870605469, 1.9384639263153076, 2.2448973655700684, 2.551330804824829, 2.85776424407959, 3.1641976833343506, 3.4706311225891113, 3.777064561843872, 4.083498001098633, 4.389931678771973, 4.696364879608154, 5.002798080444336, 5.309231758117676, 5.615665435791016, 5.922098636627197, 6.228531837463379, 6.534965515136719, 6.841399192810059, 7.14783239364624, 7.454265594482422, 7.760699272155762, 8.067132949829102, 8.373565673828125, 8.679999351501465, 8.986433029174805, 9.292866706848145, 9.599300384521484, 9.905733108520508, 10.212166786193848]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 9.0, 5.0, 5.0, 8.0, 8.0, 16.0, 13.0, 16.0, 15.0, 10.0, 20.0, 18.0, 28.0, 22.0, 21.0, 33.0, 28.0, 47.0, 36.0, 37.0, 35.0, 30.0, 41.0, 41.0, 47.0, 42.0, 40.0, 40.0, 33.0, 32.0, 34.0, 25.0, 29.0, 22.0, 27.0, 16.0, 12.0, 14.0, 6.0, 6.0, 10.0, 6.0, 8.0, 3.0, 5.0, 1.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.561555862426758, -9.239623069763184, -8.91769027709961, -8.595757484436035, -8.273824691772461, -7.9518914222717285, -7.629958629608154, -7.308025360107422, -6.986092567443848, -6.664159774780273, -6.342226982116699, -6.020294189453125, -5.698360919952393, -5.376428127288818, -5.054495334625244, -4.732562065124512, -4.410629749298096, -4.0886969566345215, -3.766763925552368, -3.444831132888794, -3.1228981018066406, -2.8009653091430664, -2.479032516479492, -2.157099485397339, -1.8351666927337646, -1.5132337808609009, -1.191300868988037, -0.8693680763244629, -0.5474351644515991, -0.22550225257873535, 0.09643054008483887, 0.4183635711669922, 0.7402963638305664, 1.0622292757034302, 1.384162187576294, 1.7060949802398682, 2.0280280113220215, 2.3499608039855957, 2.67189359664917, 2.9938266277313232, 3.3157594203948975, 3.6376922130584717, 3.959625244140625, 4.281558036804199, 4.603490829467773, 4.925423622131348, 5.247356414794922, 5.569289684295654, 5.8912224769592285, 6.213155269622803, 6.535088062286377, 6.857021331787109, 7.178954124450684, 7.500886917114258, 7.822819709777832, 8.144752502441406, 8.46668529510498, 8.788618087768555, 9.110550880432129, 9.432483673095703, 9.754416465759277, 10.076349258422852, 10.398283004760742, 10.720215797424316, 11.04214859008789]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [3.0, 6.0, 2.0, 7.0, 8.0, 20.0, 18.0, 43.0, 62.0, 94.0, 111.0, 203.0, 298.0, 412.0, 662.0, 1014.0, 1583.0, 2220.0, 3645.0, 5457.0, 8562.0, 13799.0, 22160.0, 35553.0, 58742.0, 95979.0, 159087.0, 254999.0, 385199.0, 521372.0, 607155.0, 592226.0, 487321.0, 346905.0, 225025.0, 139454.0, 84202.0, 51749.0, 32037.0, 19897.0, 12637.0, 8293.0, 5494.0, 3464.0, 2332.0, 1497.0, 1070.0, 715.0, 472.0, 317.0, 200.0, 161.0, 127.0, 74.0, 47.0, 32.0, 26.0, 14.0, 11.0, 16.0, 5.0, 7.0, 1.0, 1.0], "bins": [-7.06640625, -6.8375244140625, -6.608642578125, -6.3797607421875, -6.15087890625, -5.9219970703125, -5.693115234375, -5.4642333984375, -5.2353515625, -5.0064697265625, -4.777587890625, -4.5487060546875, -4.31982421875, -4.0909423828125, -3.862060546875, -3.6331787109375, -3.404296875, -3.1754150390625, -2.946533203125, -2.7176513671875, -2.48876953125, -2.2598876953125, -2.031005859375, -1.8021240234375, -1.5732421875, -1.3443603515625, -1.115478515625, -0.8865966796875, -0.65771484375, -0.4288330078125, -0.199951171875, 0.0289306640625, 0.2578125, 0.4866943359375, 0.715576171875, 0.9444580078125, 1.17333984375, 1.4022216796875, 1.631103515625, 1.8599853515625, 2.0888671875, 2.3177490234375, 2.546630859375, 2.7755126953125, 3.00439453125, 3.2332763671875, 3.462158203125, 3.6910400390625, 3.919921875, 4.1488037109375, 4.377685546875, 4.6065673828125, 4.83544921875, 5.0643310546875, 5.293212890625, 5.5220947265625, 5.7509765625, 5.9798583984375, 6.208740234375, 6.4376220703125, 6.66650390625, 6.8953857421875, 7.124267578125, 7.3531494140625, 7.58203125]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 5.0, 4.0, 15.0, 9.0, 11.0, 13.0, 11.0, 14.0, 18.0, 21.0, 20.0, 14.0, 23.0, 24.0, 24.0, 31.0, 34.0, 49.0, 38.0, 34.0, 41.0, 30.0, 52.0, 49.0, 30.0, 33.0, 32.0, 26.0, 39.0, 41.0, 33.0, 31.0, 26.0, 24.0, 17.0, 14.0, 14.0, 12.0, 10.0, 3.0, 3.0, 10.0, 7.0, 3.0, 4.0, 6.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.28125, -7.9974365234375, -7.713623046875, -7.4298095703125, -7.14599609375, -6.8621826171875, -6.578369140625, -6.2945556640625, -6.0107421875, -5.7269287109375, -5.443115234375, -5.1593017578125, -4.87548828125, -4.5916748046875, -4.307861328125, -4.0240478515625, -3.740234375, -3.4564208984375, -3.172607421875, -2.8887939453125, -2.60498046875, -2.3211669921875, -2.037353515625, -1.7535400390625, -1.4697265625, -1.1859130859375, -0.902099609375, -0.6182861328125, -0.33447265625, -0.0506591796875, 0.233154296875, 0.5169677734375, 0.80078125, 1.0845947265625, 1.368408203125, 1.6522216796875, 1.93603515625, 2.2198486328125, 2.503662109375, 2.7874755859375, 3.0712890625, 3.3551025390625, 3.638916015625, 3.9227294921875, 4.20654296875, 4.4903564453125, 4.774169921875, 5.0579833984375, 5.341796875, 5.6256103515625, 5.909423828125, 6.1932373046875, 6.47705078125, 6.7608642578125, 7.044677734375, 7.3284912109375, 7.6123046875, 7.8961181640625, 8.179931640625, 8.4637451171875, 8.74755859375, 9.0313720703125, 9.315185546875, 9.5989990234375, 9.8828125]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 7.0, 17.0, 24.0, 45.0, 59.0, 103.0, 176.0, 286.0, 482.0, 832.0, 1524.0, 2544.0, 4553.0, 8230.0, 15214.0, 27495.0, 50821.0, 92175.0, 165071.0, 285048.0, 460228.0, 645044.0, 726614.0, 632684.0, 447598.0, 273234.0, 158310.0, 88715.0, 48190.0, 26076.0, 14724.0, 7922.0, 4397.0, 2457.0, 1372.0, 798.0, 503.0, 276.0, 165.0, 104.0, 64.0, 42.0, 21.0, 16.0, 9.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-10.9609375, -10.623291015625, -10.28564453125, -9.947998046875, -9.6103515625, -9.272705078125, -8.93505859375, -8.597412109375, -8.259765625, -7.922119140625, -7.58447265625, -7.246826171875, -6.9091796875, -6.571533203125, -6.23388671875, -5.896240234375, -5.55859375, -5.220947265625, -4.88330078125, -4.545654296875, -4.2080078125, -3.870361328125, -3.53271484375, -3.195068359375, -2.857421875, -2.519775390625, -2.18212890625, -1.844482421875, -1.5068359375, -1.169189453125, -0.83154296875, -0.493896484375, -0.15625, 0.181396484375, 0.51904296875, 0.856689453125, 1.1943359375, 1.531982421875, 1.86962890625, 2.207275390625, 2.544921875, 2.882568359375, 3.22021484375, 3.557861328125, 3.8955078125, 4.233154296875, 4.57080078125, 4.908447265625, 5.24609375, 5.583740234375, 5.92138671875, 6.259033203125, 6.5966796875, 6.934326171875, 7.27197265625, 7.609619140625, 7.947265625, 8.284912109375, 8.62255859375, 8.960205078125, 9.2978515625, 9.635498046875, 9.97314453125, 10.310791015625, 10.6484375]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 12.0, 6.0, 22.0, 19.0, 36.0, 30.0, 45.0, 48.0, 76.0, 97.0, 87.0, 106.0, 132.0, 153.0, 167.0, 171.0, 206.0, 239.0, 221.0, 234.0, 225.0, 212.0, 212.0, 197.0, 157.0, 144.0, 161.0, 112.0, 107.0, 89.0, 70.0, 59.0, 44.0, 33.0, 37.0, 31.0, 19.0, 11.0, 15.0, 7.0, 7.0, 3.0, 8.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0078125, -3.8814697265625, -3.755126953125, -3.6287841796875, -3.50244140625, -3.3760986328125, -3.249755859375, -3.1234130859375, -2.9970703125, -2.8707275390625, -2.744384765625, -2.6180419921875, -2.49169921875, -2.3653564453125, -2.239013671875, -2.1126708984375, -1.986328125, -1.8599853515625, -1.733642578125, -1.6072998046875, -1.48095703125, -1.3546142578125, -1.228271484375, -1.1019287109375, -0.9755859375, -0.8492431640625, -0.722900390625, -0.5965576171875, -0.47021484375, -0.3438720703125, -0.217529296875, -0.0911865234375, 0.03515625, 0.1614990234375, 0.287841796875, 0.4141845703125, 0.54052734375, 0.6668701171875, 0.793212890625, 0.9195556640625, 1.0458984375, 1.1722412109375, 1.298583984375, 1.4249267578125, 1.55126953125, 1.6776123046875, 1.803955078125, 1.9302978515625, 2.056640625, 2.1829833984375, 2.309326171875, 2.4356689453125, 2.56201171875, 2.6883544921875, 2.814697265625, 2.9410400390625, 3.0673828125, 3.1937255859375, 3.320068359375, 3.4464111328125, 3.57275390625, 3.6990966796875, 3.825439453125, 3.9517822265625, 4.078125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 3.0, 4.0, 4.0, 7.0, 8.0, 11.0, 14.0, 13.0, 23.0, 13.0, 22.0, 24.0, 24.0, 40.0, 34.0, 39.0, 36.0, 40.0, 42.0, 37.0, 50.0, 46.0, 48.0, 44.0, 46.0, 44.0, 38.0, 29.0, 31.0, 31.0, 26.0, 15.0, 20.0, 13.0, 18.0, 10.0, 10.0, 4.0, 3.0, 3.0, 6.0, 7.0, 8.0, 3.0, 1.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.288443565368652, -8.988513946533203, -8.688583374023438, -8.388652801513672, -8.088723182678223, -7.788793087005615, -7.488862991333008, -7.1889328956604, -6.889002799987793, -6.5890727043151855, -6.289142608642578, -5.989212512969971, -5.689282417297363, -5.389352321624756, -5.089422225952148, -4.789492130279541, -4.489562034606934, -4.189631938934326, -3.8897018432617188, -3.5897717475891113, -3.289841651916504, -2.9899115562438965, -2.689981460571289, -2.3900513648986816, -2.090121269226074, -1.7901911735534668, -1.4902610778808594, -1.190330982208252, -0.8904008865356445, -0.5904707908630371, -0.2905406951904297, 0.009389400482177734, 0.30931949615478516, 0.6092495918273926, 0.9091796875, 1.2091097831726074, 1.5090398788452148, 1.8089699745178223, 2.1089000701904297, 2.408830165863037, 2.7087602615356445, 3.008690357208252, 3.3086204528808594, 3.608550548553467, 3.908480644226074, 4.208410739898682, 4.508340835571289, 4.8082709312438965, 5.108201026916504, 5.408131122589111, 5.708061218261719, 6.007991313934326, 6.307921409606934, 6.607851505279541, 6.907781600952148, 7.207711696624756, 7.507641792297363, 7.807571887969971, 8.107501983642578, 8.407432556152344, 8.707362174987793, 9.007291793823242, 9.307222366333008, 9.607152938842773, 9.907082557678223]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 5.0, 5.0, 2.0, 7.0, 11.0, 8.0, 13.0, 20.0, 16.0, 15.0, 20.0, 20.0, 19.0, 25.0, 31.0, 24.0, 39.0, 32.0, 31.0, 29.0, 42.0, 39.0, 38.0, 31.0, 38.0, 30.0, 36.0, 25.0, 33.0, 29.0, 39.0, 27.0, 30.0, 31.0, 19.0, 16.0, 17.0, 11.0, 14.0, 10.0, 12.0, 14.0, 9.0, 13.0, 5.0, 5.0, 5.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.885379791259766, -8.593806266784668, -8.30223274230957, -8.010659217834473, -7.719086170196533, -7.4275126457214355, -7.135939121246338, -6.844366073608398, -6.552792549133301, -6.261219024658203, -5.9696455001831055, -5.678071975708008, -5.386498928070068, -5.094925403594971, -4.803351879119873, -4.511778831481934, -4.220204830169678, -3.92863130569458, -3.6370580196380615, -3.345484495162964, -3.0539112091064453, -2.7623376846313477, -2.47076416015625, -2.1791908740997314, -1.8876173496246338, -1.5960439443588257, -1.3044705390930176, -1.01289701461792, -0.7213236093521118, -0.4297502040863037, -0.13817667961120605, 0.1533966064453125, 0.44497013092041016, 0.7365435361862183, 1.0281169414520264, 1.319690465927124, 1.6112638711929321, 1.9028372764587402, 2.194410800933838, 2.4859840869903564, 2.777557611465454, 3.0691311359405518, 3.3607044219970703, 3.652277946472168, 3.9438514709472656, 4.235424995422363, 4.526998519897461, 4.8185715675354, 5.110145092010498, 5.401718616485596, 5.693292140960693, 5.984865188598633, 6.2764387130737305, 6.568012237548828, 6.859585762023926, 7.151159286499023, 7.442732810974121, 7.734306335449219, 8.025879859924316, 8.317453384399414, 8.609026908874512, 8.90060043334961, 9.19217300415039, 9.483746528625488, 9.775320053100586]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 6.0, 20.0, 28.0, 38.0, 61.0, 113.0, 147.0, 245.0, 344.0, 573.0, 951.0, 1499.0, 2310.0, 3886.0, 6133.0, 9744.0, 15698.0, 24175.0, 36489.0, 52857.0, 74002.0, 94648.0, 113822.0, 122803.0, 118784.0, 102832.0, 83004.0, 60728.0, 43119.0, 28988.0, 18481.0, 11945.0, 7460.0, 4864.0, 2887.0, 1794.0, 1151.0, 714.0, 441.0, 247.0, 192.0, 111.0, 73.0, 50.0, 33.0, 20.0, 13.0, 10.0, 10.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.54296875, -4.39501953125, -4.2470703125, -4.09912109375, -3.951171875, -3.80322265625, -3.6552734375, -3.50732421875, -3.359375, -3.21142578125, -3.0634765625, -2.91552734375, -2.767578125, -2.61962890625, -2.4716796875, -2.32373046875, -2.17578125, -2.02783203125, -1.8798828125, -1.73193359375, -1.583984375, -1.43603515625, -1.2880859375, -1.14013671875, -0.9921875, -0.84423828125, -0.6962890625, -0.54833984375, -0.400390625, -0.25244140625, -0.1044921875, 0.04345703125, 0.19140625, 0.33935546875, 0.4873046875, 0.63525390625, 0.783203125, 0.93115234375, 1.0791015625, 1.22705078125, 1.375, 1.52294921875, 1.6708984375, 1.81884765625, 1.966796875, 2.11474609375, 2.2626953125, 2.41064453125, 2.55859375, 2.70654296875, 2.8544921875, 3.00244140625, 3.150390625, 3.29833984375, 3.4462890625, 3.59423828125, 3.7421875, 3.89013671875, 4.0380859375, 4.18603515625, 4.333984375, 4.48193359375, 4.6298828125, 4.77783203125, 4.92578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 2.0, 5.0, 2.0, 6.0, 3.0, 4.0, 10.0, 11.0, 12.0, 18.0, 14.0, 13.0, 26.0, 15.0, 26.0, 27.0, 22.0, 29.0, 31.0, 26.0, 38.0, 30.0, 30.0, 34.0, 25.0, 41.0, 28.0, 36.0, 39.0, 42.0, 32.0, 32.0, 25.0, 21.0, 31.0, 32.0, 26.0, 24.0, 14.0, 15.0, 13.0, 16.0, 14.0, 16.0, 8.0, 4.0, 9.0, 8.0, 6.0, 6.0, 5.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-8.375, -8.0855712890625, -7.796142578125, -7.5067138671875, -7.21728515625, -6.9278564453125, -6.638427734375, -6.3489990234375, -6.0595703125, -5.7701416015625, -5.480712890625, -5.1912841796875, -4.90185546875, -4.6124267578125, -4.322998046875, -4.0335693359375, -3.744140625, -3.4547119140625, -3.165283203125, -2.8758544921875, -2.58642578125, -2.2969970703125, -2.007568359375, -1.7181396484375, -1.4287109375, -1.1392822265625, -0.849853515625, -0.5604248046875, -0.27099609375, 0.0184326171875, 0.307861328125, 0.5972900390625, 0.88671875, 1.1761474609375, 1.465576171875, 1.7550048828125, 2.04443359375, 2.3338623046875, 2.623291015625, 2.9127197265625, 3.2021484375, 3.4915771484375, 3.781005859375, 4.0704345703125, 4.35986328125, 4.6492919921875, 4.938720703125, 5.2281494140625, 5.517578125, 5.8070068359375, 6.096435546875, 6.3858642578125, 6.67529296875, 6.9647216796875, 7.254150390625, 7.5435791015625, 7.8330078125, 8.1224365234375, 8.411865234375, 8.7012939453125, 8.99072265625, 9.2801513671875, 9.569580078125, 9.8590087890625, 10.1484375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 6.0, 8.0, 12.0, 26.0, 22.0, 37.0, 57.0, 100.0, 150.0, 228.0, 361.0, 577.0, 851.0, 1400.0, 2308.0, 3655.0, 5890.0, 9952.0, 16294.0, 27173.0, 44568.0, 72112.0, 108236.0, 145107.0, 162908.0, 146163.0, 109972.0, 73361.0, 46034.0, 27854.0, 16870.0, 10185.0, 5928.0, 3663.0, 2425.0, 1466.0, 897.0, 606.0, 397.0, 254.0, 150.0, 100.0, 68.0, 42.0, 29.0, 20.0, 9.0, 7.0, 9.0, 6.0, 6.0, 1.0, 6.0], "bins": [-8.0546875, -7.8280029296875, -7.601318359375, -7.3746337890625, -7.14794921875, -6.9212646484375, -6.694580078125, -6.4678955078125, -6.2412109375, -6.0145263671875, -5.787841796875, -5.5611572265625, -5.33447265625, -5.1077880859375, -4.881103515625, -4.6544189453125, -4.427734375, -4.2010498046875, -3.974365234375, -3.7476806640625, -3.52099609375, -3.2943115234375, -3.067626953125, -2.8409423828125, -2.6142578125, -2.3875732421875, -2.160888671875, -1.9342041015625, -1.70751953125, -1.4808349609375, -1.254150390625, -1.0274658203125, -0.80078125, -0.5740966796875, -0.347412109375, -0.1207275390625, 0.10595703125, 0.3326416015625, 0.559326171875, 0.7860107421875, 1.0126953125, 1.2393798828125, 1.466064453125, 1.6927490234375, 1.91943359375, 2.1461181640625, 2.372802734375, 2.5994873046875, 2.826171875, 3.0528564453125, 3.279541015625, 3.5062255859375, 3.73291015625, 3.9595947265625, 4.186279296875, 4.4129638671875, 4.6396484375, 4.8663330078125, 5.093017578125, 5.3197021484375, 5.54638671875, 5.7730712890625, 5.999755859375, 6.2264404296875, 6.453125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 5.0, 7.0, 2.0, 7.0, 5.0, 15.0, 17.0, 13.0, 14.0, 15.0, 22.0, 20.0, 35.0, 25.0, 35.0, 44.0, 48.0, 58.0, 50.0, 49.0, 53.0, 53.0, 29.0, 44.0, 41.0, 33.0, 42.0, 38.0, 31.0, 27.0, 24.0, 20.0, 17.0, 17.0, 12.0, 10.0, 9.0, 7.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.49609375, -7.25372314453125, -7.0113525390625, -6.76898193359375, -6.526611328125, -6.28424072265625, -6.0418701171875, -5.79949951171875, -5.55712890625, -5.31475830078125, -5.0723876953125, -4.83001708984375, -4.587646484375, -4.34527587890625, -4.1029052734375, -3.86053466796875, -3.6181640625, -3.37579345703125, -3.1334228515625, -2.89105224609375, -2.648681640625, -2.40631103515625, -2.1639404296875, -1.92156982421875, -1.67919921875, -1.43682861328125, -1.1944580078125, -0.95208740234375, -0.709716796875, -0.46734619140625, -0.2249755859375, 0.01739501953125, 0.259765625, 0.50213623046875, 0.7445068359375, 0.98687744140625, 1.229248046875, 1.47161865234375, 1.7139892578125, 1.95635986328125, 2.19873046875, 2.44110107421875, 2.6834716796875, 2.92584228515625, 3.168212890625, 3.41058349609375, 3.6529541015625, 3.89532470703125, 4.1376953125, 4.38006591796875, 4.6224365234375, 4.86480712890625, 5.107177734375, 5.34954833984375, 5.5919189453125, 5.83428955078125, 6.07666015625, 6.31903076171875, 6.5614013671875, 6.80377197265625, 7.046142578125, 7.28851318359375, 7.5308837890625, 7.77325439453125, 8.015625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 7.0, 16.0, 26.0, 20.0, 33.0, 62.0, 79.0, 135.0, 196.0, 342.0, 594.0, 891.0, 1670.0, 2902.0, 5504.0, 10265.0, 19860.0, 37936.0, 70838.0, 123640.0, 185688.0, 206562.0, 161943.0, 100491.0, 55722.0, 29556.0, 15451.0, 8040.0, 4394.0, 2328.0, 1312.0, 790.0, 465.0, 275.0, 174.0, 110.0, 79.0, 47.0, 38.0, 20.0, 18.0, 11.0, 9.0, 6.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.14453125, -4.00775146484375, -3.8709716796875, -3.73419189453125, -3.597412109375, -3.46063232421875, -3.3238525390625, -3.18707275390625, -3.05029296875, -2.91351318359375, -2.7767333984375, -2.63995361328125, -2.503173828125, -2.36639404296875, -2.2296142578125, -2.09283447265625, -1.9560546875, -1.81927490234375, -1.6824951171875, -1.54571533203125, -1.408935546875, -1.27215576171875, -1.1353759765625, -0.99859619140625, -0.86181640625, -0.72503662109375, -0.5882568359375, -0.45147705078125, -0.314697265625, -0.17791748046875, -0.0411376953125, 0.09564208984375, 0.232421875, 0.36920166015625, 0.5059814453125, 0.64276123046875, 0.779541015625, 0.91632080078125, 1.0531005859375, 1.18988037109375, 1.32666015625, 1.46343994140625, 1.6002197265625, 1.73699951171875, 1.873779296875, 2.01055908203125, 2.1473388671875, 2.28411865234375, 2.4208984375, 2.55767822265625, 2.6944580078125, 2.83123779296875, 2.968017578125, 3.10479736328125, 3.2415771484375, 3.37835693359375, 3.51513671875, 3.65191650390625, 3.7886962890625, 3.92547607421875, 4.062255859375, 4.19903564453125, 4.3358154296875, 4.47259521484375, 4.609375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 6.0, 13.0, 12.0, 14.0, 16.0, 24.0, 23.0, 25.0, 40.0, 33.0, 40.0, 39.0, 54.0, 56.0, 57.0, 51.0, 56.0, 58.0, 51.0, 50.0, 33.0, 38.0, 52.0, 35.0, 22.0, 18.0, 16.0, 17.0, 14.0, 4.0, 9.0, 3.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00023162364959716797, -0.0002250969409942627, -0.00021857023239135742, -0.00021204352378845215, -0.00020551681518554688, -0.0001989901065826416, -0.00019246339797973633, -0.00018593668937683105, -0.00017940998077392578, -0.0001728832721710205, -0.00016635656356811523, -0.00015982985496520996, -0.0001533031463623047, -0.00014677643775939941, -0.00014024972915649414, -0.00013372302055358887, -0.0001271963119506836, -0.00012066960334777832, -0.00011414289474487305, -0.00010761618614196777, -0.0001010894775390625, -9.456276893615723e-05, -8.803606033325195e-05, -8.150935173034668e-05, -7.49826431274414e-05, -6.845593452453613e-05, -6.192922592163086e-05, -5.5402517318725586e-05, -4.887580871582031e-05, -4.234910011291504e-05, -3.5822391510009766e-05, -2.9295682907104492e-05, -2.276897430419922e-05, -1.6242265701293945e-05, -9.715557098388672e-06, -3.1888484954833984e-06, 3.337860107421875e-06, 9.864568710327148e-06, 1.6391277313232422e-05, 2.2917985916137695e-05, 2.944469451904297e-05, 3.597140312194824e-05, 4.2498111724853516e-05, 4.902482032775879e-05, 5.555152893066406e-05, 6.207823753356934e-05, 6.860494613647461e-05, 7.513165473937988e-05, 8.165836334228516e-05, 8.818507194519043e-05, 9.47117805480957e-05, 0.00010123848915100098, 0.00010776519775390625, 0.00011429190635681152, 0.0001208186149597168, 0.00012734532356262207, 0.00013387203216552734, 0.00014039874076843262, 0.0001469254493713379, 0.00015345215797424316, 0.00015997886657714844, 0.0001665055751800537, 0.00017303228378295898, 0.00017955899238586426, 0.00018608570098876953]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 12.0, 21.0, 28.0, 26.0, 42.0, 56.0, 104.0, 113.0, 184.0, 291.0, 410.0, 709.0, 1199.0, 2189.0, 4055.0, 7880.0, 15558.0, 31010.0, 58752.0, 102399.0, 155736.0, 191438.0, 179126.0, 130059.0, 78633.0, 42661.0, 21918.0, 11112.0, 5692.0, 2917.0, 1625.0, 935.0, 597.0, 353.0, 237.0, 150.0, 93.0, 78.0, 49.0, 26.0, 22.0, 19.0, 18.0, 8.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.36328125, -5.19952392578125, -5.0357666015625, -4.87200927734375, -4.708251953125, -4.54449462890625, -4.3807373046875, -4.21697998046875, -4.05322265625, -3.88946533203125, -3.7257080078125, -3.56195068359375, -3.398193359375, -3.23443603515625, -3.0706787109375, -2.90692138671875, -2.7431640625, -2.57940673828125, -2.4156494140625, -2.25189208984375, -2.088134765625, -1.92437744140625, -1.7606201171875, -1.59686279296875, -1.43310546875, -1.26934814453125, -1.1055908203125, -0.94183349609375, -0.778076171875, -0.61431884765625, -0.4505615234375, -0.28680419921875, -0.123046875, 0.04071044921875, 0.2044677734375, 0.36822509765625, 0.531982421875, 0.69573974609375, 0.8594970703125, 1.02325439453125, 1.18701171875, 1.35076904296875, 1.5145263671875, 1.67828369140625, 1.842041015625, 2.00579833984375, 2.1695556640625, 2.33331298828125, 2.4970703125, 2.66082763671875, 2.8245849609375, 2.98834228515625, 3.152099609375, 3.31585693359375, 3.4796142578125, 3.64337158203125, 3.80712890625, 3.97088623046875, 4.1346435546875, 4.29840087890625, 4.462158203125, 4.62591552734375, 4.7896728515625, 4.95343017578125, 5.1171875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 6.0, 3.0, 5.0, 4.0, 4.0, 5.0, 15.0, 17.0, 18.0, 18.0, 22.0, 24.0, 25.0, 27.0, 26.0, 35.0, 34.0, 45.0, 46.0, 44.0, 34.0, 47.0, 39.0, 52.0, 46.0, 50.0, 34.0, 44.0, 31.0, 16.0, 37.0, 27.0, 15.0, 15.0, 18.0, 19.0, 9.0, 9.0, 13.0, 4.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3408203125, -1.295654296875, -1.25048828125, -1.205322265625, -1.16015625, -1.114990234375, -1.06982421875, -1.024658203125, -0.9794921875, -0.934326171875, -0.88916015625, -0.843994140625, -0.798828125, -0.753662109375, -0.70849609375, -0.663330078125, -0.6181640625, -0.572998046875, -0.52783203125, -0.482666015625, -0.4375, -0.392333984375, -0.34716796875, -0.302001953125, -0.2568359375, -0.211669921875, -0.16650390625, -0.121337890625, -0.076171875, -0.031005859375, 0.01416015625, 0.059326171875, 0.1044921875, 0.149658203125, 0.19482421875, 0.239990234375, 0.28515625, 0.330322265625, 0.37548828125, 0.420654296875, 0.4658203125, 0.510986328125, 0.55615234375, 0.601318359375, 0.646484375, 0.691650390625, 0.73681640625, 0.781982421875, 0.8271484375, 0.872314453125, 0.91748046875, 0.962646484375, 1.0078125, 1.052978515625, 1.09814453125, 1.143310546875, 1.1884765625, 1.233642578125, 1.27880859375, 1.323974609375, 1.369140625, 1.414306640625, 1.45947265625, 1.504638671875, 1.5498046875]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 2.0, 2.0, 4.0, 10.0, 7.0, 12.0, 15.0, 14.0, 19.0, 19.0, 30.0, 31.0, 23.0, 33.0, 38.0, 47.0, 30.0, 45.0, 46.0, 49.0, 57.0, 44.0, 61.0, 49.0, 45.0, 27.0, 35.0, 35.0, 29.0, 23.0, 32.0, 12.0, 14.0, 9.0, 9.0, 9.0, 3.0, 8.0, 2.0, 5.0, 4.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.87856674194336, -9.560656547546387, -9.242746353149414, -8.924836158752441, -8.606925964355469, -8.289015769958496, -7.971105098724365, -7.653194904327393, -7.33528470993042, -7.017374515533447, -6.699464321136475, -6.381554126739502, -6.063643455505371, -5.745733261108398, -5.427823066711426, -5.109912872314453, -4.7920026779174805, -4.474092483520508, -4.156182289123535, -3.8382718563079834, -3.5203616619110107, -3.202451467514038, -2.8845410346984863, -2.5666308403015137, -2.248720645904541, -1.9308104515075684, -1.6129001379013062, -1.294989824295044, -0.9770796298980713, -0.6591694355010986, -0.3412591218948364, -0.02334880828857422, 0.29456138610839844, 0.6124716401100159, 0.9303818941116333, 1.2482922077178955, 1.5662024021148682, 1.8841125965118408, 2.2020230293273926, 2.5199332237243652, 2.837843418121338, 3.1557536125183105, 3.473663806915283, 3.791574239730835, 4.109484672546387, 4.427394866943359, 4.745305061340332, 5.063215255737305, 5.381125450134277, 5.69903564453125, 6.016945838928223, 6.334856033325195, 6.652766227722168, 6.970676422119141, 7.2885870933532715, 7.606497287750244, 7.924407482147217, 8.242318153381348, 8.56022834777832, 8.878138542175293, 9.196048736572266, 9.513958930969238, 9.831869125366211, 10.149779319763184, 10.467689514160156]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 5.0, 3.0, 15.0, 9.0, 17.0, 7.0, 19.0, 13.0, 18.0, 17.0, 20.0, 23.0, 31.0, 26.0, 33.0, 35.0, 25.0, 30.0, 38.0, 43.0, 33.0, 40.0, 36.0, 35.0, 27.0, 27.0, 31.0, 32.0, 42.0, 30.0, 33.0, 27.0, 22.0, 14.0, 18.0, 8.0, 14.0, 18.0, 12.0, 11.0, 11.0, 10.0, 10.0, 7.0, 6.0, 1.0, 3.0, 6.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0], "bins": [-9.10458755493164, -8.820202827453613, -8.53581714630127, -8.251432418823242, -7.967047691345215, -7.682662487030029, -7.398277282714844, -7.113892555236816, -6.829507827758789, -6.5451226234436035, -6.260737895965576, -5.976352691650391, -5.691967964172363, -5.407582759857178, -5.123197555541992, -4.838812828063965, -4.554427623748779, -4.270042419433594, -3.9856576919555664, -3.701272487640381, -3.4168877601623535, -3.132502555847168, -2.8481175899505615, -2.563732624053955, -2.2793476581573486, -1.9949626922607422, -1.7105777263641357, -1.4261926412582397, -1.1418076753616333, -0.8574227094650269, -0.5730376243591309, -0.2886526584625244, -0.004267692565917969, 0.28011730313301086, 0.5645022988319397, 0.8488873243331909, 1.1332722902297974, 1.4176572561264038, 1.7020423412322998, 1.9864273071289062, 2.2708122730255127, 2.555197238922119, 2.8395822048187256, 3.123967170715332, 3.4083523750305176, 3.692737102508545, 3.9771223068237305, 4.261507034301758, 4.545892238616943, 4.830277442932129, 5.114662170410156, 5.399047374725342, 5.683432102203369, 5.967817306518555, 6.252202033996582, 6.536587238311768, 6.820972442626953, 7.105357646942139, 7.389742374420166, 7.674127578735352, 7.958512306213379, 8.242897033691406, 8.52728271484375, 8.811667442321777, 9.096052169799805]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 9.0, 5.0, 9.0, 18.0, 35.0, 61.0, 85.0, 136.0, 267.0, 433.0, 782.0, 1259.0, 2069.0, 3219.0, 5316.0, 8418.0, 13050.0, 19875.0, 29379.0, 41585.0, 57676.0, 74670.0, 90955.0, 103490.0, 109467.0, 106547.0, 95667.0, 79616.0, 62093.0, 46511.0, 32963.0, 22396.0, 14997.0, 9745.0, 6156.0, 3879.0, 2303.0, 1366.0, 879.0, 460.0, 303.0, 175.0, 99.0, 61.0, 34.0, 22.0, 12.0, 7.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.77734375, -5.60040283203125, -5.4234619140625, -5.24652099609375, -5.069580078125, -4.89263916015625, -4.7156982421875, -4.53875732421875, -4.36181640625, -4.18487548828125, -4.0079345703125, -3.83099365234375, -3.654052734375, -3.47711181640625, -3.3001708984375, -3.12322998046875, -2.9462890625, -2.76934814453125, -2.5924072265625, -2.41546630859375, -2.238525390625, -2.06158447265625, -1.8846435546875, -1.70770263671875, -1.53076171875, -1.35382080078125, -1.1768798828125, -0.99993896484375, -0.822998046875, -0.64605712890625, -0.4691162109375, -0.29217529296875, -0.115234375, 0.06170654296875, 0.2386474609375, 0.41558837890625, 0.592529296875, 0.76947021484375, 0.9464111328125, 1.12335205078125, 1.30029296875, 1.47723388671875, 1.6541748046875, 1.83111572265625, 2.008056640625, 2.18499755859375, 2.3619384765625, 2.53887939453125, 2.7158203125, 2.89276123046875, 3.0697021484375, 3.24664306640625, 3.423583984375, 3.60052490234375, 3.7774658203125, 3.95440673828125, 4.13134765625, 4.30828857421875, 4.4852294921875, 4.66217041015625, 4.839111328125, 5.01605224609375, 5.1929931640625, 5.36993408203125, 5.546875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 3.0, 12.0, 6.0, 9.0, 15.0, 14.0, 18.0, 16.0, 14.0, 27.0, 16.0, 32.0, 40.0, 18.0, 31.0, 28.0, 33.0, 40.0, 37.0, 36.0, 44.0, 44.0, 33.0, 32.0, 28.0, 40.0, 29.0, 36.0, 36.0, 28.0, 25.0, 15.0, 21.0, 20.0, 19.0, 16.0, 13.0, 14.0, 11.0, 10.0, 9.0, 7.0, 5.0, 5.0, 4.0, 3.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.75, -9.44775390625, -9.1455078125, -8.84326171875, -8.541015625, -8.23876953125, -7.9365234375, -7.63427734375, -7.33203125, -7.02978515625, -6.7275390625, -6.42529296875, -6.123046875, -5.82080078125, -5.5185546875, -5.21630859375, -4.9140625, -4.61181640625, -4.3095703125, -4.00732421875, -3.705078125, -3.40283203125, -3.1005859375, -2.79833984375, -2.49609375, -2.19384765625, -1.8916015625, -1.58935546875, -1.287109375, -0.98486328125, -0.6826171875, -0.38037109375, -0.078125, 0.22412109375, 0.5263671875, 0.82861328125, 1.130859375, 1.43310546875, 1.7353515625, 2.03759765625, 2.33984375, 2.64208984375, 2.9443359375, 3.24658203125, 3.548828125, 3.85107421875, 4.1533203125, 4.45556640625, 4.7578125, 5.06005859375, 5.3623046875, 5.66455078125, 5.966796875, 6.26904296875, 6.5712890625, 6.87353515625, 7.17578125, 7.47802734375, 7.7802734375, 8.08251953125, 8.384765625, 8.68701171875, 8.9892578125, 9.29150390625, 9.59375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 8.0, 3.0, 10.0, 22.0, 34.0, 46.0, 68.0, 114.0, 170.0, 274.0, 416.0, 602.0, 922.0, 1453.0, 2108.0, 3182.0, 4942.0, 7454.0, 10959.0, 16346.0, 23551.0, 32927.0, 45216.0, 59732.0, 74420.0, 87744.0, 98385.0, 101208.0, 98170.0, 88616.0, 75389.0, 60619.0, 45875.0, 33772.0, 23680.0, 16595.0, 11211.0, 7579.0, 5146.0, 3245.0, 2138.0, 1438.0, 948.0, 650.0, 394.0, 285.0, 190.0, 117.0, 71.0, 51.0, 30.0, 18.0, 7.0, 10.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-5.8046875, -5.626220703125, -5.44775390625, -5.269287109375, -5.0908203125, -4.912353515625, -4.73388671875, -4.555419921875, -4.376953125, -4.198486328125, -4.02001953125, -3.841552734375, -3.6630859375, -3.484619140625, -3.30615234375, -3.127685546875, -2.94921875, -2.770751953125, -2.59228515625, -2.413818359375, -2.2353515625, -2.056884765625, -1.87841796875, -1.699951171875, -1.521484375, -1.343017578125, -1.16455078125, -0.986083984375, -0.8076171875, -0.629150390625, -0.45068359375, -0.272216796875, -0.09375, 0.084716796875, 0.26318359375, 0.441650390625, 0.6201171875, 0.798583984375, 0.97705078125, 1.155517578125, 1.333984375, 1.512451171875, 1.69091796875, 1.869384765625, 2.0478515625, 2.226318359375, 2.40478515625, 2.583251953125, 2.76171875, 2.940185546875, 3.11865234375, 3.297119140625, 3.4755859375, 3.654052734375, 3.83251953125, 4.010986328125, 4.189453125, 4.367919921875, 4.54638671875, 4.724853515625, 4.9033203125, 5.081787109375, 5.26025390625, 5.438720703125, 5.6171875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 0.0, 7.0, 16.0, 10.0, 14.0, 19.0, 15.0, 21.0, 21.0, 26.0, 25.0, 32.0, 31.0, 38.0, 41.0, 32.0, 37.0, 41.0, 49.0, 42.0, 40.0, 50.0, 39.0, 37.0, 26.0, 33.0, 34.0, 28.0, 30.0, 23.0, 20.0, 17.0, 20.0, 8.0, 9.0, 13.0, 12.0, 6.0, 10.0, 4.0, 8.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.375, -6.16436767578125, -5.9537353515625, -5.74310302734375, -5.532470703125, -5.32183837890625, -5.1112060546875, -4.90057373046875, -4.68994140625, -4.47930908203125, -4.2686767578125, -4.05804443359375, -3.847412109375, -3.63677978515625, -3.4261474609375, -3.21551513671875, -3.0048828125, -2.79425048828125, -2.5836181640625, -2.37298583984375, -2.162353515625, -1.95172119140625, -1.7410888671875, -1.53045654296875, -1.31982421875, -1.10919189453125, -0.8985595703125, -0.68792724609375, -0.477294921875, -0.26666259765625, -0.0560302734375, 0.15460205078125, 0.365234375, 0.57586669921875, 0.7864990234375, 0.99713134765625, 1.207763671875, 1.41839599609375, 1.6290283203125, 1.83966064453125, 2.05029296875, 2.26092529296875, 2.4715576171875, 2.68218994140625, 2.892822265625, 3.10345458984375, 3.3140869140625, 3.52471923828125, 3.7353515625, 3.94598388671875, 4.1566162109375, 4.36724853515625, 4.577880859375, 4.78851318359375, 4.9991455078125, 5.20977783203125, 5.42041015625, 5.63104248046875, 5.8416748046875, 6.05230712890625, 6.262939453125, 6.47357177734375, 6.6842041015625, 6.89483642578125, 7.10546875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 8.0, 9.0, 14.0, 13.0, 25.0, 39.0, 73.0, 99.0, 121.0, 186.0, 345.0, 519.0, 808.0, 1320.0, 2081.0, 3531.0, 5757.0, 9687.0, 15496.0, 24814.0, 38478.0, 57093.0, 79698.0, 103522.0, 121976.0, 128061.0, 120719.0, 101312.0, 78287.0, 54870.0, 37247.0, 23872.0, 14931.0, 9247.0, 5446.0, 3300.0, 2045.0, 1241.0, 782.0, 489.0, 346.0, 222.0, 165.0, 90.0, 51.0, 40.0, 31.0, 19.0, 16.0, 10.0, 7.0, 1.0, 2.0, 5.0, 2.0], "bins": [-2.546875, -2.47296142578125, -2.3990478515625, -2.32513427734375, -2.251220703125, -2.17730712890625, -2.1033935546875, -2.02947998046875, -1.95556640625, -1.88165283203125, -1.8077392578125, -1.73382568359375, -1.659912109375, -1.58599853515625, -1.5120849609375, -1.43817138671875, -1.3642578125, -1.29034423828125, -1.2164306640625, -1.14251708984375, -1.068603515625, -0.99468994140625, -0.9207763671875, -0.84686279296875, -0.77294921875, -0.69903564453125, -0.6251220703125, -0.55120849609375, -0.477294921875, -0.40338134765625, -0.3294677734375, -0.25555419921875, -0.181640625, -0.10772705078125, -0.0338134765625, 0.04010009765625, 0.114013671875, 0.18792724609375, 0.2618408203125, 0.33575439453125, 0.40966796875, 0.48358154296875, 0.5574951171875, 0.63140869140625, 0.705322265625, 0.77923583984375, 0.8531494140625, 0.92706298828125, 1.0009765625, 1.07489013671875, 1.1488037109375, 1.22271728515625, 1.296630859375, 1.37054443359375, 1.4444580078125, 1.51837158203125, 1.59228515625, 1.66619873046875, 1.7401123046875, 1.81402587890625, 1.887939453125, 1.96185302734375, 2.0357666015625, 2.10968017578125, 2.18359375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 4.0, 7.0, 9.0, 10.0, 7.0, 9.0, 14.0, 27.0, 22.0, 21.0, 24.0, 47.0, 38.0, 45.0, 64.0, 51.0, 57.0, 54.0, 50.0, 53.0, 51.0, 59.0, 30.0, 39.0, 30.0, 28.0, 18.0, 21.0, 24.0, 18.0, 17.0, 14.0, 9.0, 9.0, 3.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00030159950256347656, -0.00029271095991134644, -0.0002838224172592163, -0.0002749338746070862, -0.00026604533195495605, -0.00025715678930282593, -0.0002482682466506958, -0.00023937970399856567, -0.00023049116134643555, -0.00022160261869430542, -0.0002127140760421753, -0.00020382553339004517, -0.00019493699073791504, -0.0001860484480857849, -0.00017715990543365479, -0.00016827136278152466, -0.00015938282012939453, -0.0001504942774772644, -0.00014160573482513428, -0.00013271719217300415, -0.00012382864952087402, -0.0001149401068687439, -0.00010605156421661377, -9.716302156448364e-05, -8.827447891235352e-05, -7.938593626022339e-05, -7.049739360809326e-05, -6.160885095596313e-05, -5.272030830383301e-05, -4.383176565170288e-05, -3.4943222999572754e-05, -2.6054680347442627e-05, -1.71661376953125e-05, -8.277595043182373e-06, 6.109476089477539e-07, 9.499490261077881e-06, 1.8388032913208008e-05, 2.7276575565338135e-05, 3.616511821746826e-05, 4.505366086959839e-05, 5.3942203521728516e-05, 6.283074617385864e-05, 7.171928882598877e-05, 8.06078314781189e-05, 8.949637413024902e-05, 9.838491678237915e-05, 0.00010727345943450928, 0.0001161620020866394, 0.00012505054473876953, 0.00013393908739089966, 0.00014282763004302979, 0.0001517161726951599, 0.00016060471534729004, 0.00016949325799942017, 0.0001783818006515503, 0.00018727034330368042, 0.00019615888595581055, 0.00020504742860794067, 0.0002139359712600708, 0.00022282451391220093, 0.00023171305656433105, 0.00024060159921646118, 0.0002494901418685913, 0.00025837868452072144, 0.00026726722717285156]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 3.0, 8.0, 11.0, 14.0, 26.0, 25.0, 60.0, 68.0, 109.0, 143.0, 218.0, 302.0, 449.0, 648.0, 989.0, 1482.0, 2335.0, 3460.0, 5531.0, 8618.0, 12960.0, 19881.0, 29108.0, 42261.0, 57832.0, 77158.0, 94121.0, 108669.0, 113226.0, 108381.0, 95345.0, 76957.0, 58739.0, 42478.0, 29465.0, 19829.0, 12930.0, 8465.0, 5583.0, 3635.0, 2325.0, 1574.0, 1041.0, 680.0, 427.0, 297.0, 204.0, 155.0, 129.0, 73.0, 45.0, 42.0, 22.0, 9.0, 4.0, 4.0, 6.0, 4.0, 3.0, 1.0], "bins": [-2.306640625, -2.235687255859375, -2.16473388671875, -2.093780517578125, -2.0228271484375, -1.951873779296875, -1.88092041015625, -1.809967041015625, -1.739013671875, -1.668060302734375, -1.59710693359375, -1.526153564453125, -1.4552001953125, -1.384246826171875, -1.31329345703125, -1.242340087890625, -1.17138671875, -1.100433349609375, -1.02947998046875, -0.958526611328125, -0.8875732421875, -0.816619873046875, -0.74566650390625, -0.674713134765625, -0.603759765625, -0.532806396484375, -0.46185302734375, -0.390899658203125, -0.3199462890625, -0.248992919921875, -0.17803955078125, -0.107086181640625, -0.0361328125, 0.034820556640625, 0.10577392578125, 0.176727294921875, 0.2476806640625, 0.318634033203125, 0.38958740234375, 0.460540771484375, 0.531494140625, 0.602447509765625, 0.67340087890625, 0.744354248046875, 0.8153076171875, 0.886260986328125, 0.95721435546875, 1.028167724609375, 1.09912109375, 1.170074462890625, 1.24102783203125, 1.311981201171875, 1.3829345703125, 1.453887939453125, 1.52484130859375, 1.595794677734375, 1.666748046875, 1.737701416015625, 1.80865478515625, 1.879608154296875, 1.9505615234375, 2.021514892578125, 2.09246826171875, 2.163421630859375, 2.234375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 6.0, 2.0, 4.0, 5.0, 5.0, 8.0, 14.0, 9.0, 17.0, 12.0, 23.0, 21.0, 34.0, 29.0, 32.0, 43.0, 46.0, 42.0, 43.0, 43.0, 67.0, 59.0, 55.0, 50.0, 47.0, 56.0, 37.0, 27.0, 16.0, 31.0, 25.0, 20.0, 14.0, 12.0, 10.0, 8.0, 7.0, 6.0, 7.0, 6.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1328125, -1.097747802734375, -1.06268310546875, -1.027618408203125, -0.9925537109375, -0.957489013671875, -0.92242431640625, -0.887359619140625, -0.852294921875, -0.817230224609375, -0.78216552734375, -0.747100830078125, -0.7120361328125, -0.676971435546875, -0.64190673828125, -0.606842041015625, -0.57177734375, -0.536712646484375, -0.50164794921875, -0.466583251953125, -0.4315185546875, -0.396453857421875, -0.36138916015625, -0.326324462890625, -0.291259765625, -0.256195068359375, -0.22113037109375, -0.186065673828125, -0.1510009765625, -0.115936279296875, -0.08087158203125, -0.045806884765625, -0.0107421875, 0.024322509765625, 0.05938720703125, 0.094451904296875, 0.1295166015625, 0.164581298828125, 0.19964599609375, 0.234710693359375, 0.269775390625, 0.304840087890625, 0.33990478515625, 0.374969482421875, 0.4100341796875, 0.445098876953125, 0.48016357421875, 0.515228271484375, 0.55029296875, 0.585357666015625, 0.62042236328125, 0.655487060546875, 0.6905517578125, 0.725616455078125, 0.76068115234375, 0.795745849609375, 0.830810546875, 0.865875244140625, 0.90093994140625, 0.936004638671875, 0.9710693359375, 1.006134033203125, 1.04119873046875, 1.076263427734375, 1.111328125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 5.0, 10.0, 7.0, 7.0, 10.0, 8.0, 12.0, 23.0, 21.0, 13.0, 15.0, 26.0, 34.0, 41.0, 35.0, 44.0, 45.0, 51.0, 40.0, 48.0, 52.0, 44.0, 58.0, 52.0, 27.0, 42.0, 42.0, 27.0, 29.0, 18.0, 21.0, 20.0, 15.0, 11.0, 7.0, 9.0, 7.0, 9.0, 5.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.097945213317871, -9.78134536743164, -9.464744567871094, -9.148144721984863, -8.831544876098633, -8.514944076538086, -8.198344230651855, -7.881744384765625, -7.565144062042236, -7.248543739318848, -6.931943893432617, -6.6153435707092285, -6.29874324798584, -5.982143402099609, -5.665543079376221, -5.348942756652832, -5.032342910766602, -4.715742588043213, -4.399142742156982, -4.082542419433594, -3.765942335128784, -3.4493422508239746, -3.132741928100586, -2.8161418437957764, -2.499541759490967, -2.1829416751861572, -1.866341471672058, -1.549741268157959, -1.2331411838531494, -0.9165410995483398, -0.5999408960342407, -0.2833406925201416, 0.03325939178466797, 0.3498595356941223, 0.6664596796035767, 0.983059823513031, 1.2996599674224854, 1.616260051727295, 1.932860255241394, 2.249460458755493, 2.5660605430603027, 2.8826606273651123, 3.199260711669922, 3.5158610343933105, 3.83246111869812, 4.14906120300293, 4.465661525726318, 4.782261848449707, 5.0988616943359375, 5.415462017059326, 5.732061862945557, 6.048662185668945, 6.365262031555176, 6.6818623542785645, 6.998462677001953, 7.315062522888184, 7.631662845611572, 7.948263168334961, 8.264863014221191, 8.581462860107422, 8.898063659667969, 9.2146635055542, 9.53126335144043, 9.847864151000977, 10.164463996887207]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 1.0, 3.0, 2.0, 4.0, 2.0, 11.0, 7.0, 4.0, 5.0, 7.0, 11.0, 14.0, 12.0, 11.0, 14.0, 22.0, 16.0, 23.0, 25.0, 24.0, 30.0, 26.0, 36.0, 36.0, 39.0, 27.0, 29.0, 46.0, 41.0, 47.0, 30.0, 30.0, 30.0, 36.0, 38.0, 25.0, 28.0, 19.0, 23.0, 24.0, 22.0, 16.0, 15.0, 15.0, 12.0, 10.0, 9.0, 11.0, 9.0, 6.0, 5.0, 9.0, 7.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-9.459339141845703, -9.157861709594727, -8.856383323669434, -8.55490493774414, -8.253427505493164, -7.951949596405029, -7.6504716873168945, -7.34899377822876, -7.047515869140625, -6.74603796005249, -6.4445600509643555, -6.143082141876221, -5.841604232788086, -5.540126323699951, -5.238648414611816, -4.937170505523682, -4.635692596435547, -4.334214687347412, -4.032736778259277, -3.7312588691711426, -3.429780960083008, -3.128303050994873, -2.8268251419067383, -2.5253472328186035, -2.2238693237304688, -1.922391414642334, -1.6209135055541992, -1.3194355964660645, -1.0179576873779297, -0.7164797782897949, -0.41500186920166016, -0.11352396011352539, 0.18795394897460938, 0.48943185806274414, 0.7909097671508789, 1.0923876762390137, 1.3938655853271484, 1.6953434944152832, 1.996821403503418, 2.2982993125915527, 2.5997772216796875, 2.9012551307678223, 3.202733039855957, 3.504210948944092, 3.8056888580322266, 4.107166767120361, 4.408644676208496, 4.710122585296631, 5.011600494384766, 5.3130784034729, 5.614556312561035, 5.91603422164917, 6.217512130737305, 6.5189900398254395, 6.820467948913574, 7.121945858001709, 7.423423767089844, 7.7249016761779785, 8.026379585266113, 8.327857971191406, 8.629335403442383, 8.93081283569336, 9.232291221618652, 9.533769607543945, 9.835247039794922]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 9.0, 10.0, 23.0, 33.0, 53.0, 95.0, 148.0, 201.0, 373.0, 586.0, 956.0, 1609.0, 2895.0, 5021.0, 9150.0, 16666.0, 30948.0, 58223.0, 112527.0, 216732.0, 399186.0, 638218.0, 800260.0, 743718.0, 520005.0, 299698.0, 158236.0, 82136.0, 43412.0, 23214.0, 12920.0, 7040.0, 4013.0, 2317.0, 1455.0, 776.0, 519.0, 285.0, 189.0, 129.0, 100.0, 56.0, 44.0, 27.0, 18.0, 15.0, 13.0, 10.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-10.0, -9.6749267578125, -9.349853515625, -9.0247802734375, -8.69970703125, -8.3746337890625, -8.049560546875, -7.7244873046875, -7.3994140625, -7.0743408203125, -6.749267578125, -6.4241943359375, -6.09912109375, -5.7740478515625, -5.448974609375, -5.1239013671875, -4.798828125, -4.4737548828125, -4.148681640625, -3.8236083984375, -3.49853515625, -3.1734619140625, -2.848388671875, -2.5233154296875, -2.1982421875, -1.8731689453125, -1.548095703125, -1.2230224609375, -0.89794921875, -0.5728759765625, -0.247802734375, 0.0772705078125, 0.40234375, 0.7274169921875, 1.052490234375, 1.3775634765625, 1.70263671875, 2.0277099609375, 2.352783203125, 2.6778564453125, 3.0029296875, 3.3280029296875, 3.653076171875, 3.9781494140625, 4.30322265625, 4.6282958984375, 4.953369140625, 5.2784423828125, 5.603515625, 5.9285888671875, 6.253662109375, 6.5787353515625, 6.90380859375, 7.2288818359375, 7.553955078125, 7.8790283203125, 8.2041015625, 8.5291748046875, 8.854248046875, 9.1793212890625, 9.50439453125, 9.8294677734375, 10.154541015625, 10.4796142578125, 10.8046875]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 6.0, 2.0, 3.0, 4.0, 3.0, 4.0, 4.0, 7.0, 12.0, 11.0, 14.0, 10.0, 17.0, 22.0, 18.0, 13.0, 24.0, 20.0, 33.0, 32.0, 30.0, 29.0, 37.0, 39.0, 35.0, 38.0, 40.0, 37.0, 38.0, 30.0, 45.0, 35.0, 22.0, 38.0, 17.0, 25.0, 28.0, 22.0, 23.0, 23.0, 14.0, 14.0, 14.0, 17.0, 9.0, 15.0, 7.0, 5.0, 8.0, 9.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.7890625, -8.50830078125, -8.2275390625, -7.94677734375, -7.666015625, -7.38525390625, -7.1044921875, -6.82373046875, -6.54296875, -6.26220703125, -5.9814453125, -5.70068359375, -5.419921875, -5.13916015625, -4.8583984375, -4.57763671875, -4.296875, -4.01611328125, -3.7353515625, -3.45458984375, -3.173828125, -2.89306640625, -2.6123046875, -2.33154296875, -2.05078125, -1.77001953125, -1.4892578125, -1.20849609375, -0.927734375, -0.64697265625, -0.3662109375, -0.08544921875, 0.1953125, 0.47607421875, 0.7568359375, 1.03759765625, 1.318359375, 1.59912109375, 1.8798828125, 2.16064453125, 2.44140625, 2.72216796875, 3.0029296875, 3.28369140625, 3.564453125, 3.84521484375, 4.1259765625, 4.40673828125, 4.6875, 4.96826171875, 5.2490234375, 5.52978515625, 5.810546875, 6.09130859375, 6.3720703125, 6.65283203125, 6.93359375, 7.21435546875, 7.4951171875, 7.77587890625, 8.056640625, 8.33740234375, 8.6181640625, 8.89892578125, 9.1796875]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 6.0, 7.0, 26.0, 35.0, 59.0, 73.0, 126.0, 205.0, 366.0, 520.0, 834.0, 1394.0, 2209.0, 3813.0, 6293.0, 10493.0, 18015.0, 30637.0, 52541.0, 87689.0, 148289.0, 242053.0, 373830.0, 522583.0, 626910.0, 620579.0, 507275.0, 360257.0, 230875.0, 141171.0, 84237.0, 49474.0, 28914.0, 17082.0, 10291.0, 6009.0, 3482.0, 2142.0, 1318.0, 821.0, 483.0, 301.0, 204.0, 122.0, 92.0, 51.0, 42.0, 17.0, 12.0, 10.0, 4.0, 8.0, 8.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.84375, -8.52734375, -8.2109375, -7.89453125, -7.578125, -7.26171875, -6.9453125, -6.62890625, -6.3125, -5.99609375, -5.6796875, -5.36328125, -5.046875, -4.73046875, -4.4140625, -4.09765625, -3.78125, -3.46484375, -3.1484375, -2.83203125, -2.515625, -2.19921875, -1.8828125, -1.56640625, -1.25, -0.93359375, -0.6171875, -0.30078125, 0.015625, 0.33203125, 0.6484375, 0.96484375, 1.28125, 1.59765625, 1.9140625, 2.23046875, 2.546875, 2.86328125, 3.1796875, 3.49609375, 3.8125, 4.12890625, 4.4453125, 4.76171875, 5.078125, 5.39453125, 5.7109375, 6.02734375, 6.34375, 6.66015625, 6.9765625, 7.29296875, 7.609375, 7.92578125, 8.2421875, 8.55859375, 8.875, 9.19140625, 9.5078125, 9.82421875, 10.140625, 10.45703125, 10.7734375, 11.08984375, 11.40625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 6.0, 1.0, 5.0, 3.0, 3.0, 9.0, 9.0, 10.0, 10.0, 17.0, 18.0, 33.0, 44.0, 46.0, 67.0, 76.0, 84.0, 106.0, 141.0, 147.0, 170.0, 173.0, 209.0, 234.0, 216.0, 265.0, 235.0, 218.0, 204.0, 187.0, 187.0, 158.0, 146.0, 120.0, 120.0, 98.0, 72.0, 56.0, 39.0, 28.0, 31.0, 18.0, 25.0, 14.0, 7.0, 5.0, 6.0, 7.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2265625, -4.0849609375, -3.943359375, -3.8017578125, -3.66015625, -3.5185546875, -3.376953125, -3.2353515625, -3.09375, -2.9521484375, -2.810546875, -2.6689453125, -2.52734375, -2.3857421875, -2.244140625, -2.1025390625, -1.9609375, -1.8193359375, -1.677734375, -1.5361328125, -1.39453125, -1.2529296875, -1.111328125, -0.9697265625, -0.828125, -0.6865234375, -0.544921875, -0.4033203125, -0.26171875, -0.1201171875, 0.021484375, 0.1630859375, 0.3046875, 0.4462890625, 0.587890625, 0.7294921875, 0.87109375, 1.0126953125, 1.154296875, 1.2958984375, 1.4375, 1.5791015625, 1.720703125, 1.8623046875, 2.00390625, 2.1455078125, 2.287109375, 2.4287109375, 2.5703125, 2.7119140625, 2.853515625, 2.9951171875, 3.13671875, 3.2783203125, 3.419921875, 3.5615234375, 3.703125, 3.8447265625, 3.986328125, 4.1279296875, 4.26953125, 4.4111328125, 4.552734375, 4.6943359375, 4.8359375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 6.0, 9.0, 5.0, 14.0, 17.0, 15.0, 15.0, 27.0, 24.0, 28.0, 33.0, 36.0, 46.0, 50.0, 57.0, 55.0, 52.0, 50.0, 63.0, 51.0, 47.0, 49.0, 44.0, 37.0, 34.0, 27.0, 23.0, 19.0, 16.0, 20.0, 6.0, 10.0, 3.0, 4.0, 6.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.596428871154785, -12.192436218261719, -11.788442611694336, -11.38444995880127, -10.980457305908203, -10.57646369934082, -10.172471046447754, -9.768478393554688, -9.364484786987305, -8.960492134094238, -8.556498527526855, -8.152505874633789, -7.748513221740723, -7.344520092010498, -6.940526962280273, -6.536534309387207, -6.132541656494141, -5.728548526763916, -5.32455587387085, -4.920562744140625, -4.516570091247559, -4.112576961517334, -3.7085838317871094, -3.304590940475464, -2.9005980491638184, -2.496605157852173, -2.0926122665405273, -1.6886191368103027, -1.2846262454986572, -0.8806333541870117, -0.4766402244567871, -0.0726473331451416, 0.3313446044921875, 0.7353375554084778, 1.139330506324768, 1.5433235168457031, 1.9473164081573486, 2.351309299468994, 2.7553024291992188, 3.1592953205108643, 3.5632882118225098, 3.9672811031341553, 4.371273994445801, 4.775267124176025, 5.17926025390625, 5.583252906799316, 5.987246036529541, 6.391239166259766, 6.795231819152832, 7.199224948883057, 7.603217601776123, 8.007210731506348, 8.411203384399414, 8.815196990966797, 9.219189643859863, 9.62318229675293, 10.027175903320312, 10.431168556213379, 10.835162162780762, 11.239154815673828, 11.643147468566895, 12.047140121459961, 12.451133728027344, 12.85512638092041, 13.259119033813477]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 2.0, 5.0, 2.0, 4.0, 9.0, 7.0, 11.0, 13.0, 21.0, 18.0, 11.0, 12.0, 30.0, 25.0, 21.0, 21.0, 34.0, 39.0, 33.0, 35.0, 35.0, 39.0, 46.0, 43.0, 32.0, 34.0, 38.0, 26.0, 30.0, 45.0, 31.0, 35.0, 30.0, 24.0, 14.0, 21.0, 19.0, 17.0, 9.0, 11.0, 14.0, 13.0, 7.0, 14.0, 4.0, 10.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-11.058971405029297, -10.731158256530762, -10.403345108032227, -10.075531005859375, -9.74771785736084, -9.419904708862305, -9.092090606689453, -8.764277458190918, -8.436464309692383, -8.108651161193848, -7.780837535858154, -7.453023910522461, -7.125210762023926, -6.797397613525391, -6.469583988189697, -6.141770362854004, -5.813957214355469, -5.486144065856934, -5.15833044052124, -4.830516815185547, -4.502703666687012, -4.174890518188477, -3.847076892852783, -3.519263505935669, -3.1914501190185547, -2.8636367321014404, -2.535823345184326, -2.208009958267212, -1.8801965713500977, -1.5523831844329834, -1.2245697975158691, -0.8967564105987549, -0.5689420700073242, -0.24112868309020996, 0.0866847038269043, 0.41449809074401855, 0.7423114776611328, 1.070124864578247, 1.3979382514953613, 1.7257516384124756, 2.05356502532959, 2.381378412246704, 2.7091917991638184, 3.0370051860809326, 3.364818572998047, 3.692631959915161, 4.020445346832275, 4.348258972167969, 4.676072120666504, 5.003885269165039, 5.331698894500732, 5.659512519836426, 5.987325668334961, 6.315138816833496, 6.6429524421691895, 6.970766067504883, 7.298579216003418, 7.626392364501953, 7.9542059898376465, 8.28201961517334, 8.609832763671875, 8.93764591217041, 9.265459060668945, 9.593273162841797, 9.921086311340332]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 13.0, 21.0, 22.0, 27.0, 42.0, 59.0, 106.0, 147.0, 257.0, 434.0, 698.0, 1203.0, 1903.0, 3145.0, 5498.0, 9132.0, 14316.0, 23885.0, 37343.0, 57422.0, 81856.0, 108266.0, 129917.0, 136711.0, 124847.0, 101092.0, 73738.0, 51009.0, 32940.0, 20476.0, 12683.0, 7638.0, 4543.0, 2872.0, 1594.0, 974.0, 634.0, 395.0, 259.0, 153.0, 86.0, 67.0, 47.0, 23.0, 22.0, 14.0, 11.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.3984375, -5.2315673828125, -5.064697265625, -4.8978271484375, -4.73095703125, -4.5640869140625, -4.397216796875, -4.2303466796875, -4.0634765625, -3.8966064453125, -3.729736328125, -3.5628662109375, -3.39599609375, -3.2291259765625, -3.062255859375, -2.8953857421875, -2.728515625, -2.5616455078125, -2.394775390625, -2.2279052734375, -2.06103515625, -1.8941650390625, -1.727294921875, -1.5604248046875, -1.3935546875, -1.2266845703125, -1.059814453125, -0.8929443359375, -0.72607421875, -0.5592041015625, -0.392333984375, -0.2254638671875, -0.05859375, 0.1082763671875, 0.275146484375, 0.4420166015625, 0.60888671875, 0.7757568359375, 0.942626953125, 1.1094970703125, 1.2763671875, 1.4432373046875, 1.610107421875, 1.7769775390625, 1.94384765625, 2.1107177734375, 2.277587890625, 2.4444580078125, 2.611328125, 2.7781982421875, 2.945068359375, 3.1119384765625, 3.27880859375, 3.4456787109375, 3.612548828125, 3.7794189453125, 3.9462890625, 4.1131591796875, 4.280029296875, 4.4468994140625, 4.61376953125, 4.7806396484375, 4.947509765625, 5.1143798828125, 5.28125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 3.0, 8.0, 6.0, 13.0, 10.0, 16.0, 16.0, 15.0, 23.0, 26.0, 25.0, 37.0, 32.0, 46.0, 40.0, 34.0, 39.0, 34.0, 43.0, 40.0, 49.0, 43.0, 45.0, 41.0, 33.0, 41.0, 29.0, 31.0, 23.0, 23.0, 15.0, 28.0, 14.0, 10.0, 16.0, 15.0, 8.0, 8.0, 4.0, 7.0, 6.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.078125, -11.695068359375, -11.31201171875, -10.928955078125, -10.5458984375, -10.162841796875, -9.77978515625, -9.396728515625, -9.013671875, -8.630615234375, -8.24755859375, -7.864501953125, -7.4814453125, -7.098388671875, -6.71533203125, -6.332275390625, -5.94921875, -5.566162109375, -5.18310546875, -4.800048828125, -4.4169921875, -4.033935546875, -3.65087890625, -3.267822265625, -2.884765625, -2.501708984375, -2.11865234375, -1.735595703125, -1.3525390625, -0.969482421875, -0.58642578125, -0.203369140625, 0.1796875, 0.562744140625, 0.94580078125, 1.328857421875, 1.7119140625, 2.094970703125, 2.47802734375, 2.861083984375, 3.244140625, 3.627197265625, 4.01025390625, 4.393310546875, 4.7763671875, 5.159423828125, 5.54248046875, 5.925537109375, 6.30859375, 6.691650390625, 7.07470703125, 7.457763671875, 7.8408203125, 8.223876953125, 8.60693359375, 8.989990234375, 9.373046875, 9.756103515625, 10.13916015625, 10.522216796875, 10.9052734375, 11.288330078125, 11.67138671875, 12.054443359375, 12.4375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 4.0, 8.0, 14.0, 31.0, 35.0, 52.0, 94.0, 108.0, 190.0, 303.0, 464.0, 752.0, 1192.0, 1916.0, 3306.0, 5175.0, 9057.0, 15841.0, 27058.0, 46071.0, 76292.0, 117369.0, 157790.0, 172169.0, 147124.0, 104154.0, 66525.0, 39229.0, 23135.0, 13513.0, 7813.0, 4528.0, 2766.0, 1654.0, 1025.0, 626.0, 420.0, 284.0, 183.0, 77.0, 72.0, 48.0, 30.0, 22.0, 14.0, 11.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.875, -7.623779296875, -7.37255859375, -7.121337890625, -6.8701171875, -6.618896484375, -6.36767578125, -6.116455078125, -5.865234375, -5.614013671875, -5.36279296875, -5.111572265625, -4.8603515625, -4.609130859375, -4.35791015625, -4.106689453125, -3.85546875, -3.604248046875, -3.35302734375, -3.101806640625, -2.8505859375, -2.599365234375, -2.34814453125, -2.096923828125, -1.845703125, -1.594482421875, -1.34326171875, -1.092041015625, -0.8408203125, -0.589599609375, -0.33837890625, -0.087158203125, 0.1640625, 0.415283203125, 0.66650390625, 0.917724609375, 1.1689453125, 1.420166015625, 1.67138671875, 1.922607421875, 2.173828125, 2.425048828125, 2.67626953125, 2.927490234375, 3.1787109375, 3.429931640625, 3.68115234375, 3.932373046875, 4.18359375, 4.434814453125, 4.68603515625, 4.937255859375, 5.1884765625, 5.439697265625, 5.69091796875, 5.942138671875, 6.193359375, 6.444580078125, 6.69580078125, 6.947021484375, 7.1982421875, 7.449462890625, 7.70068359375, 7.951904296875, 8.203125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 8.0, 4.0, 13.0, 9.0, 13.0, 11.0, 14.0, 12.0, 23.0, 18.0, 31.0, 33.0, 33.0, 31.0, 30.0, 35.0, 38.0, 38.0, 34.0, 39.0, 41.0, 43.0, 45.0, 33.0, 43.0, 40.0, 35.0, 31.0, 32.0, 30.0, 20.0, 29.0, 16.0, 17.0, 14.0, 22.0, 12.0, 11.0, 5.0, 5.0, 6.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.0546875, -6.8232421875, -6.591796875, -6.3603515625, -6.12890625, -5.8974609375, -5.666015625, -5.4345703125, -5.203125, -4.9716796875, -4.740234375, -4.5087890625, -4.27734375, -4.0458984375, -3.814453125, -3.5830078125, -3.3515625, -3.1201171875, -2.888671875, -2.6572265625, -2.42578125, -2.1943359375, -1.962890625, -1.7314453125, -1.5, -1.2685546875, -1.037109375, -0.8056640625, -0.57421875, -0.3427734375, -0.111328125, 0.1201171875, 0.3515625, 0.5830078125, 0.814453125, 1.0458984375, 1.27734375, 1.5087890625, 1.740234375, 1.9716796875, 2.203125, 2.4345703125, 2.666015625, 2.8974609375, 3.12890625, 3.3603515625, 3.591796875, 3.8232421875, 4.0546875, 4.2861328125, 4.517578125, 4.7490234375, 4.98046875, 5.2119140625, 5.443359375, 5.6748046875, 5.90625, 6.1376953125, 6.369140625, 6.6005859375, 6.83203125, 7.0634765625, 7.294921875, 7.5263671875, 7.7578125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 7.0, 6.0, 10.0, 16.0, 23.0, 39.0, 62.0, 89.0, 149.0, 212.0, 289.0, 511.0, 811.0, 1327.0, 2071.0, 3560.0, 5794.0, 9487.0, 15890.0, 26519.0, 43767.0, 71113.0, 108152.0, 147519.0, 166156.0, 148737.0, 109774.0, 72256.0, 45639.0, 27237.0, 16322.0, 9807.0, 5846.0, 3522.0, 2145.0, 1370.0, 832.0, 501.0, 356.0, 196.0, 148.0, 102.0, 63.0, 42.0, 39.0, 18.0, 17.0, 6.0, 8.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.28515625, -3.18414306640625, -3.0831298828125, -2.98211669921875, -2.881103515625, -2.78009033203125, -2.6790771484375, -2.57806396484375, -2.47705078125, -2.37603759765625, -2.2750244140625, -2.17401123046875, -2.072998046875, -1.97198486328125, -1.8709716796875, -1.76995849609375, -1.6689453125, -1.56793212890625, -1.4669189453125, -1.36590576171875, -1.264892578125, -1.16387939453125, -1.0628662109375, -0.96185302734375, -0.86083984375, -0.75982666015625, -0.6588134765625, -0.55780029296875, -0.456787109375, -0.35577392578125, -0.2547607421875, -0.15374755859375, -0.052734375, 0.04827880859375, 0.1492919921875, 0.25030517578125, 0.351318359375, 0.45233154296875, 0.5533447265625, 0.65435791015625, 0.75537109375, 0.85638427734375, 0.9573974609375, 1.05841064453125, 1.159423828125, 1.26043701171875, 1.3614501953125, 1.46246337890625, 1.5634765625, 1.66448974609375, 1.7655029296875, 1.86651611328125, 1.967529296875, 2.06854248046875, 2.1695556640625, 2.27056884765625, 2.37158203125, 2.47259521484375, 2.5736083984375, 2.67462158203125, 2.775634765625, 2.87664794921875, 2.9776611328125, 3.07867431640625, 3.1796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 2.0, 3.0, 5.0, 7.0, 6.0, 7.0, 11.0, 20.0, 11.0, 16.0, 16.0, 22.0, 27.0, 36.0, 31.0, 37.0, 30.0, 53.0, 42.0, 59.0, 42.0, 48.0, 49.0, 53.0, 45.0, 53.0, 44.0, 32.0, 23.0, 19.0, 27.0, 22.0, 19.0, 22.0, 8.0, 5.0, 11.0, 4.0, 5.0, 4.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.00015103816986083984, -0.00014622695744037628, -0.00014141574501991272, -0.00013660453259944916, -0.0001317933201789856, -0.00012698210775852203, -0.00012217089533805847, -0.00011735968291759491, -0.00011254847049713135, -0.00010773725807666779, -0.00010292604565620422, -9.811483323574066e-05, -9.33036208152771e-05, -8.849240839481354e-05, -8.368119597434998e-05, -7.886998355388641e-05, -7.405877113342285e-05, -6.924755871295929e-05, -6.443634629249573e-05, -5.9625133872032166e-05, -5.4813921451568604e-05, -5.000270903110504e-05, -4.519149661064148e-05, -4.038028419017792e-05, -3.5569071769714355e-05, -3.0757859349250793e-05, -2.594664692878723e-05, -2.113543450832367e-05, -1.6324222087860107e-05, -1.1513009667396545e-05, -6.701797246932983e-06, -1.8905848264694214e-06, 2.9206275939941406e-06, 7.731840014457703e-06, 1.2543052434921265e-05, 1.7354264855384827e-05, 2.216547727584839e-05, 2.697668969631195e-05, 3.178790211677551e-05, 3.6599114537239075e-05, 4.141032695770264e-05, 4.62215393781662e-05, 5.103275179862976e-05, 5.584396421909332e-05, 6.0655176639556885e-05, 6.546638906002045e-05, 7.027760148048401e-05, 7.508881390094757e-05, 7.990002632141113e-05, 8.47112387418747e-05, 8.952245116233826e-05, 9.433366358280182e-05, 9.914487600326538e-05, 0.00010395608842372894, 0.0001087673008441925, 0.00011357851326465607, 0.00011838972568511963, 0.0001232009381055832, 0.00012801215052604675, 0.00013282336294651031, 0.00013763457536697388, 0.00014244578778743744, 0.000147257000207901, 0.00015206821262836456, 0.00015687942504882812]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 6.0, 6.0, 16.0, 11.0, 29.0, 57.0, 55.0, 107.0, 182.0, 276.0, 445.0, 623.0, 1022.0, 1621.0, 2571.0, 4111.0, 6454.0, 10512.0, 16959.0, 26713.0, 42006.0, 63496.0, 91085.0, 118111.0, 136754.0, 136829.0, 119036.0, 91040.0, 64037.0, 42191.0, 27107.0, 16922.0, 10509.0, 6564.0, 4174.0, 2558.0, 1602.0, 1006.0, 639.0, 399.0, 262.0, 174.0, 119.0, 68.0, 39.0, 20.0, 18.0, 8.0, 11.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.087890625, -2.977630615234375, -2.86737060546875, -2.757110595703125, -2.6468505859375, -2.536590576171875, -2.42633056640625, -2.316070556640625, -2.205810546875, -2.095550537109375, -1.98529052734375, -1.875030517578125, -1.7647705078125, -1.654510498046875, -1.54425048828125, -1.433990478515625, -1.32373046875, -1.213470458984375, -1.10321044921875, -0.992950439453125, -0.8826904296875, -0.772430419921875, -0.66217041015625, -0.551910400390625, -0.441650390625, -0.331390380859375, -0.22113037109375, -0.110870361328125, -0.0006103515625, 0.109649658203125, 0.21990966796875, 0.330169677734375, 0.4404296875, 0.550689697265625, 0.66094970703125, 0.771209716796875, 0.8814697265625, 0.991729736328125, 1.10198974609375, 1.212249755859375, 1.322509765625, 1.432769775390625, 1.54302978515625, 1.653289794921875, 1.7635498046875, 1.873809814453125, 1.98406982421875, 2.094329833984375, 2.20458984375, 2.314849853515625, 2.42510986328125, 2.535369873046875, 2.6456298828125, 2.755889892578125, 2.86614990234375, 2.976409912109375, 3.086669921875, 3.196929931640625, 3.30718994140625, 3.417449951171875, 3.5277099609375, 3.637969970703125, 3.74822998046875, 3.858489990234375, 3.96875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 5.0, 0.0, 5.0, 5.0, 5.0, 11.0, 15.0, 14.0, 19.0, 17.0, 18.0, 33.0, 30.0, 26.0, 21.0, 32.0, 35.0, 50.0, 31.0, 50.0, 56.0, 44.0, 60.0, 44.0, 56.0, 37.0, 33.0, 40.0, 30.0, 29.0, 22.0, 18.0, 21.0, 15.0, 10.0, 15.0, 10.0, 10.0, 7.0, 3.0, 9.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.3681640625, -1.3250885009765625, -1.282012939453125, -1.2389373779296875, -1.19586181640625, -1.1527862548828125, -1.109710693359375, -1.0666351318359375, -1.0235595703125, -0.9804840087890625, -0.937408447265625, -0.8943328857421875, -0.85125732421875, -0.8081817626953125, -0.765106201171875, -0.7220306396484375, -0.678955078125, -0.6358795166015625, -0.592803955078125, -0.5497283935546875, -0.50665283203125, -0.4635772705078125, -0.420501708984375, -0.3774261474609375, -0.3343505859375, -0.2912750244140625, -0.248199462890625, -0.2051239013671875, -0.16204833984375, -0.1189727783203125, -0.075897216796875, -0.0328216552734375, 0.01025390625, 0.0533294677734375, 0.096405029296875, 0.1394805908203125, 0.18255615234375, 0.2256317138671875, 0.268707275390625, 0.3117828369140625, 0.3548583984375, 0.3979339599609375, 0.441009521484375, 0.4840850830078125, 0.52716064453125, 0.5702362060546875, 0.613311767578125, 0.6563873291015625, 0.699462890625, 0.7425384521484375, 0.785614013671875, 0.8286895751953125, 0.87176513671875, 0.9148406982421875, 0.957916259765625, 1.0009918212890625, 1.0440673828125, 1.0871429443359375, 1.130218505859375, 1.1732940673828125, 1.21636962890625, 1.2594451904296875, 1.302520751953125, 1.3455963134765625, 1.388671875]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 4.0, 9.0, 7.0, 6.0, 15.0, 21.0, 12.0, 26.0, 23.0, 31.0, 30.0, 39.0, 39.0, 48.0, 56.0, 67.0, 53.0, 59.0, 64.0, 50.0, 45.0, 55.0, 42.0, 39.0, 28.0, 36.0, 22.0, 17.0, 19.0, 10.0, 6.0, 5.0, 8.0, 3.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.86880111694336, -13.450138092041016, -13.031474113464355, -12.612811088562012, -12.194147109985352, -11.775484085083008, -11.356821060180664, -10.93815803527832, -10.51949405670166, -10.100831031799316, -9.682167053222656, -9.263504028320312, -8.844841003417969, -8.426177024841309, -8.007513999938965, -7.588850498199463, -7.170186996459961, -6.751523494720459, -6.332859992980957, -5.914196968078613, -5.495533466339111, -5.076869964599609, -4.658206939697266, -4.239543437957764, -3.8208799362182617, -3.4022164344787598, -2.983553171157837, -2.564889907836914, -2.146226406097412, -1.7275629043579102, -1.3088996410369873, -0.8902363777160645, -0.4715719223022461, -0.05290853977203369, 0.3657548427581787, 0.7844182252883911, 1.2030816078186035, 1.6217451095581055, 2.0404083728790283, 2.459071636199951, 2.877735137939453, 3.296398639678955, 3.715061902999878, 4.133725166320801, 4.552388668060303, 4.971052169799805, 5.389715194702148, 5.80837869644165, 6.227042198181152, 6.645705699920654, 7.064369201660156, 7.4830322265625, 7.901695728302002, 8.320359230041504, 8.739022254943848, 9.157686233520508, 9.576349258422852, 9.995012283325195, 10.413676261901855, 10.8323392868042, 11.25100326538086, 11.669666290283203, 12.088329315185547, 12.50699234008789, 12.92565631866455]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 3.0, 7.0, 4.0, 5.0, 8.0, 7.0, 13.0, 24.0, 17.0, 10.0, 24.0, 19.0, 17.0, 33.0, 22.0, 30.0, 34.0, 37.0, 32.0, 31.0, 50.0, 35.0, 45.0, 36.0, 37.0, 31.0, 33.0, 37.0, 31.0, 36.0, 38.0, 33.0, 21.0, 20.0, 16.0, 15.0, 19.0, 13.0, 8.0, 16.0, 10.0, 11.0, 8.0, 10.0, 7.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-11.050389289855957, -10.724064826965332, -10.397741317749023, -10.071416854858398, -9.74509334564209, -9.418768882751465, -9.092445373535156, -8.766120910644531, -8.439797401428223, -8.113472938537598, -7.787149429321289, -7.460825443267822, -7.1345014572143555, -6.808177471160889, -6.481853485107422, -6.155529022216797, -5.82920503616333, -5.502881050109863, -5.1765570640563965, -4.85023307800293, -4.523909091949463, -4.197585105895996, -3.87126088142395, -3.5449368953704834, -3.2186129093170166, -2.89228892326355, -2.565964937210083, -2.239640712738037, -1.9133168458938599, -1.586992859840393, -1.2606687545776367, -0.9343447685241699, -0.6080207824707031, -0.28169676661491394, 0.044627249240875244, 0.3709512948989868, 0.6972752809524536, 1.0235992670059204, 1.3499233722686768, 1.6762473583221436, 2.0025713443756104, 2.328895330429077, 2.655219316482544, 2.98154354095459, 3.3078675270080566, 3.6341915130615234, 3.9605154991149902, 4.286839485168457, 4.613163471221924, 4.939487457275391, 5.265811443328857, 5.592135429382324, 5.918459415435791, 6.244783401489258, 6.571107864379883, 6.897431373596191, 7.223755836486816, 7.550079822540283, 7.87640380859375, 8.202728271484375, 8.529051780700684, 8.855376243591309, 9.181699752807617, 9.508024215698242, 9.83434772491455]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 9.0, 13.0, 27.0, 37.0, 64.0, 101.0, 120.0, 240.0, 336.0, 612.0, 886.0, 1348.0, 2226.0, 3345.0, 5435.0, 8334.0, 12963.0, 19802.0, 29280.0, 42179.0, 58002.0, 75169.0, 93880.0, 106550.0, 111912.0, 106847.0, 95504.0, 78885.0, 60212.0, 43815.0, 30855.0, 20953.0, 13859.0, 8931.0, 5731.0, 3667.0, 2332.0, 1474.0, 959.0, 613.0, 354.0, 255.0, 170.0, 97.0, 70.0, 31.0, 20.0, 24.0, 14.0, 8.0, 7.0, 3.0, 3.0], "bins": [-7.0859375, -6.88671875, -6.6875, -6.48828125, -6.2890625, -6.08984375, -5.890625, -5.69140625, -5.4921875, -5.29296875, -5.09375, -4.89453125, -4.6953125, -4.49609375, -4.296875, -4.09765625, -3.8984375, -3.69921875, -3.5, -3.30078125, -3.1015625, -2.90234375, -2.703125, -2.50390625, -2.3046875, -2.10546875, -1.90625, -1.70703125, -1.5078125, -1.30859375, -1.109375, -0.91015625, -0.7109375, -0.51171875, -0.3125, -0.11328125, 0.0859375, 0.28515625, 0.484375, 0.68359375, 0.8828125, 1.08203125, 1.28125, 1.48046875, 1.6796875, 1.87890625, 2.078125, 2.27734375, 2.4765625, 2.67578125, 2.875, 3.07421875, 3.2734375, 3.47265625, 3.671875, 3.87109375, 4.0703125, 4.26953125, 4.46875, 4.66796875, 4.8671875, 5.06640625, 5.265625, 5.46484375, 5.6640625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 2.0, 8.0, 7.0, 5.0, 14.0, 14.0, 14.0, 18.0, 17.0, 21.0, 26.0, 27.0, 29.0, 27.0, 25.0, 34.0, 23.0, 41.0, 42.0, 41.0, 41.0, 35.0, 41.0, 34.0, 34.0, 38.0, 40.0, 29.0, 41.0, 22.0, 22.0, 24.0, 13.0, 28.0, 16.0, 13.0, 17.0, 15.0, 14.0, 7.0, 10.0, 5.0, 12.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.2265625, -10.8914794921875, -10.556396484375, -10.2213134765625, -9.88623046875, -9.5511474609375, -9.216064453125, -8.8809814453125, -8.5458984375, -8.2108154296875, -7.875732421875, -7.5406494140625, -7.20556640625, -6.8704833984375, -6.535400390625, -6.2003173828125, -5.865234375, -5.5301513671875, -5.195068359375, -4.8599853515625, -4.52490234375, -4.1898193359375, -3.854736328125, -3.5196533203125, -3.1845703125, -2.8494873046875, -2.514404296875, -2.1793212890625, -1.84423828125, -1.5091552734375, -1.174072265625, -0.8389892578125, -0.50390625, -0.1688232421875, 0.166259765625, 0.5013427734375, 0.83642578125, 1.1715087890625, 1.506591796875, 1.8416748046875, 2.1767578125, 2.5118408203125, 2.846923828125, 3.1820068359375, 3.51708984375, 3.8521728515625, 4.187255859375, 4.5223388671875, 4.857421875, 5.1925048828125, 5.527587890625, 5.8626708984375, 6.19775390625, 6.5328369140625, 6.867919921875, 7.2030029296875, 7.5380859375, 7.8731689453125, 8.208251953125, 8.5433349609375, 8.87841796875, 9.2135009765625, 9.548583984375, 9.8836669921875, 10.21875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 8.0, 9.0, 19.0, 23.0, 30.0, 44.0, 64.0, 92.0, 149.0, 210.0, 291.0, 437.0, 657.0, 1088.0, 1657.0, 2435.0, 3678.0, 5754.0, 8594.0, 13275.0, 19235.0, 28416.0, 40873.0, 56204.0, 73654.0, 91672.0, 104516.0, 110634.0, 107106.0, 95757.0, 78908.0, 61168.0, 45291.0, 31805.0, 21716.0, 14749.0, 9773.0, 6359.0, 4159.0, 2695.0, 1805.0, 1143.0, 806.0, 538.0, 350.0, 236.0, 145.0, 108.0, 68.0, 49.0, 38.0, 19.0, 19.0, 11.0, 6.0, 9.0, 6.0], "bins": [-7.34375, -7.13177490234375, -6.9197998046875, -6.70782470703125, -6.495849609375, -6.28387451171875, -6.0718994140625, -5.85992431640625, -5.64794921875, -5.43597412109375, -5.2239990234375, -5.01202392578125, -4.800048828125, -4.58807373046875, -4.3760986328125, -4.16412353515625, -3.9521484375, -3.74017333984375, -3.5281982421875, -3.31622314453125, -3.104248046875, -2.89227294921875, -2.6802978515625, -2.46832275390625, -2.25634765625, -2.04437255859375, -1.8323974609375, -1.62042236328125, -1.408447265625, -1.19647216796875, -0.9844970703125, -0.77252197265625, -0.560546875, -0.34857177734375, -0.1365966796875, 0.07537841796875, 0.287353515625, 0.49932861328125, 0.7113037109375, 0.92327880859375, 1.13525390625, 1.34722900390625, 1.5592041015625, 1.77117919921875, 1.983154296875, 2.19512939453125, 2.4071044921875, 2.61907958984375, 2.8310546875, 3.04302978515625, 3.2550048828125, 3.46697998046875, 3.678955078125, 3.89093017578125, 4.1029052734375, 4.31488037109375, 4.52685546875, 4.73883056640625, 4.9508056640625, 5.16278076171875, 5.374755859375, 5.58673095703125, 5.7987060546875, 6.01068115234375, 6.22265625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 10.0, 5.0, 5.0, 8.0, 7.0, 15.0, 22.0, 14.0, 34.0, 18.0, 23.0, 22.0, 32.0, 30.0, 37.0, 28.0, 27.0, 30.0, 41.0, 38.0, 34.0, 42.0, 39.0, 48.0, 36.0, 45.0, 38.0, 34.0, 31.0, 32.0, 19.0, 20.0, 25.0, 18.0, 16.0, 10.0, 13.0, 10.0, 10.0, 8.0, 8.0, 6.0, 4.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-7.46875, -7.24932861328125, -7.0299072265625, -6.81048583984375, -6.591064453125, -6.37164306640625, -6.1522216796875, -5.93280029296875, -5.71337890625, -5.49395751953125, -5.2745361328125, -5.05511474609375, -4.835693359375, -4.61627197265625, -4.3968505859375, -4.17742919921875, -3.9580078125, -3.73858642578125, -3.5191650390625, -3.29974365234375, -3.080322265625, -2.86090087890625, -2.6414794921875, -2.42205810546875, -2.20263671875, -1.98321533203125, -1.7637939453125, -1.54437255859375, -1.324951171875, -1.10552978515625, -0.8861083984375, -0.66668701171875, -0.447265625, -0.22784423828125, -0.0084228515625, 0.21099853515625, 0.430419921875, 0.64984130859375, 0.8692626953125, 1.08868408203125, 1.30810546875, 1.52752685546875, 1.7469482421875, 1.96636962890625, 2.185791015625, 2.40521240234375, 2.6246337890625, 2.84405517578125, 3.0634765625, 3.28289794921875, 3.5023193359375, 3.72174072265625, 3.941162109375, 4.16058349609375, 4.3800048828125, 4.59942626953125, 4.81884765625, 5.03826904296875, 5.2576904296875, 5.47711181640625, 5.696533203125, 5.91595458984375, 6.1353759765625, 6.35479736328125, 6.57421875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 6.0, 5.0, 10.0, 18.0, 13.0, 26.0, 37.0, 57.0, 82.0, 114.0, 198.0, 272.0, 464.0, 763.0, 1242.0, 2109.0, 3593.0, 6307.0, 11172.0, 19970.0, 33880.0, 56483.0, 86874.0, 120508.0, 146341.0, 151893.0, 133992.0, 102116.0, 68604.0, 42654.0, 25152.0, 14165.0, 8069.0, 4668.0, 2658.0, 1557.0, 897.0, 573.0, 349.0, 227.0, 133.0, 102.0, 71.0, 47.0, 13.0, 25.0, 19.0, 11.0, 8.0, 8.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.333984375, -3.230499267578125, -3.12701416015625, -3.023529052734375, -2.9200439453125, -2.816558837890625, -2.71307373046875, -2.609588623046875, -2.506103515625, -2.402618408203125, -2.29913330078125, -2.195648193359375, -2.0921630859375, -1.988677978515625, -1.88519287109375, -1.781707763671875, -1.67822265625, -1.574737548828125, -1.47125244140625, -1.367767333984375, -1.2642822265625, -1.160797119140625, -1.05731201171875, -0.953826904296875, -0.850341796875, -0.746856689453125, -0.64337158203125, -0.539886474609375, -0.4364013671875, -0.332916259765625, -0.22943115234375, -0.125946044921875, -0.0224609375, 0.081024169921875, 0.18450927734375, 0.287994384765625, 0.3914794921875, 0.494964599609375, 0.59844970703125, 0.701934814453125, 0.805419921875, 0.908905029296875, 1.01239013671875, 1.115875244140625, 1.2193603515625, 1.322845458984375, 1.42633056640625, 1.529815673828125, 1.63330078125, 1.736785888671875, 1.84027099609375, 1.943756103515625, 2.0472412109375, 2.150726318359375, 2.25421142578125, 2.357696533203125, 2.461181640625, 2.564666748046875, 2.66815185546875, 2.771636962890625, 2.8751220703125, 2.978607177734375, 3.08209228515625, 3.185577392578125, 3.2890625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 7.0, 13.0, 16.0, 20.0, 27.0, 39.0, 62.0, 72.0, 71.0, 102.0, 85.0, 90.0, 94.0, 69.0, 57.0, 38.0, 39.0, 26.0, 17.0, 17.0, 11.0, 7.0, 2.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006232261657714844, -0.0006034821271896362, -0.0005837380886077881, -0.0005639940500259399, -0.0005442500114440918, -0.0005245059728622437, -0.0005047619342803955, -0.00048501789569854736, -0.0004652738571166992, -0.0004455298185348511, -0.00042578577995300293, -0.0004060417413711548, -0.00038629770278930664, -0.0003665536642074585, -0.00034680962562561035, -0.0003270655870437622, -0.00030732154846191406, -0.0002875775098800659, -0.0002678334712982178, -0.00024808943271636963, -0.00022834539413452148, -0.00020860135555267334, -0.0001888573169708252, -0.00016911327838897705, -0.0001493692398071289, -0.00012962520122528076, -0.00010988116264343262, -9.013712406158447e-05, -7.039308547973633e-05, -5.0649046897888184e-05, -3.090500831604004e-05, -1.1160969734191895e-05, 8.58306884765625e-06, 2.8327107429504395e-05, 4.807114601135254e-05, 6.781518459320068e-05, 8.755922317504883e-05, 0.00010730326175689697, 0.00012704730033874512, 0.00014679133892059326, 0.0001665353775024414, 0.00018627941608428955, 0.0002060234546661377, 0.00022576749324798584, 0.000245511531829834, 0.00026525557041168213, 0.0002849996089935303, 0.0003047436475753784, 0.00032448768615722656, 0.0003442317247390747, 0.00036397576332092285, 0.000383719801902771, 0.00040346384048461914, 0.0004232078790664673, 0.00044295191764831543, 0.0004626959562301636, 0.0004824399948120117, 0.0005021840333938599, 0.000521928071975708, 0.0005416721105575562, 0.0005614161491394043, 0.0005811601877212524, 0.0006009042263031006, 0.0006206482648849487, 0.0006403923034667969]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 12.0, 25.0, 35.0, 36.0, 52.0, 88.0, 118.0, 179.0, 260.0, 438.0, 717.0, 1048.0, 1673.0, 2628.0, 4296.0, 7017.0, 11073.0, 17794.0, 28001.0, 43450.0, 62552.0, 87148.0, 110128.0, 125756.0, 128064.0, 115662.0, 94314.0, 70479.0, 48609.0, 32239.0, 20434.0, 12812.0, 8014.0, 5009.0, 3088.0, 1937.0, 1190.0, 752.0, 508.0, 320.0, 210.0, 139.0, 80.0, 61.0, 40.0, 32.0, 12.0, 6.0, 8.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0], "bins": [-3.1484375, -3.053466796875, -2.95849609375, -2.863525390625, -2.7685546875, -2.673583984375, -2.57861328125, -2.483642578125, -2.388671875, -2.293701171875, -2.19873046875, -2.103759765625, -2.0087890625, -1.913818359375, -1.81884765625, -1.723876953125, -1.62890625, -1.533935546875, -1.43896484375, -1.343994140625, -1.2490234375, -1.154052734375, -1.05908203125, -0.964111328125, -0.869140625, -0.774169921875, -0.67919921875, -0.584228515625, -0.4892578125, -0.394287109375, -0.29931640625, -0.204345703125, -0.109375, -0.014404296875, 0.08056640625, 0.175537109375, 0.2705078125, 0.365478515625, 0.46044921875, 0.555419921875, 0.650390625, 0.745361328125, 0.84033203125, 0.935302734375, 1.0302734375, 1.125244140625, 1.22021484375, 1.315185546875, 1.41015625, 1.505126953125, 1.60009765625, 1.695068359375, 1.7900390625, 1.885009765625, 1.97998046875, 2.074951171875, 2.169921875, 2.264892578125, 2.35986328125, 2.454833984375, 2.5498046875, 2.644775390625, 2.73974609375, 2.834716796875, 2.9296875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 8.0, 7.0, 8.0, 13.0, 12.0, 18.0, 19.0, 19.0, 25.0, 29.0, 28.0, 35.0, 28.0, 46.0, 44.0, 38.0, 36.0, 54.0, 54.0, 58.0, 46.0, 39.0, 43.0, 36.0, 39.0, 37.0, 30.0, 25.0, 22.0, 18.0, 22.0, 11.0, 12.0, 6.0, 15.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1474609375, -1.110687255859375, -1.07391357421875, -1.037139892578125, -1.0003662109375, -0.963592529296875, -0.92681884765625, -0.890045166015625, -0.853271484375, -0.816497802734375, -0.77972412109375, -0.742950439453125, -0.7061767578125, -0.669403076171875, -0.63262939453125, -0.595855712890625, -0.55908203125, -0.522308349609375, -0.48553466796875, -0.448760986328125, -0.4119873046875, -0.375213623046875, -0.33843994140625, -0.301666259765625, -0.264892578125, -0.228118896484375, -0.19134521484375, -0.154571533203125, -0.1177978515625, -0.081024169921875, -0.04425048828125, -0.007476806640625, 0.029296875, 0.066070556640625, 0.10284423828125, 0.139617919921875, 0.1763916015625, 0.213165283203125, 0.24993896484375, 0.286712646484375, 0.323486328125, 0.360260009765625, 0.39703369140625, 0.433807373046875, 0.4705810546875, 0.507354736328125, 0.54412841796875, 0.580902099609375, 0.61767578125, 0.654449462890625, 0.69122314453125, 0.727996826171875, 0.7647705078125, 0.801544189453125, 0.83831787109375, 0.875091552734375, 0.911865234375, 0.948638916015625, 0.98541259765625, 1.022186279296875, 1.0589599609375, 1.095733642578125, 1.13250732421875, 1.169281005859375, 1.2060546875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 3.0, 7.0, 8.0, 9.0, 13.0, 16.0, 16.0, 12.0, 31.0, 31.0, 28.0, 35.0, 40.0, 47.0, 50.0, 70.0, 42.0, 65.0, 58.0, 53.0, 49.0, 51.0, 37.0, 48.0, 43.0, 25.0, 29.0, 22.0, 14.0, 8.0, 15.0, 11.0, 6.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.977128982543945, -14.556797981262207, -14.136466979980469, -13.71613597869873, -13.295804977416992, -12.875473022460938, -12.4551420211792, -12.034811019897461, -11.614480018615723, -11.194149017333984, -10.773818016052246, -10.353487014770508, -9.933155059814453, -9.512825012207031, -9.092493057250977, -8.672162055969238, -8.2518310546875, -7.831500053405762, -7.411169052124023, -6.990837574005127, -6.570506572723389, -6.15017557144165, -5.729844093322754, -5.309513092041016, -4.889182090759277, -4.468851089477539, -4.048520088195801, -3.6281886100769043, -3.207857608795166, -2.7875266075134277, -2.3671953678131104, -1.946864128112793, -1.5265331268310547, -1.1062020063400269, -0.685870885848999, -0.2655397653579712, 0.15479135513305664, 0.5751223564147949, 0.9954535961151123, 1.4157848358154297, 1.836115837097168, 2.2564468383789062, 2.6767780780792236, 3.097109317779541, 3.5174403190612793, 3.9377713203430176, 4.358102798461914, 4.778433799743652, 5.198764801025391, 5.619095802307129, 6.039426803588867, 6.459758281707764, 6.880089282989502, 7.30042028427124, 7.720751762390137, 8.141082763671875, 8.561413764953613, 8.981744766235352, 9.40207576751709, 9.822406768798828, 10.242738723754883, 10.663068771362305, 11.08340072631836, 11.503731727600098, 11.924062728881836]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 5.0, 7.0, 7.0, 5.0, 9.0, 6.0, 16.0, 17.0, 18.0, 25.0, 28.0, 32.0, 23.0, 31.0, 25.0, 47.0, 37.0, 46.0, 35.0, 46.0, 40.0, 50.0, 42.0, 36.0, 52.0, 34.0, 29.0, 30.0, 28.0, 34.0, 27.0, 23.0, 19.0, 15.0, 18.0, 12.0, 15.0, 6.0, 8.0, 9.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.78874397277832, -12.384432792663574, -11.980122566223145, -11.575811386108398, -11.171501159667969, -10.767189979553223, -10.362878799438477, -9.958568572998047, -9.5542573928833, -9.149946212768555, -8.745635986328125, -8.341324806213379, -7.937014102935791, -7.532703399658203, -7.128392219543457, -6.724081516265869, -6.319770812988281, -5.915460109710693, -5.5111494064331055, -5.106838226318359, -4.7025275230407715, -4.298216819763184, -3.8939058780670166, -3.4895949363708496, -3.0852842330932617, -2.680973529815674, -2.276662588119507, -1.8723517656326294, -1.468040943145752, -1.063730239868164, -0.6594192981719971, -0.2551083564758301, 0.1492023468017578, 0.5535131692886353, 0.9578239917755127, 1.3621348142623901, 1.7664456367492676, 2.1707563400268555, 2.5750672817230225, 2.9793782234191895, 3.3836889266967773, 3.7879996299743652, 4.192310333251953, 4.596621513366699, 5.000932216644287, 5.405242919921875, 5.809554100036621, 6.213864803314209, 6.618175506591797, 7.022486209869385, 7.426796913146973, 7.831108093261719, 8.235418319702148, 8.639729499816895, 9.04404067993164, 9.44835090637207, 9.852662086486816, 10.256973266601562, 10.661283493041992, 11.065594673156738, 11.469905853271484, 11.874216079711914, 12.27852725982666, 12.682838439941406, 13.087148666381836]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 6.0, 11.0, 14.0, 13.0, 29.0, 64.0, 93.0, 156.0, 229.0, 444.0, 686.0, 1066.0, 1717.0, 2829.0, 4565.0, 7687.0, 12828.0, 22098.0, 38693.0, 67740.0, 121089.0, 211257.0, 356850.0, 539188.0, 681160.0, 687260.0, 552461.0, 369714.0, 220601.0, 125159.0, 70563.0, 39772.0, 23272.0, 13737.0, 8210.0, 4900.0, 3101.0, 1890.0, 1193.0, 751.0, 459.0, 271.0, 158.0, 105.0, 55.0, 52.0, 31.0, 20.0, 15.0, 13.0, 4.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.6015625, -9.27099609375, -8.9404296875, -8.60986328125, -8.279296875, -7.94873046875, -7.6181640625, -7.28759765625, -6.95703125, -6.62646484375, -6.2958984375, -5.96533203125, -5.634765625, -5.30419921875, -4.9736328125, -4.64306640625, -4.3125, -3.98193359375, -3.6513671875, -3.32080078125, -2.990234375, -2.65966796875, -2.3291015625, -1.99853515625, -1.66796875, -1.33740234375, -1.0068359375, -0.67626953125, -0.345703125, -0.01513671875, 0.3154296875, 0.64599609375, 0.9765625, 1.30712890625, 1.6376953125, 1.96826171875, 2.298828125, 2.62939453125, 2.9599609375, 3.29052734375, 3.62109375, 3.95166015625, 4.2822265625, 4.61279296875, 4.943359375, 5.27392578125, 5.6044921875, 5.93505859375, 6.265625, 6.59619140625, 6.9267578125, 7.25732421875, 7.587890625, 7.91845703125, 8.2490234375, 8.57958984375, 8.91015625, 9.24072265625, 9.5712890625, 9.90185546875, 10.232421875, 10.56298828125, 10.8935546875, 11.22412109375, 11.5546875]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 8.0, 8.0, 9.0, 8.0, 11.0, 20.0, 19.0, 24.0, 30.0, 28.0, 34.0, 28.0, 50.0, 42.0, 46.0, 33.0, 54.0, 40.0, 57.0, 39.0, 49.0, 35.0, 44.0, 33.0, 23.0, 33.0, 32.0, 29.0, 24.0, 24.0, 18.0, 14.0, 12.0, 13.0, 7.0, 7.0, 4.0, 7.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.0390625, -12.6455078125, -12.251953125, -11.8583984375, -11.46484375, -11.0712890625, -10.677734375, -10.2841796875, -9.890625, -9.4970703125, -9.103515625, -8.7099609375, -8.31640625, -7.9228515625, -7.529296875, -7.1357421875, -6.7421875, -6.3486328125, -5.955078125, -5.5615234375, -5.16796875, -4.7744140625, -4.380859375, -3.9873046875, -3.59375, -3.2001953125, -2.806640625, -2.4130859375, -2.01953125, -1.6259765625, -1.232421875, -0.8388671875, -0.4453125, -0.0517578125, 0.341796875, 0.7353515625, 1.12890625, 1.5224609375, 1.916015625, 2.3095703125, 2.703125, 3.0966796875, 3.490234375, 3.8837890625, 4.27734375, 4.6708984375, 5.064453125, 5.4580078125, 5.8515625, 6.2451171875, 6.638671875, 7.0322265625, 7.42578125, 7.8193359375, 8.212890625, 8.6064453125, 9.0, 9.3935546875, 9.787109375, 10.1806640625, 10.57421875, 10.9677734375, 11.361328125, 11.7548828125, 12.1484375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 5.0, 5.0, 6.0, 10.0, 17.0, 37.0, 68.0, 101.0, 134.0, 201.0, 321.0, 476.0, 694.0, 1114.0, 1736.0, 2603.0, 4149.0, 6244.0, 9729.0, 15082.0, 23737.0, 36639.0, 56707.0, 87318.0, 132425.0, 196206.0, 280518.0, 379060.0, 465476.0, 515529.0, 498589.0, 429671.0, 333344.0, 239485.0, 164354.0, 109492.0, 72219.0, 46519.0, 29732.0, 19286.0, 12439.0, 7990.0, 5221.0, 3299.0, 2175.0, 1427.0, 932.0, 620.0, 409.0, 265.0, 177.0, 116.0, 71.0, 44.0, 25.0, 19.0, 12.0, 13.0, 3.0, 4.0, 1.0], "bins": [-9.7890625, -9.4903564453125, -9.191650390625, -8.8929443359375, -8.59423828125, -8.2955322265625, -7.996826171875, -7.6981201171875, -7.3994140625, -7.1007080078125, -6.802001953125, -6.5032958984375, -6.20458984375, -5.9058837890625, -5.607177734375, -5.3084716796875, -5.009765625, -4.7110595703125, -4.412353515625, -4.1136474609375, -3.81494140625, -3.5162353515625, -3.217529296875, -2.9188232421875, -2.6201171875, -2.3214111328125, -2.022705078125, -1.7239990234375, -1.42529296875, -1.1265869140625, -0.827880859375, -0.5291748046875, -0.23046875, 0.0682373046875, 0.366943359375, 0.6656494140625, 0.96435546875, 1.2630615234375, 1.561767578125, 1.8604736328125, 2.1591796875, 2.4578857421875, 2.756591796875, 3.0552978515625, 3.35400390625, 3.6527099609375, 3.951416015625, 4.2501220703125, 4.548828125, 4.8475341796875, 5.146240234375, 5.4449462890625, 5.74365234375, 6.0423583984375, 6.341064453125, 6.6397705078125, 6.9384765625, 7.2371826171875, 7.535888671875, 7.8345947265625, 8.13330078125, 8.4320068359375, 8.730712890625, 9.0294189453125, 9.328125]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 9.0, 12.0, 13.0, 23.0, 16.0, 28.0, 39.0, 45.0, 50.0, 50.0, 65.0, 81.0, 82.0, 129.0, 121.0, 165.0, 153.0, 162.0, 170.0, 223.0, 185.0, 201.0, 197.0, 197.0, 198.0, 185.0, 181.0, 173.0, 155.0, 118.0, 109.0, 95.0, 97.0, 59.0, 65.0, 46.0, 39.0, 36.0, 30.0, 18.0, 13.0, 10.0, 7.0, 5.0, 5.0, 6.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0], "bins": [-4.765625, -4.62078857421875, -4.4759521484375, -4.33111572265625, -4.186279296875, -4.04144287109375, -3.8966064453125, -3.75177001953125, -3.60693359375, -3.46209716796875, -3.3172607421875, -3.17242431640625, -3.027587890625, -2.88275146484375, -2.7379150390625, -2.59307861328125, -2.4482421875, -2.30340576171875, -2.1585693359375, -2.01373291015625, -1.868896484375, -1.72406005859375, -1.5792236328125, -1.43438720703125, -1.28955078125, -1.14471435546875, -0.9998779296875, -0.85504150390625, -0.710205078125, -0.56536865234375, -0.4205322265625, -0.27569580078125, -0.130859375, 0.01397705078125, 0.1588134765625, 0.30364990234375, 0.448486328125, 0.59332275390625, 0.7381591796875, 0.88299560546875, 1.02783203125, 1.17266845703125, 1.3175048828125, 1.46234130859375, 1.607177734375, 1.75201416015625, 1.8968505859375, 2.04168701171875, 2.1865234375, 2.33135986328125, 2.4761962890625, 2.62103271484375, 2.765869140625, 2.91070556640625, 3.0555419921875, 3.20037841796875, 3.34521484375, 3.49005126953125, 3.6348876953125, 3.77972412109375, 3.924560546875, 4.06939697265625, 4.2142333984375, 4.35906982421875, 4.50390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 9.0, 2.0, 5.0, 9.0, 13.0, 19.0, 23.0, 15.0, 27.0, 18.0, 33.0, 28.0, 37.0, 39.0, 43.0, 48.0, 48.0, 55.0, 43.0, 48.0, 51.0, 45.0, 46.0, 38.0, 35.0, 32.0, 32.0, 39.0, 18.0, 21.0, 23.0, 5.0, 8.0, 9.0, 8.0, 11.0, 3.0, 4.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.418136596679688, -12.995078086853027, -12.57201862335205, -12.14896011352539, -11.725900650024414, -11.302842140197754, -10.879783630371094, -10.456724166870117, -10.03366470336914, -9.61060619354248, -9.187546730041504, -8.764488220214844, -8.341428756713867, -7.918370246887207, -7.495311260223389, -7.07225227355957, -6.64919376373291, -6.226134777069092, -5.803075790405273, -5.380017280578613, -4.956957817077637, -4.533899307250977, -4.110840320587158, -3.68778133392334, -3.2647223472595215, -2.841663360595703, -2.4186043739318848, -1.9955456256866455, -1.5724866390228271, -1.1494276523590088, -0.7263689041137695, -0.30330991744995117, 0.11974811553955078, 0.5428070425987244, 0.965865969657898, 1.3889248371124268, 1.8119838237762451, 2.2350428104400635, 2.6581015586853027, 3.081160545349121, 3.5042195320129395, 3.927278518676758, 4.350337505340576, 4.7733964920043945, 5.196455001831055, 5.619514465332031, 6.042572975158691, 6.46563196182251, 6.888690948486328, 7.3117499351501465, 7.734808921813965, 8.157867431640625, 8.580926895141602, 9.003985404968262, 9.427043914794922, 9.850103378295898, 10.273162841796875, 10.696221351623535, 11.119280815124512, 11.542339324951172, 11.965398788452148, 12.388457298278809, 12.811515808105469, 13.234575271606445, 13.657633781433105]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 7.0, 12.0, 10.0, 10.0, 16.0, 19.0, 23.0, 27.0, 31.0, 31.0, 37.0, 39.0, 43.0, 43.0, 39.0, 40.0, 58.0, 35.0, 45.0, 48.0, 46.0, 33.0, 34.0, 44.0, 28.0, 28.0, 22.0, 24.0, 23.0, 24.0, 22.0, 16.0, 11.0, 8.0, 6.0, 6.0, 5.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.35157585144043, -13.881315231323242, -13.411053657531738, -12.940792083740234, -12.470531463623047, -12.00027084350586, -11.530009269714355, -11.059747695922852, -10.589487075805664, -10.119226455688477, -9.648964881896973, -9.178703308105469, -8.708442687988281, -8.238182067871094, -7.76792049407959, -7.297659397125244, -6.827398300170898, -6.357137203216553, -5.886876106262207, -5.416615009307861, -4.946353912353516, -4.47609281539917, -4.005831718444824, -3.5355706214904785, -3.065309524536133, -2.595048427581787, -2.1247873306274414, -1.6545262336730957, -1.18426513671875, -0.7140040397644043, -0.2437429428100586, 0.2265181541442871, 0.6967782974243164, 1.167039394378662, 1.6373004913330078, 2.1075615882873535, 2.577822685241699, 3.048083782196045, 3.5183448791503906, 3.9886059761047363, 4.458867073059082, 4.929128170013428, 5.399389266967773, 5.869650363922119, 6.339911460876465, 6.8101725578308105, 7.280433654785156, 7.750694751739502, 8.220955848693848, 8.691217422485352, 9.161478042602539, 9.631738662719727, 10.10200023651123, 10.572261810302734, 11.042522430419922, 11.51278305053711, 11.983044624328613, 12.453306198120117, 12.923566818237305, 13.393827438354492, 13.864089012145996, 14.3343505859375, 14.804611206054688, 15.274871826171875, 15.745133399963379]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 9.0, 14.0, 20.0, 19.0, 37.0, 65.0, 115.0, 186.0, 338.0, 656.0, 1151.0, 2222.0, 4667.0, 9469.0, 19620.0, 39572.0, 75560.0, 128719.0, 182208.0, 198147.0, 163279.0, 105242.0, 58684.0, 29801.0, 14530.0, 7135.0, 3425.0, 1681.0, 844.0, 485.0, 247.0, 129.0, 94.0, 69.0, 35.0, 30.0, 23.0, 15.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.59375, -8.3004150390625, -8.007080078125, -7.7137451171875, -7.42041015625, -7.1270751953125, -6.833740234375, -6.5404052734375, -6.2470703125, -5.9537353515625, -5.660400390625, -5.3670654296875, -5.07373046875, -4.7803955078125, -4.487060546875, -4.1937255859375, -3.900390625, -3.6070556640625, -3.313720703125, -3.0203857421875, -2.72705078125, -2.4337158203125, -2.140380859375, -1.8470458984375, -1.5537109375, -1.2603759765625, -0.967041015625, -0.6737060546875, -0.38037109375, -0.0870361328125, 0.206298828125, 0.4996337890625, 0.79296875, 1.0863037109375, 1.379638671875, 1.6729736328125, 1.96630859375, 2.2596435546875, 2.552978515625, 2.8463134765625, 3.1396484375, 3.4329833984375, 3.726318359375, 4.0196533203125, 4.31298828125, 4.6063232421875, 4.899658203125, 5.1929931640625, 5.486328125, 5.7796630859375, 6.072998046875, 6.3663330078125, 6.65966796875, 6.9530029296875, 7.246337890625, 7.5396728515625, 7.8330078125, 8.1263427734375, 8.419677734375, 8.7130126953125, 9.00634765625, 9.2996826171875, 9.593017578125, 9.8863525390625, 10.1796875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 6.0, 6.0, 5.0, 5.0, 5.0, 11.0, 18.0, 24.0, 20.0, 27.0, 29.0, 39.0, 33.0, 36.0, 39.0, 52.0, 41.0, 42.0, 46.0, 43.0, 44.0, 55.0, 50.0, 36.0, 49.0, 36.0, 29.0, 31.0, 28.0, 19.0, 23.0, 24.0, 12.0, 13.0, 10.0, 9.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5390625, -15.0299072265625, -14.520751953125, -14.0115966796875, -13.50244140625, -12.9932861328125, -12.484130859375, -11.9749755859375, -11.4658203125, -10.9566650390625, -10.447509765625, -9.9383544921875, -9.42919921875, -8.9200439453125, -8.410888671875, -7.9017333984375, -7.392578125, -6.8834228515625, -6.374267578125, -5.8651123046875, -5.35595703125, -4.8468017578125, -4.337646484375, -3.8284912109375, -3.3193359375, -2.8101806640625, -2.301025390625, -1.7918701171875, -1.28271484375, -0.7735595703125, -0.264404296875, 0.2447509765625, 0.75390625, 1.2630615234375, 1.772216796875, 2.2813720703125, 2.79052734375, 3.2996826171875, 3.808837890625, 4.3179931640625, 4.8271484375, 5.3363037109375, 5.845458984375, 6.3546142578125, 6.86376953125, 7.3729248046875, 7.882080078125, 8.3912353515625, 8.900390625, 9.4095458984375, 9.918701171875, 10.4278564453125, 10.93701171875, 11.4461669921875, 11.955322265625, 12.4644775390625, 12.9736328125, 13.4827880859375, 13.991943359375, 14.5010986328125, 15.01025390625, 15.5194091796875, 16.028564453125, 16.5377197265625, 17.046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 8.0, 10.0, 12.0, 19.0, 30.0, 40.0, 55.0, 86.0, 110.0, 168.0, 301.0, 516.0, 851.0, 1544.0, 2904.0, 5842.0, 12045.0, 26195.0, 59006.0, 126486.0, 223427.0, 254982.0, 173552.0, 86372.0, 39040.0, 17554.0, 8430.0, 4046.0, 2102.0, 1140.0, 654.0, 391.0, 225.0, 132.0, 88.0, 60.0, 41.0, 27.0, 20.0, 19.0, 7.0, 7.0, 7.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.453125, -13.990478515625, -13.52783203125, -13.065185546875, -12.6025390625, -12.139892578125, -11.67724609375, -11.214599609375, -10.751953125, -10.289306640625, -9.82666015625, -9.364013671875, -8.9013671875, -8.438720703125, -7.97607421875, -7.513427734375, -7.05078125, -6.588134765625, -6.12548828125, -5.662841796875, -5.2001953125, -4.737548828125, -4.27490234375, -3.812255859375, -3.349609375, -2.886962890625, -2.42431640625, -1.961669921875, -1.4990234375, -1.036376953125, -0.57373046875, -0.111083984375, 0.3515625, 0.814208984375, 1.27685546875, 1.739501953125, 2.2021484375, 2.664794921875, 3.12744140625, 3.590087890625, 4.052734375, 4.515380859375, 4.97802734375, 5.440673828125, 5.9033203125, 6.365966796875, 6.82861328125, 7.291259765625, 7.75390625, 8.216552734375, 8.67919921875, 9.141845703125, 9.6044921875, 10.067138671875, 10.52978515625, 10.992431640625, 11.455078125, 11.917724609375, 12.38037109375, 12.843017578125, 13.3056640625, 13.768310546875, 14.23095703125, 14.693603515625, 15.15625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 9.0, 4.0, 11.0, 7.0, 16.0, 13.0, 11.0, 16.0, 21.0, 18.0, 20.0, 23.0, 24.0, 24.0, 29.0, 28.0, 40.0, 46.0, 31.0, 45.0, 42.0, 44.0, 49.0, 37.0, 36.0, 34.0, 34.0, 43.0, 23.0, 33.0, 18.0, 17.0, 18.0, 23.0, 17.0, 18.0, 12.0, 15.0, 6.0, 9.0, 7.0, 6.0, 9.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0], "bins": [-8.65625, -8.40081787109375, -8.1453857421875, -7.88995361328125, -7.634521484375, -7.37908935546875, -7.1236572265625, -6.86822509765625, -6.61279296875, -6.35736083984375, -6.1019287109375, -5.84649658203125, -5.591064453125, -5.33563232421875, -5.0802001953125, -4.82476806640625, -4.5693359375, -4.31390380859375, -4.0584716796875, -3.80303955078125, -3.547607421875, -3.29217529296875, -3.0367431640625, -2.78131103515625, -2.52587890625, -2.27044677734375, -2.0150146484375, -1.75958251953125, -1.504150390625, -1.24871826171875, -0.9932861328125, -0.73785400390625, -0.482421875, -0.22698974609375, 0.0284423828125, 0.28387451171875, 0.539306640625, 0.79473876953125, 1.0501708984375, 1.30560302734375, 1.56103515625, 1.81646728515625, 2.0718994140625, 2.32733154296875, 2.582763671875, 2.83819580078125, 3.0936279296875, 3.34906005859375, 3.6044921875, 3.85992431640625, 4.1153564453125, 4.37078857421875, 4.626220703125, 4.88165283203125, 5.1370849609375, 5.39251708984375, 5.64794921875, 5.90338134765625, 6.1588134765625, 6.41424560546875, 6.669677734375, 6.92510986328125, 7.1805419921875, 7.43597412109375, 7.69140625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 7.0, 20.0, 23.0, 44.0, 48.0, 65.0, 109.0, 189.0, 246.0, 393.0, 614.0, 926.0, 1461.0, 2281.0, 3480.0, 5638.0, 8867.0, 14314.0, 22795.0, 35941.0, 56149.0, 83188.0, 116545.0, 141880.0, 147750.0, 127525.0, 95546.0, 66036.0, 42947.0, 27163.0, 17271.0, 10616.0, 6804.0, 4211.0, 2671.0, 1696.0, 1079.0, 720.0, 420.0, 317.0, 202.0, 131.0, 71.0, 48.0, 33.0, 30.0, 9.0, 16.0, 4.0, 1.0, 7.0, 8.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.42578125, -3.319366455078125, -3.21295166015625, -3.106536865234375, -3.0001220703125, -2.893707275390625, -2.78729248046875, -2.680877685546875, -2.574462890625, -2.468048095703125, -2.36163330078125, -2.255218505859375, -2.1488037109375, -2.042388916015625, -1.93597412109375, -1.829559326171875, -1.72314453125, -1.616729736328125, -1.51031494140625, -1.403900146484375, -1.2974853515625, -1.191070556640625, -1.08465576171875, -0.978240966796875, -0.871826171875, -0.765411376953125, -0.65899658203125, -0.552581787109375, -0.4461669921875, -0.339752197265625, -0.23333740234375, -0.126922607421875, -0.0205078125, 0.085906982421875, 0.19232177734375, 0.298736572265625, 0.4051513671875, 0.511566162109375, 0.61798095703125, 0.724395751953125, 0.830810546875, 0.937225341796875, 1.04364013671875, 1.150054931640625, 1.2564697265625, 1.362884521484375, 1.46929931640625, 1.575714111328125, 1.68212890625, 1.788543701171875, 1.89495849609375, 2.001373291015625, 2.1077880859375, 2.214202880859375, 2.32061767578125, 2.427032470703125, 2.533447265625, 2.639862060546875, 2.74627685546875, 2.852691650390625, 2.9591064453125, 3.065521240234375, 3.17193603515625, 3.278350830078125, 3.384765625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 4.0, 5.0, 6.0, 4.0, 5.0, 9.0, 14.0, 19.0, 16.0, 26.0, 30.0, 32.0, 52.0, 43.0, 42.0, 48.0, 54.0, 61.0, 54.0, 55.0, 58.0, 48.0, 55.0, 35.0, 41.0, 46.0, 22.0, 27.0, 28.0, 12.0, 17.0, 9.0, 12.0, 4.0, 3.0, 6.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023698806762695312, -0.00022955238819122314, -0.00022211670875549316, -0.00021468102931976318, -0.0002072453498840332, -0.00019980967044830322, -0.00019237399101257324, -0.00018493831157684326, -0.00017750263214111328, -0.0001700669527053833, -0.00016263127326965332, -0.00015519559383392334, -0.00014775991439819336, -0.00014032423496246338, -0.0001328885555267334, -0.00012545287609100342, -0.00011801719665527344, -0.00011058151721954346, -0.00010314583778381348, -9.57101583480835e-05, -8.827447891235352e-05, -8.083879947662354e-05, -7.340312004089355e-05, -6.596744060516357e-05, -5.8531761169433594e-05, -5.109608173370361e-05, -4.366040229797363e-05, -3.622472286224365e-05, -2.8789043426513672e-05, -2.135336399078369e-05, -1.3917684555053711e-05, -6.4820051193237305e-06, 9.5367431640625e-07, 8.38935375213623e-06, 1.582503318786621e-05, 2.326071262359619e-05, 3.069639205932617e-05, 3.813207149505615e-05, 4.556775093078613e-05, 5.300343036651611e-05, 6.0439109802246094e-05, 6.787478923797607e-05, 7.531046867370605e-05, 8.274614810943604e-05, 9.018182754516602e-05, 9.7617506980896e-05, 0.00010505318641662598, 0.00011248886585235596, 0.00011992454528808594, 0.00012736022472381592, 0.0001347959041595459, 0.00014223158359527588, 0.00014966726303100586, 0.00015710294246673584, 0.00016453862190246582, 0.0001719743013381958, 0.00017940998077392578, 0.00018684566020965576, 0.00019428133964538574, 0.00020171701908111572, 0.0002091526985168457, 0.00021658837795257568, 0.00022402405738830566, 0.00023145973682403564, 0.00023889541625976562]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 3.0, 12.0, 18.0, 16.0, 26.0, 39.0, 67.0, 108.0, 161.0, 243.0, 367.0, 621.0, 902.0, 1463.0, 2208.0, 3546.0, 5721.0, 8839.0, 14246.0, 22157.0, 34676.0, 52111.0, 75031.0, 100834.0, 123037.0, 133284.0, 126373.0, 104903.0, 78942.0, 55668.0, 37241.0, 23950.0, 15343.0, 9719.0, 6128.0, 3830.0, 2433.0, 1464.0, 1078.0, 602.0, 395.0, 261.0, 176.0, 102.0, 60.0, 63.0, 33.0, 25.0, 15.0, 10.0, 6.0, 1.0, 4.0, 3.0, 2.0], "bins": [-4.33984375, -4.21435546875, -4.0888671875, -3.96337890625, -3.837890625, -3.71240234375, -3.5869140625, -3.46142578125, -3.3359375, -3.21044921875, -3.0849609375, -2.95947265625, -2.833984375, -2.70849609375, -2.5830078125, -2.45751953125, -2.33203125, -2.20654296875, -2.0810546875, -1.95556640625, -1.830078125, -1.70458984375, -1.5791015625, -1.45361328125, -1.328125, -1.20263671875, -1.0771484375, -0.95166015625, -0.826171875, -0.70068359375, -0.5751953125, -0.44970703125, -0.32421875, -0.19873046875, -0.0732421875, 0.05224609375, 0.177734375, 0.30322265625, 0.4287109375, 0.55419921875, 0.6796875, 0.80517578125, 0.9306640625, 1.05615234375, 1.181640625, 1.30712890625, 1.4326171875, 1.55810546875, 1.68359375, 1.80908203125, 1.9345703125, 2.06005859375, 2.185546875, 2.31103515625, 2.4365234375, 2.56201171875, 2.6875, 2.81298828125, 2.9384765625, 3.06396484375, 3.189453125, 3.31494140625, 3.4404296875, 3.56591796875, 3.69140625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 6.0, 10.0, 13.0, 10.0, 13.0, 20.0, 31.0, 20.0, 23.0, 44.0, 44.0, 47.0, 53.0, 63.0, 40.0, 64.0, 59.0, 54.0, 52.0, 48.0, 38.0, 48.0, 40.0, 23.0, 26.0, 21.0, 9.0, 17.0, 18.0, 11.0, 5.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-2.103515625, -2.0465545654296875, -1.989593505859375, -1.9326324462890625, -1.87567138671875, -1.8187103271484375, -1.761749267578125, -1.7047882080078125, -1.6478271484375, -1.5908660888671875, -1.533905029296875, -1.4769439697265625, -1.41998291015625, -1.3630218505859375, -1.306060791015625, -1.2490997314453125, -1.192138671875, -1.1351776123046875, -1.078216552734375, -1.0212554931640625, -0.96429443359375, -0.9073333740234375, -0.850372314453125, -0.7934112548828125, -0.7364501953125, -0.6794891357421875, -0.622528076171875, -0.5655670166015625, -0.50860595703125, -0.4516448974609375, -0.394683837890625, -0.3377227783203125, -0.28076171875, -0.2238006591796875, -0.166839599609375, -0.1098785400390625, -0.05291748046875, 0.0040435791015625, 0.061004638671875, 0.1179656982421875, 0.1749267578125, 0.2318878173828125, 0.288848876953125, 0.3458099365234375, 0.40277099609375, 0.4597320556640625, 0.516693115234375, 0.5736541748046875, 0.630615234375, 0.6875762939453125, 0.744537353515625, 0.8014984130859375, 0.85845947265625, 0.9154205322265625, 0.972381591796875, 1.0293426513671875, 1.0863037109375, 1.1432647705078125, 1.200225830078125, 1.2571868896484375, 1.31414794921875, 1.3711090087890625, 1.428070068359375, 1.4850311279296875, 1.5419921875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 2.0, 8.0, 3.0, 10.0, 20.0, 23.0, 22.0, 19.0, 20.0, 19.0, 20.0, 42.0, 37.0, 36.0, 41.0, 36.0, 59.0, 45.0, 53.0, 44.0, 41.0, 44.0, 44.0, 47.0, 32.0, 36.0, 30.0, 32.0, 28.0, 15.0, 16.0, 14.0, 8.0, 10.0, 10.0, 8.0, 9.0, 2.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.577977180480957, -12.169743537902832, -11.761509895324707, -11.353275299072266, -10.94504165649414, -10.536808013916016, -10.12857437133789, -9.720340728759766, -9.31210708618164, -8.903873443603516, -8.49563980102539, -8.087406158447266, -7.679171562194824, -7.270937919616699, -6.862704277038574, -6.454470634460449, -6.046236038208008, -5.638002395629883, -5.2297682762146, -4.821534633636475, -4.413300514221191, -4.005066871643066, -3.5968332290649414, -3.1885993480682373, -2.780365467071533, -2.372131586074829, -1.9638978242874146, -1.5556640625, -1.147430181503296, -0.7391963005065918, -0.3309626579284668, 0.0772712230682373, 0.4855051040649414, 0.8937389254570007, 1.30197274684906, 1.7102065086364746, 2.1184403896331787, 2.526674270629883, 2.934907913208008, 3.343141794204712, 3.751375675201416, 4.159609317779541, 4.567843437194824, 4.976077079772949, 5.384310722351074, 5.792544841766357, 6.200778484344482, 6.609012603759766, 7.017246246337891, 7.425479888916016, 7.833714008331299, 8.241947174072266, 8.650181770324707, 9.058415412902832, 9.466649055480957, 9.874882698059082, 10.283117294311523, 10.691350936889648, 11.099584579467773, 11.507818222045898, 11.91605281829834, 12.324286460876465, 12.73252010345459, 13.140753746032715, 13.54898738861084]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 9.0, 9.0, 9.0, 17.0, 19.0, 28.0, 22.0, 27.0, 25.0, 30.0, 41.0, 39.0, 45.0, 43.0, 49.0, 38.0, 48.0, 47.0, 45.0, 43.0, 46.0, 31.0, 43.0, 29.0, 29.0, 29.0, 23.0, 27.0, 17.0, 21.0, 20.0, 11.0, 10.0, 8.0, 6.0, 4.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.057832717895508, -13.58827018737793, -13.118707656860352, -12.649145126342773, -12.179582595825195, -11.710020065307617, -11.240457534790039, -10.770895004272461, -10.301332473754883, -9.831769943237305, -9.362207412719727, -8.892644882202148, -8.42308235168457, -7.953519821166992, -7.483956813812256, -7.014394283294678, -6.544831275939941, -6.075268745422363, -5.605706214904785, -5.136143684387207, -4.666581153869629, -4.197018623352051, -3.7274556159973145, -3.2578930854797363, -2.788330554962158, -2.31876802444458, -1.8492053747177124, -1.3796427249908447, -0.9100801944732666, -0.4405176639556885, 0.02904510498046875, 0.4986076354980469, 0.9681711196899414, 1.4377336502075195, 1.9072962999343872, 2.376858949661255, 2.846421480178833, 3.315984010696411, 3.7855467796325684, 4.2551093101501465, 4.724671840667725, 5.194234371185303, 5.663796901702881, 6.133359909057617, 6.602922439575195, 7.072484970092773, 7.542047500610352, 8.01161003112793, 8.481172561645508, 8.950735092163086, 9.420297622680664, 9.889860153198242, 10.35942268371582, 10.828985214233398, 11.298547744750977, 11.768110275268555, 12.237672805786133, 12.707235336303711, 13.176797866821289, 13.646360397338867, 14.115922927856445, 14.585485458374023, 15.055047988891602, 15.52461051940918, 15.994174003601074]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 8.0, 14.0, 28.0, 39.0, 56.0, 77.0, 120.0, 206.0, 402.0, 577.0, 1000.0, 1601.0, 2593.0, 4207.0, 6601.0, 10568.0, 16618.0, 25694.0, 38390.0, 55380.0, 75776.0, 96512.0, 113143.0, 120791.0, 115925.0, 101064.0, 81204.0, 60019.0, 42175.0, 28069.0, 18422.0, 11783.0, 7402.0, 4644.0, 2764.0, 1788.0, 1062.0, 642.0, 440.0, 274.0, 177.0, 110.0, 76.0, 54.0, 21.0, 17.0, 8.0, 8.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.91796875, -7.66754150390625, -7.4171142578125, -7.16668701171875, -6.916259765625, -6.66583251953125, -6.4154052734375, -6.16497802734375, -5.91455078125, -5.66412353515625, -5.4136962890625, -5.16326904296875, -4.912841796875, -4.66241455078125, -4.4119873046875, -4.16156005859375, -3.9111328125, -3.66070556640625, -3.4102783203125, -3.15985107421875, -2.909423828125, -2.65899658203125, -2.4085693359375, -2.15814208984375, -1.90771484375, -1.65728759765625, -1.4068603515625, -1.15643310546875, -0.906005859375, -0.65557861328125, -0.4051513671875, -0.15472412109375, 0.095703125, 0.34613037109375, 0.5965576171875, 0.84698486328125, 1.097412109375, 1.34783935546875, 1.5982666015625, 1.84869384765625, 2.09912109375, 2.34954833984375, 2.5999755859375, 2.85040283203125, 3.100830078125, 3.35125732421875, 3.6016845703125, 3.85211181640625, 4.1025390625, 4.35296630859375, 4.6033935546875, 4.85382080078125, 5.104248046875, 5.35467529296875, 5.6051025390625, 5.85552978515625, 6.10595703125, 6.35638427734375, 6.6068115234375, 6.85723876953125, 7.107666015625, 7.35809326171875, 7.6085205078125, 7.85894775390625, 8.109375]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 6.0, 11.0, 6.0, 10.0, 14.0, 15.0, 17.0, 31.0, 21.0, 29.0, 35.0, 28.0, 35.0, 35.0, 43.0, 35.0, 42.0, 46.0, 52.0, 46.0, 42.0, 43.0, 34.0, 29.0, 42.0, 32.0, 25.0, 25.0, 27.0, 17.0, 26.0, 19.0, 16.0, 16.0, 8.0, 8.0, 4.0, 12.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.28125, -12.8607177734375, -12.440185546875, -12.0196533203125, -11.59912109375, -11.1785888671875, -10.758056640625, -10.3375244140625, -9.9169921875, -9.4964599609375, -9.075927734375, -8.6553955078125, -8.23486328125, -7.8143310546875, -7.393798828125, -6.9732666015625, -6.552734375, -6.1322021484375, -5.711669921875, -5.2911376953125, -4.87060546875, -4.4500732421875, -4.029541015625, -3.6090087890625, -3.1884765625, -2.7679443359375, -2.347412109375, -1.9268798828125, -1.50634765625, -1.0858154296875, -0.665283203125, -0.2447509765625, 0.17578125, 0.5963134765625, 1.016845703125, 1.4373779296875, 1.85791015625, 2.2784423828125, 2.698974609375, 3.1195068359375, 3.5400390625, 3.9605712890625, 4.381103515625, 4.8016357421875, 5.22216796875, 5.6427001953125, 6.063232421875, 6.4837646484375, 6.904296875, 7.3248291015625, 7.745361328125, 8.1658935546875, 8.58642578125, 9.0069580078125, 9.427490234375, 9.8480224609375, 10.2685546875, 10.6890869140625, 11.109619140625, 11.5301513671875, 11.95068359375, 12.3712158203125, 12.791748046875, 13.2122802734375, 13.6328125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 6.0, 12.0, 16.0, 51.0, 67.0, 110.0, 180.0, 276.0, 474.0, 736.0, 1089.0, 1848.0, 2952.0, 4523.0, 7432.0, 11510.0, 18166.0, 27805.0, 41489.0, 59710.0, 79981.0, 100346.0, 115611.0, 120701.0, 114662.0, 96868.0, 76164.0, 55765.0, 38591.0, 25975.0, 16597.0, 10625.0, 6860.0, 4361.0, 2606.0, 1622.0, 1054.0, 644.0, 437.0, 248.0, 129.0, 102.0, 54.0, 44.0, 25.0, 14.0, 9.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.921875, -8.6378173828125, -8.353759765625, -8.0697021484375, -7.78564453125, -7.5015869140625, -7.217529296875, -6.9334716796875, -6.6494140625, -6.3653564453125, -6.081298828125, -5.7972412109375, -5.51318359375, -5.2291259765625, -4.945068359375, -4.6610107421875, -4.376953125, -4.0928955078125, -3.808837890625, -3.5247802734375, -3.24072265625, -2.9566650390625, -2.672607421875, -2.3885498046875, -2.1044921875, -1.8204345703125, -1.536376953125, -1.2523193359375, -0.96826171875, -0.6842041015625, -0.400146484375, -0.1160888671875, 0.16796875, 0.4520263671875, 0.736083984375, 1.0201416015625, 1.30419921875, 1.5882568359375, 1.872314453125, 2.1563720703125, 2.4404296875, 2.7244873046875, 3.008544921875, 3.2926025390625, 3.57666015625, 3.8607177734375, 4.144775390625, 4.4288330078125, 4.712890625, 4.9969482421875, 5.281005859375, 5.5650634765625, 5.84912109375, 6.1331787109375, 6.417236328125, 6.7012939453125, 6.9853515625, 7.2694091796875, 7.553466796875, 7.8375244140625, 8.12158203125, 8.4056396484375, 8.689697265625, 8.9737548828125, 9.2578125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 4.0, 8.0, 7.0, 6.0, 9.0, 17.0, 11.0, 19.0, 17.0, 24.0, 21.0, 24.0, 20.0, 35.0, 23.0, 34.0, 42.0, 56.0, 43.0, 50.0, 37.0, 46.0, 24.0, 43.0, 39.0, 33.0, 39.0, 37.0, 24.0, 33.0, 15.0, 27.0, 31.0, 26.0, 12.0, 14.0, 14.0, 10.0, 8.0, 6.0, 5.0, 5.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.9140625, -7.640869140625, -7.36767578125, -7.094482421875, -6.8212890625, -6.548095703125, -6.27490234375, -6.001708984375, -5.728515625, -5.455322265625, -5.18212890625, -4.908935546875, -4.6357421875, -4.362548828125, -4.08935546875, -3.816162109375, -3.54296875, -3.269775390625, -2.99658203125, -2.723388671875, -2.4501953125, -2.177001953125, -1.90380859375, -1.630615234375, -1.357421875, -1.084228515625, -0.81103515625, -0.537841796875, -0.2646484375, 0.008544921875, 0.28173828125, 0.554931640625, 0.828125, 1.101318359375, 1.37451171875, 1.647705078125, 1.9208984375, 2.194091796875, 2.46728515625, 2.740478515625, 3.013671875, 3.286865234375, 3.56005859375, 3.833251953125, 4.1064453125, 4.379638671875, 4.65283203125, 4.926025390625, 5.19921875, 5.472412109375, 5.74560546875, 6.018798828125, 6.2919921875, 6.565185546875, 6.83837890625, 7.111572265625, 7.384765625, 7.657958984375, 7.93115234375, 8.204345703125, 8.4775390625, 8.750732421875, 9.02392578125, 9.297119140625, 9.5703125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 7.0, 13.0, 22.0, 23.0, 41.0, 64.0, 112.0, 173.0, 233.0, 378.0, 573.0, 678.0, 1145.0, 1716.0, 2641.0, 3964.0, 6107.0, 8986.0, 13904.0, 21025.0, 32045.0, 47791.0, 68761.0, 92212.0, 114695.0, 126945.0, 124963.0, 108372.0, 84746.0, 61608.0, 42411.0, 28086.0, 18211.0, 12144.0, 8074.0, 5428.0, 3353.0, 2383.0, 1537.0, 997.0, 679.0, 448.0, 263.0, 217.0, 152.0, 66.0, 57.0, 45.0, 28.0, 17.0, 9.0, 7.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.390625, -4.260894775390625, -4.13116455078125, -4.001434326171875, -3.8717041015625, -3.741973876953125, -3.61224365234375, -3.482513427734375, -3.352783203125, -3.223052978515625, -3.09332275390625, -2.963592529296875, -2.8338623046875, -2.704132080078125, -2.57440185546875, -2.444671630859375, -2.31494140625, -2.185211181640625, -2.05548095703125, -1.925750732421875, -1.7960205078125, -1.666290283203125, -1.53656005859375, -1.406829833984375, -1.277099609375, -1.147369384765625, -1.01763916015625, -0.887908935546875, -0.7581787109375, -0.628448486328125, -0.49871826171875, -0.368988037109375, -0.2392578125, -0.109527587890625, 0.02020263671875, 0.149932861328125, 0.2796630859375, 0.409393310546875, 0.53912353515625, 0.668853759765625, 0.798583984375, 0.928314208984375, 1.05804443359375, 1.187774658203125, 1.3175048828125, 1.447235107421875, 1.57696533203125, 1.706695556640625, 1.83642578125, 1.966156005859375, 2.09588623046875, 2.225616455078125, 2.3553466796875, 2.485076904296875, 2.61480712890625, 2.744537353515625, 2.874267578125, 3.003997802734375, 3.13372802734375, 3.263458251953125, 3.3931884765625, 3.522918701171875, 3.65264892578125, 3.782379150390625, 3.912109375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 7.0, 4.0, 6.0, 3.0, 10.0, 7.0, 14.0, 15.0, 27.0, 19.0, 31.0, 42.0, 35.0, 37.0, 63.0, 56.0, 50.0, 59.0, 51.0, 48.0, 66.0, 58.0, 56.0, 37.0, 32.0, 27.0, 22.0, 22.0, 22.0, 15.0, 13.0, 14.0, 7.0, 6.0, 6.0, 4.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006327629089355469, -0.0006147474050521851, -0.0005967319011688232, -0.0005787163972854614, -0.0005607008934020996, -0.0005426853895187378, -0.000524669885635376, -0.0005066543817520142, -0.0004886388778686523, -0.00047062337398529053, -0.0004526078701019287, -0.0004345923662185669, -0.0004165768623352051, -0.00039856135845184326, -0.00038054585456848145, -0.00036253035068511963, -0.0003445148468017578, -0.000326499342918396, -0.0003084838390350342, -0.00029046833515167236, -0.00027245283126831055, -0.00025443732738494873, -0.00023642182350158691, -0.0002184063196182251, -0.00020039081573486328, -0.00018237531185150146, -0.00016435980796813965, -0.00014634430408477783, -0.00012832880020141602, -0.0001103132963180542, -9.229779243469238e-05, -7.428228855133057e-05, -5.626678466796875e-05, -3.8251280784606934e-05, -2.0235776901245117e-05, -2.2202730178833008e-06, 1.5795230865478516e-05, 3.381073474884033e-05, 5.182623863220215e-05, 6.984174251556396e-05, 8.785724639892578e-05, 0.0001058727502822876, 0.00012388825416564941, 0.00014190375804901123, 0.00015991926193237305, 0.00017793476581573486, 0.00019595026969909668, 0.0002139657735824585, 0.0002319812774658203, 0.00024999678134918213, 0.00026801228523254395, 0.00028602778911590576, 0.0003040432929992676, 0.0003220587968826294, 0.0003400743007659912, 0.00035808980464935303, 0.00037610530853271484, 0.00039412081241607666, 0.0004121363162994385, 0.0004301518201828003, 0.0004481673240661621, 0.0004661828279495239, 0.00048419833183288574, 0.0005022138357162476, 0.0005202293395996094]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 17.0, 21.0, 39.0, 49.0, 76.0, 94.0, 190.0, 280.0, 471.0, 729.0, 1069.0, 1877.0, 3025.0, 5096.0, 8914.0, 14926.0, 25036.0, 40717.0, 65446.0, 96656.0, 130013.0, 148591.0, 145918.0, 121693.0, 88313.0, 58327.0, 36448.0, 21929.0, 12977.0, 7796.0, 4663.0, 2688.0, 1689.0, 1032.0, 653.0, 406.0, 277.0, 144.0, 107.0, 62.0, 33.0, 20.0, 18.0, 13.0, 8.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.984375, -4.8280029296875, -4.671630859375, -4.5152587890625, -4.35888671875, -4.2025146484375, -4.046142578125, -3.8897705078125, -3.7333984375, -3.5770263671875, -3.420654296875, -3.2642822265625, -3.10791015625, -2.9515380859375, -2.795166015625, -2.6387939453125, -2.482421875, -2.3260498046875, -2.169677734375, -2.0133056640625, -1.85693359375, -1.7005615234375, -1.544189453125, -1.3878173828125, -1.2314453125, -1.0750732421875, -0.918701171875, -0.7623291015625, -0.60595703125, -0.4495849609375, -0.293212890625, -0.1368408203125, 0.01953125, 0.1759033203125, 0.332275390625, 0.4886474609375, 0.64501953125, 0.8013916015625, 0.957763671875, 1.1141357421875, 1.2705078125, 1.4268798828125, 1.583251953125, 1.7396240234375, 1.89599609375, 2.0523681640625, 2.208740234375, 2.3651123046875, 2.521484375, 2.6778564453125, 2.834228515625, 2.9906005859375, 3.14697265625, 3.3033447265625, 3.459716796875, 3.6160888671875, 3.7724609375, 3.9288330078125, 4.085205078125, 4.2415771484375, 4.39794921875, 4.5543212890625, 4.710693359375, 4.8670654296875, 5.0234375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 10.0, 6.0, 16.0, 16.0, 20.0, 25.0, 15.0, 28.0, 31.0, 41.0, 41.0, 50.0, 47.0, 54.0, 44.0, 49.0, 60.0, 59.0, 46.0, 53.0, 47.0, 40.0, 38.0, 35.0, 23.0, 23.0, 16.0, 10.0, 10.0, 12.0, 7.0, 7.0, 3.0, 2.0, 1.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8173828125, -1.75830078125, -1.69921875, -1.64013671875, -1.5810546875, -1.52197265625, -1.462890625, -1.40380859375, -1.3447265625, -1.28564453125, -1.2265625, -1.16748046875, -1.1083984375, -1.04931640625, -0.990234375, -0.93115234375, -0.8720703125, -0.81298828125, -0.75390625, -0.69482421875, -0.6357421875, -0.57666015625, -0.517578125, -0.45849609375, -0.3994140625, -0.34033203125, -0.28125, -0.22216796875, -0.1630859375, -0.10400390625, -0.044921875, 0.01416015625, 0.0732421875, 0.13232421875, 0.19140625, 0.25048828125, 0.3095703125, 0.36865234375, 0.427734375, 0.48681640625, 0.5458984375, 0.60498046875, 0.6640625, 0.72314453125, 0.7822265625, 0.84130859375, 0.900390625, 0.95947265625, 1.0185546875, 1.07763671875, 1.13671875, 1.19580078125, 1.2548828125, 1.31396484375, 1.373046875, 1.43212890625, 1.4912109375, 1.55029296875, 1.609375, 1.66845703125, 1.7275390625, 1.78662109375, 1.845703125, 1.90478515625, 1.9638671875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 6.0, 10.0, 9.0, 8.0, 16.0, 17.0, 16.0, 20.0, 19.0, 22.0, 35.0, 25.0, 42.0, 44.0, 39.0, 38.0, 48.0, 55.0, 35.0, 46.0, 44.0, 39.0, 46.0, 39.0, 35.0, 38.0, 34.0, 21.0, 26.0, 25.0, 19.0, 12.0, 11.0, 10.0, 13.0, 15.0, 6.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.695127487182617, -11.289894104003906, -10.884660720825195, -10.479427337646484, -10.074193954467773, -9.668960571289062, -9.263727188110352, -8.85849380493164, -8.45326042175293, -8.048027038574219, -7.642793655395508, -7.237560272216797, -6.832326889038086, -6.427093505859375, -6.021859645843506, -5.616626262664795, -5.211392402648926, -4.806159019470215, -4.400925636291504, -3.995692014694214, -3.590458631515503, -3.185225248336792, -2.779991626739502, -2.374758243560791, -1.96952486038208, -1.5642914772033691, -1.1590579748153687, -0.7538244724273682, -0.3485910892486572, 0.05664229393005371, 0.46187591552734375, 0.8671092987060547, 1.2723417282104492, 1.6775751113891602, 2.082808494567871, 2.488042116165161, 2.893275499343872, 3.298508882522583, 3.703742504119873, 4.108975887298584, 4.514209270477295, 4.919442653656006, 5.324676036834717, 5.729909896850586, 6.135143280029297, 6.540376663208008, 6.945610046386719, 7.35084342956543, 7.756076812744141, 8.161310195922852, 8.566543579101562, 8.971776962280273, 9.377010345458984, 9.782243728637695, 10.187477111816406, 10.592710494995117, 10.997943878173828, 11.403177261352539, 11.80841064453125, 12.213644027709961, 12.618877410888672, 13.024110794067383, 13.429344177246094, 13.834577560424805, 14.239811897277832]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 4.0, 2.0, 11.0, 7.0, 8.0, 12.0, 15.0, 27.0, 25.0, 31.0, 34.0, 43.0, 37.0, 45.0, 44.0, 48.0, 53.0, 47.0, 61.0, 54.0, 46.0, 41.0, 42.0, 44.0, 38.0, 36.0, 29.0, 21.0, 16.0, 16.0, 19.0, 13.0, 6.0, 8.0, 9.0, 5.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.194942474365234, -16.602649688720703, -16.010356903076172, -15.418065071105957, -14.825772285461426, -14.233479499816895, -13.64118766784668, -13.048894882202148, -12.456602096557617, -11.864309310913086, -11.272016525268555, -10.67972469329834, -10.087431907653809, -9.495139122009277, -8.902847290039062, -8.310554504394531, -7.71826171875, -7.125968933105469, -6.533676624298096, -5.941384315490723, -5.349091529846191, -4.75679874420166, -4.164506435394287, -3.572214126586914, -2.979921340942383, -2.3876287937164307, -1.7953362464904785, -1.2030436992645264, -0.6107511520385742, -0.01845860481262207, 0.5738339424133301, 1.1661262512207031, 1.7584209442138672, 2.3507134914398193, 2.9430060386657715, 3.5352985858917236, 4.127591133117676, 4.719883918762207, 5.31217622756958, 5.904468536376953, 6.496761322021484, 7.089054107666016, 7.681346416473389, 8.273638725280762, 8.865931510925293, 9.458224296569824, 10.050516128540039, 10.64280891418457, 11.235101699829102, 11.827394485473633, 12.419687271118164, 13.011979103088379, 13.60427188873291, 14.196564674377441, 14.788856506347656, 15.381149291992188, 15.973442077636719, 16.56573486328125, 17.15802764892578, 17.750320434570312, 18.342613220214844, 18.934904098510742, 19.527196884155273, 20.119489669799805, 20.711782455444336]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 6.0, 8.0, 14.0, 9.0, 11.0, 18.0, 20.0, 23.0, 29.0, 35.0, 55.0, 85.0, 101.0, 147.0, 198.0, 255.0, 427.0, 695.0, 1279.0, 2382.0, 4919.0, 1013589.0, 16168.0, 4669.0, 2229.0, 1195.0, 681.0, 370.0, 274.0, 183.0, 122.0, 91.0, 66.0, 49.0, 41.0, 33.0, 30.0, 26.0, 29.0, 15.0, 9.0, 8.0, 3.0, 2.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-213.62857055664062, -206.4974822998047, -199.36639404296875, -192.23529052734375, -185.1042022705078, -177.97311401367188, -170.84202575683594, -163.7109375, -156.57984924316406, -149.44876098632812, -142.3176727294922, -135.18658447265625, -128.05548095703125, -120.92439270019531, -113.79330444335938, -106.66221618652344, -99.53112030029297, -92.40003204345703, -85.26893615722656, -78.13784790039062, -71.00675964355469, -63.875667572021484, -56.74457550048828, -49.613487243652344, -42.48239517211914, -35.35130310058594, -28.22021484375, -21.089122772216797, -13.958032608032227, -6.826942443847656, 0.3041496276855469, 7.435237884521484, 14.566329956054688, 21.697420120239258, 28.828510284423828, 35.95960235595703, 43.09069061279297, 50.22178268432617, 57.352874755859375, 64.48396301269531, 71.61505126953125, 78.74613952636719, 85.87723541259766, 93.0083236694336, 100.13941192626953, 107.2705078125, 114.40159606933594, 121.53268432617188, 128.66378784179688, 135.7948760986328, 142.92596435546875, 150.05706787109375, 157.1881561279297, 164.31924438476562, 171.45033264160156, 178.5814208984375, 185.71250915527344, 192.84359741210938, 199.9746856689453, 207.10577392578125, 214.23687744140625, 221.3679656982422, 228.49905395507812, 235.63014221191406, 242.76123046875]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 8.0, 9.0, 15.0, 16.0, 28.0, 58.0, 69.0, 98.0, 116.0, 157.0, 217.0, 290.0, 328.0, 460.0, 624.0, 727.0, 967.0, 1315.0, 1729.0, 2554.0, 3982.0, 7186.0, 16879.0, 50920292.0, 476895.0, 15962.0, 6988.0, 3826.0, 2491.0, 1726.0, 1309.0, 957.0, 732.0, 575.0, 462.0, 361.0, 280.0, 211.0, 164.0, 123.0, 83.0, 71.0, 36.0, 30.0, 23.0, 14.0, 11.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-264.8421325683594, -256.8114013671875, -248.78065490722656, -240.7499237060547, -232.71917724609375, -224.68844604492188, -216.65771484375, -208.62698364257812, -200.5962371826172, -192.5655059814453, -184.53475952148438, -176.5040283203125, -168.47329711914062, -160.4425506591797, -152.4118194580078, -144.38107299804688, -136.350341796875, -128.31961059570312, -120.28886413574219, -112.25813293457031, -104.2273941040039, -96.1966552734375, -88.16592407226562, -80.13518524169922, -72.10444641113281, -64.0737075805664, -56.042972564697266, -48.012237548828125, -39.98149871826172, -31.950759887695312, -23.920024871826172, -15.889289855957031, -7.85858154296875, 0.17215538024902344, 8.202892303466797, 16.23362922668457, 24.264366149902344, 32.29510498046875, 40.32583999633789, 48.35657501220703, 56.38731384277344, 64.41805267333984, 72.44879150390625, 80.47952270507812, 88.51026153564453, 96.54100036621094, 104.57173156738281, 112.60247039794922, 120.63320922851562, 128.6639404296875, 136.69468688964844, 144.7254180908203, 152.75616455078125, 160.78689575195312, 168.817626953125, 176.84835815429688, 184.8791046142578, 192.9098358154297, 200.94058227539062, 208.9713134765625, 217.00204467773438, 225.0327911376953, 233.0635223388672, 241.09426879882812, 249.125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 10.0, 17.0, 23.0, 27.0, 72.0, 124.0, 175.0, 353.0, 508.0, 943.0, 1649.0, 2761.0, 4646.0, 8237.0, 15202.0, 28109.0, 52709.0, 102115.0, 203279.0, 428044.0, 1010017.0, 2108606.0, 1293561.0, 527587.0, 243889.0, 121731.0, 63049.0, 33217.0, 17770.0, 10014.0, 5451.0, 3148.0, 1780.0, 1083.0, 600.0, 359.0, 236.0, 133.0, 85.0, 32.0, 32.0, 22.0, 10.0, 7.0, 6.0, 7.0, 2.0, 2.0, 2.0], "bins": [-38.4375, -37.38818359375, -36.3388671875, -35.28955078125, -34.240234375, -33.19091796875, -32.1416015625, -31.09228515625, -30.04296875, -28.99365234375, -27.9443359375, -26.89501953125, -25.845703125, -24.79638671875, -23.7470703125, -22.69775390625, -21.6484375, -20.59912109375, -19.5498046875, -18.50048828125, -17.451171875, -16.40185546875, -15.3525390625, -14.30322265625, -13.25390625, -12.20458984375, -11.1552734375, -10.10595703125, -9.056640625, -8.00732421875, -6.9580078125, -5.90869140625, -4.859375, -3.81005859375, -2.7607421875, -1.71142578125, -0.662109375, 0.38720703125, 1.4365234375, 2.48583984375, 3.53515625, 4.58447265625, 5.6337890625, 6.68310546875, 7.732421875, 8.78173828125, 9.8310546875, 10.88037109375, 11.9296875, 12.97900390625, 14.0283203125, 15.07763671875, 16.126953125, 17.17626953125, 18.2255859375, 19.27490234375, 20.32421875, 21.37353515625, 22.4228515625, 23.47216796875, 24.521484375, 25.57080078125, 26.6201171875, 27.66943359375, 28.71875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 6.0, 1.0, 4.0, 5.0, 2.0, 4.0, 5.0, 3.0, 7.0, 9.0, 12.0, 14.0, 19.0, 15.0, 19.0, 22.0, 24.0, 30.0, 52.0, 52.0, 53.0, 87.0, 103.0, 129.0, 175.0, 188.0, 198.0, 158.0, 120.0, 93.0, 88.0, 62.0, 46.0, 39.0, 25.0, 31.0, 18.0, 20.0, 20.0, 16.0, 16.0, 10.0, 6.0, 9.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.6875, -17.134033203125, -16.58056640625, -16.027099609375, -15.4736328125, -14.920166015625, -14.36669921875, -13.813232421875, -13.259765625, -12.706298828125, -12.15283203125, -11.599365234375, -11.0458984375, -10.492431640625, -9.93896484375, -9.385498046875, -8.83203125, -8.278564453125, -7.72509765625, -7.171630859375, -6.6181640625, -6.064697265625, -5.51123046875, -4.957763671875, -4.404296875, -3.850830078125, -3.29736328125, -2.743896484375, -2.1904296875, -1.636962890625, -1.08349609375, -0.530029296875, 0.0234375, 0.576904296875, 1.13037109375, 1.683837890625, 2.2373046875, 2.790771484375, 3.34423828125, 3.897705078125, 4.451171875, 5.004638671875, 5.55810546875, 6.111572265625, 6.6650390625, 7.218505859375, 7.77197265625, 8.325439453125, 8.87890625, 9.432373046875, 9.98583984375, 10.539306640625, 11.0927734375, 11.646240234375, 12.19970703125, 12.753173828125, 13.306640625, 13.860107421875, 14.41357421875, 14.967041015625, 15.5205078125, 16.073974609375, 16.62744140625, 17.180908203125, 17.734375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 11.0, 15.0, 9.0, 25.0, 29.0, 36.0, 77.0, 108.0, 152.0, 246.0, 359.0, 496.0, 740.0, 1029.0, 1728.0, 2619.0, 4010.0, 6256.0, 9672.0, 14930.0, 23196.0, 35439.0, 54964.0, 83637.0, 126830.0, 191589.0, 302599.0, 570544.0, 1452001.0, 1744678.0, 703139.0, 343388.0, 213872.0, 139537.0, 91538.0, 60722.0, 39114.0, 25412.0, 16488.0, 10200.0, 6798.0, 4587.0, 2945.0, 1910.0, 1312.0, 835.0, 530.0, 337.0, 253.0, 159.0, 108.0, 81.0, 57.0, 41.0, 25.0, 15.0, 6.0, 7.0, 5.0, 7.0, 1.0, 2.0], "bins": [-13.34375, -12.9149169921875, -12.486083984375, -12.0572509765625, -11.62841796875, -11.1995849609375, -10.770751953125, -10.3419189453125, -9.9130859375, -9.4842529296875, -9.055419921875, -8.6265869140625, -8.19775390625, -7.7689208984375, -7.340087890625, -6.9112548828125, -6.482421875, -6.0535888671875, -5.624755859375, -5.1959228515625, -4.76708984375, -4.3382568359375, -3.909423828125, -3.4805908203125, -3.0517578125, -2.6229248046875, -2.194091796875, -1.7652587890625, -1.33642578125, -0.9075927734375, -0.478759765625, -0.0499267578125, 0.37890625, 0.8077392578125, 1.236572265625, 1.6654052734375, 2.09423828125, 2.5230712890625, 2.951904296875, 3.3807373046875, 3.8095703125, 4.2384033203125, 4.667236328125, 5.0960693359375, 5.52490234375, 5.9537353515625, 6.382568359375, 6.8114013671875, 7.240234375, 7.6690673828125, 8.097900390625, 8.5267333984375, 8.95556640625, 9.3843994140625, 9.813232421875, 10.2420654296875, 10.6708984375, 11.0997314453125, 11.528564453125, 11.9573974609375, 12.38623046875, 12.8150634765625, 13.243896484375, 13.6727294921875, 14.1015625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 1.0, 3.0, 6.0, 2.0, 9.0, 8.0, 9.0, 14.0, 13.0, 25.0, 27.0, 26.0, 26.0, 28.0, 34.0, 42.0, 73.0, 90.0, 144.0, 251.0, 314.0, 271.0, 152.0, 103.0, 58.0, 47.0, 34.0, 32.0, 25.0, 31.0, 24.0, 26.0, 21.0, 12.0, 6.0, 6.0, 9.0, 8.0, 6.0, 6.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-25.9375, -25.11865234375, -24.2998046875, -23.48095703125, -22.662109375, -21.84326171875, -21.0244140625, -20.20556640625, -19.38671875, -18.56787109375, -17.7490234375, -16.93017578125, -16.111328125, -15.29248046875, -14.4736328125, -13.65478515625, -12.8359375, -12.01708984375, -11.1982421875, -10.37939453125, -9.560546875, -8.74169921875, -7.9228515625, -7.10400390625, -6.28515625, -5.46630859375, -4.6474609375, -3.82861328125, -3.009765625, -2.19091796875, -1.3720703125, -0.55322265625, 0.265625, 1.08447265625, 1.9033203125, 2.72216796875, 3.541015625, 4.35986328125, 5.1787109375, 5.99755859375, 6.81640625, 7.63525390625, 8.4541015625, 9.27294921875, 10.091796875, 10.91064453125, 11.7294921875, 12.54833984375, 13.3671875, 14.18603515625, 15.0048828125, 15.82373046875, 16.642578125, 17.46142578125, 18.2802734375, 19.09912109375, 19.91796875, 20.73681640625, 21.5556640625, 22.37451171875, 23.193359375, 24.01220703125, 24.8310546875, 25.64990234375, 26.46875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 2.0, 6.0, 10.0, 12.0, 21.0, 31.0, 37.0, 43.0, 37.0, 76.0, 107.0, 139.0, 189.0, 283.0, 425.0, 591.0, 877.0, 1431.0, 2295.0, 3721.0, 6124.0, 10288.0, 17645.0, 30668.0, 51835.0, 97919.0, 608979.0, 5182019.0, 128036.0, 61537.0, 34895.0, 20383.0, 11998.0, 7250.0, 4254.0, 2569.0, 1573.0, 949.0, 673.0, 398.0, 278.0, 205.0, 151.0, 94.0, 91.0, 81.0, 45.0, 32.0, 28.0, 26.0, 21.0, 20.0, 17.0, 5.0, 9.0, 5.0, 4.0, 0.0, 4.0, 2.0, 2.0], "bins": [-31.9375, -30.8779296875, -29.818359375, -28.7587890625, -27.69921875, -26.6396484375, -25.580078125, -24.5205078125, -23.4609375, -22.4013671875, -21.341796875, -20.2822265625, -19.22265625, -18.1630859375, -17.103515625, -16.0439453125, -14.984375, -13.9248046875, -12.865234375, -11.8056640625, -10.74609375, -9.6865234375, -8.626953125, -7.5673828125, -6.5078125, -5.4482421875, -4.388671875, -3.3291015625, -2.26953125, -1.2099609375, -0.150390625, 0.9091796875, 1.96875, 3.0283203125, 4.087890625, 5.1474609375, 6.20703125, 7.2666015625, 8.326171875, 9.3857421875, 10.4453125, 11.5048828125, 12.564453125, 13.6240234375, 14.68359375, 15.7431640625, 16.802734375, 17.8623046875, 18.921875, 19.9814453125, 21.041015625, 22.1005859375, 23.16015625, 24.2197265625, 25.279296875, 26.3388671875, 27.3984375, 28.4580078125, 29.517578125, 30.5771484375, 31.63671875, 32.6962890625, 33.755859375, 34.8154296875, 35.875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 11.0, 5.0, 15.0, 15.0, 18.0, 30.0, 30.0, 37.0, 40.0, 42.0, 49.0, 64.0, 124.0, 240.0, 463.0, 328.0, 114.0, 60.0, 53.0, 36.0, 38.0, 42.0, 42.0, 31.0, 21.0, 16.0, 12.0, 5.0, 10.0, 7.0, 6.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.03125, -40.5146484375, -38.998046875, -37.4814453125, -35.96484375, -34.4482421875, -32.931640625, -31.4150390625, -29.8984375, -28.3818359375, -26.865234375, -25.3486328125, -23.83203125, -22.3154296875, -20.798828125, -19.2822265625, -17.765625, -16.2490234375, -14.732421875, -13.2158203125, -11.69921875, -10.1826171875, -8.666015625, -7.1494140625, -5.6328125, -4.1162109375, -2.599609375, -1.0830078125, 0.43359375, 1.9501953125, 3.466796875, 4.9833984375, 6.5, 8.0166015625, 9.533203125, 11.0498046875, 12.56640625, 14.0830078125, 15.599609375, 17.1162109375, 18.6328125, 20.1494140625, 21.666015625, 23.1826171875, 24.69921875, 26.2158203125, 27.732421875, 29.2490234375, 30.765625, 32.2822265625, 33.798828125, 35.3154296875, 36.83203125, 38.3486328125, 39.865234375, 41.3818359375, 42.8984375, 44.4150390625, 45.931640625, 47.4482421875, 48.96484375, 50.4814453125, 51.998046875, 53.5146484375, 55.03125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 8.0, 13.0, 0.0, 8.0, 12.0, 9.0, 13.0, 15.0, 17.0, 29.0, 30.0, 33.0, 41.0, 43.0, 66.0, 94.0, 113.0, 93.0, 62.0, 62.0, 41.0, 37.0, 29.0, 26.0, 21.0, 17.0, 20.0, 13.0, 10.0, 6.0, 7.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-730.33349609375, -710.9607543945312, -691.5879516601562, -672.2152099609375, -652.8424072265625, -633.4696655273438, -614.096923828125, -594.72412109375, -575.3513793945312, -555.9786376953125, -536.6058349609375, -517.2330932617188, -497.8603210449219, -478.487548828125, -459.1147766113281, -439.74200439453125, -420.3692321777344, -400.9964599609375, -381.6236877441406, -362.25091552734375, -342.878173828125, -323.5054016113281, -304.13262939453125, -284.7598876953125, -265.3870849609375, -246.01431274414062, -226.6415557861328, -207.26878356933594, -187.89602661132812, -168.52325439453125, -149.15048217773438, -129.77772521972656, -110.40496826171875, -91.0322036743164, -71.65943908691406, -52.28666687011719, -32.913902282714844, -13.5411376953125, 5.831634521484375, 25.204391479492188, 44.57716369628906, 63.949928283691406, 83.32269287109375, 102.69546508789062, 122.06822967529297, 141.4409942626953, 160.8137664794922, 180.1865234375, 199.55929565429688, 218.93206787109375, 238.30482482910156, 257.6776123046875, 277.05035400390625, 296.4231262207031, 315.7958984375, 335.16864013671875, 354.54144287109375, 373.9142150878906, 393.2869873046875, 412.65972900390625, 432.0325012207031, 451.4052734375, 470.7780456542969, 490.15081787109375, 509.5235595703125]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 1.0, 8.0, 4.0, 6.0, 6.0, 15.0, 10.0, 18.0, 17.0, 15.0, 21.0, 24.0, 20.0, 32.0, 29.0, 30.0, 31.0, 70.0, 99.0, 103.0, 101.0, 71.0, 32.0, 33.0, 39.0, 16.0, 26.0, 18.0, 18.0, 16.0, 17.0, 10.0, 9.0, 9.0, 7.0, 8.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-839.3432006835938, -814.9786376953125, -790.614013671875, -766.2494506835938, -741.8848876953125, -717.520263671875, -693.1557006835938, -668.7911376953125, -644.426513671875, -620.0619506835938, -595.6973266601562, -571.332763671875, -546.9681396484375, -522.6035766601562, -498.239013671875, -473.8744201660156, -449.50982666015625, -425.1452331542969, -400.7806396484375, -376.41607666015625, -352.0514831542969, -327.6868896484375, -303.32232666015625, -278.9577331542969, -254.5931396484375, -230.22854614257812, -205.8639678955078, -181.4993896484375, -157.13479614257812, -132.77020263671875, -108.40562438964844, -84.04104614257812, -59.6763916015625, -35.311805725097656, -10.947219848632812, 13.417366027832031, 37.781951904296875, 62.14653778076172, 86.51112365722656, 110.87570190429688, 135.24029541015625, 159.60488891601562, 183.96946716308594, 208.33404541015625, 232.69863891601562, 257.063232421875, 281.42779541015625, 305.7923889160156, 330.156982421875, 354.5215759277344, 378.88616943359375, 403.250732421875, 427.6153259277344, 451.97991943359375, 476.344482421875, 500.7090759277344, 525.0736694335938, 549.438232421875, 573.8028564453125, 598.1674194335938, 622.531982421875, 646.8966064453125, 671.2611694335938, 695.625732421875, 719.9903564453125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 6.0, 7.0, 16.0, 18.0, 28.0, 49.0, 81.0, 94.0, 163.0, 232.0, 370.0, 596.0, 928.0, 1639.0, 3040.0, 5427.0, 11081.0, 26577.0, 82317.0, 532773.0, 3206228.0, 224066.0, 54501.0, 20886.0, 10032.0, 5298.0, 2894.0, 1733.0, 1062.0, 659.0, 499.0, 304.0, 201.0, 115.0, 105.0, 72.0, 60.0, 38.0, 30.0, 25.0, 19.0, 5.0, 7.0, 8.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.24609375, -4.07843017578125, -3.9107666015625, -3.74310302734375, -3.575439453125, -3.40777587890625, -3.2401123046875, -3.07244873046875, -2.90478515625, -2.73712158203125, -2.5694580078125, -2.40179443359375, -2.234130859375, -2.06646728515625, -1.8988037109375, -1.73114013671875, -1.5634765625, -1.39581298828125, -1.2281494140625, -1.06048583984375, -0.892822265625, -0.72515869140625, -0.5574951171875, -0.38983154296875, -0.22216796875, -0.05450439453125, 0.1131591796875, 0.28082275390625, 0.448486328125, 0.61614990234375, 0.7838134765625, 0.95147705078125, 1.119140625, 1.28680419921875, 1.4544677734375, 1.62213134765625, 1.789794921875, 1.95745849609375, 2.1251220703125, 2.29278564453125, 2.46044921875, 2.62811279296875, 2.7957763671875, 2.96343994140625, 3.131103515625, 3.29876708984375, 3.4664306640625, 3.63409423828125, 3.8017578125, 3.96942138671875, 4.1370849609375, 4.30474853515625, 4.472412109375, 4.64007568359375, 4.8077392578125, 4.97540283203125, 5.14306640625, 5.31072998046875, 5.4783935546875, 5.64605712890625, 5.813720703125, 5.98138427734375, 6.1490478515625, 6.31671142578125, 6.484375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 10.0, 6.0, 11.0, 17.0, 20.0, 35.0, 67.0, 88.0, 129.0, 194.0, 139.0, 94.0, 73.0, 29.0, 17.0, 17.0, 12.0, 11.0, 6.0, 5.0, 3.0, 7.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85546875, -0.8222198486328125, -0.788970947265625, -0.7557220458984375, -0.72247314453125, -0.6892242431640625, -0.655975341796875, -0.6227264404296875, -0.5894775390625, -0.5562286376953125, -0.522979736328125, -0.4897308349609375, -0.45648193359375, -0.4232330322265625, -0.389984130859375, -0.3567352294921875, -0.323486328125, -0.2902374267578125, -0.256988525390625, -0.2237396240234375, -0.19049072265625, -0.1572418212890625, -0.123992919921875, -0.0907440185546875, -0.0574951171875, -0.0242462158203125, 0.009002685546875, 0.0422515869140625, 0.07550048828125, 0.1087493896484375, 0.141998291015625, 0.1752471923828125, 0.20849609375, 0.2417449951171875, 0.274993896484375, 0.3082427978515625, 0.34149169921875, 0.3747406005859375, 0.407989501953125, 0.4412384033203125, 0.4744873046875, 0.5077362060546875, 0.540985107421875, 0.5742340087890625, 0.60748291015625, 0.6407318115234375, 0.673980712890625, 0.7072296142578125, 0.740478515625, 0.7737274169921875, 0.806976318359375, 0.8402252197265625, 0.87347412109375, 0.9067230224609375, 0.939971923828125, 0.9732208251953125, 1.0064697265625, 1.0397186279296875, 1.072967529296875, 1.1062164306640625, 1.13946533203125, 1.1727142333984375, 1.205963134765625, 1.2392120361328125, 1.2724609375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 7.0, 15.0, 16.0, 16.0, 28.0, 48.0, 79.0, 163.0, 232.0, 354.0, 664.0, 1335.0, 3082.0, 7633.0, 22568.0, 82949.0, 401752.0, 2532946.0, 921821.0, 159799.0, 38903.0, 11702.0, 4277.0, 1882.0, 897.0, 472.0, 250.0, 147.0, 83.0, 51.0, 41.0, 21.0, 11.0, 6.0, 13.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.15234375, -5.97515869140625, -5.7979736328125, -5.62078857421875, -5.443603515625, -5.26641845703125, -5.0892333984375, -4.91204833984375, -4.73486328125, -4.55767822265625, -4.3804931640625, -4.20330810546875, -4.026123046875, -3.84893798828125, -3.6717529296875, -3.49456787109375, -3.3173828125, -3.14019775390625, -2.9630126953125, -2.78582763671875, -2.608642578125, -2.43145751953125, -2.2542724609375, -2.07708740234375, -1.89990234375, -1.72271728515625, -1.5455322265625, -1.36834716796875, -1.191162109375, -1.01397705078125, -0.8367919921875, -0.65960693359375, -0.482421875, -0.30523681640625, -0.1280517578125, 0.04913330078125, 0.226318359375, 0.40350341796875, 0.5806884765625, 0.75787353515625, 0.93505859375, 1.11224365234375, 1.2894287109375, 1.46661376953125, 1.643798828125, 1.82098388671875, 1.9981689453125, 2.17535400390625, 2.3525390625, 2.52972412109375, 2.7069091796875, 2.88409423828125, 3.061279296875, 3.23846435546875, 3.4156494140625, 3.59283447265625, 3.77001953125, 3.94720458984375, 4.1243896484375, 4.30157470703125, 4.478759765625, 4.65594482421875, 4.8331298828125, 5.01031494140625, 5.1875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 2.0, 12.0, 19.0, 31.0, 31.0, 47.0, 60.0, 104.0, 118.0, 185.0, 261.0, 369.0, 626.0, 842.0, 416.0, 306.0, 199.0, 110.0, 83.0, 76.0, 54.0, 24.0, 28.0, 25.0, 9.0, 6.0, 6.0, 7.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.4921875, -2.430206298828125, -2.36822509765625, -2.306243896484375, -2.2442626953125, -2.182281494140625, -2.12030029296875, -2.058319091796875, -1.996337890625, -1.934356689453125, -1.87237548828125, -1.810394287109375, -1.7484130859375, -1.686431884765625, -1.62445068359375, -1.562469482421875, -1.50048828125, -1.438507080078125, -1.37652587890625, -1.314544677734375, -1.2525634765625, -1.190582275390625, -1.12860107421875, -1.066619873046875, -1.004638671875, -0.942657470703125, -0.88067626953125, -0.818695068359375, -0.7567138671875, -0.694732666015625, -0.63275146484375, -0.570770263671875, -0.5087890625, -0.446807861328125, -0.38482666015625, -0.322845458984375, -0.2608642578125, -0.198883056640625, -0.13690185546875, -0.074920654296875, -0.012939453125, 0.049041748046875, 0.11102294921875, 0.173004150390625, 0.2349853515625, 0.296966552734375, 0.35894775390625, 0.420928955078125, 0.48291015625, 0.544891357421875, 0.60687255859375, 0.668853759765625, 0.7308349609375, 0.792816162109375, 0.85479736328125, 0.916778564453125, 0.978759765625, 1.040740966796875, 1.10272216796875, 1.164703369140625, 1.2266845703125, 1.288665771484375, 1.35064697265625, 1.412628173828125, 1.474609375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 6.0, 16.0, 23.0, 34.0, 57.0, 82.0, 138.0, 171.0, 156.0, 117.0, 95.0, 57.0, 23.0, 8.0, 11.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.68655776977539, -15.034500122070312, -14.382442474365234, -13.730384826660156, -13.078327178955078, -12.42626953125, -11.774210929870605, -11.122153282165527, -10.47009563446045, -9.818037986755371, -9.165980339050293, -8.513922691345215, -7.8618645668029785, -7.2098069190979, -6.557748794555664, -5.905691146850586, -5.253633499145508, -4.60157585144043, -3.9495179653167725, -3.2974600791931152, -2.645402431488037, -1.993344783782959, -1.3412868976593018, -0.6892290115356445, -0.037171363830566406, 0.6148864030838013, 1.266944169998169, 1.9190019369125366, 2.5710597038269043, 3.2231173515319824, 3.8751752376556396, 4.527233123779297, 5.179288864135742, 5.83134651184082, 6.483404159545898, 7.135462284088135, 7.787519931793213, 8.439577102661133, 9.091635704040527, 9.743693351745605, 10.395750999450684, 11.047808647155762, 11.69986629486084, 12.351923942565918, 13.003982543945312, 13.65604019165039, 14.308097839355469, 14.960155487060547, 15.612213134765625, 16.264270782470703, 16.91632843017578, 17.56838607788086, 18.220443725585938, 18.872501373291016, 19.524559020996094, 20.176616668701172, 20.82867431640625, 21.480731964111328, 22.132789611816406, 22.784847259521484, 23.436904907226562, 24.08896255493164, 24.74102020263672, 25.393077850341797, 26.045137405395508]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 6.0, 10.0, 16.0, 9.0, 19.0, 23.0, 18.0, 21.0, 32.0, 22.0, 31.0, 37.0, 38.0, 50.0, 51.0, 47.0, 59.0, 48.0, 52.0, 44.0, 47.0, 60.0, 60.0, 33.0, 21.0, 23.0, 22.0, 14.0, 19.0, 13.0, 21.0, 5.0, 5.0, 5.0, 6.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.358121871948242, -10.051459312438965, -9.744796752929688, -9.43813419342041, -9.131471633911133, -8.824809074401855, -8.518146514892578, -8.2114839553833, -7.904821395874023, -7.598158836364746, -7.291496276855469, -6.984833717346191, -6.678171157836914, -6.371508598327637, -6.064846038818359, -5.758183479309082, -5.451521396636963, -5.1448588371276855, -4.838196277618408, -4.531533718109131, -4.2248711585998535, -3.918208599090576, -3.611546277999878, -3.3048837184906006, -2.9982211589813232, -2.691558599472046, -2.3848960399627686, -2.0782337188720703, -1.7715710401535034, -1.464908480644226, -1.1582460403442383, -0.8515834808349609, -0.5449209213256836, -0.23825839161872864, 0.06840413808822632, 0.3750666379928589, 0.6817291975021362, 0.9883917570114136, 1.2950541973114014, 1.6017167568206787, 1.908379316329956, 2.2150418758392334, 2.5217044353485107, 2.828366756439209, 3.1350293159484863, 3.4416918754577637, 3.748354434967041, 4.055016994476318, 4.361679553985596, 4.668342113494873, 4.97500467300415, 5.281667232513428, 5.588329792022705, 5.894992351531982, 6.201654434204102, 6.508316993713379, 6.814979553222656, 7.121642112731934, 7.428304672241211, 7.734967231750488, 8.041629791259766, 8.348292350769043, 8.65495491027832, 8.961617469787598, 9.268280029296875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 10.0, 16.0, 24.0, 23.0, 40.0, 43.0, 73.0, 112.0, 171.0, 264.0, 387.0, 666.0, 1228.0, 2096.0, 4181.0, 9246.0, 23411.0, 84268.0, 495328.0, 333529.0, 59435.0, 18269.0, 7444.0, 3663.0, 1907.0, 1027.0, 637.0, 381.0, 217.0, 157.0, 81.0, 60.0, 37.0, 38.0, 23.0, 18.0, 10.0, 12.0, 6.0, 5.0, 4.0, 2.0, 6.0, 2.0, 1.0], "bins": [-3.30859375, -3.22125244140625, -3.1339111328125, -3.04656982421875, -2.959228515625, -2.87188720703125, -2.7845458984375, -2.69720458984375, -2.60986328125, -2.52252197265625, -2.4351806640625, -2.34783935546875, -2.260498046875, -2.17315673828125, -2.0858154296875, -1.99847412109375, -1.9111328125, -1.82379150390625, -1.7364501953125, -1.64910888671875, -1.561767578125, -1.47442626953125, -1.3870849609375, -1.29974365234375, -1.21240234375, -1.12506103515625, -1.0377197265625, -0.95037841796875, -0.863037109375, -0.77569580078125, -0.6883544921875, -0.60101318359375, -0.513671875, -0.42633056640625, -0.3389892578125, -0.25164794921875, -0.164306640625, -0.07696533203125, 0.0103759765625, 0.09771728515625, 0.18505859375, 0.27239990234375, 0.3597412109375, 0.44708251953125, 0.534423828125, 0.62176513671875, 0.7091064453125, 0.79644775390625, 0.8837890625, 0.97113037109375, 1.0584716796875, 1.14581298828125, 1.233154296875, 1.32049560546875, 1.4078369140625, 1.49517822265625, 1.58251953125, 1.66986083984375, 1.7572021484375, 1.84454345703125, 1.931884765625, 2.01922607421875, 2.1065673828125, 2.19390869140625, 2.28125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 2.0, 3.0, 6.0, 10.0, 13.0, 12.0, 34.0, 44.0, 62.0, 79.0, 118.0, 123.0, 131.0, 99.0, 92.0, 44.0, 39.0, 15.0, 18.0, 14.0, 9.0, 9.0, 6.0, 5.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80029296875, -0.7683181762695312, -0.7363433837890625, -0.7043685913085938, -0.672393798828125, -0.6404190063476562, -0.6084442138671875, -0.5764694213867188, -0.54449462890625, -0.5125198364257812, -0.4805450439453125, -0.44857025146484375, -0.416595458984375, -0.38462066650390625, -0.3526458740234375, -0.32067108154296875, -0.2886962890625, -0.25672149658203125, -0.2247467041015625, -0.19277191162109375, -0.160797119140625, -0.12882232666015625, -0.0968475341796875, -0.06487274169921875, -0.03289794921875, -0.00092315673828125, 0.0310516357421875, 0.06302642822265625, 0.095001220703125, 0.12697601318359375, 0.1589508056640625, 0.19092559814453125, 0.222900390625, 0.25487518310546875, 0.2868499755859375, 0.31882476806640625, 0.350799560546875, 0.38277435302734375, 0.4147491455078125, 0.44672393798828125, 0.47869873046875, 0.5106735229492188, 0.5426483154296875, 0.5746231079101562, 0.606597900390625, 0.6385726928710938, 0.6705474853515625, 0.7025222778320312, 0.7344970703125, 0.7664718627929688, 0.7984466552734375, 0.8304214477539062, 0.862396240234375, 0.8943710327148438, 0.9263458251953125, 0.9583206176757812, 0.99029541015625, 1.0222702026367188, 1.0542449951171875, 1.0862197875976562, 1.118194580078125, 1.1501693725585938, 1.1821441650390625, 1.2141189575195312, 1.24609375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 10.0, 12.0, 23.0, 22.0, 44.0, 61.0, 112.0, 204.0, 339.0, 711.0, 1589.0, 3688.0, 9549.0, 28932.0, 110612.0, 509717.0, 290696.0, 62809.0, 18143.0, 6367.0, 2485.0, 1180.0, 561.0, 299.0, 157.0, 87.0, 48.0, 34.0, 20.0, 17.0, 4.0, 5.0, 6.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.5703125, -3.458038330078125, -3.34576416015625, -3.233489990234375, -3.1212158203125, -3.008941650390625, -2.89666748046875, -2.784393310546875, -2.672119140625, -2.559844970703125, -2.44757080078125, -2.335296630859375, -2.2230224609375, -2.110748291015625, -1.99847412109375, -1.886199951171875, -1.77392578125, -1.661651611328125, -1.54937744140625, -1.437103271484375, -1.3248291015625, -1.212554931640625, -1.10028076171875, -0.988006591796875, -0.875732421875, -0.763458251953125, -0.65118408203125, -0.538909912109375, -0.4266357421875, -0.314361572265625, -0.20208740234375, -0.089813232421875, 0.0224609375, 0.134735107421875, 0.24700927734375, 0.359283447265625, 0.4715576171875, 0.583831787109375, 0.69610595703125, 0.808380126953125, 0.920654296875, 1.032928466796875, 1.14520263671875, 1.257476806640625, 1.3697509765625, 1.482025146484375, 1.59429931640625, 1.706573486328125, 1.81884765625, 1.931121826171875, 2.04339599609375, 2.155670166015625, 2.2679443359375, 2.380218505859375, 2.49249267578125, 2.604766845703125, 2.717041015625, 2.829315185546875, 2.94158935546875, 3.053863525390625, 3.1661376953125, 3.278411865234375, 3.39068603515625, 3.502960205078125, 3.615234375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 4.0, 9.0, 6.0, 10.0, 15.0, 12.0, 18.0, 26.0, 23.0, 24.0, 26.0, 27.0, 32.0, 37.0, 35.0, 41.0, 32.0, 57.0, 52.0, 45.0, 48.0, 47.0, 43.0, 38.0, 29.0, 33.0, 27.0, 25.0, 22.0, 30.0, 24.0, 22.0, 13.0, 15.0, 12.0, 11.0, 5.0, 6.0, 3.0, 8.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.77734375, -2.68707275390625, -2.5968017578125, -2.50653076171875, -2.416259765625, -2.32598876953125, -2.2357177734375, -2.14544677734375, -2.05517578125, -1.96490478515625, -1.8746337890625, -1.78436279296875, -1.694091796875, -1.60382080078125, -1.5135498046875, -1.42327880859375, -1.3330078125, -1.24273681640625, -1.1524658203125, -1.06219482421875, -0.971923828125, -0.88165283203125, -0.7913818359375, -0.70111083984375, -0.61083984375, -0.52056884765625, -0.4302978515625, -0.34002685546875, -0.249755859375, -0.15948486328125, -0.0692138671875, 0.02105712890625, 0.111328125, 0.20159912109375, 0.2918701171875, 0.38214111328125, 0.472412109375, 0.56268310546875, 0.6529541015625, 0.74322509765625, 0.83349609375, 0.92376708984375, 1.0140380859375, 1.10430908203125, 1.194580078125, 1.28485107421875, 1.3751220703125, 1.46539306640625, 1.5556640625, 1.64593505859375, 1.7362060546875, 1.82647705078125, 1.916748046875, 2.00701904296875, 2.0972900390625, 2.18756103515625, 2.27783203125, 2.36810302734375, 2.4583740234375, 2.54864501953125, 2.638916015625, 2.72918701171875, 2.8194580078125, 2.90972900390625, 3.0]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 10.0, 13.0, 10.0, 13.0, 12.0, 9.0, 26.0, 24.0, 49.0, 68.0, 98.0, 155.0, 243.0, 363.0, 678.0, 1174.0, 2344.0, 4898.0, 12078.0, 35838.0, 151320.0, 521653.0, 237528.0, 51587.0, 16093.0, 6206.0, 2713.0, 1331.0, 728.0, 432.0, 290.0, 179.0, 100.0, 73.0, 47.0, 49.0, 32.0, 28.0, 11.0, 15.0, 5.0, 3.0, 5.0, 5.0, 3.0, 3.0, 2.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.998046875, -1.930633544921875, -1.86322021484375, -1.795806884765625, -1.7283935546875, -1.660980224609375, -1.59356689453125, -1.526153564453125, -1.458740234375, -1.391326904296875, -1.32391357421875, -1.256500244140625, -1.1890869140625, -1.121673583984375, -1.05426025390625, -0.986846923828125, -0.91943359375, -0.852020263671875, -0.78460693359375, -0.717193603515625, -0.6497802734375, -0.582366943359375, -0.51495361328125, -0.447540283203125, -0.380126953125, -0.312713623046875, -0.24530029296875, -0.177886962890625, -0.1104736328125, -0.043060302734375, 0.02435302734375, 0.091766357421875, 0.1591796875, 0.226593017578125, 0.29400634765625, 0.361419677734375, 0.4288330078125, 0.496246337890625, 0.56365966796875, 0.631072998046875, 0.698486328125, 0.765899658203125, 0.83331298828125, 0.900726318359375, 0.9681396484375, 1.035552978515625, 1.10296630859375, 1.170379638671875, 1.23779296875, 1.305206298828125, 1.37261962890625, 1.440032958984375, 1.5074462890625, 1.574859619140625, 1.64227294921875, 1.709686279296875, 1.777099609375, 1.844512939453125, 1.91192626953125, 1.979339599609375, 2.0467529296875, 2.114166259765625, 2.18157958984375, 2.248992919921875, 2.31640625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 6.0, 9.0, 16.0, 22.0, 26.0, 34.0, 42.0, 61.0, 68.0, 68.0, 94.0, 108.0, 104.0, 92.0, 53.0, 43.0, 31.0, 32.0, 28.0, 16.0, 16.0, 4.0, 10.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011456012725830078, -0.00011065416038036346, -0.00010674819350242615, -0.00010284222662448883, -9.893625974655151e-05, -9.50302928686142e-05, -9.112432599067688e-05, -8.721835911273956e-05, -8.331239223480225e-05, -7.940642535686493e-05, -7.550045847892761e-05, -7.15944916009903e-05, -6.768852472305298e-05, -6.378255784511566e-05, -5.9876590967178345e-05, -5.597062408924103e-05, -5.206465721130371e-05, -4.8158690333366394e-05, -4.425272345542908e-05, -4.034675657749176e-05, -3.644078969955444e-05, -3.2534822821617126e-05, -2.862885594367981e-05, -2.4722889065742493e-05, -2.0816922187805176e-05, -1.691095530986786e-05, -1.3004988431930542e-05, -9.099021553993225e-06, -5.193054676055908e-06, -1.2870877981185913e-06, 2.6188790798187256e-06, 6.5248459577560425e-06, 1.043081283569336e-05, 1.4336779713630676e-05, 1.8242746591567993e-05, 2.214871346950531e-05, 2.6054680347442627e-05, 2.9960647225379944e-05, 3.386661410331726e-05, 3.777258098125458e-05, 4.1678547859191895e-05, 4.558451473712921e-05, 4.949048161506653e-05, 5.3396448493003845e-05, 5.730241537094116e-05, 6.120838224887848e-05, 6.51143491268158e-05, 6.902031600475311e-05, 7.292628288269043e-05, 7.683224976062775e-05, 8.073821663856506e-05, 8.464418351650238e-05, 8.85501503944397e-05, 9.245611727237701e-05, 9.636208415031433e-05, 0.00010026805102825165, 0.00010417401790618896, 0.00010807998478412628, 0.0001119859516620636, 0.00011589191854000092, 0.00011979788541793823, 0.00012370385229587555, 0.00012760981917381287, 0.00013151578605175018, 0.0001354217529296875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 7.0, 1.0, 0.0, 4.0, 2.0, 9.0, 8.0, 8.0, 16.0, 13.0, 27.0, 32.0, 43.0, 91.0, 121.0, 200.0, 307.0, 505.0, 875.0, 1603.0, 3014.0, 5969.0, 13248.0, 33284.0, 98428.0, 303370.0, 379698.0, 132654.0, 43236.0, 16461.0, 7270.0, 3467.0, 1865.0, 1015.0, 610.0, 380.0, 241.0, 168.0, 101.0, 61.0, 40.0, 34.0, 23.0, 19.0, 12.0, 7.0, 6.0, 6.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.8466796875, -1.7909393310546875, -1.735198974609375, -1.6794586181640625, -1.62371826171875, -1.5679779052734375, -1.512237548828125, -1.4564971923828125, -1.4007568359375, -1.3450164794921875, -1.289276123046875, -1.2335357666015625, -1.17779541015625, -1.1220550537109375, -1.066314697265625, -1.0105743408203125, -0.954833984375, -0.8990936279296875, -0.843353271484375, -0.7876129150390625, -0.73187255859375, -0.6761322021484375, -0.620391845703125, -0.5646514892578125, -0.5089111328125, -0.4531707763671875, -0.397430419921875, -0.3416900634765625, -0.28594970703125, -0.2302093505859375, -0.174468994140625, -0.1187286376953125, -0.06298828125, -0.0072479248046875, 0.048492431640625, 0.1042327880859375, 0.15997314453125, 0.2157135009765625, 0.271453857421875, 0.3271942138671875, 0.3829345703125, 0.4386749267578125, 0.494415283203125, 0.5501556396484375, 0.60589599609375, 0.6616363525390625, 0.717376708984375, 0.7731170654296875, 0.828857421875, 0.8845977783203125, 0.940338134765625, 0.9960784912109375, 1.05181884765625, 1.1075592041015625, 1.163299560546875, 1.2190399169921875, 1.2747802734375, 1.3305206298828125, 1.386260986328125, 1.4420013427734375, 1.49774169921875, 1.5534820556640625, 1.609222412109375, 1.6649627685546875, 1.720703125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 0.0, 7.0, 4.0, 4.0, 6.0, 9.0, 11.0, 14.0, 17.0, 32.0, 25.0, 28.0, 32.0, 45.0, 58.0, 46.0, 64.0, 61.0, 58.0, 76.0, 63.0, 58.0, 44.0, 44.0, 32.0, 32.0, 26.0, 21.0, 24.0, 15.0, 11.0, 10.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3076171875, -1.2652740478515625, -1.222930908203125, -1.1805877685546875, -1.13824462890625, -1.0959014892578125, -1.053558349609375, -1.0112152099609375, -0.9688720703125, -0.9265289306640625, -0.884185791015625, -0.8418426513671875, -0.79949951171875, -0.7571563720703125, -0.714813232421875, -0.6724700927734375, -0.630126953125, -0.5877838134765625, -0.545440673828125, -0.5030975341796875, -0.46075439453125, -0.4184112548828125, -0.376068115234375, -0.3337249755859375, -0.2913818359375, -0.2490386962890625, -0.206695556640625, -0.1643524169921875, -0.12200927734375, -0.0796661376953125, -0.037322998046875, 0.0050201416015625, 0.04736328125, 0.0897064208984375, 0.132049560546875, 0.1743927001953125, 0.21673583984375, 0.2590789794921875, 0.301422119140625, 0.3437652587890625, 0.3861083984375, 0.4284515380859375, 0.470794677734375, 0.5131378173828125, 0.55548095703125, 0.5978240966796875, 0.640167236328125, 0.6825103759765625, 0.724853515625, 0.7671966552734375, 0.809539794921875, 0.8518829345703125, 0.89422607421875, 0.9365692138671875, 0.978912353515625, 1.0212554931640625, 1.0635986328125, 1.1059417724609375, 1.148284912109375, 1.1906280517578125, 1.23297119140625, 1.2753143310546875, 1.317657470703125, 1.3600006103515625, 1.40234375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 6.0, 11.0, 6.0, 12.0, 34.0, 68.0, 172.0, 335.0, 218.0, 79.0, 34.0, 16.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.97271728515625, -53.387969970703125, -51.803226470947266, -50.21847915649414, -48.633731842041016, -47.048988342285156, -45.46424102783203, -43.879493713378906, -42.29474639892578, -40.709999084472656, -39.1252555847168, -37.54050827026367, -35.95576095581055, -34.37101745605469, -32.78627014160156, -31.201522827148438, -29.616779327392578, -28.032033920288086, -26.44728660583496, -24.86254119873047, -23.277793884277344, -21.69304847717285, -20.10830307006836, -18.523555755615234, -16.938810348510742, -15.354063987731934, -13.769317626953125, -12.184572219848633, -10.599825859069824, -9.015079498291016, -7.430334091186523, -5.845587730407715, -4.260837554931641, -2.676091432571411, -1.0913453102111816, 0.49340057373046875, 2.0781469345092773, 3.662893295288086, 5.247638702392578, 6.832385063171387, 8.417131423950195, 10.001877784729004, 11.586624145507812, 13.171369552612305, 14.756115913391113, 16.340862274169922, 17.925607681274414, 19.510353088378906, 21.09510040283203, 22.679845809936523, 24.26459312438965, 25.84933853149414, 27.434085845947266, 29.018831253051758, 30.60357666015625, 32.188323974609375, 33.7730712890625, 35.357818603515625, 36.942562103271484, 38.52730941772461, 40.112056732177734, 41.696800231933594, 43.28154754638672, 44.866294860839844, 46.4510383605957]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 0.0, 0.0, 5.0, 4.0, 5.0, 19.0, 11.0, 10.0, 24.0, 54.0, 62.0, 81.0, 114.0, 120.0, 118.0, 97.0, 84.0, 61.0, 38.0, 13.0, 15.0, 10.0, 8.0, 6.0, 1.0, 7.0, 11.0, 2.0, 4.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-56.30928039550781, -54.824920654296875, -53.34056091308594, -51.856197357177734, -50.3718376159668, -48.88747787475586, -47.403114318847656, -45.91875457763672, -44.43439483642578, -42.950035095214844, -41.465675354003906, -39.9813117980957, -38.496952056884766, -37.01259231567383, -35.528228759765625, -34.04386901855469, -32.55950927734375, -31.075149536132812, -29.590787887573242, -28.106426239013672, -26.622066497802734, -25.137706756591797, -23.653345108032227, -22.168983459472656, -20.68462371826172, -19.20026397705078, -17.71590232849121, -16.23154067993164, -14.747180938720703, -13.26282024383545, -11.778459548950195, -10.294098854064941, -8.809734344482422, -7.325373649597168, -5.841012954711914, -4.35665225982666, -2.8722915649414062, -1.3879308700561523, 0.09642982482910156, 1.5807905197143555, 3.0651512145996094, 4.549511909484863, 6.033872604370117, 7.518233299255371, 9.002593994140625, 10.486954689025879, 11.971315383911133, 13.455676078796387, 14.94003677368164, 16.424396514892578, 17.90875816345215, 19.39311981201172, 20.877479553222656, 22.361839294433594, 23.846200942993164, 25.330562591552734, 26.814922332763672, 28.29928207397461, 29.78364372253418, 31.26800537109375, 32.75236511230469, 34.236724853515625, 35.72108459472656, 37.205448150634766, 38.6898078918457]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 7.0, 5.0, 6.0, 6.0, 12.0, 30.0, 56.0, 82.0, 154.0, 296.0, 629.0, 1422.0, 3709.0, 14154.0, 100706.0, 3895825.0, 150815.0, 18025.0, 4873.0, 1754.0, 808.0, 348.0, 225.0, 118.0, 72.0, 54.0, 27.0, 25.0, 13.0, 10.0, 3.0, 5.0, 2.0, 1.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.609375, -13.133056640625, -12.65673828125, -12.180419921875, -11.7041015625, -11.227783203125, -10.75146484375, -10.275146484375, -9.798828125, -9.322509765625, -8.84619140625, -8.369873046875, -7.8935546875, -7.417236328125, -6.94091796875, -6.464599609375, -5.98828125, -5.511962890625, -5.03564453125, -4.559326171875, -4.0830078125, -3.606689453125, -3.13037109375, -2.654052734375, -2.177734375, -1.701416015625, -1.22509765625, -0.748779296875, -0.2724609375, 0.203857421875, 0.68017578125, 1.156494140625, 1.6328125, 2.109130859375, 2.58544921875, 3.061767578125, 3.5380859375, 4.014404296875, 4.49072265625, 4.967041015625, 5.443359375, 5.919677734375, 6.39599609375, 6.872314453125, 7.3486328125, 7.824951171875, 8.30126953125, 8.777587890625, 9.25390625, 9.730224609375, 10.20654296875, 10.682861328125, 11.1591796875, 11.635498046875, 12.11181640625, 12.588134765625, 13.064453125, 13.540771484375, 14.01708984375, 14.493408203125, 14.9697265625, 15.446044921875, 15.92236328125, 16.398681640625, 16.875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 1.0, 9.0, 17.0, 19.0, 31.0, 37.0, 49.0, 70.0, 89.0, 101.0, 104.0, 101.0, 99.0, 70.0, 51.0, 37.0, 27.0, 16.0, 18.0, 16.0, 4.0, 7.0, 5.0, 5.0, 0.0, 5.0, 3.0, 1.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76220703125, -0.7337722778320312, -0.7053375244140625, -0.6769027709960938, -0.648468017578125, -0.6200332641601562, -0.5915985107421875, -0.5631637573242188, -0.53472900390625, -0.5062942504882812, -0.4778594970703125, -0.44942474365234375, -0.420989990234375, -0.39255523681640625, -0.3641204833984375, -0.33568572998046875, -0.3072509765625, -0.27881622314453125, -0.2503814697265625, -0.22194671630859375, -0.193511962890625, -0.16507720947265625, -0.1366424560546875, -0.10820770263671875, -0.07977294921875, -0.05133819580078125, -0.0229034423828125, 0.00553131103515625, 0.033966064453125, 0.06240081787109375, 0.0908355712890625, 0.11927032470703125, 0.147705078125, 0.17613983154296875, 0.2045745849609375, 0.23300933837890625, 0.261444091796875, 0.28987884521484375, 0.3183135986328125, 0.34674835205078125, 0.37518310546875, 0.40361785888671875, 0.4320526123046875, 0.46048736572265625, 0.488922119140625, 0.5173568725585938, 0.5457916259765625, 0.5742263793945312, 0.6026611328125, 0.6310958862304688, 0.6595306396484375, 0.6879653930664062, 0.716400146484375, 0.7448348999023438, 0.7732696533203125, 0.8017044067382812, 0.83013916015625, 0.8585739135742188, 0.8870086669921875, 0.9154434204101562, 0.943878173828125, 0.9723129272460938, 1.0007476806640625, 1.0291824340820312, 1.0576171875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 11.0, 8.0, 21.0, 26.0, 31.0, 66.0, 86.0, 131.0, 264.0, 455.0, 747.0, 1570.0, 3211.0, 7298.0, 19350.0, 64361.0, 341123.0, 3225697.0, 418362.0, 74591.0, 21697.0, 7972.0, 3579.0, 1626.0, 790.0, 472.0, 294.0, 168.0, 86.0, 63.0, 39.0, 25.0, 20.0, 9.0, 7.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.171875, -7.92828369140625, -7.6846923828125, -7.44110107421875, -7.197509765625, -6.95391845703125, -6.7103271484375, -6.46673583984375, -6.22314453125, -5.97955322265625, -5.7359619140625, -5.49237060546875, -5.248779296875, -5.00518798828125, -4.7615966796875, -4.51800537109375, -4.2744140625, -4.03082275390625, -3.7872314453125, -3.54364013671875, -3.300048828125, -3.05645751953125, -2.8128662109375, -2.56927490234375, -2.32568359375, -2.08209228515625, -1.8385009765625, -1.59490966796875, -1.351318359375, -1.10772705078125, -0.8641357421875, -0.62054443359375, -0.376953125, -0.13336181640625, 0.1102294921875, 0.35382080078125, 0.597412109375, 0.84100341796875, 1.0845947265625, 1.32818603515625, 1.57177734375, 1.81536865234375, 2.0589599609375, 2.30255126953125, 2.546142578125, 2.78973388671875, 3.0333251953125, 3.27691650390625, 3.5205078125, 3.76409912109375, 4.0076904296875, 4.25128173828125, 4.494873046875, 4.73846435546875, 4.9820556640625, 5.22564697265625, 5.46923828125, 5.71282958984375, 5.9564208984375, 6.20001220703125, 6.443603515625, 6.68719482421875, 6.9307861328125, 7.17437744140625, 7.41796875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 1.0, 5.0, 4.0, 9.0, 11.0, 11.0, 21.0, 19.0, 32.0, 53.0, 62.0, 98.0, 155.0, 276.0, 548.0, 1522.0, 457.0, 262.0, 153.0, 112.0, 76.0, 51.0, 28.0, 18.0, 19.0, 18.0, 14.0, 12.0, 3.0, 6.0, 10.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.15625, -1.1194610595703125, -1.082672119140625, -1.0458831787109375, -1.00909423828125, -0.9723052978515625, -0.935516357421875, -0.8987274169921875, -0.8619384765625, -0.8251495361328125, -0.788360595703125, -0.7515716552734375, -0.71478271484375, -0.6779937744140625, -0.641204833984375, -0.6044158935546875, -0.567626953125, -0.5308380126953125, -0.494049072265625, -0.4572601318359375, -0.42047119140625, -0.3836822509765625, -0.346893310546875, -0.3101043701171875, -0.2733154296875, -0.2365264892578125, -0.199737548828125, -0.1629486083984375, -0.12615966796875, -0.0893707275390625, -0.052581787109375, -0.0157928466796875, 0.02099609375, 0.0577850341796875, 0.094573974609375, 0.1313629150390625, 0.16815185546875, 0.2049407958984375, 0.241729736328125, 0.2785186767578125, 0.3153076171875, 0.3520965576171875, 0.388885498046875, 0.4256744384765625, 0.46246337890625, 0.4992523193359375, 0.536041259765625, 0.5728302001953125, 0.609619140625, 0.6464080810546875, 0.683197021484375, 0.7199859619140625, 0.75677490234375, 0.7935638427734375, 0.830352783203125, 0.8671417236328125, 0.9039306640625, 0.9407196044921875, 0.977508544921875, 1.0142974853515625, 1.05108642578125, 1.0878753662109375, 1.124664306640625, 1.1614532470703125, 1.1982421875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 10.0, 65.0, 253.0, 422.0, 200.0, 37.0, 8.0, 7.0, 0.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.61604309082031, -37.782100677490234, -36.948158264160156, -36.11421585083008, -35.2802734375, -34.44633483886719, -33.61239242553711, -32.77845001220703, -31.944507598876953, -31.110565185546875, -30.276622772216797, -29.44268226623535, -28.608739852905273, -27.774797439575195, -26.94085693359375, -26.106914520263672, -25.272972106933594, -24.439029693603516, -23.605087280273438, -22.771146774291992, -21.937204360961914, -21.103261947631836, -20.26932144165039, -19.435379028320312, -18.601436614990234, -17.767494201660156, -16.933551788330078, -16.099611282348633, -15.265668869018555, -14.431726455688477, -13.597784996032715, -12.763843536376953, -11.929903030395508, -11.09596061706543, -10.262019157409668, -9.428077697753906, -8.594135284423828, -7.760193347930908, -6.926251411437988, -6.092309474945068, -5.258367538452148, -4.4244256019592285, -3.5904836654663086, -2.7565417289733887, -1.9225997924804688, -1.0886578559875488, -0.2547159194946289, 0.579226016998291, 1.413167953491211, 2.247109889984131, 3.081051826477051, 3.9149937629699707, 4.748935699462891, 5.5828776359558105, 6.4168195724487305, 7.25076150894165, 8.08470344543457, 8.918645858764648, 9.75258731842041, 10.586528778076172, 11.42047119140625, 12.254413604736328, 13.08835506439209, 13.922296524047852, 14.75623893737793]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 4.0, 7.0, 7.0, 19.0, 15.0, 11.0, 18.0, 34.0, 32.0, 33.0, 48.0, 51.0, 54.0, 59.0, 72.0, 68.0, 68.0, 66.0, 49.0, 57.0, 43.0, 50.0, 25.0, 36.0, 12.0, 18.0, 8.0, 7.0, 9.0, 4.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.389298439025879, -5.227301597595215, -5.065304756164551, -4.903307914733887, -4.7413105964660645, -4.5793137550354, -4.417316913604736, -4.255320072174072, -4.093323230743408, -3.931326389312744, -3.769329309463501, -3.607332468032837, -3.445335626602173, -3.2833385467529297, -3.1213417053222656, -2.9593448638916016, -2.7973477840423584, -2.6353509426116943, -2.473353862762451, -2.311357021331787, -2.149360179901123, -1.9873632192611694, -1.8253662586212158, -1.6633694171905518, -1.5013724565505981, -1.3393754959106445, -1.1773786544799805, -1.0153816938400269, -0.853384792804718, -0.6913878917694092, -0.5293909311294556, -0.3673940896987915, -0.2053971290588379, -0.04340021312236786, 0.11859670281410217, 0.2805936336517334, 0.44259053468704224, 0.6045874357223511, 0.7665843963623047, 0.9285812377929688, 1.0905781984329224, 1.252575159072876, 1.41457200050354, 1.5765689611434937, 1.7385659217834473, 1.9005627632141113, 2.0625596046447754, 2.2245564460754395, 2.3865535259246826, 2.5485503673553467, 2.71054744720459, 2.872544288635254, 3.034541130065918, 3.196537971496582, 3.358535051345825, 3.5205318927764893, 3.6825289726257324, 3.8445258140563965, 4.0065226554870605, 4.168519973754883, 4.330516815185547, 4.492513656616211, 4.654510498046875, 4.816507339477539, 4.978504180908203]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 7.0, 16.0, 19.0, 23.0, 65.0, 74.0, 127.0, 271.0, 452.0, 908.0, 2042.0, 5278.0, 16226.0, 73337.0, 451907.0, 409632.0, 64906.0, 14705.0, 4822.0, 1925.0, 801.0, 433.0, 241.0, 131.0, 76.0, 47.0, 24.0, 24.0, 10.0, 9.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.453125, -8.21136474609375, -7.9696044921875, -7.72784423828125, -7.486083984375, -7.24432373046875, -7.0025634765625, -6.76080322265625, -6.51904296875, -6.27728271484375, -6.0355224609375, -5.79376220703125, -5.552001953125, -5.31024169921875, -5.0684814453125, -4.82672119140625, -4.5849609375, -4.34320068359375, -4.1014404296875, -3.85968017578125, -3.617919921875, -3.37615966796875, -3.1343994140625, -2.89263916015625, -2.65087890625, -2.40911865234375, -2.1673583984375, -1.92559814453125, -1.683837890625, -1.44207763671875, -1.2003173828125, -0.95855712890625, -0.716796875, -0.47503662109375, -0.2332763671875, 0.00848388671875, 0.250244140625, 0.49200439453125, 0.7337646484375, 0.97552490234375, 1.21728515625, 1.45904541015625, 1.7008056640625, 1.94256591796875, 2.184326171875, 2.42608642578125, 2.6678466796875, 2.90960693359375, 3.1513671875, 3.39312744140625, 3.6348876953125, 3.87664794921875, 4.118408203125, 4.36016845703125, 4.6019287109375, 4.84368896484375, 5.08544921875, 5.32720947265625, 5.5689697265625, 5.81072998046875, 6.052490234375, 6.29425048828125, 6.5360107421875, 6.77777099609375, 7.01953125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 2.0, 5.0, 9.0, 21.0, 31.0, 22.0, 44.0, 55.0, 73.0, 93.0, 102.0, 101.0, 86.0, 78.0, 68.0, 65.0, 35.0, 24.0, 21.0, 16.0, 13.0, 9.0, 4.0, 6.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80615234375, -0.7789230346679688, -0.7516937255859375, -0.7244644165039062, -0.697235107421875, -0.6700057983398438, -0.6427764892578125, -0.6155471801757812, -0.58831787109375, -0.5610885620117188, -0.5338592529296875, -0.5066299438476562, -0.479400634765625, -0.45217132568359375, -0.4249420166015625, -0.39771270751953125, -0.3704833984375, -0.34325408935546875, -0.3160247802734375, -0.28879547119140625, -0.261566162109375, -0.23433685302734375, -0.2071075439453125, -0.17987823486328125, -0.15264892578125, -0.12541961669921875, -0.0981903076171875, -0.07096099853515625, -0.043731689453125, -0.01650238037109375, 0.0107269287109375, 0.03795623779296875, 0.065185546875, 0.09241485595703125, 0.1196441650390625, 0.14687347412109375, 0.174102783203125, 0.20133209228515625, 0.2285614013671875, 0.25579071044921875, 0.28302001953125, 0.31024932861328125, 0.3374786376953125, 0.36470794677734375, 0.391937255859375, 0.41916656494140625, 0.4463958740234375, 0.47362518310546875, 0.5008544921875, 0.5280838012695312, 0.5553131103515625, 0.5825424194335938, 0.609771728515625, 0.6370010375976562, 0.6642303466796875, 0.6914596557617188, 0.71868896484375, 0.7459182739257812, 0.7731475830078125, 0.8003768920898438, 0.827606201171875, 0.8548355102539062, 0.8820648193359375, 0.9092941284179688, 0.9365234375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 10.0, 8.0, 12.0, 20.0, 25.0, 33.0, 56.0, 60.0, 106.0, 197.0, 285.0, 491.0, 888.0, 1780.0, 4077.0, 11254.0, 46867.0, 333742.0, 541528.0, 80896.0, 16393.0, 5221.0, 2156.0, 1072.0, 578.0, 320.0, 177.0, 96.0, 62.0, 56.0, 22.0, 15.0, 15.0, 9.0, 6.0, 4.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0], "bins": [-7.0859375, -6.87847900390625, -6.6710205078125, -6.46356201171875, -6.256103515625, -6.04864501953125, -5.8411865234375, -5.63372802734375, -5.42626953125, -5.21881103515625, -5.0113525390625, -4.80389404296875, -4.596435546875, -4.38897705078125, -4.1815185546875, -3.97406005859375, -3.7666015625, -3.55914306640625, -3.3516845703125, -3.14422607421875, -2.936767578125, -2.72930908203125, -2.5218505859375, -2.31439208984375, -2.10693359375, -1.89947509765625, -1.6920166015625, -1.48455810546875, -1.277099609375, -1.06964111328125, -0.8621826171875, -0.65472412109375, -0.447265625, -0.23980712890625, -0.0323486328125, 0.17510986328125, 0.382568359375, 0.59002685546875, 0.7974853515625, 1.00494384765625, 1.21240234375, 1.41986083984375, 1.6273193359375, 1.83477783203125, 2.042236328125, 2.24969482421875, 2.4571533203125, 2.66461181640625, 2.8720703125, 3.07952880859375, 3.2869873046875, 3.49444580078125, 3.701904296875, 3.90936279296875, 4.1168212890625, 4.32427978515625, 4.53173828125, 4.73919677734375, 4.9466552734375, 5.15411376953125, 5.361572265625, 5.56903076171875, 5.7764892578125, 5.98394775390625, 6.19140625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 11.0, 7.0, 24.0, 22.0, 39.0, 51.0, 51.0, 50.0, 70.0, 83.0, 67.0, 89.0, 83.0, 78.0, 62.0, 52.0, 43.0, 38.0, 23.0, 19.0, 13.0, 8.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.4921875, -5.361846923828125, -5.23150634765625, -5.101165771484375, -4.9708251953125, -4.840484619140625, -4.71014404296875, -4.579803466796875, -4.449462890625, -4.319122314453125, -4.18878173828125, -4.058441162109375, -3.9281005859375, -3.797760009765625, -3.66741943359375, -3.537078857421875, -3.40673828125, -3.276397705078125, -3.14605712890625, -3.015716552734375, -2.8853759765625, -2.755035400390625, -2.62469482421875, -2.494354248046875, -2.364013671875, -2.233673095703125, -2.10333251953125, -1.972991943359375, -1.8426513671875, -1.712310791015625, -1.58197021484375, -1.451629638671875, -1.3212890625, -1.190948486328125, -1.06060791015625, -0.930267333984375, -0.7999267578125, -0.669586181640625, -0.53924560546875, -0.408905029296875, -0.278564453125, -0.148223876953125, -0.01788330078125, 0.112457275390625, 0.2427978515625, 0.373138427734375, 0.50347900390625, 0.633819580078125, 0.76416015625, 0.894500732421875, 1.02484130859375, 1.155181884765625, 1.2855224609375, 1.415863037109375, 1.54620361328125, 1.676544189453125, 1.806884765625, 1.937225341796875, 2.06756591796875, 2.197906494140625, 2.3282470703125, 2.458587646484375, 2.58892822265625, 2.719268798828125, 2.849609375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 1.0, 3.0, 3.0, 9.0, 9.0, 22.0, 28.0, 52.0, 95.0, 145.0, 293.0, 610.0, 1286.0, 2946.0, 8214.0, 28111.0, 143139.0, 558986.0, 242915.0, 43022.0, 11514.0, 3963.0, 1550.0, 786.0, 343.0, 216.0, 109.0, 69.0, 39.0, 30.0, 18.0, 9.0, 8.0, 9.0, 3.0, 7.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.5859375, -8.36376953125, -8.1416015625, -7.91943359375, -7.697265625, -7.47509765625, -7.2529296875, -7.03076171875, -6.80859375, -6.58642578125, -6.3642578125, -6.14208984375, -5.919921875, -5.69775390625, -5.4755859375, -5.25341796875, -5.03125, -4.80908203125, -4.5869140625, -4.36474609375, -4.142578125, -3.92041015625, -3.6982421875, -3.47607421875, -3.25390625, -3.03173828125, -2.8095703125, -2.58740234375, -2.365234375, -2.14306640625, -1.9208984375, -1.69873046875, -1.4765625, -1.25439453125, -1.0322265625, -0.81005859375, -0.587890625, -0.36572265625, -0.1435546875, 0.07861328125, 0.30078125, 0.52294921875, 0.7451171875, 0.96728515625, 1.189453125, 1.41162109375, 1.6337890625, 1.85595703125, 2.078125, 2.30029296875, 2.5224609375, 2.74462890625, 2.966796875, 3.18896484375, 3.4111328125, 3.63330078125, 3.85546875, 4.07763671875, 4.2998046875, 4.52197265625, 4.744140625, 4.96630859375, 5.1884765625, 5.41064453125, 5.6328125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 7.0, 5.0, 8.0, 22.0, 52.0, 98.0, 206.0, 275.0, 193.0, 69.0, 28.0, 13.0, 9.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0011072158813476562, -0.0010803937911987305, -0.0010535717010498047, -0.001026749610900879, -0.0009999275207519531, -0.0009731054306030273, -0.0009462833404541016, -0.0009194612503051758, -0.00089263916015625, -0.0008658170700073242, -0.0008389949798583984, -0.0008121728897094727, -0.0007853507995605469, -0.0007585287094116211, -0.0007317066192626953, -0.0007048845291137695, -0.0006780624389648438, -0.000651240348815918, -0.0006244182586669922, -0.0005975961685180664, -0.0005707740783691406, -0.0005439519882202148, -0.0005171298980712891, -0.0004903078079223633, -0.0004634857177734375, -0.0004366636276245117, -0.00040984153747558594, -0.00038301944732666016, -0.0003561973571777344, -0.0003293752670288086, -0.0003025531768798828, -0.00027573108673095703, -0.00024890899658203125, -0.00022208690643310547, -0.0001952648162841797, -0.0001684427261352539, -0.00014162063598632812, -0.00011479854583740234, -8.797645568847656e-05, -6.115436553955078e-05, -3.4332275390625e-05, -7.510185241699219e-06, 1.9311904907226562e-05, 4.6133995056152344e-05, 7.295608520507812e-05, 9.97781753540039e-05, 0.0001266002655029297, 0.00015342235565185547, 0.00018024444580078125, 0.00020706653594970703, 0.0002338886260986328, 0.0002607107162475586, 0.0002875328063964844, 0.00031435489654541016, 0.00034117698669433594, 0.0003679990768432617, 0.0003948211669921875, 0.0004216432571411133, 0.00044846534729003906, 0.00047528743743896484, 0.0005021095275878906, 0.0005289316177368164, 0.0005557537078857422, 0.000582575798034668, 0.0006093978881835938]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 5.0, 6.0, 11.0, 6.0, 31.0, 47.0, 58.0, 100.0, 144.0, 259.0, 425.0, 852.0, 1518.0, 3429.0, 7887.0, 22449.0, 83750.0, 354083.0, 419365.0, 108845.0, 27996.0, 9577.0, 3910.0, 1785.0, 883.0, 473.0, 255.0, 142.0, 95.0, 51.0, 36.0, 18.0, 20.0, 10.0, 7.0, 6.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.52734375, -5.33056640625, -5.1337890625, -4.93701171875, -4.740234375, -4.54345703125, -4.3466796875, -4.14990234375, -3.953125, -3.75634765625, -3.5595703125, -3.36279296875, -3.166015625, -2.96923828125, -2.7724609375, -2.57568359375, -2.37890625, -2.18212890625, -1.9853515625, -1.78857421875, -1.591796875, -1.39501953125, -1.1982421875, -1.00146484375, -0.8046875, -0.60791015625, -0.4111328125, -0.21435546875, -0.017578125, 0.17919921875, 0.3759765625, 0.57275390625, 0.76953125, 0.96630859375, 1.1630859375, 1.35986328125, 1.556640625, 1.75341796875, 1.9501953125, 2.14697265625, 2.34375, 2.54052734375, 2.7373046875, 2.93408203125, 3.130859375, 3.32763671875, 3.5244140625, 3.72119140625, 3.91796875, 4.11474609375, 4.3115234375, 4.50830078125, 4.705078125, 4.90185546875, 5.0986328125, 5.29541015625, 5.4921875, 5.68896484375, 5.8857421875, 6.08251953125, 6.279296875, 6.47607421875, 6.6728515625, 6.86962890625, 7.06640625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 8.0, 3.0, 3.0, 7.0, 4.0, 16.0, 18.0, 23.0, 30.0, 44.0, 59.0, 87.0, 121.0, 90.0, 80.0, 78.0, 98.0, 66.0, 49.0, 31.0, 28.0, 8.0, 14.0, 8.0, 9.0, 1.0, 6.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.48046875, -4.365570068359375, -4.25067138671875, -4.135772705078125, -4.0208740234375, -3.905975341796875, -3.79107666015625, -3.676177978515625, -3.561279296875, -3.446380615234375, -3.33148193359375, -3.216583251953125, -3.1016845703125, -2.986785888671875, -2.87188720703125, -2.756988525390625, -2.64208984375, -2.527191162109375, -2.41229248046875, -2.297393798828125, -2.1824951171875, -2.067596435546875, -1.95269775390625, -1.837799072265625, -1.722900390625, -1.608001708984375, -1.49310302734375, -1.378204345703125, -1.2633056640625, -1.148406982421875, -1.03350830078125, -0.918609619140625, -0.8037109375, -0.688812255859375, -0.57391357421875, -0.459014892578125, -0.3441162109375, -0.229217529296875, -0.11431884765625, 0.000579833984375, 0.115478515625, 0.230377197265625, 0.34527587890625, 0.460174560546875, 0.5750732421875, 0.689971923828125, 0.80487060546875, 0.919769287109375, 1.03466796875, 1.149566650390625, 1.26446533203125, 1.379364013671875, 1.4942626953125, 1.609161376953125, 1.72406005859375, 1.838958740234375, 1.953857421875, 2.068756103515625, 2.18365478515625, 2.298553466796875, 2.4134521484375, 2.528350830078125, 2.64324951171875, 2.758148193359375, 2.873046875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 7.0, 26.0, 67.0, 140.0, 273.0, 258.0, 138.0, 59.0, 19.0, 12.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.449691772460938, -25.46908187866211, -23.48847198486328, -21.50786018371582, -19.527250289916992, -17.546640396118164, -15.56602954864502, -13.585418701171875, -11.604808807373047, -9.624198913574219, -7.643588066101074, -5.662977695465088, -3.6823673248291016, -1.7017574310302734, 0.2788534164428711, 2.2594642639160156, 4.240074157714844, 6.22068452835083, 8.201294898986816, 10.181905746459961, 12.162515640258789, 14.143125534057617, 16.123737335205078, 18.104347229003906, 20.084957122802734, 22.065567016601562, 24.04617691040039, 26.02678871154785, 28.00739860534668, 29.988008499145508, 31.96862030029297, 33.9492301940918, 35.929840087890625, 37.91044998168945, 39.89105987548828, 41.87166976928711, 43.85227966308594, 45.83289337158203, 47.81350326538086, 49.79411315917969, 51.774723052978516, 53.755332946777344, 55.73594284057617, 57.716552734375, 59.697166442871094, 61.677772521972656, 63.65838623046875, 65.63899230957031, 67.6196060180664, 69.6002197265625, 71.58082580566406, 73.56143951416016, 75.54204559326172, 77.52265930175781, 79.50326538085938, 81.48387908935547, 83.46449279785156, 85.44510650634766, 87.42571258544922, 89.40632629394531, 91.38693237304688, 93.36754608154297, 95.34815216064453, 97.32876586914062, 99.30937194824219]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 7.0, 5.0, 2.0, 14.0, 8.0, 10.0, 12.0, 14.0, 19.0, 28.0, 33.0, 50.0, 38.0, 38.0, 60.0, 51.0, 54.0, 69.0, 64.0, 58.0, 41.0, 55.0, 47.0, 43.0, 34.0, 20.0, 34.0, 14.0, 10.0, 13.0, 10.0, 8.0, 7.0, 5.0, 9.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0], "bins": [-23.43783187866211, -22.80716323852539, -22.176494598388672, -21.545825958251953, -20.915157318115234, -20.284488677978516, -19.653820037841797, -19.023151397705078, -18.39248275756836, -17.76181411743164, -17.131145477294922, -16.500476837158203, -15.869808197021484, -15.239139556884766, -14.60846996307373, -13.977801322937012, -13.347131729125977, -12.716463088989258, -12.085794448852539, -11.45512580871582, -10.824457168579102, -10.193788528442383, -9.563118934631348, -8.932450294494629, -8.30178165435791, -7.671113014221191, -7.040444374084473, -6.409775257110596, -5.779106616973877, -5.148437976837158, -4.517768859863281, -3.8871002197265625, -3.256429672241211, -2.625761032104492, -1.9950921535491943, -1.364423394203186, -0.7337546348571777, -0.10308599472045898, 0.5275828838348389, 1.1582517623901367, 1.7889204025268555, 2.419589042663574, 3.050257921218872, 3.68092679977417, 4.311595439910889, 4.942264080047607, 5.572933197021484, 6.203601837158203, 6.834270477294922, 7.464939117431641, 8.09560775756836, 8.726276397705078, 9.356945037841797, 9.987613677978516, 10.61828327178955, 11.24895191192627, 11.879620552062988, 12.510289192199707, 13.140957832336426, 13.771626472473145, 14.40229606628418, 15.032964706420898, 15.663633346557617, 16.294301986694336, 16.924970626831055]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 8.0, 5.0, 11.0, 11.0, 19.0, 29.0, 49.0, 55.0, 95.0, 99.0, 167.0, 263.0, 426.0, 648.0, 1094.0, 2100.0, 4160.0, 9528.0, 24119.0, 72325.0, 310550.0, 3002869.0, 594041.0, 109686.0, 34281.0, 13621.0, 6219.0, 3090.0, 1755.0, 1008.0, 629.0, 355.0, 279.0, 171.0, 152.0, 92.0, 54.0, 56.0, 45.0, 27.0, 26.0, 18.0, 17.0, 14.0, 4.0, 5.0, 6.0, 0.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.8046875, -8.5079345703125, -8.211181640625, -7.9144287109375, -7.61767578125, -7.3209228515625, -7.024169921875, -6.7274169921875, -6.4306640625, -6.1339111328125, -5.837158203125, -5.5404052734375, -5.24365234375, -4.9468994140625, -4.650146484375, -4.3533935546875, -4.056640625, -3.7598876953125, -3.463134765625, -3.1663818359375, -2.86962890625, -2.5728759765625, -2.276123046875, -1.9793701171875, -1.6826171875, -1.3858642578125, -1.089111328125, -0.7923583984375, -0.49560546875, -0.1988525390625, 0.097900390625, 0.3946533203125, 0.69140625, 0.9881591796875, 1.284912109375, 1.5816650390625, 1.87841796875, 2.1751708984375, 2.471923828125, 2.7686767578125, 3.0654296875, 3.3621826171875, 3.658935546875, 3.9556884765625, 4.25244140625, 4.5491943359375, 4.845947265625, 5.1427001953125, 5.439453125, 5.7362060546875, 6.032958984375, 6.3297119140625, 6.62646484375, 6.9232177734375, 7.219970703125, 7.5167236328125, 7.8134765625, 8.1102294921875, 8.406982421875, 8.7037353515625, 9.00048828125, 9.2972412109375, 9.593994140625, 9.8907470703125, 10.1875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 5.0, 14.0, 6.0, 15.0, 30.0, 46.0, 50.0, 55.0, 83.0, 91.0, 93.0, 101.0, 82.0, 87.0, 62.0, 47.0, 37.0, 30.0, 19.0, 10.0, 9.0, 10.0, 2.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8388671875, -0.8119964599609375, -0.785125732421875, -0.7582550048828125, -0.73138427734375, -0.7045135498046875, -0.677642822265625, -0.6507720947265625, -0.6239013671875, -0.5970306396484375, -0.570159912109375, -0.5432891845703125, -0.51641845703125, -0.4895477294921875, -0.462677001953125, -0.4358062744140625, -0.408935546875, -0.3820648193359375, -0.355194091796875, -0.3283233642578125, -0.30145263671875, -0.2745819091796875, -0.247711181640625, -0.2208404541015625, -0.1939697265625, -0.1670989990234375, -0.140228271484375, -0.1133575439453125, -0.08648681640625, -0.0596160888671875, -0.032745361328125, -0.0058746337890625, 0.02099609375, 0.0478668212890625, 0.074737548828125, 0.1016082763671875, 0.12847900390625, 0.1553497314453125, 0.182220458984375, 0.2090911865234375, 0.2359619140625, 0.2628326416015625, 0.289703369140625, 0.3165740966796875, 0.34344482421875, 0.3703155517578125, 0.397186279296875, 0.4240570068359375, 0.450927734375, 0.4777984619140625, 0.504669189453125, 0.5315399169921875, 0.55841064453125, 0.5852813720703125, 0.612152099609375, 0.6390228271484375, 0.6658935546875, 0.6927642822265625, 0.719635009765625, 0.7465057373046875, 0.77337646484375, 0.8002471923828125, 0.827117919921875, 0.8539886474609375, 0.880859375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 6.0, 4.0, 6.0, 8.0, 9.0, 12.0, 27.0, 32.0, 39.0, 67.0, 95.0, 150.0, 285.0, 632.0, 1644.0, 5583.0, 27154.0, 222417.0, 3308124.0, 563652.0, 51280.0, 9128.0, 2296.0, 817.0, 331.0, 158.0, 106.0, 65.0, 40.0, 29.0, 17.0, 15.0, 13.0, 9.0, 11.0, 4.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.984375, -14.461669921875, -13.93896484375, -13.416259765625, -12.8935546875, -12.370849609375, -11.84814453125, -11.325439453125, -10.802734375, -10.280029296875, -9.75732421875, -9.234619140625, -8.7119140625, -8.189208984375, -7.66650390625, -7.143798828125, -6.62109375, -6.098388671875, -5.57568359375, -5.052978515625, -4.5302734375, -4.007568359375, -3.48486328125, -2.962158203125, -2.439453125, -1.916748046875, -1.39404296875, -0.871337890625, -0.3486328125, 0.174072265625, 0.69677734375, 1.219482421875, 1.7421875, 2.264892578125, 2.78759765625, 3.310302734375, 3.8330078125, 4.355712890625, 4.87841796875, 5.401123046875, 5.923828125, 6.446533203125, 6.96923828125, 7.491943359375, 8.0146484375, 8.537353515625, 9.06005859375, 9.582763671875, 10.10546875, 10.628173828125, 11.15087890625, 11.673583984375, 12.1962890625, 12.718994140625, 13.24169921875, 13.764404296875, 14.287109375, 14.809814453125, 15.33251953125, 15.855224609375, 16.3779296875, 16.900634765625, 17.42333984375, 17.946044921875, 18.46875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 10.0, 16.0, 14.0, 15.0, 17.0, 28.0, 32.0, 53.0, 65.0, 87.0, 124.0, 196.0, 278.0, 417.0, 845.0, 576.0, 387.0, 251.0, 186.0, 107.0, 81.0, 62.0, 54.0, 39.0, 30.0, 27.0, 18.0, 13.0, 6.0, 4.0, 5.0, 5.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.7900390625, -1.7426605224609375, -1.695281982421875, -1.6479034423828125, -1.60052490234375, -1.5531463623046875, -1.505767822265625, -1.4583892822265625, -1.4110107421875, -1.3636322021484375, -1.316253662109375, -1.2688751220703125, -1.22149658203125, -1.1741180419921875, -1.126739501953125, -1.0793609619140625, -1.031982421875, -0.9846038818359375, -0.937225341796875, -0.8898468017578125, -0.84246826171875, -0.7950897216796875, -0.747711181640625, -0.7003326416015625, -0.6529541015625, -0.6055755615234375, -0.558197021484375, -0.5108184814453125, -0.46343994140625, -0.4160614013671875, -0.368682861328125, -0.3213043212890625, -0.27392578125, -0.2265472412109375, -0.179168701171875, -0.1317901611328125, -0.08441162109375, -0.0370330810546875, 0.010345458984375, 0.0577239990234375, 0.1051025390625, 0.1524810791015625, 0.199859619140625, 0.2472381591796875, 0.29461669921875, 0.3419952392578125, 0.389373779296875, 0.4367523193359375, 0.484130859375, 0.5315093994140625, 0.578887939453125, 0.6262664794921875, 0.67364501953125, 0.7210235595703125, 0.768402099609375, 0.8157806396484375, 0.8631591796875, 0.9105377197265625, 0.957916259765625, 1.0052947998046875, 1.05267333984375, 1.1000518798828125, 1.147430419921875, 1.1948089599609375, 1.2421875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 9.0, 24.0, 64.0, 130.0, 205.0, 217.0, 182.0, 93.0, 36.0, 18.0, 15.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.244587898254395, -11.574005126953125, -10.903422355651855, -10.232839584350586, -9.562256813049316, -8.891674041748047, -8.221090316772461, -7.55050802230835, -6.87992525100708, -6.2093424797058105, -5.538759708404541, -4.868176460266113, -4.197593688964844, -3.5270111560821533, -2.8564281463623047, -2.185845375061035, -1.5152626037597656, -0.8446797728538513, -0.174096941947937, 0.49648594856262207, 1.1670687198638916, 1.8376514911651611, 2.5082345008850098, 3.1788172721862793, 3.849400043487549, 4.519982814788818, 5.190565586090088, 5.861148834228516, 6.531731605529785, 7.202314376831055, 7.872897148132324, 8.543479919433594, 9.21406364440918, 9.88464641571045, 10.555229187011719, 11.225811958312988, 11.896394729614258, 12.566977500915527, 13.237560272216797, 13.908143997192383, 14.578725814819336, 15.249308586120605, 15.919891357421875, 16.59047508239746, 17.261056900024414, 17.931640625, 18.602222442626953, 19.27280616760254, 19.943389892578125, 20.61397361755371, 21.284555435180664, 21.95513916015625, 22.625720977783203, 23.29630470275879, 23.966886520385742, 24.637470245361328, 25.30805206298828, 25.978635787963867, 26.64921760559082, 27.319801330566406, 27.99038314819336, 28.660966873168945, 29.3315486907959, 30.002132415771484, 30.672714233398438]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 7.0, 7.0, 13.0, 10.0, 14.0, 14.0, 19.0, 23.0, 22.0, 32.0, 32.0, 36.0, 33.0, 35.0, 34.0, 33.0, 50.0, 51.0, 56.0, 46.0, 50.0, 39.0, 39.0, 39.0, 29.0, 35.0, 34.0, 28.0, 27.0, 19.0, 12.0, 17.0, 13.0, 5.0, 14.0, 5.0, 7.0, 1.0, 3.0, 2.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.065826416015625, -5.8522138595581055, -5.638601303100586, -5.424988746643066, -5.211376190185547, -4.997763633728027, -4.784151077270508, -4.570538520812988, -4.356925964355469, -4.143313407897949, -3.9297008514404297, -3.71608829498291, -3.5024757385253906, -3.288863182067871, -3.0752506256103516, -2.861638069152832, -2.6480252742767334, -2.434412717819214, -2.2208001613616943, -2.007187604904175, -1.7935750484466553, -1.5799623727798462, -1.3663498163223267, -1.1527372598648071, -0.9391247034072876, -0.7255121469497681, -0.5118995904922485, -0.29828697443008423, -0.0846744179725647, 0.1289381980895996, 0.34255075454711914, 0.5561633110046387, 0.7697758674621582, 0.9833884239196777, 1.1970009803771973, 1.4106135368347168, 1.6242260932922363, 1.8378387689590454, 2.0514512062072754, 2.265063762664795, 2.4786763191223145, 2.692288875579834, 2.9059014320373535, 3.119513988494873, 3.3331265449523926, 3.546739101409912, 3.7603516578674316, 3.973964214324951, 4.187577247619629, 4.401189804077148, 4.614802360534668, 4.8284149169921875, 5.042027473449707, 5.255640029907227, 5.469252586364746, 5.682865142822266, 5.896477699279785, 6.110090255737305, 6.323702812194824, 6.537315368652344, 6.750927925109863, 6.964540481567383, 7.178153038024902, 7.391765594482422, 7.605378150939941]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 8.0, 3.0, 5.0, 19.0, 18.0, 25.0, 40.0, 59.0, 86.0, 110.0, 163.0, 282.0, 398.0, 779.0, 1441.0, 2952.0, 6319.0, 14307.0, 34719.0, 88419.0, 233877.0, 364841.0, 182089.0, 68632.0, 27097.0, 11489.0, 5016.0, 2309.0, 1225.0, 671.0, 446.0, 227.0, 136.0, 107.0, 63.0, 56.0, 40.0, 21.0, 11.0, 17.0, 8.0, 9.0, 5.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.86328125, -6.64447021484375, -6.4256591796875, -6.20684814453125, -5.988037109375, -5.76922607421875, -5.5504150390625, -5.33160400390625, -5.11279296875, -4.89398193359375, -4.6751708984375, -4.45635986328125, -4.237548828125, -4.01873779296875, -3.7999267578125, -3.58111572265625, -3.3623046875, -3.14349365234375, -2.9246826171875, -2.70587158203125, -2.487060546875, -2.26824951171875, -2.0494384765625, -1.83062744140625, -1.61181640625, -1.39300537109375, -1.1741943359375, -0.95538330078125, -0.736572265625, -0.51776123046875, -0.2989501953125, -0.08013916015625, 0.138671875, 0.35748291015625, 0.5762939453125, 0.79510498046875, 1.013916015625, 1.23272705078125, 1.4515380859375, 1.67034912109375, 1.88916015625, 2.10797119140625, 2.3267822265625, 2.54559326171875, 2.764404296875, 2.98321533203125, 3.2020263671875, 3.42083740234375, 3.6396484375, 3.85845947265625, 4.0772705078125, 4.29608154296875, 4.514892578125, 4.73370361328125, 4.9525146484375, 5.17132568359375, 5.39013671875, 5.60894775390625, 5.8277587890625, 6.04656982421875, 6.265380859375, 6.48419189453125, 6.7030029296875, 6.92181396484375, 7.140625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 9.0, 11.0, 13.0, 18.0, 36.0, 47.0, 45.0, 62.0, 74.0, 91.0, 96.0, 80.0, 68.0, 68.0, 50.0, 61.0, 41.0, 35.0, 32.0, 20.0, 10.0, 7.0, 8.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.85498046875, -0.8277587890625, -0.800537109375, -0.7733154296875, -0.74609375, -0.7188720703125, -0.691650390625, -0.6644287109375, -0.63720703125, -0.6099853515625, -0.582763671875, -0.5555419921875, -0.5283203125, -0.5010986328125, -0.473876953125, -0.4466552734375, -0.41943359375, -0.3922119140625, -0.364990234375, -0.3377685546875, -0.310546875, -0.2833251953125, -0.256103515625, -0.2288818359375, -0.20166015625, -0.1744384765625, -0.147216796875, -0.1199951171875, -0.0927734375, -0.0655517578125, -0.038330078125, -0.0111083984375, 0.01611328125, 0.0433349609375, 0.070556640625, 0.0977783203125, 0.125, 0.1522216796875, 0.179443359375, 0.2066650390625, 0.23388671875, 0.2611083984375, 0.288330078125, 0.3155517578125, 0.3427734375, 0.3699951171875, 0.397216796875, 0.4244384765625, 0.45166015625, 0.4788818359375, 0.506103515625, 0.5333251953125, 0.560546875, 0.5877685546875, 0.614990234375, 0.6422119140625, 0.66943359375, 0.6966552734375, 0.723876953125, 0.7510986328125, 0.7783203125, 0.8055419921875, 0.832763671875, 0.8599853515625, 0.88720703125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 2.0, 1.0, 9.0, 8.0, 7.0, 12.0, 24.0, 24.0, 39.0, 58.0, 75.0, 102.0, 155.0, 235.0, 452.0, 758.0, 1544.0, 3949.0, 11391.0, 38560.0, 140796.0, 432025.0, 300363.0, 81894.0, 23172.0, 7304.0, 2720.0, 1216.0, 601.0, 361.0, 228.0, 135.0, 105.0, 78.0, 47.0, 28.0, 25.0, 10.0, 15.0, 7.0, 9.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.5703125, -9.259521484375, -8.94873046875, -8.637939453125, -8.3271484375, -8.016357421875, -7.70556640625, -7.394775390625, -7.083984375, -6.773193359375, -6.46240234375, -6.151611328125, -5.8408203125, -5.530029296875, -5.21923828125, -4.908447265625, -4.59765625, -4.286865234375, -3.97607421875, -3.665283203125, -3.3544921875, -3.043701171875, -2.73291015625, -2.422119140625, -2.111328125, -1.800537109375, -1.48974609375, -1.178955078125, -0.8681640625, -0.557373046875, -0.24658203125, 0.064208984375, 0.375, 0.685791015625, 0.99658203125, 1.307373046875, 1.6181640625, 1.928955078125, 2.23974609375, 2.550537109375, 2.861328125, 3.172119140625, 3.48291015625, 3.793701171875, 4.1044921875, 4.415283203125, 4.72607421875, 5.036865234375, 5.34765625, 5.658447265625, 5.96923828125, 6.280029296875, 6.5908203125, 6.901611328125, 7.21240234375, 7.523193359375, 7.833984375, 8.144775390625, 8.45556640625, 8.766357421875, 9.0771484375, 9.387939453125, 9.69873046875, 10.009521484375, 10.3203125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 9.0, 16.0, 6.0, 8.0, 16.0, 22.0, 36.0, 32.0, 27.0, 35.0, 53.0, 47.0, 41.0, 43.0, 56.0, 58.0, 56.0, 48.0, 50.0, 53.0, 36.0, 39.0, 28.0, 23.0, 22.0, 26.0, 14.0, 27.0, 15.0, 16.0, 13.0, 5.0, 5.0, 4.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.20703125, -4.06988525390625, -3.9327392578125, -3.79559326171875, -3.658447265625, -3.52130126953125, -3.3841552734375, -3.24700927734375, -3.10986328125, -2.97271728515625, -2.8355712890625, -2.69842529296875, -2.561279296875, -2.42413330078125, -2.2869873046875, -2.14984130859375, -2.0126953125, -1.87554931640625, -1.7384033203125, -1.60125732421875, -1.464111328125, -1.32696533203125, -1.1898193359375, -1.05267333984375, -0.91552734375, -0.77838134765625, -0.6412353515625, -0.50408935546875, -0.366943359375, -0.22979736328125, -0.0926513671875, 0.04449462890625, 0.181640625, 0.31878662109375, 0.4559326171875, 0.59307861328125, 0.730224609375, 0.86737060546875, 1.0045166015625, 1.14166259765625, 1.27880859375, 1.41595458984375, 1.5531005859375, 1.69024658203125, 1.827392578125, 1.96453857421875, 2.1016845703125, 2.23883056640625, 2.3759765625, 2.51312255859375, 2.6502685546875, 2.78741455078125, 2.924560546875, 3.06170654296875, 3.1988525390625, 3.33599853515625, 3.47314453125, 3.61029052734375, 3.7474365234375, 3.88458251953125, 4.021728515625, 4.15887451171875, 4.2960205078125, 4.43316650390625, 4.5703125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 7.0, 3.0, 10.0, 10.0, 22.0, 19.0, 31.0, 37.0, 62.0, 103.0, 142.0, 274.0, 387.0, 666.0, 1203.0, 2345.0, 4702.0, 9812.0, 23193.0, 60770.0, 177577.0, 402597.0, 233718.0, 78037.0, 29203.0, 11941.0, 5401.0, 2622.0, 1514.0, 842.0, 465.0, 270.0, 176.0, 125.0, 76.0, 58.0, 46.0, 23.0, 20.0, 17.0, 12.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-6.06640625, -5.87457275390625, -5.6827392578125, -5.49090576171875, -5.299072265625, -5.10723876953125, -4.9154052734375, -4.72357177734375, -4.53173828125, -4.33990478515625, -4.1480712890625, -3.95623779296875, -3.764404296875, -3.57257080078125, -3.3807373046875, -3.18890380859375, -2.9970703125, -2.80523681640625, -2.6134033203125, -2.42156982421875, -2.229736328125, -2.03790283203125, -1.8460693359375, -1.65423583984375, -1.46240234375, -1.27056884765625, -1.0787353515625, -0.88690185546875, -0.695068359375, -0.50323486328125, -0.3114013671875, -0.11956787109375, 0.072265625, 0.26409912109375, 0.4559326171875, 0.64776611328125, 0.839599609375, 1.03143310546875, 1.2232666015625, 1.41510009765625, 1.60693359375, 1.79876708984375, 1.9906005859375, 2.18243408203125, 2.374267578125, 2.56610107421875, 2.7579345703125, 2.94976806640625, 3.1416015625, 3.33343505859375, 3.5252685546875, 3.71710205078125, 3.908935546875, 4.10076904296875, 4.2926025390625, 4.48443603515625, 4.67626953125, 4.86810302734375, 5.0599365234375, 5.25177001953125, 5.443603515625, 5.63543701171875, 5.8272705078125, 6.01910400390625, 6.2109375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 1.0, 5.0, 6.0, 5.0, 7.0, 7.0, 7.0, 8.0, 10.0, 15.0, 17.0, 22.0, 47.0, 43.0, 51.0, 88.0, 114.0, 127.0, 109.0, 73.0, 54.0, 51.0, 30.0, 23.0, 15.0, 16.0, 12.0, 9.0, 9.0, 4.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000896453857421875, -0.0008658617734909058, -0.0008352696895599365, -0.0008046776056289673, -0.000774085521697998, -0.0007434934377670288, -0.0007129013538360596, -0.0006823092699050903, -0.0006517171859741211, -0.0006211251020431519, -0.0005905330181121826, -0.0005599409341812134, -0.0005293488502502441, -0.0004987567663192749, -0.00046816468238830566, -0.0004375725984573364, -0.0004069805145263672, -0.00037638843059539795, -0.0003457963466644287, -0.00031520426273345947, -0.00028461217880249023, -0.000254020094871521, -0.00022342801094055176, -0.00019283592700958252, -0.00016224384307861328, -0.00013165175914764404, -0.0001010596752166748, -7.046759128570557e-05, -3.987550735473633e-05, -9.28342342376709e-06, 2.130866050720215e-05, 5.190074443817139e-05, 8.249282836914062e-05, 0.00011308491230010986, 0.0001436769962310791, 0.00017426908016204834, 0.00020486116409301758, 0.00023545324802398682, 0.00026604533195495605, 0.0002966374158859253, 0.00032722949981689453, 0.00035782158374786377, 0.000388413667678833, 0.00041900575160980225, 0.0004495978355407715, 0.0004801899194717407, 0.00051078200340271, 0.0005413740873336792, 0.0005719661712646484, 0.0006025582551956177, 0.0006331503391265869, 0.0006637424230575562, 0.0006943345069885254, 0.0007249265909194946, 0.0007555186748504639, 0.0007861107587814331, 0.0008167028427124023, 0.0008472949266433716, 0.0008778870105743408, 0.0009084790945053101, 0.0009390711784362793, 0.0009696632623672485, 0.0010002553462982178, 0.001030847430229187, 0.0010614395141601562]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 4.0, 11.0, 14.0, 14.0, 24.0, 30.0, 42.0, 72.0, 99.0, 161.0, 307.0, 629.0, 1424.0, 3392.0, 9197.0, 31387.0, 157237.0, 634262.0, 161387.0, 32968.0, 9482.0, 3394.0, 1456.0, 660.0, 353.0, 202.0, 112.0, 69.0, 35.0, 31.0, 32.0, 12.0, 22.0, 9.0, 7.0, 8.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.515625, -10.1708984375, -9.826171875, -9.4814453125, -9.13671875, -8.7919921875, -8.447265625, -8.1025390625, -7.7578125, -7.4130859375, -7.068359375, -6.7236328125, -6.37890625, -6.0341796875, -5.689453125, -5.3447265625, -5.0, -4.6552734375, -4.310546875, -3.9658203125, -3.62109375, -3.2763671875, -2.931640625, -2.5869140625, -2.2421875, -1.8974609375, -1.552734375, -1.2080078125, -0.86328125, -0.5185546875, -0.173828125, 0.1708984375, 0.515625, 0.8603515625, 1.205078125, 1.5498046875, 1.89453125, 2.2392578125, 2.583984375, 2.9287109375, 3.2734375, 3.6181640625, 3.962890625, 4.3076171875, 4.65234375, 4.9970703125, 5.341796875, 5.6865234375, 6.03125, 6.3759765625, 6.720703125, 7.0654296875, 7.41015625, 7.7548828125, 8.099609375, 8.4443359375, 8.7890625, 9.1337890625, 9.478515625, 9.8232421875, 10.16796875, 10.5126953125, 10.857421875, 11.2021484375, 11.546875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 5.0, 8.0, 16.0, 9.0, 18.0, 22.0, 32.0, 38.0, 71.0, 99.0, 133.0, 134.0, 102.0, 64.0, 50.0, 40.0, 30.0, 27.0, 18.0, 22.0, 12.0, 10.0, 5.0, 5.0, 3.0, 3.0, 3.0, 0.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.23828125, -5.06396484375, -4.8896484375, -4.71533203125, -4.541015625, -4.36669921875, -4.1923828125, -4.01806640625, -3.84375, -3.66943359375, -3.4951171875, -3.32080078125, -3.146484375, -2.97216796875, -2.7978515625, -2.62353515625, -2.44921875, -2.27490234375, -2.1005859375, -1.92626953125, -1.751953125, -1.57763671875, -1.4033203125, -1.22900390625, -1.0546875, -0.88037109375, -0.7060546875, -0.53173828125, -0.357421875, -0.18310546875, -0.0087890625, 0.16552734375, 0.33984375, 0.51416015625, 0.6884765625, 0.86279296875, 1.037109375, 1.21142578125, 1.3857421875, 1.56005859375, 1.734375, 1.90869140625, 2.0830078125, 2.25732421875, 2.431640625, 2.60595703125, 2.7802734375, 2.95458984375, 3.12890625, 3.30322265625, 3.4775390625, 3.65185546875, 3.826171875, 4.00048828125, 4.1748046875, 4.34912109375, 4.5234375, 4.69775390625, 4.8720703125, 5.04638671875, 5.220703125, 5.39501953125, 5.5693359375, 5.74365234375, 5.91796875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 17.0, 57.0, 187.0, 364.0, 235.0, 92.0, 34.0, 10.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-154.37173461914062, -149.3635711669922, -144.35540771484375, -139.34722900390625, -134.3390655517578, -129.33090209960938, -124.32273864746094, -119.3145751953125, -114.30641174316406, -109.29824829101562, -104.29007720947266, -99.28191375732422, -94.27375030517578, -89.26557922363281, -84.25741577148438, -79.24925231933594, -74.24108123779297, -69.23291778564453, -64.22474670410156, -59.216583251953125, -54.20841979980469, -49.200252532958984, -44.19208526611328, -39.183921813964844, -34.17575454711914, -29.16758918762207, -24.159423828125, -19.151256561279297, -14.143091201782227, -9.134925842285156, -4.126758575439453, 0.8814048767089844, 5.8895721435546875, 10.897737503051758, 15.905903816223145, 20.91407012939453, 25.9222354888916, 30.930400848388672, 35.938568115234375, 40.94673156738281, 45.954898834228516, 50.96306610107422, 55.971229553222656, 60.97939682006836, 65.98756408691406, 70.9957275390625, 76.00389099121094, 81.01205444335938, 86.02022552490234, 91.02838897705078, 96.03656005859375, 101.04472351074219, 106.05288696289062, 111.06105041503906, 116.06922149658203, 121.07738494873047, 126.08555603027344, 131.09371948242188, 136.1018829345703, 141.11004638671875, 146.11822509765625, 151.1263885498047, 156.13455200195312, 161.14271545410156, 166.15087890625]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 6.0, 5.0, 6.0, 6.0, 9.0, 8.0, 8.0, 12.0, 28.0, 14.0, 15.0, 14.0, 25.0, 36.0, 32.0, 35.0, 33.0, 52.0, 50.0, 41.0, 57.0, 42.0, 36.0, 49.0, 43.0, 45.0, 39.0, 33.0, 35.0, 28.0, 26.0, 25.0, 20.0, 14.0, 20.0, 14.0, 5.0, 7.0, 7.0, 11.0, 3.0, 3.0, 3.0, 4.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-32.22007369995117, -31.213897705078125, -30.207721710205078, -29.20154571533203, -28.195369720458984, -27.189193725585938, -26.18301773071289, -25.176841735839844, -24.170665740966797, -23.16448974609375, -22.158313751220703, -21.152137756347656, -20.14596176147461, -19.139785766601562, -18.133609771728516, -17.12743377685547, -16.121259689331055, -15.115083694458008, -14.108907699584961, -13.102731704711914, -12.096555709838867, -11.09037971496582, -10.08420467376709, -9.078028678894043, -8.071852684020996, -7.065676689147949, -6.059500694274902, -5.053325176239014, -4.047149181365967, -3.04097318649292, -2.0347976684570312, -1.0286216735839844, -0.0224456787109375, 0.9837301969528198, 1.9899060726165771, 2.996081829071045, 4.002257823944092, 5.008433818817139, 6.014609336853027, 7.020785331726074, 8.026961326599121, 9.033137321472168, 10.039313316345215, 11.045488357543945, 12.051664352416992, 13.057840347290039, 14.064016342163086, 15.070192337036133, 16.07636833190918, 17.082544326782227, 18.088720321655273, 19.09489631652832, 20.101072311401367, 21.107248306274414, 22.113422393798828, 23.119598388671875, 24.125774383544922, 25.13195037841797, 26.138126373291016, 27.144302368164062, 28.15047836303711, 29.156654357910156, 30.162830352783203, 31.16900634765625, 32.1751823425293]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 7.0, 3.0, 7.0, 13.0, 8.0, 18.0, 33.0, 43.0, 66.0, 115.0, 183.0, 305.0, 527.0, 935.0, 1854.0, 3805.0, 8743.0, 22506.0, 71318.0, 315188.0, 3134375.0, 490477.0, 94263.0, 28391.0, 10714.0, 4618.0, 2322.0, 1281.0, 732.0, 437.0, 309.0, 183.0, 160.0, 96.0, 55.0, 66.0, 30.0, 24.0, 9.0, 13.0, 15.0, 11.0, 8.0, 4.0, 5.0, 6.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.609375, -9.248291015625, -8.88720703125, -8.526123046875, -8.1650390625, -7.803955078125, -7.44287109375, -7.081787109375, -6.720703125, -6.359619140625, -5.99853515625, -5.637451171875, -5.2763671875, -4.915283203125, -4.55419921875, -4.193115234375, -3.83203125, -3.470947265625, -3.10986328125, -2.748779296875, -2.3876953125, -2.026611328125, -1.66552734375, -1.304443359375, -0.943359375, -0.582275390625, -0.22119140625, 0.139892578125, 0.5009765625, 0.862060546875, 1.22314453125, 1.584228515625, 1.9453125, 2.306396484375, 2.66748046875, 3.028564453125, 3.3896484375, 3.750732421875, 4.11181640625, 4.472900390625, 4.833984375, 5.195068359375, 5.55615234375, 5.917236328125, 6.2783203125, 6.639404296875, 7.00048828125, 7.361572265625, 7.72265625, 8.083740234375, 8.44482421875, 8.805908203125, 9.1669921875, 9.528076171875, 9.88916015625, 10.250244140625, 10.611328125, 10.972412109375, 11.33349609375, 11.694580078125, 12.0556640625, 12.416748046875, 12.77783203125, 13.138916015625, 13.5]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 6.0, 6.0, 11.0, 13.0, 29.0, 21.0, 33.0, 35.0, 59.0, 58.0, 61.0, 84.0, 69.0, 59.0, 63.0, 69.0, 69.0, 51.0, 42.0, 51.0, 25.0, 22.0, 16.0, 8.0, 10.0, 9.0, 2.0, 5.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.974609375, -0.9424896240234375, -0.910369873046875, -0.8782501220703125, -0.84613037109375, -0.8140106201171875, -0.781890869140625, -0.7497711181640625, -0.7176513671875, -0.6855316162109375, -0.653411865234375, -0.6212921142578125, -0.58917236328125, -0.5570526123046875, -0.524932861328125, -0.4928131103515625, -0.460693359375, -0.4285736083984375, -0.396453857421875, -0.3643341064453125, -0.33221435546875, -0.3000946044921875, -0.267974853515625, -0.2358551025390625, -0.2037353515625, -0.1716156005859375, -0.139495849609375, -0.1073760986328125, -0.07525634765625, -0.0431365966796875, -0.011016845703125, 0.0211029052734375, 0.05322265625, 0.0853424072265625, 0.117462158203125, 0.1495819091796875, 0.18170166015625, 0.2138214111328125, 0.245941162109375, 0.2780609130859375, 0.3101806640625, 0.3423004150390625, 0.374420166015625, 0.4065399169921875, 0.43865966796875, 0.4707794189453125, 0.502899169921875, 0.5350189208984375, 0.567138671875, 0.5992584228515625, 0.631378173828125, 0.6634979248046875, 0.69561767578125, 0.7277374267578125, 0.759857177734375, 0.7919769287109375, 0.8240966796875, 0.8562164306640625, 0.888336181640625, 0.9204559326171875, 0.95257568359375, 0.9846954345703125, 1.016815185546875, 1.0489349365234375, 1.0810546875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 7.0, 6.0, 7.0, 22.0, 17.0, 30.0, 55.0, 94.0, 169.0, 319.0, 607.0, 1282.0, 2634.0, 6809.0, 20992.0, 87507.0, 553399.0, 3068905.0, 360994.0, 64111.0, 16412.0, 5656.0, 2198.0, 981.0, 513.0, 242.0, 125.0, 79.0, 41.0, 25.0, 13.0, 12.0, 9.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5859375, -11.1297607421875, -10.673583984375, -10.2174072265625, -9.76123046875, -9.3050537109375, -8.848876953125, -8.3927001953125, -7.9365234375, -7.4803466796875, -7.024169921875, -6.5679931640625, -6.11181640625, -5.6556396484375, -5.199462890625, -4.7432861328125, -4.287109375, -3.8309326171875, -3.374755859375, -2.9185791015625, -2.46240234375, -2.0062255859375, -1.550048828125, -1.0938720703125, -0.6376953125, -0.1815185546875, 0.274658203125, 0.7308349609375, 1.18701171875, 1.6431884765625, 2.099365234375, 2.5555419921875, 3.01171875, 3.4678955078125, 3.924072265625, 4.3802490234375, 4.83642578125, 5.2926025390625, 5.748779296875, 6.2049560546875, 6.6611328125, 7.1173095703125, 7.573486328125, 8.0296630859375, 8.48583984375, 8.9420166015625, 9.398193359375, 9.8543701171875, 10.310546875, 10.7667236328125, 11.222900390625, 11.6790771484375, 12.13525390625, 12.5914306640625, 13.047607421875, 13.5037841796875, 13.9599609375, 14.4161376953125, 14.872314453125, 15.3284912109375, 15.78466796875, 16.2408447265625, 16.697021484375, 17.1531982421875, 17.609375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 2.0, 3.0, 4.0, 12.0, 5.0, 11.0, 10.0, 21.0, 22.0, 39.0, 51.0, 62.0, 88.0, 110.0, 171.0, 305.0, 537.0, 1175.0, 521.0, 287.0, 174.0, 131.0, 90.0, 75.0, 36.0, 38.0, 30.0, 17.0, 10.0, 11.0, 4.0, 6.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.529296875, -2.446258544921875, -2.36322021484375, -2.280181884765625, -2.1971435546875, -2.114105224609375, -2.03106689453125, -1.948028564453125, -1.864990234375, -1.781951904296875, -1.69891357421875, -1.615875244140625, -1.5328369140625, -1.449798583984375, -1.36676025390625, -1.283721923828125, -1.20068359375, -1.117645263671875, -1.03460693359375, -0.951568603515625, -0.8685302734375, -0.785491943359375, -0.70245361328125, -0.619415283203125, -0.536376953125, -0.453338623046875, -0.37030029296875, -0.287261962890625, -0.2042236328125, -0.121185302734375, -0.03814697265625, 0.044891357421875, 0.1279296875, 0.210968017578125, 0.29400634765625, 0.377044677734375, 0.4600830078125, 0.543121337890625, 0.62615966796875, 0.709197998046875, 0.792236328125, 0.875274658203125, 0.95831298828125, 1.041351318359375, 1.1243896484375, 1.207427978515625, 1.29046630859375, 1.373504638671875, 1.45654296875, 1.539581298828125, 1.62261962890625, 1.705657958984375, 1.7886962890625, 1.871734619140625, 1.95477294921875, 2.037811279296875, 2.120849609375, 2.203887939453125, 2.28692626953125, 2.369964599609375, 2.4530029296875, 2.536041259765625, 2.61907958984375, 2.702117919921875, 2.78515625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 8.0, 5.0, 13.0, 26.0, 28.0, 32.0, 45.0, 73.0, 88.0, 127.0, 137.0, 92.0, 88.0, 71.0, 58.0, 38.0, 30.0, 14.0, 16.0, 8.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.47779655456543, -16.904016494750977, -16.33023452758789, -15.756454467773438, -15.182674407958984, -14.608893394470215, -14.035112380981445, -13.461332321166992, -12.887551307678223, -12.313770294189453, -11.739990234375, -11.16620922088623, -10.592428207397461, -10.018648147583008, -9.444867134094238, -8.871086120605469, -8.297306060791016, -7.723525524139404, -7.149744987487793, -6.575963973999023, -6.002183437347412, -5.428402900695801, -4.854621887207031, -4.28084135055542, -3.7070608139038086, -3.1332802772521973, -2.559499502182007, -1.985718846321106, -1.411938190460205, -0.8381576538085938, -0.2643768787384033, 0.3094038963317871, 0.8831844329833984, 1.4569650888442993, 2.0307457447052, 2.6045265197753906, 3.178307056427002, 3.7520875930786133, 4.325868606567383, 4.899649143218994, 5.4734296798706055, 6.047210216522217, 6.620990753173828, 7.194771766662598, 7.768552303314209, 8.34233283996582, 8.91611385345459, 9.48989486694336, 10.063674926757812, 10.637455940246582, 11.211236000061035, 11.785017013549805, 12.358797073364258, 12.932578086853027, 13.506359100341797, 14.08013916015625, 14.65392017364502, 15.227701187133789, 15.801481246948242, 16.375261306762695, 16.94904327392578, 17.522823333740234, 18.096603393554688, 18.670385360717773, 19.244165420532227]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 10.0, 5.0, 10.0, 14.0, 27.0, 18.0, 26.0, 24.0, 35.0, 30.0, 43.0, 36.0, 66.0, 58.0, 45.0, 56.0, 53.0, 39.0, 58.0, 41.0, 45.0, 43.0, 34.0, 38.0, 25.0, 30.0, 23.0, 18.0, 14.0, 12.0, 8.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.401411056518555, -15.001710891723633, -14.602011680603027, -14.202311515808105, -13.802611351013184, -13.402911186218262, -13.003211975097656, -12.603511810302734, -12.203811645507812, -11.80411148071289, -11.404412269592285, -11.004712104797363, -10.605011940002441, -10.20531177520752, -9.805612564086914, -9.405912399291992, -9.00621223449707, -8.606512069702148, -8.206812858581543, -7.807112693786621, -7.407412528991699, -7.0077128410339355, -6.608013153076172, -6.20831298828125, -5.8086137771606445, -5.408914089202881, -5.009213924407959, -4.609514236450195, -4.209814071655273, -3.8101143836975098, -3.410414457321167, -3.010714530944824, -2.6110143661499023, -2.2113144397735596, -1.8116145133972168, -1.4119147062301636, -1.0122147798538208, -0.612514853477478, -0.2128150463104248, 0.18688488006591797, 0.5865848064422607, 0.9862847328186035, 1.3859846591949463, 1.7856844663619995, 2.1853842735290527, 2.5850844383239746, 2.9847841262817383, 3.384484052658081, 3.784183979034424, 4.1838836669921875, 4.583583831787109, 4.983283519744873, 5.382983684539795, 5.782683372497559, 6.1823835372924805, 6.582083225250244, 6.981782913208008, 7.3814826011657715, 7.781182765960693, 8.180882453918457, 8.580582618713379, 8.9802827835083, 9.379981994628906, 9.779682159423828, 10.17938232421875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 11.0, 9.0, 13.0, 19.0, 22.0, 35.0, 58.0, 66.0, 110.0, 182.0, 296.0, 495.0, 856.0, 1631.0, 3414.0, 7448.0, 16860.0, 39880.0, 91029.0, 195518.0, 298393.0, 211911.0, 101081.0, 44052.0, 18884.0, 8352.0, 3730.0, 1817.0, 946.0, 535.0, 325.0, 198.0, 105.0, 65.0, 64.0, 41.0, 28.0, 22.0, 11.0, 13.0, 8.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.13671875, -5.92913818359375, -5.7215576171875, -5.51397705078125, -5.306396484375, -5.09881591796875, -4.8912353515625, -4.68365478515625, -4.47607421875, -4.26849365234375, -4.0609130859375, -3.85333251953125, -3.645751953125, -3.43817138671875, -3.2305908203125, -3.02301025390625, -2.8154296875, -2.60784912109375, -2.4002685546875, -2.19268798828125, -1.985107421875, -1.77752685546875, -1.5699462890625, -1.36236572265625, -1.15478515625, -0.94720458984375, -0.7396240234375, -0.53204345703125, -0.324462890625, -0.11688232421875, 0.0906982421875, 0.29827880859375, 0.505859375, 0.71343994140625, 0.9210205078125, 1.12860107421875, 1.336181640625, 1.54376220703125, 1.7513427734375, 1.95892333984375, 2.16650390625, 2.37408447265625, 2.5816650390625, 2.78924560546875, 2.996826171875, 3.20440673828125, 3.4119873046875, 3.61956787109375, 3.8271484375, 4.03472900390625, 4.2423095703125, 4.44989013671875, 4.657470703125, 4.86505126953125, 5.0726318359375, 5.28021240234375, 5.48779296875, 5.69537353515625, 5.9029541015625, 6.11053466796875, 6.318115234375, 6.52569580078125, 6.7332763671875, 6.94085693359375, 7.1484375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 6.0, 7.0, 12.0, 14.0, 15.0, 21.0, 32.0, 35.0, 49.0, 39.0, 61.0, 63.0, 50.0, 58.0, 56.0, 74.0, 57.0, 57.0, 44.0, 43.0, 45.0, 32.0, 39.0, 23.0, 14.0, 8.0, 11.0, 13.0, 9.0, 8.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9619140625, -0.927215576171875, -0.89251708984375, -0.857818603515625, -0.8231201171875, -0.788421630859375, -0.75372314453125, -0.719024658203125, -0.684326171875, -0.649627685546875, -0.61492919921875, -0.580230712890625, -0.5455322265625, -0.510833740234375, -0.47613525390625, -0.441436767578125, -0.40673828125, -0.372039794921875, -0.33734130859375, -0.302642822265625, -0.2679443359375, -0.233245849609375, -0.19854736328125, -0.163848876953125, -0.129150390625, -0.094451904296875, -0.05975341796875, -0.025054931640625, 0.0096435546875, 0.044342041015625, 0.07904052734375, 0.113739013671875, 0.1484375, 0.183135986328125, 0.21783447265625, 0.252532958984375, 0.2872314453125, 0.321929931640625, 0.35662841796875, 0.391326904296875, 0.426025390625, 0.460723876953125, 0.49542236328125, 0.530120849609375, 0.5648193359375, 0.599517822265625, 0.63421630859375, 0.668914794921875, 0.70361328125, 0.738311767578125, 0.77301025390625, 0.807708740234375, 0.8424072265625, 0.877105712890625, 0.91180419921875, 0.946502685546875, 0.981201171875, 1.015899658203125, 1.05059814453125, 1.085296630859375, 1.1199951171875, 1.154693603515625, 1.18939208984375, 1.224090576171875, 1.2587890625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 16.0, 19.0, 27.0, 34.0, 38.0, 57.0, 77.0, 131.0, 171.0, 242.0, 382.0, 641.0, 1260.0, 2735.0, 7373.0, 21317.0, 68588.0, 221805.0, 454594.0, 182869.0, 56747.0, 17931.0, 6041.0, 2402.0, 1195.0, 670.0, 362.0, 253.0, 171.0, 92.0, 97.0, 54.0, 41.0, 33.0, 25.0, 14.0, 12.0, 9.0, 5.0, 5.0, 3.0, 0.0, 6.0, 0.0, 2.0, 2.0], "bins": [-12.8203125, -12.46826171875, -12.1162109375, -11.76416015625, -11.412109375, -11.06005859375, -10.7080078125, -10.35595703125, -10.00390625, -9.65185546875, -9.2998046875, -8.94775390625, -8.595703125, -8.24365234375, -7.8916015625, -7.53955078125, -7.1875, -6.83544921875, -6.4833984375, -6.13134765625, -5.779296875, -5.42724609375, -5.0751953125, -4.72314453125, -4.37109375, -4.01904296875, -3.6669921875, -3.31494140625, -2.962890625, -2.61083984375, -2.2587890625, -1.90673828125, -1.5546875, -1.20263671875, -0.8505859375, -0.49853515625, -0.146484375, 0.20556640625, 0.5576171875, 0.90966796875, 1.26171875, 1.61376953125, 1.9658203125, 2.31787109375, 2.669921875, 3.02197265625, 3.3740234375, 3.72607421875, 4.078125, 4.43017578125, 4.7822265625, 5.13427734375, 5.486328125, 5.83837890625, 6.1904296875, 6.54248046875, 6.89453125, 7.24658203125, 7.5986328125, 7.95068359375, 8.302734375, 8.65478515625, 9.0068359375, 9.35888671875, 9.7109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 2.0, 3.0, 11.0, 11.0, 18.0, 17.0, 20.0, 17.0, 25.0, 18.0, 26.0, 27.0, 38.0, 38.0, 39.0, 40.0, 42.0, 54.0, 48.0, 47.0, 45.0, 48.0, 37.0, 47.0, 43.0, 28.0, 47.0, 30.0, 20.0, 23.0, 18.0, 14.0, 16.0, 9.0, 6.0, 5.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.07421875, -5.88262939453125, -5.6910400390625, -5.49945068359375, -5.307861328125, -5.11627197265625, -4.9246826171875, -4.73309326171875, -4.54150390625, -4.34991455078125, -4.1583251953125, -3.96673583984375, -3.775146484375, -3.58355712890625, -3.3919677734375, -3.20037841796875, -3.0087890625, -2.81719970703125, -2.6256103515625, -2.43402099609375, -2.242431640625, -2.05084228515625, -1.8592529296875, -1.66766357421875, -1.47607421875, -1.28448486328125, -1.0928955078125, -0.90130615234375, -0.709716796875, -0.51812744140625, -0.3265380859375, -0.13494873046875, 0.056640625, 0.24822998046875, 0.4398193359375, 0.63140869140625, 0.822998046875, 1.01458740234375, 1.2061767578125, 1.39776611328125, 1.58935546875, 1.78094482421875, 1.9725341796875, 2.16412353515625, 2.355712890625, 2.54730224609375, 2.7388916015625, 2.93048095703125, 3.1220703125, 3.31365966796875, 3.5052490234375, 3.69683837890625, 3.888427734375, 4.08001708984375, 4.2716064453125, 4.46319580078125, 4.65478515625, 4.84637451171875, 5.0379638671875, 5.22955322265625, 5.421142578125, 5.61273193359375, 5.8043212890625, 5.99591064453125, 6.1875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 0.0, 6.0, 5.0, 5.0, 12.0, 16.0, 29.0, 39.0, 71.0, 130.0, 201.0, 333.0, 580.0, 1067.0, 2125.0, 4527.0, 10406.0, 26003.0, 67691.0, 200610.0, 416749.0, 202744.0, 69355.0, 25944.0, 10663.0, 4660.0, 2086.0, 1091.0, 560.0, 340.0, 212.0, 107.0, 69.0, 44.0, 32.0, 12.0, 8.0, 10.0, 8.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.90625, -4.75982666015625, -4.6134033203125, -4.46697998046875, -4.320556640625, -4.17413330078125, -4.0277099609375, -3.88128662109375, -3.73486328125, -3.58843994140625, -3.4420166015625, -3.29559326171875, -3.149169921875, -3.00274658203125, -2.8563232421875, -2.70989990234375, -2.5634765625, -2.41705322265625, -2.2706298828125, -2.12420654296875, -1.977783203125, -1.83135986328125, -1.6849365234375, -1.53851318359375, -1.39208984375, -1.24566650390625, -1.0992431640625, -0.95281982421875, -0.806396484375, -0.65997314453125, -0.5135498046875, -0.36712646484375, -0.220703125, -0.07427978515625, 0.0721435546875, 0.21856689453125, 0.364990234375, 0.51141357421875, 0.6578369140625, 0.80426025390625, 0.95068359375, 1.09710693359375, 1.2435302734375, 1.38995361328125, 1.536376953125, 1.68280029296875, 1.8292236328125, 1.97564697265625, 2.1220703125, 2.26849365234375, 2.4149169921875, 2.56134033203125, 2.707763671875, 2.85418701171875, 3.0006103515625, 3.14703369140625, 3.29345703125, 3.43988037109375, 3.5863037109375, 3.73272705078125, 3.879150390625, 4.02557373046875, 4.1719970703125, 4.31842041015625, 4.46484375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 7.0, 10.0, 12.0, 20.0, 23.0, 18.0, 48.0, 42.0, 51.0, 84.0, 165.0, 154.0, 102.0, 63.0, 40.0, 37.0, 30.0, 16.0, 18.0, 13.0, 14.0, 6.0, 6.0, 6.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0010900497436523438, -0.0010560452938079834, -0.001022040843963623, -0.0009880363941192627, -0.0009540319442749023, -0.000920027494430542, -0.0008860230445861816, -0.0008520185947418213, -0.0008180141448974609, -0.0007840096950531006, -0.0007500052452087402, -0.0007160007953643799, -0.0006819963455200195, -0.0006479918956756592, -0.0006139874458312988, -0.0005799829959869385, -0.0005459785461425781, -0.0005119740962982178, -0.0004779696464538574, -0.00044396519660949707, -0.0004099607467651367, -0.00037595629692077637, -0.000341951847076416, -0.00030794739723205566, -0.0002739429473876953, -0.00023993849754333496, -0.0002059340476989746, -0.00017192959785461426, -0.0001379251480102539, -0.00010392069816589355, -6.99162483215332e-05, -3.591179847717285e-05, -1.9073486328125e-06, 3.209710121154785e-05, 6.61015510559082e-05, 0.00010010600090026855, 0.0001341104507446289, 0.00016811490058898926, 0.0002021193504333496, 0.00023612380027770996, 0.0002701282501220703, 0.00030413269996643066, 0.000338137149810791, 0.00037214159965515137, 0.0004061460494995117, 0.00044015049934387207, 0.0004741549491882324, 0.0005081593990325928, 0.0005421638488769531, 0.0005761682987213135, 0.0006101727485656738, 0.0006441771984100342, 0.0006781816482543945, 0.0007121860980987549, 0.0007461905479431152, 0.0007801949977874756, 0.0008141994476318359, 0.0008482038974761963, 0.0008822083473205566, 0.000916212797164917, 0.0009502172470092773, 0.0009842216968536377, 0.001018226146697998, 0.0010522305965423584, 0.0010862350463867188]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 2.0, 6.0, 4.0, 8.0, 6.0, 12.0, 15.0, 40.0, 65.0, 99.0, 156.0, 292.0, 621.0, 1603.0, 4789.0, 19503.0, 108990.0, 656204.0, 211782.0, 33370.0, 7181.0, 2100.0, 814.0, 385.0, 194.0, 99.0, 84.0, 46.0, 28.0, 25.0, 13.0, 10.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.796875, -8.4788818359375, -8.160888671875, -7.8428955078125, -7.52490234375, -7.2069091796875, -6.888916015625, -6.5709228515625, -6.2529296875, -5.9349365234375, -5.616943359375, -5.2989501953125, -4.98095703125, -4.6629638671875, -4.344970703125, -4.0269775390625, -3.708984375, -3.3909912109375, -3.072998046875, -2.7550048828125, -2.43701171875, -2.1190185546875, -1.801025390625, -1.4830322265625, -1.1650390625, -0.8470458984375, -0.529052734375, -0.2110595703125, 0.10693359375, 0.4249267578125, 0.742919921875, 1.0609130859375, 1.37890625, 1.6968994140625, 2.014892578125, 2.3328857421875, 2.65087890625, 2.9688720703125, 3.286865234375, 3.6048583984375, 3.9228515625, 4.2408447265625, 4.558837890625, 4.8768310546875, 5.19482421875, 5.5128173828125, 5.830810546875, 6.1488037109375, 6.466796875, 6.7847900390625, 7.102783203125, 7.4207763671875, 7.73876953125, 8.0567626953125, 8.374755859375, 8.6927490234375, 9.0107421875, 9.3287353515625, 9.646728515625, 9.9647216796875, 10.28271484375, 10.6007080078125, 10.918701171875, 11.2366943359375, 11.5546875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 1.0, 5.0, 8.0, 6.0, 7.0, 18.0, 17.0, 21.0, 15.0, 37.0, 48.0, 51.0, 79.0, 109.0, 114.0, 115.0, 77.0, 66.0, 43.0, 37.0, 32.0, 22.0, 19.0, 15.0, 7.0, 9.0, 10.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.14453125, -3.99530029296875, -3.8460693359375, -3.69683837890625, -3.547607421875, -3.39837646484375, -3.2491455078125, -3.09991455078125, -2.95068359375, -2.80145263671875, -2.6522216796875, -2.50299072265625, -2.353759765625, -2.20452880859375, -2.0552978515625, -1.90606689453125, -1.7568359375, -1.60760498046875, -1.4583740234375, -1.30914306640625, -1.159912109375, -1.01068115234375, -0.8614501953125, -0.71221923828125, -0.56298828125, -0.41375732421875, -0.2645263671875, -0.11529541015625, 0.033935546875, 0.18316650390625, 0.3323974609375, 0.48162841796875, 0.630859375, 0.78009033203125, 0.9293212890625, 1.07855224609375, 1.227783203125, 1.37701416015625, 1.5262451171875, 1.67547607421875, 1.82470703125, 1.97393798828125, 2.1231689453125, 2.27239990234375, 2.421630859375, 2.57086181640625, 2.7200927734375, 2.86932373046875, 3.0185546875, 3.16778564453125, 3.3170166015625, 3.46624755859375, 3.615478515625, 3.76470947265625, 3.9139404296875, 4.06317138671875, 4.21240234375, 4.36163330078125, 4.5108642578125, 4.66009521484375, 4.809326171875, 4.95855712890625, 5.1077880859375, 5.25701904296875, 5.40625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 8.0, 12.0, 20.0, 19.0, 38.0, 55.0, 75.0, 104.0, 120.0, 127.0, 130.0, 104.0, 55.0, 42.0, 39.0, 19.0, 8.0, 6.0, 9.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.84800720214844, -44.56199645996094, -42.27598571777344, -39.98997497558594, -37.70396423339844, -35.41795349121094, -33.13194274902344, -30.845932006835938, -28.559921264648438, -26.273910522460938, -23.987899780273438, -21.701889038085938, -19.415878295898438, -17.129867553710938, -14.843856811523438, -12.557846069335938, -10.271835327148438, -7.9858245849609375, -5.6998138427734375, -3.4138031005859375, -1.1277923583984375, 1.1582183837890625, 3.4442291259765625, 5.7302398681640625, 8.016250610351562, 10.302261352539062, 12.588272094726562, 14.874282836914062, 17.160293579101562, 19.446304321289062, 21.732315063476562, 24.018325805664062, 26.304336547851562, 28.590347290039062, 30.876358032226562, 33.16236877441406, 35.44837951660156, 37.73439025878906, 40.02040100097656, 42.30641174316406, 44.59242248535156, 46.87843322753906, 49.16444396972656, 51.45045471191406, 53.73646545410156, 56.02247619628906, 58.30848693847656, 60.59449768066406, 62.88050842285156, 65.16651916503906, 67.45252990722656, 69.73854064941406, 72.02455139160156, 74.31056213378906, 76.59657287597656, 78.88258361816406, 81.16859436035156, 83.45460510253906, 85.74061584472656, 88.02662658691406, 90.31263732910156, 92.59864807128906, 94.88465881347656, 97.17066955566406, 99.45668029785156]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 6.0, 7.0, 5.0, 5.0, 9.0, 14.0, 16.0, 12.0, 9.0, 28.0, 31.0, 22.0, 29.0, 27.0, 29.0, 47.0, 38.0, 39.0, 31.0, 45.0, 24.0, 42.0, 35.0, 36.0, 38.0, 30.0, 36.0, 34.0, 35.0, 38.0, 31.0, 28.0, 27.0, 23.0, 15.0, 10.0, 20.0, 10.0, 6.0, 12.0, 6.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-43.92805862426758, -42.68036651611328, -41.432674407958984, -40.18498229980469, -38.93729019165039, -37.689598083496094, -36.4419059753418, -35.1942138671875, -33.9465217590332, -32.698829650878906, -31.45113754272461, -30.203445434570312, -28.955753326416016, -27.70806121826172, -26.460369110107422, -25.212677001953125, -23.96498680114746, -22.717294692993164, -21.469602584838867, -20.22191047668457, -18.974218368530273, -17.726526260375977, -16.478836059570312, -15.2311429977417, -13.983450889587402, -12.735758781433105, -11.488066673278809, -10.240375518798828, -8.992683410644531, -7.744990825653076, -6.4972991943359375, -5.249607086181641, -4.001914978027344, -2.754222869873047, -1.506531000137329, -0.25883913040161133, 0.9888529777526855, 2.2365450859069824, 3.484236717224121, 4.731928825378418, 5.979620933532715, 7.227313041687012, 8.475005149841309, 9.722696304321289, 10.970388412475586, 12.218080520629883, 13.46577262878418, 14.713464736938477, 15.961156845092773, 17.20884895324707, 18.456541061401367, 19.704233169555664, 20.95192527770996, 22.199617385864258, 23.447307586669922, 24.69499969482422, 25.942691802978516, 27.190383911132812, 28.43807601928711, 29.685768127441406, 30.933460235595703, 32.18115234375, 33.4288444519043, 34.676536560058594, 35.92422866821289]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 16.0, 24.0, 45.0, 53.0, 86.0, 149.0, 250.0, 408.0, 771.0, 1362.0, 2619.0, 5259.0, 11703.0, 27997.0, 75704.0, 267522.0, 3152540.0, 473525.0, 106273.0, 37514.0, 15360.0, 7173.0, 3476.0, 1876.0, 994.0, 548.0, 343.0, 210.0, 151.0, 103.0, 65.0, 46.0, 36.0, 15.0, 19.0, 12.0, 6.0, 7.0, 6.0, 2.0, 2.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.53125, -6.2430419921875, -5.954833984375, -5.6666259765625, -5.37841796875, -5.0902099609375, -4.802001953125, -4.5137939453125, -4.2255859375, -3.9373779296875, -3.649169921875, -3.3609619140625, -3.07275390625, -2.7845458984375, -2.496337890625, -2.2081298828125, -1.919921875, -1.6317138671875, -1.343505859375, -1.0552978515625, -0.76708984375, -0.4788818359375, -0.190673828125, 0.0975341796875, 0.3857421875, 0.6739501953125, 0.962158203125, 1.2503662109375, 1.53857421875, 1.8267822265625, 2.114990234375, 2.4031982421875, 2.69140625, 2.9796142578125, 3.267822265625, 3.5560302734375, 3.84423828125, 4.1324462890625, 4.420654296875, 4.7088623046875, 4.9970703125, 5.2852783203125, 5.573486328125, 5.8616943359375, 6.14990234375, 6.4381103515625, 6.726318359375, 7.0145263671875, 7.302734375, 7.5909423828125, 7.879150390625, 8.1673583984375, 8.45556640625, 8.7437744140625, 9.031982421875, 9.3201904296875, 9.6083984375, 9.8966064453125, 10.184814453125, 10.4730224609375, 10.76123046875, 11.0494384765625, 11.337646484375, 11.6258544921875, 11.9140625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 3.0, 1.0, 2.0, 3.0, 5.0, 10.0, 6.0, 8.0, 12.0, 9.0, 13.0, 18.0, 18.0, 22.0, 33.0, 25.0, 28.0, 38.0, 43.0, 32.0, 37.0, 34.0, 39.0, 36.0, 39.0, 44.0, 35.0, 49.0, 41.0, 43.0, 20.0, 28.0, 21.0, 27.0, 26.0, 21.0, 18.0, 20.0, 16.0, 15.0, 14.0, 8.0, 7.0, 5.0, 6.0, 5.0, 6.0, 6.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.84619140625, -0.8159255981445312, -0.7856597900390625, -0.7553939819335938, -0.725128173828125, -0.6948623657226562, -0.6645965576171875, -0.6343307495117188, -0.60406494140625, -0.5737991333007812, -0.5435333251953125, -0.5132675170898438, -0.483001708984375, -0.45273590087890625, -0.4224700927734375, -0.39220428466796875, -0.3619384765625, -0.33167266845703125, -0.3014068603515625, -0.27114105224609375, -0.240875244140625, -0.21060943603515625, -0.1803436279296875, -0.15007781982421875, -0.11981201171875, -0.08954620361328125, -0.0592803955078125, -0.02901458740234375, 0.001251220703125, 0.03151702880859375, 0.0617828369140625, 0.09204864501953125, 0.122314453125, 0.15258026123046875, 0.1828460693359375, 0.21311187744140625, 0.243377685546875, 0.27364349365234375, 0.3039093017578125, 0.33417510986328125, 0.36444091796875, 0.39470672607421875, 0.4249725341796875, 0.45523834228515625, 0.485504150390625, 0.5157699584960938, 0.5460357666015625, 0.5763015747070312, 0.6065673828125, 0.6368331909179688, 0.6670989990234375, 0.6973648071289062, 0.727630615234375, 0.7578964233398438, 0.7881622314453125, 0.8184280395507812, 0.84869384765625, 0.8789596557617188, 0.9092254638671875, 0.9394912719726562, 0.969757080078125, 1.0000228881835938, 1.0302886962890625, 1.0605545043945312, 1.0908203125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 1.0, 3.0, 6.0, 0.0, 9.0, 10.0, 11.0, 17.0, 20.0, 26.0, 42.0, 42.0, 71.0, 101.0, 154.0, 293.0, 544.0, 1134.0, 2429.0, 5911.0, 16726.0, 63247.0, 391563.0, 3312026.0, 320327.0, 55077.0, 14820.0, 5261.0, 2208.0, 1037.0, 506.0, 260.0, 160.0, 81.0, 48.0, 42.0, 25.0, 14.0, 11.0, 10.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.75, -14.2955322265625, -13.841064453125, -13.3865966796875, -12.93212890625, -12.4776611328125, -12.023193359375, -11.5687255859375, -11.1142578125, -10.6597900390625, -10.205322265625, -9.7508544921875, -9.29638671875, -8.8419189453125, -8.387451171875, -7.9329833984375, -7.478515625, -7.0240478515625, -6.569580078125, -6.1151123046875, -5.66064453125, -5.2061767578125, -4.751708984375, -4.2972412109375, -3.8427734375, -3.3883056640625, -2.933837890625, -2.4793701171875, -2.02490234375, -1.5704345703125, -1.115966796875, -0.6614990234375, -0.20703125, 0.2474365234375, 0.701904296875, 1.1563720703125, 1.61083984375, 2.0653076171875, 2.519775390625, 2.9742431640625, 3.4287109375, 3.8831787109375, 4.337646484375, 4.7921142578125, 5.24658203125, 5.7010498046875, 6.155517578125, 6.6099853515625, 7.064453125, 7.5189208984375, 7.973388671875, 8.4278564453125, 8.88232421875, 9.3367919921875, 9.791259765625, 10.2457275390625, 10.7001953125, 11.1546630859375, 11.609130859375, 12.0635986328125, 12.51806640625, 12.9725341796875, 13.427001953125, 13.8814697265625, 14.3359375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 6.0, 8.0, 7.0, 18.0, 17.0, 22.0, 43.0, 75.0, 117.0, 196.0, 401.0, 1551.0, 889.0, 310.0, 161.0, 80.0, 44.0, 43.0, 30.0, 18.0, 12.0, 13.0, 8.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.00390625, -5.860443115234375, -5.71697998046875, -5.573516845703125, -5.4300537109375, -5.286590576171875, -5.14312744140625, -4.999664306640625, -4.856201171875, -4.712738037109375, -4.56927490234375, -4.425811767578125, -4.2823486328125, -4.138885498046875, -3.99542236328125, -3.851959228515625, -3.70849609375, -3.565032958984375, -3.42156982421875, -3.278106689453125, -3.1346435546875, -2.991180419921875, -2.84771728515625, -2.704254150390625, -2.560791015625, -2.417327880859375, -2.27386474609375, -2.130401611328125, -1.9869384765625, -1.843475341796875, -1.70001220703125, -1.556549072265625, -1.4130859375, -1.269622802734375, -1.12615966796875, -0.982696533203125, -0.8392333984375, -0.695770263671875, -0.55230712890625, -0.408843994140625, -0.265380859375, -0.121917724609375, 0.02154541015625, 0.165008544921875, 0.3084716796875, 0.451934814453125, 0.59539794921875, 0.738861083984375, 0.88232421875, 1.025787353515625, 1.16925048828125, 1.312713623046875, 1.4561767578125, 1.599639892578125, 1.74310302734375, 1.886566162109375, 2.030029296875, 2.173492431640625, 2.31695556640625, 2.460418701171875, 2.6038818359375, 2.747344970703125, 2.89080810546875, 3.034271240234375, 3.177734375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 9.0, 18.0, 38.0, 55.0, 138.0, 200.0, 223.0, 155.0, 89.0, 50.0, 20.0, 8.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.12188720703125, -37.86996841430664, -36.61804962158203, -35.36613082885742, -34.11421203613281, -32.8622932434082, -31.610374450683594, -30.358455657958984, -29.106536865234375, -27.854618072509766, -26.602699279785156, -25.350780487060547, -24.098861694335938, -22.846942901611328, -21.59502410888672, -20.34310531616211, -19.0911865234375, -17.83926773071289, -16.58734893798828, -15.335430145263672, -14.083511352539062, -12.831592559814453, -11.579673767089844, -10.327754974365234, -9.075836181640625, -7.823917388916016, -6.571998596191406, -5.320079803466797, -4.0681610107421875, -2.816242218017578, -1.5643234252929688, -0.3124046325683594, 0.9395179748535156, 2.191436767578125, 3.4433555603027344, 4.695274353027344, 5.947193145751953, 7.1991119384765625, 8.451030731201172, 9.702949523925781, 10.95486831665039, 12.206787109375, 13.45870590209961, 14.710624694824219, 15.962543487548828, 17.214462280273438, 18.466381072998047, 19.718299865722656, 20.970218658447266, 22.222137451171875, 23.474056243896484, 24.725975036621094, 25.977893829345703, 27.229812622070312, 28.481731414794922, 29.73365020751953, 30.98556900024414, 32.23748779296875, 33.48940658569336, 34.74132537841797, 35.99324417114258, 37.24516296386719, 38.4970817565918, 39.749000549316406, 41.000919342041016]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 8.0, 6.0, 4.0, 8.0, 10.0, 18.0, 17.0, 24.0, 29.0, 37.0, 22.0, 28.0, 29.0, 31.0, 36.0, 45.0, 51.0, 55.0, 45.0, 38.0, 53.0, 56.0, 42.0, 40.0, 45.0, 38.0, 36.0, 34.0, 18.0, 19.0, 20.0, 11.0, 11.0, 7.0, 10.0, 8.0, 8.0, 0.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.036359786987305, -10.6203031539917, -10.20424747467041, -9.788190841674805, -9.372135162353516, -8.95607852935791, -8.540021896362305, -8.123966217041016, -7.70790958404541, -7.291853427886963, -6.875797271728516, -6.45974063873291, -6.043684482574463, -5.627628326416016, -5.211572170257568, -4.795516014099121, -4.379459857940674, -3.9634037017822266, -3.5473473072052, -3.131291151046753, -2.7152347564697266, -2.2991786003112793, -1.883122444152832, -1.4670660495758057, -1.0510098934173584, -0.6349536180496216, -0.21889740228652954, 0.1971588134765625, 0.6132150888442993, 1.0292713642120361, 1.4453275203704834, 1.8613839149475098, 2.277440071105957, 2.6934962272644043, 3.1095526218414307, 3.525608777999878, 3.9416651725769043, 4.357721328735352, 4.773777484893799, 5.189833641052246, 5.605890274047852, 6.021946430206299, 6.438002586364746, 6.854059219360352, 7.270115375518799, 7.686171531677246, 8.102228164672852, 8.51828384399414, 8.93433952331543, 9.350396156311035, 9.766451835632324, 10.18250846862793, 10.598564147949219, 11.014620780944824, 11.43067741394043, 11.846733093261719, 12.262789726257324, 12.67884635925293, 13.094902038574219, 13.510958671569824, 13.927014350891113, 14.343070983886719, 14.759126663208008, 15.175183296203613, 15.591239929199219]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 12.0, 8.0, 7.0, 16.0, 22.0, 30.0, 36.0, 63.0, 110.0, 165.0, 297.0, 505.0, 917.0, 1749.0, 3506.0, 6623.0, 13201.0, 26149.0, 52283.0, 104125.0, 196720.0, 269050.0, 182116.0, 94977.0, 47749.0, 23464.0, 11919.0, 6003.0, 3113.0, 1664.0, 808.0, 452.0, 277.0, 138.0, 90.0, 70.0, 45.0, 21.0, 18.0, 15.0, 7.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.609375, -5.4364013671875, -5.263427734375, -5.0904541015625, -4.91748046875, -4.7445068359375, -4.571533203125, -4.3985595703125, -4.2255859375, -4.0526123046875, -3.879638671875, -3.7066650390625, -3.53369140625, -3.3607177734375, -3.187744140625, -3.0147705078125, -2.841796875, -2.6688232421875, -2.495849609375, -2.3228759765625, -2.14990234375, -1.9769287109375, -1.803955078125, -1.6309814453125, -1.4580078125, -1.2850341796875, -1.112060546875, -0.9390869140625, -0.76611328125, -0.5931396484375, -0.420166015625, -0.2471923828125, -0.07421875, 0.0987548828125, 0.271728515625, 0.4447021484375, 0.61767578125, 0.7906494140625, 0.963623046875, 1.1365966796875, 1.3095703125, 1.4825439453125, 1.655517578125, 1.8284912109375, 2.00146484375, 2.1744384765625, 2.347412109375, 2.5203857421875, 2.693359375, 2.8663330078125, 3.039306640625, 3.2122802734375, 3.38525390625, 3.5582275390625, 3.731201171875, 3.9041748046875, 4.0771484375, 4.2501220703125, 4.423095703125, 4.5960693359375, 4.76904296875, 4.9420166015625, 5.114990234375, 5.2879638671875, 5.4609375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 9.0, 4.0, 6.0, 9.0, 9.0, 16.0, 13.0, 17.0, 24.0, 17.0, 32.0, 19.0, 30.0, 44.0, 52.0, 40.0, 40.0, 46.0, 52.0, 34.0, 42.0, 45.0, 44.0, 36.0, 44.0, 37.0, 27.0, 33.0, 20.0, 35.0, 19.0, 10.0, 23.0, 10.0, 19.0, 9.0, 10.0, 9.0, 5.0, 4.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9990234375, -0.9621734619140625, -0.925323486328125, -0.8884735107421875, -0.85162353515625, -0.8147735595703125, -0.777923583984375, -0.7410736083984375, -0.7042236328125, -0.6673736572265625, -0.630523681640625, -0.5936737060546875, -0.55682373046875, -0.5199737548828125, -0.483123779296875, -0.4462738037109375, -0.409423828125, -0.3725738525390625, -0.335723876953125, -0.2988739013671875, -0.26202392578125, -0.2251739501953125, -0.188323974609375, -0.1514739990234375, -0.1146240234375, -0.0777740478515625, -0.040924072265625, -0.0040740966796875, 0.03277587890625, 0.0696258544921875, 0.106475830078125, 0.1433258056640625, 0.18017578125, 0.2170257568359375, 0.253875732421875, 0.2907257080078125, 0.32757568359375, 0.3644256591796875, 0.401275634765625, 0.4381256103515625, 0.4749755859375, 0.5118255615234375, 0.548675537109375, 0.5855255126953125, 0.62237548828125, 0.6592254638671875, 0.696075439453125, 0.7329254150390625, 0.769775390625, 0.8066253662109375, 0.843475341796875, 0.8803253173828125, 0.91717529296875, 0.9540252685546875, 0.990875244140625, 1.0277252197265625, 1.0645751953125, 1.1014251708984375, 1.138275146484375, 1.1751251220703125, 1.21197509765625, 1.2488250732421875, 1.285675048828125, 1.3225250244140625, 1.359375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 9.0, 9.0, 23.0, 17.0, 39.0, 62.0, 95.0, 179.0, 254.0, 468.0, 956.0, 2322.0, 7006.0, 25955.0, 109222.0, 409548.0, 365919.0, 93606.0, 22588.0, 6115.0, 2174.0, 891.0, 424.0, 271.0, 144.0, 95.0, 57.0, 47.0, 14.0, 19.0, 8.0, 13.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.90625, -13.5491943359375, -13.192138671875, -12.8350830078125, -12.47802734375, -12.1209716796875, -11.763916015625, -11.4068603515625, -11.0498046875, -10.6927490234375, -10.335693359375, -9.9786376953125, -9.62158203125, -9.2645263671875, -8.907470703125, -8.5504150390625, -8.193359375, -7.8363037109375, -7.479248046875, -7.1221923828125, -6.76513671875, -6.4080810546875, -6.051025390625, -5.6939697265625, -5.3369140625, -4.9798583984375, -4.622802734375, -4.2657470703125, -3.90869140625, -3.5516357421875, -3.194580078125, -2.8375244140625, -2.48046875, -2.1234130859375, -1.766357421875, -1.4093017578125, -1.05224609375, -0.6951904296875, -0.338134765625, 0.0189208984375, 0.3759765625, 0.7330322265625, 1.090087890625, 1.4471435546875, 1.80419921875, 2.1612548828125, 2.518310546875, 2.8753662109375, 3.232421875, 3.5894775390625, 3.946533203125, 4.3035888671875, 4.66064453125, 5.0177001953125, 5.374755859375, 5.7318115234375, 6.0888671875, 6.4459228515625, 6.802978515625, 7.1600341796875, 7.51708984375, 7.8741455078125, 8.231201171875, 8.5882568359375, 8.9453125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 3.0, 8.0, 7.0, 11.0, 10.0, 18.0, 19.0, 18.0, 21.0, 31.0, 31.0, 33.0, 35.0, 41.0, 59.0, 49.0, 48.0, 55.0, 45.0, 42.0, 50.0, 45.0, 39.0, 33.0, 25.0, 41.0, 32.0, 24.0, 31.0, 24.0, 18.0, 12.0, 11.0, 7.0, 5.0, 3.0, 4.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7578125, -6.525146484375, -6.29248046875, -6.059814453125, -5.8271484375, -5.594482421875, -5.36181640625, -5.129150390625, -4.896484375, -4.663818359375, -4.43115234375, -4.198486328125, -3.9658203125, -3.733154296875, -3.50048828125, -3.267822265625, -3.03515625, -2.802490234375, -2.56982421875, -2.337158203125, -2.1044921875, -1.871826171875, -1.63916015625, -1.406494140625, -1.173828125, -0.941162109375, -0.70849609375, -0.475830078125, -0.2431640625, -0.010498046875, 0.22216796875, 0.454833984375, 0.6875, 0.920166015625, 1.15283203125, 1.385498046875, 1.6181640625, 1.850830078125, 2.08349609375, 2.316162109375, 2.548828125, 2.781494140625, 3.01416015625, 3.246826171875, 3.4794921875, 3.712158203125, 3.94482421875, 4.177490234375, 4.41015625, 4.642822265625, 4.87548828125, 5.108154296875, 5.3408203125, 5.573486328125, 5.80615234375, 6.038818359375, 6.271484375, 6.504150390625, 6.73681640625, 6.969482421875, 7.2021484375, 7.434814453125, 7.66748046875, 7.900146484375, 8.1328125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 10.0, 5.0, 6.0, 21.0, 19.0, 38.0, 69.0, 107.0, 139.0, 207.0, 359.0, 673.0, 1302.0, 2920.0, 6654.0, 17965.0, 52484.0, 169929.0, 404640.0, 263241.0, 83217.0, 27049.0, 9681.0, 3975.0, 1755.0, 815.0, 477.0, 273.0, 155.0, 127.0, 65.0, 44.0, 29.0, 23.0, 20.0, 18.0, 14.0, 6.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.708984375, -3.595550537109375, -3.48211669921875, -3.368682861328125, -3.2552490234375, -3.141815185546875, -3.02838134765625, -2.914947509765625, -2.801513671875, -2.688079833984375, -2.57464599609375, -2.461212158203125, -2.3477783203125, -2.234344482421875, -2.12091064453125, -2.007476806640625, -1.89404296875, -1.780609130859375, -1.66717529296875, -1.553741455078125, -1.4403076171875, -1.326873779296875, -1.21343994140625, -1.100006103515625, -0.986572265625, -0.873138427734375, -0.75970458984375, -0.646270751953125, -0.5328369140625, -0.419403076171875, -0.30596923828125, -0.192535400390625, -0.0791015625, 0.034332275390625, 0.14776611328125, 0.261199951171875, 0.3746337890625, 0.488067626953125, 0.60150146484375, 0.714935302734375, 0.828369140625, 0.941802978515625, 1.05523681640625, 1.168670654296875, 1.2821044921875, 1.395538330078125, 1.50897216796875, 1.622406005859375, 1.73583984375, 1.849273681640625, 1.96270751953125, 2.076141357421875, 2.1895751953125, 2.303009033203125, 2.41644287109375, 2.529876708984375, 2.643310546875, 2.756744384765625, 2.87017822265625, 2.983612060546875, 3.0970458984375, 3.210479736328125, 3.32391357421875, 3.437347412109375, 3.55078125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 3.0, 3.0, 4.0, 7.0, 7.0, 13.0, 16.0, 18.0, 18.0, 24.0, 31.0, 31.0, 46.0, 62.0, 87.0, 110.0, 95.0, 81.0, 64.0, 51.0, 30.0, 34.0, 26.0, 24.0, 21.0, 14.0, 19.0, 10.0, 9.0, 9.0, 7.0, 6.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006861686706542969, -0.0006665363907814026, -0.0006469041109085083, -0.000627271831035614, -0.0006076395511627197, -0.0005880072712898254, -0.0005683749914169312, -0.0005487427115440369, -0.0005291104316711426, -0.0005094781517982483, -0.000489845871925354, -0.0004702135920524597, -0.00045058131217956543, -0.00043094903230667114, -0.00041131675243377686, -0.00039168447256088257, -0.0003720521926879883, -0.000352419912815094, -0.0003327876329421997, -0.0003131553530693054, -0.00029352307319641113, -0.00027389079332351685, -0.00025425851345062256, -0.00023462623357772827, -0.00021499395370483398, -0.0001953616738319397, -0.0001757293939590454, -0.00015609711408615112, -0.00013646483421325684, -0.00011683255434036255, -9.720027446746826e-05, -7.756799459457397e-05, -5.793571472167969e-05, -3.83034348487854e-05, -1.8671154975891113e-05, 9.611248970031738e-07, 2.059340476989746e-05, 4.022568464279175e-05, 5.9857964515686035e-05, 7.949024438858032e-05, 9.912252426147461e-05, 0.0001187548041343689, 0.00013838708400726318, 0.00015801936388015747, 0.00017765164375305176, 0.00019728392362594604, 0.00021691620349884033, 0.00023654848337173462, 0.0002561807632446289, 0.0002758130431175232, 0.0002954453229904175, 0.00031507760286331177, 0.00033470988273620605, 0.00035434216260910034, 0.00037397444248199463, 0.0003936067223548889, 0.0004132390022277832, 0.0004328712821006775, 0.0004525035619735718, 0.00047213584184646606, 0.0004917681217193604, 0.0005114004015922546, 0.0005310326814651489, 0.0005506649613380432, 0.0005702972412109375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 6.0, 4.0, 4.0, 14.0, 24.0, 28.0, 45.0, 63.0, 100.0, 185.0, 363.0, 623.0, 1513.0, 4282.0, 14188.0, 63464.0, 365210.0, 482383.0, 88416.0, 18788.0, 5309.0, 1848.0, 774.0, 387.0, 202.0, 122.0, 74.0, 40.0, 29.0, 23.0, 17.0, 7.0, 7.0, 3.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.390625, -6.20855712890625, -6.0264892578125, -5.84442138671875, -5.662353515625, -5.48028564453125, -5.2982177734375, -5.11614990234375, -4.93408203125, -4.75201416015625, -4.5699462890625, -4.38787841796875, -4.205810546875, -4.02374267578125, -3.8416748046875, -3.65960693359375, -3.4775390625, -3.29547119140625, -3.1134033203125, -2.93133544921875, -2.749267578125, -2.56719970703125, -2.3851318359375, -2.20306396484375, -2.02099609375, -1.83892822265625, -1.6568603515625, -1.47479248046875, -1.292724609375, -1.11065673828125, -0.9285888671875, -0.74652099609375, -0.564453125, -0.38238525390625, -0.2003173828125, -0.01824951171875, 0.163818359375, 0.34588623046875, 0.5279541015625, 0.71002197265625, 0.89208984375, 1.07415771484375, 1.2562255859375, 1.43829345703125, 1.620361328125, 1.80242919921875, 1.9844970703125, 2.16656494140625, 2.3486328125, 2.53070068359375, 2.7127685546875, 2.89483642578125, 3.076904296875, 3.25897216796875, 3.4410400390625, 3.62310791015625, 3.80517578125, 3.98724365234375, 4.1693115234375, 4.35137939453125, 4.533447265625, 4.71551513671875, 4.8975830078125, 5.07965087890625, 5.26171875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 2.0, 6.0, 10.0, 8.0, 20.0, 21.0, 24.0, 26.0, 44.0, 78.0, 90.0, 97.0, 114.0, 105.0, 82.0, 67.0, 53.0, 47.0, 31.0, 24.0, 17.0, 13.0, 5.0, 5.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.68359375, -4.556060791015625, -4.42852783203125, -4.300994873046875, -4.1734619140625, -4.045928955078125, -3.91839599609375, -3.790863037109375, -3.663330078125, -3.535797119140625, -3.40826416015625, -3.280731201171875, -3.1531982421875, -3.025665283203125, -2.89813232421875, -2.770599365234375, -2.64306640625, -2.515533447265625, -2.38800048828125, -2.260467529296875, -2.1329345703125, -2.005401611328125, -1.87786865234375, -1.750335693359375, -1.622802734375, -1.495269775390625, -1.36773681640625, -1.240203857421875, -1.1126708984375, -0.985137939453125, -0.85760498046875, -0.730072021484375, -0.6025390625, -0.475006103515625, -0.34747314453125, -0.219940185546875, -0.0924072265625, 0.035125732421875, 0.16265869140625, 0.290191650390625, 0.417724609375, 0.545257568359375, 0.67279052734375, 0.800323486328125, 0.9278564453125, 1.055389404296875, 1.18292236328125, 1.310455322265625, 1.43798828125, 1.565521240234375, 1.69305419921875, 1.820587158203125, 1.9481201171875, 2.075653076171875, 2.20318603515625, 2.330718994140625, 2.458251953125, 2.585784912109375, 2.71331787109375, 2.840850830078125, 2.9683837890625, 3.095916748046875, 3.22344970703125, 3.350982666015625, 3.478515625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 6.0, 5.0, 17.0, 17.0, 21.0, 30.0, 46.0, 68.0, 77.0, 101.0, 106.0, 109.0, 99.0, 78.0, 56.0, 55.0, 34.0, 26.0, 18.0, 12.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.19007873535156, -33.72486114501953, -32.259639739990234, -30.79442024230957, -29.329200744628906, -27.863981246948242, -26.398761749267578, -24.933544158935547, -23.46832275390625, -22.003103256225586, -20.537883758544922, -19.072664260864258, -17.607444763183594, -16.14222526550293, -14.677006721496582, -13.211787223815918, -11.74656867980957, -10.281349182128906, -8.816129684448242, -7.350910663604736, -5.885691165924072, -4.420471668243408, -2.9552526473999023, -1.4900331497192383, -0.02481365203857422, 1.4404057264328003, 2.905625104904175, 4.37084436416626, 5.836063861846924, 7.301283359527588, 8.766502380371094, 10.231721878051758, 11.696941375732422, 13.162160873413086, 14.62738037109375, 16.092599868774414, 17.557819366455078, 19.023038864135742, 20.488258361816406, 21.953475952148438, 23.418697357177734, 24.8839168548584, 26.349136352539062, 27.814355850219727, 29.27957534790039, 30.744794845581055, 32.21001434326172, 33.67523193359375, 35.14044952392578, 36.60566711425781, 38.07088851928711, 39.53610610961914, 41.00132751464844, 42.46654510498047, 43.931766510009766, 45.3969841003418, 46.862205505371094, 48.327423095703125, 49.79264450073242, 51.25786209106445, 52.72308349609375, 54.18830108642578, 55.65352249145508, 57.11874008178711, 58.583961486816406]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 8.0, 4.0, 7.0, 6.0, 7.0, 12.0, 11.0, 14.0, 23.0, 15.0, 22.0, 39.0, 28.0, 35.0, 36.0, 32.0, 43.0, 48.0, 37.0, 46.0, 42.0, 60.0, 63.0, 42.0, 44.0, 39.0, 32.0, 37.0, 36.0, 21.0, 19.0, 27.0, 9.0, 19.0, 10.0, 9.0, 10.0, 6.0, 1.0, 0.0, 2.0, 7.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.91481018066406, -43.638980865478516, -42.36315155029297, -41.08732604980469, -39.81149673461914, -38.535667419433594, -37.25984191894531, -35.984012603759766, -34.70818328857422, -33.43235397338867, -32.156524658203125, -30.880699157714844, -29.604869842529297, -28.32904052734375, -27.053213119506836, -25.777385711669922, -24.501556396484375, -23.225727081298828, -21.949899673461914, -20.674072265625, -19.398242950439453, -18.122413635253906, -16.846586227416992, -15.570757865905762, -14.294929504394531, -13.0191011428833, -11.74327278137207, -10.46744441986084, -9.19161605834961, -7.915787696838379, -6.639959335327148, -5.364130973815918, -4.088298797607422, -2.8124704360961914, -1.536642074584961, -0.26081371307373047, 1.0150146484375, 2.2908430099487305, 3.566671371459961, 4.842499732971191, 6.118328094482422, 7.394156455993652, 8.669984817504883, 9.945813179016113, 11.221641540527344, 12.497469902038574, 13.773298263549805, 15.049126625061035, 16.324954986572266, 17.600784301757812, 18.876611709594727, 20.15243911743164, 21.428268432617188, 22.704097747802734, 23.97992515563965, 25.255752563476562, 26.53158187866211, 27.807411193847656, 29.08323860168457, 30.359066009521484, 31.63489532470703, 32.91072463989258, 34.186553955078125, 35.462379455566406, 36.73820877075195]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 7.0, 15.0, 12.0, 18.0, 29.0, 49.0, 63.0, 120.0, 154.0, 300.0, 489.0, 884.0, 1530.0, 2893.0, 5848.0, 12998.0, 32458.0, 105573.0, 947738.0, 2887371.0, 129254.0, 37481.0, 14614.0, 6655.0, 3302.0, 1821.0, 1095.0, 554.0, 347.0, 209.0, 131.0, 79.0, 63.0, 43.0, 25.0, 19.0, 15.0, 9.0, 6.0, 6.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.01953125, -6.73956298828125, -6.4595947265625, -6.17962646484375, -5.899658203125, -5.61968994140625, -5.3397216796875, -5.05975341796875, -4.77978515625, -4.49981689453125, -4.2198486328125, -3.93988037109375, -3.659912109375, -3.37994384765625, -3.0999755859375, -2.82000732421875, -2.5400390625, -2.26007080078125, -1.9801025390625, -1.70013427734375, -1.420166015625, -1.14019775390625, -0.8602294921875, -0.58026123046875, -0.30029296875, -0.02032470703125, 0.2596435546875, 0.53961181640625, 0.819580078125, 1.09954833984375, 1.3795166015625, 1.65948486328125, 1.939453125, 2.21942138671875, 2.4993896484375, 2.77935791015625, 3.059326171875, 3.33929443359375, 3.6192626953125, 3.89923095703125, 4.17919921875, 4.45916748046875, 4.7391357421875, 5.01910400390625, 5.299072265625, 5.57904052734375, 5.8590087890625, 6.13897705078125, 6.4189453125, 6.69891357421875, 6.9788818359375, 7.25885009765625, 7.538818359375, 7.81878662109375, 8.0987548828125, 8.37872314453125, 8.65869140625, 8.93865966796875, 9.2186279296875, 9.49859619140625, 9.778564453125, 10.05853271484375, 10.3385009765625, 10.61846923828125, 10.8984375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 4.0, 7.0, 8.0, 10.0, 10.0, 18.0, 18.0, 22.0, 18.0, 34.0, 30.0, 37.0, 38.0, 36.0, 38.0, 48.0, 51.0, 42.0, 41.0, 45.0, 34.0, 43.0, 39.0, 44.0, 36.0, 27.0, 38.0, 28.0, 29.0, 12.0, 21.0, 21.0, 12.0, 9.0, 14.0, 6.0, 3.0, 9.0, 8.0, 5.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0556640625, -1.0164794921875, -0.977294921875, -0.9381103515625, -0.89892578125, -0.8597412109375, -0.820556640625, -0.7813720703125, -0.7421875, -0.7030029296875, -0.663818359375, -0.6246337890625, -0.58544921875, -0.5462646484375, -0.507080078125, -0.4678955078125, -0.4287109375, -0.3895263671875, -0.350341796875, -0.3111572265625, -0.27197265625, -0.2327880859375, -0.193603515625, -0.1544189453125, -0.115234375, -0.0760498046875, -0.036865234375, 0.0023193359375, 0.04150390625, 0.0806884765625, 0.119873046875, 0.1590576171875, 0.1982421875, 0.2374267578125, 0.276611328125, 0.3157958984375, 0.35498046875, 0.3941650390625, 0.433349609375, 0.4725341796875, 0.51171875, 0.5509033203125, 0.590087890625, 0.6292724609375, 0.66845703125, 0.7076416015625, 0.746826171875, 0.7860107421875, 0.8251953125, 0.8643798828125, 0.903564453125, 0.9427490234375, 0.98193359375, 1.0211181640625, 1.060302734375, 1.0994873046875, 1.138671875, 1.1778564453125, 1.217041015625, 1.2562255859375, 1.29541015625, 1.3345947265625, 1.373779296875, 1.4129638671875, 1.4521484375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 6.0, 11.0, 11.0, 18.0, 18.0, 44.0, 68.0, 98.0, 151.0, 352.0, 888.0, 2241.0, 6888.0, 25778.0, 151278.0, 3366594.0, 561505.0, 59668.0, 12659.0, 3751.0, 1301.0, 444.0, 225.0, 95.0, 61.0, 47.0, 36.0, 25.0, 4.0, 10.0, 3.0, 3.0, 0.0, 2.0, 2.0], "bins": [-20.484375, -20.0267333984375, -19.569091796875, -19.1114501953125, -18.65380859375, -18.1961669921875, -17.738525390625, -17.2808837890625, -16.8232421875, -16.3656005859375, -15.907958984375, -15.4503173828125, -14.99267578125, -14.5350341796875, -14.077392578125, -13.6197509765625, -13.162109375, -12.7044677734375, -12.246826171875, -11.7891845703125, -11.33154296875, -10.8739013671875, -10.416259765625, -9.9586181640625, -9.5009765625, -9.0433349609375, -8.585693359375, -8.1280517578125, -7.67041015625, -7.2127685546875, -6.755126953125, -6.2974853515625, -5.83984375, -5.3822021484375, -4.924560546875, -4.4669189453125, -4.00927734375, -3.5516357421875, -3.093994140625, -2.6363525390625, -2.1787109375, -1.7210693359375, -1.263427734375, -0.8057861328125, -0.34814453125, 0.1094970703125, 0.567138671875, 1.0247802734375, 1.482421875, 1.9400634765625, 2.397705078125, 2.8553466796875, 3.31298828125, 3.7706298828125, 4.228271484375, 4.6859130859375, 5.1435546875, 5.6011962890625, 6.058837890625, 6.5164794921875, 6.97412109375, 7.4317626953125, 7.889404296875, 8.3470458984375, 8.8046875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 3.0, 5.0, 0.0, 4.0, 10.0, 4.0, 4.0, 13.0, 20.0, 27.0, 40.0, 45.0, 74.0, 78.0, 176.0, 300.0, 812.0, 1544.0, 369.0, 175.0, 128.0, 74.0, 42.0, 41.0, 25.0, 23.0, 12.0, 6.0, 9.0, 5.0, 3.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.50390625, -3.40435791015625, -3.3048095703125, -3.20526123046875, -3.105712890625, -3.00616455078125, -2.9066162109375, -2.80706787109375, -2.70751953125, -2.60797119140625, -2.5084228515625, -2.40887451171875, -2.309326171875, -2.20977783203125, -2.1102294921875, -2.01068115234375, -1.9111328125, -1.81158447265625, -1.7120361328125, -1.61248779296875, -1.512939453125, -1.41339111328125, -1.3138427734375, -1.21429443359375, -1.11474609375, -1.01519775390625, -0.9156494140625, -0.81610107421875, -0.716552734375, -0.61700439453125, -0.5174560546875, -0.41790771484375, -0.318359375, -0.21881103515625, -0.1192626953125, -0.01971435546875, 0.079833984375, 0.17938232421875, 0.2789306640625, 0.37847900390625, 0.47802734375, 0.57757568359375, 0.6771240234375, 0.77667236328125, 0.876220703125, 0.97576904296875, 1.0753173828125, 1.17486572265625, 1.2744140625, 1.37396240234375, 1.4735107421875, 1.57305908203125, 1.672607421875, 1.77215576171875, 1.8717041015625, 1.97125244140625, 2.07080078125, 2.17034912109375, 2.2698974609375, 2.36944580078125, 2.468994140625, 2.56854248046875, 2.6680908203125, 2.76763916015625, 2.8671875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 5.0, 3.0, 10.0, 33.0, 84.0, 189.0, 218.0, 218.0, 145.0, 75.0, 14.0, 9.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-70.64749145507812, -69.31462860107422, -67.98176574707031, -66.64889526367188, -65.31603240966797, -63.98316955566406, -62.65030288696289, -61.31743621826172, -59.98457336425781, -58.651710510253906, -57.318843841552734, -55.98597717285156, -54.653114318847656, -53.32025146484375, -51.98738479614258, -50.654518127441406, -49.3216552734375, -47.988792419433594, -46.65592575073242, -45.32305908203125, -43.990196228027344, -42.65733337402344, -41.324466705322266, -39.991600036621094, -38.65873718261719, -37.32587432861328, -35.99300765991211, -34.66014099121094, -33.32727813720703, -31.994413375854492, -30.661548614501953, -29.328683853149414, -27.99582290649414, -26.6629581451416, -25.330093383789062, -23.997228622436523, -22.664363861083984, -21.331499099731445, -19.998634338378906, -18.665769577026367, -17.332904815673828, -16.00004005432129, -14.66717529296875, -13.334310531616211, -12.001445770263672, -10.668581008911133, -9.335716247558594, -8.002851486206055, -6.669985771179199, -5.33712100982666, -4.004256248474121, -2.671391487121582, -1.338526725769043, -0.005661964416503906, 1.3272027969360352, 2.660067558288574, 3.9929323196411133, 5.325797080993652, 6.658661842346191, 7.9915266036987305, 9.32439136505127, 10.657256126403809, 11.990120887756348, 13.322985649108887, 14.655850410461426]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 4.0, 5.0, 11.0, 3.0, 14.0, 11.0, 14.0, 15.0, 26.0, 28.0, 32.0, 27.0, 31.0, 30.0, 28.0, 38.0, 34.0, 34.0, 47.0, 41.0, 35.0, 46.0, 43.0, 29.0, 47.0, 36.0, 37.0, 38.0, 19.0, 35.0, 18.0, 16.0, 17.0, 25.0, 18.0, 13.0, 10.0, 9.0, 6.0, 7.0, 3.0, 4.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.230280876159668, -8.92189884185791, -8.613516807556152, -8.305134773254395, -7.996753215789795, -7.688371181488037, -7.3799896240234375, -7.07160758972168, -6.763225555419922, -6.454843521118164, -6.146461486816406, -5.838079929351807, -5.529697895050049, -5.221315860748291, -4.912934303283691, -4.604552268981934, -4.296170234680176, -3.987788200378418, -3.6794064044952393, -3.3710246086120605, -3.0626425743103027, -2.754260540008545, -2.445878744125366, -2.1374969482421875, -1.8291149139404297, -1.5207329988479614, -1.2123510837554932, -0.9039691686630249, -0.5955872535705566, -0.2872053384780884, 0.021176576614379883, 0.3295583724975586, 0.6379413604736328, 0.9463232755661011, 1.2547051906585693, 1.5630871057510376, 1.8714690208435059, 2.1798510551452637, 2.4882328510284424, 2.796614646911621, 3.104996681213379, 3.4133787155151367, 3.7217605113983154, 4.030142307281494, 4.338524341583252, 4.64690637588501, 4.955287933349609, 5.263669967651367, 5.572052001953125, 5.880434036254883, 6.188816070556641, 6.49719762802124, 6.805579662322998, 7.113961696624756, 7.4223432540893555, 7.730725288391113, 8.039107322692871, 8.347489356994629, 8.655871391296387, 8.964253425598145, 9.272634506225586, 9.581016540527344, 9.889398574829102, 10.19778060913086, 10.506162643432617]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 9.0, 6.0, 7.0, 27.0, 28.0, 45.0, 92.0, 162.0, 335.0, 645.0, 1311.0, 2586.0, 5266.0, 11334.0, 24786.0, 55826.0, 123524.0, 247585.0, 284232.0, 158365.0, 72177.0, 32398.0, 14538.0, 6750.0, 3271.0, 1532.0, 824.0, 407.0, 217.0, 96.0, 73.0, 44.0, 23.0, 11.0, 9.0, 4.0, 4.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.24609375, -5.059814453125, -4.87353515625, -4.687255859375, -4.5009765625, -4.314697265625, -4.12841796875, -3.942138671875, -3.755859375, -3.569580078125, -3.38330078125, -3.197021484375, -3.0107421875, -2.824462890625, -2.63818359375, -2.451904296875, -2.265625, -2.079345703125, -1.89306640625, -1.706787109375, -1.5205078125, -1.334228515625, -1.14794921875, -0.961669921875, -0.775390625, -0.589111328125, -0.40283203125, -0.216552734375, -0.0302734375, 0.156005859375, 0.34228515625, 0.528564453125, 0.71484375, 0.901123046875, 1.08740234375, 1.273681640625, 1.4599609375, 1.646240234375, 1.83251953125, 2.018798828125, 2.205078125, 2.391357421875, 2.57763671875, 2.763916015625, 2.9501953125, 3.136474609375, 3.32275390625, 3.509033203125, 3.6953125, 3.881591796875, 4.06787109375, 4.254150390625, 4.4404296875, 4.626708984375, 4.81298828125, 4.999267578125, 5.185546875, 5.371826171875, 5.55810546875, 5.744384765625, 5.9306640625, 6.116943359375, 6.30322265625, 6.489501953125, 6.67578125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 10.0, 8.0, 7.0, 11.0, 17.0, 18.0, 21.0, 15.0, 21.0, 30.0, 30.0, 22.0, 39.0, 40.0, 34.0, 34.0, 54.0, 34.0, 47.0, 42.0, 38.0, 34.0, 30.0, 38.0, 38.0, 36.0, 26.0, 30.0, 23.0, 15.0, 29.0, 16.0, 15.0, 14.0, 9.0, 15.0, 4.0, 10.0, 12.0, 6.0, 9.0, 1.0, 4.0, 4.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.046875, -1.01129150390625, -0.9757080078125, -0.94012451171875, -0.904541015625, -0.86895751953125, -0.8333740234375, -0.79779052734375, -0.76220703125, -0.72662353515625, -0.6910400390625, -0.65545654296875, -0.619873046875, -0.58428955078125, -0.5487060546875, -0.51312255859375, -0.4775390625, -0.44195556640625, -0.4063720703125, -0.37078857421875, -0.335205078125, -0.29962158203125, -0.2640380859375, -0.22845458984375, -0.19287109375, -0.15728759765625, -0.1217041015625, -0.08612060546875, -0.050537109375, -0.01495361328125, 0.0206298828125, 0.05621337890625, 0.091796875, 0.12738037109375, 0.1629638671875, 0.19854736328125, 0.234130859375, 0.26971435546875, 0.3052978515625, 0.34088134765625, 0.37646484375, 0.41204833984375, 0.4476318359375, 0.48321533203125, 0.518798828125, 0.55438232421875, 0.5899658203125, 0.62554931640625, 0.6611328125, 0.69671630859375, 0.7322998046875, 0.76788330078125, 0.803466796875, 0.83905029296875, 0.8746337890625, 0.91021728515625, 0.94580078125, 0.98138427734375, 1.0169677734375, 1.05255126953125, 1.088134765625, 1.12371826171875, 1.1593017578125, 1.19488525390625, 1.23046875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 5.0, 9.0, 9.0, 19.0, 19.0, 33.0, 63.0, 73.0, 112.0, 191.0, 376.0, 589.0, 1266.0, 3077.0, 9107.0, 33493.0, 140052.0, 468586.0, 293395.0, 70966.0, 17643.0, 5324.0, 2012.0, 912.0, 491.0, 280.0, 152.0, 95.0, 63.0, 50.0, 22.0, 22.0, 13.0, 11.0, 6.0, 6.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5, -9.200927734375, -8.90185546875, -8.602783203125, -8.3037109375, -8.004638671875, -7.70556640625, -7.406494140625, -7.107421875, -6.808349609375, -6.50927734375, -6.210205078125, -5.9111328125, -5.612060546875, -5.31298828125, -5.013916015625, -4.71484375, -4.415771484375, -4.11669921875, -3.817626953125, -3.5185546875, -3.219482421875, -2.92041015625, -2.621337890625, -2.322265625, -2.023193359375, -1.72412109375, -1.425048828125, -1.1259765625, -0.826904296875, -0.52783203125, -0.228759765625, 0.0703125, 0.369384765625, 0.66845703125, 0.967529296875, 1.2666015625, 1.565673828125, 1.86474609375, 2.163818359375, 2.462890625, 2.761962890625, 3.06103515625, 3.360107421875, 3.6591796875, 3.958251953125, 4.25732421875, 4.556396484375, 4.85546875, 5.154541015625, 5.45361328125, 5.752685546875, 6.0517578125, 6.350830078125, 6.64990234375, 6.948974609375, 7.248046875, 7.547119140625, 7.84619140625, 8.145263671875, 8.4443359375, 8.743408203125, 9.04248046875, 9.341552734375, 9.640625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 0.0, 2.0, 5.0, 6.0, 1.0, 8.0, 6.0, 9.0, 16.0, 23.0, 23.0, 26.0, 26.0, 32.0, 38.0, 41.0, 57.0, 44.0, 45.0, 56.0, 47.0, 63.0, 45.0, 35.0, 46.0, 45.0, 32.0, 47.0, 36.0, 38.0, 19.0, 20.0, 17.0, 13.0, 12.0, 15.0, 5.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.8203125, -7.60296630859375, -7.3856201171875, -7.16827392578125, -6.950927734375, -6.73358154296875, -6.5162353515625, -6.29888916015625, -6.08154296875, -5.86419677734375, -5.6468505859375, -5.42950439453125, -5.212158203125, -4.99481201171875, -4.7774658203125, -4.56011962890625, -4.3427734375, -4.12542724609375, -3.9080810546875, -3.69073486328125, -3.473388671875, -3.25604248046875, -3.0386962890625, -2.82135009765625, -2.60400390625, -2.38665771484375, -2.1693115234375, -1.95196533203125, -1.734619140625, -1.51727294921875, -1.2999267578125, -1.08258056640625, -0.865234375, -0.64788818359375, -0.4305419921875, -0.21319580078125, 0.004150390625, 0.22149658203125, 0.4388427734375, 0.65618896484375, 0.87353515625, 1.09088134765625, 1.3082275390625, 1.52557373046875, 1.742919921875, 1.96026611328125, 2.1776123046875, 2.39495849609375, 2.6123046875, 2.82965087890625, 3.0469970703125, 3.26434326171875, 3.481689453125, 3.69903564453125, 3.9163818359375, 4.13372802734375, 4.35107421875, 4.56842041015625, 4.7857666015625, 5.00311279296875, 5.220458984375, 5.43780517578125, 5.6551513671875, 5.87249755859375, 6.08984375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 11.0, 5.0, 8.0, 10.0, 11.0, 18.0, 33.0, 56.0, 72.0, 124.0, 193.0, 400.0, 715.0, 1569.0, 3703.0, 9824.0, 33535.0, 176642.0, 574567.0, 193450.0, 35920.0, 10528.0, 3759.0, 1635.0, 756.0, 394.0, 234.0, 119.0, 88.0, 53.0, 35.0, 23.0, 17.0, 13.0, 11.0, 4.0, 5.0, 1.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.28125, -5.12371826171875, -4.9661865234375, -4.80865478515625, -4.651123046875, -4.49359130859375, -4.3360595703125, -4.17852783203125, -4.02099609375, -3.86346435546875, -3.7059326171875, -3.54840087890625, -3.390869140625, -3.23333740234375, -3.0758056640625, -2.91827392578125, -2.7607421875, -2.60321044921875, -2.4456787109375, -2.28814697265625, -2.130615234375, -1.97308349609375, -1.8155517578125, -1.65802001953125, -1.50048828125, -1.34295654296875, -1.1854248046875, -1.02789306640625, -0.870361328125, -0.71282958984375, -0.5552978515625, -0.39776611328125, -0.240234375, -0.08270263671875, 0.0748291015625, 0.23236083984375, 0.389892578125, 0.54742431640625, 0.7049560546875, 0.86248779296875, 1.02001953125, 1.17755126953125, 1.3350830078125, 1.49261474609375, 1.650146484375, 1.80767822265625, 1.9652099609375, 2.12274169921875, 2.2802734375, 2.43780517578125, 2.5953369140625, 2.75286865234375, 2.910400390625, 3.06793212890625, 3.2254638671875, 3.38299560546875, 3.54052734375, 3.69805908203125, 3.8555908203125, 4.01312255859375, 4.170654296875, 4.32818603515625, 4.4857177734375, 4.64324951171875, 4.80078125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 15.0, 17.0, 20.0, 29.0, 38.0, 60.0, 74.0, 140.0, 150.0, 121.0, 76.0, 66.0, 37.0, 33.0, 30.0, 21.0, 13.0, 12.0, 9.0, 10.0, 3.0, 3.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009298324584960938, -0.0008983910083770752, -0.0008669495582580566, -0.0008355081081390381, -0.0008040666580200195, -0.000772625207901001, -0.0007411837577819824, -0.0007097423076629639, -0.0006783008575439453, -0.0006468594074249268, -0.0006154179573059082, -0.0005839765071868896, -0.0005525350570678711, -0.0005210936069488525, -0.000489652156829834, -0.00045821070671081543, -0.0004267692565917969, -0.0003953278064727783, -0.00036388635635375977, -0.0003324449062347412, -0.00030100345611572266, -0.0002695620059967041, -0.00023812055587768555, -0.000206679105758667, -0.00017523765563964844, -0.00014379620552062988, -0.00011235475540161133, -8.091330528259277e-05, -4.947185516357422e-05, -1.8030405044555664e-05, 1.341104507446289e-05, 4.4852495193481445e-05, 7.62939453125e-05, 0.00010773539543151855, 0.0001391768455505371, 0.00017061829566955566, 0.00020205974578857422, 0.00023350119590759277, 0.00026494264602661133, 0.0002963840961456299, 0.00032782554626464844, 0.000359266996383667, 0.00039070844650268555, 0.0004221498966217041, 0.00045359134674072266, 0.0004850327968597412, 0.0005164742469787598, 0.0005479156970977783, 0.0005793571472167969, 0.0006107985973358154, 0.000642240047454834, 0.0006736814975738525, 0.0007051229476928711, 0.0007365643978118896, 0.0007680058479309082, 0.0007994472980499268, 0.0008308887481689453, 0.0008623301982879639, 0.0008937716484069824, 0.000925213098526001, 0.0009566545486450195, 0.000988095998764038, 0.0010195374488830566, 0.0010509788990020752, 0.0010824203491210938]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 12.0, 3.0, 18.0, 16.0, 21.0, 29.0, 47.0, 83.0, 157.0, 262.0, 430.0, 847.0, 1832.0, 4160.0, 11288.0, 39326.0, 236508.0, 597416.0, 117942.0, 24185.0, 7872.0, 3097.0, 1391.0, 654.0, 400.0, 209.0, 131.0, 76.0, 50.0, 25.0, 16.0, 16.0, 9.0, 5.0, 6.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.49609375, -6.31219482421875, -6.1282958984375, -5.94439697265625, -5.760498046875, -5.57659912109375, -5.3927001953125, -5.20880126953125, -5.02490234375, -4.84100341796875, -4.6571044921875, -4.47320556640625, -4.289306640625, -4.10540771484375, -3.9215087890625, -3.73760986328125, -3.5537109375, -3.36981201171875, -3.1859130859375, -3.00201416015625, -2.818115234375, -2.63421630859375, -2.4503173828125, -2.26641845703125, -2.08251953125, -1.89862060546875, -1.7147216796875, -1.53082275390625, -1.346923828125, -1.16302490234375, -0.9791259765625, -0.79522705078125, -0.611328125, -0.42742919921875, -0.2435302734375, -0.05963134765625, 0.124267578125, 0.30816650390625, 0.4920654296875, 0.67596435546875, 0.85986328125, 1.04376220703125, 1.2276611328125, 1.41156005859375, 1.595458984375, 1.77935791015625, 1.9632568359375, 2.14715576171875, 2.3310546875, 2.51495361328125, 2.6988525390625, 2.88275146484375, 3.066650390625, 3.25054931640625, 3.4344482421875, 3.61834716796875, 3.80224609375, 3.98614501953125, 4.1700439453125, 4.35394287109375, 4.537841796875, 4.72174072265625, 4.9056396484375, 5.08953857421875, 5.2734375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 2.0, 12.0, 11.0, 10.0, 13.0, 18.0, 36.0, 43.0, 77.0, 96.0, 125.0, 120.0, 122.0, 93.0, 68.0, 40.0, 33.0, 29.0, 10.0, 13.0, 7.0, 2.0, 2.0, 5.0, 2.0, 1.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.47265625, -4.32940673828125, -4.1861572265625, -4.04290771484375, -3.899658203125, -3.75640869140625, -3.6131591796875, -3.46990966796875, -3.32666015625, -3.18341064453125, -3.0401611328125, -2.89691162109375, -2.753662109375, -2.61041259765625, -2.4671630859375, -2.32391357421875, -2.1806640625, -2.03741455078125, -1.8941650390625, -1.75091552734375, -1.607666015625, -1.46441650390625, -1.3211669921875, -1.17791748046875, -1.03466796875, -0.89141845703125, -0.7481689453125, -0.60491943359375, -0.461669921875, -0.31842041015625, -0.1751708984375, -0.03192138671875, 0.111328125, 0.25457763671875, 0.3978271484375, 0.54107666015625, 0.684326171875, 0.82757568359375, 0.9708251953125, 1.11407470703125, 1.25732421875, 1.40057373046875, 1.5438232421875, 1.68707275390625, 1.830322265625, 1.97357177734375, 2.1168212890625, 2.26007080078125, 2.4033203125, 2.54656982421875, 2.6898193359375, 2.83306884765625, 2.976318359375, 3.11956787109375, 3.2628173828125, 3.40606689453125, 3.54931640625, 3.69256591796875, 3.8358154296875, 3.97906494140625, 4.122314453125, 4.26556396484375, 4.4088134765625, 4.55206298828125, 4.6953125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 10.0, 9.0, 28.0, 38.0, 82.0, 83.0, 117.0, 133.0, 148.0, 127.0, 94.0, 49.0, 31.0, 27.0, 7.0, 6.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.88172912597656, -52.98841094970703, -51.0950927734375, -49.20177459716797, -47.30845642089844, -45.415138244628906, -43.521820068359375, -41.628501892089844, -39.73518371582031, -37.84186553955078, -35.94854736328125, -34.05522918701172, -32.16191101074219, -30.268592834472656, -28.375276565551758, -26.481958389282227, -24.588642120361328, -22.695323944091797, -20.802005767822266, -18.908687591552734, -17.015369415283203, -15.122052192687988, -13.228734970092773, -11.335416793823242, -9.442098617553711, -7.54878044128418, -5.655462741851807, -3.7621450424194336, -1.8688268661499023, 0.024491310119628906, 1.9178085327148438, 3.811126708984375, 5.704444885253906, 7.5977630615234375, 9.491081237792969, 11.384398460388184, 13.277716636657715, 15.171034812927246, 17.06435203552246, 18.957670211791992, 20.850988388061523, 22.744306564331055, 24.637624740600586, 26.530941009521484, 28.424259185791016, 30.317577362060547, 32.21089553833008, 34.10421371459961, 35.99753189086914, 37.89085006713867, 39.7841682434082, 41.677486419677734, 43.570804595947266, 45.4641227722168, 47.35743713378906, 49.250755310058594, 51.144073486328125, 53.037391662597656, 54.93070983886719, 56.82402801513672, 58.71734619140625, 60.61066436767578, 62.50398254394531, 64.39730072021484, 66.29061889648438]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 9.0, 8.0, 14.0, 16.0, 18.0, 15.0, 19.0, 16.0, 31.0, 37.0, 31.0, 48.0, 51.0, 51.0, 53.0, 51.0, 53.0, 54.0, 64.0, 49.0, 35.0, 42.0, 50.0, 34.0, 26.0, 14.0, 16.0, 16.0, 12.0, 9.0, 11.0, 7.0, 9.0, 5.0, 7.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-39.06239700317383, -37.87954330444336, -36.696685791015625, -35.513832092285156, -34.33097839355469, -33.14812469482422, -31.965267181396484, -30.782413482666016, -29.599557876586914, -28.416702270507812, -27.233848571777344, -26.050992965698242, -24.86813735961914, -23.685283660888672, -22.50242805480957, -21.31957244873047, -20.13671875, -18.9538631439209, -17.77100944519043, -16.588153839111328, -15.405299186706543, -14.222444534301758, -13.039588928222656, -11.856734275817871, -10.673879623413086, -9.4910249710083, -8.308170318603516, -7.125314712524414, -5.942460060119629, -4.759605407714844, -3.5767502784729004, -2.393895149230957, -1.2110443115234375, -0.028189420700073242, 1.154665470123291, 2.3375203609466553, 3.5203752517700195, 4.703229904174805, 5.886085033416748, 7.068940162658691, 8.251794815063477, 9.434649467468262, 10.617504119873047, 11.800359725952148, 12.983214378356934, 14.166069030761719, 15.34892463684082, 16.531780242919922, 17.71463394165039, 18.897489547729492, 20.08034324645996, 21.263198852539062, 22.44605255126953, 23.628908157348633, 24.811763763427734, 25.994617462158203, 27.177473068237305, 28.360328674316406, 29.543182373046875, 30.726037979125977, 31.908893585205078, 33.09174728393555, 34.274600982666016, 35.45745849609375, 36.64031219482422]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 10.0, 12.0, 17.0, 29.0, 43.0, 70.0, 123.0, 192.0, 336.0, 539.0, 974.0, 1611.0, 3048.0, 5743.0, 11357.0, 24078.0, 55567.0, 151950.0, 622408.0, 2808002.0, 330098.0, 100825.0, 39869.0, 17701.0, 8830.0, 4530.0, 2540.0, 1410.0, 897.0, 520.0, 333.0, 201.0, 137.0, 76.0, 80.0, 26.0, 25.0, 20.0, 17.0, 12.0, 9.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.26953125, -5.07659912109375, -4.8836669921875, -4.69073486328125, -4.497802734375, -4.30487060546875, -4.1119384765625, -3.91900634765625, -3.72607421875, -3.53314208984375, -3.3402099609375, -3.14727783203125, -2.954345703125, -2.76141357421875, -2.5684814453125, -2.37554931640625, -2.1826171875, -1.98968505859375, -1.7967529296875, -1.60382080078125, -1.410888671875, -1.21795654296875, -1.0250244140625, -0.83209228515625, -0.63916015625, -0.44622802734375, -0.2532958984375, -0.06036376953125, 0.132568359375, 0.32550048828125, 0.5184326171875, 0.71136474609375, 0.904296875, 1.09722900390625, 1.2901611328125, 1.48309326171875, 1.676025390625, 1.86895751953125, 2.0618896484375, 2.25482177734375, 2.44775390625, 2.64068603515625, 2.8336181640625, 3.02655029296875, 3.219482421875, 3.41241455078125, 3.6053466796875, 3.79827880859375, 3.9912109375, 4.18414306640625, 4.3770751953125, 4.57000732421875, 4.762939453125, 4.95587158203125, 5.1488037109375, 5.34173583984375, 5.53466796875, 5.72760009765625, 5.9205322265625, 6.11346435546875, 6.306396484375, 6.49932861328125, 6.6922607421875, 6.88519287109375, 7.078125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 5.0, 5.0, 7.0, 6.0, 10.0, 18.0, 18.0, 17.0, 21.0, 20.0, 29.0, 28.0, 45.0, 41.0, 45.0, 37.0, 48.0, 38.0, 47.0, 51.0, 48.0, 36.0, 46.0, 48.0, 34.0, 35.0, 36.0, 35.0, 21.0, 20.0, 16.0, 14.0, 14.0, 9.0, 16.0, 6.0, 6.0, 8.0, 7.0, 4.0, 6.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.134765625, -1.0934600830078125, -1.052154541015625, -1.0108489990234375, -0.96954345703125, -0.9282379150390625, -0.886932373046875, -0.8456268310546875, -0.8043212890625, -0.7630157470703125, -0.721710205078125, -0.6804046630859375, -0.63909912109375, -0.5977935791015625, -0.556488037109375, -0.5151824951171875, -0.473876953125, -0.4325714111328125, -0.391265869140625, -0.3499603271484375, -0.30865478515625, -0.2673492431640625, -0.226043701171875, -0.1847381591796875, -0.1434326171875, -0.1021270751953125, -0.060821533203125, -0.0195159912109375, 0.02178955078125, 0.0630950927734375, 0.104400634765625, 0.1457061767578125, 0.18701171875, 0.2283172607421875, 0.269622802734375, 0.3109283447265625, 0.35223388671875, 0.3935394287109375, 0.434844970703125, 0.4761505126953125, 0.5174560546875, 0.5587615966796875, 0.600067138671875, 0.6413726806640625, 0.68267822265625, 0.7239837646484375, 0.765289306640625, 0.8065948486328125, 0.847900390625, 0.8892059326171875, 0.930511474609375, 0.9718170166015625, 1.01312255859375, 1.0544281005859375, 1.095733642578125, 1.1370391845703125, 1.1783447265625, 1.2196502685546875, 1.260955810546875, 1.3022613525390625, 1.34356689453125, 1.3848724365234375, 1.426177978515625, 1.4674835205078125, 1.5087890625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 10.0, 10.0, 24.0, 46.0, 112.0, 245.0, 618.0, 1886.0, 8227.0, 59415.0, 1211965.0, 2809844.0, 87104.0, 11205.0, 2349.0, 719.0, 281.0, 103.0, 54.0, 27.0, 10.0, 10.0, 9.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.3359375, -14.8260498046875, -14.316162109375, -13.8062744140625, -13.29638671875, -12.7864990234375, -12.276611328125, -11.7667236328125, -11.2568359375, -10.7469482421875, -10.237060546875, -9.7271728515625, -9.21728515625, -8.7073974609375, -8.197509765625, -7.6876220703125, -7.177734375, -6.6678466796875, -6.157958984375, -5.6480712890625, -5.13818359375, -4.6282958984375, -4.118408203125, -3.6085205078125, -3.0986328125, -2.5887451171875, -2.078857421875, -1.5689697265625, -1.05908203125, -0.5491943359375, -0.039306640625, 0.4705810546875, 0.98046875, 1.4903564453125, 2.000244140625, 2.5101318359375, 3.02001953125, 3.5299072265625, 4.039794921875, 4.5496826171875, 5.0595703125, 5.5694580078125, 6.079345703125, 6.5892333984375, 7.09912109375, 7.6090087890625, 8.118896484375, 8.6287841796875, 9.138671875, 9.6485595703125, 10.158447265625, 10.6683349609375, 11.17822265625, 11.6881103515625, 12.197998046875, 12.7078857421875, 13.2177734375, 13.7276611328125, 14.237548828125, 14.7474365234375, 15.25732421875, 15.7672119140625, 16.277099609375, 16.7869873046875, 17.296875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 9.0, 14.0, 12.0, 25.0, 30.0, 49.0, 77.0, 76.0, 165.0, 249.0, 520.0, 1234.0, 678.0, 327.0, 206.0, 113.0, 80.0, 56.0, 52.0, 24.0, 13.0, 15.0, 13.0, 13.0, 4.0, 3.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.28125, -4.154083251953125, -4.02691650390625, -3.899749755859375, -3.7725830078125, -3.645416259765625, -3.51824951171875, -3.391082763671875, -3.263916015625, -3.136749267578125, -3.00958251953125, -2.882415771484375, -2.7552490234375, -2.628082275390625, -2.50091552734375, -2.373748779296875, -2.24658203125, -2.119415283203125, -1.99224853515625, -1.865081787109375, -1.7379150390625, -1.610748291015625, -1.48358154296875, -1.356414794921875, -1.229248046875, -1.102081298828125, -0.97491455078125, -0.847747802734375, -0.7205810546875, -0.593414306640625, -0.46624755859375, -0.339080810546875, -0.2119140625, -0.084747314453125, 0.04241943359375, 0.169586181640625, 0.2967529296875, 0.423919677734375, 0.55108642578125, 0.678253173828125, 0.805419921875, 0.932586669921875, 1.05975341796875, 1.186920166015625, 1.3140869140625, 1.441253662109375, 1.56842041015625, 1.695587158203125, 1.82275390625, 1.949920654296875, 2.07708740234375, 2.204254150390625, 2.3314208984375, 2.458587646484375, 2.58575439453125, 2.712921142578125, 2.840087890625, 2.967254638671875, 3.09442138671875, 3.221588134765625, 3.3487548828125, 3.475921630859375, 3.60308837890625, 3.730255126953125, 3.857421875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 10.0, 21.0, 33.0, 85.0, 116.0, 191.0, 174.0, 153.0, 93.0, 57.0, 25.0, 20.0, 10.0, 6.0, 6.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.30530548095703, -33.95218276977539, -32.59906005859375, -31.245933532714844, -29.892810821533203, -28.539688110351562, -27.18656349182129, -25.833438873291016, -24.480316162109375, -23.127193450927734, -21.77406883239746, -20.420944213867188, -19.067821502685547, -17.714698791503906, -16.361574172973633, -15.008450508117676, -13.655326843261719, -12.302203178405762, -10.949079513549805, -9.595955848693848, -8.24283218383789, -6.889708518981934, -5.536584854125977, -4.1834611892700195, -2.8303375244140625, -1.4772138595581055, -0.12409019470214844, 1.2290334701538086, 2.5821571350097656, 3.9352807998657227, 5.28840446472168, 6.641528129577637, 7.994647979736328, 9.347771644592285, 10.700895309448242, 12.0540189743042, 13.407142639160156, 14.760266304016113, 16.11338996887207, 17.466514587402344, 18.819637298583984, 20.172760009765625, 21.5258846282959, 22.879009246826172, 24.232131958007812, 25.585254669189453, 26.938379287719727, 28.29150390625, 29.64462661743164, 30.99774932861328, 32.35087585449219, 33.70399856567383, 35.05712127685547, 36.41024398803711, 37.76336669921875, 39.116493225097656, 40.4696159362793, 41.82273864746094, 43.175865173339844, 44.528987884521484, 45.882110595703125, 47.235233306884766, 48.588356018066406, 49.94148254394531, 51.29460525512695]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 4.0, 9.0, 15.0, 17.0, 19.0, 19.0, 24.0, 19.0, 20.0, 28.0, 33.0, 30.0, 30.0, 40.0, 47.0, 50.0, 53.0, 45.0, 34.0, 40.0, 40.0, 32.0, 29.0, 41.0, 29.0, 40.0, 28.0, 15.0, 26.0, 17.0, 23.0, 21.0, 17.0, 11.0, 12.0, 9.0, 2.0, 8.0, 2.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-16.75537872314453, -16.304737091064453, -15.854093551635742, -15.403450965881348, -14.952808380126953, -14.502165794372559, -14.051523208618164, -13.600881576538086, -13.150238037109375, -12.69959545135498, -12.248952865600586, -11.798310279846191, -11.347667694091797, -10.897025108337402, -10.446382522583008, -9.99574089050293, -9.545098304748535, -9.09445571899414, -8.643813133239746, -8.193170547485352, -7.742527961730957, -7.2918853759765625, -6.841243267059326, -6.390600681304932, -5.939958095550537, -5.489315509796143, -5.038672924041748, -4.588030815124512, -4.137388229370117, -3.6867454051971436, -3.236103057861328, -2.7854604721069336, -2.334817886352539, -1.8841753005981445, -1.4335328340530396, -0.9828903675079346, -0.53224778175354, -0.08160519599914551, 0.3690371513366699, 0.8196797370910645, 1.270322322845459, 1.7209649085998535, 2.171607494354248, 2.6222498416900635, 3.072892427444458, 3.5235350131988525, 3.974177360534668, 4.4248199462890625, 4.875462532043457, 5.326105117797852, 5.776747703552246, 6.227390289306641, 6.678032875061035, 7.12867546081543, 7.579317569732666, 8.029960632324219, 8.480602264404297, 8.931244850158691, 9.381887435913086, 9.83253002166748, 10.283172607421875, 10.73381519317627, 11.184457778930664, 11.635099411010742, 12.085742950439453]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 9.0, 10.0, 20.0, 19.0, 19.0, 35.0, 54.0, 83.0, 138.0, 207.0, 380.0, 811.0, 1534.0, 3174.0, 6976.0, 15737.0, 35264.0, 80988.0, 193494.0, 368431.0, 194833.0, 81328.0, 35813.0, 15654.0, 7050.0, 3269.0, 1508.0, 750.0, 383.0, 211.0, 125.0, 76.0, 55.0, 34.0, 30.0, 22.0, 12.0, 5.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.28515625, -7.04632568359375, -6.8074951171875, -6.56866455078125, -6.329833984375, -6.09100341796875, -5.8521728515625, -5.61334228515625, -5.37451171875, -5.13568115234375, -4.8968505859375, -4.65802001953125, -4.419189453125, -4.18035888671875, -3.9415283203125, -3.70269775390625, -3.4638671875, -3.22503662109375, -2.9862060546875, -2.74737548828125, -2.508544921875, -2.26971435546875, -2.0308837890625, -1.79205322265625, -1.55322265625, -1.31439208984375, -1.0755615234375, -0.83673095703125, -0.597900390625, -0.35906982421875, -0.1202392578125, 0.11859130859375, 0.357421875, 0.59625244140625, 0.8350830078125, 1.07391357421875, 1.312744140625, 1.55157470703125, 1.7904052734375, 2.02923583984375, 2.26806640625, 2.50689697265625, 2.7457275390625, 2.98455810546875, 3.223388671875, 3.46221923828125, 3.7010498046875, 3.93988037109375, 4.1787109375, 4.41754150390625, 4.6563720703125, 4.89520263671875, 5.134033203125, 5.37286376953125, 5.6116943359375, 5.85052490234375, 6.08935546875, 6.32818603515625, 6.5670166015625, 6.80584716796875, 7.044677734375, 7.28350830078125, 7.5223388671875, 7.76116943359375, 8.0]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 5.0, 7.0, 11.0, 6.0, 7.0, 13.0, 15.0, 20.0, 20.0, 26.0, 28.0, 24.0, 35.0, 35.0, 37.0, 38.0, 55.0, 44.0, 42.0, 48.0, 46.0, 47.0, 36.0, 45.0, 48.0, 40.0, 36.0, 26.0, 25.0, 15.0, 25.0, 23.0, 13.0, 21.0, 16.0, 8.0, 7.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.21484375, -1.172821044921875, -1.13079833984375, -1.088775634765625, -1.0467529296875, -1.004730224609375, -0.96270751953125, -0.920684814453125, -0.878662109375, -0.836639404296875, -0.79461669921875, -0.752593994140625, -0.7105712890625, -0.668548583984375, -0.62652587890625, -0.584503173828125, -0.54248046875, -0.500457763671875, -0.45843505859375, -0.416412353515625, -0.3743896484375, -0.332366943359375, -0.29034423828125, -0.248321533203125, -0.206298828125, -0.164276123046875, -0.12225341796875, -0.080230712890625, -0.0382080078125, 0.003814697265625, 0.04583740234375, 0.087860107421875, 0.1298828125, 0.171905517578125, 0.21392822265625, 0.255950927734375, 0.2979736328125, 0.339996337890625, 0.38201904296875, 0.424041748046875, 0.466064453125, 0.508087158203125, 0.55010986328125, 0.592132568359375, 0.6341552734375, 0.676177978515625, 0.71820068359375, 0.760223388671875, 0.80224609375, 0.844268798828125, 0.88629150390625, 0.928314208984375, 0.9703369140625, 1.012359619140625, 1.05438232421875, 1.096405029296875, 1.138427734375, 1.180450439453125, 1.22247314453125, 1.264495849609375, 1.3065185546875, 1.348541259765625, 1.39056396484375, 1.432586669921875, 1.474609375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 4.0, 3.0, 14.0, 21.0, 25.0, 34.0, 86.0, 121.0, 238.0, 458.0, 1016.0, 2282.0, 6153.0, 21483.0, 99286.0, 505684.0, 328073.0, 61447.0, 14167.0, 4520.0, 1775.0, 771.0, 408.0, 207.0, 105.0, 55.0, 30.0, 26.0, 19.0, 10.0, 10.0, 10.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.796875, -10.4351806640625, -10.073486328125, -9.7117919921875, -9.35009765625, -8.9884033203125, -8.626708984375, -8.2650146484375, -7.9033203125, -7.5416259765625, -7.179931640625, -6.8182373046875, -6.45654296875, -6.0948486328125, -5.733154296875, -5.3714599609375, -5.009765625, -4.6480712890625, -4.286376953125, -3.9246826171875, -3.56298828125, -3.2012939453125, -2.839599609375, -2.4779052734375, -2.1162109375, -1.7545166015625, -1.392822265625, -1.0311279296875, -0.66943359375, -0.3077392578125, 0.053955078125, 0.4156494140625, 0.77734375, 1.1390380859375, 1.500732421875, 1.8624267578125, 2.22412109375, 2.5858154296875, 2.947509765625, 3.3092041015625, 3.6708984375, 4.0325927734375, 4.394287109375, 4.7559814453125, 5.11767578125, 5.4793701171875, 5.841064453125, 6.2027587890625, 6.564453125, 6.9261474609375, 7.287841796875, 7.6495361328125, 8.01123046875, 8.3729248046875, 8.734619140625, 9.0963134765625, 9.4580078125, 9.8197021484375, 10.181396484375, 10.5430908203125, 10.90478515625, 11.2664794921875, 11.628173828125, 11.9898681640625, 12.3515625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 2.0, 6.0, 1.0, 11.0, 9.0, 13.0, 15.0, 21.0, 27.0, 32.0, 31.0, 37.0, 47.0, 43.0, 75.0, 54.0, 53.0, 59.0, 52.0, 51.0, 60.0, 38.0, 54.0, 39.0, 34.0, 24.0, 28.0, 24.0, 12.0, 14.0, 13.0, 3.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.6328125, -8.37347412109375, -8.1141357421875, -7.85479736328125, -7.595458984375, -7.33612060546875, -7.0767822265625, -6.81744384765625, -6.55810546875, -6.29876708984375, -6.0394287109375, -5.78009033203125, -5.520751953125, -5.26141357421875, -5.0020751953125, -4.74273681640625, -4.4833984375, -4.22406005859375, -3.9647216796875, -3.70538330078125, -3.446044921875, -3.18670654296875, -2.9273681640625, -2.66802978515625, -2.40869140625, -2.14935302734375, -1.8900146484375, -1.63067626953125, -1.371337890625, -1.11199951171875, -0.8526611328125, -0.59332275390625, -0.333984375, -0.07464599609375, 0.1846923828125, 0.44403076171875, 0.703369140625, 0.96270751953125, 1.2220458984375, 1.48138427734375, 1.74072265625, 2.00006103515625, 2.2593994140625, 2.51873779296875, 2.778076171875, 3.03741455078125, 3.2967529296875, 3.55609130859375, 3.8154296875, 4.07476806640625, 4.3341064453125, 4.59344482421875, 4.852783203125, 5.11212158203125, 5.3714599609375, 5.63079833984375, 5.89013671875, 6.14947509765625, 6.4088134765625, 6.66815185546875, 6.927490234375, 7.18682861328125, 7.4461669921875, 7.70550537109375, 7.96484375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 9.0, 5.0, 5.0, 7.0, 19.0, 26.0, 60.0, 78.0, 144.0, 250.0, 522.0, 1087.0, 2504.0, 7144.0, 24641.0, 110734.0, 555995.0, 275912.0, 49268.0, 12828.0, 4074.0, 1667.0, 780.0, 340.0, 170.0, 107.0, 68.0, 39.0, 14.0, 20.0, 13.0, 5.0, 7.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.8984375, -6.72039794921875, -6.5423583984375, -6.36431884765625, -6.186279296875, -6.00823974609375, -5.8302001953125, -5.65216064453125, -5.47412109375, -5.29608154296875, -5.1180419921875, -4.94000244140625, -4.761962890625, -4.58392333984375, -4.4058837890625, -4.22784423828125, -4.0498046875, -3.87176513671875, -3.6937255859375, -3.51568603515625, -3.337646484375, -3.15960693359375, -2.9815673828125, -2.80352783203125, -2.62548828125, -2.44744873046875, -2.2694091796875, -2.09136962890625, -1.913330078125, -1.73529052734375, -1.5572509765625, -1.37921142578125, -1.201171875, -1.02313232421875, -0.8450927734375, -0.66705322265625, -0.489013671875, -0.31097412109375, -0.1329345703125, 0.04510498046875, 0.22314453125, 0.40118408203125, 0.5792236328125, 0.75726318359375, 0.935302734375, 1.11334228515625, 1.2913818359375, 1.46942138671875, 1.6474609375, 1.82550048828125, 2.0035400390625, 2.18157958984375, 2.359619140625, 2.53765869140625, 2.7156982421875, 2.89373779296875, 3.07177734375, 3.24981689453125, 3.4278564453125, 3.60589599609375, 3.783935546875, 3.96197509765625, 4.1400146484375, 4.31805419921875, 4.49609375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 2.0, 3.0, 9.0, 5.0, 6.0, 14.0, 14.0, 18.0, 21.0, 35.0, 41.0, 59.0, 66.0, 137.0, 172.0, 128.0, 76.0, 45.0, 27.0, 29.0, 25.0, 21.0, 2.0, 3.0, 7.0, 4.0, 7.0, 5.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010023117065429688, -0.0009722486138343811, -0.0009421855211257935, -0.0009121224284172058, -0.0008820593357086182, -0.0008519962430000305, -0.0008219331502914429, -0.0007918700575828552, -0.0007618069648742676, -0.0007317438721656799, -0.0007016807794570923, -0.0006716176867485046, -0.000641554594039917, -0.0006114915013313293, -0.0005814284086227417, -0.000551365315914154, -0.0005213022232055664, -0.0004912391304969788, -0.0004611760377883911, -0.00043111294507980347, -0.0004010498523712158, -0.0003709867596626282, -0.00034092366695404053, -0.0003108605742454529, -0.00028079748153686523, -0.0002507343888282776, -0.00022067129611968994, -0.0001906082034111023, -0.00016054511070251465, -0.000130482017993927, -0.00010041892528533936, -7.035583257675171e-05, -4.029273986816406e-05, -1.0229647159576416e-05, 1.983344554901123e-05, 4.989653825759888e-05, 7.995963096618652e-05, 0.00011002272367477417, 0.00014008581638336182, 0.00017014890909194946, 0.0002002120018005371, 0.00023027509450912476, 0.0002603381872177124, 0.00029040127992630005, 0.0003204643726348877, 0.00035052746534347534, 0.000380590558052063, 0.00041065365076065063, 0.0004407167434692383, 0.00047077983617782593, 0.0005008429288864136, 0.0005309060215950012, 0.0005609691143035889, 0.0005910322070121765, 0.0006210952997207642, 0.0006511583924293518, 0.0006812214851379395, 0.0007112845778465271, 0.0007413476705551147, 0.0007714107632637024, 0.00080147385597229, 0.0008315369486808777, 0.0008616000413894653, 0.000891663134098053, 0.0009217262268066406]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 1.0, 8.0, 10.0, 9.0, 22.0, 34.0, 38.0, 71.0, 106.0, 172.0, 334.0, 753.0, 1601.0, 3836.0, 10691.0, 35556.0, 167638.0, 592749.0, 179289.0, 37596.0, 10959.0, 3899.0, 1598.0, 715.0, 351.0, 187.0, 102.0, 72.0, 48.0, 29.0, 19.0, 16.0, 10.0, 8.0, 8.0, 5.0, 7.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.671875, -4.508056640625, -4.34423828125, -4.180419921875, -4.0166015625, -3.852783203125, -3.68896484375, -3.525146484375, -3.361328125, -3.197509765625, -3.03369140625, -2.869873046875, -2.7060546875, -2.542236328125, -2.37841796875, -2.214599609375, -2.05078125, -1.886962890625, -1.72314453125, -1.559326171875, -1.3955078125, -1.231689453125, -1.06787109375, -0.904052734375, -0.740234375, -0.576416015625, -0.41259765625, -0.248779296875, -0.0849609375, 0.078857421875, 0.24267578125, 0.406494140625, 0.5703125, 0.734130859375, 0.89794921875, 1.061767578125, 1.2255859375, 1.389404296875, 1.55322265625, 1.717041015625, 1.880859375, 2.044677734375, 2.20849609375, 2.372314453125, 2.5361328125, 2.699951171875, 2.86376953125, 3.027587890625, 3.19140625, 3.355224609375, 3.51904296875, 3.682861328125, 3.8466796875, 4.010498046875, 4.17431640625, 4.338134765625, 4.501953125, 4.665771484375, 4.82958984375, 4.993408203125, 5.1572265625, 5.321044921875, 5.48486328125, 5.648681640625, 5.8125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 14.0, 8.0, 21.0, 11.0, 23.0, 20.0, 46.0, 58.0, 75.0, 97.0, 119.0, 111.0, 103.0, 78.0, 50.0, 34.0, 29.0, 17.0, 23.0, 12.0, 9.0, 5.0, 7.0, 6.0, 4.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.185546875, -3.067169189453125, -2.94879150390625, -2.830413818359375, -2.7120361328125, -2.593658447265625, -2.47528076171875, -2.356903076171875, -2.238525390625, -2.120147705078125, -2.00177001953125, -1.883392333984375, -1.7650146484375, -1.646636962890625, -1.52825927734375, -1.409881591796875, -1.29150390625, -1.173126220703125, -1.05474853515625, -0.936370849609375, -0.8179931640625, -0.699615478515625, -0.58123779296875, -0.462860107421875, -0.344482421875, -0.226104736328125, -0.10772705078125, 0.010650634765625, 0.1290283203125, 0.247406005859375, 0.36578369140625, 0.484161376953125, 0.6025390625, 0.720916748046875, 0.83929443359375, 0.957672119140625, 1.0760498046875, 1.194427490234375, 1.31280517578125, 1.431182861328125, 1.549560546875, 1.667938232421875, 1.78631591796875, 1.904693603515625, 2.0230712890625, 2.141448974609375, 2.25982666015625, 2.378204345703125, 2.49658203125, 2.614959716796875, 2.73333740234375, 2.851715087890625, 2.9700927734375, 3.088470458984375, 3.20684814453125, 3.325225830078125, 3.443603515625, 3.561981201171875, 3.68035888671875, 3.798736572265625, 3.9171142578125, 4.035491943359375, 4.15386962890625, 4.272247314453125, 4.390625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 7.0, 11.0, 21.0, 41.0, 73.0, 110.0, 147.0, 160.0, 135.0, 121.0, 81.0, 41.0, 32.0, 13.0, 8.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.34989929199219, -105.73538970947266, -103.1208724975586, -100.50636291503906, -97.891845703125, -95.27733612060547, -92.6628189086914, -90.04830932617188, -87.43379211425781, -84.81928253173828, -82.20476531982422, -79.59025573730469, -76.97573852539062, -74.3612289428711, -71.74671173095703, -69.1322021484375, -66.51768493652344, -63.90317153930664, -61.288658142089844, -58.67414474487305, -56.05963134765625, -53.44511795043945, -50.830604553222656, -48.216094970703125, -45.601585388183594, -42.9870719909668, -40.37255859375, -37.7580451965332, -35.143531799316406, -32.52901840209961, -29.914506912231445, -27.29999351501465, -24.68547821044922, -22.070964813232422, -19.456451416015625, -16.841938018798828, -14.227425575256348, -11.61291217803955, -8.99839973449707, -6.383886337280273, -3.7693729400634766, -1.1548597812652588, 1.459653377532959, 4.074166297912598, 6.6886796951293945, 9.303193092346191, 11.917705535888672, 14.532218933105469, 17.146732330322266, 19.761245727539062, 22.37575912475586, 24.990272521972656, 27.604785919189453, 30.21929931640625, 32.83380889892578, 35.448326110839844, 38.062835693359375, 40.67734909057617, 43.29186248779297, 45.906375885009766, 48.52088928222656, 51.13540267944336, 53.749916076660156, 56.36442565917969, 58.97894287109375]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 4.0, 3.0, 10.0, 10.0, 13.0, 15.0, 20.0, 21.0, 32.0, 28.0, 37.0, 37.0, 43.0, 63.0, 49.0, 61.0, 50.0, 57.0, 59.0, 46.0, 54.0, 46.0, 47.0, 42.0, 28.0, 18.0, 26.0, 17.0, 10.0, 14.0, 10.0, 10.0, 9.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-48.27924346923828, -46.84874725341797, -45.41824722290039, -43.98775100708008, -42.557254791259766, -41.12675476074219, -39.696258544921875, -38.26576232910156, -36.835262298583984, -35.40476608276367, -33.974266052246094, -32.54376983642578, -31.113271713256836, -29.68277359008789, -28.252277374267578, -26.821779251098633, -25.39128303527832, -23.960784912109375, -22.530288696289062, -21.099790573120117, -19.669292449951172, -18.23879623413086, -16.808298110961914, -15.377799987792969, -13.94730281829834, -12.516805648803711, -11.086307525634766, -9.655810356140137, -8.225313186645508, -6.7948150634765625, -5.364317893981934, -3.9338197708129883, -2.5033226013183594, -1.0728250741958618, 0.35767245292663574, 1.7881698608398438, 3.218667507171631, 4.649165153503418, 6.079662322998047, 7.510160446166992, 8.940657615661621, 10.37115478515625, 11.801652908325195, 13.232150077819824, 14.662647247314453, 16.0931453704834, 17.523643493652344, 18.954139709472656, 20.3846378326416, 21.815135955810547, 23.24563217163086, 24.676130294799805, 26.10662841796875, 27.537124633789062, 28.967622756958008, 30.398120880126953, 31.828617095947266, 33.25911331176758, 34.689613342285156, 36.12010955810547, 37.55060577392578, 38.98110580444336, 40.41160202026367, 41.84210205078125, 43.27259826660156]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 8.0, 11.0, 21.0, 38.0, 43.0, 67.0, 111.0, 179.0, 249.0, 388.0, 705.0, 1239.0, 2246.0, 4343.0, 8653.0, 19240.0, 48508.0, 157743.0, 1592288.0, 2106501.0, 164387.0, 48944.0, 19576.0, 8724.0, 4289.0, 2402.0, 1311.0, 787.0, 467.0, 262.0, 187.0, 113.0, 67.0, 49.0, 35.0, 38.0, 14.0, 13.0, 10.0, 9.0, 6.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.66015625, -5.43389892578125, -5.2076416015625, -4.98138427734375, -4.755126953125, -4.52886962890625, -4.3026123046875, -4.07635498046875, -3.85009765625, -3.62384033203125, -3.3975830078125, -3.17132568359375, -2.945068359375, -2.71881103515625, -2.4925537109375, -2.26629638671875, -2.0400390625, -1.81378173828125, -1.5875244140625, -1.36126708984375, -1.135009765625, -0.90875244140625, -0.6824951171875, -0.45623779296875, -0.22998046875, -0.00372314453125, 0.2225341796875, 0.44879150390625, 0.675048828125, 0.90130615234375, 1.1275634765625, 1.35382080078125, 1.580078125, 1.80633544921875, 2.0325927734375, 2.25885009765625, 2.485107421875, 2.71136474609375, 2.9376220703125, 3.16387939453125, 3.39013671875, 3.61639404296875, 3.8426513671875, 4.06890869140625, 4.295166015625, 4.52142333984375, 4.7476806640625, 4.97393798828125, 5.2001953125, 5.42645263671875, 5.6527099609375, 5.87896728515625, 6.105224609375, 6.33148193359375, 6.5577392578125, 6.78399658203125, 7.01025390625, 7.23651123046875, 7.4627685546875, 7.68902587890625, 7.915283203125, 8.14154052734375, 8.3677978515625, 8.59405517578125, 8.8203125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 4.0, 4.0, 5.0, 12.0, 8.0, 17.0, 21.0, 26.0, 21.0, 32.0, 35.0, 28.0, 50.0, 44.0, 60.0, 63.0, 56.0, 54.0, 48.0, 52.0, 46.0, 47.0, 46.0, 28.0, 32.0, 26.0, 20.0, 35.0, 26.0, 20.0, 11.0, 14.0, 7.0, 0.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.458984375, -1.404083251953125, -1.34918212890625, -1.294281005859375, -1.2393798828125, -1.184478759765625, -1.12957763671875, -1.074676513671875, -1.019775390625, -0.964874267578125, -0.90997314453125, -0.855072021484375, -0.8001708984375, -0.745269775390625, -0.69036865234375, -0.635467529296875, -0.58056640625, -0.525665283203125, -0.47076416015625, -0.415863037109375, -0.3609619140625, -0.306060791015625, -0.25115966796875, -0.196258544921875, -0.141357421875, -0.086456298828125, -0.03155517578125, 0.023345947265625, 0.0782470703125, 0.133148193359375, 0.18804931640625, 0.242950439453125, 0.2978515625, 0.352752685546875, 0.40765380859375, 0.462554931640625, 0.5174560546875, 0.572357177734375, 0.62725830078125, 0.682159423828125, 0.737060546875, 0.791961669921875, 0.84686279296875, 0.901763916015625, 0.9566650390625, 1.011566162109375, 1.06646728515625, 1.121368408203125, 1.17626953125, 1.231170654296875, 1.28607177734375, 1.340972900390625, 1.3958740234375, 1.450775146484375, 1.50567626953125, 1.560577392578125, 1.615478515625, 1.670379638671875, 1.72528076171875, 1.780181884765625, 1.8350830078125, 1.889984130859375, 1.94488525390625, 1.999786376953125, 2.0546875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 7.0, 4.0, 9.0, 10.0, 25.0, 37.0, 98.0, 173.0, 291.0, 569.0, 1308.0, 2585.0, 6312.0, 15723.0, 44806.0, 164765.0, 1304741.0, 2360634.0, 208669.0, 52652.0, 18183.0, 6980.0, 2988.0, 1332.0, 643.0, 341.0, 178.0, 91.0, 45.0, 30.0, 16.0, 16.0, 11.0, 4.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.75, -9.479736328125, -9.20947265625, -8.939208984375, -8.6689453125, -8.398681640625, -8.12841796875, -7.858154296875, -7.587890625, -7.317626953125, -7.04736328125, -6.777099609375, -6.5068359375, -6.236572265625, -5.96630859375, -5.696044921875, -5.42578125, -5.155517578125, -4.88525390625, -4.614990234375, -4.3447265625, -4.074462890625, -3.80419921875, -3.533935546875, -3.263671875, -2.993408203125, -2.72314453125, -2.452880859375, -2.1826171875, -1.912353515625, -1.64208984375, -1.371826171875, -1.1015625, -0.831298828125, -0.56103515625, -0.290771484375, -0.0205078125, 0.249755859375, 0.52001953125, 0.790283203125, 1.060546875, 1.330810546875, 1.60107421875, 1.871337890625, 2.1416015625, 2.411865234375, 2.68212890625, 2.952392578125, 3.22265625, 3.492919921875, 3.76318359375, 4.033447265625, 4.3037109375, 4.573974609375, 4.84423828125, 5.114501953125, 5.384765625, 5.655029296875, 5.92529296875, 6.195556640625, 6.4658203125, 6.736083984375, 7.00634765625, 7.276611328125, 7.546875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 7.0, 7.0, 11.0, 11.0, 14.0, 10.0, 17.0, 19.0, 39.0, 42.0, 49.0, 79.0, 110.0, 184.0, 305.0, 520.0, 1150.0, 586.0, 298.0, 196.0, 113.0, 79.0, 49.0, 39.0, 28.0, 28.0, 14.0, 12.0, 11.0, 8.0, 13.0, 7.0, 4.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.775390625, -2.68133544921875, -2.5872802734375, -2.49322509765625, -2.399169921875, -2.30511474609375, -2.2110595703125, -2.11700439453125, -2.02294921875, -1.92889404296875, -1.8348388671875, -1.74078369140625, -1.646728515625, -1.55267333984375, -1.4586181640625, -1.36456298828125, -1.2705078125, -1.17645263671875, -1.0823974609375, -0.98834228515625, -0.894287109375, -0.80023193359375, -0.7061767578125, -0.61212158203125, -0.51806640625, -0.42401123046875, -0.3299560546875, -0.23590087890625, -0.141845703125, -0.04779052734375, 0.0462646484375, 0.14031982421875, 0.234375, 0.32843017578125, 0.4224853515625, 0.51654052734375, 0.610595703125, 0.70465087890625, 0.7987060546875, 0.89276123046875, 0.98681640625, 1.08087158203125, 1.1749267578125, 1.26898193359375, 1.363037109375, 1.45709228515625, 1.5511474609375, 1.64520263671875, 1.7392578125, 1.83331298828125, 1.9273681640625, 2.02142333984375, 2.115478515625, 2.20953369140625, 2.3035888671875, 2.39764404296875, 2.49169921875, 2.58575439453125, 2.6798095703125, 2.77386474609375, 2.867919921875, 2.96197509765625, 3.0560302734375, 3.15008544921875, 3.244140625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 8.0, 4.0, 11.0, 10.0, 18.0, 23.0, 35.0, 63.0, 58.0, 97.0, 84.0, 97.0, 99.0, 98.0, 64.0, 75.0, 49.0, 39.0, 34.0, 13.0, 5.0, 5.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0], "bins": [-28.677001953125, -28.05024528503418, -27.42348861694336, -26.79673194885254, -26.16997528076172, -25.543216705322266, -24.916460037231445, -24.289703369140625, -23.662946701049805, -23.036190032958984, -22.409433364868164, -21.782676696777344, -21.15591812133789, -20.52916145324707, -19.90240478515625, -19.27564811706543, -18.64889144897461, -18.02213478088379, -17.39537811279297, -16.76862144470215, -16.141864776611328, -15.515107154846191, -14.888349533081055, -14.261592864990234, -13.634836196899414, -13.008079528808594, -12.381322860717773, -11.754565238952637, -11.127808570861816, -10.501051902770996, -9.87429428100586, -9.247537612915039, -8.620780944824219, -7.994024276733398, -7.36726713180542, -6.740509986877441, -6.113753318786621, -5.486996650695801, -4.860239505767822, -4.233482360839844, -3.6067256927490234, -2.979968786239624, -2.3532118797302246, -1.7264549732208252, -1.0996980667114258, -0.47294116020202637, 0.15381574630737305, 0.7805728912353516, 1.4073295593261719, 2.0340864658355713, 2.6608433723449707, 3.28760027885437, 3.9143571853637695, 4.54111385345459, 5.167870998382568, 5.794628143310547, 6.421384811401367, 7.0481414794921875, 7.674898624420166, 8.301655769348145, 8.928412437438965, 9.555169105529785, 10.181926727294922, 10.808683395385742, 11.435440063476562]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 9.0, 4.0, 5.0, 8.0, 9.0, 12.0, 12.0, 17.0, 19.0, 19.0, 26.0, 30.0, 35.0, 16.0, 40.0, 35.0, 40.0, 27.0, 54.0, 39.0, 47.0, 34.0, 47.0, 36.0, 24.0, 44.0, 33.0, 30.0, 30.0, 37.0, 23.0, 14.0, 24.0, 17.0, 19.0, 15.0, 6.0, 9.0, 15.0, 7.0, 7.0, 6.0, 5.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.984840393066406, -9.645853042602539, -9.306865692138672, -8.967878341674805, -8.628890991210938, -8.289902687072754, -7.950915336608887, -7.6119279861450195, -7.272940635681152, -6.933953285217285, -6.594965934753418, -6.255978107452393, -5.916990756988525, -5.578003406524658, -5.239015579223633, -4.900028228759766, -4.561040878295898, -4.222053527832031, -3.883065938949585, -3.5440783500671387, -3.2050909996032715, -2.8661036491394043, -2.527116060256958, -2.1881284713745117, -1.8491411209106445, -1.5101536512374878, -1.171166181564331, -0.8321787118911743, -0.4931912422180176, -0.15420377254486084, 0.1847836971282959, 0.5237712860107422, 0.862757682800293, 1.2017451524734497, 1.5407326221466064, 1.8797200918197632, 2.21870756149292, 2.557694911956787, 2.8966825008392334, 3.2356700897216797, 3.574657440185547, 3.913644790649414, 4.252632141113281, 4.591619968414307, 4.930607318878174, 5.269594669342041, 5.608582496643066, 5.947569847106934, 6.286557197570801, 6.625544548034668, 6.964531898498535, 7.3035197257995605, 7.642507076263428, 7.981494426727295, 8.32048225402832, 8.659469604492188, 8.998456954956055, 9.337444305419922, 9.676431655883789, 10.015419006347656, 10.354406356811523, 10.693394660949707, 11.032382011413574, 11.371369361877441, 11.710356712341309]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 8.0, 11.0, 17.0, 25.0, 40.0, 61.0, 94.0, 151.0, 289.0, 529.0, 1379.0, 2987.0, 7456.0, 19041.0, 50040.0, 127977.0, 315717.0, 314196.0, 126882.0, 49454.0, 19197.0, 7369.0, 3029.0, 1292.0, 627.0, 301.0, 165.0, 83.0, 40.0, 40.0, 20.0, 17.0, 11.0, 4.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.921875, -10.6488037109375, -10.375732421875, -10.1026611328125, -9.82958984375, -9.5565185546875, -9.283447265625, -9.0103759765625, -8.7373046875, -8.4642333984375, -8.191162109375, -7.9180908203125, -7.64501953125, -7.3719482421875, -7.098876953125, -6.8258056640625, -6.552734375, -6.2796630859375, -6.006591796875, -5.7335205078125, -5.46044921875, -5.1873779296875, -4.914306640625, -4.6412353515625, -4.3681640625, -4.0950927734375, -3.822021484375, -3.5489501953125, -3.27587890625, -3.0028076171875, -2.729736328125, -2.4566650390625, -2.18359375, -1.9105224609375, -1.637451171875, -1.3643798828125, -1.09130859375, -0.8182373046875, -0.545166015625, -0.2720947265625, 0.0009765625, 0.2740478515625, 0.547119140625, 0.8201904296875, 1.09326171875, 1.3663330078125, 1.639404296875, 1.9124755859375, 2.185546875, 2.4586181640625, 2.731689453125, 3.0047607421875, 3.27783203125, 3.5509033203125, 3.823974609375, 4.0970458984375, 4.3701171875, 4.6431884765625, 4.916259765625, 5.1893310546875, 5.46240234375, 5.7354736328125, 6.008544921875, 6.2816162109375, 6.5546875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 4.0, 7.0, 9.0, 11.0, 17.0, 13.0, 25.0, 17.0, 20.0, 26.0, 32.0, 34.0, 42.0, 50.0, 47.0, 53.0, 60.0, 55.0, 46.0, 54.0, 53.0, 40.0, 27.0, 39.0, 23.0, 37.0, 31.0, 25.0, 24.0, 19.0, 18.0, 14.0, 11.0, 10.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3271484375, -1.2739715576171875, -1.220794677734375, -1.1676177978515625, -1.11444091796875, -1.0612640380859375, -1.008087158203125, -0.9549102783203125, -0.9017333984375, -0.8485565185546875, -0.795379638671875, -0.7422027587890625, -0.68902587890625, -0.6358489990234375, -0.582672119140625, -0.5294952392578125, -0.476318359375, -0.4231414794921875, -0.369964599609375, -0.3167877197265625, -0.26361083984375, -0.2104339599609375, -0.157257080078125, -0.1040802001953125, -0.0509033203125, 0.0022735595703125, 0.055450439453125, 0.1086273193359375, 0.16180419921875, 0.2149810791015625, 0.268157958984375, 0.3213348388671875, 0.37451171875, 0.4276885986328125, 0.480865478515625, 0.5340423583984375, 0.58721923828125, 0.6403961181640625, 0.693572998046875, 0.7467498779296875, 0.7999267578125, 0.8531036376953125, 0.906280517578125, 0.9594573974609375, 1.01263427734375, 1.0658111572265625, 1.118988037109375, 1.1721649169921875, 1.225341796875, 1.2785186767578125, 1.331695556640625, 1.3848724365234375, 1.43804931640625, 1.4912261962890625, 1.544403076171875, 1.5975799560546875, 1.6507568359375, 1.7039337158203125, 1.757110595703125, 1.8102874755859375, 1.86346435546875, 1.9166412353515625, 1.969818115234375, 2.0229949951171875, 2.076171875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 3.0, 2.0, 7.0, 8.0, 7.0, 16.0, 24.0, 22.0, 26.0, 36.0, 59.0, 71.0, 87.0, 140.0, 220.0, 321.0, 593.0, 1094.0, 2215.0, 5737.0, 17430.0, 58107.0, 198446.0, 474818.0, 201725.0, 58453.0, 17824.0, 5902.0, 2367.0, 1078.0, 600.0, 344.0, 243.0, 153.0, 112.0, 80.0, 51.0, 45.0, 23.0, 24.0, 12.0, 13.0, 10.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.21875, -7.9493408203125, -7.679931640625, -7.4105224609375, -7.14111328125, -6.8717041015625, -6.602294921875, -6.3328857421875, -6.0634765625, -5.7940673828125, -5.524658203125, -5.2552490234375, -4.98583984375, -4.7164306640625, -4.447021484375, -4.1776123046875, -3.908203125, -3.6387939453125, -3.369384765625, -3.0999755859375, -2.83056640625, -2.5611572265625, -2.291748046875, -2.0223388671875, -1.7529296875, -1.4835205078125, -1.214111328125, -0.9447021484375, -0.67529296875, -0.4058837890625, -0.136474609375, 0.1329345703125, 0.40234375, 0.6717529296875, 0.941162109375, 1.2105712890625, 1.47998046875, 1.7493896484375, 2.018798828125, 2.2882080078125, 2.5576171875, 2.8270263671875, 3.096435546875, 3.3658447265625, 3.63525390625, 3.9046630859375, 4.174072265625, 4.4434814453125, 4.712890625, 4.9822998046875, 5.251708984375, 5.5211181640625, 5.79052734375, 6.0599365234375, 6.329345703125, 6.5987548828125, 6.8681640625, 7.1375732421875, 7.406982421875, 7.6763916015625, 7.94580078125, 8.2152099609375, 8.484619140625, 8.7540283203125, 9.0234375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 1.0, 6.0, 6.0, 7.0, 12.0, 16.0, 15.0, 18.0, 12.0, 17.0, 27.0, 32.0, 35.0, 46.0, 49.0, 44.0, 59.0, 49.0, 46.0, 57.0, 56.0, 46.0, 38.0, 47.0, 37.0, 26.0, 34.0, 32.0, 21.0, 23.0, 13.0, 21.0, 11.0, 6.0, 8.0, 4.0, 11.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-8.796875, -8.563720703125, -8.33056640625, -8.097412109375, -7.8642578125, -7.631103515625, -7.39794921875, -7.164794921875, -6.931640625, -6.698486328125, -6.46533203125, -6.232177734375, -5.9990234375, -5.765869140625, -5.53271484375, -5.299560546875, -5.06640625, -4.833251953125, -4.60009765625, -4.366943359375, -4.1337890625, -3.900634765625, -3.66748046875, -3.434326171875, -3.201171875, -2.968017578125, -2.73486328125, -2.501708984375, -2.2685546875, -2.035400390625, -1.80224609375, -1.569091796875, -1.3359375, -1.102783203125, -0.86962890625, -0.636474609375, -0.4033203125, -0.170166015625, 0.06298828125, 0.296142578125, 0.529296875, 0.762451171875, 0.99560546875, 1.228759765625, 1.4619140625, 1.695068359375, 1.92822265625, 2.161376953125, 2.39453125, 2.627685546875, 2.86083984375, 3.093994140625, 3.3271484375, 3.560302734375, 3.79345703125, 4.026611328125, 4.259765625, 4.492919921875, 4.72607421875, 4.959228515625, 5.1923828125, 5.425537109375, 5.65869140625, 5.891845703125, 6.125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 4.0, 17.0, 14.0, 23.0, 33.0, 72.0, 87.0, 178.0, 360.0, 623.0, 1303.0, 2732.0, 6377.0, 16420.0, 49717.0, 202954.0, 526759.0, 171600.0, 43706.0, 14775.0, 5671.0, 2530.0, 1200.0, 592.0, 341.0, 193.0, 99.0, 72.0, 39.0, 19.0, 14.0, 13.0, 8.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.28515625, -6.1297607421875, -5.974365234375, -5.8189697265625, -5.66357421875, -5.5081787109375, -5.352783203125, -5.1973876953125, -5.0419921875, -4.8865966796875, -4.731201171875, -4.5758056640625, -4.42041015625, -4.2650146484375, -4.109619140625, -3.9542236328125, -3.798828125, -3.6434326171875, -3.488037109375, -3.3326416015625, -3.17724609375, -3.0218505859375, -2.866455078125, -2.7110595703125, -2.5556640625, -2.4002685546875, -2.244873046875, -2.0894775390625, -1.93408203125, -1.7786865234375, -1.623291015625, -1.4678955078125, -1.3125, -1.1571044921875, -1.001708984375, -0.8463134765625, -0.69091796875, -0.5355224609375, -0.380126953125, -0.2247314453125, -0.0693359375, 0.0860595703125, 0.241455078125, 0.3968505859375, 0.55224609375, 0.7076416015625, 0.863037109375, 1.0184326171875, 1.173828125, 1.3292236328125, 1.484619140625, 1.6400146484375, 1.79541015625, 1.9508056640625, 2.106201171875, 2.2615966796875, 2.4169921875, 2.5723876953125, 2.727783203125, 2.8831787109375, 3.03857421875, 3.1939697265625, 3.349365234375, 3.5047607421875, 3.66015625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 5.0, 4.0, 8.0, 8.0, 10.0, 9.0, 15.0, 18.0, 24.0, 19.0, 34.0, 41.0, 51.0, 69.0, 128.0, 157.0, 117.0, 75.0, 46.0, 32.0, 23.0, 21.0, 8.0, 17.0, 9.0, 7.0, 6.0, 6.0, 8.0, 0.0, 5.0, 5.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0011749267578125, -0.0011407583951950073, -0.0011065900325775146, -0.001072421669960022, -0.0010382533073425293, -0.0010040849447250366, -0.0009699165821075439, -0.0009357482194900513, -0.0009015798568725586, -0.0008674114942550659, -0.0008332431316375732, -0.0007990747690200806, -0.0007649064064025879, -0.0007307380437850952, -0.0006965696811676025, -0.0006624013185501099, -0.0006282329559326172, -0.0005940645933151245, -0.0005598962306976318, -0.0005257278680801392, -0.0004915595054626465, -0.0004573911428451538, -0.00042322278022766113, -0.00038905441761016846, -0.0003548860549926758, -0.0003207176923751831, -0.00028654932975769043, -0.00025238096714019775, -0.00021821260452270508, -0.0001840442419052124, -0.00014987587928771973, -0.00011570751667022705, -8.153915405273438e-05, -4.73707914352417e-05, -1.3202428817749023e-05, 2.0965933799743652e-05, 5.513429641723633e-05, 8.9302659034729e-05, 0.00012347102165222168, 0.00015763938426971436, 0.00019180774688720703, 0.0002259761095046997, 0.0002601444721221924, 0.00029431283473968506, 0.00032848119735717773, 0.0003626495599746704, 0.0003968179225921631, 0.00043098628520965576, 0.00046515464782714844, 0.0004993230104446411, 0.0005334913730621338, 0.0005676597356796265, 0.0006018280982971191, 0.0006359964609146118, 0.0006701648235321045, 0.0007043331861495972, 0.0007385015487670898, 0.0007726699113845825, 0.0008068382740020752, 0.0008410066366195679, 0.0008751749992370605, 0.0009093433618545532, 0.0009435117244720459, 0.0009776800870895386, 0.0010118484497070312]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 7.0, 5.0, 20.0, 15.0, 23.0, 34.0, 52.0, 84.0, 102.0, 200.0, 388.0, 730.0, 1485.0, 3663.0, 9733.0, 30122.0, 130414.0, 577592.0, 226219.0, 45341.0, 13447.0, 4829.0, 1999.0, 896.0, 466.0, 259.0, 133.0, 105.0, 58.0, 42.0, 26.0, 15.0, 12.0, 9.0, 2.0, 10.0, 4.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.33203125, -5.1580810546875, -4.984130859375, -4.8101806640625, -4.63623046875, -4.4622802734375, -4.288330078125, -4.1143798828125, -3.9404296875, -3.7664794921875, -3.592529296875, -3.4185791015625, -3.24462890625, -3.0706787109375, -2.896728515625, -2.7227783203125, -2.548828125, -2.3748779296875, -2.200927734375, -2.0269775390625, -1.85302734375, -1.6790771484375, -1.505126953125, -1.3311767578125, -1.1572265625, -0.9832763671875, -0.809326171875, -0.6353759765625, -0.46142578125, -0.2874755859375, -0.113525390625, 0.0604248046875, 0.234375, 0.4083251953125, 0.582275390625, 0.7562255859375, 0.93017578125, 1.1041259765625, 1.278076171875, 1.4520263671875, 1.6259765625, 1.7999267578125, 1.973876953125, 2.1478271484375, 2.32177734375, 2.4957275390625, 2.669677734375, 2.8436279296875, 3.017578125, 3.1915283203125, 3.365478515625, 3.5394287109375, 3.71337890625, 3.8873291015625, 4.061279296875, 4.2352294921875, 4.4091796875, 4.5831298828125, 4.757080078125, 4.9310302734375, 5.10498046875, 5.2789306640625, 5.452880859375, 5.6268310546875, 5.80078125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 5.0, 3.0, 7.0, 1.0, 7.0, 8.0, 10.0, 12.0, 24.0, 30.0, 32.0, 26.0, 51.0, 80.0, 99.0, 105.0, 98.0, 119.0, 77.0, 63.0, 39.0, 23.0, 24.0, 13.0, 9.0, 6.0, 9.0, 5.0, 5.0, 4.0, 4.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9921875, -3.8541259765625, -3.716064453125, -3.5780029296875, -3.43994140625, -3.3018798828125, -3.163818359375, -3.0257568359375, -2.8876953125, -2.7496337890625, -2.611572265625, -2.4735107421875, -2.33544921875, -2.1973876953125, -2.059326171875, -1.9212646484375, -1.783203125, -1.6451416015625, -1.507080078125, -1.3690185546875, -1.23095703125, -1.0928955078125, -0.954833984375, -0.8167724609375, -0.6787109375, -0.5406494140625, -0.402587890625, -0.2645263671875, -0.12646484375, 0.0115966796875, 0.149658203125, 0.2877197265625, 0.42578125, 0.5638427734375, 0.701904296875, 0.8399658203125, 0.97802734375, 1.1160888671875, 1.254150390625, 1.3922119140625, 1.5302734375, 1.6683349609375, 1.806396484375, 1.9444580078125, 2.08251953125, 2.2205810546875, 2.358642578125, 2.4967041015625, 2.634765625, 2.7728271484375, 2.910888671875, 3.0489501953125, 3.18701171875, 3.3250732421875, 3.463134765625, 3.6011962890625, 3.7392578125, 3.8773193359375, 4.015380859375, 4.1534423828125, 4.29150390625, 4.4295654296875, 4.567626953125, 4.7056884765625, 4.84375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 8.0, 11.0, 20.0, 28.0, 17.0, 25.0, 48.0, 55.0, 65.0, 74.0, 76.0, 68.0, 93.0, 74.0, 64.0, 62.0, 54.0, 39.0, 36.0, 23.0, 15.0, 9.0, 12.0, 1.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.62540054321289, -23.400836944580078, -22.1762752532959, -20.951711654663086, -19.727149963378906, -18.502586364746094, -17.27802276611328, -16.05345916748047, -14.828897476196289, -13.604334831237793, -12.379772186279297, -11.155208587646484, -9.930645942687988, -8.706083297729492, -7.481520175933838, -6.256957054138184, -5.0323944091796875, -3.8078315258026123, -2.583268642425537, -1.358705759048462, -0.13414287567138672, 1.0904197692871094, 2.3149828910827637, 3.539546012878418, 4.764108657836914, 5.98867130279541, 7.2132344245910645, 8.437797546386719, 9.662360191345215, 10.886922836303711, 12.111486434936523, 13.33604907989502, 14.560615539550781, 15.785178184509277, 17.009740829467773, 18.234304428100586, 19.458866119384766, 20.683429718017578, 21.90799331665039, 23.132556915283203, 24.357118606567383, 25.581682205200195, 26.806243896484375, 28.030807495117188, 29.25537109375, 30.47993278503418, 31.704496383666992, 32.92905807495117, 34.153621673583984, 35.3781852722168, 36.60274887084961, 37.827308654785156, 39.05187225341797, 40.27643585205078, 41.500999450683594, 42.725563049316406, 43.95012664794922, 45.17469024658203, 46.399253845214844, 47.62381362915039, 48.8483772277832, 50.072940826416016, 51.29750442504883, 52.52206802368164, 53.74662780761719]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 13.0, 8.0, 12.0, 13.0, 15.0, 18.0, 14.0, 26.0, 27.0, 23.0, 33.0, 34.0, 34.0, 47.0, 46.0, 43.0, 42.0, 50.0, 41.0, 48.0, 45.0, 36.0, 42.0, 37.0, 37.0, 24.0, 28.0, 36.0, 20.0, 21.0, 18.0, 13.0, 8.0, 9.0, 10.0, 9.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.365501403808594, -36.14567184448242, -34.92584228515625, -33.70601272583008, -32.486183166503906, -31.266353607177734, -30.04652214050293, -28.826692581176758, -27.606863021850586, -26.387033462524414, -25.167203903198242, -23.94737434387207, -22.727542877197266, -21.507713317871094, -20.287883758544922, -19.06805419921875, -17.848224639892578, -16.628395080566406, -15.408565521240234, -14.188735008239746, -12.968905448913574, -11.749075889587402, -10.529245376586914, -9.309415817260742, -8.08958625793457, -6.869756698608398, -5.649926662445068, -4.430096626281738, -3.2102670669555664, -1.9904375076293945, -0.7706074714660645, 0.4492225646972656, 1.6690521240234375, 2.8888819217681885, 4.1087117195129395, 5.3285417556762695, 6.548371315002441, 7.768200874328613, 8.988031387329102, 10.207860946655273, 11.427690505981445, 12.647520065307617, 13.867349624633789, 15.087180137634277, 16.307010650634766, 17.526840209960938, 18.74666976928711, 19.96649932861328, 21.186328887939453, 22.406158447265625, 23.625988006591797, 24.84581756591797, 26.06564712524414, 27.285476684570312, 28.505308151245117, 29.72513771057129, 30.94496726989746, 32.164798736572266, 33.38462829589844, 34.60445785522461, 35.82428741455078, 37.04411697387695, 38.263946533203125, 39.4837760925293, 40.70360565185547]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 7.0, 15.0, 25.0, 63.0, 79.0, 118.0, 213.0, 311.0, 587.0, 1072.0, 1848.0, 3470.0, 6979.0, 14302.0, 31934.0, 82796.0, 294303.0, 2813785.0, 714603.0, 139190.0, 47700.0, 20373.0, 9555.0, 4897.0, 2620.0, 1422.0, 758.0, 497.0, 288.0, 166.0, 105.0, 69.0, 45.0, 27.0, 24.0, 13.0, 12.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7578125, -6.54486083984375, -6.3319091796875, -6.11895751953125, -5.906005859375, -5.69305419921875, -5.4801025390625, -5.26715087890625, -5.05419921875, -4.84124755859375, -4.6282958984375, -4.41534423828125, -4.202392578125, -3.98944091796875, -3.7764892578125, -3.56353759765625, -3.3505859375, -3.13763427734375, -2.9246826171875, -2.71173095703125, -2.498779296875, -2.28582763671875, -2.0728759765625, -1.85992431640625, -1.64697265625, -1.43402099609375, -1.2210693359375, -1.00811767578125, -0.795166015625, -0.58221435546875, -0.3692626953125, -0.15631103515625, 0.056640625, 0.26959228515625, 0.4825439453125, 0.69549560546875, 0.908447265625, 1.12139892578125, 1.3343505859375, 1.54730224609375, 1.76025390625, 1.97320556640625, 2.1861572265625, 2.39910888671875, 2.612060546875, 2.82501220703125, 3.0379638671875, 3.25091552734375, 3.4638671875, 3.67681884765625, 3.8897705078125, 4.10272216796875, 4.315673828125, 4.52862548828125, 4.7415771484375, 4.95452880859375, 5.16748046875, 5.38043212890625, 5.5933837890625, 5.80633544921875, 6.019287109375, 6.23223876953125, 6.4451904296875, 6.65814208984375, 6.87109375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 2.0, 5.0, 3.0, 3.0, 10.0, 7.0, 8.0, 21.0, 17.0, 22.0, 21.0, 35.0, 25.0, 39.0, 31.0, 43.0, 38.0, 48.0, 45.0, 53.0, 44.0, 53.0, 52.0, 55.0, 41.0, 44.0, 37.0, 26.0, 24.0, 26.0, 17.0, 30.0, 17.0, 20.0, 15.0, 6.0, 12.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4189453125, -1.365570068359375, -1.31219482421875, -1.258819580078125, -1.2054443359375, -1.152069091796875, -1.09869384765625, -1.045318603515625, -0.991943359375, -0.938568115234375, -0.88519287109375, -0.831817626953125, -0.7784423828125, -0.725067138671875, -0.67169189453125, -0.618316650390625, -0.56494140625, -0.511566162109375, -0.45819091796875, -0.404815673828125, -0.3514404296875, -0.298065185546875, -0.24468994140625, -0.191314697265625, -0.137939453125, -0.084564208984375, -0.03118896484375, 0.022186279296875, 0.0755615234375, 0.128936767578125, 0.18231201171875, 0.235687255859375, 0.2890625, 0.342437744140625, 0.39581298828125, 0.449188232421875, 0.5025634765625, 0.555938720703125, 0.60931396484375, 0.662689208984375, 0.716064453125, 0.769439697265625, 0.82281494140625, 0.876190185546875, 0.9295654296875, 0.982940673828125, 1.03631591796875, 1.089691162109375, 1.14306640625, 1.196441650390625, 1.24981689453125, 1.303192138671875, 1.3565673828125, 1.409942626953125, 1.46331787109375, 1.516693115234375, 1.570068359375, 1.623443603515625, 1.67681884765625, 1.730194091796875, 1.7835693359375, 1.836944580078125, 1.89031982421875, 1.943695068359375, 1.9970703125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 4.0, 8.0, 12.0, 17.0, 26.0, 48.0, 82.0, 158.0, 243.0, 474.0, 879.0, 1782.0, 3759.0, 8326.0, 19933.0, 54659.0, 191341.0, 1198287.0, 2319262.0, 278685.0, 72182.0, 25122.0, 10268.0, 4461.0, 2099.0, 991.0, 527.0, 298.0, 141.0, 100.0, 42.0, 32.0, 19.0, 8.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0546875, -5.813720703125, -5.57275390625, -5.331787109375, -5.0908203125, -4.849853515625, -4.60888671875, -4.367919921875, -4.126953125, -3.885986328125, -3.64501953125, -3.404052734375, -3.1630859375, -2.922119140625, -2.68115234375, -2.440185546875, -2.19921875, -1.958251953125, -1.71728515625, -1.476318359375, -1.2353515625, -0.994384765625, -0.75341796875, -0.512451171875, -0.271484375, -0.030517578125, 0.21044921875, 0.451416015625, 0.6923828125, 0.933349609375, 1.17431640625, 1.415283203125, 1.65625, 1.897216796875, 2.13818359375, 2.379150390625, 2.6201171875, 2.861083984375, 3.10205078125, 3.343017578125, 3.583984375, 3.824951171875, 4.06591796875, 4.306884765625, 4.5478515625, 4.788818359375, 5.02978515625, 5.270751953125, 5.51171875, 5.752685546875, 5.99365234375, 6.234619140625, 6.4755859375, 6.716552734375, 6.95751953125, 7.198486328125, 7.439453125, 7.680419921875, 7.92138671875, 8.162353515625, 8.4033203125, 8.644287109375, 8.88525390625, 9.126220703125, 9.3671875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 6.0, 9.0, 6.0, 7.0, 19.0, 9.0, 19.0, 25.0, 39.0, 65.0, 75.0, 98.0, 143.0, 222.0, 351.0, 624.0, 984.0, 507.0, 296.0, 175.0, 119.0, 74.0, 49.0, 37.0, 27.0, 18.0, 15.0, 13.0, 10.0, 8.0, 12.0, 7.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.30078125, -4.182220458984375, -4.06365966796875, -3.945098876953125, -3.8265380859375, -3.707977294921875, -3.58941650390625, -3.470855712890625, -3.352294921875, -3.233734130859375, -3.11517333984375, -2.996612548828125, -2.8780517578125, -2.759490966796875, -2.64093017578125, -2.522369384765625, -2.40380859375, -2.285247802734375, -2.16668701171875, -2.048126220703125, -1.9295654296875, -1.811004638671875, -1.69244384765625, -1.573883056640625, -1.455322265625, -1.336761474609375, -1.21820068359375, -1.099639892578125, -0.9810791015625, -0.862518310546875, -0.74395751953125, -0.625396728515625, -0.5068359375, -0.388275146484375, -0.26971435546875, -0.151153564453125, -0.0325927734375, 0.085968017578125, 0.20452880859375, 0.323089599609375, 0.441650390625, 0.560211181640625, 0.67877197265625, 0.797332763671875, 0.9158935546875, 1.034454345703125, 1.15301513671875, 1.271575927734375, 1.39013671875, 1.508697509765625, 1.62725830078125, 1.745819091796875, 1.8643798828125, 1.982940673828125, 2.10150146484375, 2.220062255859375, 2.338623046875, 2.457183837890625, 2.57574462890625, 2.694305419921875, 2.8128662109375, 2.931427001953125, 3.04998779296875, 3.168548583984375, 3.287109375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 1.0, 4.0, 12.0, 30.0, 27.0, 45.0, 68.0, 112.0, 123.0, 137.0, 153.0, 102.0, 80.0, 48.0, 21.0, 17.0, 15.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.89244842529297, -40.81348419189453, -39.734519958496094, -38.65555191040039, -37.57658767700195, -36.497623443603516, -35.41865539550781, -34.339691162109375, -33.26072692871094, -32.1817626953125, -31.10279655456543, -30.02383041381836, -28.944866180419922, -27.865901947021484, -26.786935806274414, -25.707969665527344, -24.629005432128906, -23.55004119873047, -22.4710750579834, -21.392108917236328, -20.31314468383789, -19.234180450439453, -18.155214309692383, -17.076248168945312, -15.997283935546875, -14.918318748474121, -13.839353561401367, -12.760388374328613, -11.68142318725586, -10.602458000183105, -9.523492813110352, -8.444527626037598, -7.365566253662109, -6.2866010665893555, -5.207635879516602, -4.128670692443848, -3.0497055053710938, -1.9707403182983398, -0.8917751312255859, 0.18719005584716797, 1.2661552429199219, 2.345120429992676, 3.4240856170654297, 4.503050804138184, 5.5820159912109375, 6.660981178283691, 7.739946365356445, 8.8189115524292, 9.897876739501953, 10.976841926574707, 12.055807113647461, 13.134772300720215, 14.213737487792969, 15.292702674865723, 16.371667861938477, 17.450634002685547, 18.529598236083984, 19.608562469482422, 20.687528610229492, 21.766494750976562, 22.845458984375, 23.924423217773438, 25.003389358520508, 26.082355499267578, 27.161319732666016]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 1.0, 4.0, 3.0, 7.0, 8.0, 7.0, 8.0, 10.0, 11.0, 23.0, 16.0, 31.0, 27.0, 37.0, 37.0, 30.0, 34.0, 45.0, 49.0, 35.0, 42.0, 48.0, 52.0, 44.0, 37.0, 53.0, 36.0, 16.0, 33.0, 27.0, 29.0, 26.0, 18.0, 22.0, 17.0, 22.0, 17.0, 7.0, 8.0, 8.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.431818962097168, -12.947786331176758, -12.463753700256348, -11.979721069335938, -11.495688438415527, -11.011655807495117, -10.527623176574707, -10.043590545654297, -9.559557914733887, -9.075525283813477, -8.591492652893066, -8.107460021972656, -7.623427391052246, -7.139394760131836, -6.655362129211426, -6.171329498291016, -5.6872968673706055, -5.203264236450195, -4.719231605529785, -4.235198974609375, -3.751166343688965, -3.2671337127685547, -2.7831010818481445, -2.2990684509277344, -1.8150358200073242, -1.331003189086914, -0.8469705581665039, -0.36293792724609375, 0.1210947036743164, 0.6051273345947266, 1.0891599655151367, 1.5731925964355469, 2.0572261810302734, 2.5412588119506836, 3.0252914428710938, 3.509324073791504, 3.993356704711914, 4.477389335632324, 4.961421966552734, 5.4454545974731445, 5.929487228393555, 6.413519859313965, 6.897552490234375, 7.381585121154785, 7.865617752075195, 8.349650382995605, 8.833683013916016, 9.317715644836426, 9.801748275756836, 10.285780906677246, 10.769813537597656, 11.253846168518066, 11.737878799438477, 12.221911430358887, 12.705944061279297, 13.189976692199707, 13.674009323120117, 14.158041954040527, 14.642074584960938, 15.126107215881348, 15.610139846801758, 16.094173431396484, 16.578205108642578, 17.062236785888672, 17.5462703704834]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 9.0, 10.0, 11.0, 25.0, 32.0, 59.0, 98.0, 148.0, 234.0, 438.0, 826.0, 1482.0, 2932.0, 6188.0, 12600.0, 27771.0, 65007.0, 192172.0, 484477.0, 152391.0, 55227.0, 24356.0, 11021.0, 5381.0, 2585.0, 1299.0, 752.0, 431.0, 224.0, 142.0, 86.0, 53.0, 24.0, 21.0, 16.0, 9.0, 5.0, 5.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.75, -6.484375, -6.21875, -5.953125, -5.6875, -5.421875, -5.15625, -4.890625, -4.625, -4.359375, -4.09375, -3.828125, -3.5625, -3.296875, -3.03125, -2.765625, -2.5, -2.234375, -1.96875, -1.703125, -1.4375, -1.171875, -0.90625, -0.640625, -0.375, -0.109375, 0.15625, 0.421875, 0.6875, 0.953125, 1.21875, 1.484375, 1.75, 2.015625, 2.28125, 2.546875, 2.8125, 3.078125, 3.34375, 3.609375, 3.875, 4.140625, 4.40625, 4.671875, 4.9375, 5.203125, 5.46875, 5.734375, 6.0, 6.265625, 6.53125, 6.796875, 7.0625, 7.328125, 7.59375, 7.859375, 8.125, 8.390625, 8.65625, 8.921875, 9.1875, 9.453125, 9.71875, 9.984375, 10.25]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 5.0, 7.0, 14.0, 10.0, 15.0, 18.0, 18.0, 31.0, 28.0, 29.0, 34.0, 44.0, 40.0, 39.0, 43.0, 45.0, 62.0, 39.0, 46.0, 49.0, 51.0, 43.0, 46.0, 38.0, 22.0, 28.0, 30.0, 20.0, 21.0, 26.0, 16.0, 11.0, 15.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3994140625, -1.3446197509765625, -1.289825439453125, -1.2350311279296875, -1.18023681640625, -1.1254425048828125, -1.070648193359375, -1.0158538818359375, -0.9610595703125, -0.9062652587890625, -0.851470947265625, -0.7966766357421875, -0.74188232421875, -0.6870880126953125, -0.632293701171875, -0.5774993896484375, -0.522705078125, -0.4679107666015625, -0.413116455078125, -0.3583221435546875, -0.30352783203125, -0.2487335205078125, -0.193939208984375, -0.1391448974609375, -0.0843505859375, -0.0295562744140625, 0.025238037109375, 0.0800323486328125, 0.13482666015625, 0.1896209716796875, 0.244415283203125, 0.2992095947265625, 0.35400390625, 0.4087982177734375, 0.463592529296875, 0.5183868408203125, 0.57318115234375, 0.6279754638671875, 0.682769775390625, 0.7375640869140625, 0.7923583984375, 0.8471527099609375, 0.901947021484375, 0.9567413330078125, 1.01153564453125, 1.0663299560546875, 1.121124267578125, 1.1759185791015625, 1.230712890625, 1.2855072021484375, 1.340301513671875, 1.3950958251953125, 1.44989013671875, 1.5046844482421875, 1.559478759765625, 1.6142730712890625, 1.6690673828125, 1.7238616943359375, 1.778656005859375, 1.8334503173828125, 1.88824462890625, 1.9430389404296875, 1.997833251953125, 2.0526275634765625, 2.107421875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 12.0, 13.0, 25.0, 23.0, 42.0, 49.0, 81.0, 124.0, 197.0, 313.0, 508.0, 894.0, 1978.0, 5013.0, 16059.0, 74527.0, 578005.0, 306652.0, 45717.0, 10838.0, 3820.0, 1580.0, 814.0, 473.0, 247.0, 164.0, 134.0, 69.0, 53.0, 43.0, 22.0, 15.0, 12.0, 8.0, 10.0, 4.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-13.3828125, -13.009521484375, -12.63623046875, -12.262939453125, -11.8896484375, -11.516357421875, -11.14306640625, -10.769775390625, -10.396484375, -10.023193359375, -9.64990234375, -9.276611328125, -8.9033203125, -8.530029296875, -8.15673828125, -7.783447265625, -7.41015625, -7.036865234375, -6.66357421875, -6.290283203125, -5.9169921875, -5.543701171875, -5.17041015625, -4.797119140625, -4.423828125, -4.050537109375, -3.67724609375, -3.303955078125, -2.9306640625, -2.557373046875, -2.18408203125, -1.810791015625, -1.4375, -1.064208984375, -0.69091796875, -0.317626953125, 0.0556640625, 0.428955078125, 0.80224609375, 1.175537109375, 1.548828125, 1.922119140625, 2.29541015625, 2.668701171875, 3.0419921875, 3.415283203125, 3.78857421875, 4.161865234375, 4.53515625, 4.908447265625, 5.28173828125, 5.655029296875, 6.0283203125, 6.401611328125, 6.77490234375, 7.148193359375, 7.521484375, 7.894775390625, 8.26806640625, 8.641357421875, 9.0146484375, 9.387939453125, 9.76123046875, 10.134521484375, 10.5078125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 10.0, 12.0, 8.0, 27.0, 21.0, 32.0, 36.0, 48.0, 41.0, 59.0, 55.0, 76.0, 52.0, 71.0, 75.0, 64.0, 75.0, 55.0, 41.0, 35.0, 29.0, 19.0, 16.0, 10.0, 11.0, 12.0, 8.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1953125, -11.8544921875, -11.513671875, -11.1728515625, -10.83203125, -10.4912109375, -10.150390625, -9.8095703125, -9.46875, -9.1279296875, -8.787109375, -8.4462890625, -8.10546875, -7.7646484375, -7.423828125, -7.0830078125, -6.7421875, -6.4013671875, -6.060546875, -5.7197265625, -5.37890625, -5.0380859375, -4.697265625, -4.3564453125, -4.015625, -3.6748046875, -3.333984375, -2.9931640625, -2.65234375, -2.3115234375, -1.970703125, -1.6298828125, -1.2890625, -0.9482421875, -0.607421875, -0.2666015625, 0.07421875, 0.4150390625, 0.755859375, 1.0966796875, 1.4375, 1.7783203125, 2.119140625, 2.4599609375, 2.80078125, 3.1416015625, 3.482421875, 3.8232421875, 4.1640625, 4.5048828125, 4.845703125, 5.1865234375, 5.52734375, 5.8681640625, 6.208984375, 6.5498046875, 6.890625, 7.2314453125, 7.572265625, 7.9130859375, 8.25390625, 8.5947265625, 8.935546875, 9.2763671875, 9.6171875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 4.0, 5.0, 20.0, 19.0, 28.0, 64.0, 80.0, 126.0, 240.0, 588.0, 1955.0, 7970.0, 44956.0, 615556.0, 336654.0, 31949.0, 5873.0, 1463.0, 503.0, 231.0, 109.0, 55.0, 35.0, 29.0, 19.0, 10.0, 7.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.9765625, -8.6951904296875, -8.413818359375, -8.1324462890625, -7.85107421875, -7.5697021484375, -7.288330078125, -7.0069580078125, -6.7255859375, -6.4442138671875, -6.162841796875, -5.8814697265625, -5.60009765625, -5.3187255859375, -5.037353515625, -4.7559814453125, -4.474609375, -4.1932373046875, -3.911865234375, -3.6304931640625, -3.34912109375, -3.0677490234375, -2.786376953125, -2.5050048828125, -2.2236328125, -1.9422607421875, -1.660888671875, -1.3795166015625, -1.09814453125, -0.8167724609375, -0.535400390625, -0.2540283203125, 0.02734375, 0.3087158203125, 0.590087890625, 0.8714599609375, 1.15283203125, 1.4342041015625, 1.715576171875, 1.9969482421875, 2.2783203125, 2.5596923828125, 2.841064453125, 3.1224365234375, 3.40380859375, 3.6851806640625, 3.966552734375, 4.2479248046875, 4.529296875, 4.8106689453125, 5.092041015625, 5.3734130859375, 5.65478515625, 5.9361572265625, 6.217529296875, 6.4989013671875, 6.7802734375, 7.0616455078125, 7.343017578125, 7.6243896484375, 7.90576171875, 8.1871337890625, 8.468505859375, 8.7498779296875, 9.03125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 4.0, 7.0, 13.0, 7.0, 9.0, 10.0, 14.0, 17.0, 10.0, 29.0, 36.0, 72.0, 171.0, 216.0, 134.0, 68.0, 25.0, 28.0, 23.0, 16.0, 11.0, 22.0, 9.0, 9.0, 7.0, 3.0, 6.0, 7.0, 2.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001068115234375, -0.0010303109884262085, -0.000992506742477417, -0.0009547024965286255, -0.000916898250579834, -0.0008790940046310425, -0.000841289758682251, -0.0008034855127334595, -0.000765681266784668, -0.0007278770208358765, -0.000690072774887085, -0.0006522685289382935, -0.000614464282989502, -0.0005766600370407104, -0.0005388557910919189, -0.0005010515451431274, -0.00046324729919433594, -0.00042544305324554443, -0.00038763880729675293, -0.0003498345613479614, -0.0003120303153991699, -0.0002742260694503784, -0.00023642182350158691, -0.0001986175775527954, -0.0001608133316040039, -0.0001230090856552124, -8.52048397064209e-05, -4.7400593757629395e-05, -9.59634780883789e-06, 2.8207898139953613e-05, 6.601214408874512e-05, 0.00010381639003753662, 0.00014162063598632812, 0.00017942488193511963, 0.00021722912788391113, 0.00025503337383270264, 0.00029283761978149414, 0.00033064186573028564, 0.00036844611167907715, 0.00040625035762786865, 0.00044405460357666016, 0.00048185884952545166, 0.0005196630954742432, 0.0005574673414230347, 0.0005952715873718262, 0.0006330758333206177, 0.0006708800792694092, 0.0007086843252182007, 0.0007464885711669922, 0.0007842928171157837, 0.0008220970630645752, 0.0008599013090133667, 0.0008977055549621582, 0.0009355098009109497, 0.0009733140468597412, 0.0010111182928085327, 0.0010489225387573242, 0.0010867267847061157, 0.0011245310306549072, 0.0011623352766036987, 0.0012001395225524902, 0.0012379437685012817, 0.0012757480144500732, 0.0013135522603988647, 0.0013513565063476562]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 3.0, 2.0, 15.0, 22.0, 47.0, 91.0, 224.0, 460.0, 1751.0, 15870.0, 765332.0, 253910.0, 8839.0, 1275.0, 363.0, 176.0, 81.0, 51.0, 21.0, 11.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.40625, -20.9398193359375, -20.473388671875, -20.0069580078125, -19.54052734375, -19.0740966796875, -18.607666015625, -18.1412353515625, -17.6748046875, -17.2083740234375, -16.741943359375, -16.2755126953125, -15.80908203125, -15.3426513671875, -14.876220703125, -14.4097900390625, -13.943359375, -13.4769287109375, -13.010498046875, -12.5440673828125, -12.07763671875, -11.6112060546875, -11.144775390625, -10.6783447265625, -10.2119140625, -9.7454833984375, -9.279052734375, -8.8126220703125, -8.34619140625, -7.8797607421875, -7.413330078125, -6.9468994140625, -6.48046875, -6.0140380859375, -5.547607421875, -5.0811767578125, -4.61474609375, -4.1483154296875, -3.681884765625, -3.2154541015625, -2.7490234375, -2.2825927734375, -1.816162109375, -1.3497314453125, -0.88330078125, -0.4168701171875, 0.049560546875, 0.5159912109375, 0.982421875, 1.4488525390625, 1.915283203125, 2.3817138671875, 2.84814453125, 3.3145751953125, 3.781005859375, 4.2474365234375, 4.7138671875, 5.1802978515625, 5.646728515625, 6.1131591796875, 6.57958984375, 7.0460205078125, 7.512451171875, 7.9788818359375, 8.4453125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 3.0, 4.0, 12.0, 12.0, 12.0, 12.0, 15.0, 10.0, 17.0, 24.0, 47.0, 87.0, 127.0, 144.0, 117.0, 105.0, 67.0, 38.0, 28.0, 18.0, 24.0, 14.0, 12.0, 7.0, 8.0, 7.0, 7.0, 5.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-5.1953125, -5.06427001953125, -4.9332275390625, -4.80218505859375, -4.671142578125, -4.54010009765625, -4.4090576171875, -4.27801513671875, -4.14697265625, -4.01593017578125, -3.8848876953125, -3.75384521484375, -3.622802734375, -3.49176025390625, -3.3607177734375, -3.22967529296875, -3.0986328125, -2.96759033203125, -2.8365478515625, -2.70550537109375, -2.574462890625, -2.44342041015625, -2.3123779296875, -2.18133544921875, -2.05029296875, -1.91925048828125, -1.7882080078125, -1.65716552734375, -1.526123046875, -1.39508056640625, -1.2640380859375, -1.13299560546875, -1.001953125, -0.87091064453125, -0.7398681640625, -0.60882568359375, -0.477783203125, -0.34674072265625, -0.2156982421875, -0.08465576171875, 0.04638671875, 0.17742919921875, 0.3084716796875, 0.43951416015625, 0.570556640625, 0.70159912109375, 0.8326416015625, 0.96368408203125, 1.0947265625, 1.22576904296875, 1.3568115234375, 1.48785400390625, 1.618896484375, 1.74993896484375, 1.8809814453125, 2.01202392578125, 2.14306640625, 2.27410888671875, 2.4051513671875, 2.53619384765625, 2.667236328125, 2.79827880859375, 2.9293212890625, 3.06036376953125, 3.19140625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 10.0, 31.0, 126.0, 287.0, 324.0, 163.0, 48.0, 12.0, 4.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-222.99085998535156, -217.42457580566406, -211.8582763671875, -206.2919921875, -200.72569274902344, -195.15940856933594, -189.59310913085938, -184.02682495117188, -178.46054077148438, -172.89425659179688, -167.3279571533203, -161.7616729736328, -156.19537353515625, -150.62908935546875, -145.06280517578125, -139.4965057373047, -133.93020629882812, -128.36392211914062, -122.79762268066406, -117.23133850097656, -111.6650390625, -106.0987548828125, -100.53246307373047, -94.96617126464844, -89.3998794555664, -83.83358764648438, -78.26729583740234, -72.70100402832031, -67.13471984863281, -61.568424224853516, -56.00213623046875, -50.43584442138672, -44.86955261230469, -39.303260803222656, -33.736968994140625, -28.17068099975586, -22.604389190673828, -17.038097381591797, -11.471809387207031, -5.905517578125, -0.33922576904296875, 5.227065086364746, 10.793355941772461, 16.35964584350586, 21.92593765258789, 27.492229461669922, 33.05851745605469, 38.62480926513672, 44.19110107421875, 49.75739288330078, 55.32368469238281, 60.88997268676758, 66.45626831054688, 72.02255249023438, 77.5888442993164, 83.15513610839844, 88.72142791748047, 94.2877197265625, 99.85401153564453, 105.42030334472656, 110.98658752441406, 116.55288696289062, 122.11917114257812, 127.68546295166016, 133.2517547607422]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 7.0, 8.0, 9.0, 17.0, 16.0, 13.0, 28.0, 25.0, 24.0, 31.0, 40.0, 35.0, 48.0, 37.0, 42.0, 60.0, 58.0, 42.0, 43.0, 43.0, 38.0, 30.0, 37.0, 32.0, 33.0, 35.0, 21.0, 32.0, 23.0, 24.0, 16.0, 11.0, 15.0, 6.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-42.01609802246094, -40.74671936035156, -39.47734451293945, -38.20796585083008, -36.93859100341797, -35.669212341308594, -34.399837493896484, -33.13045883178711, -31.861083984375, -30.591707229614258, -29.322330474853516, -28.052953720092773, -26.78357696533203, -25.51420021057129, -24.244823455810547, -22.975444793701172, -21.70606803894043, -20.436691284179688, -19.167314529418945, -17.897937774658203, -16.62856101989746, -15.359184265136719, -14.08980655670166, -12.820429801940918, -11.551053047180176, -10.281676292419434, -9.012299537658691, -7.742922306060791, -6.473545551300049, -5.204168796539307, -3.9347915649414062, -2.665414810180664, -1.3960380554199219, -0.12666118144989014, 1.1427156925201416, 2.412092685699463, 3.681469440460205, 4.950846195220947, 6.220223426818848, 7.48960018157959, 8.758976936340332, 10.028353691101074, 11.297730445861816, 12.567108154296875, 13.836484909057617, 15.10586166381836, 16.3752384185791, 17.644615173339844, 18.913991928100586, 20.183368682861328, 21.45274543762207, 22.722122192382812, 23.991498947143555, 25.260875701904297, 26.530254364013672, 27.79962921142578, 29.069007873535156, 30.3383846282959, 31.60776138305664, 32.877140045166016, 34.146514892578125, 35.4158935546875, 36.68526840209961, 37.954647064208984, 39.224021911621094]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 7.0, 4.0, 11.0, 12.0, 27.0, 53.0, 72.0, 107.0, 166.0, 314.0, 519.0, 948.0, 1627.0, 3140.0, 6208.0, 13015.0, 29954.0, 80874.0, 318220.0, 3042699.0, 519359.0, 107329.0, 37843.0, 15856.0, 7516.0, 3704.0, 2023.0, 1082.0, 637.0, 342.0, 220.0, 124.0, 107.0, 54.0, 31.0, 24.0, 22.0, 16.0, 8.0, 5.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8046875, -6.558349609375, -6.31201171875, -6.065673828125, -5.8193359375, -5.572998046875, -5.32666015625, -5.080322265625, -4.833984375, -4.587646484375, -4.34130859375, -4.094970703125, -3.8486328125, -3.602294921875, -3.35595703125, -3.109619140625, -2.86328125, -2.616943359375, -2.37060546875, -2.124267578125, -1.8779296875, -1.631591796875, -1.38525390625, -1.138916015625, -0.892578125, -0.646240234375, -0.39990234375, -0.153564453125, 0.0927734375, 0.339111328125, 0.58544921875, 0.831787109375, 1.078125, 1.324462890625, 1.57080078125, 1.817138671875, 2.0634765625, 2.309814453125, 2.55615234375, 2.802490234375, 3.048828125, 3.295166015625, 3.54150390625, 3.787841796875, 4.0341796875, 4.280517578125, 4.52685546875, 4.773193359375, 5.01953125, 5.265869140625, 5.51220703125, 5.758544921875, 6.0048828125, 6.251220703125, 6.49755859375, 6.743896484375, 6.990234375, 7.236572265625, 7.48291015625, 7.729248046875, 7.9755859375, 8.221923828125, 8.46826171875, 8.714599609375, 8.9609375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 3.0, 5.0, 11.0, 10.0, 11.0, 21.0, 17.0, 19.0, 22.0, 27.0, 25.0, 41.0, 36.0, 45.0, 45.0, 53.0, 37.0, 43.0, 53.0, 42.0, 44.0, 43.0, 40.0, 37.0, 42.0, 21.0, 30.0, 18.0, 27.0, 18.0, 29.0, 16.0, 13.0, 13.0, 10.0, 13.0, 2.0, 6.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5615234375, -1.5053253173828125, -1.449127197265625, -1.3929290771484375, -1.33673095703125, -1.2805328369140625, -1.224334716796875, -1.1681365966796875, -1.1119384765625, -1.0557403564453125, -0.999542236328125, -0.9433441162109375, -0.88714599609375, -0.8309478759765625, -0.774749755859375, -0.7185516357421875, -0.662353515625, -0.6061553955078125, -0.549957275390625, -0.4937591552734375, -0.43756103515625, -0.3813629150390625, -0.325164794921875, -0.2689666748046875, -0.2127685546875, -0.1565704345703125, -0.100372314453125, -0.0441741943359375, 0.01202392578125, 0.0682220458984375, 0.124420166015625, 0.1806182861328125, 0.23681640625, 0.2930145263671875, 0.349212646484375, 0.4054107666015625, 0.46160888671875, 0.5178070068359375, 0.574005126953125, 0.6302032470703125, 0.6864013671875, 0.7425994873046875, 0.798797607421875, 0.8549957275390625, 0.91119384765625, 0.9673919677734375, 1.023590087890625, 1.0797882080078125, 1.135986328125, 1.1921844482421875, 1.248382568359375, 1.3045806884765625, 1.36077880859375, 1.4169769287109375, 1.473175048828125, 1.5293731689453125, 1.5855712890625, 1.6417694091796875, 1.697967529296875, 1.7541656494140625, 1.81036376953125, 1.8665618896484375, 1.922760009765625, 1.9789581298828125, 2.03515625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 2.0, 2.0, 11.0, 13.0, 14.0, 37.0, 37.0, 75.0, 128.0, 211.0, 355.0, 706.0, 1278.0, 2678.0, 5782.0, 14385.0, 43413.0, 183403.0, 2342611.0, 1394919.0, 145246.0, 36567.0, 12524.0, 4898.0, 2326.0, 1150.0, 616.0, 364.0, 202.0, 113.0, 71.0, 46.0, 30.0, 26.0, 16.0, 13.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9140625, -8.60595703125, -8.2978515625, -7.98974609375, -7.681640625, -7.37353515625, -7.0654296875, -6.75732421875, -6.44921875, -6.14111328125, -5.8330078125, -5.52490234375, -5.216796875, -4.90869140625, -4.6005859375, -4.29248046875, -3.984375, -3.67626953125, -3.3681640625, -3.06005859375, -2.751953125, -2.44384765625, -2.1357421875, -1.82763671875, -1.51953125, -1.21142578125, -0.9033203125, -0.59521484375, -0.287109375, 0.02099609375, 0.3291015625, 0.63720703125, 0.9453125, 1.25341796875, 1.5615234375, 1.86962890625, 2.177734375, 2.48583984375, 2.7939453125, 3.10205078125, 3.41015625, 3.71826171875, 4.0263671875, 4.33447265625, 4.642578125, 4.95068359375, 5.2587890625, 5.56689453125, 5.875, 6.18310546875, 6.4912109375, 6.79931640625, 7.107421875, 7.41552734375, 7.7236328125, 8.03173828125, 8.33984375, 8.64794921875, 8.9560546875, 9.26416015625, 9.572265625, 9.88037109375, 10.1884765625, 10.49658203125, 10.8046875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 6.0, 6.0, 9.0, 8.0, 11.0, 22.0, 18.0, 29.0, 54.0, 83.0, 99.0, 161.0, 299.0, 652.0, 1303.0, 594.0, 279.0, 147.0, 101.0, 53.0, 44.0, 17.0, 16.0, 14.0, 18.0, 8.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.14453125, -4.00836181640625, -3.8721923828125, -3.73602294921875, -3.599853515625, -3.46368408203125, -3.3275146484375, -3.19134521484375, -3.05517578125, -2.91900634765625, -2.7828369140625, -2.64666748046875, -2.510498046875, -2.37432861328125, -2.2381591796875, -2.10198974609375, -1.9658203125, -1.82965087890625, -1.6934814453125, -1.55731201171875, -1.421142578125, -1.28497314453125, -1.1488037109375, -1.01263427734375, -0.87646484375, -0.74029541015625, -0.6041259765625, -0.46795654296875, -0.331787109375, -0.19561767578125, -0.0594482421875, 0.07672119140625, 0.212890625, 0.34906005859375, 0.4852294921875, 0.62139892578125, 0.757568359375, 0.89373779296875, 1.0299072265625, 1.16607666015625, 1.30224609375, 1.43841552734375, 1.5745849609375, 1.71075439453125, 1.846923828125, 1.98309326171875, 2.1192626953125, 2.25543212890625, 2.3916015625, 2.52777099609375, 2.6639404296875, 2.80010986328125, 2.936279296875, 3.07244873046875, 3.2086181640625, 3.34478759765625, 3.48095703125, 3.61712646484375, 3.7532958984375, 3.88946533203125, 4.025634765625, 4.16180419921875, 4.2979736328125, 4.43414306640625, 4.5703125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 13.0, 33.0, 81.0, 190.0, 220.0, 242.0, 146.0, 53.0, 21.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.58502197265625, -93.74484252929688, -91.90465545654297, -90.0644760131836, -88.22428894042969, -86.38410949707031, -84.54393005371094, -82.70374298095703, -80.86356353759766, -79.02338409423828, -77.18319702148438, -75.343017578125, -73.5028305053711, -71.66265106201172, -69.82246398925781, -67.98228454589844, -66.14210510253906, -64.30192565917969, -62.46173858642578, -60.621559143066406, -58.781375885009766, -56.941192626953125, -55.101009368896484, -53.260826110839844, -51.42063903808594, -49.5804557800293, -47.740272521972656, -45.90009307861328, -44.05990982055664, -42.2197265625, -40.37954330444336, -38.53936004638672, -36.69917678833008, -34.85899353027344, -33.0188102722168, -31.17862892150879, -29.33844757080078, -27.49826431274414, -25.6580810546875, -23.81789779663086, -21.97771644592285, -20.13753318786621, -18.297351837158203, -16.457168579101562, -14.616986274719238, -12.776803970336914, -10.936620712280273, -9.09643840789795, -7.256256103515625, -5.416073799133301, -3.5758910179138184, -1.735708236694336, 0.10447406768798828, 1.9446563720703125, 3.784839630126953, 5.625021934509277, 7.465204238891602, 9.305386543273926, 11.14556884765625, 12.98575210571289, 14.825934410095215, 16.66611671447754, 18.50629997253418, 20.346481323242188, 22.186664581298828]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 9.0, 5.0, 11.0, 14.0, 19.0, 25.0, 18.0, 28.0, 33.0, 26.0, 37.0, 37.0, 38.0, 40.0, 52.0, 38.0, 48.0, 45.0, 44.0, 39.0, 38.0, 40.0, 46.0, 34.0, 41.0, 30.0, 35.0, 26.0, 21.0, 14.0, 16.0, 10.0, 7.0, 5.0, 6.0, 8.0, 3.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-14.41515064239502, -13.955218315124512, -13.495285987854004, -13.035354614257812, -12.575422286987305, -12.115489959716797, -11.655557632446289, -11.195625305175781, -10.735692977905273, -10.275760650634766, -9.815828323364258, -9.35589599609375, -8.895964622497559, -8.43603229522705, -7.976099967956543, -7.516167640686035, -7.0562357902526855, -6.596303462982178, -6.136371612548828, -5.67643928527832, -5.2165069580078125, -4.756574630737305, -4.296642780303955, -3.8367104530334473, -3.3767783641815186, -2.91684627532959, -2.456913948059082, -1.9969818592071533, -1.537049651145935, -1.0771174430847168, -0.6171853542327881, -0.15725302696228027, 0.30267906188964844, 0.7626112699508667, 1.222543478012085, 1.6824755668640137, 2.1424078941345215, 2.60233998298645, 3.062272071838379, 3.5222043991088867, 3.9821364879608154, 4.442068576812744, 4.902000904083252, 5.361932754516602, 5.821865081787109, 6.281797409057617, 6.741729736328125, 7.201662063598633, 7.661593914031982, 8.121525764465332, 8.58145809173584, 9.041390419006348, 9.501322746276855, 9.961255073547363, 10.421186447143555, 10.881118774414062, 11.34105110168457, 11.800983428955078, 12.260915756225586, 12.720848083496094, 13.180779457092285, 13.640711784362793, 14.1006441116333, 14.560576438903809, 15.020508766174316]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 11.0, 9.0, 14.0, 21.0, 28.0, 32.0, 70.0, 121.0, 232.0, 479.0, 1074.0, 2463.0, 5931.0, 14578.0, 35655.0, 108809.0, 526022.0, 254381.0, 59288.0, 22922.0, 9385.0, 3930.0, 1601.0, 731.0, 330.0, 164.0, 107.0, 52.0, 30.0, 25.0, 14.0, 13.0, 11.0, 10.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1484375, -9.8564453125, -9.564453125, -9.2724609375, -8.98046875, -8.6884765625, -8.396484375, -8.1044921875, -7.8125, -7.5205078125, -7.228515625, -6.9365234375, -6.64453125, -6.3525390625, -6.060546875, -5.7685546875, -5.4765625, -5.1845703125, -4.892578125, -4.6005859375, -4.30859375, -4.0166015625, -3.724609375, -3.4326171875, -3.140625, -2.8486328125, -2.556640625, -2.2646484375, -1.97265625, -1.6806640625, -1.388671875, -1.0966796875, -0.8046875, -0.5126953125, -0.220703125, 0.0712890625, 0.36328125, 0.6552734375, 0.947265625, 1.2392578125, 1.53125, 1.8232421875, 2.115234375, 2.4072265625, 2.69921875, 2.9912109375, 3.283203125, 3.5751953125, 3.8671875, 4.1591796875, 4.451171875, 4.7431640625, 5.03515625, 5.3271484375, 5.619140625, 5.9111328125, 6.203125, 6.4951171875, 6.787109375, 7.0791015625, 7.37109375, 7.6630859375, 7.955078125, 8.2470703125, 8.5390625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 4.0, 4.0, 2.0, 8.0, 3.0, 10.0, 10.0, 11.0, 20.0, 25.0, 19.0, 31.0, 30.0, 25.0, 33.0, 30.0, 36.0, 44.0, 56.0, 40.0, 31.0, 50.0, 46.0, 40.0, 39.0, 35.0, 30.0, 35.0, 26.0, 34.0, 33.0, 19.0, 20.0, 15.0, 19.0, 17.0, 24.0, 14.0, 4.0, 7.0, 7.0, 4.0, 5.0, 2.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7255859375, -1.6712799072265625, -1.616973876953125, -1.5626678466796875, -1.50836181640625, -1.4540557861328125, -1.399749755859375, -1.3454437255859375, -1.2911376953125, -1.2368316650390625, -1.182525634765625, -1.1282196044921875, -1.07391357421875, -1.0196075439453125, -0.965301513671875, -0.9109954833984375, -0.856689453125, -0.8023834228515625, -0.748077392578125, -0.6937713623046875, -0.63946533203125, -0.5851593017578125, -0.530853271484375, -0.4765472412109375, -0.4222412109375, -0.3679351806640625, -0.313629150390625, -0.2593231201171875, -0.20501708984375, -0.1507110595703125, -0.096405029296875, -0.0420989990234375, 0.01220703125, 0.0665130615234375, 0.120819091796875, 0.1751251220703125, 0.22943115234375, 0.2837371826171875, 0.338043212890625, 0.3923492431640625, 0.4466552734375, 0.5009613037109375, 0.555267333984375, 0.6095733642578125, 0.66387939453125, 0.7181854248046875, 0.772491455078125, 0.8267974853515625, 0.881103515625, 0.9354095458984375, 0.989715576171875, 1.0440216064453125, 1.09832763671875, 1.1526336669921875, 1.206939697265625, 1.2612457275390625, 1.3155517578125, 1.3698577880859375, 1.424163818359375, 1.4784698486328125, 1.53277587890625, 1.5870819091796875, 1.641387939453125, 1.6956939697265625, 1.75]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 9.0, 8.0, 11.0, 15.0, 12.0, 27.0, 37.0, 68.0, 76.0, 144.0, 308.0, 623.0, 1544.0, 4210.0, 14038.0, 51017.0, 630036.0, 292885.0, 36965.0, 10758.0, 3406.0, 1237.0, 502.0, 258.0, 132.0, 89.0, 50.0, 24.0, 16.0, 12.0, 12.0, 8.0, 4.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.90625, -13.4248046875, -12.943359375, -12.4619140625, -11.98046875, -11.4990234375, -11.017578125, -10.5361328125, -10.0546875, -9.5732421875, -9.091796875, -8.6103515625, -8.12890625, -7.6474609375, -7.166015625, -6.6845703125, -6.203125, -5.7216796875, -5.240234375, -4.7587890625, -4.27734375, -3.7958984375, -3.314453125, -2.8330078125, -2.3515625, -1.8701171875, -1.388671875, -0.9072265625, -0.42578125, 0.0556640625, 0.537109375, 1.0185546875, 1.5, 1.9814453125, 2.462890625, 2.9443359375, 3.42578125, 3.9072265625, 4.388671875, 4.8701171875, 5.3515625, 5.8330078125, 6.314453125, 6.7958984375, 7.27734375, 7.7587890625, 8.240234375, 8.7216796875, 9.203125, 9.6845703125, 10.166015625, 10.6474609375, 11.12890625, 11.6103515625, 12.091796875, 12.5732421875, 13.0546875, 13.5361328125, 14.017578125, 14.4990234375, 14.98046875, 15.4619140625, 15.943359375, 16.4248046875, 16.90625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 6.0, 5.0, 3.0, 1.0, 5.0, 6.0, 5.0, 6.0, 7.0, 8.0, 8.0, 14.0, 16.0, 13.0, 32.0, 36.0, 35.0, 52.0, 52.0, 51.0, 65.0, 67.0, 63.0, 60.0, 72.0, 51.0, 62.0, 34.0, 30.0, 30.0, 27.0, 15.0, 17.0, 11.0, 11.0, 10.0, 4.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.421875, -11.0557861328125, -10.689697265625, -10.3236083984375, -9.95751953125, -9.5914306640625, -9.225341796875, -8.8592529296875, -8.4931640625, -8.1270751953125, -7.760986328125, -7.3948974609375, -7.02880859375, -6.6627197265625, -6.296630859375, -5.9305419921875, -5.564453125, -5.1983642578125, -4.832275390625, -4.4661865234375, -4.10009765625, -3.7340087890625, -3.367919921875, -3.0018310546875, -2.6357421875, -2.2696533203125, -1.903564453125, -1.5374755859375, -1.17138671875, -0.8052978515625, -0.439208984375, -0.0731201171875, 0.29296875, 0.6590576171875, 1.025146484375, 1.3912353515625, 1.75732421875, 2.1234130859375, 2.489501953125, 2.8555908203125, 3.2216796875, 3.5877685546875, 3.953857421875, 4.3199462890625, 4.68603515625, 5.0521240234375, 5.418212890625, 5.7843017578125, 6.150390625, 6.5164794921875, 6.882568359375, 7.2486572265625, 7.61474609375, 7.9808349609375, 8.346923828125, 8.7130126953125, 9.0791015625, 9.4451904296875, 9.811279296875, 10.1773681640625, 10.54345703125, 10.9095458984375, 11.275634765625, 11.6417236328125, 12.0078125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 0.0, 2.0, 5.0, 12.0, 10.0, 12.0, 20.0, 29.0, 32.0, 50.0, 79.0, 95.0, 142.0, 193.0, 278.0, 387.0, 557.0, 853.0, 1384.0, 2223.0, 4018.0, 7948.0, 16307.0, 34686.0, 90506.0, 564061.0, 224829.0, 51952.0, 23279.0, 11237.0, 5449.0, 2918.0, 1676.0, 1051.0, 639.0, 482.0, 345.0, 233.0, 158.0, 112.0, 81.0, 60.0, 44.0, 31.0, 25.0, 25.0, 13.0, 9.0, 8.0, 8.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.369140625, -3.251922607421875, -3.13470458984375, -3.017486572265625, -2.9002685546875, -2.783050537109375, -2.66583251953125, -2.548614501953125, -2.431396484375, -2.314178466796875, -2.19696044921875, -2.079742431640625, -1.9625244140625, -1.845306396484375, -1.72808837890625, -1.610870361328125, -1.49365234375, -1.376434326171875, -1.25921630859375, -1.141998291015625, -1.0247802734375, -0.907562255859375, -0.79034423828125, -0.673126220703125, -0.555908203125, -0.438690185546875, -0.32147216796875, -0.204254150390625, -0.0870361328125, 0.030181884765625, 0.14739990234375, 0.264617919921875, 0.3818359375, 0.499053955078125, 0.61627197265625, 0.733489990234375, 0.8507080078125, 0.967926025390625, 1.08514404296875, 1.202362060546875, 1.319580078125, 1.436798095703125, 1.55401611328125, 1.671234130859375, 1.7884521484375, 1.905670166015625, 2.02288818359375, 2.140106201171875, 2.25732421875, 2.374542236328125, 2.49176025390625, 2.608978271484375, 2.7261962890625, 2.843414306640625, 2.96063232421875, 3.077850341796875, 3.195068359375, 3.312286376953125, 3.42950439453125, 3.546722412109375, 3.6639404296875, 3.781158447265625, 3.89837646484375, 4.015594482421875, 4.1328125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 4.0, 3.0, 4.0, 3.0, 16.0, 8.0, 16.0, 23.0, 58.0, 276.0, 370.0, 84.0, 36.0, 21.0, 23.0, 8.0, 16.0, 7.0, 10.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015668869018554688, -0.0015020519495010376, -0.0014372169971466064, -0.0013723820447921753, -0.0013075470924377441, -0.001242712140083313, -0.0011778771877288818, -0.0011130422353744507, -0.0010482072830200195, -0.0009833723306655884, -0.0009185373783111572, -0.0008537024259567261, -0.0007888674736022949, -0.0007240325212478638, -0.0006591975688934326, -0.0005943626165390015, -0.0005295276641845703, -0.00046469271183013916, -0.000399857759475708, -0.00033502280712127686, -0.0002701878547668457, -0.00020535290241241455, -0.0001405179500579834, -7.568299770355225e-05, -1.0848045349121094e-05, 5.398690700531006e-05, 0.00011882185935974121, 0.00018365681171417236, 0.0002484917640686035, 0.00031332671642303467, 0.0003781616687774658, 0.00044299662113189697, 0.0005078315734863281, 0.0005726665258407593, 0.0006375014781951904, 0.0007023364305496216, 0.0007671713829040527, 0.0008320063352584839, 0.000896841287612915, 0.0009616762399673462, 0.0010265111923217773, 0.0010913461446762085, 0.0011561810970306396, 0.0012210160493850708, 0.001285851001739502, 0.001350685954093933, 0.0014155209064483643, 0.0014803558588027954, 0.0015451908111572266, 0.0016100257635116577, 0.0016748607158660889, 0.00173969566822052, 0.0018045306205749512, 0.0018693655729293823, 0.0019342005252838135, 0.0019990354776382446, 0.0020638704299926758, 0.002128705382347107, 0.002193540334701538, 0.0022583752870559692, 0.0023232102394104004, 0.0023880451917648315, 0.0024528801441192627, 0.002517715096473694, 0.002582550048828125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 7.0, 2.0, 8.0, 16.0, 11.0, 17.0, 27.0, 44.0, 54.0, 69.0, 127.0, 236.0, 419.0, 783.0, 1458.0, 3173.0, 9367.0, 37802.0, 412356.0, 523391.0, 42085.0, 10137.0, 3484.0, 1545.0, 844.0, 433.0, 232.0, 126.0, 102.0, 55.0, 46.0, 25.0, 25.0, 9.0, 7.0, 11.0, 2.0, 2.0, 4.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.3828125, -7.15234375, -6.921875, -6.69140625, -6.4609375, -6.23046875, -6.0, -5.76953125, -5.5390625, -5.30859375, -5.078125, -4.84765625, -4.6171875, -4.38671875, -4.15625, -3.92578125, -3.6953125, -3.46484375, -3.234375, -3.00390625, -2.7734375, -2.54296875, -2.3125, -2.08203125, -1.8515625, -1.62109375, -1.390625, -1.16015625, -0.9296875, -0.69921875, -0.46875, -0.23828125, -0.0078125, 0.22265625, 0.453125, 0.68359375, 0.9140625, 1.14453125, 1.375, 1.60546875, 1.8359375, 2.06640625, 2.296875, 2.52734375, 2.7578125, 2.98828125, 3.21875, 3.44921875, 3.6796875, 3.91015625, 4.140625, 4.37109375, 4.6015625, 4.83203125, 5.0625, 5.29296875, 5.5234375, 5.75390625, 5.984375, 6.21484375, 6.4453125, 6.67578125, 6.90625, 7.13671875, 7.3671875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 0.0, 1.0, 1.0, 6.0, 1.0, 2.0, 3.0, 7.0, 9.0, 13.0, 10.0, 20.0, 19.0, 42.0, 60.0, 138.0, 235.0, 188.0, 110.0, 44.0, 27.0, 9.0, 17.0, 15.0, 7.0, 3.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-7.52734375, -7.338623046875, -7.14990234375, -6.961181640625, -6.7724609375, -6.583740234375, -6.39501953125, -6.206298828125, -6.017578125, -5.828857421875, -5.64013671875, -5.451416015625, -5.2626953125, -5.073974609375, -4.88525390625, -4.696533203125, -4.5078125, -4.319091796875, -4.13037109375, -3.941650390625, -3.7529296875, -3.564208984375, -3.37548828125, -3.186767578125, -2.998046875, -2.809326171875, -2.62060546875, -2.431884765625, -2.2431640625, -2.054443359375, -1.86572265625, -1.677001953125, -1.48828125, -1.299560546875, -1.11083984375, -0.922119140625, -0.7333984375, -0.544677734375, -0.35595703125, -0.167236328125, 0.021484375, 0.210205078125, 0.39892578125, 0.587646484375, 0.7763671875, 0.965087890625, 1.15380859375, 1.342529296875, 1.53125, 1.719970703125, 1.90869140625, 2.097412109375, 2.2861328125, 2.474853515625, 2.66357421875, 2.852294921875, 3.041015625, 3.229736328125, 3.41845703125, 3.607177734375, 3.7958984375, 3.984619140625, 4.17333984375, 4.362060546875, 4.55078125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 9.0, 16.0, 23.0, 24.0, 29.0, 27.0, 39.0, 59.0, 62.0, 67.0, 70.0, 72.0, 73.0, 63.0, 72.0, 47.0, 44.0, 42.0, 42.0, 34.0, 16.0, 21.0, 14.0, 9.0, 6.0, 3.0, 3.0, 2.0, 5.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.551090240478516, -46.178009033203125, -44.804927825927734, -43.431846618652344, -42.05876541137695, -40.68568420410156, -39.31260299682617, -37.93952178955078, -36.56644058227539, -35.193359375, -33.82027816772461, -32.44719696044922, -31.074115753173828, -29.701034545898438, -28.327953338623047, -26.954872131347656, -25.581789016723633, -24.208707809448242, -22.83562660217285, -21.46254539489746, -20.08946418762207, -18.71638298034668, -17.343299865722656, -15.970219612121582, -14.597138404846191, -13.2240571975708, -11.85097599029541, -10.477893829345703, -9.104812622070312, -7.73173189163208, -6.358650207519531, -4.985569000244141, -3.61248779296875, -2.2394065856933594, -0.8663251399993896, 0.5067563056945801, 1.8798375129699707, 3.2529187202453613, 4.62600040435791, 5.999081611633301, 7.372162818908691, 8.745244026184082, 10.118325233459473, 11.49140739440918, 12.86448860168457, 14.237569808959961, 15.610651016235352, 16.983732223510742, 18.356813430786133, 19.729894638061523, 21.102975845336914, 22.476057052612305, 23.849138259887695, 25.222219467163086, 26.59530258178711, 27.9683837890625, 29.34146499633789, 30.71454620361328, 32.08762741088867, 33.46070861816406, 34.83378982543945, 36.206871032714844, 37.579952239990234, 38.953033447265625, 40.326114654541016]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 9.0, 3.0, 5.0, 9.0, 10.0, 12.0, 15.0, 13.0, 18.0, 24.0, 20.0, 19.0, 26.0, 33.0, 31.0, 34.0, 36.0, 47.0, 46.0, 34.0, 40.0, 54.0, 37.0, 62.0, 39.0, 30.0, 46.0, 32.0, 38.0, 25.0, 25.0, 28.0, 16.0, 19.0, 11.0, 9.0, 7.0, 9.0, 6.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.03767013549805, -37.726226806640625, -36.4147834777832, -35.10334014892578, -33.79189682006836, -32.48045349121094, -31.16901206970215, -29.857568740844727, -28.546125411987305, -27.234682083129883, -25.92323875427246, -24.61179542541504, -23.30035400390625, -21.988910675048828, -20.677467346191406, -19.366024017333984, -18.054580688476562, -16.74313735961914, -15.431694030761719, -14.120251655578613, -12.808808326721191, -11.49736499786377, -10.185922622680664, -8.874479293823242, -7.56303596496582, -6.251592636108398, -4.940149784088135, -3.628706693649292, -2.317263603210449, -1.0058202743530273, 0.30562257766723633, 1.6170654296875, 2.928508758544922, 4.239952087402344, 5.551394939422607, 6.862837791442871, 8.174281120300293, 9.485724449157715, 10.79716682434082, 12.108610153198242, 13.420053482055664, 14.731496810913086, 16.042940139770508, 17.35438346862793, 18.66582489013672, 19.97726821899414, 21.288711547851562, 22.600154876708984, 23.911598205566406, 25.223041534423828, 26.53448486328125, 27.845928192138672, 29.157371520996094, 30.468814849853516, 31.780256271362305, 33.091697692871094, 34.40314483642578, 35.7145881652832, 37.026031494140625, 38.33747482299805, 39.64891815185547, 40.96036148071289, 42.27180480957031, 43.58324432373047, 44.89468765258789]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 10.0, 13.0, 16.0, 36.0, 43.0, 51.0, 75.0, 93.0, 152.0, 229.0, 344.0, 515.0, 815.0, 1304.0, 2242.0, 3992.0, 7345.0, 14355.0, 30250.0, 75843.0, 283201.0, 3110895.0, 482156.0, 103925.0, 38615.0, 17406.0, 8870.0, 4608.0, 2619.0, 1511.0, 920.0, 581.0, 371.0, 233.0, 182.0, 131.0, 107.0, 63.0, 65.0, 25.0, 23.0, 13.0, 14.0, 8.0, 8.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-9.5859375, -9.2730712890625, -8.960205078125, -8.6473388671875, -8.33447265625, -8.0216064453125, -7.708740234375, -7.3958740234375, -7.0830078125, -6.7701416015625, -6.457275390625, -6.1444091796875, -5.83154296875, -5.5186767578125, -5.205810546875, -4.8929443359375, -4.580078125, -4.2672119140625, -3.954345703125, -3.6414794921875, -3.32861328125, -3.0157470703125, -2.702880859375, -2.3900146484375, -2.0771484375, -1.7642822265625, -1.451416015625, -1.1385498046875, -0.82568359375, -0.5128173828125, -0.199951171875, 0.1129150390625, 0.42578125, 0.7386474609375, 1.051513671875, 1.3643798828125, 1.67724609375, 1.9901123046875, 2.302978515625, 2.6158447265625, 2.9287109375, 3.2415771484375, 3.554443359375, 3.8673095703125, 4.18017578125, 4.4930419921875, 4.805908203125, 5.1187744140625, 5.431640625, 5.7445068359375, 6.057373046875, 6.3702392578125, 6.68310546875, 6.9959716796875, 7.308837890625, 7.6217041015625, 7.9345703125, 8.2474365234375, 8.560302734375, 8.8731689453125, 9.18603515625, 9.4989013671875, 9.811767578125, 10.1246337890625, 10.4375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 3.0, 6.0, 6.0, 9.0, 7.0, 14.0, 13.0, 15.0, 16.0, 17.0, 20.0, 21.0, 33.0, 31.0, 17.0, 33.0, 35.0, 44.0, 46.0, 50.0, 41.0, 40.0, 46.0, 33.0, 36.0, 42.0, 41.0, 39.0, 38.0, 32.0, 26.0, 16.0, 26.0, 17.0, 17.0, 12.0, 13.0, 8.0, 14.0, 7.0, 7.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7373046875, -1.6784820556640625, -1.619659423828125, -1.5608367919921875, -1.50201416015625, -1.4431915283203125, -1.384368896484375, -1.3255462646484375, -1.2667236328125, -1.2079010009765625, -1.149078369140625, -1.0902557373046875, -1.03143310546875, -0.9726104736328125, -0.913787841796875, -0.8549652099609375, -0.796142578125, -0.7373199462890625, -0.678497314453125, -0.6196746826171875, -0.56085205078125, -0.5020294189453125, -0.443206787109375, -0.3843841552734375, -0.3255615234375, -0.2667388916015625, -0.207916259765625, -0.1490936279296875, -0.09027099609375, -0.0314483642578125, 0.027374267578125, 0.0861968994140625, 0.14501953125, 0.2038421630859375, 0.262664794921875, 0.3214874267578125, 0.38031005859375, 0.4391326904296875, 0.497955322265625, 0.5567779541015625, 0.6156005859375, 0.6744232177734375, 0.733245849609375, 0.7920684814453125, 0.85089111328125, 0.9097137451171875, 0.968536376953125, 1.0273590087890625, 1.086181640625, 1.1450042724609375, 1.203826904296875, 1.2626495361328125, 1.32147216796875, 1.3802947998046875, 1.439117431640625, 1.4979400634765625, 1.5567626953125, 1.6155853271484375, 1.674407958984375, 1.7332305908203125, 1.79205322265625, 1.8508758544921875, 1.909698486328125, 1.9685211181640625, 2.02734375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 7.0, 12.0, 15.0, 20.0, 20.0, 40.0, 62.0, 79.0, 127.0, 226.0, 406.0, 666.0, 1295.0, 2579.0, 5912.0, 14761.0, 44486.0, 187146.0, 3037822.0, 751534.0, 100591.0, 27884.0, 10058.0, 4203.0, 1981.0, 955.0, 532.0, 326.0, 190.0, 129.0, 57.0, 40.0, 28.0, 25.0, 15.0, 8.0, 9.0, 7.0, 9.0, 6.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-15.8046875, -15.337158203125, -14.86962890625, -14.402099609375, -13.9345703125, -13.467041015625, -12.99951171875, -12.531982421875, -12.064453125, -11.596923828125, -11.12939453125, -10.661865234375, -10.1943359375, -9.726806640625, -9.25927734375, -8.791748046875, -8.32421875, -7.856689453125, -7.38916015625, -6.921630859375, -6.4541015625, -5.986572265625, -5.51904296875, -5.051513671875, -4.583984375, -4.116455078125, -3.64892578125, -3.181396484375, -2.7138671875, -2.246337890625, -1.77880859375, -1.311279296875, -0.84375, -0.376220703125, 0.09130859375, 0.558837890625, 1.0263671875, 1.493896484375, 1.96142578125, 2.428955078125, 2.896484375, 3.364013671875, 3.83154296875, 4.299072265625, 4.7666015625, 5.234130859375, 5.70166015625, 6.169189453125, 6.63671875, 7.104248046875, 7.57177734375, 8.039306640625, 8.5068359375, 8.974365234375, 9.44189453125, 9.909423828125, 10.376953125, 10.844482421875, 11.31201171875, 11.779541015625, 12.2470703125, 12.714599609375, 13.18212890625, 13.649658203125, 14.1171875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 3.0, 3.0, 5.0, 8.0, 16.0, 23.0, 41.0, 56.0, 75.0, 207.0, 420.0, 1914.0, 744.0, 250.0, 124.0, 71.0, 51.0, 23.0, 11.0, 6.0, 5.0, 6.0, 4.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1953125, -7.919189453125, -7.64306640625, -7.366943359375, -7.0908203125, -6.814697265625, -6.53857421875, -6.262451171875, -5.986328125, -5.710205078125, -5.43408203125, -5.157958984375, -4.8818359375, -4.605712890625, -4.32958984375, -4.053466796875, -3.77734375, -3.501220703125, -3.22509765625, -2.948974609375, -2.6728515625, -2.396728515625, -2.12060546875, -1.844482421875, -1.568359375, -1.292236328125, -1.01611328125, -0.739990234375, -0.4638671875, -0.187744140625, 0.08837890625, 0.364501953125, 0.640625, 0.916748046875, 1.19287109375, 1.468994140625, 1.7451171875, 2.021240234375, 2.29736328125, 2.573486328125, 2.849609375, 3.125732421875, 3.40185546875, 3.677978515625, 3.9541015625, 4.230224609375, 4.50634765625, 4.782470703125, 5.05859375, 5.334716796875, 5.61083984375, 5.886962890625, 6.1630859375, 6.439208984375, 6.71533203125, 6.991455078125, 7.267578125, 7.543701171875, 7.81982421875, 8.095947265625, 8.3720703125, 8.648193359375, 8.92431640625, 9.200439453125, 9.4765625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 10.0, 13.0, 25.0, 63.0, 95.0, 158.0, 157.0, 178.0, 123.0, 83.0, 37.0, 27.0, 19.0, 7.0, 7.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.59715270996094, -70.021728515625, -68.44630432128906, -66.87088775634766, -65.29546356201172, -63.72003936767578, -62.144615173339844, -60.56919479370117, -58.9937744140625, -57.41835021972656, -55.84292984008789, -54.26750564575195, -52.69208526611328, -51.116661071777344, -49.541236877441406, -47.965816497802734, -46.3903923034668, -44.81496810913086, -43.23954772949219, -41.66412353515625, -40.08870315551758, -38.51327896118164, -36.93785858154297, -35.36243438720703, -33.787010192871094, -32.211585998535156, -30.636165618896484, -29.060741424560547, -27.485321044921875, -25.909896850585938, -24.334474563598633, -22.759052276611328, -21.18362808227539, -19.608205795288086, -18.03278350830078, -16.457359313964844, -14.881937980651855, -13.30651569366455, -11.73109245300293, -10.155670166015625, -8.58024787902832, -7.004825592041016, -5.429402828216553, -3.85398006439209, -2.278557777404785, -0.7031354904174805, 0.8722877502441406, 2.4477100372314453, 4.02313232421875, 5.598554611206055, 7.173977375030518, 8.74940013885498, 10.324822425842285, 11.90024471282959, 13.475667953491211, 15.051090240478516, 16.62651252746582, 18.201934814453125, 19.77735710144043, 21.352779388427734, 22.928203582763672, 24.503623962402344, 26.07904815673828, 27.654470443725586, 29.22989273071289]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 5.0, 7.0, 8.0, 6.0, 13.0, 13.0, 23.0, 20.0, 20.0, 33.0, 29.0, 34.0, 30.0, 47.0, 27.0, 37.0, 40.0, 43.0, 48.0, 39.0, 44.0, 40.0, 39.0, 36.0, 38.0, 33.0, 36.0, 27.0, 33.0, 30.0, 19.0, 25.0, 22.0, 13.0, 9.0, 6.0, 4.0, 6.0, 7.0, 3.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.841022491455078, -21.221738815307617, -20.602455139160156, -19.983171463012695, -19.363887786865234, -18.74460220336914, -18.125320434570312, -17.50603485107422, -16.886751174926758, -16.267467498779297, -15.648183822631836, -15.028900146484375, -14.409615516662598, -13.790331840515137, -13.171048164367676, -12.551763534545898, -11.932480812072754, -11.313197135925293, -10.693913459777832, -10.074628829956055, -9.455345153808594, -8.836061477661133, -8.216777801513672, -7.597493648529053, -6.978209972381592, -6.358926296234131, -5.739642143249512, -5.120358467102051, -4.50107479095459, -3.8817906379699707, -3.2625069618225098, -2.6432228088378906, -2.0239391326904297, -1.4046552181243896, -0.7853714227676392, -0.16608762741088867, 0.45319628715515137, 1.0724802017211914, 1.6917638778686523, 2.3110480308532715, 2.9303317070007324, 3.5496156215667725, 4.1688995361328125, 4.788183212280273, 5.407466888427734, 6.0267510414123535, 6.6460347175598145, 7.265318870544434, 7.8846025466918945, 8.503886222839355, 9.123169898986816, 9.742454528808594, 10.361738204956055, 10.981021881103516, 11.600305557250977, 12.219589233398438, 12.838872909545898, 13.45815658569336, 14.07744026184082, 14.696723937988281, 15.316008567810059, 15.93529224395752, 16.554576873779297, 17.173860549926758, 17.79314422607422]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 4.0, 3.0, 5.0, 17.0, 19.0, 31.0, 47.0, 51.0, 85.0, 122.0, 186.0, 326.0, 601.0, 931.0, 1860.0, 3381.0, 6575.0, 13111.0, 25407.0, 49644.0, 96124.0, 202157.0, 307143.0, 169636.0, 82529.0, 42941.0, 22064.0, 11242.0, 5516.0, 2997.0, 1560.0, 861.0, 501.0, 316.0, 195.0, 124.0, 64.0, 66.0, 42.0, 30.0, 13.0, 11.0, 9.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.80859375, -6.60467529296875, -6.4007568359375, -6.19683837890625, -5.992919921875, -5.78900146484375, -5.5850830078125, -5.38116455078125, -5.17724609375, -4.97332763671875, -4.7694091796875, -4.56549072265625, -4.361572265625, -4.15765380859375, -3.9537353515625, -3.74981689453125, -3.5458984375, -3.34197998046875, -3.1380615234375, -2.93414306640625, -2.730224609375, -2.52630615234375, -2.3223876953125, -2.11846923828125, -1.91455078125, -1.71063232421875, -1.5067138671875, -1.30279541015625, -1.098876953125, -0.89495849609375, -0.6910400390625, -0.48712158203125, -0.283203125, -0.07928466796875, 0.1246337890625, 0.32855224609375, 0.532470703125, 0.73638916015625, 0.9403076171875, 1.14422607421875, 1.34814453125, 1.55206298828125, 1.7559814453125, 1.95989990234375, 2.163818359375, 2.36773681640625, 2.5716552734375, 2.77557373046875, 2.9794921875, 3.18341064453125, 3.3873291015625, 3.59124755859375, 3.795166015625, 3.99908447265625, 4.2030029296875, 4.40692138671875, 4.61083984375, 4.81475830078125, 5.0186767578125, 5.22259521484375, 5.426513671875, 5.63043212890625, 5.8343505859375, 6.03826904296875, 6.2421875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 6.0, 7.0, 5.0, 5.0, 5.0, 6.0, 9.0, 14.0, 12.0, 15.0, 19.0, 15.0, 25.0, 23.0, 29.0, 24.0, 22.0, 40.0, 37.0, 39.0, 39.0, 49.0, 47.0, 33.0, 44.0, 43.0, 40.0, 38.0, 37.0, 31.0, 29.0, 28.0, 21.0, 20.0, 19.0, 20.0, 14.0, 18.0, 16.0, 16.0, 13.0, 8.0, 5.0, 8.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9228515625, -1.8573455810546875, -1.791839599609375, -1.7263336181640625, -1.66082763671875, -1.5953216552734375, -1.529815673828125, -1.4643096923828125, -1.3988037109375, -1.3332977294921875, -1.267791748046875, -1.2022857666015625, -1.13677978515625, -1.0712738037109375, -1.005767822265625, -0.9402618408203125, -0.874755859375, -0.8092498779296875, -0.743743896484375, -0.6782379150390625, -0.61273193359375, -0.5472259521484375, -0.481719970703125, -0.4162139892578125, -0.3507080078125, -0.2852020263671875, -0.219696044921875, -0.1541900634765625, -0.08868408203125, -0.0231781005859375, 0.042327880859375, 0.1078338623046875, 0.17333984375, 0.2388458251953125, 0.304351806640625, 0.3698577880859375, 0.43536376953125, 0.5008697509765625, 0.566375732421875, 0.6318817138671875, 0.6973876953125, 0.7628936767578125, 0.828399658203125, 0.8939056396484375, 0.95941162109375, 1.0249176025390625, 1.090423583984375, 1.1559295654296875, 1.221435546875, 1.2869415283203125, 1.352447509765625, 1.4179534912109375, 1.48345947265625, 1.5489654541015625, 1.614471435546875, 1.6799774169921875, 1.7454833984375, 1.8109893798828125, 1.876495361328125, 1.9420013427734375, 2.00750732421875, 2.0730133056640625, 2.138519287109375, 2.2040252685546875, 2.26953125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 3.0, 4.0, 10.0, 10.0, 12.0, 25.0, 27.0, 41.0, 65.0, 83.0, 122.0, 196.0, 265.0, 401.0, 620.0, 1132.0, 2611.0, 9482.0, 44951.0, 239279.0, 613387.0, 105577.0, 21060.0, 4971.0, 1759.0, 895.0, 530.0, 315.0, 232.0, 123.0, 114.0, 67.0, 47.0, 39.0, 36.0, 16.0, 12.0, 12.0, 7.0, 8.0, 5.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.8359375, -15.373779296875, -14.91162109375, -14.449462890625, -13.9873046875, -13.525146484375, -13.06298828125, -12.600830078125, -12.138671875, -11.676513671875, -11.21435546875, -10.752197265625, -10.2900390625, -9.827880859375, -9.36572265625, -8.903564453125, -8.44140625, -7.979248046875, -7.51708984375, -7.054931640625, -6.5927734375, -6.130615234375, -5.66845703125, -5.206298828125, -4.744140625, -4.281982421875, -3.81982421875, -3.357666015625, -2.8955078125, -2.433349609375, -1.97119140625, -1.509033203125, -1.046875, -0.584716796875, -0.12255859375, 0.339599609375, 0.8017578125, 1.263916015625, 1.72607421875, 2.188232421875, 2.650390625, 3.112548828125, 3.57470703125, 4.036865234375, 4.4990234375, 4.961181640625, 5.42333984375, 5.885498046875, 6.34765625, 6.809814453125, 7.27197265625, 7.734130859375, 8.1962890625, 8.658447265625, 9.12060546875, 9.582763671875, 10.044921875, 10.507080078125, 10.96923828125, 11.431396484375, 11.8935546875, 12.355712890625, 12.81787109375, 13.280029296875, 13.7421875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 3.0, 10.0, 4.0, 6.0, 5.0, 6.0, 12.0, 17.0, 16.0, 14.0, 24.0, 27.0, 27.0, 29.0, 26.0, 31.0, 47.0, 35.0, 52.0, 45.0, 59.0, 47.0, 40.0, 59.0, 46.0, 45.0, 30.0, 35.0, 37.0, 20.0, 26.0, 18.0, 19.0, 18.0, 17.0, 10.0, 11.0, 9.0, 4.0, 4.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7734375, -11.4031982421875, -11.032958984375, -10.6627197265625, -10.29248046875, -9.9222412109375, -9.552001953125, -9.1817626953125, -8.8115234375, -8.4412841796875, -8.071044921875, -7.7008056640625, -7.33056640625, -6.9603271484375, -6.590087890625, -6.2198486328125, -5.849609375, -5.4793701171875, -5.109130859375, -4.7388916015625, -4.36865234375, -3.9984130859375, -3.628173828125, -3.2579345703125, -2.8876953125, -2.5174560546875, -2.147216796875, -1.7769775390625, -1.40673828125, -1.0364990234375, -0.666259765625, -0.2960205078125, 0.07421875, 0.4444580078125, 0.814697265625, 1.1849365234375, 1.55517578125, 1.9254150390625, 2.295654296875, 2.6658935546875, 3.0361328125, 3.4063720703125, 3.776611328125, 4.1468505859375, 4.51708984375, 4.8873291015625, 5.257568359375, 5.6278076171875, 5.998046875, 6.3682861328125, 6.738525390625, 7.1087646484375, 7.47900390625, 7.8492431640625, 8.219482421875, 8.5897216796875, 8.9599609375, 9.3302001953125, 9.700439453125, 10.0706787109375, 10.44091796875, 10.8111572265625, 11.181396484375, 11.5516357421875, 11.921875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 9.0, 3.0, 19.0, 26.0, 29.0, 77.0, 129.0, 291.0, 802.0, 3533.0, 30199.0, 538656.0, 443897.0, 26386.0, 3178.0, 780.0, 256.0, 126.0, 76.0, 34.0, 26.0, 12.0, 9.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6875, -14.2420654296875, -13.796630859375, -13.3511962890625, -12.90576171875, -12.4603271484375, -12.014892578125, -11.5694580078125, -11.1240234375, -10.6785888671875, -10.233154296875, -9.7877197265625, -9.34228515625, -8.8968505859375, -8.451416015625, -8.0059814453125, -7.560546875, -7.1151123046875, -6.669677734375, -6.2242431640625, -5.77880859375, -5.3333740234375, -4.887939453125, -4.4425048828125, -3.9970703125, -3.5516357421875, -3.106201171875, -2.6607666015625, -2.21533203125, -1.7698974609375, -1.324462890625, -0.8790283203125, -0.43359375, 0.0118408203125, 0.457275390625, 0.9027099609375, 1.34814453125, 1.7935791015625, 2.239013671875, 2.6844482421875, 3.1298828125, 3.5753173828125, 4.020751953125, 4.4661865234375, 4.91162109375, 5.3570556640625, 5.802490234375, 6.2479248046875, 6.693359375, 7.1387939453125, 7.584228515625, 8.0296630859375, 8.47509765625, 8.9205322265625, 9.365966796875, 9.8114013671875, 10.2568359375, 10.7022705078125, 11.147705078125, 11.5931396484375, 12.03857421875, 12.4840087890625, 12.929443359375, 13.3748779296875, 13.8203125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 8.0, 5.0, 7.0, 8.0, 8.0, 9.0, 9.0, 13.0, 18.0, 23.0, 38.0, 38.0, 47.0, 56.0, 83.0, 171.0, 128.0, 67.0, 62.0, 35.0, 30.0, 22.0, 28.0, 12.0, 11.0, 15.0, 10.0, 8.0, 6.0, 7.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0014581680297851562, -0.001412123441696167, -0.0013660788536071777, -0.0013200342655181885, -0.0012739896774291992, -0.00122794508934021, -0.0011819005012512207, -0.0011358559131622314, -0.0010898113250732422, -0.001043766736984253, -0.0009977221488952637, -0.0009516775608062744, -0.0009056329727172852, -0.0008595883846282959, -0.0008135437965393066, -0.0007674992084503174, -0.0007214546203613281, -0.0006754100322723389, -0.0006293654441833496, -0.0005833208560943604, -0.0005372762680053711, -0.0004912316799163818, -0.0004451870918273926, -0.0003991425037384033, -0.00035309791564941406, -0.0003070533275604248, -0.00026100873947143555, -0.0002149641513824463, -0.00016891956329345703, -0.00012287497520446777, -7.683038711547852e-05, -3.078579902648926e-05, 1.52587890625e-05, 6.130337715148926e-05, 0.00010734796524047852, 0.00015339255332946777, 0.00019943714141845703, 0.0002454817295074463, 0.00029152631759643555, 0.0003375709056854248, 0.00038361549377441406, 0.0004296600818634033, 0.0004757046699523926, 0.0005217492580413818, 0.0005677938461303711, 0.0006138384342193604, 0.0006598830223083496, 0.0007059276103973389, 0.0007519721984863281, 0.0007980167865753174, 0.0008440613746643066, 0.0008901059627532959, 0.0009361505508422852, 0.0009821951389312744, 0.0010282397270202637, 0.001074284315109253, 0.0011203289031982422, 0.0011663734912872314, 0.0012124180793762207, 0.00125846266746521, 0.0013045072555541992, 0.0013505518436431885, 0.0013965964317321777, 0.001442641019821167, 0.0014886856079101562]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 7.0, 4.0, 2.0, 6.0, 18.0, 23.0, 46.0, 71.0, 165.0, 280.0, 593.0, 1538.0, 4909.0, 30195.0, 356121.0, 592996.0, 51380.0, 6868.0, 1905.0, 699.0, 311.0, 185.0, 89.0, 54.0, 30.0, 14.0, 13.0, 14.0, 5.0, 5.0, 7.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-13.4296875, -13.0472412109375, -12.664794921875, -12.2823486328125, -11.89990234375, -11.5174560546875, -11.135009765625, -10.7525634765625, -10.3701171875, -9.9876708984375, -9.605224609375, -9.2227783203125, -8.84033203125, -8.4578857421875, -8.075439453125, -7.6929931640625, -7.310546875, -6.9281005859375, -6.545654296875, -6.1632080078125, -5.78076171875, -5.3983154296875, -5.015869140625, -4.6334228515625, -4.2509765625, -3.8685302734375, -3.486083984375, -3.1036376953125, -2.72119140625, -2.3387451171875, -1.956298828125, -1.5738525390625, -1.19140625, -0.8089599609375, -0.426513671875, -0.0440673828125, 0.33837890625, 0.7208251953125, 1.103271484375, 1.4857177734375, 1.8681640625, 2.2506103515625, 2.633056640625, 3.0155029296875, 3.39794921875, 3.7803955078125, 4.162841796875, 4.5452880859375, 4.927734375, 5.3101806640625, 5.692626953125, 6.0750732421875, 6.45751953125, 6.8399658203125, 7.222412109375, 7.6048583984375, 7.9873046875, 8.3697509765625, 8.752197265625, 9.1346435546875, 9.51708984375, 9.8995361328125, 10.281982421875, 10.6644287109375, 11.046875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 13.0, 17.0, 21.0, 35.0, 50.0, 77.0, 118.0, 197.0, 175.0, 99.0, 74.0, 49.0, 35.0, 17.0, 14.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.34375, -15.9793701171875, -15.614990234375, -15.2506103515625, -14.88623046875, -14.5218505859375, -14.157470703125, -13.7930908203125, -13.4287109375, -13.0643310546875, -12.699951171875, -12.3355712890625, -11.97119140625, -11.6068115234375, -11.242431640625, -10.8780517578125, -10.513671875, -10.1492919921875, -9.784912109375, -9.4205322265625, -9.05615234375, -8.6917724609375, -8.327392578125, -7.9630126953125, -7.5986328125, -7.2342529296875, -6.869873046875, -6.5054931640625, -6.14111328125, -5.7767333984375, -5.412353515625, -5.0479736328125, -4.68359375, -4.3192138671875, -3.954833984375, -3.5904541015625, -3.22607421875, -2.8616943359375, -2.497314453125, -2.1329345703125, -1.7685546875, -1.4041748046875, -1.039794921875, -0.6754150390625, -0.31103515625, 0.0533447265625, 0.417724609375, 0.7821044921875, 1.146484375, 1.5108642578125, 1.875244140625, 2.2396240234375, 2.60400390625, 2.9683837890625, 3.332763671875, 3.6971435546875, 4.0615234375, 4.4259033203125, 4.790283203125, 5.1546630859375, 5.51904296875, 5.8834228515625, 6.247802734375, 6.6121826171875, 6.9765625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 13.0, 27.0, 84.0, 154.0, 212.0, 215.0, 131.0, 100.0, 39.0, 17.0, 8.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-197.71441650390625, -192.6486053466797, -187.5828094482422, -182.51699829101562, -177.45120239257812, -172.38539123535156, -167.319580078125, -162.2537841796875, -157.18797302246094, -152.12216186523438, -147.05636596679688, -141.9905548095703, -136.92474365234375, -131.85894775390625, -126.79313659667969, -121.72733306884766, -116.66152954101562, -111.5957260131836, -106.52992248535156, -101.464111328125, -96.39830780029297, -91.33250427246094, -86.26669311523438, -81.20088958740234, -76.13508605957031, -71.06928253173828, -66.00347900390625, -60.93766784667969, -55.871864318847656, -50.806060791015625, -45.74025344848633, -40.67444610595703, -35.60865783691406, -30.5428524017334, -25.477046966552734, -20.41124153137207, -15.345436096191406, -10.279630661010742, -5.213825225830078, -0.14801788330078125, 4.91778564453125, 9.983591079711914, 15.049396514892578, 20.115201950073242, 25.181007385253906, 30.24681282043457, 35.312618255615234, 40.37842559814453, 45.44422912597656, 50.510032653808594, 55.57583999633789, 60.64164733886719, 65.70745086669922, 70.77325439453125, 75.83906555175781, 80.90486907958984, 85.97067260742188, 91.0364761352539, 96.10227966308594, 101.1680908203125, 106.23389434814453, 111.29969787597656, 116.36550903320312, 121.43131256103516, 126.49711608886719]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 7.0, 5.0, 5.0, 5.0, 3.0, 14.0, 8.0, 14.0, 8.0, 18.0, 25.0, 30.0, 22.0, 33.0, 39.0, 49.0, 44.0, 45.0, 46.0, 51.0, 61.0, 60.0, 43.0, 47.0, 42.0, 33.0, 34.0, 31.0, 29.0, 24.0, 22.0, 15.0, 13.0, 16.0, 12.0, 12.0, 12.0, 8.0, 3.0, 6.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-71.30590057373047, -69.27350616455078, -67.2411117553711, -65.20870971679688, -63.17631530761719, -61.1439208984375, -59.11152648925781, -57.07912826538086, -55.046730041503906, -53.01433563232422, -50.981937408447266, -48.94954299926758, -46.917144775390625, -44.88475036621094, -42.85235595703125, -40.8199577331543, -38.78756332397461, -36.75516891479492, -34.72277069091797, -32.69037628173828, -30.657978057861328, -28.62558364868164, -26.59318733215332, -24.560791015625, -22.52839469909668, -20.49599838256836, -18.46360206604004, -16.43120574951172, -14.398810386657715, -12.366414070129395, -10.33401870727539, -8.30162239074707, -6.26922607421875, -4.23682975769043, -2.2044339179992676, -0.17203807830810547, 1.8603582382202148, 3.892754554748535, 5.925149917602539, 7.957546234130859, 9.98994255065918, 12.0223388671875, 14.05473518371582, 16.08713150024414, 18.119525909423828, 20.15192413330078, 22.18431854248047, 24.21671485900879, 26.24911117553711, 28.28150749206543, 30.31390380859375, 32.34629821777344, 34.37869644165039, 36.41109085083008, 38.44348907470703, 40.47588348388672, 42.508277893066406, 44.540672302246094, 46.57307052612305, 48.605464935302734, 50.63786315917969, 52.670257568359375, 54.70265197753906, 56.735050201416016, 58.76744842529297]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 16.0, 13.0, 18.0, 30.0, 61.0, 85.0, 130.0, 210.0, 340.0, 529.0, 888.0, 1568.0, 2611.0, 4840.0, 9131.0, 19459.0, 45080.0, 129848.0, 597254.0, 2884427.0, 339157.0, 91628.0, 34440.0, 15155.0, 7601.0, 4051.0, 2336.0, 1356.0, 790.0, 475.0, 286.0, 167.0, 106.0, 72.0, 47.0, 29.0, 23.0, 9.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5703125, -9.2744140625, -8.978515625, -8.6826171875, -8.38671875, -8.0908203125, -7.794921875, -7.4990234375, -7.203125, -6.9072265625, -6.611328125, -6.3154296875, -6.01953125, -5.7236328125, -5.427734375, -5.1318359375, -4.8359375, -4.5400390625, -4.244140625, -3.9482421875, -3.65234375, -3.3564453125, -3.060546875, -2.7646484375, -2.46875, -2.1728515625, -1.876953125, -1.5810546875, -1.28515625, -0.9892578125, -0.693359375, -0.3974609375, -0.1015625, 0.1943359375, 0.490234375, 0.7861328125, 1.08203125, 1.3779296875, 1.673828125, 1.9697265625, 2.265625, 2.5615234375, 2.857421875, 3.1533203125, 3.44921875, 3.7451171875, 4.041015625, 4.3369140625, 4.6328125, 4.9287109375, 5.224609375, 5.5205078125, 5.81640625, 6.1123046875, 6.408203125, 6.7041015625, 7.0, 7.2958984375, 7.591796875, 7.8876953125, 8.18359375, 8.4794921875, 8.775390625, 9.0712890625, 9.3671875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 2.0, 7.0, 0.0, 6.0, 4.0, 7.0, 17.0, 7.0, 14.0, 18.0, 26.0, 33.0, 32.0, 29.0, 34.0, 37.0, 48.0, 47.0, 53.0, 36.0, 54.0, 54.0, 51.0, 50.0, 34.0, 37.0, 37.0, 33.0, 28.0, 26.0, 22.0, 30.0, 15.0, 16.0, 17.0, 10.0, 9.0, 5.0, 6.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.564453125, -2.4813232421875, -2.398193359375, -2.3150634765625, -2.23193359375, -2.1488037109375, -2.065673828125, -1.9825439453125, -1.8994140625, -1.8162841796875, -1.733154296875, -1.6500244140625, -1.56689453125, -1.4837646484375, -1.400634765625, -1.3175048828125, -1.234375, -1.1512451171875, -1.068115234375, -0.9849853515625, -0.90185546875, -0.8187255859375, -0.735595703125, -0.6524658203125, -0.5693359375, -0.4862060546875, -0.403076171875, -0.3199462890625, -0.23681640625, -0.1536865234375, -0.070556640625, 0.0125732421875, 0.095703125, 0.1788330078125, 0.261962890625, 0.3450927734375, 0.42822265625, 0.5113525390625, 0.594482421875, 0.6776123046875, 0.7607421875, 0.8438720703125, 0.927001953125, 1.0101318359375, 1.09326171875, 1.1763916015625, 1.259521484375, 1.3426513671875, 1.42578125, 1.5089111328125, 1.592041015625, 1.6751708984375, 1.75830078125, 1.8414306640625, 1.924560546875, 2.0076904296875, 2.0908203125, 2.1739501953125, 2.257080078125, 2.3402099609375, 2.42333984375, 2.5064697265625, 2.589599609375, 2.6727294921875, 2.755859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 5.0, 9.0, 9.0, 7.0, 9.0, 4.0, 24.0, 28.0, 30.0, 46.0, 48.0, 88.0, 138.0, 269.0, 444.0, 775.0, 1614.0, 3527.0, 8050.0, 21729.0, 69191.0, 313545.0, 2925886.0, 678899.0, 116160.0, 32800.0, 11533.0, 4813.0, 2093.0, 1091.0, 554.0, 313.0, 177.0, 117.0, 69.0, 57.0, 37.0, 33.0, 14.0, 13.0, 9.0, 3.0, 8.0, 2.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.203125, -12.7584228515625, -12.313720703125, -11.8690185546875, -11.42431640625, -10.9796142578125, -10.534912109375, -10.0902099609375, -9.6455078125, -9.2008056640625, -8.756103515625, -8.3114013671875, -7.86669921875, -7.4219970703125, -6.977294921875, -6.5325927734375, -6.087890625, -5.6431884765625, -5.198486328125, -4.7537841796875, -4.30908203125, -3.8643798828125, -3.419677734375, -2.9749755859375, -2.5302734375, -2.0855712890625, -1.640869140625, -1.1961669921875, -0.75146484375, -0.3067626953125, 0.137939453125, 0.5826416015625, 1.02734375, 1.4720458984375, 1.916748046875, 2.3614501953125, 2.80615234375, 3.2508544921875, 3.695556640625, 4.1402587890625, 4.5849609375, 5.0296630859375, 5.474365234375, 5.9190673828125, 6.36376953125, 6.8084716796875, 7.253173828125, 7.6978759765625, 8.142578125, 8.5872802734375, 9.031982421875, 9.4766845703125, 9.92138671875, 10.3660888671875, 10.810791015625, 11.2554931640625, 11.7001953125, 12.1448974609375, 12.589599609375, 13.0343017578125, 13.47900390625, 13.9237060546875, 14.368408203125, 14.8131103515625, 15.2578125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 6.0, 4.0, 3.0, 11.0, 14.0, 26.0, 33.0, 57.0, 69.0, 124.0, 210.0, 422.0, 1123.0, 1008.0, 421.0, 219.0, 114.0, 74.0, 45.0, 35.0, 13.0, 16.0, 8.0, 6.0, 4.0, 4.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.4296875, -11.136474609375, -10.84326171875, -10.550048828125, -10.2568359375, -9.963623046875, -9.67041015625, -9.377197265625, -9.083984375, -8.790771484375, -8.49755859375, -8.204345703125, -7.9111328125, -7.617919921875, -7.32470703125, -7.031494140625, -6.73828125, -6.445068359375, -6.15185546875, -5.858642578125, -5.5654296875, -5.272216796875, -4.97900390625, -4.685791015625, -4.392578125, -4.099365234375, -3.80615234375, -3.512939453125, -3.2197265625, -2.926513671875, -2.63330078125, -2.340087890625, -2.046875, -1.753662109375, -1.46044921875, -1.167236328125, -0.8740234375, -0.580810546875, -0.28759765625, 0.005615234375, 0.298828125, 0.592041015625, 0.88525390625, 1.178466796875, 1.4716796875, 1.764892578125, 2.05810546875, 2.351318359375, 2.64453125, 2.937744140625, 3.23095703125, 3.524169921875, 3.8173828125, 4.110595703125, 4.40380859375, 4.697021484375, 4.990234375, 5.283447265625, 5.57666015625, 5.869873046875, 6.1630859375, 6.456298828125, 6.74951171875, 7.042724609375, 7.3359375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 16.0, 23.0, 61.0, 95.0, 142.0, 156.0, 162.0, 134.0, 93.0, 61.0, 21.0, 25.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-112.36250305175781, -109.89006805419922, -107.4176254272461, -104.9451904296875, -102.47274780273438, -100.00031280517578, -97.52787017822266, -95.05543518066406, -92.58299255371094, -90.11055755615234, -87.63811492919922, -85.16567993164062, -82.6932373046875, -80.2208023071289, -77.74835968017578, -75.27592468261719, -72.8034896850586, -70.3310546875, -67.85861206054688, -65.38617706298828, -62.913734436035156, -60.44129943847656, -57.9688606262207, -55.496421813964844, -53.023983001708984, -50.551544189453125, -48.079105377197266, -45.606666564941406, -43.13423156738281, -40.66178894042969, -38.189353942871094, -35.716915130615234, -33.24448013305664, -30.77204132080078, -28.299602508544922, -25.827165603637695, -23.354726791381836, -20.882287979125977, -18.40985107421875, -15.93741226196289, -13.464973449707031, -10.992534637451172, -8.520096778869629, -6.047658443450928, -3.5752201080322266, -1.1027812957763672, 1.3696565628051758, 3.8420944213867188, 6.314533233642578, 8.786972045898438, 11.25940990447998, 13.731847763061523, 16.204286575317383, 18.676725387573242, 21.14916229248047, 23.621601104736328, 26.094039916992188, 28.566478729248047, 31.038917541503906, 33.511356353759766, 35.983795166015625, 38.45623016357422, 40.92866897583008, 43.40110778808594, 45.8735466003418]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 8.0, 7.0, 13.0, 9.0, 12.0, 13.0, 20.0, 19.0, 20.0, 27.0, 29.0, 42.0, 49.0, 40.0, 52.0, 44.0, 53.0, 54.0, 58.0, 51.0, 50.0, 43.0, 48.0, 31.0, 29.0, 33.0, 18.0, 22.0, 24.0, 8.0, 20.0, 8.0, 12.0, 14.0, 5.0, 4.0, 7.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.21209716796875, -29.196584701538086, -28.181072235107422, -27.165557861328125, -26.15004539489746, -25.134532928466797, -24.1190185546875, -23.103506088256836, -22.087993621826172, -21.072481155395508, -20.056968688964844, -19.041454315185547, -18.025941848754883, -17.01042938232422, -15.994915962219238, -14.979402542114258, -13.963890075683594, -12.94837760925293, -11.93286418914795, -10.917350769042969, -9.901838302612305, -8.88632583618164, -7.87081241607666, -6.855299472808838, -5.839786529541016, -4.824273586273193, -3.808760643005371, -2.793247699737549, -1.7777347564697266, -0.7622218132019043, 0.25329113006591797, 1.2688040733337402, 2.284313201904297, 3.299826145172119, 4.315339088439941, 5.330852031707764, 6.346364974975586, 7.361877918243408, 8.37739086151123, 9.392904281616211, 10.408416748046875, 11.423929214477539, 12.43944263458252, 13.4549560546875, 14.470468521118164, 15.485980987548828, 16.501495361328125, 17.51700782775879, 18.532520294189453, 19.548032760620117, 20.56354522705078, 21.579059600830078, 22.594572067260742, 23.610084533691406, 24.625598907470703, 25.641111373901367, 26.65662384033203, 27.672136306762695, 28.68764877319336, 29.703163146972656, 30.71867561340332, 31.734188079833984, 32.74970245361328, 33.76521301269531, 34.78072738647461]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 8.0, 13.0, 23.0, 23.0, 32.0, 44.0, 62.0, 144.0, 209.0, 335.0, 540.0, 950.0, 1763.0, 3404.0, 6639.0, 13181.0, 27698.0, 57743.0, 117048.0, 207540.0, 253154.0, 175692.0, 93066.0, 45461.0, 21798.0, 10631.0, 5277.0, 2708.0, 1355.0, 807.0, 435.0, 280.0, 167.0, 98.0, 71.0, 44.0, 32.0, 33.0, 11.0, 6.0, 15.0, 4.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.0078125, -6.8037109375, -6.599609375, -6.3955078125, -6.19140625, -5.9873046875, -5.783203125, -5.5791015625, -5.375, -5.1708984375, -4.966796875, -4.7626953125, -4.55859375, -4.3544921875, -4.150390625, -3.9462890625, -3.7421875, -3.5380859375, -3.333984375, -3.1298828125, -2.92578125, -2.7216796875, -2.517578125, -2.3134765625, -2.109375, -1.9052734375, -1.701171875, -1.4970703125, -1.29296875, -1.0888671875, -0.884765625, -0.6806640625, -0.4765625, -0.2724609375, -0.068359375, 0.1357421875, 0.33984375, 0.5439453125, 0.748046875, 0.9521484375, 1.15625, 1.3603515625, 1.564453125, 1.7685546875, 1.97265625, 2.1767578125, 2.380859375, 2.5849609375, 2.7890625, 2.9931640625, 3.197265625, 3.4013671875, 3.60546875, 3.8095703125, 4.013671875, 4.2177734375, 4.421875, 4.6259765625, 4.830078125, 5.0341796875, 5.23828125, 5.4423828125, 5.646484375, 5.8505859375, 6.0546875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 5.0, 3.0, 12.0, 12.0, 10.0, 15.0, 17.0, 15.0, 25.0, 17.0, 25.0, 36.0, 37.0, 31.0, 44.0, 45.0, 49.0, 25.0, 44.0, 41.0, 50.0, 35.0, 51.0, 42.0, 47.0, 38.0, 28.0, 31.0, 22.0, 21.0, 22.0, 21.0, 22.0, 12.0, 10.0, 14.0, 6.0, 6.0, 4.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.623046875, -2.53741455078125, -2.4517822265625, -2.36614990234375, -2.280517578125, -2.19488525390625, -2.1092529296875, -2.02362060546875, -1.93798828125, -1.85235595703125, -1.7667236328125, -1.68109130859375, -1.595458984375, -1.50982666015625, -1.4241943359375, -1.33856201171875, -1.2529296875, -1.16729736328125, -1.0816650390625, -0.99603271484375, -0.910400390625, -0.82476806640625, -0.7391357421875, -0.65350341796875, -0.56787109375, -0.48223876953125, -0.3966064453125, -0.31097412109375, -0.225341796875, -0.13970947265625, -0.0540771484375, 0.03155517578125, 0.1171875, 0.20281982421875, 0.2884521484375, 0.37408447265625, 0.459716796875, 0.54534912109375, 0.6309814453125, 0.71661376953125, 0.80224609375, 0.88787841796875, 0.9735107421875, 1.05914306640625, 1.144775390625, 1.23040771484375, 1.3160400390625, 1.40167236328125, 1.4873046875, 1.57293701171875, 1.6585693359375, 1.74420166015625, 1.829833984375, 1.91546630859375, 2.0010986328125, 2.08673095703125, 2.17236328125, 2.25799560546875, 2.3436279296875, 2.42926025390625, 2.514892578125, 2.60052490234375, 2.6861572265625, 2.77178955078125, 2.857421875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 0.0, 10.0, 10.0, 18.0, 18.0, 40.0, 36.0, 58.0, 79.0, 116.0, 131.0, 175.0, 267.0, 356.0, 483.0, 731.0, 1388.0, 3303.0, 12009.0, 58390.0, 284644.0, 502277.0, 143920.0, 28221.0, 6538.0, 2157.0, 1036.0, 642.0, 422.0, 258.0, 214.0, 147.0, 126.0, 87.0, 62.0, 46.0, 35.0, 27.0, 23.0, 9.0, 19.0, 8.0, 5.0, 7.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.15625, -12.735595703125, -12.31494140625, -11.894287109375, -11.4736328125, -11.052978515625, -10.63232421875, -10.211669921875, -9.791015625, -9.370361328125, -8.94970703125, -8.529052734375, -8.1083984375, -7.687744140625, -7.26708984375, -6.846435546875, -6.42578125, -6.005126953125, -5.58447265625, -5.163818359375, -4.7431640625, -4.322509765625, -3.90185546875, -3.481201171875, -3.060546875, -2.639892578125, -2.21923828125, -1.798583984375, -1.3779296875, -0.957275390625, -0.53662109375, -0.115966796875, 0.3046875, 0.725341796875, 1.14599609375, 1.566650390625, 1.9873046875, 2.407958984375, 2.82861328125, 3.249267578125, 3.669921875, 4.090576171875, 4.51123046875, 4.931884765625, 5.3525390625, 5.773193359375, 6.19384765625, 6.614501953125, 7.03515625, 7.455810546875, 7.87646484375, 8.297119140625, 8.7177734375, 9.138427734375, 9.55908203125, 9.979736328125, 10.400390625, 10.821044921875, 11.24169921875, 11.662353515625, 12.0830078125, 12.503662109375, 12.92431640625, 13.344970703125, 13.765625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 11.0, 4.0, 11.0, 17.0, 9.0, 24.0, 24.0, 17.0, 33.0, 32.0, 34.0, 38.0, 47.0, 41.0, 50.0, 56.0, 51.0, 43.0, 56.0, 52.0, 42.0, 41.0, 36.0, 31.0, 38.0, 34.0, 25.0, 21.0, 16.0, 17.0, 7.0, 8.0, 8.0, 7.0, 8.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.90625, -14.390380859375, -13.87451171875, -13.358642578125, -12.8427734375, -12.326904296875, -11.81103515625, -11.295166015625, -10.779296875, -10.263427734375, -9.74755859375, -9.231689453125, -8.7158203125, -8.199951171875, -7.68408203125, -7.168212890625, -6.65234375, -6.136474609375, -5.62060546875, -5.104736328125, -4.5888671875, -4.072998046875, -3.55712890625, -3.041259765625, -2.525390625, -2.009521484375, -1.49365234375, -0.977783203125, -0.4619140625, 0.053955078125, 0.56982421875, 1.085693359375, 1.6015625, 2.117431640625, 2.63330078125, 3.149169921875, 3.6650390625, 4.180908203125, 4.69677734375, 5.212646484375, 5.728515625, 6.244384765625, 6.76025390625, 7.276123046875, 7.7919921875, 8.307861328125, 8.82373046875, 9.339599609375, 9.85546875, 10.371337890625, 10.88720703125, 11.403076171875, 11.9189453125, 12.434814453125, 12.95068359375, 13.466552734375, 13.982421875, 14.498291015625, 15.01416015625, 15.530029296875, 16.0458984375, 16.561767578125, 17.07763671875, 17.593505859375, 18.109375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 4.0, 1.0, 3.0, 18.0, 16.0, 27.0, 37.0, 87.0, 143.0, 231.0, 474.0, 966.0, 2503.0, 6771.0, 23278.0, 95399.0, 389372.0, 396480.0, 97517.0, 23682.0, 6977.0, 2463.0, 1023.0, 500.0, 241.0, 127.0, 79.0, 40.0, 27.0, 16.0, 25.0, 4.0, 2.0, 5.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.203125, -6.9708251953125, -6.738525390625, -6.5062255859375, -6.27392578125, -6.0416259765625, -5.809326171875, -5.5770263671875, -5.3447265625, -5.1124267578125, -4.880126953125, -4.6478271484375, -4.41552734375, -4.1832275390625, -3.950927734375, -3.7186279296875, -3.486328125, -3.2540283203125, -3.021728515625, -2.7894287109375, -2.55712890625, -2.3248291015625, -2.092529296875, -1.8602294921875, -1.6279296875, -1.3956298828125, -1.163330078125, -0.9310302734375, -0.69873046875, -0.4664306640625, -0.234130859375, -0.0018310546875, 0.23046875, 0.4627685546875, 0.695068359375, 0.9273681640625, 1.15966796875, 1.3919677734375, 1.624267578125, 1.8565673828125, 2.0888671875, 2.3211669921875, 2.553466796875, 2.7857666015625, 3.01806640625, 3.2503662109375, 3.482666015625, 3.7149658203125, 3.947265625, 4.1795654296875, 4.411865234375, 4.6441650390625, 4.87646484375, 5.1087646484375, 5.341064453125, 5.5733642578125, 5.8056640625, 6.0379638671875, 6.270263671875, 6.5025634765625, 6.73486328125, 6.9671630859375, 7.199462890625, 7.4317626953125, 7.6640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 7.0, 7.0, 5.0, 7.0, 8.0, 15.0, 28.0, 20.0, 38.0, 49.0, 52.0, 70.0, 90.0, 108.0, 101.0, 80.0, 65.0, 52.0, 39.0, 36.0, 20.0, 18.0, 20.0, 15.0, 10.0, 10.0, 5.0, 5.0, 4.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001617431640625, -0.001573324203491211, -0.0015292167663574219, -0.0014851093292236328, -0.0014410018920898438, -0.0013968944549560547, -0.0013527870178222656, -0.0013086795806884766, -0.0012645721435546875, -0.0012204647064208984, -0.0011763572692871094, -0.0011322498321533203, -0.0010881423950195312, -0.0010440349578857422, -0.0009999275207519531, -0.0009558200836181641, -0.000911712646484375, -0.0008676052093505859, -0.0008234977722167969, -0.0007793903350830078, -0.0007352828979492188, -0.0006911754608154297, -0.0006470680236816406, -0.0006029605865478516, -0.0005588531494140625, -0.0005147457122802734, -0.0004706382751464844, -0.0004265308380126953, -0.00038242340087890625, -0.0003383159637451172, -0.0002942085266113281, -0.00025010108947753906, -0.00020599365234375, -0.00016188621520996094, -0.00011777877807617188, -7.367134094238281e-05, -2.956390380859375e-05, 1.4543533325195312e-05, 5.8650970458984375e-05, 0.00010275840759277344, 0.0001468658447265625, 0.00019097328186035156, 0.00023508071899414062, 0.0002791881561279297, 0.00032329559326171875, 0.0003674030303955078, 0.0004115104675292969, 0.00045561790466308594, 0.000499725341796875, 0.0005438327789306641, 0.0005879402160644531, 0.0006320476531982422, 0.0006761550903320312, 0.0007202625274658203, 0.0007643699645996094, 0.0008084774017333984, 0.0008525848388671875, 0.0008966922760009766, 0.0009407997131347656, 0.0009849071502685547, 0.0010290145874023438, 0.0010731220245361328, 0.0011172294616699219, 0.001161336898803711, 0.0012054443359375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 9.0, 5.0, 22.0, 24.0, 49.0, 64.0, 102.0, 183.0, 355.0, 684.0, 1526.0, 3981.0, 13879.0, 79851.0, 492514.0, 382502.0, 55992.0, 10840.0, 3262.0, 1306.0, 639.0, 334.0, 183.0, 105.0, 45.0, 40.0, 25.0, 13.0, 7.0, 4.0, 4.0, 7.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.3984375, -12.10260009765625, -11.8067626953125, -11.51092529296875, -11.215087890625, -10.91925048828125, -10.6234130859375, -10.32757568359375, -10.03173828125, -9.73590087890625, -9.4400634765625, -9.14422607421875, -8.848388671875, -8.55255126953125, -8.2567138671875, -7.96087646484375, -7.6650390625, -7.36920166015625, -7.0733642578125, -6.77752685546875, -6.481689453125, -6.18585205078125, -5.8900146484375, -5.59417724609375, -5.29833984375, -5.00250244140625, -4.7066650390625, -4.41082763671875, -4.114990234375, -3.81915283203125, -3.5233154296875, -3.22747802734375, -2.931640625, -2.63580322265625, -2.3399658203125, -2.04412841796875, -1.748291015625, -1.45245361328125, -1.1566162109375, -0.86077880859375, -0.56494140625, -0.26910400390625, 0.0267333984375, 0.32257080078125, 0.618408203125, 0.91424560546875, 1.2100830078125, 1.50592041015625, 1.8017578125, 2.09759521484375, 2.3934326171875, 2.68927001953125, 2.985107421875, 3.28094482421875, 3.5767822265625, 3.87261962890625, 4.16845703125, 4.46429443359375, 4.7601318359375, 5.05596923828125, 5.351806640625, 5.64764404296875, 5.9434814453125, 6.23931884765625, 6.53515625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 9.0, 3.0, 6.0, 14.0, 14.0, 23.0, 20.0, 32.0, 42.0, 54.0, 70.0, 85.0, 75.0, 97.0, 84.0, 75.0, 66.0, 57.0, 43.0, 31.0, 23.0, 23.0, 18.0, 11.0, 4.0, 9.0, 3.0, 5.0, 4.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.76953125, -6.5552978515625, -6.341064453125, -6.1268310546875, -5.91259765625, -5.6983642578125, -5.484130859375, -5.2698974609375, -5.0556640625, -4.8414306640625, -4.627197265625, -4.4129638671875, -4.19873046875, -3.9844970703125, -3.770263671875, -3.5560302734375, -3.341796875, -3.1275634765625, -2.913330078125, -2.6990966796875, -2.48486328125, -2.2706298828125, -2.056396484375, -1.8421630859375, -1.6279296875, -1.4136962890625, -1.199462890625, -0.9852294921875, -0.77099609375, -0.5567626953125, -0.342529296875, -0.1282958984375, 0.0859375, 0.3001708984375, 0.514404296875, 0.7286376953125, 0.94287109375, 1.1571044921875, 1.371337890625, 1.5855712890625, 1.7998046875, 2.0140380859375, 2.228271484375, 2.4425048828125, 2.65673828125, 2.8709716796875, 3.085205078125, 3.2994384765625, 3.513671875, 3.7279052734375, 3.942138671875, 4.1563720703125, 4.37060546875, 4.5848388671875, 4.799072265625, 5.0133056640625, 5.2275390625, 5.4417724609375, 5.656005859375, 5.8702392578125, 6.08447265625, 6.2987060546875, 6.512939453125, 6.7271728515625, 6.94140625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 11.0, 52.0, 134.0, 265.0, 285.0, 183.0, 63.0, 14.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.51481628417969, -77.73580169677734, -69.956787109375, -62.177764892578125, -54.39875030517578, -46.61973571777344, -38.84071731567383, -31.06169891357422, -23.282684326171875, -15.503667831420898, -7.724651336669922, 0.05436515808105469, 7.833381652832031, 15.612396240234375, 23.391414642333984, 31.170433044433594, 38.94944763183594, 46.72846221923828, 54.50748062133789, 62.2864990234375, 70.06551361083984, 77.84452819824219, 85.62355041503906, 93.4025650024414, 101.18157958984375, 108.9605941772461, 116.73960876464844, 124.51863098144531, 132.29763793945312, 140.07666015625, 147.85568237304688, 155.63470458984375, 163.41372680664062, 171.1927490234375, 178.9717559814453, 186.7507781982422, 194.52978515625, 202.30880737304688, 210.08782958984375, 217.86685180664062, 225.64585876464844, 233.4248809814453, 241.20388793945312, 248.98291015625, 256.7619323730469, 264.54095458984375, 272.3199462890625, 280.0989685058594, 287.87799072265625, 295.6570129394531, 303.43603515625, 311.21502685546875, 318.9940490722656, 326.7730712890625, 334.5520935058594, 342.33111572265625, 350.110107421875, 357.8891296386719, 365.66815185546875, 373.4471435546875, 381.2261657714844, 389.00518798828125, 396.7842102050781, 404.563232421875, 412.3422546386719]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 15.0, 6.0, 1.0, 9.0, 7.0, 15.0, 15.0, 26.0, 27.0, 21.0, 25.0, 21.0, 38.0, 37.0, 32.0, 37.0, 46.0, 39.0, 45.0, 41.0, 46.0, 40.0, 46.0, 44.0, 41.0, 34.0, 25.0, 28.0, 31.0, 22.0, 26.0, 19.0, 14.0, 15.0, 13.0, 7.0, 10.0, 6.0, 4.0, 12.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-75.42803192138672, -73.17888641357422, -70.92974090576172, -68.68059539794922, -66.43144989013672, -64.18230438232422, -61.93315887451172, -59.68401336669922, -57.43486785888672, -55.18572235107422, -52.93657684326172, -50.68743133544922, -48.43828582763672, -46.18914031982422, -43.93999481201172, -41.69084930419922, -39.44170379638672, -37.19255828857422, -34.94341278076172, -32.69426727294922, -30.44512176513672, -28.19597625732422, -25.94683074951172, -23.69768524169922, -21.44853973388672, -19.19939422607422, -16.95024871826172, -14.701103210449219, -12.451957702636719, -10.202812194824219, -7.953666687011719, -5.704521179199219, -3.4553680419921875, -1.2062225341796875, 1.0429229736328125, 3.2920684814453125, 5.5412139892578125, 7.7903594970703125, 10.039505004882812, 12.288650512695312, 14.537796020507812, 16.786941528320312, 19.036087036132812, 21.285232543945312, 23.534378051757812, 25.783523559570312, 28.032669067382812, 30.281814575195312, 32.53096008300781, 34.78010559082031, 37.02925109863281, 39.27839660644531, 41.52754211425781, 43.77668762207031, 46.02583312988281, 48.27497863769531, 50.52412414550781, 52.77326965332031, 55.02241516113281, 57.27156066894531, 59.52070617675781, 61.76985168457031, 64.01899719238281, 66.26814270019531, 68.51728820800781]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 4.0, 9.0, 12.0, 11.0, 14.0, 25.0, 31.0, 43.0, 51.0, 77.0, 99.0, 140.0, 201.0, 272.0, 471.0, 763.0, 1571.0, 3519.0, 11404.0, 59580.0, 3973914.0, 116502.0, 16327.0, 4893.0, 1842.0, 889.0, 509.0, 336.0, 204.0, 146.0, 114.0, 77.0, 55.0, 40.0, 40.0, 21.0, 28.0, 9.0, 8.0, 9.0, 8.0, 5.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.953125, -26.21728515625, -25.4814453125, -24.74560546875, -24.009765625, -23.27392578125, -22.5380859375, -21.80224609375, -21.06640625, -20.33056640625, -19.5947265625, -18.85888671875, -18.123046875, -17.38720703125, -16.6513671875, -15.91552734375, -15.1796875, -14.44384765625, -13.7080078125, -12.97216796875, -12.236328125, -11.50048828125, -10.7646484375, -10.02880859375, -9.29296875, -8.55712890625, -7.8212890625, -7.08544921875, -6.349609375, -5.61376953125, -4.8779296875, -4.14208984375, -3.40625, -2.67041015625, -1.9345703125, -1.19873046875, -0.462890625, 0.27294921875, 1.0087890625, 1.74462890625, 2.48046875, 3.21630859375, 3.9521484375, 4.68798828125, 5.423828125, 6.15966796875, 6.8955078125, 7.63134765625, 8.3671875, 9.10302734375, 9.8388671875, 10.57470703125, 11.310546875, 12.04638671875, 12.7822265625, 13.51806640625, 14.25390625, 14.98974609375, 15.7255859375, 16.46142578125, 17.197265625, 17.93310546875, 18.6689453125, 19.40478515625, 20.140625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 2.0, 8.0, 9.0, 4.0, 11.0, 11.0, 19.0, 21.0, 24.0, 26.0, 36.0, 38.0, 37.0, 34.0, 45.0, 43.0, 54.0, 48.0, 52.0, 53.0, 54.0, 41.0, 43.0, 49.0, 38.0, 33.0, 32.0, 23.0, 21.0, 14.0, 19.0, 12.0, 10.0, 7.0, 10.0, 9.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.568359375, -3.461517333984375, -3.35467529296875, -3.247833251953125, -3.1409912109375, -3.034149169921875, -2.92730712890625, -2.820465087890625, -2.713623046875, -2.606781005859375, -2.49993896484375, -2.393096923828125, -2.2862548828125, -2.179412841796875, -2.07257080078125, -1.965728759765625, -1.85888671875, -1.752044677734375, -1.64520263671875, -1.538360595703125, -1.4315185546875, -1.324676513671875, -1.21783447265625, -1.110992431640625, -1.004150390625, -0.897308349609375, -0.79046630859375, -0.683624267578125, -0.5767822265625, -0.469940185546875, -0.36309814453125, -0.256256103515625, -0.1494140625, -0.042572021484375, 0.06427001953125, 0.171112060546875, 0.2779541015625, 0.384796142578125, 0.49163818359375, 0.598480224609375, 0.705322265625, 0.812164306640625, 0.91900634765625, 1.025848388671875, 1.1326904296875, 1.239532470703125, 1.34637451171875, 1.453216552734375, 1.56005859375, 1.666900634765625, 1.77374267578125, 1.880584716796875, 1.9874267578125, 2.094268798828125, 2.20111083984375, 2.307952880859375, 2.414794921875, 2.521636962890625, 2.62847900390625, 2.735321044921875, 2.8421630859375, 2.949005126953125, 3.05584716796875, 3.162689208984375, 3.26953125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 9.0, 3.0, 9.0, 18.0, 17.0, 15.0, 26.0, 23.0, 46.0, 56.0, 60.0, 76.0, 99.0, 126.0, 197.0, 295.0, 454.0, 763.0, 1590.0, 4322.0, 17598.0, 294830.0, 3830291.0, 32341.0, 6222.0, 2096.0, 943.0, 532.0, 321.0, 223.0, 157.0, 114.0, 84.0, 65.0, 66.0, 54.0, 36.0, 28.0, 22.0, 14.0, 10.0, 5.0, 9.0, 6.0, 4.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0], "bins": [-35.15625, -34.126953125, -33.09765625, -32.068359375, -31.0390625, -30.009765625, -28.98046875, -27.951171875, -26.921875, -25.892578125, -24.86328125, -23.833984375, -22.8046875, -21.775390625, -20.74609375, -19.716796875, -18.6875, -17.658203125, -16.62890625, -15.599609375, -14.5703125, -13.541015625, -12.51171875, -11.482421875, -10.453125, -9.423828125, -8.39453125, -7.365234375, -6.3359375, -5.306640625, -4.27734375, -3.248046875, -2.21875, -1.189453125, -0.16015625, 0.869140625, 1.8984375, 2.927734375, 3.95703125, 4.986328125, 6.015625, 7.044921875, 8.07421875, 9.103515625, 10.1328125, 11.162109375, 12.19140625, 13.220703125, 14.25, 15.279296875, 16.30859375, 17.337890625, 18.3671875, 19.396484375, 20.42578125, 21.455078125, 22.484375, 23.513671875, 24.54296875, 25.572265625, 26.6015625, 27.630859375, 28.66015625, 29.689453125, 30.71875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 3.0, 10.0, 12.0, 18.0, 25.0, 60.0, 183.0, 3081.0, 470.0, 121.0, 43.0, 21.0, 17.0, 3.0, 5.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9140625, -5.6929931640625, -5.471923828125, -5.2508544921875, -5.02978515625, -4.8087158203125, -4.587646484375, -4.3665771484375, -4.1455078125, -3.9244384765625, -3.703369140625, -3.4822998046875, -3.26123046875, -3.0401611328125, -2.819091796875, -2.5980224609375, -2.376953125, -2.1558837890625, -1.934814453125, -1.7137451171875, -1.49267578125, -1.2716064453125, -1.050537109375, -0.8294677734375, -0.6083984375, -0.3873291015625, -0.166259765625, 0.0548095703125, 0.27587890625, 0.4969482421875, 0.718017578125, 0.9390869140625, 1.16015625, 1.3812255859375, 1.602294921875, 1.8233642578125, 2.04443359375, 2.2655029296875, 2.486572265625, 2.7076416015625, 2.9287109375, 3.1497802734375, 3.370849609375, 3.5919189453125, 3.81298828125, 4.0340576171875, 4.255126953125, 4.4761962890625, 4.697265625, 4.9183349609375, 5.139404296875, 5.3604736328125, 5.58154296875, 5.8026123046875, 6.023681640625, 6.2447509765625, 6.4658203125, 6.6868896484375, 6.907958984375, 7.1290283203125, 7.35009765625, 7.5711669921875, 7.792236328125, 8.0133056640625, 8.234375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 5.0, 8.0, 17.0, 30.0, 40.0, 52.0, 51.0, 76.0, 102.0, 109.0, 104.0, 106.0, 78.0, 68.0, 48.0, 33.0, 27.0, 12.0, 7.0, 6.0, 5.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.941688537597656, -23.32851219177246, -22.7153377532959, -22.102161407470703, -21.488985061645508, -20.875808715820312, -20.26263427734375, -19.649457931518555, -19.03628158569336, -18.423105239868164, -17.8099308013916, -17.196754455566406, -16.58357810974121, -15.970402717590332, -15.357227325439453, -14.744050979614258, -14.130876541137695, -13.517701148986816, -12.904524803161621, -12.291349411010742, -11.678173065185547, -11.064997673034668, -10.451822280883789, -9.838645935058594, -9.225470542907715, -8.612295150756836, -7.999118804931641, -7.385943412780762, -6.772767543792725, -6.1595916748046875, -5.546416282653809, -4.9332404136657715, -4.320063591003418, -3.706887722015381, -3.093712091445923, -2.480536460876465, -1.8673605918884277, -1.2541847229003906, -0.6410090923309326, -0.02783346176147461, 0.5853424072265625, 1.19851815700531, 1.8116939067840576, 2.4248695373535156, 3.0380454063415527, 3.65122127532959, 4.264396667480469, 4.877572536468506, 5.490748405456543, 6.10392427444458, 6.717100143432617, 7.330275535583496, 7.943451404571533, 8.55662727355957, 9.16980266571045, 9.782978057861328, 10.396154403686523, 11.009329795837402, 11.622506141662598, 12.235681533813477, 12.848857879638672, 13.46203327178955, 14.07520866394043, 14.688385009765625, 15.301560401916504]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 10.0, 9.0, 12.0, 13.0, 11.0, 15.0, 9.0, 17.0, 13.0, 29.0, 27.0, 26.0, 22.0, 28.0, 39.0, 37.0, 30.0, 39.0, 48.0, 53.0, 38.0, 52.0, 43.0, 48.0, 39.0, 34.0, 32.0, 22.0, 12.0, 25.0, 26.0, 17.0, 16.0, 13.0, 14.0, 15.0, 15.0, 9.0, 11.0, 7.0, 4.0, 10.0, 4.0, 2.0, 0.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.920077323913574, -8.625224113464355, -8.330370903015137, -8.035517692565918, -7.740664482116699, -7.4458112716674805, -7.1509575843811035, -6.856104373931885, -6.561251163482666, -6.266397953033447, -5.9715447425842285, -5.67669153213501, -5.381837844848633, -5.086984634399414, -4.792131423950195, -4.497278213500977, -4.202425003051758, -3.907571792602539, -3.6127185821533203, -3.3178651332855225, -3.0230119228363037, -2.728158712387085, -2.433305263519287, -2.1384520530700684, -1.8435988426208496, -1.5487456321716309, -1.2538923025131226, -0.959039032459259, -0.6641857624053955, -0.36933255195617676, -0.07447922229766846, 0.22037410736083984, 0.5152263641357422, 0.8100796341896057, 1.1049329042434692, 1.3997862339019775, 1.6946394443511963, 1.989492654800415, 2.284346103668213, 2.5791993141174316, 2.8740525245666504, 3.168905735015869, 3.463758945465088, 3.7586123943328857, 4.053465843200684, 4.348319053649902, 4.643172264099121, 4.93802547454834, 5.232878684997559, 5.527731895446777, 5.822585105895996, 6.117438316345215, 6.412291526794434, 6.707144737243652, 7.001998424530029, 7.296851634979248, 7.591704845428467, 7.8865580558776855, 8.181411743164062, 8.476264953613281, 8.7711181640625, 9.065971374511719, 9.360824584960938, 9.655677795410156, 9.950531005859375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 6.0, 6.0, 6.0, 13.0, 18.0, 25.0, 29.0, 58.0, 83.0, 125.0, 261.0, 493.0, 1004.0, 2061.0, 4325.0, 9075.0, 19438.0, 41704.0, 87775.0, 170552.0, 251189.0, 219023.0, 125549.0, 61558.0, 28603.0, 13426.0, 6230.0, 2925.0, 1456.0, 680.0, 383.0, 184.0, 117.0, 60.0, 43.0, 18.0, 21.0, 13.0, 8.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.078125, -7.83880615234375, -7.5994873046875, -7.36016845703125, -7.120849609375, -6.88153076171875, -6.6422119140625, -6.40289306640625, -6.16357421875, -5.92425537109375, -5.6849365234375, -5.44561767578125, -5.206298828125, -4.96697998046875, -4.7276611328125, -4.48834228515625, -4.2490234375, -4.00970458984375, -3.7703857421875, -3.53106689453125, -3.291748046875, -3.05242919921875, -2.8131103515625, -2.57379150390625, -2.33447265625, -2.09515380859375, -1.8558349609375, -1.61651611328125, -1.377197265625, -1.13787841796875, -0.8985595703125, -0.65924072265625, -0.419921875, -0.18060302734375, 0.0587158203125, 0.29803466796875, 0.537353515625, 0.77667236328125, 1.0159912109375, 1.25531005859375, 1.49462890625, 1.73394775390625, 1.9732666015625, 2.21258544921875, 2.451904296875, 2.69122314453125, 2.9305419921875, 3.16986083984375, 3.4091796875, 3.64849853515625, 3.8878173828125, 4.12713623046875, 4.366455078125, 4.60577392578125, 4.8450927734375, 5.08441162109375, 5.32373046875, 5.56304931640625, 5.8023681640625, 6.04168701171875, 6.281005859375, 6.52032470703125, 6.7596435546875, 6.99896240234375, 7.23828125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 1.0, 0.0, 3.0, 4.0, 11.0, 8.0, 9.0, 13.0, 11.0, 16.0, 10.0, 29.0, 35.0, 31.0, 29.0, 29.0, 40.0, 35.0, 44.0, 39.0, 40.0, 41.0, 42.0, 37.0, 49.0, 39.0, 46.0, 44.0, 32.0, 31.0, 33.0, 31.0, 23.0, 16.0, 16.0, 16.0, 18.0, 11.0, 11.0, 8.0, 3.0, 6.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.482421875, -3.374176025390625, -3.26593017578125, -3.157684326171875, -3.0494384765625, -2.941192626953125, -2.83294677734375, -2.724700927734375, -2.616455078125, -2.508209228515625, -2.39996337890625, -2.291717529296875, -2.1834716796875, -2.075225830078125, -1.96697998046875, -1.858734130859375, -1.75048828125, -1.642242431640625, -1.53399658203125, -1.425750732421875, -1.3175048828125, -1.209259033203125, -1.10101318359375, -0.992767333984375, -0.884521484375, -0.776275634765625, -0.66802978515625, -0.559783935546875, -0.4515380859375, -0.343292236328125, -0.23504638671875, -0.126800537109375, -0.0185546875, 0.089691162109375, 0.19793701171875, 0.306182861328125, 0.4144287109375, 0.522674560546875, 0.63092041015625, 0.739166259765625, 0.847412109375, 0.955657958984375, 1.06390380859375, 1.172149658203125, 1.2803955078125, 1.388641357421875, 1.49688720703125, 1.605133056640625, 1.71337890625, 1.821624755859375, 1.92987060546875, 2.038116455078125, 2.1463623046875, 2.254608154296875, 2.36285400390625, 2.471099853515625, 2.579345703125, 2.687591552734375, 2.79583740234375, 2.904083251953125, 3.0123291015625, 3.120574951171875, 3.22882080078125, 3.337066650390625, 3.4453125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 7.0, 11.0, 10.0, 12.0, 22.0, 32.0, 41.0, 57.0, 75.0, 102.0, 132.0, 181.0, 268.0, 355.0, 626.0, 984.0, 1876.0, 4551.0, 13814.0, 57179.0, 276899.0, 511842.0, 135830.0, 28735.0, 8037.0, 2954.0, 1375.0, 815.0, 517.0, 330.0, 257.0, 174.0, 120.0, 95.0, 74.0, 41.0, 38.0, 23.0, 19.0, 8.0, 15.0, 12.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.515625, -15.04931640625, -14.5830078125, -14.11669921875, -13.650390625, -13.18408203125, -12.7177734375, -12.25146484375, -11.78515625, -11.31884765625, -10.8525390625, -10.38623046875, -9.919921875, -9.45361328125, -8.9873046875, -8.52099609375, -8.0546875, -7.58837890625, -7.1220703125, -6.65576171875, -6.189453125, -5.72314453125, -5.2568359375, -4.79052734375, -4.32421875, -3.85791015625, -3.3916015625, -2.92529296875, -2.458984375, -1.99267578125, -1.5263671875, -1.06005859375, -0.59375, -0.12744140625, 0.3388671875, 0.80517578125, 1.271484375, 1.73779296875, 2.2041015625, 2.67041015625, 3.13671875, 3.60302734375, 4.0693359375, 4.53564453125, 5.001953125, 5.46826171875, 5.9345703125, 6.40087890625, 6.8671875, 7.33349609375, 7.7998046875, 8.26611328125, 8.732421875, 9.19873046875, 9.6650390625, 10.13134765625, 10.59765625, 11.06396484375, 11.5302734375, 11.99658203125, 12.462890625, 12.92919921875, 13.3955078125, 13.86181640625, 14.328125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 7.0, 6.0, 6.0, 10.0, 10.0, 15.0, 22.0, 24.0, 19.0, 32.0, 31.0, 37.0, 31.0, 29.0, 28.0, 48.0, 35.0, 42.0, 47.0, 49.0, 40.0, 41.0, 38.0, 32.0, 31.0, 38.0, 28.0, 35.0, 15.0, 25.0, 25.0, 15.0, 15.0, 20.0, 8.0, 10.0, 11.0, 9.0, 5.0, 6.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.5, -15.971923828125, -15.44384765625, -14.915771484375, -14.3876953125, -13.859619140625, -13.33154296875, -12.803466796875, -12.275390625, -11.747314453125, -11.21923828125, -10.691162109375, -10.1630859375, -9.635009765625, -9.10693359375, -8.578857421875, -8.05078125, -7.522705078125, -6.99462890625, -6.466552734375, -5.9384765625, -5.410400390625, -4.88232421875, -4.354248046875, -3.826171875, -3.298095703125, -2.77001953125, -2.241943359375, -1.7138671875, -1.185791015625, -0.65771484375, -0.129638671875, 0.3984375, 0.926513671875, 1.45458984375, 1.982666015625, 2.5107421875, 3.038818359375, 3.56689453125, 4.094970703125, 4.623046875, 5.151123046875, 5.67919921875, 6.207275390625, 6.7353515625, 7.263427734375, 7.79150390625, 8.319580078125, 8.84765625, 9.375732421875, 9.90380859375, 10.431884765625, 10.9599609375, 11.488037109375, 12.01611328125, 12.544189453125, 13.072265625, 13.600341796875, 14.12841796875, 14.656494140625, 15.1845703125, 15.712646484375, 16.24072265625, 16.768798828125, 17.296875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 3.0, 13.0, 10.0, 10.0, 17.0, 28.0, 41.0, 58.0, 99.0, 128.0, 177.0, 325.0, 626.0, 1185.0, 2518.0, 7180.0, 49333.0, 777467.0, 188745.0, 13361.0, 3718.0, 1574.0, 800.0, 436.0, 221.0, 166.0, 102.0, 70.0, 36.0, 29.0, 25.0, 11.0, 12.0, 5.0, 10.0, 1.0, 3.0, 3.0, 0.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.90625, -20.32080078125, -19.7353515625, -19.14990234375, -18.564453125, -17.97900390625, -17.3935546875, -16.80810546875, -16.22265625, -15.63720703125, -15.0517578125, -14.46630859375, -13.880859375, -13.29541015625, -12.7099609375, -12.12451171875, -11.5390625, -10.95361328125, -10.3681640625, -9.78271484375, -9.197265625, -8.61181640625, -8.0263671875, -7.44091796875, -6.85546875, -6.27001953125, -5.6845703125, -5.09912109375, -4.513671875, -3.92822265625, -3.3427734375, -2.75732421875, -2.171875, -1.58642578125, -1.0009765625, -0.41552734375, 0.169921875, 0.75537109375, 1.3408203125, 1.92626953125, 2.51171875, 3.09716796875, 3.6826171875, 4.26806640625, 4.853515625, 5.43896484375, 6.0244140625, 6.60986328125, 7.1953125, 7.78076171875, 8.3662109375, 8.95166015625, 9.537109375, 10.12255859375, 10.7080078125, 11.29345703125, 11.87890625, 12.46435546875, 13.0498046875, 13.63525390625, 14.220703125, 14.80615234375, 15.3916015625, 15.97705078125, 16.5625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 7.0, 7.0, 21.0, 23.0, 30.0, 71.0, 108.0, 133.0, 127.0, 139.0, 102.0, 71.0, 50.0, 35.0, 27.0, 16.0, 11.0, 9.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.002315521240234375, -0.0022370517253875732, -0.0021585822105407715, -0.0020801126956939697, -0.002001643180847168, -0.0019231736660003662, -0.0018447041511535645, -0.0017662346363067627, -0.001687765121459961, -0.0016092956066131592, -0.0015308260917663574, -0.0014523565769195557, -0.001373887062072754, -0.0012954175472259521, -0.0012169480323791504, -0.0011384785175323486, -0.0010600090026855469, -0.0009815394878387451, -0.0009030699729919434, -0.0008246004581451416, -0.0007461309432983398, -0.0006676614284515381, -0.0005891919136047363, -0.0005107223987579346, -0.0004322528839111328, -0.00035378336906433105, -0.0002753138542175293, -0.00019684433937072754, -0.00011837482452392578, -3.9905309677124023e-05, 3.8564205169677734e-05, 0.00011703372001647949, 0.00019550323486328125, 0.000273972749710083, 0.00035244226455688477, 0.0004309117794036865, 0.0005093812942504883, 0.00058785080909729, 0.0006663203239440918, 0.0007447898387908936, 0.0008232593536376953, 0.0009017288684844971, 0.0009801983833312988, 0.0010586678981781006, 0.0011371374130249023, 0.001215606927871704, 0.0012940764427185059, 0.0013725459575653076, 0.0014510154724121094, 0.0015294849872589111, 0.0016079545021057129, 0.0016864240169525146, 0.0017648935317993164, 0.0018433630466461182, 0.00192183256149292, 0.0020003020763397217, 0.0020787715911865234, 0.002157241106033325, 0.002235710620880127, 0.0023141801357269287, 0.0023926496505737305, 0.0024711191654205322, 0.002549588680267334, 0.0026280581951141357, 0.0027065277099609375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 6.0, 11.0, 12.0, 38.0, 24.0, 49.0, 100.0, 200.0, 465.0, 1581.0, 10054.0, 711876.0, 315473.0, 6645.0, 1244.0, 392.0, 168.0, 89.0, 41.0, 25.0, 16.0, 14.0, 11.0, 8.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.53125, -32.512451171875, -31.49365234375, -30.474853515625, -29.4560546875, -28.437255859375, -27.41845703125, -26.399658203125, -25.380859375, -24.362060546875, -23.34326171875, -22.324462890625, -21.3056640625, -20.286865234375, -19.26806640625, -18.249267578125, -17.23046875, -16.211669921875, -15.19287109375, -14.174072265625, -13.1552734375, -12.136474609375, -11.11767578125, -10.098876953125, -9.080078125, -8.061279296875, -7.04248046875, -6.023681640625, -5.0048828125, -3.986083984375, -2.96728515625, -1.948486328125, -0.9296875, 0.089111328125, 1.10791015625, 2.126708984375, 3.1455078125, 4.164306640625, 5.18310546875, 6.201904296875, 7.220703125, 8.239501953125, 9.25830078125, 10.277099609375, 11.2958984375, 12.314697265625, 13.33349609375, 14.352294921875, 15.37109375, 16.389892578125, 17.40869140625, 18.427490234375, 19.4462890625, 20.465087890625, 21.48388671875, 22.502685546875, 23.521484375, 24.540283203125, 25.55908203125, 26.577880859375, 27.5966796875, 28.615478515625, 29.63427734375, 30.653076171875, 31.671875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 10.0, 21.0, 39.0, 66.0, 140.0, 199.0, 206.0, 126.0, 90.0, 51.0, 19.0, 11.0, 4.0, 8.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-34.9375, -34.224365234375, -33.51123046875, -32.798095703125, -32.0849609375, -31.371826171875, -30.65869140625, -29.945556640625, -29.232421875, -28.519287109375, -27.80615234375, -27.093017578125, -26.3798828125, -25.666748046875, -24.95361328125, -24.240478515625, -23.52734375, -22.814208984375, -22.10107421875, -21.387939453125, -20.6748046875, -19.961669921875, -19.24853515625, -18.535400390625, -17.822265625, -17.109130859375, -16.39599609375, -15.682861328125, -14.9697265625, -14.256591796875, -13.54345703125, -12.830322265625, -12.1171875, -11.404052734375, -10.69091796875, -9.977783203125, -9.2646484375, -8.551513671875, -7.83837890625, -7.125244140625, -6.412109375, -5.698974609375, -4.98583984375, -4.272705078125, -3.5595703125, -2.846435546875, -2.13330078125, -1.420166015625, -0.70703125, 0.006103515625, 0.71923828125, 1.432373046875, 2.1455078125, 2.858642578125, 3.57177734375, 4.284912109375, 4.998046875, 5.711181640625, 6.42431640625, 7.137451171875, 7.8505859375, 8.563720703125, 9.27685546875, 9.989990234375, 10.703125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 7.0, 12.0, 22.0, 27.0, 35.0, 55.0, 86.0, 131.0, 133.0, 116.0, 124.0, 93.0, 57.0, 45.0, 30.0, 9.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-202.27223205566406, -197.50059509277344, -192.7289581298828, -187.9573211669922, -183.18568420410156, -178.41404724121094, -173.6424102783203, -168.8707733154297, -164.09913635253906, -159.32749938964844, -154.5558624267578, -149.7842254638672, -145.01258850097656, -140.24095153808594, -135.4693145751953, -130.6976776123047, -125.9260482788086, -121.15441131591797, -116.38277435302734, -111.61113739013672, -106.8395004272461, -102.06786346435547, -97.29623413085938, -92.52459716796875, -87.75296020507812, -82.9813232421875, -78.20968627929688, -73.43804931640625, -68.66641235351562, -63.894775390625, -59.12314224243164, -54.351505279541016, -49.579864501953125, -44.8082275390625, -40.036590576171875, -35.26495361328125, -30.493318557739258, -25.721681594848633, -20.95004653930664, -16.178409576416016, -11.40677261352539, -6.635136127471924, -1.863499641418457, 2.9081363677978516, 7.679773330688477, 12.451410293579102, 17.223045349121094, 21.99468231201172, 26.766319274902344, 31.53795623779297, 36.309593200683594, 41.08123016357422, 45.852867126464844, 50.62450408935547, 55.39613723754883, 60.16777420043945, 64.93940734863281, 69.71104431152344, 74.48268127441406, 79.25431823730469, 84.02595520019531, 88.79759216308594, 93.56922912597656, 98.34086608886719, 103.11250305175781]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 2.0, 1.0, 5.0, 2.0, 1.0, 5.0, 14.0, 9.0, 13.0, 6.0, 6.0, 12.0, 11.0, 16.0, 14.0, 26.0, 22.0, 31.0, 34.0, 30.0, 28.0, 57.0, 49.0, 46.0, 50.0, 51.0, 26.0, 44.0, 41.0, 28.0, 40.0, 30.0, 34.0, 30.0, 22.0, 26.0, 21.0, 24.0, 11.0, 20.0, 12.0, 11.0, 9.0, 4.0, 4.0, 10.0, 3.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-91.76683044433594, -88.948486328125, -86.13014221191406, -83.31179809570312, -80.49345397949219, -77.67510986328125, -74.85676574707031, -72.03842163085938, -69.22007751464844, -66.4017333984375, -63.58338928222656, -60.765045166015625, -57.94670104980469, -55.12835693359375, -52.31001281738281, -49.491668701171875, -46.67332458496094, -43.85498046875, -41.03663635253906, -38.218292236328125, -35.39994812011719, -32.58160400390625, -29.763259887695312, -26.944915771484375, -24.126571655273438, -21.3082275390625, -18.489883422851562, -15.671539306640625, -12.853195190429688, -10.03485107421875, -7.2165069580078125, -4.398162841796875, -1.5798187255859375, 1.238525390625, 4.0568695068359375, 6.875213623046875, 9.693557739257812, 12.51190185546875, 15.330245971679688, 18.148590087890625, 20.966934204101562, 23.7852783203125, 26.603622436523438, 29.421966552734375, 32.24031066894531, 35.05865478515625, 37.87699890136719, 40.695343017578125, 43.51368713378906, 46.33203125, 49.15037536621094, 51.968719482421875, 54.78706359863281, 57.60540771484375, 60.42375183105469, 63.242095947265625, 66.06044006347656, 68.8787841796875, 71.69712829589844, 74.51547241210938, 77.33381652832031, 80.15216064453125, 82.97050476074219, 85.78884887695312, 88.60719299316406]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 3.0, 5.0, 9.0, 13.0, 10.0, 25.0, 35.0, 40.0, 47.0, 62.0, 98.0, 147.0, 228.0, 379.0, 843.0, 2246.0, 9238.0, 118729.0, 4025415.0, 29307.0, 4536.0, 1380.0, 591.0, 314.0, 185.0, 100.0, 60.0, 59.0, 55.0, 39.0, 24.0, 11.0, 17.0, 14.0, 6.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.75, -31.591796875, -30.43359375, -29.275390625, -28.1171875, -26.958984375, -25.80078125, -24.642578125, -23.484375, -22.326171875, -21.16796875, -20.009765625, -18.8515625, -17.693359375, -16.53515625, -15.376953125, -14.21875, -13.060546875, -11.90234375, -10.744140625, -9.5859375, -8.427734375, -7.26953125, -6.111328125, -4.953125, -3.794921875, -2.63671875, -1.478515625, -0.3203125, 0.837890625, 1.99609375, 3.154296875, 4.3125, 5.470703125, 6.62890625, 7.787109375, 8.9453125, 10.103515625, 11.26171875, 12.419921875, 13.578125, 14.736328125, 15.89453125, 17.052734375, 18.2109375, 19.369140625, 20.52734375, 21.685546875, 22.84375, 24.001953125, 25.16015625, 26.318359375, 27.4765625, 28.634765625, 29.79296875, 30.951171875, 32.109375, 33.267578125, 34.42578125, 35.583984375, 36.7421875, 37.900390625, 39.05859375, 40.216796875, 41.375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 7.0, 9.0, 11.0, 12.0, 17.0, 20.0, 16.0, 24.0, 27.0, 28.0, 24.0, 39.0, 39.0, 54.0, 48.0, 46.0, 44.0, 55.0, 53.0, 50.0, 48.0, 50.0, 50.0, 41.0, 31.0, 30.0, 32.0, 25.0, 13.0, 12.0, 13.0, 11.0, 10.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.25390625, -4.126251220703125, -3.99859619140625, -3.870941162109375, -3.7432861328125, -3.615631103515625, -3.48797607421875, -3.360321044921875, -3.232666015625, -3.105010986328125, -2.97735595703125, -2.849700927734375, -2.7220458984375, -2.594390869140625, -2.46673583984375, -2.339080810546875, -2.21142578125, -2.083770751953125, -1.95611572265625, -1.828460693359375, -1.7008056640625, -1.573150634765625, -1.44549560546875, -1.317840576171875, -1.190185546875, -1.062530517578125, -0.93487548828125, -0.807220458984375, -0.6795654296875, -0.551910400390625, -0.42425537109375, -0.296600341796875, -0.1689453125, -0.041290283203125, 0.08636474609375, 0.214019775390625, 0.3416748046875, 0.469329833984375, 0.59698486328125, 0.724639892578125, 0.852294921875, 0.979949951171875, 1.10760498046875, 1.235260009765625, 1.3629150390625, 1.490570068359375, 1.61822509765625, 1.745880126953125, 1.87353515625, 2.001190185546875, 2.12884521484375, 2.256500244140625, 2.3841552734375, 2.511810302734375, 2.63946533203125, 2.767120361328125, 2.894775390625, 3.022430419921875, 3.15008544921875, 3.277740478515625, 3.4053955078125, 3.533050537109375, 3.66070556640625, 3.788360595703125, 3.916015625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 3.0, 7.0, 4.0, 9.0, 10.0, 15.0, 13.0, 15.0, 29.0, 38.0, 60.0, 52.0, 87.0, 115.0, 170.0, 303.0, 517.0, 1101.0, 2409.0, 7081.0, 40873.0, 3953586.0, 166970.0, 13656.0, 3758.0, 1568.0, 698.0, 375.0, 239.0, 132.0, 98.0, 65.0, 56.0, 35.0, 29.0, 25.0, 18.0, 17.0, 12.0, 12.0, 8.0, 5.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.40625, -33.20849609375, -32.0107421875, -30.81298828125, -29.615234375, -28.41748046875, -27.2197265625, -26.02197265625, -24.82421875, -23.62646484375, -22.4287109375, -21.23095703125, -20.033203125, -18.83544921875, -17.6376953125, -16.43994140625, -15.2421875, -14.04443359375, -12.8466796875, -11.64892578125, -10.451171875, -9.25341796875, -8.0556640625, -6.85791015625, -5.66015625, -4.46240234375, -3.2646484375, -2.06689453125, -0.869140625, 0.32861328125, 1.5263671875, 2.72412109375, 3.921875, 5.11962890625, 6.3173828125, 7.51513671875, 8.712890625, 9.91064453125, 11.1083984375, 12.30615234375, 13.50390625, 14.70166015625, 15.8994140625, 17.09716796875, 18.294921875, 19.49267578125, 20.6904296875, 21.88818359375, 23.0859375, 24.28369140625, 25.4814453125, 26.67919921875, 27.876953125, 29.07470703125, 30.2724609375, 31.47021484375, 32.66796875, 33.86572265625, 35.0634765625, 36.26123046875, 37.458984375, 38.65673828125, 39.8544921875, 41.05224609375, 42.25]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 4.0, 2.0, 4.0, 11.0, 13.0, 27.0, 62.0, 188.0, 2758.0, 782.0, 116.0, 49.0, 23.0, 17.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.75, -5.46142578125, -5.1728515625, -4.88427734375, -4.595703125, -4.30712890625, -4.0185546875, -3.72998046875, -3.44140625, -3.15283203125, -2.8642578125, -2.57568359375, -2.287109375, -1.99853515625, -1.7099609375, -1.42138671875, -1.1328125, -0.84423828125, -0.5556640625, -0.26708984375, 0.021484375, 0.31005859375, 0.5986328125, 0.88720703125, 1.17578125, 1.46435546875, 1.7529296875, 2.04150390625, 2.330078125, 2.61865234375, 2.9072265625, 3.19580078125, 3.484375, 3.77294921875, 4.0615234375, 4.35009765625, 4.638671875, 4.92724609375, 5.2158203125, 5.50439453125, 5.79296875, 6.08154296875, 6.3701171875, 6.65869140625, 6.947265625, 7.23583984375, 7.5244140625, 7.81298828125, 8.1015625, 8.39013671875, 8.6787109375, 8.96728515625, 9.255859375, 9.54443359375, 9.8330078125, 10.12158203125, 10.41015625, 10.69873046875, 10.9873046875, 11.27587890625, 11.564453125, 11.85302734375, 12.1416015625, 12.43017578125, 12.71875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 11.0, 21.0, 35.0, 70.0, 104.0, 126.0, 144.0, 139.0, 96.0, 92.0, 56.0, 42.0, 26.0, 11.0, 9.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.52684783935547, -47.4453010559082, -46.36375427246094, -45.28220748901367, -44.200660705566406, -43.119110107421875, -42.03756332397461, -40.956016540527344, -39.87446975708008, -38.79292297363281, -37.71137619018555, -36.62982940673828, -35.54827880859375, -34.466732025146484, -33.38518524169922, -32.30363845825195, -31.222091674804688, -30.140544891357422, -29.058998107910156, -27.977449417114258, -26.895902633666992, -25.814355850219727, -24.732807159423828, -23.651260375976562, -22.569713592529297, -21.48816680908203, -20.406620025634766, -19.325071334838867, -18.2435245513916, -17.161977767944336, -16.080429077148438, -14.998882293701172, -13.917339324951172, -12.835792541503906, -11.754244804382324, -10.672697067260742, -9.591150283813477, -8.509603500366211, -7.428055763244629, -6.346508502960205, -5.264961242675781, -4.183413982391357, -3.1018667221069336, -2.0203194618225098, -0.9387722015380859, 0.1427750587463379, 1.2243223190307617, 2.3058695793151855, 3.3874168395996094, 4.468964099884033, 5.550511360168457, 6.632058620452881, 7.713605880737305, 8.79515266418457, 9.876700401306152, 10.958248138427734, 12.039794921875, 13.121341705322266, 14.202889442443848, 15.28443717956543, 16.365983963012695, 17.44753074645996, 18.52907943725586, 19.610626220703125, 20.69217300415039]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 5.0, 7.0, 10.0, 14.0, 9.0, 6.0, 17.0, 16.0, 17.0, 20.0, 18.0, 22.0, 30.0, 32.0, 34.0, 35.0, 38.0, 37.0, 40.0, 39.0, 42.0, 45.0, 30.0, 47.0, 44.0, 57.0, 36.0, 37.0, 39.0, 34.0, 30.0, 21.0, 18.0, 21.0, 10.0, 10.0, 8.0, 5.0, 10.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.6756591796875, -14.229063987731934, -13.78246784210205, -13.335872650146484, -12.889276504516602, -12.442681312561035, -11.996086120605469, -11.549489974975586, -11.10289478302002, -10.656299591064453, -10.20970344543457, -9.763108253479004, -9.316513061523438, -8.869916915893555, -8.423321723937988, -7.976726055145264, -7.530130386352539, -7.0835347175598145, -6.63693904876709, -6.190343856811523, -5.743748188018799, -5.297152519226074, -4.850557327270508, -4.403961658477783, -3.9573659896850586, -3.510770320892334, -3.0641748905181885, -2.617579460144043, -2.1709837913513184, -1.7243881225585938, -1.2777926921844482, -0.8311972618103027, -0.3846006393432617, 0.06199491024017334, 0.5085904598236084, 0.9551860094070435, 1.4017815589904785, 1.8483772277832031, 2.2949726581573486, 2.741568088531494, 3.1881637573242188, 3.6347594261169434, 4.081355094909668, 4.527950286865234, 4.974545955657959, 5.421141624450684, 5.86773681640625, 6.314332485198975, 6.760928153991699, 7.207523822784424, 7.654119491577148, 8.100714683532715, 8.547309875488281, 8.993906021118164, 9.44050121307373, 9.887096405029297, 10.33369255065918, 10.780287742614746, 11.226883888244629, 11.673479080200195, 12.120075225830078, 12.566670417785645, 13.013265609741211, 13.459861755371094, 13.90645694732666]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 4.0, 14.0, 13.0, 13.0, 29.0, 43.0, 41.0, 54.0, 97.0, 143.0, 179.0, 279.0, 392.0, 540.0, 868.0, 1263.0, 1949.0, 3032.0, 4753.0, 8013.0, 14160.0, 26087.0, 50532.0, 102039.0, 196509.0, 260966.0, 181329.0, 92472.0, 45867.0, 23413.0, 12871.0, 7509.0, 4511.0, 2882.0, 1885.0, 1223.0, 807.0, 544.0, 338.0, 264.0, 189.0, 131.0, 77.0, 68.0, 42.0, 31.0, 26.0, 24.0, 14.0, 11.0, 6.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.203125, -6.97393798828125, -6.7447509765625, -6.51556396484375, -6.286376953125, -6.05718994140625, -5.8280029296875, -5.59881591796875, -5.36962890625, -5.14044189453125, -4.9112548828125, -4.68206787109375, -4.452880859375, -4.22369384765625, -3.9945068359375, -3.76531982421875, -3.5361328125, -3.30694580078125, -3.0777587890625, -2.84857177734375, -2.619384765625, -2.39019775390625, -2.1610107421875, -1.93182373046875, -1.70263671875, -1.47344970703125, -1.2442626953125, -1.01507568359375, -0.785888671875, -0.55670166015625, -0.3275146484375, -0.09832763671875, 0.130859375, 0.36004638671875, 0.5892333984375, 0.81842041015625, 1.047607421875, 1.27679443359375, 1.5059814453125, 1.73516845703125, 1.96435546875, 2.19354248046875, 2.4227294921875, 2.65191650390625, 2.881103515625, 3.11029052734375, 3.3394775390625, 3.56866455078125, 3.7978515625, 4.02703857421875, 4.2562255859375, 4.48541259765625, 4.714599609375, 4.94378662109375, 5.1729736328125, 5.40216064453125, 5.63134765625, 5.86053466796875, 6.0897216796875, 6.31890869140625, 6.548095703125, 6.77728271484375, 7.0064697265625, 7.23565673828125, 7.46484375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 9.0, 9.0, 9.0, 15.0, 14.0, 22.0, 21.0, 20.0, 34.0, 29.0, 33.0, 39.0, 43.0, 50.0, 60.0, 47.0, 47.0, 48.0, 41.0, 38.0, 51.0, 54.0, 36.0, 39.0, 32.0, 22.0, 26.0, 14.0, 24.0, 21.0, 14.0, 8.0, 10.0, 7.0, 6.0, 0.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76953125, -4.62884521484375, -4.4881591796875, -4.34747314453125, -4.206787109375, -4.06610107421875, -3.9254150390625, -3.78472900390625, -3.64404296875, -3.50335693359375, -3.3626708984375, -3.22198486328125, -3.081298828125, -2.94061279296875, -2.7999267578125, -2.65924072265625, -2.5185546875, -2.37786865234375, -2.2371826171875, -2.09649658203125, -1.955810546875, -1.81512451171875, -1.6744384765625, -1.53375244140625, -1.39306640625, -1.25238037109375, -1.1116943359375, -0.97100830078125, -0.830322265625, -0.68963623046875, -0.5489501953125, -0.40826416015625, -0.267578125, -0.12689208984375, 0.0137939453125, 0.15447998046875, 0.295166015625, 0.43585205078125, 0.5765380859375, 0.71722412109375, 0.85791015625, 0.99859619140625, 1.1392822265625, 1.27996826171875, 1.420654296875, 1.56134033203125, 1.7020263671875, 1.84271240234375, 1.9833984375, 2.12408447265625, 2.2647705078125, 2.40545654296875, 2.546142578125, 2.68682861328125, 2.8275146484375, 2.96820068359375, 3.10888671875, 3.24957275390625, 3.3902587890625, 3.53094482421875, 3.671630859375, 3.81231689453125, 3.9530029296875, 4.09368896484375, 4.234375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 8.0, 8.0, 9.0, 12.0, 16.0, 29.0, 32.0, 35.0, 54.0, 94.0, 124.0, 155.0, 248.0, 395.0, 708.0, 1319.0, 2798.0, 8130.0, 34108.0, 319095.0, 600591.0, 60970.0, 11822.0, 3808.0, 1606.0, 867.0, 517.0, 282.0, 218.0, 134.0, 93.0, 63.0, 51.0, 33.0, 38.0, 21.0, 17.0, 11.0, 4.0, 4.0, 5.0, 2.0, 6.0, 4.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-22.0625, -21.330810546875, -20.59912109375, -19.867431640625, -19.1357421875, -18.404052734375, -17.67236328125, -16.940673828125, -16.208984375, -15.477294921875, -14.74560546875, -14.013916015625, -13.2822265625, -12.550537109375, -11.81884765625, -11.087158203125, -10.35546875, -9.623779296875, -8.89208984375, -8.160400390625, -7.4287109375, -6.697021484375, -5.96533203125, -5.233642578125, -4.501953125, -3.770263671875, -3.03857421875, -2.306884765625, -1.5751953125, -0.843505859375, -0.11181640625, 0.619873046875, 1.3515625, 2.083251953125, 2.81494140625, 3.546630859375, 4.2783203125, 5.010009765625, 5.74169921875, 6.473388671875, 7.205078125, 7.936767578125, 8.66845703125, 9.400146484375, 10.1318359375, 10.863525390625, 11.59521484375, 12.326904296875, 13.05859375, 13.790283203125, 14.52197265625, 15.253662109375, 15.9853515625, 16.717041015625, 17.44873046875, 18.180419921875, 18.912109375, 19.643798828125, 20.37548828125, 21.107177734375, 21.8388671875, 22.570556640625, 23.30224609375, 24.033935546875, 24.765625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 3.0, 6.0, 5.0, 12.0, 10.0, 8.0, 18.0, 18.0, 20.0, 22.0, 21.0, 25.0, 31.0, 33.0, 36.0, 48.0, 45.0, 40.0, 52.0, 43.0, 55.0, 43.0, 51.0, 46.0, 40.0, 39.0, 30.0, 21.0, 36.0, 21.0, 23.0, 22.0, 17.0, 13.0, 10.0, 11.0, 6.0, 2.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.015625, -20.32568359375, -19.6357421875, -18.94580078125, -18.255859375, -17.56591796875, -16.8759765625, -16.18603515625, -15.49609375, -14.80615234375, -14.1162109375, -13.42626953125, -12.736328125, -12.04638671875, -11.3564453125, -10.66650390625, -9.9765625, -9.28662109375, -8.5966796875, -7.90673828125, -7.216796875, -6.52685546875, -5.8369140625, -5.14697265625, -4.45703125, -3.76708984375, -3.0771484375, -2.38720703125, -1.697265625, -1.00732421875, -0.3173828125, 0.37255859375, 1.0625, 1.75244140625, 2.4423828125, 3.13232421875, 3.822265625, 4.51220703125, 5.2021484375, 5.89208984375, 6.58203125, 7.27197265625, 7.9619140625, 8.65185546875, 9.341796875, 10.03173828125, 10.7216796875, 11.41162109375, 12.1015625, 12.79150390625, 13.4814453125, 14.17138671875, 14.861328125, 15.55126953125, 16.2412109375, 16.93115234375, 17.62109375, 18.31103515625, 19.0009765625, 19.69091796875, 20.380859375, 21.07080078125, 21.7607421875, 22.45068359375, 23.140625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 2.0, 6.0, 9.0, 6.0, 15.0, 30.0, 45.0, 59.0, 106.0, 176.0, 460.0, 1302.0, 6339.0, 158799.0, 861466.0, 16178.0, 2306.0, 677.0, 240.0, 113.0, 75.0, 47.0, 29.0, 21.0, 12.0, 6.0, 7.0, 3.0, 3.0, 5.0, 5.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.71875, -28.766357421875, -27.81396484375, -26.861572265625, -25.9091796875, -24.956787109375, -24.00439453125, -23.052001953125, -22.099609375, -21.147216796875, -20.19482421875, -19.242431640625, -18.2900390625, -17.337646484375, -16.38525390625, -15.432861328125, -14.48046875, -13.528076171875, -12.57568359375, -11.623291015625, -10.6708984375, -9.718505859375, -8.76611328125, -7.813720703125, -6.861328125, -5.908935546875, -4.95654296875, -4.004150390625, -3.0517578125, -2.099365234375, -1.14697265625, -0.194580078125, 0.7578125, 1.710205078125, 2.66259765625, 3.614990234375, 4.5673828125, 5.519775390625, 6.47216796875, 7.424560546875, 8.376953125, 9.329345703125, 10.28173828125, 11.234130859375, 12.1865234375, 13.138916015625, 14.09130859375, 15.043701171875, 15.99609375, 16.948486328125, 17.90087890625, 18.853271484375, 19.8056640625, 20.758056640625, 21.71044921875, 22.662841796875, 23.615234375, 24.567626953125, 25.52001953125, 26.472412109375, 27.4248046875, 28.377197265625, 29.32958984375, 30.281982421875, 31.234375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 3.0, 7.0, 10.0, 9.0, 13.0, 27.0, 44.0, 56.0, 91.0, 125.0, 187.0, 142.0, 115.0, 61.0, 37.0, 28.0, 16.0, 12.0, 5.0, 6.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0033969879150390625, -0.0033087730407714844, -0.0032205581665039062, -0.003132343292236328, -0.00304412841796875, -0.002955913543701172, -0.0028676986694335938, -0.0027794837951660156, -0.0026912689208984375, -0.0026030540466308594, -0.0025148391723632812, -0.002426624298095703, -0.002338409423828125, -0.002250194549560547, -0.0021619796752929688, -0.0020737648010253906, -0.0019855499267578125, -0.0018973350524902344, -0.0018091201782226562, -0.0017209053039550781, -0.0016326904296875, -0.0015444755554199219, -0.0014562606811523438, -0.0013680458068847656, -0.0012798309326171875, -0.0011916160583496094, -0.0011034011840820312, -0.0010151863098144531, -0.000926971435546875, -0.0008387565612792969, -0.0007505416870117188, -0.0006623268127441406, -0.0005741119384765625, -0.0004858970642089844, -0.00039768218994140625, -0.0003094673156738281, -0.00022125244140625, -0.00013303756713867188, -4.482269287109375e-05, 4.3392181396484375e-05, 0.0001316070556640625, 0.00021982192993164062, 0.00030803680419921875, 0.0003962516784667969, 0.000484466552734375, 0.0005726814270019531, 0.0006608963012695312, 0.0007491111755371094, 0.0008373260498046875, 0.0009255409240722656, 0.0010137557983398438, 0.0011019706726074219, 0.001190185546875, 0.0012784004211425781, 0.0013666152954101562, 0.0014548301696777344, 0.0015430450439453125, 0.0016312599182128906, 0.0017194747924804688, 0.0018076896667480469, 0.001895904541015625, 0.001984119415283203, 0.0020723342895507812, 0.0021605491638183594, 0.0022487640380859375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 4.0, 6.0, 9.0, 10.0, 16.0, 15.0, 26.0, 47.0, 59.0, 94.0, 146.0, 328.0, 684.0, 1798.0, 5447.0, 30059.0, 664708.0, 321312.0, 17149.0, 3915.0, 1439.0, 591.0, 247.0, 147.0, 103.0, 49.0, 32.0, 23.0, 20.0, 12.0, 18.0, 9.0, 10.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.71875, -19.118896484375, -18.51904296875, -17.919189453125, -17.3193359375, -16.719482421875, -16.11962890625, -15.519775390625, -14.919921875, -14.320068359375, -13.72021484375, -13.120361328125, -12.5205078125, -11.920654296875, -11.32080078125, -10.720947265625, -10.12109375, -9.521240234375, -8.92138671875, -8.321533203125, -7.7216796875, -7.121826171875, -6.52197265625, -5.922119140625, -5.322265625, -4.722412109375, -4.12255859375, -3.522705078125, -2.9228515625, -2.322998046875, -1.72314453125, -1.123291015625, -0.5234375, 0.076416015625, 0.67626953125, 1.276123046875, 1.8759765625, 2.475830078125, 3.07568359375, 3.675537109375, 4.275390625, 4.875244140625, 5.47509765625, 6.074951171875, 6.6748046875, 7.274658203125, 7.87451171875, 8.474365234375, 9.07421875, 9.674072265625, 10.27392578125, 10.873779296875, 11.4736328125, 12.073486328125, 12.67333984375, 13.273193359375, 13.873046875, 14.472900390625, 15.07275390625, 15.672607421875, 16.2724609375, 16.872314453125, 17.47216796875, 18.072021484375, 18.671875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 9.0, 18.0, 24.0, 48.0, 61.0, 99.0, 121.0, 140.0, 146.0, 98.0, 82.0, 50.0, 33.0, 19.0, 10.0, 13.0, 6.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.515625, -19.0015869140625, -18.487548828125, -17.9735107421875, -17.45947265625, -16.9454345703125, -16.431396484375, -15.9173583984375, -15.4033203125, -14.8892822265625, -14.375244140625, -13.8612060546875, -13.34716796875, -12.8331298828125, -12.319091796875, -11.8050537109375, -11.291015625, -10.7769775390625, -10.262939453125, -9.7489013671875, -9.23486328125, -8.7208251953125, -8.206787109375, -7.6927490234375, -7.1787109375, -6.6646728515625, -6.150634765625, -5.6365966796875, -5.12255859375, -4.6085205078125, -4.094482421875, -3.5804443359375, -3.06640625, -2.5523681640625, -2.038330078125, -1.5242919921875, -1.01025390625, -0.4962158203125, 0.017822265625, 0.5318603515625, 1.0458984375, 1.5599365234375, 2.073974609375, 2.5880126953125, 3.10205078125, 3.6160888671875, 4.130126953125, 4.6441650390625, 5.158203125, 5.6722412109375, 6.186279296875, 6.7003173828125, 7.21435546875, 7.7283935546875, 8.242431640625, 8.7564697265625, 9.2705078125, 9.7845458984375, 10.298583984375, 10.8126220703125, 11.32666015625, 11.8406982421875, 12.354736328125, 12.8687744140625, 13.3828125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 2.0, 15.0, 34.0, 105.0, 253.0, 277.0, 194.0, 83.0, 29.0, 10.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-590.80517578125, -579.2482299804688, -567.6913452148438, -556.1343994140625, -544.5774536132812, -533.0205688476562, -521.463623046875, -509.90667724609375, -498.3497619628906, -486.7928466796875, -475.23590087890625, -463.6789855957031, -452.1220703125, -440.56512451171875, -429.0082092285156, -417.4512939453125, -405.89434814453125, -394.3374328613281, -382.7804870605469, -371.22357177734375, -359.6666259765625, -348.1097106933594, -336.55279541015625, -324.995849609375, -313.4389343261719, -301.88201904296875, -290.3250732421875, -278.7681579589844, -267.21124267578125, -255.654296875, -244.09738159179688, -232.5404510498047, -220.9835205078125, -209.4265899658203, -197.86965942382812, -186.312744140625, -174.7558135986328, -163.19888305664062, -151.6419677734375, -140.0850372314453, -128.52810668945312, -116.97117614746094, -105.41425323486328, -93.85733032226562, -82.30039978027344, -70.74346923828125, -59.186546325683594, -47.62962341308594, -36.07269287109375, -24.515766143798828, -12.958839416503906, -1.4019126892089844, 10.155014038085938, 21.71194076538086, 33.26886749267578, 44.82579040527344, 56.382720947265625, 67.93965148925781, 79.49657440185547, 91.05349731445312, 102.61042785644531, 114.1673583984375, 125.72428131103516, 137.2812042236328, 148.838134765625]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 6.0, 8.0, 7.0, 17.0, 8.0, 24.0, 17.0, 24.0, 28.0, 44.0, 39.0, 48.0, 58.0, 44.0, 73.0, 72.0, 60.0, 58.0, 47.0, 45.0, 44.0, 46.0, 30.0, 23.0, 21.0, 24.0, 22.0, 16.0, 7.0, 11.0, 9.0, 10.0, 3.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.08881378173828, -101.17424011230469, -97.25967407226562, -93.34510040283203, -89.43052673339844, -85.51595306396484, -81.60137939453125, -77.68681335449219, -73.7722396850586, -69.857666015625, -65.94309997558594, -62.028526306152344, -58.11395263671875, -54.199378967285156, -50.28480911254883, -46.3702392578125, -42.455665588378906, -38.54109191894531, -34.626522064208984, -30.711950302124023, -26.797378540039062, -22.8828067779541, -18.96823501586914, -15.05366325378418, -11.139091491699219, -7.224519729614258, -3.309947967529297, 0.6046237945556641, 4.519195556640625, 8.433767318725586, 12.348339080810547, 16.262910842895508, 20.177474975585938, 24.0920467376709, 28.00661849975586, 31.92119026184082, 35.83576202392578, 39.750335693359375, 43.6649055480957, 47.57947540283203, 51.494049072265625, 55.40862274169922, 59.32319259643555, 63.237762451171875, 67.15233612060547, 71.06690979003906, 74.98147583007812, 78.89604949951172, 82.81062316894531, 86.7251968383789, 90.6397705078125, 94.55433654785156, 98.46891021728516, 102.38348388671875, 106.29804992675781, 110.2126235961914, 114.127197265625, 118.0417709350586, 121.95634460449219, 125.87091064453125, 129.78549194335938, 133.70005798339844, 137.6146240234375, 141.52920532226562, 145.4437713623047]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 1.0, 3.0, 9.0, 8.0, 11.0, 10.0, 30.0, 48.0, 83.0, 126.0, 268.0, 791.0, 2850.0, 20282.0, 4132479.0, 32086.0, 3574.0, 921.0, 371.0, 140.0, 76.0, 49.0, 17.0, 19.0, 10.0, 5.0, 2.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.15625, -47.599609375, -46.04296875, -44.486328125, -42.9296875, -41.373046875, -39.81640625, -38.259765625, -36.703125, -35.146484375, -33.58984375, -32.033203125, -30.4765625, -28.919921875, -27.36328125, -25.806640625, -24.25, -22.693359375, -21.13671875, -19.580078125, -18.0234375, -16.466796875, -14.91015625, -13.353515625, -11.796875, -10.240234375, -8.68359375, -7.126953125, -5.5703125, -4.013671875, -2.45703125, -0.900390625, 0.65625, 2.212890625, 3.76953125, 5.326171875, 6.8828125, 8.439453125, 9.99609375, 11.552734375, 13.109375, 14.666015625, 16.22265625, 17.779296875, 19.3359375, 20.892578125, 22.44921875, 24.005859375, 25.5625, 27.119140625, 28.67578125, 30.232421875, 31.7890625, 33.345703125, 34.90234375, 36.458984375, 38.015625, 39.572265625, 41.12890625, 42.685546875, 44.2421875, 45.798828125, 47.35546875, 48.912109375, 50.46875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 7.0, 15.0, 11.0, 15.0, 23.0, 34.0, 28.0, 56.0, 39.0, 58.0, 56.0, 84.0, 67.0, 82.0, 66.0, 52.0, 62.0, 40.0, 42.0, 42.0, 21.0, 29.0, 17.0, 15.0, 11.0, 10.0, 8.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.55859375, -4.36151123046875, -4.1644287109375, -3.96734619140625, -3.770263671875, -3.57318115234375, -3.3760986328125, -3.17901611328125, -2.98193359375, -2.78485107421875, -2.5877685546875, -2.39068603515625, -2.193603515625, -1.99652099609375, -1.7994384765625, -1.60235595703125, -1.4052734375, -1.20819091796875, -1.0111083984375, -0.81402587890625, -0.616943359375, -0.41986083984375, -0.2227783203125, -0.02569580078125, 0.17138671875, 0.36846923828125, 0.5655517578125, 0.76263427734375, 0.959716796875, 1.15679931640625, 1.3538818359375, 1.55096435546875, 1.748046875, 1.94512939453125, 2.1422119140625, 2.33929443359375, 2.536376953125, 2.73345947265625, 2.9305419921875, 3.12762451171875, 3.32470703125, 3.52178955078125, 3.7188720703125, 3.91595458984375, 4.113037109375, 4.31011962890625, 4.5072021484375, 4.70428466796875, 4.9013671875, 5.09844970703125, 5.2955322265625, 5.49261474609375, 5.689697265625, 5.88677978515625, 6.0838623046875, 6.28094482421875, 6.47802734375, 6.67510986328125, 6.8721923828125, 7.06927490234375, 7.266357421875, 7.46343994140625, 7.6605224609375, 7.85760498046875, 8.0546875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 6.0, 7.0, 9.0, 14.0, 15.0, 23.0, 30.0, 37.0, 49.0, 73.0, 133.0, 262.0, 463.0, 865.0, 2345.0, 6959.0, 34625.0, 4026445.0, 103850.0, 12072.0, 3321.0, 1288.0, 567.0, 281.0, 178.0, 106.0, 85.0, 48.0, 30.0, 25.0, 17.0, 13.0, 10.0, 6.0, 2.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-32.625, -31.595703125, -30.56640625, -29.537109375, -28.5078125, -27.478515625, -26.44921875, -25.419921875, -24.390625, -23.361328125, -22.33203125, -21.302734375, -20.2734375, -19.244140625, -18.21484375, -17.185546875, -16.15625, -15.126953125, -14.09765625, -13.068359375, -12.0390625, -11.009765625, -9.98046875, -8.951171875, -7.921875, -6.892578125, -5.86328125, -4.833984375, -3.8046875, -2.775390625, -1.74609375, -0.716796875, 0.3125, 1.341796875, 2.37109375, 3.400390625, 4.4296875, 5.458984375, 6.48828125, 7.517578125, 8.546875, 9.576171875, 10.60546875, 11.634765625, 12.6640625, 13.693359375, 14.72265625, 15.751953125, 16.78125, 17.810546875, 18.83984375, 19.869140625, 20.8984375, 21.927734375, 22.95703125, 23.986328125, 25.015625, 26.044921875, 27.07421875, 28.103515625, 29.1328125, 30.162109375, 31.19140625, 32.220703125, 33.25]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 10.0, 11.0, 14.0, 20.0, 33.0, 127.0, 3306.0, 389.0, 83.0, 37.0, 14.0, 11.0, 6.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3359375, -5.091064453125, -4.84619140625, -4.601318359375, -4.3564453125, -4.111572265625, -3.86669921875, -3.621826171875, -3.376953125, -3.132080078125, -2.88720703125, -2.642333984375, -2.3974609375, -2.152587890625, -1.90771484375, -1.662841796875, -1.41796875, -1.173095703125, -0.92822265625, -0.683349609375, -0.4384765625, -0.193603515625, 0.05126953125, 0.296142578125, 0.541015625, 0.785888671875, 1.03076171875, 1.275634765625, 1.5205078125, 1.765380859375, 2.01025390625, 2.255126953125, 2.5, 2.744873046875, 2.98974609375, 3.234619140625, 3.4794921875, 3.724365234375, 3.96923828125, 4.214111328125, 4.458984375, 4.703857421875, 4.94873046875, 5.193603515625, 5.4384765625, 5.683349609375, 5.92822265625, 6.173095703125, 6.41796875, 6.662841796875, 6.90771484375, 7.152587890625, 7.3974609375, 7.642333984375, 7.88720703125, 8.132080078125, 8.376953125, 8.621826171875, 8.86669921875, 9.111572265625, 9.3564453125, 9.601318359375, 9.84619140625, 10.091064453125, 10.3359375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 11.0, 7.0, 13.0, 18.0, 26.0, 37.0, 43.0, 50.0, 83.0, 92.0, 115.0, 100.0, 100.0, 81.0, 49.0, 61.0, 42.0, 28.0, 16.0, 11.0, 4.0, 6.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.923587799072266, -15.387580871582031, -14.851573944091797, -14.315567016601562, -13.779560089111328, -13.243553161621094, -12.70754623413086, -12.171539306640625, -11.63553237915039, -11.099525451660156, -10.563518524169922, -10.027511596679688, -9.491504669189453, -8.955497741699219, -8.419490814208984, -7.883483409881592, -7.347476005554199, -6.811469078063965, -6.2754621505737305, -5.739455223083496, -5.203448295593262, -4.667441368103027, -4.131433963775635, -3.5954270362854004, -3.059420108795166, -2.5234131813049316, -1.9874061346054077, -1.4513990879058838, -0.9153921604156494, -0.37938523292541504, 0.15662193298339844, 0.6926288604736328, 1.2286357879638672, 1.7646427154541016, 2.300649642944336, 2.8366568088531494, 3.372663736343384, 3.908670663833618, 4.444677829742432, 4.980684757232666, 5.5166916847229, 6.052698612213135, 6.588705539703369, 7.124712944030762, 7.660719871520996, 8.19672679901123, 8.732733726501465, 9.2687406539917, 9.804747581481934, 10.340754508972168, 10.876761436462402, 11.412768363952637, 11.948775291442871, 12.484782218933105, 13.020790100097656, 13.55679702758789, 14.092803955078125, 14.62881088256836, 15.164817810058594, 15.700824737548828, 16.236831665039062, 16.772838592529297, 17.30884552001953, 17.844852447509766, 18.380859375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 7.0, 8.0, 10.0, 11.0, 15.0, 16.0, 11.0, 23.0, 27.0, 21.0, 22.0, 34.0, 31.0, 30.0, 46.0, 44.0, 52.0, 42.0, 56.0, 54.0, 43.0, 49.0, 40.0, 35.0, 44.0, 31.0, 29.0, 27.0, 30.0, 20.0, 16.0, 18.0, 10.0, 10.0, 7.0, 10.0, 8.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6367769241333, -9.321385383605957, -9.00599479675293, -8.690603256225586, -8.375211715698242, -8.059821128845215, -7.744429588317871, -7.4290385246276855, -7.1136474609375, -6.7982563972473145, -6.482865333557129, -6.167473793029785, -5.8520827293396, -5.536691665649414, -5.22130012512207, -4.905909061431885, -4.590517997741699, -4.275126934051514, -3.959735631942749, -3.6443443298339844, -3.328953266143799, -3.0135622024536133, -2.6981709003448486, -2.382779598236084, -2.0673885345458984, -1.7519973516464233, -1.4366061687469482, -1.1212149858474731, -0.805823802947998, -0.49043262004852295, -0.17504143714904785, 0.1403498649597168, 0.45573997497558594, 0.771131157875061, 1.0865223407745361, 1.4019135236740112, 1.7173047065734863, 2.032695770263672, 2.3480870723724365, 2.663478374481201, 2.9788694381713867, 3.2942605018615723, 3.609651803970337, 3.9250431060791016, 4.240434169769287, 4.555825233459473, 4.871216773986816, 5.186607837677002, 5.5019989013671875, 5.817389965057373, 6.132781028747559, 6.448172569274902, 6.763563632965088, 7.078954696655273, 7.394346237182617, 7.709737300872803, 8.025128364562988, 8.340519905090332, 8.65591049194336, 8.971302032470703, 9.286693572998047, 9.602084159851074, 9.917475700378418, 10.232866287231445, 10.548257827758789]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 11.0, 13.0, 27.0, 31.0, 44.0, 68.0, 106.0, 194.0, 300.0, 559.0, 922.0, 1705.0, 3454.0, 6950.0, 14934.0, 33250.0, 75434.0, 170974.0, 316842.0, 232585.0, 104620.0, 46194.0, 20426.0, 9236.0, 4438.0, 2248.0, 1255.0, 702.0, 403.0, 226.0, 149.0, 103.0, 60.0, 27.0, 24.0, 13.0, 13.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.53515625, -7.28143310546875, -7.0277099609375, -6.77398681640625, -6.520263671875, -6.26654052734375, -6.0128173828125, -5.75909423828125, -5.50537109375, -5.25164794921875, -4.9979248046875, -4.74420166015625, -4.490478515625, -4.23675537109375, -3.9830322265625, -3.72930908203125, -3.4755859375, -3.22186279296875, -2.9681396484375, -2.71441650390625, -2.460693359375, -2.20697021484375, -1.9532470703125, -1.69952392578125, -1.44580078125, -1.19207763671875, -0.9383544921875, -0.68463134765625, -0.430908203125, -0.17718505859375, 0.0765380859375, 0.33026123046875, 0.583984375, 0.83770751953125, 1.0914306640625, 1.34515380859375, 1.598876953125, 1.85260009765625, 2.1063232421875, 2.36004638671875, 2.61376953125, 2.86749267578125, 3.1212158203125, 3.37493896484375, 3.628662109375, 3.88238525390625, 4.1361083984375, 4.38983154296875, 4.6435546875, 4.89727783203125, 5.1510009765625, 5.40472412109375, 5.658447265625, 5.91217041015625, 6.1658935546875, 6.41961669921875, 6.67333984375, 6.92706298828125, 7.1807861328125, 7.43450927734375, 7.688232421875, 7.94195556640625, 8.1956787109375, 8.44940185546875, 8.703125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 10.0, 8.0, 19.0, 17.0, 25.0, 18.0, 32.0, 16.0, 52.0, 35.0, 60.0, 50.0, 51.0, 71.0, 51.0, 66.0, 61.0, 55.0, 48.0, 46.0, 34.0, 36.0, 21.0, 26.0, 20.0, 17.0, 17.0, 8.0, 8.0, 5.0, 5.0, 8.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.0, -4.8121337890625, -4.624267578125, -4.4364013671875, -4.24853515625, -4.0606689453125, -3.872802734375, -3.6849365234375, -3.4970703125, -3.3092041015625, -3.121337890625, -2.9334716796875, -2.74560546875, -2.5577392578125, -2.369873046875, -2.1820068359375, -1.994140625, -1.8062744140625, -1.618408203125, -1.4305419921875, -1.24267578125, -1.0548095703125, -0.866943359375, -0.6790771484375, -0.4912109375, -0.3033447265625, -0.115478515625, 0.0723876953125, 0.26025390625, 0.4481201171875, 0.635986328125, 0.8238525390625, 1.01171875, 1.1995849609375, 1.387451171875, 1.5753173828125, 1.76318359375, 1.9510498046875, 2.138916015625, 2.3267822265625, 2.5146484375, 2.7025146484375, 2.890380859375, 3.0782470703125, 3.26611328125, 3.4539794921875, 3.641845703125, 3.8297119140625, 4.017578125, 4.2054443359375, 4.393310546875, 4.5811767578125, 4.76904296875, 4.9569091796875, 5.144775390625, 5.3326416015625, 5.5205078125, 5.7083740234375, 5.896240234375, 6.0841064453125, 6.27197265625, 6.4598388671875, 6.647705078125, 6.8355712890625, 7.0234375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 6.0, 6.0, 2.0, 8.0, 12.0, 19.0, 12.0, 26.0, 33.0, 56.0, 95.0, 108.0, 162.0, 282.0, 451.0, 802.0, 1707.0, 5899.0, 57359.0, 829913.0, 137224.0, 9716.0, 2196.0, 988.0, 524.0, 357.0, 204.0, 146.0, 81.0, 48.0, 36.0, 24.0, 24.0, 11.0, 8.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.84375, -20.03076171875, -19.2177734375, -18.40478515625, -17.591796875, -16.77880859375, -15.9658203125, -15.15283203125, -14.33984375, -13.52685546875, -12.7138671875, -11.90087890625, -11.087890625, -10.27490234375, -9.4619140625, -8.64892578125, -7.8359375, -7.02294921875, -6.2099609375, -5.39697265625, -4.583984375, -3.77099609375, -2.9580078125, -2.14501953125, -1.33203125, -0.51904296875, 0.2939453125, 1.10693359375, 1.919921875, 2.73291015625, 3.5458984375, 4.35888671875, 5.171875, 5.98486328125, 6.7978515625, 7.61083984375, 8.423828125, 9.23681640625, 10.0498046875, 10.86279296875, 11.67578125, 12.48876953125, 13.3017578125, 14.11474609375, 14.927734375, 15.74072265625, 16.5537109375, 17.36669921875, 18.1796875, 18.99267578125, 19.8056640625, 20.61865234375, 21.431640625, 22.24462890625, 23.0576171875, 23.87060546875, 24.68359375, 25.49658203125, 26.3095703125, 27.12255859375, 27.935546875, 28.74853515625, 29.5615234375, 30.37451171875, 31.1875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 5.0, 3.0, 12.0, 6.0, 9.0, 10.0, 15.0, 11.0, 25.0, 21.0, 28.0, 24.0, 32.0, 49.0, 41.0, 44.0, 46.0, 47.0, 57.0, 52.0, 46.0, 52.0, 45.0, 37.0, 37.0, 35.0, 37.0, 20.0, 25.0, 24.0, 15.0, 17.0, 18.0, 24.0, 12.0, 2.0, 10.0, 6.0, 3.0, 2.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.96875, -24.2451171875, -23.521484375, -22.7978515625, -22.07421875, -21.3505859375, -20.626953125, -19.9033203125, -19.1796875, -18.4560546875, -17.732421875, -17.0087890625, -16.28515625, -15.5615234375, -14.837890625, -14.1142578125, -13.390625, -12.6669921875, -11.943359375, -11.2197265625, -10.49609375, -9.7724609375, -9.048828125, -8.3251953125, -7.6015625, -6.8779296875, -6.154296875, -5.4306640625, -4.70703125, -3.9833984375, -3.259765625, -2.5361328125, -1.8125, -1.0888671875, -0.365234375, 0.3583984375, 1.08203125, 1.8056640625, 2.529296875, 3.2529296875, 3.9765625, 4.7001953125, 5.423828125, 6.1474609375, 6.87109375, 7.5947265625, 8.318359375, 9.0419921875, 9.765625, 10.4892578125, 11.212890625, 11.9365234375, 12.66015625, 13.3837890625, 14.107421875, 14.8310546875, 15.5546875, 16.2783203125, 17.001953125, 17.7255859375, 18.44921875, 19.1728515625, 19.896484375, 20.6201171875, 21.34375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 7.0, 7.0, 21.0, 24.0, 35.0, 59.0, 94.0, 173.0, 313.0, 773.0, 2168.0, 10938.0, 178057.0, 804243.0, 44189.0, 5078.0, 1276.0, 480.0, 267.0, 148.0, 59.0, 41.0, 30.0, 22.0, 13.0, 13.0, 3.0, 4.0, 5.0, 6.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.28125, -13.82470703125, -13.3681640625, -12.91162109375, -12.455078125, -11.99853515625, -11.5419921875, -11.08544921875, -10.62890625, -10.17236328125, -9.7158203125, -9.25927734375, -8.802734375, -8.34619140625, -7.8896484375, -7.43310546875, -6.9765625, -6.52001953125, -6.0634765625, -5.60693359375, -5.150390625, -4.69384765625, -4.2373046875, -3.78076171875, -3.32421875, -2.86767578125, -2.4111328125, -1.95458984375, -1.498046875, -1.04150390625, -0.5849609375, -0.12841796875, 0.328125, 0.78466796875, 1.2412109375, 1.69775390625, 2.154296875, 2.61083984375, 3.0673828125, 3.52392578125, 3.98046875, 4.43701171875, 4.8935546875, 5.35009765625, 5.806640625, 6.26318359375, 6.7197265625, 7.17626953125, 7.6328125, 8.08935546875, 8.5458984375, 9.00244140625, 9.458984375, 9.91552734375, 10.3720703125, 10.82861328125, 11.28515625, 11.74169921875, 12.1982421875, 12.65478515625, 13.111328125, 13.56787109375, 14.0244140625, 14.48095703125, 14.9375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 9.0, 5.0, 9.0, 20.0, 18.0, 27.0, 29.0, 54.0, 52.0, 125.0, 136.0, 139.0, 93.0, 76.0, 52.0, 49.0, 29.0, 24.0, 15.0, 13.0, 7.0, 3.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023040771484375, -0.0022419095039367676, -0.002179741859436035, -0.0021175742149353027, -0.0020554065704345703, -0.001993238925933838, -0.0019310712814331055, -0.001868903636932373, -0.0018067359924316406, -0.0017445683479309082, -0.0016824007034301758, -0.0016202330589294434, -0.001558065414428711, -0.0014958977699279785, -0.001433730125427246, -0.0013715624809265137, -0.0013093948364257812, -0.0012472271919250488, -0.0011850595474243164, -0.001122891902923584, -0.0010607242584228516, -0.0009985566139221191, -0.0009363889694213867, -0.0008742213249206543, -0.0008120536804199219, -0.0007498860359191895, -0.000687718391418457, -0.0006255507469177246, -0.0005633831024169922, -0.0005012154579162598, -0.00043904781341552734, -0.0003768801689147949, -0.0003147125244140625, -0.0002525448799133301, -0.00019037723541259766, -0.00012820959091186523, -6.604194641113281e-05, -3.874301910400391e-06, 5.829334259033203e-05, 0.00012046098709106445, 0.00018262863159179688, 0.0002447962760925293, 0.0003069639205932617, 0.00036913156509399414, 0.00043129920959472656, 0.000493466854095459, 0.0005556344985961914, 0.0006178021430969238, 0.0006799697875976562, 0.0007421374320983887, 0.0008043050765991211, 0.0008664727210998535, 0.0009286403656005859, 0.0009908080101013184, 0.0010529756546020508, 0.0011151432991027832, 0.0011773109436035156, 0.001239478588104248, 0.0013016462326049805, 0.0013638138771057129, 0.0014259815216064453, 0.0014881491661071777, 0.0015503168106079102, 0.0016124844551086426, 0.001674652099609375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 6.0, 6.0, 8.0, 8.0, 10.0, 12.0, 22.0, 32.0, 60.0, 74.0, 118.0, 228.0, 310.0, 580.0, 1127.0, 2232.0, 5541.0, 19738.0, 120498.0, 655953.0, 200068.0, 28975.0, 7287.0, 2678.0, 1251.0, 638.0, 418.0, 236.0, 142.0, 96.0, 56.0, 42.0, 23.0, 24.0, 22.0, 10.0, 6.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-10.828125, -10.540283203125, -10.25244140625, -9.964599609375, -9.6767578125, -9.388916015625, -9.10107421875, -8.813232421875, -8.525390625, -8.237548828125, -7.94970703125, -7.661865234375, -7.3740234375, -7.086181640625, -6.79833984375, -6.510498046875, -6.22265625, -5.934814453125, -5.64697265625, -5.359130859375, -5.0712890625, -4.783447265625, -4.49560546875, -4.207763671875, -3.919921875, -3.632080078125, -3.34423828125, -3.056396484375, -2.7685546875, -2.480712890625, -2.19287109375, -1.905029296875, -1.6171875, -1.329345703125, -1.04150390625, -0.753662109375, -0.4658203125, -0.177978515625, 0.10986328125, 0.397705078125, 0.685546875, 0.973388671875, 1.26123046875, 1.549072265625, 1.8369140625, 2.124755859375, 2.41259765625, 2.700439453125, 2.98828125, 3.276123046875, 3.56396484375, 3.851806640625, 4.1396484375, 4.427490234375, 4.71533203125, 5.003173828125, 5.291015625, 5.578857421875, 5.86669921875, 6.154541015625, 6.4423828125, 6.730224609375, 7.01806640625, 7.305908203125, 7.59375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 8.0, 9.0, 7.0, 18.0, 16.0, 21.0, 36.0, 36.0, 45.0, 85.0, 95.0, 102.0, 92.0, 85.0, 72.0, 57.0, 54.0, 40.0, 38.0, 33.0, 19.0, 14.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.64453125, -6.34674072265625, -6.0489501953125, -5.75115966796875, -5.453369140625, -5.15557861328125, -4.8577880859375, -4.55999755859375, -4.26220703125, -3.96441650390625, -3.6666259765625, -3.36883544921875, -3.071044921875, -2.77325439453125, -2.4754638671875, -2.17767333984375, -1.8798828125, -1.58209228515625, -1.2843017578125, -0.98651123046875, -0.688720703125, -0.39093017578125, -0.0931396484375, 0.20465087890625, 0.50244140625, 0.80023193359375, 1.0980224609375, 1.39581298828125, 1.693603515625, 1.99139404296875, 2.2891845703125, 2.58697509765625, 2.884765625, 3.18255615234375, 3.4803466796875, 3.77813720703125, 4.075927734375, 4.37371826171875, 4.6715087890625, 4.96929931640625, 5.26708984375, 5.56488037109375, 5.8626708984375, 6.16046142578125, 6.458251953125, 6.75604248046875, 7.0538330078125, 7.35162353515625, 7.6494140625, 7.94720458984375, 8.2449951171875, 8.54278564453125, 8.840576171875, 9.13836669921875, 9.4361572265625, 9.73394775390625, 10.03173828125, 10.32952880859375, 10.6273193359375, 10.92510986328125, 11.222900390625, 11.52069091796875, 11.8184814453125, 12.11627197265625, 12.4140625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 6.0, 8.0, 23.0, 76.0, 114.0, 203.0, 176.0, 173.0, 99.0, 51.0, 32.0, 20.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-182.18984985351562, -176.3679962158203, -170.54612731933594, -164.72427368164062, -158.90240478515625, -153.08055114746094, -147.25869750976562, -141.43682861328125, -135.61497497558594, -129.79312133789062, -123.97125244140625, -118.14939880371094, -112.3275375366211, -106.50567626953125, -100.68382263183594, -94.8619613647461, -89.04010009765625, -83.2182388305664, -77.39637756347656, -71.57452392578125, -65.7526626586914, -59.93080139160156, -54.108943939208984, -48.287086486816406, -42.46522521972656, -36.64336395263672, -30.82150650024414, -24.99964714050293, -19.17778778076172, -13.355928421020508, -7.534069061279297, -1.7122116088867188, 4.109649658203125, 9.931509017944336, 15.753368377685547, 21.575227737426758, 27.39708709716797, 33.21894836425781, 39.04080581665039, 44.86266326904297, 50.68452453613281, 56.506385803222656, 62.328243255615234, 68.15010070800781, 73.97196197509766, 79.7938232421875, 85.61567687988281, 91.43753814697266, 97.2593994140625, 103.08126068115234, 108.90312194824219, 114.7249755859375, 120.54683685302734, 126.36869812011719, 132.1905517578125, 138.01242065429688, 143.8342742919922, 149.6561279296875, 155.47799682617188, 161.2998504638672, 167.1217041015625, 172.94357299804688, 178.7654266357422, 184.5872802734375, 190.40914916992188]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 7.0, 4.0, 9.0, 16.0, 12.0, 12.0, 27.0, 26.0, 24.0, 45.0, 44.0, 46.0, 51.0, 70.0, 60.0, 68.0, 74.0, 53.0, 68.0, 55.0, 48.0, 36.0, 33.0, 24.0, 25.0, 21.0, 13.0, 8.0, 4.0, 8.0, 5.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-135.56768798828125, -131.28904724121094, -127.01042175292969, -122.73178100585938, -118.4531478881836, -114.17451477050781, -109.89588165283203, -105.61724853515625, -101.33860778808594, -97.05997467041016, -92.78134155273438, -88.50270080566406, -84.22406768798828, -79.9454345703125, -75.66680145263672, -71.38816833496094, -67.10953521728516, -62.830902099609375, -58.55226516723633, -54.27363204956055, -49.9949951171875, -45.71636199951172, -41.43772888183594, -37.159095764160156, -32.88045883178711, -28.601823806762695, -24.32318878173828, -20.0445556640625, -15.765920639038086, -11.487285614013672, -7.208652496337891, -2.9300174713134766, 1.3486175537109375, 5.627252101898193, 9.90588665008545, 14.184520721435547, 18.46315574645996, 22.741790771484375, 27.020423889160156, 31.29905891418457, 35.577693939208984, 39.856327056884766, 44.13496398925781, 48.413597106933594, 52.692230224609375, 56.97086715698242, 61.2495002746582, 65.52813720703125, 69.80677032470703, 74.08540344238281, 78.3640365600586, 82.64266967773438, 86.92131042480469, 91.19994354248047, 95.47857666015625, 99.75720977783203, 104.03584289550781, 108.3144760131836, 112.59310913085938, 116.87174987792969, 121.15038299560547, 125.42901611328125, 129.7076416015625, 133.9862823486328, 138.26492309570312]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 3.0, 5.0, 6.0, 7.0, 20.0, 30.0, 41.0, 51.0, 124.0, 193.0, 376.0, 729.0, 1702.0, 4849.0, 23569.0, 3125642.0, 1006801.0, 22250.0, 4759.0, 1680.0, 696.0, 313.0, 163.0, 102.0, 62.0, 38.0, 19.0, 20.0, 13.0, 7.0, 8.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.109375, -26.33447265625, -25.5595703125, -24.78466796875, -24.009765625, -23.23486328125, -22.4599609375, -21.68505859375, -20.91015625, -20.13525390625, -19.3603515625, -18.58544921875, -17.810546875, -17.03564453125, -16.2607421875, -15.48583984375, -14.7109375, -13.93603515625, -13.1611328125, -12.38623046875, -11.611328125, -10.83642578125, -10.0615234375, -9.28662109375, -8.51171875, -7.73681640625, -6.9619140625, -6.18701171875, -5.412109375, -4.63720703125, -3.8623046875, -3.08740234375, -2.3125, -1.53759765625, -0.7626953125, 0.01220703125, 0.787109375, 1.56201171875, 2.3369140625, 3.11181640625, 3.88671875, 4.66162109375, 5.4365234375, 6.21142578125, 6.986328125, 7.76123046875, 8.5361328125, 9.31103515625, 10.0859375, 10.86083984375, 11.6357421875, 12.41064453125, 13.185546875, 13.96044921875, 14.7353515625, 15.51025390625, 16.28515625, 17.06005859375, 17.8349609375, 18.60986328125, 19.384765625, 20.15966796875, 20.9345703125, 21.70947265625, 22.484375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 4.0, 4.0, 9.0, 13.0, 23.0, 37.0, 37.0, 33.0, 57.0, 78.0, 88.0, 83.0, 87.0, 89.0, 66.0, 72.0, 55.0, 41.0, 33.0, 24.0, 23.0, 15.0, 5.0, 5.0, 7.0, 6.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.66796875, -7.41705322265625, -7.1661376953125, -6.91522216796875, -6.664306640625, -6.41339111328125, -6.1624755859375, -5.91156005859375, -5.66064453125, -5.40972900390625, -5.1588134765625, -4.90789794921875, -4.656982421875, -4.40606689453125, -4.1551513671875, -3.90423583984375, -3.6533203125, -3.40240478515625, -3.1514892578125, -2.90057373046875, -2.649658203125, -2.39874267578125, -2.1478271484375, -1.89691162109375, -1.64599609375, -1.39508056640625, -1.1441650390625, -0.89324951171875, -0.642333984375, -0.39141845703125, -0.1405029296875, 0.11041259765625, 0.361328125, 0.61224365234375, 0.8631591796875, 1.11407470703125, 1.364990234375, 1.61590576171875, 1.8668212890625, 2.11773681640625, 2.36865234375, 2.61956787109375, 2.8704833984375, 3.12139892578125, 3.372314453125, 3.62322998046875, 3.8741455078125, 4.12506103515625, 4.3759765625, 4.62689208984375, 4.8778076171875, 5.12872314453125, 5.379638671875, 5.63055419921875, 5.8814697265625, 6.13238525390625, 6.38330078125, 6.63421630859375, 6.8851318359375, 7.13604736328125, 7.386962890625, 7.63787841796875, 7.8887939453125, 8.13970947265625, 8.390625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 4.0, 2.0, 4.0, 3.0, 7.0, 7.0, 24.0, 17.0, 28.0, 37.0, 69.0, 100.0, 155.0, 321.0, 711.0, 1385.0, 3623.0, 12000.0, 66704.0, 3795554.0, 278378.0, 24697.0, 6234.0, 2230.0, 949.0, 420.0, 244.0, 115.0, 88.0, 57.0, 42.0, 21.0, 16.0, 12.0, 8.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.265625, -19.627197265625, -18.98876953125, -18.350341796875, -17.7119140625, -17.073486328125, -16.43505859375, -15.796630859375, -15.158203125, -14.519775390625, -13.88134765625, -13.242919921875, -12.6044921875, -11.966064453125, -11.32763671875, -10.689208984375, -10.05078125, -9.412353515625, -8.77392578125, -8.135498046875, -7.4970703125, -6.858642578125, -6.22021484375, -5.581787109375, -4.943359375, -4.304931640625, -3.66650390625, -3.028076171875, -2.3896484375, -1.751220703125, -1.11279296875, -0.474365234375, 0.1640625, 0.802490234375, 1.44091796875, 2.079345703125, 2.7177734375, 3.356201171875, 3.99462890625, 4.633056640625, 5.271484375, 5.909912109375, 6.54833984375, 7.186767578125, 7.8251953125, 8.463623046875, 9.10205078125, 9.740478515625, 10.37890625, 11.017333984375, 11.65576171875, 12.294189453125, 12.9326171875, 13.571044921875, 14.20947265625, 14.847900390625, 15.486328125, 16.124755859375, 16.76318359375, 17.401611328125, 18.0400390625, 18.678466796875, 19.31689453125, 19.955322265625, 20.59375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 6.0, 9.0, 2.0, 12.0, 10.0, 25.0, 56.0, 104.0, 222.0, 1969.0, 1229.0, 214.0, 89.0, 50.0, 23.0, 21.0, 15.0, 6.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.796875, -5.5203857421875, -5.243896484375, -4.9674072265625, -4.69091796875, -4.4144287109375, -4.137939453125, -3.8614501953125, -3.5849609375, -3.3084716796875, -3.031982421875, -2.7554931640625, -2.47900390625, -2.2025146484375, -1.926025390625, -1.6495361328125, -1.373046875, -1.0965576171875, -0.820068359375, -0.5435791015625, -0.26708984375, 0.0093994140625, 0.285888671875, 0.5623779296875, 0.8388671875, 1.1153564453125, 1.391845703125, 1.6683349609375, 1.94482421875, 2.2213134765625, 2.497802734375, 2.7742919921875, 3.05078125, 3.3272705078125, 3.603759765625, 3.8802490234375, 4.15673828125, 4.4332275390625, 4.709716796875, 4.9862060546875, 5.2626953125, 5.5391845703125, 5.815673828125, 6.0921630859375, 6.36865234375, 6.6451416015625, 6.921630859375, 7.1981201171875, 7.474609375, 7.7510986328125, 8.027587890625, 8.3040771484375, 8.58056640625, 8.8570556640625, 9.133544921875, 9.4100341796875, 9.6865234375, 9.9630126953125, 10.239501953125, 10.5159912109375, 10.79248046875, 11.0689697265625, 11.345458984375, 11.6219482421875, 11.8984375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 7.0, 7.0, 15.0, 26.0, 32.0, 49.0, 59.0, 88.0, 120.0, 117.0, 97.0, 98.0, 70.0, 62.0, 48.0, 35.0, 24.0, 15.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.38446044921875, -32.4602165222168, -31.535972595214844, -30.61172866821289, -29.687484741210938, -28.763240814208984, -27.83899688720703, -26.914752960205078, -25.990509033203125, -25.066265106201172, -24.14202117919922, -23.217777252197266, -22.293533325195312, -21.36928939819336, -20.445045471191406, -19.520801544189453, -18.5965576171875, -17.672313690185547, -16.748069763183594, -15.82382583618164, -14.899581909179688, -13.975337982177734, -13.051094055175781, -12.126850128173828, -11.202606201171875, -10.278362274169922, -9.354118347167969, -8.429874420166016, -7.5056304931640625, -6.581386566162109, -5.657142639160156, -4.732898712158203, -3.80865478515625, -2.884410858154297, -1.9601669311523438, -1.0359230041503906, -0.1116790771484375, 0.8125648498535156, 1.7368087768554688, 2.661052703857422, 3.585296630859375, 4.509540557861328, 5.433784484863281, 6.358028411865234, 7.2822723388671875, 8.20651626586914, 9.130760192871094, 10.055004119873047, 10.979248046875, 11.903491973876953, 12.827735900878906, 13.75197982788086, 14.676223754882812, 15.600467681884766, 16.52471160888672, 17.448955535888672, 18.373199462890625, 19.297443389892578, 20.22168731689453, 21.145931243896484, 22.070175170898438, 22.99441909790039, 23.918663024902344, 24.842906951904297, 25.76715087890625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 9.0, 8.0, 11.0, 14.0, 13.0, 18.0, 27.0, 23.0, 20.0, 23.0, 25.0, 38.0, 35.0, 40.0, 50.0, 53.0, 34.0, 42.0, 41.0, 45.0, 48.0, 50.0, 30.0, 30.0, 35.0, 24.0, 29.0, 28.0, 27.0, 25.0, 22.0, 11.0, 11.0, 13.0, 11.0, 6.0, 5.0, 4.0, 4.0, 3.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.463735580444336, -16.899127960205078, -16.334518432617188, -15.769909858703613, -15.205301284790039, -14.640692710876465, -14.07608413696289, -13.511475563049316, -12.946866989135742, -12.382258415222168, -11.817649841308594, -11.25304126739502, -10.688432693481445, -10.123824119567871, -9.559215545654297, -8.994606971740723, -8.429998397827148, -7.865389823913574, -7.30078125, -6.736172676086426, -6.171564102172852, -5.606955528259277, -5.042346954345703, -4.477738380432129, -3.9131298065185547, -3.3485212326049805, -2.7839126586914062, -2.219304084777832, -1.6546955108642578, -1.0900869369506836, -0.5254783630371094, 0.039130210876464844, 0.6037368774414062, 1.1683454513549805, 1.7329540252685547, 2.297562599182129, 2.862171173095703, 3.4267797470092773, 3.9913883209228516, 4.555996894836426, 5.12060546875, 5.685214042663574, 6.249822616577148, 6.814431190490723, 7.379039764404297, 7.943648338317871, 8.508256912231445, 9.07286548614502, 9.637474060058594, 10.202082633972168, 10.766691207885742, 11.331299781799316, 11.89590835571289, 12.460516929626465, 13.025125503540039, 13.589734077453613, 14.154342651367188, 14.718951225280762, 15.283559799194336, 15.84816837310791, 16.412776947021484, 16.977386474609375, 17.541994094848633, 18.10660171508789, 18.67121124267578]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 4.0, 3.0, 6.0, 1.0, 7.0, 11.0, 16.0, 17.0, 25.0, 41.0, 50.0, 96.0, 127.0, 202.0, 346.0, 599.0, 1076.0, 2011.0, 4083.0, 8621.0, 19464.0, 45742.0, 111199.0, 301605.0, 336996.0, 124643.0, 51158.0, 21727.0, 9270.0, 4440.0, 2225.0, 1138.0, 609.0, 377.0, 212.0, 137.0, 94.0, 60.0, 45.0, 25.0, 11.0, 11.0, 11.0, 9.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-12.3515625, -11.999267578125, -11.64697265625, -11.294677734375, -10.9423828125, -10.590087890625, -10.23779296875, -9.885498046875, -9.533203125, -9.180908203125, -8.82861328125, -8.476318359375, -8.1240234375, -7.771728515625, -7.41943359375, -7.067138671875, -6.71484375, -6.362548828125, -6.01025390625, -5.657958984375, -5.3056640625, -4.953369140625, -4.60107421875, -4.248779296875, -3.896484375, -3.544189453125, -3.19189453125, -2.839599609375, -2.4873046875, -2.135009765625, -1.78271484375, -1.430419921875, -1.078125, -0.725830078125, -0.37353515625, -0.021240234375, 0.3310546875, 0.683349609375, 1.03564453125, 1.387939453125, 1.740234375, 2.092529296875, 2.44482421875, 2.797119140625, 3.1494140625, 3.501708984375, 3.85400390625, 4.206298828125, 4.55859375, 4.910888671875, 5.26318359375, 5.615478515625, 5.9677734375, 6.320068359375, 6.67236328125, 7.024658203125, 7.376953125, 7.729248046875, 8.08154296875, 8.433837890625, 8.7861328125, 9.138427734375, 9.49072265625, 9.843017578125, 10.1953125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 11.0, 10.0, 13.0, 13.0, 15.0, 31.0, 17.0, 35.0, 35.0, 53.0, 53.0, 41.0, 72.0, 62.0, 69.0, 72.0, 60.0, 77.0, 38.0, 43.0, 45.0, 23.0, 19.0, 26.0, 14.0, 18.0, 8.0, 5.0, 3.0, 2.0, 3.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.30078125, -6.09271240234375, -5.8846435546875, -5.67657470703125, -5.468505859375, -5.26043701171875, -5.0523681640625, -4.84429931640625, -4.63623046875, -4.42816162109375, -4.2200927734375, -4.01202392578125, -3.803955078125, -3.59588623046875, -3.3878173828125, -3.17974853515625, -2.9716796875, -2.76361083984375, -2.5555419921875, -2.34747314453125, -2.139404296875, -1.93133544921875, -1.7232666015625, -1.51519775390625, -1.30712890625, -1.09906005859375, -0.8909912109375, -0.68292236328125, -0.474853515625, -0.26678466796875, -0.0587158203125, 0.14935302734375, 0.357421875, 0.56549072265625, 0.7735595703125, 0.98162841796875, 1.189697265625, 1.39776611328125, 1.6058349609375, 1.81390380859375, 2.02197265625, 2.23004150390625, 2.4381103515625, 2.64617919921875, 2.854248046875, 3.06231689453125, 3.2703857421875, 3.47845458984375, 3.6865234375, 3.89459228515625, 4.1026611328125, 4.31072998046875, 4.518798828125, 4.72686767578125, 4.9349365234375, 5.14300537109375, 5.35107421875, 5.55914306640625, 5.7672119140625, 5.97528076171875, 6.183349609375, 6.39141845703125, 6.5994873046875, 6.80755615234375, 7.015625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 3.0, 6.0, 10.0, 15.0, 17.0, 17.0, 27.0, 34.0, 55.0, 67.0, 94.0, 142.0, 204.0, 309.0, 442.0, 622.0, 1047.0, 1896.0, 4391.0, 14850.0, 86858.0, 672342.0, 222460.0, 29411.0, 6968.0, 2631.0, 1314.0, 713.0, 468.0, 313.0, 225.0, 156.0, 114.0, 80.0, 57.0, 54.0, 38.0, 20.0, 15.0, 16.0, 8.0, 9.0, 7.0, 8.0, 4.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-21.234375, -20.6044921875, -19.974609375, -19.3447265625, -18.71484375, -18.0849609375, -17.455078125, -16.8251953125, -16.1953125, -15.5654296875, -14.935546875, -14.3056640625, -13.67578125, -13.0458984375, -12.416015625, -11.7861328125, -11.15625, -10.5263671875, -9.896484375, -9.2666015625, -8.63671875, -8.0068359375, -7.376953125, -6.7470703125, -6.1171875, -5.4873046875, -4.857421875, -4.2275390625, -3.59765625, -2.9677734375, -2.337890625, -1.7080078125, -1.078125, -0.4482421875, 0.181640625, 0.8115234375, 1.44140625, 2.0712890625, 2.701171875, 3.3310546875, 3.9609375, 4.5908203125, 5.220703125, 5.8505859375, 6.48046875, 7.1103515625, 7.740234375, 8.3701171875, 9.0, 9.6298828125, 10.259765625, 10.8896484375, 11.51953125, 12.1494140625, 12.779296875, 13.4091796875, 14.0390625, 14.6689453125, 15.298828125, 15.9287109375, 16.55859375, 17.1884765625, 17.818359375, 18.4482421875, 19.078125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 9.0, 2.0, 11.0, 12.0, 14.0, 10.0, 13.0, 25.0, 21.0, 23.0, 33.0, 16.0, 31.0, 35.0, 30.0, 38.0, 39.0, 37.0, 30.0, 65.0, 48.0, 48.0, 41.0, 29.0, 34.0, 29.0, 29.0, 24.0, 28.0, 17.0, 29.0, 27.0, 25.0, 18.0, 11.0, 15.0, 12.0, 8.0, 4.0, 9.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-18.5, -17.914794921875, -17.32958984375, -16.744384765625, -16.1591796875, -15.573974609375, -14.98876953125, -14.403564453125, -13.818359375, -13.233154296875, -12.64794921875, -12.062744140625, -11.4775390625, -10.892333984375, -10.30712890625, -9.721923828125, -9.13671875, -8.551513671875, -7.96630859375, -7.381103515625, -6.7958984375, -6.210693359375, -5.62548828125, -5.040283203125, -4.455078125, -3.869873046875, -3.28466796875, -2.699462890625, -2.1142578125, -1.529052734375, -0.94384765625, -0.358642578125, 0.2265625, 0.811767578125, 1.39697265625, 1.982177734375, 2.5673828125, 3.152587890625, 3.73779296875, 4.322998046875, 4.908203125, 5.493408203125, 6.07861328125, 6.663818359375, 7.2490234375, 7.834228515625, 8.41943359375, 9.004638671875, 9.58984375, 10.175048828125, 10.76025390625, 11.345458984375, 11.9306640625, 12.515869140625, 13.10107421875, 13.686279296875, 14.271484375, 14.856689453125, 15.44189453125, 16.027099609375, 16.6123046875, 17.197509765625, 17.78271484375, 18.367919921875, 18.953125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 5.0, 9.0, 15.0, 12.0, 27.0, 34.0, 64.0, 98.0, 170.0, 330.0, 593.0, 1398.0, 3746.0, 12561.0, 60867.0, 419345.0, 462916.0, 65975.0, 13578.0, 3875.0, 1477.0, 649.0, 376.0, 161.0, 114.0, 64.0, 26.0, 29.0, 16.0, 8.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.7578125, -7.55377197265625, -7.3497314453125, -7.14569091796875, -6.941650390625, -6.73760986328125, -6.5335693359375, -6.32952880859375, -6.12548828125, -5.92144775390625, -5.7174072265625, -5.51336669921875, -5.309326171875, -5.10528564453125, -4.9012451171875, -4.69720458984375, -4.4931640625, -4.28912353515625, -4.0850830078125, -3.88104248046875, -3.677001953125, -3.47296142578125, -3.2689208984375, -3.06488037109375, -2.86083984375, -2.65679931640625, -2.4527587890625, -2.24871826171875, -2.044677734375, -1.84063720703125, -1.6365966796875, -1.43255615234375, -1.228515625, -1.02447509765625, -0.8204345703125, -0.61639404296875, -0.412353515625, -0.20831298828125, -0.0042724609375, 0.19976806640625, 0.40380859375, 0.60784912109375, 0.8118896484375, 1.01593017578125, 1.219970703125, 1.42401123046875, 1.6280517578125, 1.83209228515625, 2.0361328125, 2.24017333984375, 2.4442138671875, 2.64825439453125, 2.852294921875, 3.05633544921875, 3.2603759765625, 3.46441650390625, 3.66845703125, 3.87249755859375, 4.0765380859375, 4.28057861328125, 4.484619140625, 4.68865966796875, 4.8927001953125, 5.09674072265625, 5.30078125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 3.0, 12.0, 8.0, 14.0, 18.0, 28.0, 29.0, 56.0, 45.0, 70.0, 118.0, 186.0, 125.0, 68.0, 55.0, 43.0, 23.0, 25.0, 18.0, 17.0, 8.0, 9.0, 9.0, 2.0, 7.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001743316650390625, -0.0016775131225585938, -0.0016117095947265625, -0.0015459060668945312, -0.0014801025390625, -0.0014142990112304688, -0.0013484954833984375, -0.0012826919555664062, -0.001216888427734375, -0.0011510848999023438, -0.0010852813720703125, -0.0010194778442382812, -0.00095367431640625, -0.0008878707885742188, -0.0008220672607421875, -0.0007562637329101562, -0.000690460205078125, -0.0006246566772460938, -0.0005588531494140625, -0.0004930496215820312, -0.00042724609375, -0.00036144256591796875, -0.0002956390380859375, -0.00022983551025390625, -0.000164031982421875, -9.822845458984375e-05, -3.24249267578125e-05, 3.337860107421875e-05, 9.918212890625e-05, 0.00016498565673828125, 0.0002307891845703125, 0.00029659271240234375, 0.000362396240234375, 0.00042819976806640625, 0.0004940032958984375, 0.0005598068237304688, 0.0006256103515625, 0.0006914138793945312, 0.0007572174072265625, 0.0008230209350585938, 0.000888824462890625, 0.0009546279907226562, 0.0010204315185546875, 0.0010862350463867188, 0.00115203857421875, 0.0012178421020507812, 0.0012836456298828125, 0.0013494491577148438, 0.001415252685546875, 0.0014810562133789062, 0.0015468597412109375, 0.0016126632690429688, 0.001678466796875, 0.0017442703247070312, 0.0018100738525390625, 0.0018758773803710938, 0.001941680908203125, 0.0020074844360351562, 0.0020732879638671875, 0.0021390914916992188, 0.00220489501953125, 0.0022706985473632812, 0.0023365020751953125, 0.0024023056030273438, 0.002468109130859375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 5.0, 5.0, 4.0, 13.0, 24.0, 32.0, 58.0, 74.0, 116.0, 187.0, 276.0, 487.0, 891.0, 1667.0, 3865.0, 11870.0, 56801.0, 409167.0, 476518.0, 65266.0, 13380.0, 4047.0, 1666.0, 828.0, 472.0, 289.0, 181.0, 114.0, 81.0, 53.0, 35.0, 29.0, 10.0, 7.0, 12.0, 5.0, 5.0, 8.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.140625, -4.935302734375, -4.72998046875, -4.524658203125, -4.3193359375, -4.114013671875, -3.90869140625, -3.703369140625, -3.498046875, -3.292724609375, -3.08740234375, -2.882080078125, -2.6767578125, -2.471435546875, -2.26611328125, -2.060791015625, -1.85546875, -1.650146484375, -1.44482421875, -1.239501953125, -1.0341796875, -0.828857421875, -0.62353515625, -0.418212890625, -0.212890625, -0.007568359375, 0.19775390625, 0.403076171875, 0.6083984375, 0.813720703125, 1.01904296875, 1.224365234375, 1.4296875, 1.635009765625, 1.84033203125, 2.045654296875, 2.2509765625, 2.456298828125, 2.66162109375, 2.866943359375, 3.072265625, 3.277587890625, 3.48291015625, 3.688232421875, 3.8935546875, 4.098876953125, 4.30419921875, 4.509521484375, 4.71484375, 4.920166015625, 5.12548828125, 5.330810546875, 5.5361328125, 5.741455078125, 5.94677734375, 6.152099609375, 6.357421875, 6.562744140625, 6.76806640625, 6.973388671875, 7.1787109375, 7.384033203125, 7.58935546875, 7.794677734375, 8.0]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 2.0, 7.0, 10.0, 9.0, 9.0, 17.0, 18.0, 25.0, 18.0, 32.0, 31.0, 38.0, 34.0, 45.0, 48.0, 62.0, 56.0, 63.0, 69.0, 57.0, 43.0, 49.0, 40.0, 32.0, 21.0, 30.0, 25.0, 9.0, 25.0, 11.0, 15.0, 10.0, 5.0, 13.0, 6.0, 4.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-4.33203125, -4.18988037109375, -4.0477294921875, -3.90557861328125, -3.763427734375, -3.62127685546875, -3.4791259765625, -3.33697509765625, -3.19482421875, -3.05267333984375, -2.9105224609375, -2.76837158203125, -2.626220703125, -2.48406982421875, -2.3419189453125, -2.19976806640625, -2.0576171875, -1.91546630859375, -1.7733154296875, -1.63116455078125, -1.489013671875, -1.34686279296875, -1.2047119140625, -1.06256103515625, -0.92041015625, -0.77825927734375, -0.6361083984375, -0.49395751953125, -0.351806640625, -0.20965576171875, -0.0675048828125, 0.07464599609375, 0.216796875, 0.35894775390625, 0.5010986328125, 0.64324951171875, 0.785400390625, 0.92755126953125, 1.0697021484375, 1.21185302734375, 1.35400390625, 1.49615478515625, 1.6383056640625, 1.78045654296875, 1.922607421875, 2.06475830078125, 2.2069091796875, 2.34906005859375, 2.4912109375, 2.63336181640625, 2.7755126953125, 2.91766357421875, 3.059814453125, 3.20196533203125, 3.3441162109375, 3.48626708984375, 3.62841796875, 3.77056884765625, 3.9127197265625, 4.05487060546875, 4.197021484375, 4.33917236328125, 4.4813232421875, 4.62347412109375, 4.765625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 4.0, 7.0, 23.0, 38.0, 76.0, 124.0, 161.0, 190.0, 151.0, 118.0, 57.0, 21.0, 11.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.71223449707031, -103.33866119384766, -97.96509552001953, -92.59152221679688, -87.21795654296875, -81.8443832397461, -76.47080993652344, -71.09724426269531, -65.72367095947266, -60.350101470947266, -54.976531982421875, -49.60295867919922, -44.22938919067383, -38.85581970214844, -33.48224639892578, -28.10867691040039, -22.735107421875, -17.36153793334961, -11.987966537475586, -6.6143951416015625, -1.2408256530761719, 4.132743835449219, 9.506317138671875, 14.879886627197266, 20.253456115722656, 25.627025604248047, 31.00059700012207, 36.374168395996094, 41.747737884521484, 47.121307373046875, 52.49488067626953, 57.86845016479492, 63.24201965332031, 68.61559295654297, 73.9891586303711, 79.36273193359375, 84.73629760742188, 90.10987091064453, 95.48344421386719, 100.85700988769531, 106.23058319091797, 111.60415649414062, 116.97772216796875, 122.3512954711914, 127.72486877441406, 133.0984344482422, 138.47201538085938, 143.8455810546875, 149.21914672851562, 154.59271240234375, 159.96629333496094, 165.33985900878906, 170.7134246826172, 176.08700561523438, 181.4605712890625, 186.83413696289062, 192.20770263671875, 197.58126831054688, 202.95484924316406, 208.3284149169922, 213.7019805908203, 219.0755615234375, 224.44912719726562, 229.82269287109375, 235.19627380371094]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 8.0, 15.0, 13.0, 14.0, 25.0, 21.0, 23.0, 26.0, 32.0, 35.0, 38.0, 41.0, 45.0, 54.0, 51.0, 44.0, 52.0, 53.0, 50.0, 35.0, 33.0, 46.0, 36.0, 32.0, 34.0, 26.0, 22.0, 10.0, 10.0, 13.0, 12.0, 9.0, 9.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-95.49604797363281, -92.42346954345703, -89.35088348388672, -86.27830505371094, -83.20571899414062, -80.13314056396484, -77.06056213378906, -73.98797607421875, -70.91539764404297, -67.84281921386719, -64.77023315429688, -61.697654724121094, -58.62507247924805, -55.552490234375, -52.47990798950195, -49.407325744628906, -46.33474349975586, -43.26216125488281, -40.189579010009766, -37.11699676513672, -34.04441833496094, -30.97183609008789, -27.899253845214844, -24.82667350769043, -21.754091262817383, -18.681509017944336, -15.608928680419922, -12.536346435546875, -9.463765144348145, -6.391183853149414, -3.318601608276367, -0.24602127075195312, 2.8265609741210938, 5.899142265319824, 8.971723556518555, 12.044305801391602, 15.116887092590332, 18.189468383789062, 21.26205062866211, 24.334630966186523, 27.40721321105957, 30.479795455932617, 33.55237579345703, 36.62495803833008, 39.697540283203125, 42.770118713378906, 45.84270477294922, 48.915283203125, 51.98786544799805, 55.060447692871094, 58.13302993774414, 61.20561218261719, 64.27819061279297, 67.35076904296875, 70.42335510253906, 73.49593353271484, 76.56851959228516, 79.64109802246094, 82.71368408203125, 85.78626251220703, 88.85884857177734, 91.93142700195312, 95.00401306152344, 98.07659149169922, 101.149169921875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 3.0, 7.0, 5.0, 6.0, 19.0, 29.0, 44.0, 63.0, 86.0, 144.0, 200.0, 437.0, 911.0, 1842.0, 4312.0, 11444.0, 39021.0, 227196.0, 2561236.0, 1195745.0, 112572.0, 24735.0, 8100.0, 3120.0, 1402.0, 716.0, 368.0, 185.0, 125.0, 68.0, 43.0, 33.0, 18.0, 15.0, 14.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.03125, -12.686767578125, -12.34228515625, -11.997802734375, -11.6533203125, -11.308837890625, -10.96435546875, -10.619873046875, -10.275390625, -9.930908203125, -9.58642578125, -9.241943359375, -8.8974609375, -8.552978515625, -8.20849609375, -7.864013671875, -7.51953125, -7.175048828125, -6.83056640625, -6.486083984375, -6.1416015625, -5.797119140625, -5.45263671875, -5.108154296875, -4.763671875, -4.419189453125, -4.07470703125, -3.730224609375, -3.3857421875, -3.041259765625, -2.69677734375, -2.352294921875, -2.0078125, -1.663330078125, -1.31884765625, -0.974365234375, -0.6298828125, -0.285400390625, 0.05908203125, 0.403564453125, 0.748046875, 1.092529296875, 1.43701171875, 1.781494140625, 2.1259765625, 2.470458984375, 2.81494140625, 3.159423828125, 3.50390625, 3.848388671875, 4.19287109375, 4.537353515625, 4.8818359375, 5.226318359375, 5.57080078125, 5.915283203125, 6.259765625, 6.604248046875, 6.94873046875, 7.293212890625, 7.6376953125, 7.982177734375, 8.32666015625, 8.671142578125, 9.015625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 9.0, 5.0, 5.0, 12.0, 13.0, 14.0, 19.0, 24.0, 13.0, 14.0, 22.0, 22.0, 28.0, 34.0, 31.0, 24.0, 25.0, 34.0, 32.0, 48.0, 42.0, 31.0, 41.0, 36.0, 34.0, 35.0, 43.0, 30.0, 32.0, 22.0, 25.0, 24.0, 35.0, 19.0, 23.0, 17.0, 11.0, 10.0, 10.0, 9.0, 6.0, 11.0, 3.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.34375, -3.22576904296875, -3.1077880859375, -2.98980712890625, -2.871826171875, -2.75384521484375, -2.6358642578125, -2.51788330078125, -2.39990234375, -2.28192138671875, -2.1639404296875, -2.04595947265625, -1.927978515625, -1.80999755859375, -1.6920166015625, -1.57403564453125, -1.4560546875, -1.33807373046875, -1.2200927734375, -1.10211181640625, -0.984130859375, -0.86614990234375, -0.7481689453125, -0.63018798828125, -0.51220703125, -0.39422607421875, -0.2762451171875, -0.15826416015625, -0.040283203125, 0.07769775390625, 0.1956787109375, 0.31365966796875, 0.431640625, 0.54962158203125, 0.6676025390625, 0.78558349609375, 0.903564453125, 1.02154541015625, 1.1395263671875, 1.25750732421875, 1.37548828125, 1.49346923828125, 1.6114501953125, 1.72943115234375, 1.847412109375, 1.96539306640625, 2.0833740234375, 2.20135498046875, 2.3193359375, 2.43731689453125, 2.5552978515625, 2.67327880859375, 2.791259765625, 2.90924072265625, 3.0272216796875, 3.14520263671875, 3.26318359375, 3.38116455078125, 3.4991455078125, 3.61712646484375, 3.735107421875, 3.85308837890625, 3.9710693359375, 4.08905029296875, 4.20703125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 8.0, 3.0, 6.0, 15.0, 13.0, 20.0, 18.0, 32.0, 32.0, 68.0, 91.0, 156.0, 241.0, 401.0, 725.0, 1314.0, 2665.0, 5814.0, 14250.0, 42129.0, 180120.0, 1716939.0, 1957630.0, 199308.0, 45360.0, 14992.0, 5975.0, 2749.0, 1361.0, 730.0, 405.0, 226.0, 146.0, 94.0, 59.0, 52.0, 36.0, 22.0, 25.0, 14.0, 6.0, 8.0, 9.0, 3.0, 2.0, 1.0, 4.0, 5.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.234375, -8.916259765625, -8.59814453125, -8.280029296875, -7.9619140625, -7.643798828125, -7.32568359375, -7.007568359375, -6.689453125, -6.371337890625, -6.05322265625, -5.735107421875, -5.4169921875, -5.098876953125, -4.78076171875, -4.462646484375, -4.14453125, -3.826416015625, -3.50830078125, -3.190185546875, -2.8720703125, -2.553955078125, -2.23583984375, -1.917724609375, -1.599609375, -1.281494140625, -0.96337890625, -0.645263671875, -0.3271484375, -0.009033203125, 0.30908203125, 0.627197265625, 0.9453125, 1.263427734375, 1.58154296875, 1.899658203125, 2.2177734375, 2.535888671875, 2.85400390625, 3.172119140625, 3.490234375, 3.808349609375, 4.12646484375, 4.444580078125, 4.7626953125, 5.080810546875, 5.39892578125, 5.717041015625, 6.03515625, 6.353271484375, 6.67138671875, 6.989501953125, 7.3076171875, 7.625732421875, 7.94384765625, 8.261962890625, 8.580078125, 8.898193359375, 9.21630859375, 9.534423828125, 9.8525390625, 10.170654296875, 10.48876953125, 10.806884765625, 11.125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 5.0, 0.0, 5.0, 4.0, 16.0, 18.0, 13.0, 18.0, 23.0, 37.0, 55.0, 68.0, 121.0, 166.0, 246.0, 447.0, 695.0, 708.0, 516.0, 343.0, 170.0, 119.0, 73.0, 60.0, 44.0, 24.0, 22.0, 10.0, 7.0, 9.0, 8.0, 5.0, 8.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.78125, -14.3482666015625, -13.915283203125, -13.4822998046875, -13.04931640625, -12.6163330078125, -12.183349609375, -11.7503662109375, -11.3173828125, -10.8843994140625, -10.451416015625, -10.0184326171875, -9.58544921875, -9.1524658203125, -8.719482421875, -8.2864990234375, -7.853515625, -7.4205322265625, -6.987548828125, -6.5545654296875, -6.12158203125, -5.6885986328125, -5.255615234375, -4.8226318359375, -4.3896484375, -3.9566650390625, -3.523681640625, -3.0906982421875, -2.65771484375, -2.2247314453125, -1.791748046875, -1.3587646484375, -0.92578125, -0.4927978515625, -0.059814453125, 0.3731689453125, 0.80615234375, 1.2391357421875, 1.672119140625, 2.1051025390625, 2.5380859375, 2.9710693359375, 3.404052734375, 3.8370361328125, 4.27001953125, 4.7030029296875, 5.135986328125, 5.5689697265625, 6.001953125, 6.4349365234375, 6.867919921875, 7.3009033203125, 7.73388671875, 8.1668701171875, 8.599853515625, 9.0328369140625, 9.4658203125, 9.8988037109375, 10.331787109375, 10.7647705078125, 11.19775390625, 11.6307373046875, 12.063720703125, 12.4967041015625, 12.9296875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 9.0, 8.0, 13.0, 33.0, 39.0, 109.0, 147.0, 160.0, 196.0, 113.0, 77.0, 36.0, 18.0, 10.0, 8.0, 5.0, 2.0, 6.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.97355651855469, -105.54515838623047, -101.11676025390625, -96.6883544921875, -92.25995635986328, -87.83155822753906, -83.40315246582031, -78.9747543334961, -74.54635620117188, -70.11795806884766, -65.68955993652344, -61.26115417480469, -56.83275604248047, -52.40435791015625, -47.975955963134766, -43.54755401611328, -39.11915588378906, -34.690757751464844, -30.26235580444336, -25.833955764770508, -21.405555725097656, -16.977155685424805, -12.548755645751953, -8.120355606079102, -3.69195556640625, 0.7364444732666016, 5.164844512939453, 9.593244552612305, 14.021644592285156, 18.450044631958008, 22.87844467163086, 27.30684471130371, 31.7352294921875, 36.16362762451172, 40.5920295715332, 45.02043151855469, 49.448829650878906, 53.877227783203125, 58.30562973022461, 62.734031677246094, 67.16242980957031, 71.59082794189453, 76.01922607421875, 80.4476318359375, 84.87602996826172, 89.30442810058594, 93.73283386230469, 98.1612319946289, 102.58963012695312, 107.01802825927734, 111.44642639160156, 115.87483215332031, 120.30323028564453, 124.73162841796875, 129.1600341796875, 133.5884246826172, 138.01683044433594, 142.4452362060547, 146.87362670898438, 151.30203247070312, 155.73043823242188, 160.15882873535156, 164.5872344970703, 169.015625, 173.44403076171875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 4.0, 3.0, 10.0, 3.0, 11.0, 13.0, 12.0, 11.0, 33.0, 16.0, 25.0, 30.0, 33.0, 31.0, 29.0, 37.0, 45.0, 48.0, 60.0, 37.0, 48.0, 40.0, 45.0, 43.0, 32.0, 32.0, 32.0, 34.0, 41.0, 19.0, 25.0, 21.0, 22.0, 15.0, 14.0, 15.0, 8.0, 3.0, 9.0, 5.0, 1.0, 11.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.4970703125, -54.5816650390625, -52.666263580322266, -50.750858306884766, -48.83545684814453, -46.92005157470703, -45.00464630126953, -43.0892448425293, -41.17384338378906, -39.25843811035156, -37.34303665161133, -35.42763137817383, -33.512229919433594, -31.596824645996094, -29.681421279907227, -27.76601791381836, -25.85061264038086, -23.935209274291992, -22.019805908203125, -20.104400634765625, -18.18899917602539, -16.27359390258789, -14.358190536499023, -12.442787170410156, -10.527383804321289, -8.611980438232422, -6.6965765953063965, -4.781172752380371, -2.865769386291504, -0.9503660202026367, 0.9650382995605469, 2.880441665649414, 4.795845031738281, 6.711248397827148, 8.626651763916016, 10.5420560836792, 12.457459449768066, 14.372862815856934, 16.288267135620117, 18.203670501708984, 20.11907386779785, 22.03447723388672, 23.949880599975586, 25.865283966064453, 27.780689239501953, 29.696090698242188, 31.611495971679688, 33.52690124511719, 35.44230270385742, 37.35770797729492, 39.273109436035156, 41.188514709472656, 43.10391616821289, 45.01932144165039, 46.934722900390625, 48.850128173828125, 50.765533447265625, 52.680938720703125, 54.59634017944336, 56.51174545288086, 58.427146911621094, 60.342552185058594, 62.257957458496094, 64.17335510253906, 66.08876037597656]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 13.0, 11.0, 11.0, 19.0, 28.0, 32.0, 59.0, 75.0, 126.0, 220.0, 303.0, 503.0, 894.0, 1523.0, 2661.0, 5040.0, 9832.0, 20437.0, 44655.0, 113398.0, 410967.0, 287308.0, 81775.0, 34628.0, 16512.0, 7897.0, 4148.0, 2254.0, 1232.0, 757.0, 462.0, 277.0, 185.0, 110.0, 60.0, 41.0, 32.0, 21.0, 14.0, 10.0, 12.0, 10.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.609375, -9.2762451171875, -8.943115234375, -8.6099853515625, -8.27685546875, -7.9437255859375, -7.610595703125, -7.2774658203125, -6.9443359375, -6.6112060546875, -6.278076171875, -5.9449462890625, -5.61181640625, -5.2786865234375, -4.945556640625, -4.6124267578125, -4.279296875, -3.9461669921875, -3.613037109375, -3.2799072265625, -2.94677734375, -2.6136474609375, -2.280517578125, -1.9473876953125, -1.6142578125, -1.2811279296875, -0.947998046875, -0.6148681640625, -0.28173828125, 0.0513916015625, 0.384521484375, 0.7176513671875, 1.05078125, 1.3839111328125, 1.717041015625, 2.0501708984375, 2.38330078125, 2.7164306640625, 3.049560546875, 3.3826904296875, 3.7158203125, 4.0489501953125, 4.382080078125, 4.7152099609375, 5.04833984375, 5.3814697265625, 5.714599609375, 6.0477294921875, 6.380859375, 6.7139892578125, 7.047119140625, 7.3802490234375, 7.71337890625, 8.0465087890625, 8.379638671875, 8.7127685546875, 9.0458984375, 9.3790283203125, 9.712158203125, 10.0452880859375, 10.37841796875, 10.7115478515625, 11.044677734375, 11.3778076171875, 11.7109375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 0.0, 6.0, 2.0, 6.0, 7.0, 11.0, 20.0, 21.0, 16.0, 24.0, 23.0, 35.0, 47.0, 40.0, 49.0, 41.0, 49.0, 54.0, 52.0, 52.0, 52.0, 57.0, 54.0, 45.0, 44.0, 27.0, 30.0, 27.0, 21.0, 26.0, 19.0, 12.0, 13.0, 7.0, 4.0, 3.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.888671875, -3.719757080078125, -3.55084228515625, -3.381927490234375, -3.2130126953125, -3.044097900390625, -2.87518310546875, -2.706268310546875, -2.537353515625, -2.368438720703125, -2.19952392578125, -2.030609130859375, -1.8616943359375, -1.692779541015625, -1.52386474609375, -1.354949951171875, -1.18603515625, -1.017120361328125, -0.84820556640625, -0.679290771484375, -0.5103759765625, -0.341461181640625, -0.17254638671875, -0.003631591796875, 0.165283203125, 0.334197998046875, 0.50311279296875, 0.672027587890625, 0.8409423828125, 1.009857177734375, 1.17877197265625, 1.347686767578125, 1.5166015625, 1.685516357421875, 1.85443115234375, 2.023345947265625, 2.1922607421875, 2.361175537109375, 2.53009033203125, 2.699005126953125, 2.867919921875, 3.036834716796875, 3.20574951171875, 3.374664306640625, 3.5435791015625, 3.712493896484375, 3.88140869140625, 4.050323486328125, 4.21923828125, 4.388153076171875, 4.55706787109375, 4.725982666015625, 4.8948974609375, 5.063812255859375, 5.23272705078125, 5.401641845703125, 5.570556640625, 5.739471435546875, 5.90838623046875, 6.077301025390625, 6.2462158203125, 6.415130615234375, 6.58404541015625, 6.752960205078125, 6.921875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 4.0, 5.0, 7.0, 11.0, 13.0, 27.0, 42.0, 51.0, 89.0, 177.0, 235.0, 453.0, 898.0, 1988.0, 6503.0, 50666.0, 893931.0, 80679.0, 8224.0, 2261.0, 992.0, 521.0, 305.0, 174.0, 118.0, 68.0, 36.0, 28.0, 18.0, 8.0, 8.0, 7.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.75, -27.70751953125, -26.6650390625, -25.62255859375, -24.580078125, -23.53759765625, -22.4951171875, -21.45263671875, -20.41015625, -19.36767578125, -18.3251953125, -17.28271484375, -16.240234375, -15.19775390625, -14.1552734375, -13.11279296875, -12.0703125, -11.02783203125, -9.9853515625, -8.94287109375, -7.900390625, -6.85791015625, -5.8154296875, -4.77294921875, -3.73046875, -2.68798828125, -1.6455078125, -0.60302734375, 0.439453125, 1.48193359375, 2.5244140625, 3.56689453125, 4.609375, 5.65185546875, 6.6943359375, 7.73681640625, 8.779296875, 9.82177734375, 10.8642578125, 11.90673828125, 12.94921875, 13.99169921875, 15.0341796875, 16.07666015625, 17.119140625, 18.16162109375, 19.2041015625, 20.24658203125, 21.2890625, 22.33154296875, 23.3740234375, 24.41650390625, 25.458984375, 26.50146484375, 27.5439453125, 28.58642578125, 29.62890625, 30.67138671875, 31.7138671875, 32.75634765625, 33.798828125, 34.84130859375, 35.8837890625, 36.92626953125, 37.96875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 6.0, 8.0, 6.0, 10.0, 11.0, 15.0, 14.0, 17.0, 27.0, 28.0, 24.0, 27.0, 46.0, 48.0, 46.0, 43.0, 49.0, 48.0, 42.0, 56.0, 54.0, 41.0, 41.0, 41.0, 44.0, 24.0, 28.0, 28.0, 19.0, 19.0, 17.0, 13.0, 9.0, 10.0, 7.0, 6.0, 5.0, 5.0, 1.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-23.25, -22.57763671875, -21.9052734375, -21.23291015625, -20.560546875, -19.88818359375, -19.2158203125, -18.54345703125, -17.87109375, -17.19873046875, -16.5263671875, -15.85400390625, -15.181640625, -14.50927734375, -13.8369140625, -13.16455078125, -12.4921875, -11.81982421875, -11.1474609375, -10.47509765625, -9.802734375, -9.13037109375, -8.4580078125, -7.78564453125, -7.11328125, -6.44091796875, -5.7685546875, -5.09619140625, -4.423828125, -3.75146484375, -3.0791015625, -2.40673828125, -1.734375, -1.06201171875, -0.3896484375, 0.28271484375, 0.955078125, 1.62744140625, 2.2998046875, 2.97216796875, 3.64453125, 4.31689453125, 4.9892578125, 5.66162109375, 6.333984375, 7.00634765625, 7.6787109375, 8.35107421875, 9.0234375, 9.69580078125, 10.3681640625, 11.04052734375, 11.712890625, 12.38525390625, 13.0576171875, 13.72998046875, 14.40234375, 15.07470703125, 15.7470703125, 16.41943359375, 17.091796875, 17.76416015625, 18.4365234375, 19.10888671875, 19.78125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 5.0, 4.0, 12.0, 8.0, 17.0, 23.0, 30.0, 66.0, 111.0, 174.0, 389.0, 879.0, 2548.0, 9980.0, 70451.0, 839123.0, 106836.0, 12855.0, 3105.0, 1005.0, 432.0, 191.0, 109.0, 60.0, 47.0, 25.0, 20.0, 9.0, 10.0, 8.0, 10.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.625, -11.27880859375, -10.9326171875, -10.58642578125, -10.240234375, -9.89404296875, -9.5478515625, -9.20166015625, -8.85546875, -8.50927734375, -8.1630859375, -7.81689453125, -7.470703125, -7.12451171875, -6.7783203125, -6.43212890625, -6.0859375, -5.73974609375, -5.3935546875, -5.04736328125, -4.701171875, -4.35498046875, -4.0087890625, -3.66259765625, -3.31640625, -2.97021484375, -2.6240234375, -2.27783203125, -1.931640625, -1.58544921875, -1.2392578125, -0.89306640625, -0.546875, -0.20068359375, 0.1455078125, 0.49169921875, 0.837890625, 1.18408203125, 1.5302734375, 1.87646484375, 2.22265625, 2.56884765625, 2.9150390625, 3.26123046875, 3.607421875, 3.95361328125, 4.2998046875, 4.64599609375, 4.9921875, 5.33837890625, 5.6845703125, 6.03076171875, 6.376953125, 6.72314453125, 7.0693359375, 7.41552734375, 7.76171875, 8.10791015625, 8.4541015625, 8.80029296875, 9.146484375, 9.49267578125, 9.8388671875, 10.18505859375, 10.53125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 7.0, 12.0, 10.0, 15.0, 22.0, 15.0, 42.0, 49.0, 95.0, 259.0, 212.0, 102.0, 49.0, 28.0, 27.0, 19.0, 16.0, 8.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027637481689453125, -0.002664625644683838, -0.0025655031204223633, -0.0024663805961608887, -0.002367258071899414, -0.0022681355476379395, -0.002169013023376465, -0.0020698904991149902, -0.0019707679748535156, -0.001871645450592041, -0.0017725229263305664, -0.0016734004020690918, -0.0015742778778076172, -0.0014751553535461426, -0.001376032829284668, -0.0012769103050231934, -0.0011777877807617188, -0.0010786652565002441, -0.0009795427322387695, -0.0008804202079772949, -0.0007812976837158203, -0.0006821751594543457, -0.0005830526351928711, -0.0004839301109313965, -0.0003848075866699219, -0.00028568506240844727, -0.00018656253814697266, -8.744001388549805e-05, 1.1682510375976562e-05, 0.00011080503463745117, 0.00020992755889892578, 0.0003090500831604004, 0.000408172607421875, 0.0005072951316833496, 0.0006064176559448242, 0.0007055401802062988, 0.0008046627044677734, 0.000903785228729248, 0.0010029077529907227, 0.0011020302772521973, 0.0012011528015136719, 0.0013002753257751465, 0.001399397850036621, 0.0014985203742980957, 0.0015976428985595703, 0.001696765422821045, 0.0017958879470825195, 0.0018950104713439941, 0.0019941329956054688, 0.0020932555198669434, 0.002192378044128418, 0.0022915005683898926, 0.002390623092651367, 0.002489745616912842, 0.0025888681411743164, 0.002687990665435791, 0.0027871131896972656, 0.0028862357139587402, 0.002985358238220215, 0.0030844807624816895, 0.003183603286743164, 0.0032827258110046387, 0.0033818483352661133, 0.003480970859527588, 0.0035800933837890625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 0.0, 3.0, 6.0, 10.0, 18.0, 29.0, 34.0, 43.0, 50.0, 97.0, 142.0, 284.0, 410.0, 759.0, 1523.0, 3512.0, 11043.0, 68778.0, 729965.0, 199875.0, 21969.0, 5567.0, 2096.0, 945.0, 504.0, 325.0, 169.0, 118.0, 73.0, 69.0, 44.0, 23.0, 15.0, 12.0, 7.0, 16.0, 6.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.08984375, -6.83404541015625, -6.5782470703125, -6.32244873046875, -6.066650390625, -5.81085205078125, -5.5550537109375, -5.29925537109375, -5.04345703125, -4.78765869140625, -4.5318603515625, -4.27606201171875, -4.020263671875, -3.76446533203125, -3.5086669921875, -3.25286865234375, -2.9970703125, -2.74127197265625, -2.4854736328125, -2.22967529296875, -1.973876953125, -1.71807861328125, -1.4622802734375, -1.20648193359375, -0.95068359375, -0.69488525390625, -0.4390869140625, -0.18328857421875, 0.072509765625, 0.32830810546875, 0.5841064453125, 0.83990478515625, 1.095703125, 1.35150146484375, 1.6072998046875, 1.86309814453125, 2.118896484375, 2.37469482421875, 2.6304931640625, 2.88629150390625, 3.14208984375, 3.39788818359375, 3.6536865234375, 3.90948486328125, 4.165283203125, 4.42108154296875, 4.6768798828125, 4.93267822265625, 5.1884765625, 5.44427490234375, 5.7000732421875, 5.95587158203125, 6.211669921875, 6.46746826171875, 6.7232666015625, 6.97906494140625, 7.23486328125, 7.49066162109375, 7.7464599609375, 8.00225830078125, 8.258056640625, 8.51385498046875, 8.7696533203125, 9.02545166015625, 9.28125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 5.0, 4.0, 11.0, 8.0, 11.0, 10.0, 20.0, 15.0, 16.0, 28.0, 37.0, 39.0, 52.0, 73.0, 92.0, 85.0, 96.0, 85.0, 65.0, 44.0, 37.0, 40.0, 21.0, 27.0, 16.0, 16.0, 8.0, 10.0, 5.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.1171875, -4.9326171875, -4.748046875, -4.5634765625, -4.37890625, -4.1943359375, -4.009765625, -3.8251953125, -3.640625, -3.4560546875, -3.271484375, -3.0869140625, -2.90234375, -2.7177734375, -2.533203125, -2.3486328125, -2.1640625, -1.9794921875, -1.794921875, -1.6103515625, -1.42578125, -1.2412109375, -1.056640625, -0.8720703125, -0.6875, -0.5029296875, -0.318359375, -0.1337890625, 0.05078125, 0.2353515625, 0.419921875, 0.6044921875, 0.7890625, 0.9736328125, 1.158203125, 1.3427734375, 1.52734375, 1.7119140625, 1.896484375, 2.0810546875, 2.265625, 2.4501953125, 2.634765625, 2.8193359375, 3.00390625, 3.1884765625, 3.373046875, 3.5576171875, 3.7421875, 3.9267578125, 4.111328125, 4.2958984375, 4.48046875, 4.6650390625, 4.849609375, 5.0341796875, 5.21875, 5.4033203125, 5.587890625, 5.7724609375, 5.95703125, 6.1416015625, 6.326171875, 6.5107421875, 6.6953125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 5.0, 9.0, 12.0, 32.0, 45.0, 84.0, 134.0, 185.0, 175.0, 146.0, 81.0, 47.0, 24.0, 8.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-152.63987731933594, -147.70834350585938, -142.7768096923828, -137.8452606201172, -132.91372680664062, -127.98219299316406, -123.0506591796875, -118.11912536621094, -113.18758392333984, -108.25605010986328, -103.32450866699219, -98.39297485351562, -93.46144104003906, -88.52989959716797, -83.5983657836914, -78.66682434082031, -73.73529052734375, -68.80375671386719, -63.872215270996094, -58.94068145751953, -54.0091438293457, -49.077606201171875, -44.14607238769531, -39.214534759521484, -34.282997131347656, -29.351459503173828, -24.419923782348633, -19.488388061523438, -14.55685043334961, -9.625312805175781, -4.693777084350586, 0.23775863647460938, 5.1693115234375, 10.100848197937012, 15.032384872436523, 19.96392059326172, 24.895458221435547, 29.826995849609375, 34.75852966308594, 39.690067291259766, 44.621604919433594, 49.55314254760742, 54.48468017578125, 59.41621398925781, 64.34774780273438, 69.27928924560547, 74.21082305908203, 79.14236450195312, 84.07389831542969, 89.00543212890625, 93.93697357177734, 98.8685073852539, 103.800048828125, 108.73158264160156, 113.66311645507812, 118.59465026855469, 123.52619171142578, 128.45773315429688, 133.38926696777344, 138.32080078125, 143.25233459472656, 148.18386840820312, 153.11541748046875, 158.0469512939453, 162.97848510742188]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 7.0, 2.0, 6.0, 8.0, 7.0, 8.0, 12.0, 13.0, 13.0, 13.0, 17.0, 18.0, 22.0, 27.0, 33.0, 23.0, 32.0, 44.0, 59.0, 55.0, 55.0, 51.0, 47.0, 57.0, 43.0, 32.0, 49.0, 38.0, 30.0, 30.0, 16.0, 19.0, 21.0, 16.0, 18.0, 14.0, 9.0, 8.0, 8.0, 8.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-91.1695556640625, -88.5467758178711, -85.92399597167969, -83.30122375488281, -80.6784439086914, -78.0556640625, -75.4328842163086, -72.81010437011719, -70.18733215332031, -67.5645523071289, -64.9417724609375, -62.31899642944336, -59.69622039794922, -57.07344055175781, -54.450660705566406, -51.827880859375, -49.205101013183594, -46.58232116699219, -43.95954513549805, -41.33676528930664, -38.7139892578125, -36.091209411621094, -33.46842956542969, -30.845651626586914, -28.22287368774414, -25.600095748901367, -22.977317810058594, -20.354537963867188, -17.731760025024414, -15.10898208618164, -12.48620319366455, -9.863424301147461, -7.240653991699219, -4.617875576019287, -1.9950971603393555, 0.6276812553405762, 3.250459671020508, 5.873237609863281, 8.496016502380371, 11.118795394897461, 13.741573333740234, 16.364351272583008, 18.98712921142578, 21.609909057617188, 24.23268699645996, 26.855464935302734, 29.47824478149414, 32.10102081298828, 34.72380065917969, 37.346580505371094, 39.969356536865234, 42.59213638305664, 45.21491241455078, 47.83769226074219, 50.460472106933594, 53.083251953125, 55.70602798461914, 58.32880783081055, 60.95158386230469, 63.574363708496094, 66.1971435546875, 68.81991577148438, 71.44269561767578, 74.06547546386719, 76.6882553100586]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 6.0, 2.0, 7.0, 4.0, 6.0, 11.0, 17.0, 17.0, 22.0, 35.0, 37.0, 65.0, 86.0, 125.0, 209.0, 505.0, 1874.0, 13072.0, 771556.0, 3373142.0, 29129.0, 2928.0, 662.0, 268.0, 160.0, 103.0, 59.0, 43.0, 34.0, 32.0, 9.0, 14.0, 11.0, 12.0, 4.0, 7.0, 3.0, 2.0, 1.0, 1.0, 3.0, 6.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.21875, -18.483642578125, -17.74853515625, -17.013427734375, -16.2783203125, -15.543212890625, -14.80810546875, -14.072998046875, -13.337890625, -12.602783203125, -11.86767578125, -11.132568359375, -10.3974609375, -9.662353515625, -8.92724609375, -8.192138671875, -7.45703125, -6.721923828125, -5.98681640625, -5.251708984375, -4.5166015625, -3.781494140625, -3.04638671875, -2.311279296875, -1.576171875, -0.841064453125, -0.10595703125, 0.629150390625, 1.3642578125, 2.099365234375, 2.83447265625, 3.569580078125, 4.3046875, 5.039794921875, 5.77490234375, 6.510009765625, 7.2451171875, 7.980224609375, 8.71533203125, 9.450439453125, 10.185546875, 10.920654296875, 11.65576171875, 12.390869140625, 13.1259765625, 13.861083984375, 14.59619140625, 15.331298828125, 16.06640625, 16.801513671875, 17.53662109375, 18.271728515625, 19.0068359375, 19.741943359375, 20.47705078125, 21.212158203125, 21.947265625, 22.682373046875, 23.41748046875, 24.152587890625, 24.8876953125, 25.622802734375, 26.35791015625, 27.093017578125, 27.828125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 13.0, 2.0, 9.0, 15.0, 18.0, 15.0, 15.0, 25.0, 28.0, 28.0, 41.0, 40.0, 50.0, 46.0, 41.0, 55.0, 50.0, 59.0, 65.0, 49.0, 33.0, 53.0, 39.0, 33.0, 33.0, 26.0, 22.0, 28.0, 19.0, 15.0, 6.0, 5.0, 8.0, 8.0, 4.0, 3.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.84375, -5.68133544921875, -5.5189208984375, -5.35650634765625, -5.194091796875, -5.03167724609375, -4.8692626953125, -4.70684814453125, -4.54443359375, -4.38201904296875, -4.2196044921875, -4.05718994140625, -3.894775390625, -3.73236083984375, -3.5699462890625, -3.40753173828125, -3.2451171875, -3.08270263671875, -2.9202880859375, -2.75787353515625, -2.595458984375, -2.43304443359375, -2.2706298828125, -2.10821533203125, -1.94580078125, -1.78338623046875, -1.6209716796875, -1.45855712890625, -1.296142578125, -1.13372802734375, -0.9713134765625, -0.80889892578125, -0.646484375, -0.48406982421875, -0.3216552734375, -0.15924072265625, 0.003173828125, 0.16558837890625, 0.3280029296875, 0.49041748046875, 0.65283203125, 0.81524658203125, 0.9776611328125, 1.14007568359375, 1.302490234375, 1.46490478515625, 1.6273193359375, 1.78973388671875, 1.9521484375, 2.11456298828125, 2.2769775390625, 2.43939208984375, 2.601806640625, 2.76422119140625, 2.9266357421875, 3.08905029296875, 3.25146484375, 3.41387939453125, 3.5762939453125, 3.73870849609375, 3.901123046875, 4.06353759765625, 4.2259521484375, 4.38836669921875, 4.55078125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 3.0, 4.0, 10.0, 3.0, 9.0, 13.0, 24.0, 33.0, 46.0, 74.0, 115.0, 204.0, 392.0, 763.0, 1602.0, 4273.0, 12146.0, 45950.0, 386329.0, 3271612.0, 405563.0, 45421.0, 11731.0, 4231.0, 1718.0, 848.0, 449.0, 278.0, 160.0, 92.0, 51.0, 43.0, 23.0, 18.0, 15.0, 11.0, 7.0, 9.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.4453125, -11.029296875, -10.61328125, -10.197265625, -9.78125, -9.365234375, -8.94921875, -8.533203125, -8.1171875, -7.701171875, -7.28515625, -6.869140625, -6.453125, -6.037109375, -5.62109375, -5.205078125, -4.7890625, -4.373046875, -3.95703125, -3.541015625, -3.125, -2.708984375, -2.29296875, -1.876953125, -1.4609375, -1.044921875, -0.62890625, -0.212890625, 0.203125, 0.619140625, 1.03515625, 1.451171875, 1.8671875, 2.283203125, 2.69921875, 3.115234375, 3.53125, 3.947265625, 4.36328125, 4.779296875, 5.1953125, 5.611328125, 6.02734375, 6.443359375, 6.859375, 7.275390625, 7.69140625, 8.107421875, 8.5234375, 8.939453125, 9.35546875, 9.771484375, 10.1875, 10.603515625, 11.01953125, 11.435546875, 11.8515625, 12.267578125, 12.68359375, 13.099609375, 13.515625, 13.931640625, 14.34765625, 14.763671875, 15.1796875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 5.0, 1.0, 3.0, 3.0, 3.0, 7.0, 9.0, 12.0, 10.0, 21.0, 34.0, 54.0, 59.0, 116.0, 166.0, 316.0, 571.0, 785.0, 770.0, 458.0, 276.0, 147.0, 92.0, 43.0, 30.0, 25.0, 16.0, 7.0, 15.0, 8.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.296875, -8.851806640625, -8.40673828125, -7.961669921875, -7.5166015625, -7.071533203125, -6.62646484375, -6.181396484375, -5.736328125, -5.291259765625, -4.84619140625, -4.401123046875, -3.9560546875, -3.510986328125, -3.06591796875, -2.620849609375, -2.17578125, -1.730712890625, -1.28564453125, -0.840576171875, -0.3955078125, 0.049560546875, 0.49462890625, 0.939697265625, 1.384765625, 1.829833984375, 2.27490234375, 2.719970703125, 3.1650390625, 3.610107421875, 4.05517578125, 4.500244140625, 4.9453125, 5.390380859375, 5.83544921875, 6.280517578125, 6.7255859375, 7.170654296875, 7.61572265625, 8.060791015625, 8.505859375, 8.950927734375, 9.39599609375, 9.841064453125, 10.2861328125, 10.731201171875, 11.17626953125, 11.621337890625, 12.06640625, 12.511474609375, 12.95654296875, 13.401611328125, 13.8466796875, 14.291748046875, 14.73681640625, 15.181884765625, 15.626953125, 16.072021484375, 16.51708984375, 16.962158203125, 17.4072265625, 17.852294921875, 18.29736328125, 18.742431640625, 19.1875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 3.0, 2.0, 6.0, 5.0, 9.0, 14.0, 22.0, 58.0, 101.0, 171.0, 183.0, 170.0, 118.0, 57.0, 32.0, 19.0, 12.0, 5.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-163.07550048828125, -159.2574920654297, -155.4394989013672, -151.62149047851562, -147.80349731445312, -143.98548889160156, -140.16749572753906, -136.3494873046875, -132.531494140625, -128.71348571777344, -124.89549255371094, -121.0774917602539, -117.25949096679688, -113.44149017333984, -109.62348937988281, -105.80548095703125, -101.98748016357422, -98.16947937011719, -94.35147857666016, -90.53347778320312, -86.7154769897461, -82.89747619628906, -79.0794677734375, -75.261474609375, -71.44346618652344, -67.6254653930664, -63.807464599609375, -59.989463806152344, -56.17146301269531, -52.35346221923828, -48.535457611083984, -44.71745681762695, -40.89945983886719, -37.081459045410156, -33.263458251953125, -29.44545555114746, -25.62745475769043, -21.8094539642334, -17.991451263427734, -14.173450469970703, -10.355449676513672, -6.537448406219482, -2.719447135925293, 1.0985546112060547, 4.916555404663086, 8.734556198120117, 12.552558898925781, 16.370559692382812, 20.188560485839844, 24.006561279296875, 27.824562072753906, 31.64256477355957, 35.46056365966797, 39.278564453125, 43.0965690612793, 46.91456985473633, 50.73257064819336, 54.55057144165039, 58.36857223510742, 62.18657684326172, 66.00457763671875, 69.82257843017578, 73.64057922363281, 77.45858001708984, 81.27658081054688]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 4.0, 4.0, 8.0, 13.0, 13.0, 15.0, 28.0, 25.0, 20.0, 41.0, 38.0, 36.0, 33.0, 43.0, 47.0, 50.0, 60.0, 56.0, 46.0, 48.0, 50.0, 54.0, 48.0, 41.0, 36.0, 29.0, 31.0, 19.0, 16.0, 11.0, 12.0, 5.0, 6.0, 4.0, 2.0, 5.0, 1.0, 1.0, 7.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.76190185546875, -64.59051513671875, -62.41912078857422, -60.24773025512695, -58.07633972167969, -55.90494918823242, -53.733558654785156, -51.562171936035156, -49.390777587890625, -47.21938705444336, -45.047996520996094, -42.87660598754883, -40.70521545410156, -38.5338249206543, -36.36243438720703, -34.19104766845703, -32.019657135009766, -29.8482666015625, -27.676876068115234, -25.50548553466797, -23.334095001220703, -21.162704467773438, -18.991315841674805, -16.81992530822754, -14.648534774780273, -12.477144241333008, -10.305753707885742, -8.134364128112793, -5.962973594665527, -3.7915830612182617, -1.6201934814453125, 0.5511970520019531, 2.7225875854492188, 4.893978118896484, 7.065368175506592, 9.2367582321167, 11.408148765563965, 13.57953929901123, 15.75092887878418, 17.922319412231445, 20.09370994567871, 22.265100479125977, 24.436491012573242, 26.607879638671875, 28.77927017211914, 30.950660705566406, 33.12205123901367, 35.29344177246094, 37.4648323059082, 39.63622283935547, 41.807613372802734, 43.97900390625, 46.150394439697266, 48.32178497314453, 50.49317169189453, 52.66456604003906, 54.83595275878906, 57.00734329223633, 59.178733825683594, 61.35012435913086, 63.521514892578125, 65.69290161132812, 67.86429595947266, 70.03568267822266, 72.20707702636719]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 8.0, 4.0, 5.0, 11.0, 12.0, 20.0, 40.0, 47.0, 60.0, 107.0, 116.0, 159.0, 280.0, 417.0, 631.0, 1081.0, 1767.0, 2993.0, 5301.0, 9972.0, 19985.0, 45738.0, 133987.0, 430448.0, 259929.0, 74858.0, 29454.0, 14075.0, 7087.0, 3966.0, 2213.0, 1338.0, 828.0, 513.0, 339.0, 234.0, 160.0, 108.0, 80.0, 46.0, 42.0, 28.0, 22.0, 14.0, 12.0, 11.0, 4.0, 3.0, 2.0, 0.0, 0.0, 6.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.4453125, -9.1478271484375, -8.850341796875, -8.5528564453125, -8.25537109375, -7.9578857421875, -7.660400390625, -7.3629150390625, -7.0654296875, -6.7679443359375, -6.470458984375, -6.1729736328125, -5.87548828125, -5.5780029296875, -5.280517578125, -4.9830322265625, -4.685546875, -4.3880615234375, -4.090576171875, -3.7930908203125, -3.49560546875, -3.1981201171875, -2.900634765625, -2.6031494140625, -2.3056640625, -2.0081787109375, -1.710693359375, -1.4132080078125, -1.11572265625, -0.8182373046875, -0.520751953125, -0.2232666015625, 0.07421875, 0.3717041015625, 0.669189453125, 0.9666748046875, 1.26416015625, 1.5616455078125, 1.859130859375, 2.1566162109375, 2.4541015625, 2.7515869140625, 3.049072265625, 3.3465576171875, 3.64404296875, 3.9415283203125, 4.239013671875, 4.5364990234375, 4.833984375, 5.1314697265625, 5.428955078125, 5.7264404296875, 6.02392578125, 6.3214111328125, 6.618896484375, 6.9163818359375, 7.2138671875, 7.5113525390625, 7.808837890625, 8.1063232421875, 8.40380859375, 8.7012939453125, 8.998779296875, 9.2962646484375, 9.59375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 1.0, 2.0, 6.0, 14.0, 4.0, 12.0, 9.0, 15.0, 16.0, 20.0, 19.0, 23.0, 24.0, 26.0, 28.0, 29.0, 34.0, 42.0, 40.0, 44.0, 32.0, 32.0, 51.0, 57.0, 42.0, 41.0, 40.0, 48.0, 22.0, 24.0, 31.0, 26.0, 27.0, 23.0, 19.0, 14.0, 10.0, 13.0, 9.0, 5.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0], "bins": [-4.8828125, -4.74041748046875, -4.5980224609375, -4.45562744140625, -4.313232421875, -4.17083740234375, -4.0284423828125, -3.88604736328125, -3.74365234375, -3.60125732421875, -3.4588623046875, -3.31646728515625, -3.174072265625, -3.03167724609375, -2.8892822265625, -2.74688720703125, -2.6044921875, -2.46209716796875, -2.3197021484375, -2.17730712890625, -2.034912109375, -1.89251708984375, -1.7501220703125, -1.60772705078125, -1.46533203125, -1.32293701171875, -1.1805419921875, -1.03814697265625, -0.895751953125, -0.75335693359375, -0.6109619140625, -0.46856689453125, -0.326171875, -0.18377685546875, -0.0413818359375, 0.10101318359375, 0.243408203125, 0.38580322265625, 0.5281982421875, 0.67059326171875, 0.81298828125, 0.95538330078125, 1.0977783203125, 1.24017333984375, 1.382568359375, 1.52496337890625, 1.6673583984375, 1.80975341796875, 1.9521484375, 2.09454345703125, 2.2369384765625, 2.37933349609375, 2.521728515625, 2.66412353515625, 2.8065185546875, 2.94891357421875, 3.09130859375, 3.23370361328125, 3.3760986328125, 3.51849365234375, 3.660888671875, 3.80328369140625, 3.9456787109375, 4.08807373046875, 4.23046875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 6.0, 4.0, 8.0, 6.0, 16.0, 25.0, 26.0, 39.0, 55.0, 98.0, 139.0, 223.0, 365.0, 733.0, 1534.0, 3889.0, 14001.0, 86991.0, 794145.0, 120819.0, 17352.0, 4447.0, 1684.0, 811.0, 446.0, 244.0, 145.0, 107.0, 61.0, 42.0, 34.0, 22.0, 16.0, 5.0, 10.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.5, -19.829345703125, -19.15869140625, -18.488037109375, -17.8173828125, -17.146728515625, -16.47607421875, -15.805419921875, -15.134765625, -14.464111328125, -13.79345703125, -13.122802734375, -12.4521484375, -11.781494140625, -11.11083984375, -10.440185546875, -9.76953125, -9.098876953125, -8.42822265625, -7.757568359375, -7.0869140625, -6.416259765625, -5.74560546875, -5.074951171875, -4.404296875, -3.733642578125, -3.06298828125, -2.392333984375, -1.7216796875, -1.051025390625, -0.38037109375, 0.290283203125, 0.9609375, 1.631591796875, 2.30224609375, 2.972900390625, 3.6435546875, 4.314208984375, 4.98486328125, 5.655517578125, 6.326171875, 6.996826171875, 7.66748046875, 8.338134765625, 9.0087890625, 9.679443359375, 10.35009765625, 11.020751953125, 11.69140625, 12.362060546875, 13.03271484375, 13.703369140625, 14.3740234375, 15.044677734375, 15.71533203125, 16.385986328125, 17.056640625, 17.727294921875, 18.39794921875, 19.068603515625, 19.7392578125, 20.409912109375, 21.08056640625, 21.751220703125, 22.421875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 6.0, 5.0, 16.0, 10.0, 8.0, 17.0, 26.0, 32.0, 26.0, 34.0, 39.0, 44.0, 45.0, 53.0, 53.0, 52.0, 57.0, 45.0, 53.0, 61.0, 68.0, 53.0, 29.0, 38.0, 24.0, 18.0, 15.0, 15.0, 6.0, 8.0, 12.0, 6.0, 11.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.875, -22.0927734375, -21.310546875, -20.5283203125, -19.74609375, -18.9638671875, -18.181640625, -17.3994140625, -16.6171875, -15.8349609375, -15.052734375, -14.2705078125, -13.48828125, -12.7060546875, -11.923828125, -11.1416015625, -10.359375, -9.5771484375, -8.794921875, -8.0126953125, -7.23046875, -6.4482421875, -5.666015625, -4.8837890625, -4.1015625, -3.3193359375, -2.537109375, -1.7548828125, -0.97265625, -0.1904296875, 0.591796875, 1.3740234375, 2.15625, 2.9384765625, 3.720703125, 4.5029296875, 5.28515625, 6.0673828125, 6.849609375, 7.6318359375, 8.4140625, 9.1962890625, 9.978515625, 10.7607421875, 11.54296875, 12.3251953125, 13.107421875, 13.8896484375, 14.671875, 15.4541015625, 16.236328125, 17.0185546875, 17.80078125, 18.5830078125, 19.365234375, 20.1474609375, 20.9296875, 21.7119140625, 22.494140625, 23.2763671875, 24.05859375, 24.8408203125, 25.623046875, 26.4052734375, 27.1875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 5.0, 14.0, 15.0, 26.0, 54.0, 121.0, 415.0, 2400.0, 40167.0, 946204.0, 55588.0, 2761.0, 465.0, 153.0, 73.0, 39.0, 22.0, 8.0, 4.0, 8.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.5, -15.921875, -15.34375, -14.765625, -14.1875, -13.609375, -13.03125, -12.453125, -11.875, -11.296875, -10.71875, -10.140625, -9.5625, -8.984375, -8.40625, -7.828125, -7.25, -6.671875, -6.09375, -5.515625, -4.9375, -4.359375, -3.78125, -3.203125, -2.625, -2.046875, -1.46875, -0.890625, -0.3125, 0.265625, 0.84375, 1.421875, 2.0, 2.578125, 3.15625, 3.734375, 4.3125, 4.890625, 5.46875, 6.046875, 6.625, 7.203125, 7.78125, 8.359375, 8.9375, 9.515625, 10.09375, 10.671875, 11.25, 11.828125, 12.40625, 12.984375, 13.5625, 14.140625, 14.71875, 15.296875, 15.875, 16.453125, 17.03125, 17.609375, 18.1875, 18.765625, 19.34375, 19.921875, 20.5]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 8.0, 3.0, 6.0, 11.0, 11.0, 7.0, 19.0, 16.0, 39.0, 48.0, 61.0, 132.0, 152.0, 160.0, 92.0, 57.0, 35.0, 37.0, 17.0, 18.0, 15.0, 9.0, 9.0, 14.0, 8.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015611648559570312, -0.001504942774772644, -0.0014487206935882568, -0.0013924986124038696, -0.0013362765312194824, -0.0012800544500350952, -0.001223832368850708, -0.0011676102876663208, -0.0011113882064819336, -0.0010551661252975464, -0.0009989440441131592, -0.000942721962928772, -0.0008864998817443848, -0.0008302778005599976, -0.0007740557193756104, -0.0007178336381912231, -0.0006616115570068359, -0.0006053894758224487, -0.0005491673946380615, -0.0004929453134536743, -0.0004367232322692871, -0.0003805011510848999, -0.0003242790699005127, -0.0002680569887161255, -0.00021183490753173828, -0.00015561282634735107, -9.939074516296387e-05, -4.316866397857666e-05, 1.3053417205810547e-05, 6.927549839019775e-05, 0.00012549757957458496, 0.00018171966075897217, 0.00023794174194335938, 0.0002941638231277466, 0.0003503859043121338, 0.000406607985496521, 0.0004628300666809082, 0.0005190521478652954, 0.0005752742290496826, 0.0006314963102340698, 0.000687718391418457, 0.0007439404726028442, 0.0008001625537872314, 0.0008563846349716187, 0.0009126067161560059, 0.0009688287973403931, 0.0010250508785247803, 0.0010812729597091675, 0.0011374950408935547, 0.001193717122077942, 0.001249939203262329, 0.0013061612844467163, 0.0013623833656311035, 0.0014186054468154907, 0.001474827527999878, 0.0015310496091842651, 0.0015872716903686523, 0.0016434937715530396, 0.0016997158527374268, 0.001755937933921814, 0.0018121600151062012, 0.0018683820962905884, 0.0019246041774749756, 0.001980826258659363, 0.00203704833984375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 7.0, 11.0, 16.0, 29.0, 74.0, 177.0, 379.0, 999.0, 3250.0, 19553.0, 424280.0, 572098.0, 22427.0, 3597.0, 956.0, 357.0, 157.0, 78.0, 45.0, 18.0, 14.0, 8.0, 5.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.171875, -9.7955322265625, -9.419189453125, -9.0428466796875, -8.66650390625, -8.2901611328125, -7.913818359375, -7.5374755859375, -7.1611328125, -6.7847900390625, -6.408447265625, -6.0321044921875, -5.65576171875, -5.2794189453125, -4.903076171875, -4.5267333984375, -4.150390625, -3.7740478515625, -3.397705078125, -3.0213623046875, -2.64501953125, -2.2686767578125, -1.892333984375, -1.5159912109375, -1.1396484375, -0.7633056640625, -0.386962890625, -0.0106201171875, 0.36572265625, 0.7420654296875, 1.118408203125, 1.4947509765625, 1.87109375, 2.2474365234375, 2.623779296875, 3.0001220703125, 3.37646484375, 3.7528076171875, 4.129150390625, 4.5054931640625, 4.8818359375, 5.2581787109375, 5.634521484375, 6.0108642578125, 6.38720703125, 6.7635498046875, 7.139892578125, 7.5162353515625, 7.892578125, 8.2689208984375, 8.645263671875, 9.0216064453125, 9.39794921875, 9.7742919921875, 10.150634765625, 10.5269775390625, 10.9033203125, 11.2796630859375, 11.656005859375, 12.0323486328125, 12.40869140625, 12.7850341796875, 13.161376953125, 13.5377197265625, 13.9140625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 5.0, 7.0, 3.0, 7.0, 4.0, 4.0, 9.0, 15.0, 7.0, 10.0, 18.0, 21.0, 26.0, 32.0, 39.0, 50.0, 58.0, 70.0, 81.0, 69.0, 63.0, 63.0, 50.0, 61.0, 44.0, 41.0, 30.0, 26.0, 15.0, 13.0, 17.0, 14.0, 12.0, 5.0, 5.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.015625, -3.853271484375, -3.69091796875, -3.528564453125, -3.3662109375, -3.203857421875, -3.04150390625, -2.879150390625, -2.716796875, -2.554443359375, -2.39208984375, -2.229736328125, -2.0673828125, -1.905029296875, -1.74267578125, -1.580322265625, -1.41796875, -1.255615234375, -1.09326171875, -0.930908203125, -0.7685546875, -0.606201171875, -0.44384765625, -0.281494140625, -0.119140625, 0.043212890625, 0.20556640625, 0.367919921875, 0.5302734375, 0.692626953125, 0.85498046875, 1.017333984375, 1.1796875, 1.342041015625, 1.50439453125, 1.666748046875, 1.8291015625, 1.991455078125, 2.15380859375, 2.316162109375, 2.478515625, 2.640869140625, 2.80322265625, 2.965576171875, 3.1279296875, 3.290283203125, 3.45263671875, 3.614990234375, 3.77734375, 3.939697265625, 4.10205078125, 4.264404296875, 4.4267578125, 4.589111328125, 4.75146484375, 4.913818359375, 5.076171875, 5.238525390625, 5.40087890625, 5.563232421875, 5.7255859375, 5.887939453125, 6.05029296875, 6.212646484375, 6.375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 5.0, 6.0, 12.0, 32.0, 67.0, 124.0, 190.0, 215.0, 134.0, 103.0, 52.0, 25.0, 11.0, 8.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.98062133789062, -113.25540924072266, -108.53019714355469, -103.80498504638672, -99.07977294921875, -94.35456085205078, -89.62934875488281, -84.90413665771484, -80.17892456054688, -75.4537124633789, -70.72850036621094, -66.00328826904297, -61.278076171875, -56.55286407470703, -51.82765197753906, -47.102439880371094, -42.377227783203125, -37.652015686035156, -32.92680358886719, -28.20159149169922, -23.47637939453125, -18.75116729736328, -14.025955200195312, -9.300743103027344, -4.575531005859375, 0.14968109130859375, 4.8748931884765625, 9.600105285644531, 14.3253173828125, 19.05052947998047, 23.775741577148438, 28.500953674316406, 33.22615051269531, 37.95136260986328, 42.67657470703125, 47.40178680419922, 52.12699890136719, 56.852210998535156, 61.577423095703125, 66.3026351928711, 71.02784729003906, 75.75305938720703, 80.478271484375, 85.20348358154297, 89.92869567871094, 94.6539077758789, 99.37911987304688, 104.10433197021484, 108.82954406738281, 113.55475616455078, 118.27996826171875, 123.00518035888672, 127.73039245605469, 132.45559692382812, 137.18081665039062, 141.90603637695312, 146.63124084472656, 151.3564453125, 156.0816650390625, 160.806884765625, 165.53208923339844, 170.25729370117188, 174.98251342773438, 179.70773315429688, 184.4329376220703]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 7.0, 10.0, 12.0, 15.0, 22.0, 19.0, 23.0, 23.0, 32.0, 33.0, 35.0, 50.0, 49.0, 48.0, 53.0, 61.0, 60.0, 58.0, 55.0, 57.0, 43.0, 45.0, 34.0, 26.0, 26.0, 19.0, 13.0, 9.0, 13.0, 10.0, 6.0, 15.0, 8.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.53691101074219, -68.43246459960938, -65.3280258178711, -62.22357940673828, -59.11913299560547, -56.01469039916992, -52.910247802734375, -49.80580139160156, -46.70135498046875, -43.5969123840332, -40.49246597290039, -37.388023376464844, -34.28357696533203, -31.179134368896484, -28.074689865112305, -24.970245361328125, -21.865802764892578, -18.7613582611084, -15.656913757324219, -12.552470207214355, -9.448025703430176, -6.343581199645996, -3.239137649536133, -0.13469314575195312, 2.9697513580322266, 6.074195861816406, 9.178640365600586, 12.28308391571045, 15.387528419494629, 18.491973876953125, 21.596416473388672, 24.70086097717285, 27.80530548095703, 30.90974998474121, 34.01419448852539, 37.11863708496094, 40.22308349609375, 43.3275260925293, 46.431968688964844, 49.536415100097656, 52.64086151123047, 55.745304107666016, 58.84975051879883, 61.954193115234375, 65.05863952636719, 68.1630859375, 71.26752471923828, 74.3719711303711, 77.47640991210938, 80.58085632324219, 83.68529510498047, 86.78974151611328, 89.8941879272461, 92.9986343383789, 96.10307312011719, 99.20751953125, 102.31196594238281, 105.41641235351562, 108.5208511352539, 111.62529754638672, 114.72974395751953, 117.83419036865234, 120.93862915039062, 124.04307556152344, 127.14752197265625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 9.0, 8.0, 9.0, 19.0, 29.0, 30.0, 59.0, 79.0, 166.0, 295.0, 413.0, 874.0, 1571.0, 3148.0, 6486.0, 14424.0, 36752.0, 109510.0, 421844.0, 1585466.0, 1480683.0, 377068.0, 97022.0, 32502.0, 13162.0, 6086.0, 2967.0, 1493.0, 834.0, 466.0, 278.0, 182.0, 114.0, 91.0, 44.0, 35.0, 20.0, 18.0, 8.0, 5.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.5859375, -5.39947509765625, -5.2130126953125, -5.02655029296875, -4.840087890625, -4.65362548828125, -4.4671630859375, -4.28070068359375, -4.09423828125, -3.90777587890625, -3.7213134765625, -3.53485107421875, -3.348388671875, -3.16192626953125, -2.9754638671875, -2.78900146484375, -2.6025390625, -2.41607666015625, -2.2296142578125, -2.04315185546875, -1.856689453125, -1.67022705078125, -1.4837646484375, -1.29730224609375, -1.11083984375, -0.92437744140625, -0.7379150390625, -0.55145263671875, -0.364990234375, -0.17852783203125, 0.0079345703125, 0.19439697265625, 0.380859375, 0.56732177734375, 0.7537841796875, 0.94024658203125, 1.126708984375, 1.31317138671875, 1.4996337890625, 1.68609619140625, 1.87255859375, 2.05902099609375, 2.2454833984375, 2.43194580078125, 2.618408203125, 2.80487060546875, 2.9913330078125, 3.17779541015625, 3.3642578125, 3.55072021484375, 3.7371826171875, 3.92364501953125, 4.110107421875, 4.29656982421875, 4.4830322265625, 4.66949462890625, 4.85595703125, 5.04241943359375, 5.2288818359375, 5.41534423828125, 5.601806640625, 5.78826904296875, 5.9747314453125, 6.16119384765625, 6.34765625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 12.0, 14.0, 12.0, 16.0, 13.0, 17.0, 32.0, 32.0, 39.0, 49.0, 51.0, 43.0, 41.0, 66.0, 53.0, 58.0, 63.0, 61.0, 53.0, 55.0, 38.0, 33.0, 27.0, 26.0, 26.0, 19.0, 11.0, 12.0, 5.0, 6.0, 9.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.328125, -5.15081787109375, -4.9735107421875, -4.79620361328125, -4.618896484375, -4.44158935546875, -4.2642822265625, -4.08697509765625, -3.90966796875, -3.73236083984375, -3.5550537109375, -3.37774658203125, -3.200439453125, -3.02313232421875, -2.8458251953125, -2.66851806640625, -2.4912109375, -2.31390380859375, -2.1365966796875, -1.95928955078125, -1.781982421875, -1.60467529296875, -1.4273681640625, -1.25006103515625, -1.07275390625, -0.89544677734375, -0.7181396484375, -0.54083251953125, -0.363525390625, -0.18621826171875, -0.0089111328125, 0.16839599609375, 0.345703125, 0.52301025390625, 0.7003173828125, 0.87762451171875, 1.054931640625, 1.23223876953125, 1.4095458984375, 1.58685302734375, 1.76416015625, 1.94146728515625, 2.1187744140625, 2.29608154296875, 2.473388671875, 2.65069580078125, 2.8280029296875, 3.00531005859375, 3.1826171875, 3.35992431640625, 3.5372314453125, 3.71453857421875, 3.891845703125, 4.06915283203125, 4.2464599609375, 4.42376708984375, 4.60107421875, 4.77838134765625, 4.9556884765625, 5.13299560546875, 5.310302734375, 5.48760986328125, 5.6649169921875, 5.84222412109375, 6.01953125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 10.0, 12.0, 17.0, 18.0, 53.0, 51.0, 101.0, 194.0, 393.0, 859.0, 2316.0, 7619.0, 34491.0, 288635.0, 3328802.0, 475260.0, 42535.0, 8383.0, 2603.0, 1006.0, 426.0, 195.0, 91.0, 82.0, 49.0, 22.0, 18.0, 7.0, 5.0, 1.0, 3.0, 4.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.046875, -15.522216796875, -14.99755859375, -14.472900390625, -13.9482421875, -13.423583984375, -12.89892578125, -12.374267578125, -11.849609375, -11.324951171875, -10.80029296875, -10.275634765625, -9.7509765625, -9.226318359375, -8.70166015625, -8.177001953125, -7.65234375, -7.127685546875, -6.60302734375, -6.078369140625, -5.5537109375, -5.029052734375, -4.50439453125, -3.979736328125, -3.455078125, -2.930419921875, -2.40576171875, -1.881103515625, -1.3564453125, -0.831787109375, -0.30712890625, 0.217529296875, 0.7421875, 1.266845703125, 1.79150390625, 2.316162109375, 2.8408203125, 3.365478515625, 3.89013671875, 4.414794921875, 4.939453125, 5.464111328125, 5.98876953125, 6.513427734375, 7.0380859375, 7.562744140625, 8.08740234375, 8.612060546875, 9.13671875, 9.661376953125, 10.18603515625, 10.710693359375, 11.2353515625, 11.760009765625, 12.28466796875, 12.809326171875, 13.333984375, 13.858642578125, 14.38330078125, 14.907958984375, 15.4326171875, 15.957275390625, 16.48193359375, 17.006591796875, 17.53125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 2.0, 3.0, 4.0, 5.0, 10.0, 9.0, 16.0, 17.0, 18.0, 27.0, 43.0, 56.0, 77.0, 102.0, 168.0, 230.0, 411.0, 513.0, 646.0, 571.0, 406.0, 256.0, 149.0, 95.0, 78.0, 45.0, 26.0, 23.0, 21.0, 15.0, 9.0, 5.0, 3.0, 2.0, 4.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.9921875, -15.51416015625, -15.0361328125, -14.55810546875, -14.080078125, -13.60205078125, -13.1240234375, -12.64599609375, -12.16796875, -11.68994140625, -11.2119140625, -10.73388671875, -10.255859375, -9.77783203125, -9.2998046875, -8.82177734375, -8.34375, -7.86572265625, -7.3876953125, -6.90966796875, -6.431640625, -5.95361328125, -5.4755859375, -4.99755859375, -4.51953125, -4.04150390625, -3.5634765625, -3.08544921875, -2.607421875, -2.12939453125, -1.6513671875, -1.17333984375, -0.6953125, -0.21728515625, 0.2607421875, 0.73876953125, 1.216796875, 1.69482421875, 2.1728515625, 2.65087890625, 3.12890625, 3.60693359375, 4.0849609375, 4.56298828125, 5.041015625, 5.51904296875, 5.9970703125, 6.47509765625, 6.953125, 7.43115234375, 7.9091796875, 8.38720703125, 8.865234375, 9.34326171875, 9.8212890625, 10.29931640625, 10.77734375, 11.25537109375, 11.7333984375, 12.21142578125, 12.689453125, 13.16748046875, 13.6455078125, 14.12353515625, 14.6015625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 7.0, 18.0, 69.0, 235.0, 384.0, 211.0, 45.0, 12.0, 7.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-450.91387939453125, -440.55572509765625, -430.19757080078125, -419.83941650390625, -409.4812927246094, -399.1231384277344, -388.7649841308594, -378.4068298339844, -368.0486755371094, -357.6905212402344, -347.3323669433594, -336.9742431640625, -326.6160888671875, -316.2579345703125, -305.8997802734375, -295.5416259765625, -285.1834716796875, -274.8253173828125, -264.4671630859375, -254.10902404785156, -243.75086975097656, -233.39273071289062, -223.03457641601562, -212.67642211914062, -202.31829833984375, -191.96014404296875, -181.6020050048828, -171.2438507080078, -160.8856964111328, -150.52755737304688, -140.16940307617188, -129.81124877929688, -119.45307922363281, -109.09493255615234, -98.73677825927734, -88.37863159179688, -78.02047729492188, -67.6623306274414, -57.30418395996094, -46.94602966308594, -36.58788299560547, -26.229732513427734, -15.871583938598633, -5.513435363769531, 4.844715118408203, 15.202865600585938, 25.561012268066406, 35.919166564941406, 46.277313232421875, 56.63546371459961, 66.99361419677734, 77.35176086425781, 87.70991516113281, 98.06806182861328, 108.42620849609375, 118.78436279296875, 129.14251708984375, 139.50067138671875, 149.8588104248047, 160.2169647216797, 170.5751190185547, 180.93325805664062, 191.29141235351562, 201.64956665039062, 212.00770568847656]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 9.0, 7.0, 4.0, 18.0, 14.0, 15.0, 19.0, 22.0, 21.0, 45.0, 40.0, 26.0, 42.0, 33.0, 43.0, 43.0, 44.0, 49.0, 41.0, 51.0, 31.0, 42.0, 34.0, 44.0, 30.0, 37.0, 26.0, 22.0, 20.0, 21.0, 19.0, 19.0, 16.0, 8.0, 8.0, 2.0, 11.0, 5.0, 3.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-79.4129638671875, -77.12326049804688, -74.83356475830078, -72.54386138916016, -70.25415802001953, -67.96446228027344, -65.67475891113281, -63.38505935668945, -61.095359802246094, -58.805660247802734, -56.51595687866211, -54.22625732421875, -51.93655776977539, -49.64685821533203, -47.357154846191406, -45.06745529174805, -42.77775192260742, -40.48805236816406, -38.19834899902344, -35.90864944458008, -33.61894989013672, -31.329248428344727, -29.039546966552734, -26.749847412109375, -24.460145950317383, -22.17044448852539, -19.88074493408203, -17.59104347229004, -15.301342964172363, -13.011642456054688, -10.721940994262695, -8.432241439819336, -6.142539978027344, -3.852839231491089, -1.563138484954834, 0.7265625, 3.016263008117676, 5.305963516235352, 7.595664978027344, 9.885364532470703, 12.175065994262695, 14.464766502380371, 16.754467010498047, 19.04416847229004, 21.33386993408203, 23.62356948852539, 25.913270950317383, 28.202970504760742, 30.492671966552734, 32.782371520996094, 35.07207489013672, 37.36177444458008, 39.65147399902344, 41.94117736816406, 44.23087692260742, 46.52057647705078, 48.810279846191406, 51.099979400634766, 53.38968276977539, 55.67938232421875, 57.96908187866211, 60.25878143310547, 62.548484802246094, 64.83818054199219, 67.12788391113281]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 8.0, 6.0, 7.0, 15.0, 30.0, 26.0, 48.0, 51.0, 91.0, 133.0, 194.0, 315.0, 447.0, 622.0, 988.0, 1699.0, 2545.0, 4057.0, 6811.0, 11594.0, 20249.0, 35295.0, 64178.0, 127143.0, 265091.0, 249859.0, 116600.0, 59944.0, 33167.0, 19017.0, 11133.0, 6479.0, 3893.0, 2461.0, 1504.0, 935.0, 606.0, 414.0, 264.0, 197.0, 116.0, 115.0, 77.0, 33.0, 35.0, 18.0, 16.0, 12.0, 6.0, 9.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.81640625, -6.59613037109375, -6.3758544921875, -6.15557861328125, -5.935302734375, -5.71502685546875, -5.4947509765625, -5.27447509765625, -5.05419921875, -4.83392333984375, -4.6136474609375, -4.39337158203125, -4.173095703125, -3.95281982421875, -3.7325439453125, -3.51226806640625, -3.2919921875, -3.07171630859375, -2.8514404296875, -2.63116455078125, -2.410888671875, -2.19061279296875, -1.9703369140625, -1.75006103515625, -1.52978515625, -1.30950927734375, -1.0892333984375, -0.86895751953125, -0.648681640625, -0.42840576171875, -0.2081298828125, 0.01214599609375, 0.232421875, 0.45269775390625, 0.6729736328125, 0.89324951171875, 1.113525390625, 1.33380126953125, 1.5540771484375, 1.77435302734375, 1.99462890625, 2.21490478515625, 2.4351806640625, 2.65545654296875, 2.875732421875, 3.09600830078125, 3.3162841796875, 3.53656005859375, 3.7568359375, 3.97711181640625, 4.1973876953125, 4.41766357421875, 4.637939453125, 4.85821533203125, 5.0784912109375, 5.29876708984375, 5.51904296875, 5.73931884765625, 5.9595947265625, 6.17987060546875, 6.400146484375, 6.62042236328125, 6.8406982421875, 7.06097412109375, 7.28125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 3.0, 8.0, 6.0, 10.0, 14.0, 17.0, 11.0, 17.0, 25.0, 29.0, 29.0, 28.0, 40.0, 48.0, 47.0, 49.0, 62.0, 47.0, 61.0, 58.0, 48.0, 53.0, 30.0, 33.0, 28.0, 38.0, 28.0, 17.0, 31.0, 14.0, 18.0, 14.0, 16.0, 6.0, 5.0, 7.0, 3.0, 6.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.84375, -4.678955078125, -4.51416015625, -4.349365234375, -4.1845703125, -4.019775390625, -3.85498046875, -3.690185546875, -3.525390625, -3.360595703125, -3.19580078125, -3.031005859375, -2.8662109375, -2.701416015625, -2.53662109375, -2.371826171875, -2.20703125, -2.042236328125, -1.87744140625, -1.712646484375, -1.5478515625, -1.383056640625, -1.21826171875, -1.053466796875, -0.888671875, -0.723876953125, -0.55908203125, -0.394287109375, -0.2294921875, -0.064697265625, 0.10009765625, 0.264892578125, 0.4296875, 0.594482421875, 0.75927734375, 0.924072265625, 1.0888671875, 1.253662109375, 1.41845703125, 1.583251953125, 1.748046875, 1.912841796875, 2.07763671875, 2.242431640625, 2.4072265625, 2.572021484375, 2.73681640625, 2.901611328125, 3.06640625, 3.231201171875, 3.39599609375, 3.560791015625, 3.7255859375, 3.890380859375, 4.05517578125, 4.219970703125, 4.384765625, 4.549560546875, 4.71435546875, 4.879150390625, 5.0439453125, 5.208740234375, 5.37353515625, 5.538330078125, 5.703125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 5.0, 3.0, 10.0, 12.0, 14.0, 20.0, 23.0, 34.0, 64.0, 83.0, 151.0, 244.0, 357.0, 676.0, 1303.0, 2839.0, 8823.0, 55726.0, 821272.0, 134512.0, 14675.0, 3924.0, 1665.0, 863.0, 474.0, 270.0, 172.0, 89.0, 70.0, 56.0, 40.0, 23.0, 20.0, 12.0, 7.0, 7.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-33.25, -32.262451171875, -31.27490234375, -30.287353515625, -29.2998046875, -28.312255859375, -27.32470703125, -26.337158203125, -25.349609375, -24.362060546875, -23.37451171875, -22.386962890625, -21.3994140625, -20.411865234375, -19.42431640625, -18.436767578125, -17.44921875, -16.461669921875, -15.47412109375, -14.486572265625, -13.4990234375, -12.511474609375, -11.52392578125, -10.536376953125, -9.548828125, -8.561279296875, -7.57373046875, -6.586181640625, -5.5986328125, -4.611083984375, -3.62353515625, -2.635986328125, -1.6484375, -0.660888671875, 0.32666015625, 1.314208984375, 2.3017578125, 3.289306640625, 4.27685546875, 5.264404296875, 6.251953125, 7.239501953125, 8.22705078125, 9.214599609375, 10.2021484375, 11.189697265625, 12.17724609375, 13.164794921875, 14.15234375, 15.139892578125, 16.12744140625, 17.114990234375, 18.1025390625, 19.090087890625, 20.07763671875, 21.065185546875, 22.052734375, 23.040283203125, 24.02783203125, 25.015380859375, 26.0029296875, 26.990478515625, 27.97802734375, 28.965576171875, 29.953125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 8.0, 7.0, 3.0, 9.0, 12.0, 7.0, 22.0, 24.0, 23.0, 25.0, 29.0, 43.0, 46.0, 43.0, 57.0, 73.0, 67.0, 51.0, 59.0, 45.0, 63.0, 49.0, 44.0, 31.0, 29.0, 29.0, 33.0, 19.0, 14.0, 11.0, 8.0, 5.0, 6.0, 3.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.796875, -27.932373046875, -27.06787109375, -26.203369140625, -25.3388671875, -24.474365234375, -23.60986328125, -22.745361328125, -21.880859375, -21.016357421875, -20.15185546875, -19.287353515625, -18.4228515625, -17.558349609375, -16.69384765625, -15.829345703125, -14.96484375, -14.100341796875, -13.23583984375, -12.371337890625, -11.5068359375, -10.642333984375, -9.77783203125, -8.913330078125, -8.048828125, -7.184326171875, -6.31982421875, -5.455322265625, -4.5908203125, -3.726318359375, -2.86181640625, -1.997314453125, -1.1328125, -0.268310546875, 0.59619140625, 1.460693359375, 2.3251953125, 3.189697265625, 4.05419921875, 4.918701171875, 5.783203125, 6.647705078125, 7.51220703125, 8.376708984375, 9.2412109375, 10.105712890625, 10.97021484375, 11.834716796875, 12.69921875, 13.563720703125, 14.42822265625, 15.292724609375, 16.1572265625, 17.021728515625, 17.88623046875, 18.750732421875, 19.615234375, 20.479736328125, 21.34423828125, 22.208740234375, 23.0732421875, 23.937744140625, 24.80224609375, 25.666748046875, 26.53125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 9.0, 15.0, 13.0, 43.0, 74.0, 150.0, 269.0, 692.0, 1899.0, 5930.0, 28310.0, 257206.0, 683679.0, 56587.0, 9340.0, 2602.0, 915.0, 415.0, 186.0, 91.0, 65.0, 32.0, 8.0, 13.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.4453125, -10.1483154296875, -9.851318359375, -9.5543212890625, -9.25732421875, -8.9603271484375, -8.663330078125, -8.3663330078125, -8.0693359375, -7.7723388671875, -7.475341796875, -7.1783447265625, -6.88134765625, -6.5843505859375, -6.287353515625, -5.9903564453125, -5.693359375, -5.3963623046875, -5.099365234375, -4.8023681640625, -4.50537109375, -4.2083740234375, -3.911376953125, -3.6143798828125, -3.3173828125, -3.0203857421875, -2.723388671875, -2.4263916015625, -2.12939453125, -1.8323974609375, -1.535400390625, -1.2384033203125, -0.94140625, -0.6444091796875, -0.347412109375, -0.0504150390625, 0.24658203125, 0.5435791015625, 0.840576171875, 1.1375732421875, 1.4345703125, 1.7315673828125, 2.028564453125, 2.3255615234375, 2.62255859375, 2.9195556640625, 3.216552734375, 3.5135498046875, 3.810546875, 4.1075439453125, 4.404541015625, 4.7015380859375, 4.99853515625, 5.2955322265625, 5.592529296875, 5.8895263671875, 6.1865234375, 6.4835205078125, 6.780517578125, 7.0775146484375, 7.37451171875, 7.6715087890625, 7.968505859375, 8.2655029296875, 8.5625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 10.0, 13.0, 16.0, 33.0, 34.0, 43.0, 56.0, 119.0, 222.0, 172.0, 89.0, 46.0, 34.0, 34.0, 26.0, 14.0, 14.0, 6.0, 8.0, 1.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00274658203125, -0.0026397705078125, -0.002532958984375, -0.0024261474609375, -0.0023193359375, -0.0022125244140625, -0.002105712890625, -0.0019989013671875, -0.00189208984375, -0.0017852783203125, -0.001678466796875, -0.0015716552734375, -0.00146484375, -0.0013580322265625, -0.001251220703125, -0.0011444091796875, -0.00103759765625, -0.0009307861328125, -0.000823974609375, -0.0007171630859375, -0.0006103515625, -0.0005035400390625, -0.000396728515625, -0.0002899169921875, -0.00018310546875, -7.62939453125e-05, 3.0517578125e-05, 0.0001373291015625, 0.000244140625, 0.0003509521484375, 0.000457763671875, 0.0005645751953125, 0.00067138671875, 0.0007781982421875, 0.000885009765625, 0.0009918212890625, 0.0010986328125, 0.0012054443359375, 0.001312255859375, 0.0014190673828125, 0.00152587890625, 0.0016326904296875, 0.001739501953125, 0.0018463134765625, 0.001953125, 0.0020599365234375, 0.002166748046875, 0.0022735595703125, 0.00238037109375, 0.0024871826171875, 0.002593994140625, 0.0027008056640625, 0.0028076171875, 0.0029144287109375, 0.003021240234375, 0.0031280517578125, 0.00323486328125, 0.0033416748046875, 0.003448486328125, 0.0035552978515625, 0.003662109375, 0.0037689208984375, 0.003875732421875, 0.0039825439453125, 0.00408935546875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 8.0, 10.0, 12.0, 16.0, 30.0, 59.0, 107.0, 181.0, 355.0, 631.0, 1426.0, 3502.0, 12718.0, 115901.0, 802268.0, 94171.0, 11295.0, 3230.0, 1353.0, 574.0, 300.0, 154.0, 95.0, 57.0, 34.0, 24.0, 12.0, 10.0, 7.0, 5.0, 3.0, 2.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6328125, -10.3411865234375, -10.049560546875, -9.7579345703125, -9.46630859375, -9.1746826171875, -8.883056640625, -8.5914306640625, -8.2998046875, -8.0081787109375, -7.716552734375, -7.4249267578125, -7.13330078125, -6.8416748046875, -6.550048828125, -6.2584228515625, -5.966796875, -5.6751708984375, -5.383544921875, -5.0919189453125, -4.80029296875, -4.5086669921875, -4.217041015625, -3.9254150390625, -3.6337890625, -3.3421630859375, -3.050537109375, -2.7589111328125, -2.46728515625, -2.1756591796875, -1.884033203125, -1.5924072265625, -1.30078125, -1.0091552734375, -0.717529296875, -0.4259033203125, -0.13427734375, 0.1573486328125, 0.448974609375, 0.7406005859375, 1.0322265625, 1.3238525390625, 1.615478515625, 1.9071044921875, 2.19873046875, 2.4903564453125, 2.781982421875, 3.0736083984375, 3.365234375, 3.6568603515625, 3.948486328125, 4.2401123046875, 4.53173828125, 4.8233642578125, 5.114990234375, 5.4066162109375, 5.6982421875, 5.9898681640625, 6.281494140625, 6.5731201171875, 6.86474609375, 7.1563720703125, 7.447998046875, 7.7396240234375, 8.03125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 7.0, 10.0, 11.0, 8.0, 10.0, 32.0, 21.0, 33.0, 15.0, 40.0, 44.0, 59.0, 78.0, 64.0, 64.0, 66.0, 71.0, 52.0, 53.0, 42.0, 40.0, 28.0, 20.0, 27.0, 16.0, 20.0, 15.0, 13.0, 10.0, 6.0, 7.0, 6.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.50390625, -5.313720703125, -5.12353515625, -4.933349609375, -4.7431640625, -4.552978515625, -4.36279296875, -4.172607421875, -3.982421875, -3.792236328125, -3.60205078125, -3.411865234375, -3.2216796875, -3.031494140625, -2.84130859375, -2.651123046875, -2.4609375, -2.270751953125, -2.08056640625, -1.890380859375, -1.7001953125, -1.510009765625, -1.31982421875, -1.129638671875, -0.939453125, -0.749267578125, -0.55908203125, -0.368896484375, -0.1787109375, 0.011474609375, 0.20166015625, 0.391845703125, 0.58203125, 0.772216796875, 0.96240234375, 1.152587890625, 1.3427734375, 1.532958984375, 1.72314453125, 1.913330078125, 2.103515625, 2.293701171875, 2.48388671875, 2.674072265625, 2.8642578125, 3.054443359375, 3.24462890625, 3.434814453125, 3.625, 3.815185546875, 4.00537109375, 4.195556640625, 4.3857421875, 4.575927734375, 4.76611328125, 4.956298828125, 5.146484375, 5.336669921875, 5.52685546875, 5.717041015625, 5.9072265625, 6.097412109375, 6.28759765625, 6.477783203125, 6.66796875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 4.0, 3.0, 3.0, 10.0, 72.0, 181.0, 406.0, 200.0, 78.0, 27.0, 6.0, 9.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-333.10906982421875, -323.1803283691406, -313.2515869140625, -303.32281494140625, -293.3940734863281, -283.46533203125, -273.5365905761719, -263.60784912109375, -253.67909240722656, -243.75035095214844, -233.82159423828125, -223.89285278320312, -213.964111328125, -204.0353546142578, -194.1066131591797, -184.1778564453125, -174.24911499023438, -164.32037353515625, -154.39161682128906, -144.46287536621094, -134.53411865234375, -124.60537719726562, -114.6766357421875, -104.74788665771484, -94.81913757324219, -84.89038848876953, -74.96163940429688, -65.03289794921875, -55.104148864746094, -45.17539978027344, -35.24665451049805, -25.317909240722656, -15.389190673828125, -5.460443496704102, 4.468303680419922, 14.397050857543945, 24.32579803466797, 34.254547119140625, 44.183292388916016, 54.112037658691406, 64.04078674316406, 73.96953582763672, 83.89828491210938, 93.8270263671875, 103.75577545166016, 113.68452453613281, 123.61326599121094, 133.54202270507812, 143.47076416015625, 153.39950561523438, 163.32826232910156, 173.2570037841797, 183.18576049804688, 193.114501953125, 203.04324340820312, 212.97198486328125, 222.90074157714844, 232.82948303222656, 242.75823974609375, 252.68698120117188, 262.61572265625, 272.54449462890625, 282.4732360839844, 292.4019775390625, 302.3307189941406]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 6.0, 12.0, 11.0, 13.0, 15.0, 18.0, 18.0, 20.0, 21.0, 23.0, 38.0, 20.0, 39.0, 38.0, 52.0, 47.0, 66.0, 67.0, 70.0, 52.0, 51.0, 35.0, 35.0, 32.0, 35.0, 23.0, 17.0, 20.0, 19.0, 21.0, 9.0, 12.0, 7.0, 10.0, 6.0, 10.0, 1.0, 3.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-102.92532348632812, -99.95173645019531, -96.9781494140625, -94.00456237792969, -91.03096771240234, -88.05738067626953, -85.08379364013672, -82.1102066040039, -79.1366195678711, -76.16303253173828, -73.18944549560547, -70.21585083007812, -67.24226379394531, -64.2686767578125, -61.29508972167969, -58.321502685546875, -55.3479118347168, -52.374324798583984, -49.400733947753906, -46.427146911621094, -43.45355987548828, -40.47997283935547, -37.50638198852539, -34.53279495239258, -31.559206008911133, -28.585617065429688, -25.612030029296875, -22.63844108581543, -19.664852142333984, -16.691265106201172, -13.717676162719727, -10.744089126586914, -7.770500183105469, -4.79691219329834, -1.8233237266540527, 1.1502647399902344, 4.123852729797363, 7.097440719604492, 10.071029663085938, 13.04461669921875, 16.018205642700195, 18.99179458618164, 21.965381622314453, 24.9389705657959, 27.912559509277344, 30.886146545410156, 33.85973358154297, 36.83332061767578, 39.80691146850586, 42.78049850463867, 45.75408935546875, 48.72767639160156, 51.701263427734375, 54.67485046386719, 57.648441314697266, 60.62202835083008, 63.595619201660156, 66.56920623779297, 69.54279327392578, 72.51638793945312, 75.48997497558594, 78.46356201171875, 81.43714904785156, 84.41073608398438, 87.38432312011719]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 4.0, 10.0, 11.0, 8.0, 8.0, 21.0, 32.0, 43.0, 61.0, 93.0, 121.0, 211.0, 289.0, 509.0, 736.0, 1306.0, 2314.0, 4400.0, 8938.0, 20114.0, 51697.0, 163234.0, 625353.0, 1764221.0, 1129773.0, 287102.0, 79989.0, 28454.0, 12198.0, 5776.0, 2915.0, 1711.0, 955.0, 575.0, 375.0, 218.0, 169.0, 107.0, 73.0, 43.0, 38.0, 17.0, 22.0, 13.0, 12.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-5.328125, -5.16015625, -4.9921875, -4.82421875, -4.65625, -4.48828125, -4.3203125, -4.15234375, -3.984375, -3.81640625, -3.6484375, -3.48046875, -3.3125, -3.14453125, -2.9765625, -2.80859375, -2.640625, -2.47265625, -2.3046875, -2.13671875, -1.96875, -1.80078125, -1.6328125, -1.46484375, -1.296875, -1.12890625, -0.9609375, -0.79296875, -0.625, -0.45703125, -0.2890625, -0.12109375, 0.046875, 0.21484375, 0.3828125, 0.55078125, 0.71875, 0.88671875, 1.0546875, 1.22265625, 1.390625, 1.55859375, 1.7265625, 1.89453125, 2.0625, 2.23046875, 2.3984375, 2.56640625, 2.734375, 2.90234375, 3.0703125, 3.23828125, 3.40625, 3.57421875, 3.7421875, 3.91015625, 4.078125, 4.24609375, 4.4140625, 4.58203125, 4.75, 4.91796875, 5.0859375, 5.25390625, 5.421875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 5.0, 4.0, 8.0, 15.0, 13.0, 19.0, 21.0, 21.0, 31.0, 14.0, 22.0, 26.0, 36.0, 40.0, 37.0, 44.0, 35.0, 46.0, 45.0, 37.0, 35.0, 47.0, 47.0, 48.0, 38.0, 34.0, 19.0, 36.0, 22.0, 16.0, 17.0, 24.0, 16.0, 19.0, 10.0, 10.0, 9.0, 9.0, 3.0, 7.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.3515625, -4.2086181640625, -4.065673828125, -3.9227294921875, -3.77978515625, -3.6368408203125, -3.493896484375, -3.3509521484375, -3.2080078125, -3.0650634765625, -2.922119140625, -2.7791748046875, -2.63623046875, -2.4932861328125, -2.350341796875, -2.2073974609375, -2.064453125, -1.9215087890625, -1.778564453125, -1.6356201171875, -1.49267578125, -1.3497314453125, -1.206787109375, -1.0638427734375, -0.9208984375, -0.7779541015625, -0.635009765625, -0.4920654296875, -0.34912109375, -0.2061767578125, -0.063232421875, 0.0797119140625, 0.22265625, 0.3656005859375, 0.508544921875, 0.6514892578125, 0.79443359375, 0.9373779296875, 1.080322265625, 1.2232666015625, 1.3662109375, 1.5091552734375, 1.652099609375, 1.7950439453125, 1.93798828125, 2.0809326171875, 2.223876953125, 2.3668212890625, 2.509765625, 2.6527099609375, 2.795654296875, 2.9385986328125, 3.08154296875, 3.2244873046875, 3.367431640625, 3.5103759765625, 3.6533203125, 3.7962646484375, 3.939208984375, 4.0821533203125, 4.22509765625, 4.3680419921875, 4.510986328125, 4.6539306640625, 4.796875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 8.0, 9.0, 10.0, 16.0, 26.0, 25.0, 42.0, 75.0, 98.0, 213.0, 347.0, 764.0, 2157.0, 7639.0, 36531.0, 399223.0, 3459017.0, 252412.0, 26581.0, 5880.0, 1843.0, 668.0, 305.0, 126.0, 104.0, 57.0, 31.0, 23.0, 15.0, 14.0, 8.0, 6.0, 5.0, 6.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-23.875, -23.2845458984375, -22.694091796875, -22.1036376953125, -21.51318359375, -20.9227294921875, -20.332275390625, -19.7418212890625, -19.1513671875, -18.5609130859375, -17.970458984375, -17.3800048828125, -16.78955078125, -16.1990966796875, -15.608642578125, -15.0181884765625, -14.427734375, -13.8372802734375, -13.246826171875, -12.6563720703125, -12.06591796875, -11.4754638671875, -10.885009765625, -10.2945556640625, -9.7041015625, -9.1136474609375, -8.523193359375, -7.9327392578125, -7.34228515625, -6.7518310546875, -6.161376953125, -5.5709228515625, -4.98046875, -4.3900146484375, -3.799560546875, -3.2091064453125, -2.61865234375, -2.0281982421875, -1.437744140625, -0.8472900390625, -0.2568359375, 0.3336181640625, 0.924072265625, 1.5145263671875, 2.10498046875, 2.6954345703125, 3.285888671875, 3.8763427734375, 4.466796875, 5.0572509765625, 5.647705078125, 6.2381591796875, 6.82861328125, 7.4190673828125, 8.009521484375, 8.5999755859375, 9.1904296875, 9.7808837890625, 10.371337890625, 10.9617919921875, 11.55224609375, 12.1427001953125, 12.733154296875, 13.3236083984375, 13.9140625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 7.0, 1.0, 4.0, 7.0, 10.0, 8.0, 9.0, 20.0, 20.0, 20.0, 30.0, 58.0, 73.0, 116.0, 223.0, 351.0, 617.0, 742.0, 641.0, 414.0, 275.0, 150.0, 88.0, 71.0, 44.0, 23.0, 18.0, 15.0, 10.0, 4.0, 4.0, 3.0, 4.0, 3.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.71875, -18.14794921875, -17.5771484375, -17.00634765625, -16.435546875, -15.86474609375, -15.2939453125, -14.72314453125, -14.15234375, -13.58154296875, -13.0107421875, -12.43994140625, -11.869140625, -11.29833984375, -10.7275390625, -10.15673828125, -9.5859375, -9.01513671875, -8.4443359375, -7.87353515625, -7.302734375, -6.73193359375, -6.1611328125, -5.59033203125, -5.01953125, -4.44873046875, -3.8779296875, -3.30712890625, -2.736328125, -2.16552734375, -1.5947265625, -1.02392578125, -0.453125, 0.11767578125, 0.6884765625, 1.25927734375, 1.830078125, 2.40087890625, 2.9716796875, 3.54248046875, 4.11328125, 4.68408203125, 5.2548828125, 5.82568359375, 6.396484375, 6.96728515625, 7.5380859375, 8.10888671875, 8.6796875, 9.25048828125, 9.8212890625, 10.39208984375, 10.962890625, 11.53369140625, 12.1044921875, 12.67529296875, 13.24609375, 13.81689453125, 14.3876953125, 14.95849609375, 15.529296875, 16.10009765625, 16.6708984375, 17.24169921875, 17.8125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 4.0, 2.0, 8.0, 7.0, 6.0, 12.0, 34.0, 74.0, 144.0, 231.0, 220.0, 142.0, 60.0, 29.0, 15.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-219.93130493164062, -213.695068359375, -207.45883178710938, -201.2225799560547, -194.98634338378906, -188.75010681152344, -182.51385498046875, -176.27761840820312, -170.0413818359375, -163.80514526367188, -157.56890869140625, -151.33265686035156, -145.09642028808594, -138.8601837158203, -132.62393188476562, -126.3876953125, -120.15145874023438, -113.91522216796875, -107.6789779663086, -101.44273376464844, -95.20649719238281, -88.97026062011719, -82.73401641845703, -76.49777221679688, -70.26153564453125, -64.02529907226562, -57.78905487060547, -51.55281448364258, -45.31657409667969, -39.0803337097168, -32.844093322753906, -26.607852935791016, -20.371597290039062, -14.135356903076172, -7.899116516113281, -1.6628761291503906, 4.5733642578125, 10.80960464477539, 17.04584503173828, 23.282085418701172, 29.518325805664062, 35.75456619262695, 41.990806579589844, 48.227046966552734, 54.463287353515625, 60.699527740478516, 66.9357681274414, 73.17201232910156, 79.40824890136719, 85.64448547363281, 91.88072967529297, 98.11697387695312, 104.35321044921875, 110.58944702148438, 116.82569122314453, 123.06193542480469, 129.2981719970703, 135.53440856933594, 141.77066040039062, 148.00689697265625, 154.24313354492188, 160.4793701171875, 166.71560668945312, 172.9518585205078, 179.18809509277344]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 4.0, 5.0, 7.0, 6.0, 4.0, 9.0, 9.0, 19.0, 18.0, 25.0, 24.0, 34.0, 28.0, 34.0, 31.0, 42.0, 30.0, 39.0, 40.0, 38.0, 40.0, 48.0, 42.0, 54.0, 36.0, 51.0, 32.0, 37.0, 39.0, 26.0, 30.0, 12.0, 28.0, 15.0, 14.0, 8.0, 9.0, 6.0, 7.0, 5.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-76.9912109375, -74.47167205810547, -71.95213317871094, -69.4325942993164, -66.91305541992188, -64.39350891113281, -61.87397384643555, -59.35443115234375, -56.83489227294922, -54.31535339355469, -51.795814514160156, -49.276275634765625, -46.75673294067383, -44.2371940612793, -41.717655181884766, -39.19811248779297, -36.6785774230957, -34.15903854370117, -31.639497756958008, -29.119958877563477, -26.600418090820312, -24.08087921142578, -21.56134033203125, -19.041799545288086, -16.522260665893555, -14.002720832824707, -11.48318099975586, -8.963642120361328, -6.4441022872924805, -3.924562454223633, -1.4050235748291016, 1.1145172119140625, 3.6340560913085938, 6.153595924377441, 8.673135757446289, 11.19267463684082, 13.712214469909668, 16.231754302978516, 18.751293182373047, 21.27083396911621, 23.790372848510742, 26.309911727905273, 28.829452514648438, 31.34899139404297, 33.8685302734375, 36.38806915283203, 38.90760803222656, 41.42715072631836, 43.94668960571289, 46.46622848510742, 48.98576736450195, 51.50531005859375, 54.02484893798828, 56.54438781738281, 59.063926696777344, 61.583465576171875, 64.1030044555664, 66.62254333496094, 69.14208221435547, 71.66162109375, 74.18115997314453, 76.70069885253906, 79.22024536132812, 81.73978424072266, 84.25932312011719]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 10.0, 8.0, 25.0, 28.0, 49.0, 81.0, 117.0, 229.0, 434.0, 723.0, 1385.0, 2869.0, 6241.0, 14947.0, 41002.0, 155648.0, 542362.0, 202025.0, 49291.0, 17141.0, 7114.0, 3296.0, 1600.0, 847.0, 474.0, 238.0, 132.0, 95.0, 51.0, 34.0, 29.0, 13.0, 6.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.4453125, -14.01513671875, -13.5849609375, -13.15478515625, -12.724609375, -12.29443359375, -11.8642578125, -11.43408203125, -11.00390625, -10.57373046875, -10.1435546875, -9.71337890625, -9.283203125, -8.85302734375, -8.4228515625, -7.99267578125, -7.5625, -7.13232421875, -6.7021484375, -6.27197265625, -5.841796875, -5.41162109375, -4.9814453125, -4.55126953125, -4.12109375, -3.69091796875, -3.2607421875, -2.83056640625, -2.400390625, -1.97021484375, -1.5400390625, -1.10986328125, -0.6796875, -0.24951171875, 0.1806640625, 0.61083984375, 1.041015625, 1.47119140625, 1.9013671875, 2.33154296875, 2.76171875, 3.19189453125, 3.6220703125, 4.05224609375, 4.482421875, 4.91259765625, 5.3427734375, 5.77294921875, 6.203125, 6.63330078125, 7.0634765625, 7.49365234375, 7.923828125, 8.35400390625, 8.7841796875, 9.21435546875, 9.64453125, 10.07470703125, 10.5048828125, 10.93505859375, 11.365234375, 11.79541015625, 12.2255859375, 12.65576171875, 13.0859375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 6.0, 4.0, 13.0, 5.0, 12.0, 8.0, 14.0, 27.0, 19.0, 19.0, 22.0, 31.0, 35.0, 44.0, 29.0, 52.0, 45.0, 44.0, 37.0, 47.0, 48.0, 57.0, 39.0, 34.0, 24.0, 30.0, 33.0, 28.0, 29.0, 15.0, 23.0, 18.0, 21.0, 13.0, 20.0, 13.0, 9.0, 7.0, 5.0, 9.0, 5.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.2890625, -4.13543701171875, -3.9818115234375, -3.82818603515625, -3.674560546875, -3.52093505859375, -3.3673095703125, -3.21368408203125, -3.06005859375, -2.90643310546875, -2.7528076171875, -2.59918212890625, -2.445556640625, -2.29193115234375, -2.1383056640625, -1.98468017578125, -1.8310546875, -1.67742919921875, -1.5238037109375, -1.37017822265625, -1.216552734375, -1.06292724609375, -0.9093017578125, -0.75567626953125, -0.60205078125, -0.44842529296875, -0.2947998046875, -0.14117431640625, 0.012451171875, 0.16607666015625, 0.3197021484375, 0.47332763671875, 0.626953125, 0.78057861328125, 0.9342041015625, 1.08782958984375, 1.241455078125, 1.39508056640625, 1.5487060546875, 1.70233154296875, 1.85595703125, 2.00958251953125, 2.1632080078125, 2.31683349609375, 2.470458984375, 2.62408447265625, 2.7777099609375, 2.93133544921875, 3.0849609375, 3.23858642578125, 3.3922119140625, 3.54583740234375, 3.699462890625, 3.85308837890625, 4.0067138671875, 4.16033935546875, 4.31396484375, 4.46759033203125, 4.6212158203125, 4.77484130859375, 4.928466796875, 5.08209228515625, 5.2357177734375, 5.38934326171875, 5.54296875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 9.0, 7.0, 19.0, 15.0, 28.0, 23.0, 35.0, 45.0, 77.0, 91.0, 111.0, 185.0, 258.0, 455.0, 738.0, 1337.0, 2861.0, 7999.0, 30699.0, 253565.0, 676168.0, 54192.0, 11563.0, 3949.0, 1685.0, 859.0, 526.0, 347.0, 214.0, 134.0, 97.0, 93.0, 44.0, 32.0, 20.0, 20.0, 16.0, 7.0, 13.0, 10.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.25, -20.568115234375, -19.88623046875, -19.204345703125, -18.5224609375, -17.840576171875, -17.15869140625, -16.476806640625, -15.794921875, -15.113037109375, -14.43115234375, -13.749267578125, -13.0673828125, -12.385498046875, -11.70361328125, -11.021728515625, -10.33984375, -9.657958984375, -8.97607421875, -8.294189453125, -7.6123046875, -6.930419921875, -6.24853515625, -5.566650390625, -4.884765625, -4.202880859375, -3.52099609375, -2.839111328125, -2.1572265625, -1.475341796875, -0.79345703125, -0.111572265625, 0.5703125, 1.252197265625, 1.93408203125, 2.615966796875, 3.2978515625, 3.979736328125, 4.66162109375, 5.343505859375, 6.025390625, 6.707275390625, 7.38916015625, 8.071044921875, 8.7529296875, 9.434814453125, 10.11669921875, 10.798583984375, 11.48046875, 12.162353515625, 12.84423828125, 13.526123046875, 14.2080078125, 14.889892578125, 15.57177734375, 16.253662109375, 16.935546875, 17.617431640625, 18.29931640625, 18.981201171875, 19.6630859375, 20.344970703125, 21.02685546875, 21.708740234375, 22.390625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 12.0, 3.0, 9.0, 14.0, 16.0, 24.0, 22.0, 29.0, 44.0, 44.0, 45.0, 45.0, 42.0, 52.0, 62.0, 76.0, 45.0, 59.0, 50.0, 43.0, 40.0, 41.0, 22.0, 31.0, 19.0, 16.0, 20.0, 14.0, 18.0, 12.0, 4.0, 7.0, 8.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.484375, -22.6689453125, -21.853515625, -21.0380859375, -20.22265625, -19.4072265625, -18.591796875, -17.7763671875, -16.9609375, -16.1455078125, -15.330078125, -14.5146484375, -13.69921875, -12.8837890625, -12.068359375, -11.2529296875, -10.4375, -9.6220703125, -8.806640625, -7.9912109375, -7.17578125, -6.3603515625, -5.544921875, -4.7294921875, -3.9140625, -3.0986328125, -2.283203125, -1.4677734375, -0.65234375, 0.1630859375, 0.978515625, 1.7939453125, 2.609375, 3.4248046875, 4.240234375, 5.0556640625, 5.87109375, 6.6865234375, 7.501953125, 8.3173828125, 9.1328125, 9.9482421875, 10.763671875, 11.5791015625, 12.39453125, 13.2099609375, 14.025390625, 14.8408203125, 15.65625, 16.4716796875, 17.287109375, 18.1025390625, 18.91796875, 19.7333984375, 20.548828125, 21.3642578125, 22.1796875, 22.9951171875, 23.810546875, 24.6259765625, 25.44140625, 26.2568359375, 27.072265625, 27.8876953125, 28.703125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 6.0, 3.0, 12.0, 11.0, 12.0, 25.0, 33.0, 64.0, 80.0, 158.0, 274.0, 453.0, 1076.0, 2726.0, 8550.0, 36870.0, 250977.0, 658742.0, 67759.0, 13770.0, 3934.0, 1484.0, 662.0, 354.0, 219.0, 111.0, 58.0, 48.0, 29.0, 12.0, 11.0, 12.0, 7.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.30859375, -6.05804443359375, -5.8074951171875, -5.55694580078125, -5.306396484375, -5.05584716796875, -4.8052978515625, -4.55474853515625, -4.30419921875, -4.05364990234375, -3.8031005859375, -3.55255126953125, -3.302001953125, -3.05145263671875, -2.8009033203125, -2.55035400390625, -2.2998046875, -2.04925537109375, -1.7987060546875, -1.54815673828125, -1.297607421875, -1.04705810546875, -0.7965087890625, -0.54595947265625, -0.29541015625, -0.04486083984375, 0.2056884765625, 0.45623779296875, 0.706787109375, 0.95733642578125, 1.2078857421875, 1.45843505859375, 1.708984375, 1.95953369140625, 2.2100830078125, 2.46063232421875, 2.711181640625, 2.96173095703125, 3.2122802734375, 3.46282958984375, 3.71337890625, 3.96392822265625, 4.2144775390625, 4.46502685546875, 4.715576171875, 4.96612548828125, 5.2166748046875, 5.46722412109375, 5.7177734375, 5.96832275390625, 6.2188720703125, 6.46942138671875, 6.719970703125, 6.97052001953125, 7.2210693359375, 7.47161865234375, 7.72216796875, 7.97271728515625, 8.2232666015625, 8.47381591796875, 8.724365234375, 8.97491455078125, 9.2254638671875, 9.47601318359375, 9.7265625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 7.0, 6.0, 9.0, 6.0, 23.0, 22.0, 26.0, 24.0, 42.0, 43.0, 97.0, 144.0, 165.0, 131.0, 82.0, 41.0, 35.0, 29.0, 13.0, 12.0, 7.0, 12.0, 8.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017461776733398438, -0.0016715973615646362, -0.0015970170497894287, -0.0015224367380142212, -0.0014478564262390137, -0.0013732761144638062, -0.0012986958026885986, -0.0012241154909133911, -0.0011495351791381836, -0.001074954867362976, -0.0010003745555877686, -0.000925794243812561, -0.0008512139320373535, -0.000776633620262146, -0.0007020533084869385, -0.000627472996711731, -0.0005528926849365234, -0.0004783123731613159, -0.0004037320613861084, -0.0003291517496109009, -0.00025457143783569336, -0.00017999112606048584, -0.00010541081428527832, -3.08305025100708e-05, 4.374980926513672e-05, 0.00011833012104034424, 0.00019291043281555176, 0.0002674907445907593, 0.0003420710563659668, 0.0004166513681411743, 0.0004912316799163818, 0.0005658119916915894, 0.0006403923034667969, 0.0007149726152420044, 0.0007895529270172119, 0.0008641332387924194, 0.000938713550567627, 0.0010132938623428345, 0.001087874174118042, 0.0011624544858932495, 0.001237034797668457, 0.0013116151094436646, 0.001386195421218872, 0.0014607757329940796, 0.0015353560447692871, 0.0016099363565444946, 0.0016845166683197021, 0.0017590969800949097, 0.0018336772918701172, 0.0019082576036453247, 0.0019828379154205322, 0.0020574182271957397, 0.0021319985389709473, 0.002206578850746155, 0.0022811591625213623, 0.00235573947429657, 0.0024303197860717773, 0.002504900097846985, 0.0025794804096221924, 0.0026540607213974, 0.0027286410331726074, 0.002803221344947815, 0.0028778016567230225, 0.00295238196849823, 0.0030269622802734375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 8.0, 7.0, 18.0, 42.0, 62.0, 118.0, 216.0, 473.0, 1561.0, 7179.0, 132568.0, 875706.0, 25854.0, 3126.0, 997.0, 324.0, 136.0, 60.0, 39.0, 21.0, 14.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 6.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.1796875, -13.7261962890625, -13.272705078125, -12.8192138671875, -12.36572265625, -11.9122314453125, -11.458740234375, -11.0052490234375, -10.5517578125, -10.0982666015625, -9.644775390625, -9.1912841796875, -8.73779296875, -8.2843017578125, -7.830810546875, -7.3773193359375, -6.923828125, -6.4703369140625, -6.016845703125, -5.5633544921875, -5.10986328125, -4.6563720703125, -4.202880859375, -3.7493896484375, -3.2958984375, -2.8424072265625, -2.388916015625, -1.9354248046875, -1.48193359375, -1.0284423828125, -0.574951171875, -0.1214599609375, 0.33203125, 0.7855224609375, 1.239013671875, 1.6925048828125, 2.14599609375, 2.5994873046875, 3.052978515625, 3.5064697265625, 3.9599609375, 4.4134521484375, 4.866943359375, 5.3204345703125, 5.77392578125, 6.2274169921875, 6.680908203125, 7.1343994140625, 7.587890625, 8.0413818359375, 8.494873046875, 8.9483642578125, 9.40185546875, 9.8553466796875, 10.308837890625, 10.7623291015625, 11.2158203125, 11.6693115234375, 12.122802734375, 12.5762939453125, 13.02978515625, 13.4832763671875, 13.936767578125, 14.3902587890625, 14.84375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 4.0, 5.0, 11.0, 11.0, 23.0, 30.0, 36.0, 53.0, 79.0, 96.0, 110.0, 127.0, 113.0, 79.0, 64.0, 42.0, 23.0, 32.0, 15.0, 11.0, 7.0, 7.0, 5.0, 3.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.54296875, -5.30474853515625, -5.0665283203125, -4.82830810546875, -4.590087890625, -4.35186767578125, -4.1136474609375, -3.87542724609375, -3.63720703125, -3.39898681640625, -3.1607666015625, -2.92254638671875, -2.684326171875, -2.44610595703125, -2.2078857421875, -1.96966552734375, -1.7314453125, -1.49322509765625, -1.2550048828125, -1.01678466796875, -0.778564453125, -0.54034423828125, -0.3021240234375, -0.06390380859375, 0.17431640625, 0.41253662109375, 0.6507568359375, 0.88897705078125, 1.127197265625, 1.36541748046875, 1.6036376953125, 1.84185791015625, 2.080078125, 2.31829833984375, 2.5565185546875, 2.79473876953125, 3.032958984375, 3.27117919921875, 3.5093994140625, 3.74761962890625, 3.98583984375, 4.22406005859375, 4.4622802734375, 4.70050048828125, 4.938720703125, 5.17694091796875, 5.4151611328125, 5.65338134765625, 5.8916015625, 6.12982177734375, 6.3680419921875, 6.60626220703125, 6.844482421875, 7.08270263671875, 7.3209228515625, 7.55914306640625, 7.79736328125, 8.03558349609375, 8.2738037109375, 8.51202392578125, 8.750244140625, 8.98846435546875, 9.2266845703125, 9.46490478515625, 9.703125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 5.0, 10.0, 11.0, 53.0, 220.0, 453.0, 176.0, 49.0, 12.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-262.339111328125, -252.47108459472656, -242.6030731201172, -232.73504638671875, -222.8670196533203, -212.99899291992188, -203.1309814453125, -193.26295471191406, -183.39492797851562, -173.5269012451172, -163.6588897705078, -153.79086303710938, -143.92283630371094, -134.0548095703125, -124.18679809570312, -114.31877136230469, -104.45075988769531, -94.5827407836914, -84.71471405029297, -74.84669494628906, -64.97866821289062, -55.11064910888672, -45.24263000488281, -35.374603271484375, -25.50658416748047, -15.638562202453613, -5.770540237426758, 4.097480773925781, 13.965503692626953, 23.833526611328125, 33.70154571533203, 43.56957244873047, 53.437591552734375, 63.30561447143555, 73.17363739013672, 83.04165649414062, 92.90968322753906, 102.77770233154297, 112.64572143554688, 122.51374816894531, 132.38177490234375, 142.2498016357422, 152.11781311035156, 161.98583984375, 171.85386657714844, 181.72189331054688, 191.58990478515625, 201.4579315185547, 211.32594299316406, 221.1939697265625, 231.06198120117188, 240.9300079345703, 250.79803466796875, 260.6660461425781, 270.5340576171875, 280.402099609375, 290.2701110839844, 300.13812255859375, 310.00616455078125, 319.8741760253906, 329.7421875, 339.6102294921875, 349.4782409667969, 359.34625244140625, 369.21429443359375]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 2.0, 6.0, 8.0, 5.0, 10.0, 15.0, 20.0, 25.0, 16.0, 23.0, 26.0, 49.0, 38.0, 24.0, 35.0, 51.0, 45.0, 61.0, 62.0, 54.0, 69.0, 40.0, 35.0, 26.0, 36.0, 20.0, 26.0, 28.0, 21.0, 21.0, 21.0, 11.0, 11.0, 11.0, 12.0, 7.0, 5.0, 5.0, 2.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-86.5633773803711, -83.81790924072266, -81.07244110107422, -78.32697296142578, -75.58150482177734, -72.8360366821289, -70.09056091308594, -67.3450927734375, -64.59962463378906, -61.854156494140625, -59.10868835449219, -56.36322021484375, -53.61775207519531, -50.872283935546875, -48.12681198120117, -45.381343841552734, -42.63587951660156, -39.890411376953125, -37.14494323730469, -34.39947509765625, -31.65400505065918, -28.908536911010742, -26.163066864013672, -23.417598724365234, -20.672130584716797, -17.92666244506836, -15.181193351745605, -12.435724258422852, -9.690256118774414, -6.944787979125977, -4.199317932128906, -1.4538497924804688, 1.2916107177734375, 4.037079334259033, 6.782547950744629, 9.528017044067383, 12.27348518371582, 15.018953323364258, 17.764423370361328, 20.509891510009766, 23.255359649658203, 26.00082778930664, 28.746295928955078, 31.49176597595215, 34.23723602294922, 36.982704162597656, 39.728172302246094, 42.47364044189453, 45.21910858154297, 47.964576721191406, 50.710044860839844, 53.45551300048828, 56.20098114013672, 58.946449279785156, 61.69192123413086, 64.43739318847656, 67.182861328125, 69.92832946777344, 72.67379760742188, 75.41926574707031, 78.16473388671875, 80.91020202636719, 83.65567016601562, 86.40113830566406, 89.1466064453125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 7.0, 3.0, 6.0, 11.0, 8.0, 20.0, 27.0, 43.0, 66.0, 94.0, 128.0, 195.0, 258.0, 462.0, 731.0, 1177.0, 1988.0, 3602.0, 7091.0, 16210.0, 45365.0, 175023.0, 871936.0, 2102910.0, 744935.0, 151329.0, 40678.0, 14937.0, 6740.0, 3302.0, 1888.0, 1072.0, 631.0, 478.0, 252.0, 216.0, 150.0, 101.0, 58.0, 44.0, 29.0, 18.0, 17.0, 18.0, 11.0, 9.0, 3.0, 7.0, 2.0, 2.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.37890625, -5.18988037109375, -5.0008544921875, -4.81182861328125, -4.622802734375, -4.43377685546875, -4.2447509765625, -4.05572509765625, -3.86669921875, -3.67767333984375, -3.4886474609375, -3.29962158203125, -3.110595703125, -2.92156982421875, -2.7325439453125, -2.54351806640625, -2.3544921875, -2.16546630859375, -1.9764404296875, -1.78741455078125, -1.598388671875, -1.40936279296875, -1.2203369140625, -1.03131103515625, -0.84228515625, -0.65325927734375, -0.4642333984375, -0.27520751953125, -0.086181640625, 0.10284423828125, 0.2918701171875, 0.48089599609375, 0.669921875, 0.85894775390625, 1.0479736328125, 1.23699951171875, 1.426025390625, 1.61505126953125, 1.8040771484375, 1.99310302734375, 2.18212890625, 2.37115478515625, 2.5601806640625, 2.74920654296875, 2.938232421875, 3.12725830078125, 3.3162841796875, 3.50531005859375, 3.6943359375, 3.88336181640625, 4.0723876953125, 4.26141357421875, 4.450439453125, 4.63946533203125, 4.8284912109375, 5.01751708984375, 5.20654296875, 5.39556884765625, 5.5845947265625, 5.77362060546875, 5.962646484375, 6.15167236328125, 6.3406982421875, 6.52972412109375, 6.71875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 4.0, 3.0, 9.0, 5.0, 5.0, 7.0, 11.0, 13.0, 14.0, 18.0, 21.0, 23.0, 39.0, 31.0, 42.0, 40.0, 36.0, 41.0, 44.0, 57.0, 45.0, 46.0, 51.0, 48.0, 51.0, 30.0, 29.0, 43.0, 33.0, 27.0, 18.0, 20.0, 23.0, 22.0, 16.0, 7.0, 7.0, 11.0, 3.0, 8.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.1640625, -5.995361328125, -5.82666015625, -5.657958984375, -5.4892578125, -5.320556640625, -5.15185546875, -4.983154296875, -4.814453125, -4.645751953125, -4.47705078125, -4.308349609375, -4.1396484375, -3.970947265625, -3.80224609375, -3.633544921875, -3.46484375, -3.296142578125, -3.12744140625, -2.958740234375, -2.7900390625, -2.621337890625, -2.45263671875, -2.283935546875, -2.115234375, -1.946533203125, -1.77783203125, -1.609130859375, -1.4404296875, -1.271728515625, -1.10302734375, -0.934326171875, -0.765625, -0.596923828125, -0.42822265625, -0.259521484375, -0.0908203125, 0.077880859375, 0.24658203125, 0.415283203125, 0.583984375, 0.752685546875, 0.92138671875, 1.090087890625, 1.2587890625, 1.427490234375, 1.59619140625, 1.764892578125, 1.93359375, 2.102294921875, 2.27099609375, 2.439697265625, 2.6083984375, 2.777099609375, 2.94580078125, 3.114501953125, 3.283203125, 3.451904296875, 3.62060546875, 3.789306640625, 3.9580078125, 4.126708984375, 4.29541015625, 4.464111328125, 4.6328125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 1.0, 3.0, 4.0, 2.0, 5.0, 5.0, 11.0, 12.0, 11.0, 17.0, 20.0, 32.0, 29.0, 69.0, 78.0, 168.0, 239.0, 402.0, 833.0, 1607.0, 3894.0, 9824.0, 31917.0, 177695.0, 2618141.0, 1219282.0, 94173.0, 22238.0, 7615.0, 3002.0, 1293.0, 626.0, 379.0, 232.0, 139.0, 94.0, 49.0, 45.0, 30.0, 14.0, 9.0, 14.0, 7.0, 5.0, 1.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-13.8671875, -13.4449462890625, -13.022705078125, -12.6004638671875, -12.17822265625, -11.7559814453125, -11.333740234375, -10.9114990234375, -10.4892578125, -10.0670166015625, -9.644775390625, -9.2225341796875, -8.80029296875, -8.3780517578125, -7.955810546875, -7.5335693359375, -7.111328125, -6.6890869140625, -6.266845703125, -5.8446044921875, -5.42236328125, -5.0001220703125, -4.577880859375, -4.1556396484375, -3.7333984375, -3.3111572265625, -2.888916015625, -2.4666748046875, -2.04443359375, -1.6221923828125, -1.199951171875, -0.7777099609375, -0.35546875, 0.0667724609375, 0.489013671875, 0.9112548828125, 1.33349609375, 1.7557373046875, 2.177978515625, 2.6002197265625, 3.0224609375, 3.4447021484375, 3.866943359375, 4.2891845703125, 4.71142578125, 5.1336669921875, 5.555908203125, 5.9781494140625, 6.400390625, 6.8226318359375, 7.244873046875, 7.6671142578125, 8.08935546875, 8.5115966796875, 8.933837890625, 9.3560791015625, 9.7783203125, 10.2005615234375, 10.622802734375, 11.0450439453125, 11.46728515625, 11.8895263671875, 12.311767578125, 12.7340087890625, 13.15625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 9.0, 6.0, 9.0, 11.0, 8.0, 24.0, 31.0, 34.0, 41.0, 97.0, 137.0, 266.0, 363.0, 660.0, 713.0, 621.0, 389.0, 217.0, 145.0, 90.0, 60.0, 31.0, 24.0, 21.0, 14.0, 11.0, 9.0, 7.0, 7.0, 7.0, 0.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0, -13.5087890625, -13.017578125, -12.5263671875, -12.03515625, -11.5439453125, -11.052734375, -10.5615234375, -10.0703125, -9.5791015625, -9.087890625, -8.5966796875, -8.10546875, -7.6142578125, -7.123046875, -6.6318359375, -6.140625, -5.6494140625, -5.158203125, -4.6669921875, -4.17578125, -3.6845703125, -3.193359375, -2.7021484375, -2.2109375, -1.7197265625, -1.228515625, -0.7373046875, -0.24609375, 0.2451171875, 0.736328125, 1.2275390625, 1.71875, 2.2099609375, 2.701171875, 3.1923828125, 3.68359375, 4.1748046875, 4.666015625, 5.1572265625, 5.6484375, 6.1396484375, 6.630859375, 7.1220703125, 7.61328125, 8.1044921875, 8.595703125, 9.0869140625, 9.578125, 10.0693359375, 10.560546875, 11.0517578125, 11.54296875, 12.0341796875, 12.525390625, 13.0166015625, 13.5078125, 13.9990234375, 14.490234375, 14.9814453125, 15.47265625, 15.9638671875, 16.455078125, 16.9462890625, 17.4375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 8.0, 12.0, 19.0, 68.0, 118.0, 238.0, 256.0, 141.0, 65.0, 35.0, 14.0, 5.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-261.55029296875, -255.4888916015625, -249.427490234375, -243.3660888671875, -237.3046875, -231.2432861328125, -225.181884765625, -219.1204833984375, -213.05908203125, -206.9976806640625, -200.936279296875, -194.8748779296875, -188.8134765625, -182.7520751953125, -176.690673828125, -170.6292724609375, -164.56787109375, -158.5064697265625, -152.445068359375, -146.3836669921875, -140.322265625, -134.2608642578125, -128.199462890625, -122.1380615234375, -116.07667541503906, -110.01527404785156, -103.95387268066406, -97.89247131347656, -91.83106994628906, -85.76966857910156, -79.70826721191406, -73.64686584472656, -67.5854721069336, -61.524070739746094, -55.462669372558594, -49.401268005371094, -43.339866638183594, -37.278465270996094, -31.21706771850586, -25.15566635131836, -19.09426498413086, -13.03286361694336, -6.971463203430176, -0.9100627899169922, 5.151338577270508, 11.212739944458008, 17.274139404296875, 23.335540771484375, 29.396942138671875, 35.458343505859375, 41.519744873046875, 47.581146240234375, 53.642547607421875, 59.703948974609375, 65.76535034179688, 71.82675170898438, 77.88815307617188, 83.94955444335938, 90.01095581054688, 96.07235717773438, 102.13375854492188, 108.19515991210938, 114.25656127929688, 120.31796264648438, 126.37935638427734]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 7.0, 7.0, 6.0, 9.0, 10.0, 12.0, 20.0, 17.0, 21.0, 27.0, 31.0, 31.0, 38.0, 37.0, 46.0, 36.0, 46.0, 50.0, 62.0, 39.0, 30.0, 41.0, 50.0, 44.0, 37.0, 32.0, 48.0, 27.0, 29.0, 28.0, 13.0, 17.0, 17.0, 9.0, 5.0, 4.0, 5.0, 8.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.16746520996094, -72.04879760742188, -69.93013000488281, -67.81146240234375, -65.69279479980469, -63.57412338256836, -61.45545196533203, -59.33678436279297, -57.218116760253906, -55.099449157714844, -52.98078155517578, -50.86211013793945, -48.74344253540039, -46.62477493286133, -44.506103515625, -42.38743591308594, -40.268768310546875, -38.15010070800781, -36.03143310546875, -33.91276168823242, -31.79409408569336, -29.675426483154297, -27.5567569732666, -25.438087463378906, -23.319419860839844, -21.20075225830078, -19.082082748413086, -16.96341323852539, -14.844745635986328, -12.72607707977295, -10.60740852355957, -8.488739967346191, -6.370079040527344, -4.251410484313965, -2.132741928100586, -0.014073371887207031, 2.104595184326172, 4.223263740539551, 6.34193229675293, 8.460600852966309, 10.579269409179688, 12.697937965393066, 14.816606521606445, 16.93527603149414, 19.053943634033203, 21.172611236572266, 23.29128074645996, 25.409950256347656, 27.52861785888672, 29.64728546142578, 31.765954971313477, 33.88462448120117, 36.003292083740234, 38.1219596862793, 40.240631103515625, 42.35929870605469, 44.47796630859375, 46.59663391113281, 48.715301513671875, 50.8339729309082, 52.952640533447266, 55.07130813598633, 57.189979553222656, 59.30864715576172, 61.42731475830078]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 4.0, 10.0, 18.0, 19.0, 29.0, 42.0, 59.0, 84.0, 154.0, 191.0, 247.0, 365.0, 511.0, 777.0, 1290.0, 1986.0, 3118.0, 5739.0, 11306.0, 24367.0, 60415.0, 159556.0, 321306.0, 264844.0, 111233.0, 42472.0, 17635.0, 8565.0, 4596.0, 2668.0, 1657.0, 1049.0, 681.0, 474.0, 378.0, 201.0, 164.0, 90.0, 83.0, 48.0, 37.0, 22.0, 16.0, 18.0, 13.0, 3.0, 3.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.48046875, -5.296630859375, -5.11279296875, -4.928955078125, -4.7451171875, -4.561279296875, -4.37744140625, -4.193603515625, -4.009765625, -3.825927734375, -3.64208984375, -3.458251953125, -3.2744140625, -3.090576171875, -2.90673828125, -2.722900390625, -2.5390625, -2.355224609375, -2.17138671875, -1.987548828125, -1.8037109375, -1.619873046875, -1.43603515625, -1.252197265625, -1.068359375, -0.884521484375, -0.70068359375, -0.516845703125, -0.3330078125, -0.149169921875, 0.03466796875, 0.218505859375, 0.40234375, 0.586181640625, 0.77001953125, 0.953857421875, 1.1376953125, 1.321533203125, 1.50537109375, 1.689208984375, 1.873046875, 2.056884765625, 2.24072265625, 2.424560546875, 2.6083984375, 2.792236328125, 2.97607421875, 3.159912109375, 3.34375, 3.527587890625, 3.71142578125, 3.895263671875, 4.0791015625, 4.262939453125, 4.44677734375, 4.630615234375, 4.814453125, 4.998291015625, 5.18212890625, 5.365966796875, 5.5498046875, 5.733642578125, 5.91748046875, 6.101318359375, 6.28515625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 10.0, 8.0, 14.0, 15.0, 13.0, 17.0, 13.0, 22.0, 34.0, 27.0, 30.0, 40.0, 39.0, 46.0, 50.0, 48.0, 53.0, 49.0, 55.0, 46.0, 46.0, 36.0, 26.0, 37.0, 38.0, 24.0, 27.0, 27.0, 16.0, 18.0, 12.0, 18.0, 12.0, 9.0, 5.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.48828125, -5.3125, -5.13671875, -4.9609375, -4.78515625, -4.609375, -4.43359375, -4.2578125, -4.08203125, -3.90625, -3.73046875, -3.5546875, -3.37890625, -3.203125, -3.02734375, -2.8515625, -2.67578125, -2.5, -2.32421875, -2.1484375, -1.97265625, -1.796875, -1.62109375, -1.4453125, -1.26953125, -1.09375, -0.91796875, -0.7421875, -0.56640625, -0.390625, -0.21484375, -0.0390625, 0.13671875, 0.3125, 0.48828125, 0.6640625, 0.83984375, 1.015625, 1.19140625, 1.3671875, 1.54296875, 1.71875, 1.89453125, 2.0703125, 2.24609375, 2.421875, 2.59765625, 2.7734375, 2.94921875, 3.125, 3.30078125, 3.4765625, 3.65234375, 3.828125, 4.00390625, 4.1796875, 4.35546875, 4.53125, 4.70703125, 4.8828125, 5.05859375, 5.234375, 5.41015625, 5.5859375, 5.76171875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 13.0, 11.0, 12.0, 20.0, 27.0, 40.0, 50.0, 83.0, 105.0, 160.0, 273.0, 527.0, 1123.0, 2513.0, 7604.0, 32559.0, 242422.0, 661716.0, 77561.0, 14321.0, 4129.0, 1593.0, 732.0, 352.0, 187.0, 111.0, 96.0, 41.0, 48.0, 28.0, 20.0, 14.0, 11.0, 14.0, 5.0, 4.0, 4.0, 3.0, 3.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.953125, -12.524658203125, -12.09619140625, -11.667724609375, -11.2392578125, -10.810791015625, -10.38232421875, -9.953857421875, -9.525390625, -9.096923828125, -8.66845703125, -8.239990234375, -7.8115234375, -7.383056640625, -6.95458984375, -6.526123046875, -6.09765625, -5.669189453125, -5.24072265625, -4.812255859375, -4.3837890625, -3.955322265625, -3.52685546875, -3.098388671875, -2.669921875, -2.241455078125, -1.81298828125, -1.384521484375, -0.9560546875, -0.527587890625, -0.09912109375, 0.329345703125, 0.7578125, 1.186279296875, 1.61474609375, 2.043212890625, 2.4716796875, 2.900146484375, 3.32861328125, 3.757080078125, 4.185546875, 4.614013671875, 5.04248046875, 5.470947265625, 5.8994140625, 6.327880859375, 6.75634765625, 7.184814453125, 7.61328125, 8.041748046875, 8.47021484375, 8.898681640625, 9.3271484375, 9.755615234375, 10.18408203125, 10.612548828125, 11.041015625, 11.469482421875, 11.89794921875, 12.326416015625, 12.7548828125, 13.183349609375, 13.61181640625, 14.040283203125, 14.46875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 7.0, 12.0, 9.0, 22.0, 22.0, 13.0, 22.0, 35.0, 36.0, 42.0, 43.0, 56.0, 45.0, 55.0, 61.0, 60.0, 70.0, 49.0, 63.0, 43.0, 43.0, 36.0, 30.0, 19.0, 22.0, 21.0, 12.0, 11.0, 7.0, 8.0, 5.0, 3.0, 0.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.4375, -25.617431640625, -24.79736328125, -23.977294921875, -23.1572265625, -22.337158203125, -21.51708984375, -20.697021484375, -19.876953125, -19.056884765625, -18.23681640625, -17.416748046875, -16.5966796875, -15.776611328125, -14.95654296875, -14.136474609375, -13.31640625, -12.496337890625, -11.67626953125, -10.856201171875, -10.0361328125, -9.216064453125, -8.39599609375, -7.575927734375, -6.755859375, -5.935791015625, -5.11572265625, -4.295654296875, -3.4755859375, -2.655517578125, -1.83544921875, -1.015380859375, -0.1953125, 0.624755859375, 1.44482421875, 2.264892578125, 3.0849609375, 3.905029296875, 4.72509765625, 5.545166015625, 6.365234375, 7.185302734375, 8.00537109375, 8.825439453125, 9.6455078125, 10.465576171875, 11.28564453125, 12.105712890625, 12.92578125, 13.745849609375, 14.56591796875, 15.385986328125, 16.2060546875, 17.026123046875, 17.84619140625, 18.666259765625, 19.486328125, 20.306396484375, 21.12646484375, 21.946533203125, 22.7666015625, 23.586669921875, 24.40673828125, 25.226806640625, 26.046875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 5.0, 8.0, 13.0, 13.0, 25.0, 37.0, 60.0, 93.0, 153.0, 283.0, 492.0, 1037.0, 2448.0, 6519.0, 21373.0, 95531.0, 615913.0, 239648.0, 45499.0, 12065.0, 4118.0, 1585.0, 744.0, 364.0, 199.0, 119.0, 54.0, 52.0, 27.0, 31.0, 13.0, 12.0, 4.0, 6.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.1015625, -4.954833984375, -4.80810546875, -4.661376953125, -4.5146484375, -4.367919921875, -4.22119140625, -4.074462890625, -3.927734375, -3.781005859375, -3.63427734375, -3.487548828125, -3.3408203125, -3.194091796875, -3.04736328125, -2.900634765625, -2.75390625, -2.607177734375, -2.46044921875, -2.313720703125, -2.1669921875, -2.020263671875, -1.87353515625, -1.726806640625, -1.580078125, -1.433349609375, -1.28662109375, -1.139892578125, -0.9931640625, -0.846435546875, -0.69970703125, -0.552978515625, -0.40625, -0.259521484375, -0.11279296875, 0.033935546875, 0.1806640625, 0.327392578125, 0.47412109375, 0.620849609375, 0.767578125, 0.914306640625, 1.06103515625, 1.207763671875, 1.3544921875, 1.501220703125, 1.64794921875, 1.794677734375, 1.94140625, 2.088134765625, 2.23486328125, 2.381591796875, 2.5283203125, 2.675048828125, 2.82177734375, 2.968505859375, 3.115234375, 3.261962890625, 3.40869140625, 3.555419921875, 3.7021484375, 3.848876953125, 3.99560546875, 4.142333984375, 4.2890625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 2.0, 1.0, 5.0, 4.0, 7.0, 3.0, 8.0, 6.0, 16.0, 20.0, 27.0, 55.0, 84.0, 101.0, 113.0, 131.0, 107.0, 89.0, 69.0, 49.0, 40.0, 18.0, 20.0, 5.0, 8.0, 4.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013494491577148438, -0.0013061314821243286, -0.0012628138065338135, -0.0012194961309432983, -0.0011761784553527832, -0.001132860779762268, -0.001089543104171753, -0.0010462254285812378, -0.0010029077529907227, -0.0009595900774002075, -0.0009162724018096924, -0.0008729547262191772, -0.0008296370506286621, -0.000786319375038147, -0.0007430016994476318, -0.0006996840238571167, -0.0006563663482666016, -0.0006130486726760864, -0.0005697309970855713, -0.0005264133214950562, -0.000483095645904541, -0.0004397779703140259, -0.00039646029472351074, -0.0003531426191329956, -0.00030982494354248047, -0.00026650726795196533, -0.0002231895923614502, -0.00017987191677093506, -0.00013655424118041992, -9.323656558990479e-05, -4.991888999938965e-05, -6.601214408874512e-06, 3.6716461181640625e-05, 8.003413677215576e-05, 0.0001233518123626709, 0.00016666948795318604, 0.00020998716354370117, 0.0002533048391342163, 0.00029662251472473145, 0.0003399401903152466, 0.0003832578659057617, 0.00042657554149627686, 0.000469893217086792, 0.0005132108926773071, 0.0005565285682678223, 0.0005998462438583374, 0.0006431639194488525, 0.0006864815950393677, 0.0007297992706298828, 0.000773116946220398, 0.0008164346218109131, 0.0008597522974014282, 0.0009030699729919434, 0.0009463876485824585, 0.0009897053241729736, 0.0010330229997634888, 0.001076340675354004, 0.001119658350944519, 0.0011629760265350342, 0.0012062937021255493, 0.0012496113777160645, 0.0012929290533065796, 0.0013362467288970947, 0.0013795644044876099, 0.001422882080078125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 6.0, 5.0, 15.0, 19.0, 17.0, 33.0, 49.0, 87.0, 181.0, 330.0, 910.0, 2626.0, 10996.0, 78738.0, 750783.0, 177293.0, 20050.0, 4127.0, 1275.0, 475.0, 228.0, 118.0, 68.0, 45.0, 29.0, 18.0, 17.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.640625, -7.4136962890625, -7.186767578125, -6.9598388671875, -6.73291015625, -6.5059814453125, -6.279052734375, -6.0521240234375, -5.8251953125, -5.5982666015625, -5.371337890625, -5.1444091796875, -4.91748046875, -4.6905517578125, -4.463623046875, -4.2366943359375, -4.009765625, -3.7828369140625, -3.555908203125, -3.3289794921875, -3.10205078125, -2.8751220703125, -2.648193359375, -2.4212646484375, -2.1943359375, -1.9674072265625, -1.740478515625, -1.5135498046875, -1.28662109375, -1.0596923828125, -0.832763671875, -0.6058349609375, -0.37890625, -0.1519775390625, 0.074951171875, 0.3018798828125, 0.52880859375, 0.7557373046875, 0.982666015625, 1.2095947265625, 1.4365234375, 1.6634521484375, 1.890380859375, 2.1173095703125, 2.34423828125, 2.5711669921875, 2.798095703125, 3.0250244140625, 3.251953125, 3.4788818359375, 3.705810546875, 3.9327392578125, 4.15966796875, 4.3865966796875, 4.613525390625, 4.8404541015625, 5.0673828125, 5.2943115234375, 5.521240234375, 5.7481689453125, 5.97509765625, 6.2020263671875, 6.428955078125, 6.6558837890625, 6.8828125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 9.0, 8.0, 7.0, 8.0, 4.0, 10.0, 22.0, 25.0, 38.0, 33.0, 44.0, 69.0, 76.0, 97.0, 85.0, 87.0, 87.0, 72.0, 68.0, 34.0, 30.0, 19.0, 21.0, 15.0, 8.0, 9.0, 7.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.125, -5.967132568359375, -5.80926513671875, -5.651397705078125, -5.4935302734375, -5.335662841796875, -5.17779541015625, -5.019927978515625, -4.862060546875, -4.704193115234375, -4.54632568359375, -4.388458251953125, -4.2305908203125, -4.072723388671875, -3.91485595703125, -3.756988525390625, -3.59912109375, -3.441253662109375, -3.28338623046875, -3.125518798828125, -2.9676513671875, -2.809783935546875, -2.65191650390625, -2.494049072265625, -2.336181640625, -2.178314208984375, -2.02044677734375, -1.862579345703125, -1.7047119140625, -1.546844482421875, -1.38897705078125, -1.231109619140625, -1.0732421875, -0.915374755859375, -0.75750732421875, -0.599639892578125, -0.4417724609375, -0.283905029296875, -0.12603759765625, 0.031829833984375, 0.189697265625, 0.347564697265625, 0.50543212890625, 0.663299560546875, 0.8211669921875, 0.979034423828125, 1.13690185546875, 1.294769287109375, 1.45263671875, 1.610504150390625, 1.76837158203125, 1.926239013671875, 2.0841064453125, 2.241973876953125, 2.39984130859375, 2.557708740234375, 2.715576171875, 2.873443603515625, 3.03131103515625, 3.189178466796875, 3.3470458984375, 3.504913330078125, 3.66278076171875, 3.820648193359375, 3.978515625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 7.0, 5.0, 14.0, 20.0, 45.0, 101.0, 163.0, 295.0, 156.0, 93.0, 52.0, 20.0, 5.0, 7.0, 3.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-138.56491088867188, -134.87120056152344, -131.17750549316406, -127.48379516601562, -123.79009246826172, -120.09638977050781, -116.4026870727539, -112.708984375, -109.01527404785156, -105.32157135009766, -101.62786865234375, -97.93415832519531, -94.2404556274414, -90.5467529296875, -86.8530502319336, -83.15934753417969, -79.46564483642578, -75.77194213867188, -72.07823944091797, -68.38453674316406, -64.69082641601562, -60.99712371826172, -57.30342102050781, -53.609718322753906, -49.916011810302734, -46.22230911254883, -42.528602600097656, -38.83489990234375, -35.141197204589844, -31.447490692138672, -27.753787994384766, -24.060083389282227, -20.366371154785156, -16.672666549682617, -12.978962898254395, -9.285259246826172, -5.591554641723633, -1.8978500366210938, 1.7958526611328125, 5.489557266235352, 9.18326187133789, 12.87696647644043, 16.57067108154297, 20.264373779296875, 23.958078384399414, 27.651782989501953, 31.34548568725586, 35.03919219970703, 38.73289489746094, 42.426597595214844, 46.120304107666016, 49.81400680541992, 53.507713317871094, 57.201416015625, 60.895118713378906, 64.58882141113281, 68.28253173828125, 71.97623443603516, 75.66993713378906, 79.3636474609375, 83.0573501586914, 86.75105285644531, 90.44475555419922, 94.13845825195312, 97.83216094970703]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 2.0, 1.0, 4.0, 9.0, 7.0, 13.0, 14.0, 15.0, 17.0, 19.0, 16.0, 27.0, 24.0, 23.0, 23.0, 28.0, 40.0, 48.0, 51.0, 64.0, 64.0, 70.0, 60.0, 51.0, 35.0, 44.0, 23.0, 34.0, 24.0, 17.0, 19.0, 13.0, 14.0, 16.0, 13.0, 8.0, 16.0, 5.0, 7.0, 5.0, 6.0, 3.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-88.7977066040039, -86.15140533447266, -83.5051040649414, -80.85880279541016, -78.21249389648438, -75.56619262695312, -72.91989135742188, -70.27359008789062, -67.62728881835938, -64.98098754882812, -62.334686279296875, -59.68838119506836, -57.04207992553711, -54.39577865600586, -51.749473571777344, -49.103172302246094, -46.456871032714844, -43.810569763183594, -41.164268493652344, -38.51796340942383, -35.87166213989258, -33.22536087036133, -30.579057693481445, -27.932754516601562, -25.286453247070312, -22.640151977539062, -19.99384880065918, -17.347545623779297, -14.701244354248047, -12.05494213104248, -9.408639907836914, -6.762336730957031, -4.1160430908203125, -1.469740867614746, 1.1765613555908203, 3.8228635787963867, 6.469165802001953, 9.11546802520752, 11.761770248413086, 14.408073425292969, 17.05437469482422, 19.70067596435547, 22.34697914123535, 24.993282318115234, 27.639583587646484, 30.285884857177734, 32.93218994140625, 35.5784912109375, 38.22479248046875, 40.87109375, 43.51739501953125, 46.163700103759766, 48.810001373291016, 51.456302642822266, 54.10260772705078, 56.74890899658203, 59.39521026611328, 62.04151153564453, 64.68781280517578, 67.33411407470703, 69.98042297363281, 72.62672424316406, 75.27302551269531, 77.91932678222656, 80.56562805175781]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 10.0, 8.0, 16.0, 17.0, 33.0, 52.0, 71.0, 105.0, 154.0, 239.0, 407.0, 681.0, 1216.0, 2088.0, 4503.0, 10306.0, 31544.0, 150012.0, 949080.0, 2319147.0, 593007.0, 94542.0, 21520.0, 7737.0, 3387.0, 1783.0, 985.0, 583.0, 364.0, 228.0, 139.0, 94.0, 56.0, 39.0, 31.0, 25.0, 28.0, 14.0, 5.0, 13.0, 3.0, 6.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.73046875, -5.51312255859375, -5.2957763671875, -5.07843017578125, -4.861083984375, -4.64373779296875, -4.4263916015625, -4.20904541015625, -3.99169921875, -3.77435302734375, -3.5570068359375, -3.33966064453125, -3.122314453125, -2.90496826171875, -2.6876220703125, -2.47027587890625, -2.2529296875, -2.03558349609375, -1.8182373046875, -1.60089111328125, -1.383544921875, -1.16619873046875, -0.9488525390625, -0.73150634765625, -0.51416015625, -0.29681396484375, -0.0794677734375, 0.13787841796875, 0.355224609375, 0.57257080078125, 0.7899169921875, 1.00726318359375, 1.224609375, 1.44195556640625, 1.6593017578125, 1.87664794921875, 2.093994140625, 2.31134033203125, 2.5286865234375, 2.74603271484375, 2.96337890625, 3.18072509765625, 3.3980712890625, 3.61541748046875, 3.832763671875, 4.05010986328125, 4.2674560546875, 4.48480224609375, 4.7021484375, 4.91949462890625, 5.1368408203125, 5.35418701171875, 5.571533203125, 5.78887939453125, 6.0062255859375, 6.22357177734375, 6.44091796875, 6.65826416015625, 6.8756103515625, 7.09295654296875, 7.310302734375, 7.52764892578125, 7.7449951171875, 7.96234130859375, 8.1796875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 1.0, 4.0, 2.0, 6.0, 10.0, 11.0, 16.0, 10.0, 13.0, 13.0, 12.0, 14.0, 28.0, 19.0, 28.0, 35.0, 37.0, 24.0, 33.0, 35.0, 43.0, 35.0, 41.0, 37.0, 36.0, 42.0, 33.0, 39.0, 38.0, 33.0, 31.0, 30.0, 28.0, 28.0, 14.0, 17.0, 16.0, 14.0, 16.0, 12.0, 17.0, 18.0, 7.0, 5.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0], "bins": [-4.5, -4.3629150390625, -4.225830078125, -4.0887451171875, -3.95166015625, -3.8145751953125, -3.677490234375, -3.5404052734375, -3.4033203125, -3.2662353515625, -3.129150390625, -2.9920654296875, -2.85498046875, -2.7178955078125, -2.580810546875, -2.4437255859375, -2.306640625, -2.1695556640625, -2.032470703125, -1.8953857421875, -1.75830078125, -1.6212158203125, -1.484130859375, -1.3470458984375, -1.2099609375, -1.0728759765625, -0.935791015625, -0.7987060546875, -0.66162109375, -0.5245361328125, -0.387451171875, -0.2503662109375, -0.11328125, 0.0238037109375, 0.160888671875, 0.2979736328125, 0.43505859375, 0.5721435546875, 0.709228515625, 0.8463134765625, 0.9833984375, 1.1204833984375, 1.257568359375, 1.3946533203125, 1.53173828125, 1.6688232421875, 1.805908203125, 1.9429931640625, 2.080078125, 2.2171630859375, 2.354248046875, 2.4913330078125, 2.62841796875, 2.7655029296875, 2.902587890625, 3.0396728515625, 3.1767578125, 3.3138427734375, 3.450927734375, 3.5880126953125, 3.72509765625, 3.8621826171875, 3.999267578125, 4.1363525390625, 4.2734375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 3.0, 4.0, 11.0, 15.0, 23.0, 41.0, 68.0, 114.0, 238.0, 583.0, 1163.0, 3142.0, 11530.0, 91767.0, 3419338.0, 628638.0, 28418.0, 5672.0, 2010.0, 733.0, 347.0, 200.0, 74.0, 44.0, 29.0, 12.0, 20.0, 10.0, 4.0, 6.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-21.171875, -20.544677734375, -19.91748046875, -19.290283203125, -18.6630859375, -18.035888671875, -17.40869140625, -16.781494140625, -16.154296875, -15.527099609375, -14.89990234375, -14.272705078125, -13.6455078125, -13.018310546875, -12.39111328125, -11.763916015625, -11.13671875, -10.509521484375, -9.88232421875, -9.255126953125, -8.6279296875, -8.000732421875, -7.37353515625, -6.746337890625, -6.119140625, -5.491943359375, -4.86474609375, -4.237548828125, -3.6103515625, -2.983154296875, -2.35595703125, -1.728759765625, -1.1015625, -0.474365234375, 0.15283203125, 0.780029296875, 1.4072265625, 2.034423828125, 2.66162109375, 3.288818359375, 3.916015625, 4.543212890625, 5.17041015625, 5.797607421875, 6.4248046875, 7.052001953125, 7.67919921875, 8.306396484375, 8.93359375, 9.560791015625, 10.18798828125, 10.815185546875, 11.4423828125, 12.069580078125, 12.69677734375, 13.323974609375, 13.951171875, 14.578369140625, 15.20556640625, 15.832763671875, 16.4599609375, 17.087158203125, 17.71435546875, 18.341552734375, 18.96875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 7.0, 6.0, 4.0, 10.0, 12.0, 18.0, 27.0, 42.0, 61.0, 94.0, 167.0, 271.0, 473.0, 625.0, 743.0, 567.0, 373.0, 199.0, 122.0, 84.0, 42.0, 35.0, 23.0, 12.0, 14.0, 10.0, 5.0, 5.0, 5.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.140625, -15.68310546875, -15.2255859375, -14.76806640625, -14.310546875, -13.85302734375, -13.3955078125, -12.93798828125, -12.48046875, -12.02294921875, -11.5654296875, -11.10791015625, -10.650390625, -10.19287109375, -9.7353515625, -9.27783203125, -8.8203125, -8.36279296875, -7.9052734375, -7.44775390625, -6.990234375, -6.53271484375, -6.0751953125, -5.61767578125, -5.16015625, -4.70263671875, -4.2451171875, -3.78759765625, -3.330078125, -2.87255859375, -2.4150390625, -1.95751953125, -1.5, -1.04248046875, -0.5849609375, -0.12744140625, 0.330078125, 0.78759765625, 1.2451171875, 1.70263671875, 2.16015625, 2.61767578125, 3.0751953125, 3.53271484375, 3.990234375, 4.44775390625, 4.9052734375, 5.36279296875, 5.8203125, 6.27783203125, 6.7353515625, 7.19287109375, 7.650390625, 8.10791015625, 8.5654296875, 9.02294921875, 9.48046875, 9.93798828125, 10.3955078125, 10.85302734375, 11.310546875, 11.76806640625, 12.2255859375, 12.68310546875, 13.140625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 7.0, 8.0, 15.0, 22.0, 46.0, 109.0, 176.0, 240.0, 156.0, 108.0, 68.0, 25.0, 17.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-189.64208984375, -184.7345428466797, -179.82699584960938, -174.91944885253906, -170.01190185546875, -165.10435485839844, -160.19680786132812, -155.2892608642578, -150.3817138671875, -145.4741668701172, -140.56661987304688, -135.65907287597656, -130.75152587890625, -125.84397888183594, -120.93643188476562, -116.02888488769531, -111.121337890625, -106.21379089355469, -101.30624389648438, -96.39869689941406, -91.49114990234375, -86.58360290527344, -81.67605590820312, -76.76850891113281, -71.8609619140625, -66.95341491699219, -62.045867919921875, -57.13832092285156, -52.23077392578125, -47.32322692871094, -42.415679931640625, -37.50813293457031, -32.60060119628906, -27.69305419921875, -22.785507202148438, -17.877960205078125, -12.970413208007812, -8.0628662109375, -3.1553192138671875, 1.752227783203125, 6.6597747802734375, 11.56732177734375, 16.474868774414062, 21.382415771484375, 26.289962768554688, 31.197509765625, 36.10505676269531, 41.012603759765625, 45.92015075683594, 50.82769775390625, 55.73524475097656, 60.642791748046875, 65.55033874511719, 70.4578857421875, 75.36543273925781, 80.27297973632812, 85.18052673339844, 90.08807373046875, 94.99562072753906, 99.90316772460938, 104.81071472167969, 109.71826171875, 114.62580871582031, 119.53335571289062, 124.44090270996094]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 7.0, 5.0, 15.0, 12.0, 18.0, 22.0, 19.0, 23.0, 25.0, 42.0, 38.0, 46.0, 38.0, 60.0, 55.0, 55.0, 44.0, 43.0, 57.0, 53.0, 58.0, 38.0, 32.0, 43.0, 22.0, 30.0, 16.0, 23.0, 10.0, 17.0, 11.0, 8.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.755088806152344, -54.704044342041016, -52.65299987792969, -50.60195541381836, -48.55091094970703, -46.49986267089844, -44.44881820678711, -42.39777374267578, -40.34672927856445, -38.295684814453125, -36.2446403503418, -34.19359588623047, -32.142547607421875, -30.09150505065918, -28.04045867919922, -25.98941421508789, -23.938369750976562, -21.887325286865234, -19.836280822753906, -17.785234451293945, -15.734189987182617, -13.683145523071289, -11.632100105285645, -9.5810546875, -7.530010223388672, -5.4789652824401855, -3.427920341491699, -1.376875400543213, 0.6741695404052734, 2.7252140045166016, 4.776259422302246, 6.827304840087891, 8.87835693359375, 10.929401397705078, 12.980446815490723, 15.031492233276367, 17.082536697387695, 19.133581161499023, 21.184627532958984, 23.235671997070312, 25.28671646118164, 27.33776092529297, 29.388805389404297, 31.439851760864258, 33.49089813232422, 35.54193878173828, 37.592987060546875, 39.6440315246582, 41.69507598876953, 43.74612045288086, 45.79716491699219, 47.848209381103516, 49.899253845214844, 51.95030212402344, 54.001346588134766, 56.052391052246094, 58.10343551635742, 60.15447998046875, 62.20552444458008, 64.2565689086914, 66.3076171875, 68.35865783691406, 70.40970611572266, 72.46075439453125, 74.51179504394531]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 7.0, 8.0, 11.0, 13.0, 22.0, 41.0, 34.0, 65.0, 109.0, 158.0, 251.0, 505.0, 936.0, 2047.0, 4692.0, 14081.0, 63624.0, 413108.0, 452836.0, 71301.0, 15387.0, 4959.0, 2042.0, 997.0, 510.0, 303.0, 200.0, 98.0, 70.0, 43.0, 36.0, 28.0, 9.0, 5.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.8203125, -11.4512939453125, -11.082275390625, -10.7132568359375, -10.34423828125, -9.9752197265625, -9.606201171875, -9.2371826171875, -8.8681640625, -8.4991455078125, -8.130126953125, -7.7611083984375, -7.39208984375, -7.0230712890625, -6.654052734375, -6.2850341796875, -5.916015625, -5.5469970703125, -5.177978515625, -4.8089599609375, -4.43994140625, -4.0709228515625, -3.701904296875, -3.3328857421875, -2.9638671875, -2.5948486328125, -2.225830078125, -1.8568115234375, -1.48779296875, -1.1187744140625, -0.749755859375, -0.3807373046875, -0.01171875, 0.3572998046875, 0.726318359375, 1.0953369140625, 1.46435546875, 1.8333740234375, 2.202392578125, 2.5714111328125, 2.9404296875, 3.3094482421875, 3.678466796875, 4.0474853515625, 4.41650390625, 4.7855224609375, 5.154541015625, 5.5235595703125, 5.892578125, 6.2615966796875, 6.630615234375, 6.9996337890625, 7.36865234375, 7.7376708984375, 8.106689453125, 8.4757080078125, 8.8447265625, 9.2137451171875, 9.582763671875, 9.9517822265625, 10.32080078125, 10.6898193359375, 11.058837890625, 11.4278564453125, 11.796875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 1.0, 7.0, 8.0, 13.0, 14.0, 15.0, 26.0, 21.0, 19.0, 24.0, 23.0, 35.0, 45.0, 38.0, 38.0, 45.0, 44.0, 52.0, 52.0, 50.0, 35.0, 35.0, 44.0, 38.0, 33.0, 46.0, 34.0, 32.0, 18.0, 27.0, 19.0, 8.0, 14.0, 11.0, 4.0, 5.0, 12.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.796875, -5.61309814453125, -5.4293212890625, -5.24554443359375, -5.061767578125, -4.87799072265625, -4.6942138671875, -4.51043701171875, -4.32666015625, -4.14288330078125, -3.9591064453125, -3.77532958984375, -3.591552734375, -3.40777587890625, -3.2239990234375, -3.04022216796875, -2.8564453125, -2.67266845703125, -2.4888916015625, -2.30511474609375, -2.121337890625, -1.93756103515625, -1.7537841796875, -1.57000732421875, -1.38623046875, -1.20245361328125, -1.0186767578125, -0.83489990234375, -0.651123046875, -0.46734619140625, -0.2835693359375, -0.09979248046875, 0.083984375, 0.26776123046875, 0.4515380859375, 0.63531494140625, 0.819091796875, 1.00286865234375, 1.1866455078125, 1.37042236328125, 1.55419921875, 1.73797607421875, 1.9217529296875, 2.10552978515625, 2.289306640625, 2.47308349609375, 2.6568603515625, 2.84063720703125, 3.0244140625, 3.20819091796875, 3.3919677734375, 3.57574462890625, 3.759521484375, 3.94329833984375, 4.1270751953125, 4.31085205078125, 4.49462890625, 4.67840576171875, 4.8621826171875, 5.04595947265625, 5.229736328125, 5.41351318359375, 5.5972900390625, 5.78106689453125, 5.96484375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 10.0, 11.0, 14.0, 6.0, 20.0, 23.0, 35.0, 52.0, 122.0, 184.0, 320.0, 657.0, 1709.0, 5096.0, 33553.0, 771847.0, 214861.0, 14689.0, 3176.0, 1107.0, 450.0, 223.0, 144.0, 74.0, 52.0, 32.0, 28.0, 20.0, 10.0, 7.0, 4.0, 9.0, 5.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.953125, -24.293212890625, -23.63330078125, -22.973388671875, -22.3134765625, -21.653564453125, -20.99365234375, -20.333740234375, -19.673828125, -19.013916015625, -18.35400390625, -17.694091796875, -17.0341796875, -16.374267578125, -15.71435546875, -15.054443359375, -14.39453125, -13.734619140625, -13.07470703125, -12.414794921875, -11.7548828125, -11.094970703125, -10.43505859375, -9.775146484375, -9.115234375, -8.455322265625, -7.79541015625, -7.135498046875, -6.4755859375, -5.815673828125, -5.15576171875, -4.495849609375, -3.8359375, -3.176025390625, -2.51611328125, -1.856201171875, -1.1962890625, -0.536376953125, 0.12353515625, 0.783447265625, 1.443359375, 2.103271484375, 2.76318359375, 3.423095703125, 4.0830078125, 4.742919921875, 5.40283203125, 6.062744140625, 6.72265625, 7.382568359375, 8.04248046875, 8.702392578125, 9.3623046875, 10.022216796875, 10.68212890625, 11.342041015625, 12.001953125, 12.661865234375, 13.32177734375, 13.981689453125, 14.6416015625, 15.301513671875, 15.96142578125, 16.621337890625, 17.28125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 0.0, 5.0, 5.0, 4.0, 7.0, 15.0, 11.0, 15.0, 20.0, 16.0, 21.0, 32.0, 48.0, 40.0, 48.0, 45.0, 62.0, 61.0, 65.0, 46.0, 49.0, 53.0, 56.0, 42.0, 45.0, 40.0, 30.0, 18.0, 21.0, 19.0, 15.0, 10.0, 10.0, 6.0, 4.0, 8.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.28125, -22.451171875, -21.62109375, -20.791015625, -19.9609375, -19.130859375, -18.30078125, -17.470703125, -16.640625, -15.810546875, -14.98046875, -14.150390625, -13.3203125, -12.490234375, -11.66015625, -10.830078125, -10.0, -9.169921875, -8.33984375, -7.509765625, -6.6796875, -5.849609375, -5.01953125, -4.189453125, -3.359375, -2.529296875, -1.69921875, -0.869140625, -0.0390625, 0.791015625, 1.62109375, 2.451171875, 3.28125, 4.111328125, 4.94140625, 5.771484375, 6.6015625, 7.431640625, 8.26171875, 9.091796875, 9.921875, 10.751953125, 11.58203125, 12.412109375, 13.2421875, 14.072265625, 14.90234375, 15.732421875, 16.5625, 17.392578125, 18.22265625, 19.052734375, 19.8828125, 20.712890625, 21.54296875, 22.373046875, 23.203125, 24.033203125, 24.86328125, 25.693359375, 26.5234375, 27.353515625, 28.18359375, 29.013671875, 29.84375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 8.0, 8.0, 12.0, 21.0, 39.0, 57.0, 90.0, 136.0, 253.0, 483.0, 855.0, 1876.0, 4207.0, 10973.0, 35998.0, 172870.0, 681324.0, 101215.0, 24001.0, 7797.0, 3252.0, 1441.0, 689.0, 371.0, 214.0, 139.0, 72.0, 52.0, 30.0, 21.0, 14.0, 8.0, 8.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-4.75390625, -4.62310791015625, -4.4923095703125, -4.36151123046875, -4.230712890625, -4.09991455078125, -3.9691162109375, -3.83831787109375, -3.70751953125, -3.57672119140625, -3.4459228515625, -3.31512451171875, -3.184326171875, -3.05352783203125, -2.9227294921875, -2.79193115234375, -2.6611328125, -2.53033447265625, -2.3995361328125, -2.26873779296875, -2.137939453125, -2.00714111328125, -1.8763427734375, -1.74554443359375, -1.61474609375, -1.48394775390625, -1.3531494140625, -1.22235107421875, -1.091552734375, -0.96075439453125, -0.8299560546875, -0.69915771484375, -0.568359375, -0.43756103515625, -0.3067626953125, -0.17596435546875, -0.045166015625, 0.08563232421875, 0.2164306640625, 0.34722900390625, 0.47802734375, 0.60882568359375, 0.7396240234375, 0.87042236328125, 1.001220703125, 1.13201904296875, 1.2628173828125, 1.39361572265625, 1.5244140625, 1.65521240234375, 1.7860107421875, 1.91680908203125, 2.047607421875, 2.17840576171875, 2.3092041015625, 2.44000244140625, 2.57080078125, 2.70159912109375, 2.8323974609375, 2.96319580078125, 3.093994140625, 3.22479248046875, 3.3555908203125, 3.48638916015625, 3.6171875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 4.0, 3.0, 10.0, 7.0, 13.0, 15.0, 21.0, 23.0, 43.0, 58.0, 93.0, 130.0, 154.0, 126.0, 95.0, 64.0, 47.0, 26.0, 16.0, 14.0, 11.0, 7.0, 4.0, 2.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015354156494140625, -0.0014865398406982422, -0.0014376640319824219, -0.0013887882232666016, -0.0013399124145507812, -0.001291036605834961, -0.0012421607971191406, -0.0011932849884033203, -0.0011444091796875, -0.0010955333709716797, -0.0010466575622558594, -0.000997781753540039, -0.0009489059448242188, -0.0009000301361083984, -0.0008511543273925781, -0.0008022785186767578, -0.0007534027099609375, -0.0007045269012451172, -0.0006556510925292969, -0.0006067752838134766, -0.0005578994750976562, -0.0005090236663818359, -0.0004601478576660156, -0.0004112720489501953, -0.000362396240234375, -0.0003135204315185547, -0.0002646446228027344, -0.00021576881408691406, -0.00016689300537109375, -0.00011801719665527344, -6.914138793945312e-05, -2.0265579223632812e-05, 2.86102294921875e-05, 7.748603820800781e-05, 0.00012636184692382812, 0.00017523765563964844, 0.00022411346435546875, 0.00027298927307128906, 0.0003218650817871094, 0.0003707408905029297, 0.00041961669921875, 0.0004684925079345703, 0.0005173683166503906, 0.0005662441253662109, 0.0006151199340820312, 0.0006639957427978516, 0.0007128715515136719, 0.0007617473602294922, 0.0008106231689453125, 0.0008594989776611328, 0.0009083747863769531, 0.0009572505950927734, 0.0010061264038085938, 0.001055002212524414, 0.0011038780212402344, 0.0011527538299560547, 0.001201629638671875, 0.0012505054473876953, 0.0012993812561035156, 0.001348257064819336, 0.0013971328735351562, 0.0014460086822509766, 0.0014948844909667969, 0.0015437602996826172, 0.0015926361083984375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 7.0, 9.0, 9.0, 10.0, 19.0, 19.0, 29.0, 36.0, 41.0, 81.0, 118.0, 177.0, 275.0, 474.0, 848.0, 1707.0, 3650.0, 8900.0, 25625.0, 98921.0, 639807.0, 198888.0, 44711.0, 13734.0, 5294.0, 2377.0, 1128.0, 611.0, 358.0, 222.0, 151.0, 101.0, 48.0, 50.0, 34.0, 23.0, 18.0, 16.0, 10.0, 6.0, 6.0, 2.0, 7.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.529296875, -3.406402587890625, -3.28350830078125, -3.160614013671875, -3.0377197265625, -2.914825439453125, -2.79193115234375, -2.669036865234375, -2.546142578125, -2.423248291015625, -2.30035400390625, -2.177459716796875, -2.0545654296875, -1.931671142578125, -1.80877685546875, -1.685882568359375, -1.56298828125, -1.440093994140625, -1.31719970703125, -1.194305419921875, -1.0714111328125, -0.948516845703125, -0.82562255859375, -0.702728271484375, -0.579833984375, -0.456939697265625, -0.33404541015625, -0.211151123046875, -0.0882568359375, 0.034637451171875, 0.15753173828125, 0.280426025390625, 0.4033203125, 0.526214599609375, 0.64910888671875, 0.772003173828125, 0.8948974609375, 1.017791748046875, 1.14068603515625, 1.263580322265625, 1.386474609375, 1.509368896484375, 1.63226318359375, 1.755157470703125, 1.8780517578125, 2.000946044921875, 2.12384033203125, 2.246734619140625, 2.36962890625, 2.492523193359375, 2.61541748046875, 2.738311767578125, 2.8612060546875, 2.984100341796875, 3.10699462890625, 3.229888916015625, 3.352783203125, 3.475677490234375, 3.59857177734375, 3.721466064453125, 3.8443603515625, 3.967254638671875, 4.09014892578125, 4.213043212890625, 4.3359375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 6.0, 5.0, 7.0, 12.0, 20.0, 38.0, 31.0, 46.0, 67.0, 75.0, 95.0, 111.0, 104.0, 92.0, 64.0, 53.0, 37.0, 32.0, 30.0, 14.0, 16.0, 12.0, 11.0, 4.0, 6.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.72265625, -4.5679931640625, -4.413330078125, -4.2586669921875, -4.10400390625, -3.9493408203125, -3.794677734375, -3.6400146484375, -3.4853515625, -3.3306884765625, -3.176025390625, -3.0213623046875, -2.86669921875, -2.7120361328125, -2.557373046875, -2.4027099609375, -2.248046875, -2.0933837890625, -1.938720703125, -1.7840576171875, -1.62939453125, -1.4747314453125, -1.320068359375, -1.1654052734375, -1.0107421875, -0.8560791015625, -0.701416015625, -0.5467529296875, -0.39208984375, -0.2374267578125, -0.082763671875, 0.0718994140625, 0.2265625, 0.3812255859375, 0.535888671875, 0.6905517578125, 0.84521484375, 0.9998779296875, 1.154541015625, 1.3092041015625, 1.4638671875, 1.6185302734375, 1.773193359375, 1.9278564453125, 2.08251953125, 2.2371826171875, 2.391845703125, 2.5465087890625, 2.701171875, 2.8558349609375, 3.010498046875, 3.1651611328125, 3.31982421875, 3.4744873046875, 3.629150390625, 3.7838134765625, 3.9384765625, 4.0931396484375, 4.247802734375, 4.4024658203125, 4.55712890625, 4.7117919921875, 4.866455078125, 5.0211181640625, 5.17578125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 4.0, 9.0, 17.0, 28.0, 45.0, 98.0, 138.0, 313.0, 161.0, 77.0, 51.0, 19.0, 17.0, 3.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-114.1891860961914, -110.57050323486328, -106.95182037353516, -103.33313751220703, -99.71444702148438, -96.09576416015625, -92.47708129882812, -88.8583984375, -85.23971557617188, -81.62103271484375, -78.00234985351562, -74.3836669921875, -70.76498413085938, -67.14630126953125, -63.527610778808594, -59.90892791748047, -56.290245056152344, -52.67156219482422, -49.052879333496094, -45.4341926574707, -41.81550979614258, -38.19682693481445, -34.57814025878906, -30.959457397460938, -27.340774536132812, -23.722091674804688, -20.10340690612793, -16.484722137451172, -12.866039276123047, -9.247356414794922, -5.628671646118164, -2.0099868774414062, 1.60870361328125, 5.227387428283691, 8.846071243286133, 12.464755058288574, 16.083438873291016, 19.70212173461914, 23.3208065032959, 26.939491271972656, 30.55817413330078, 34.176856994628906, 37.79553985595703, 41.41422653198242, 45.03290939331055, 48.65159225463867, 52.27027893066406, 55.88896179199219, 59.50764465332031, 63.12632751464844, 66.74501037597656, 70.36369323730469, 73.98237609863281, 77.60105895996094, 81.2197494506836, 84.83843231201172, 88.45711517333984, 92.07579803466797, 95.6944808959961, 99.31316375732422, 102.93185424804688, 106.550537109375, 110.16921997070312, 113.78790283203125, 117.40658569335938]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 3.0, 7.0, 7.0, 8.0, 14.0, 11.0, 19.0, 14.0, 28.0, 27.0, 29.0, 24.0, 31.0, 36.0, 39.0, 48.0, 49.0, 77.0, 96.0, 80.0, 46.0, 41.0, 32.0, 40.0, 26.0, 30.0, 19.0, 14.0, 21.0, 20.0, 11.0, 13.0, 11.0, 7.0, 9.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-89.75408935546875, -87.13092803955078, -84.50776672363281, -81.88459777832031, -79.26143646240234, -76.63827514648438, -74.0151138305664, -71.39195251464844, -68.76878356933594, -66.14562225341797, -63.522457122802734, -60.899295806884766, -58.27613067626953, -55.65296936035156, -53.029808044433594, -50.406646728515625, -47.783485412597656, -45.16032409667969, -42.53715896606445, -39.913997650146484, -37.29083251953125, -34.66767120361328, -32.04450988769531, -29.42134666442871, -26.79818344116211, -24.175020217895508, -21.551856994628906, -18.928695678710938, -16.305532455444336, -13.682369232177734, -11.05920696258545, -8.436044692993164, -5.8128814697265625, -3.189718723297119, -0.5665559768676758, 2.0566067695617676, 4.679769515991211, 7.3029327392578125, 9.926095008850098, 12.549257278442383, 15.172420501708984, 17.795583724975586, 20.418746948242188, 23.041908264160156, 25.665071487426758, 28.28823471069336, 30.911396026611328, 33.53456115722656, 36.15772247314453, 38.7808837890625, 41.404048919677734, 44.0272102355957, 46.65037536621094, 49.273536682128906, 51.896697998046875, 54.519859313964844, 57.14302444458008, 59.76618576049805, 62.38935089111328, 65.01251220703125, 67.63567352294922, 70.25883483886719, 72.88200378417969, 75.50516510009766, 78.12832641601562]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 8.0, 10.0, 15.0, 32.0, 42.0, 73.0, 112.0, 170.0, 211.0, 337.0, 522.0, 830.0, 1378.0, 2484.0, 5197.0, 14273.0, 64472.0, 497567.0, 2526202.0, 932303.0, 114282.0, 20102.0, 6331.0, 2952.0, 1570.0, 927.0, 634.0, 383.0, 277.0, 176.0, 129.0, 70.0, 52.0, 55.0, 29.0, 9.0, 20.0, 15.0, 9.0, 6.0, 3.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.20703125, -6.93658447265625, -6.6661376953125, -6.39569091796875, -6.125244140625, -5.85479736328125, -5.5843505859375, -5.31390380859375, -5.04345703125, -4.77301025390625, -4.5025634765625, -4.23211669921875, -3.961669921875, -3.69122314453125, -3.4207763671875, -3.15032958984375, -2.8798828125, -2.60943603515625, -2.3389892578125, -2.06854248046875, -1.798095703125, -1.52764892578125, -1.2572021484375, -0.98675537109375, -0.71630859375, -0.44586181640625, -0.1754150390625, 0.09503173828125, 0.365478515625, 0.63592529296875, 0.9063720703125, 1.17681884765625, 1.447265625, 1.71771240234375, 1.9881591796875, 2.25860595703125, 2.529052734375, 2.79949951171875, 3.0699462890625, 3.34039306640625, 3.61083984375, 3.88128662109375, 4.1517333984375, 4.42218017578125, 4.692626953125, 4.96307373046875, 5.2335205078125, 5.50396728515625, 5.7744140625, 6.04486083984375, 6.3153076171875, 6.58575439453125, 6.856201171875, 7.12664794921875, 7.3970947265625, 7.66754150390625, 7.93798828125, 8.20843505859375, 8.4788818359375, 8.74932861328125, 9.019775390625, 9.29022216796875, 9.5606689453125, 9.83111572265625, 10.1015625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 6.0, 3.0, 8.0, 6.0, 14.0, 9.0, 14.0, 14.0, 20.0, 21.0, 20.0, 18.0, 16.0, 29.0, 32.0, 27.0, 36.0, 35.0, 42.0, 34.0, 37.0, 43.0, 42.0, 42.0, 44.0, 37.0, 39.0, 40.0, 31.0, 30.0, 28.0, 29.0, 23.0, 19.0, 17.0, 22.0, 18.0, 14.0, 8.0, 10.0, 3.0, 4.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0], "bins": [-5.10546875, -4.95501708984375, -4.8045654296875, -4.65411376953125, -4.503662109375, -4.35321044921875, -4.2027587890625, -4.05230712890625, -3.90185546875, -3.75140380859375, -3.6009521484375, -3.45050048828125, -3.300048828125, -3.14959716796875, -2.9991455078125, -2.84869384765625, -2.6982421875, -2.54779052734375, -2.3973388671875, -2.24688720703125, -2.096435546875, -1.94598388671875, -1.7955322265625, -1.64508056640625, -1.49462890625, -1.34417724609375, -1.1937255859375, -1.04327392578125, -0.892822265625, -0.74237060546875, -0.5919189453125, -0.44146728515625, -0.291015625, -0.14056396484375, 0.0098876953125, 0.16033935546875, 0.310791015625, 0.46124267578125, 0.6116943359375, 0.76214599609375, 0.91259765625, 1.06304931640625, 1.2135009765625, 1.36395263671875, 1.514404296875, 1.66485595703125, 1.8153076171875, 1.96575927734375, 2.1162109375, 2.26666259765625, 2.4171142578125, 2.56756591796875, 2.718017578125, 2.86846923828125, 3.0189208984375, 3.16937255859375, 3.31982421875, 3.47027587890625, 3.6207275390625, 3.77117919921875, 3.921630859375, 4.07208251953125, 4.2225341796875, 4.37298583984375, 4.5234375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 4.0, 6.0, 4.0, 4.0, 7.0, 15.0, 21.0, 28.0, 43.0, 88.0, 163.0, 310.0, 698.0, 1660.0, 5367.0, 24650.0, 468471.0, 3553073.0, 120796.0, 13172.0, 3436.0, 1217.0, 500.0, 245.0, 120.0, 69.0, 41.0, 20.0, 12.0, 12.0, 10.0, 6.0, 7.0, 7.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.109375, -16.52587890625, -15.9423828125, -15.35888671875, -14.775390625, -14.19189453125, -13.6083984375, -13.02490234375, -12.44140625, -11.85791015625, -11.2744140625, -10.69091796875, -10.107421875, -9.52392578125, -8.9404296875, -8.35693359375, -7.7734375, -7.18994140625, -6.6064453125, -6.02294921875, -5.439453125, -4.85595703125, -4.2724609375, -3.68896484375, -3.10546875, -2.52197265625, -1.9384765625, -1.35498046875, -0.771484375, -0.18798828125, 0.3955078125, 0.97900390625, 1.5625, 2.14599609375, 2.7294921875, 3.31298828125, 3.896484375, 4.47998046875, 5.0634765625, 5.64697265625, 6.23046875, 6.81396484375, 7.3974609375, 7.98095703125, 8.564453125, 9.14794921875, 9.7314453125, 10.31494140625, 10.8984375, 11.48193359375, 12.0654296875, 12.64892578125, 13.232421875, 13.81591796875, 14.3994140625, 14.98291015625, 15.56640625, 16.14990234375, 16.7333984375, 17.31689453125, 17.900390625, 18.48388671875, 19.0673828125, 19.65087890625, 20.234375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 1.0, 6.0, 6.0, 5.0, 8.0, 9.0, 16.0, 26.0, 50.0, 72.0, 123.0, 248.0, 432.0, 704.0, 878.0, 611.0, 405.0, 195.0, 122.0, 57.0, 29.0, 25.0, 13.0, 10.0, 5.0, 8.0, 3.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.75, -13.185791015625, -12.62158203125, -12.057373046875, -11.4931640625, -10.928955078125, -10.36474609375, -9.800537109375, -9.236328125, -8.672119140625, -8.10791015625, -7.543701171875, -6.9794921875, -6.415283203125, -5.85107421875, -5.286865234375, -4.72265625, -4.158447265625, -3.59423828125, -3.030029296875, -2.4658203125, -1.901611328125, -1.33740234375, -0.773193359375, -0.208984375, 0.355224609375, 0.91943359375, 1.483642578125, 2.0478515625, 2.612060546875, 3.17626953125, 3.740478515625, 4.3046875, 4.868896484375, 5.43310546875, 5.997314453125, 6.5615234375, 7.125732421875, 7.68994140625, 8.254150390625, 8.818359375, 9.382568359375, 9.94677734375, 10.510986328125, 11.0751953125, 11.639404296875, 12.20361328125, 12.767822265625, 13.33203125, 13.896240234375, 14.46044921875, 15.024658203125, 15.5888671875, 16.153076171875, 16.71728515625, 17.281494140625, 17.845703125, 18.409912109375, 18.97412109375, 19.538330078125, 20.1025390625, 20.666748046875, 21.23095703125, 21.795166015625, 22.359375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 9.0, 8.0, 29.0, 37.0, 109.0, 154.0, 220.0, 213.0, 105.0, 58.0, 27.0, 11.0, 6.0, 6.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-207.4503173828125, -202.70236206054688, -197.95440673828125, -193.2064666748047, -188.45851135253906, -183.71055603027344, -178.96261596679688, -174.21466064453125, -169.46670532226562, -164.71875, -159.97079467773438, -155.2228546142578, -150.4748992919922, -145.72694396972656, -140.97900390625, -136.23104858398438, -131.48309326171875, -126.73513793945312, -121.98719024658203, -117.23924255371094, -112.49128723144531, -107.74333190917969, -102.9953842163086, -98.2474365234375, -93.49948120117188, -88.75152587890625, -84.00357818603516, -79.25563049316406, -74.50767517089844, -69.75971984863281, -65.01177215576172, -60.26382064819336, -55.515869140625, -50.76791763305664, -46.01996612548828, -41.27201461791992, -36.52406311035156, -31.776111602783203, -27.028160095214844, -22.280208587646484, -17.532257080078125, -12.784305572509766, -8.036354064941406, -3.288402557373047, 1.4595489501953125, 6.207500457763672, 10.955451965332031, 15.70340347290039, 20.45135498046875, 25.19930648803711, 29.94725799560547, 34.69520950317383, 39.44316101074219, 44.19111251831055, 48.939064025878906, 53.687015533447266, 58.434967041015625, 63.182918548583984, 67.93087005615234, 72.67881774902344, 77.42677307128906, 82.17472839355469, 86.92267608642578, 91.67062377929688, 96.4185791015625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 5.0, 9.0, 6.0, 8.0, 12.0, 8.0, 7.0, 10.0, 20.0, 18.0, 22.0, 34.0, 30.0, 30.0, 52.0, 46.0, 46.0, 45.0, 58.0, 38.0, 44.0, 56.0, 46.0, 42.0, 45.0, 38.0, 37.0, 28.0, 28.0, 28.0, 17.0, 11.0, 14.0, 8.0, 15.0, 11.0, 6.0, 7.0, 4.0, 7.0, 0.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-61.771026611328125, -59.89614486694336, -58.021263122558594, -56.14638137817383, -54.27149963378906, -52.39661407470703, -50.52173614501953, -48.6468505859375, -46.771968841552734, -44.89708709716797, -43.0222053527832, -41.14732360839844, -39.27244186401367, -37.397560119628906, -35.522674560546875, -33.64779281616211, -31.772912979125977, -29.89803123474121, -28.023149490356445, -26.148265838623047, -24.27338409423828, -22.398502349853516, -20.52362060546875, -18.648738861083984, -16.77385711669922, -14.898975372314453, -13.024092674255371, -11.149210929870605, -9.274328231811523, -7.399446487426758, -5.524564743041992, -3.64968204498291, -1.7747993469238281, 0.10008275508880615, 1.9749648571014404, 3.849846839904785, 5.724729061126709, 7.599611282348633, 9.474493026733398, 11.34937572479248, 13.224257469177246, 15.099139213562012, 16.974021911621094, 18.84890365600586, 20.723785400390625, 22.59866714477539, 24.473548889160156, 26.348432540893555, 28.22331428527832, 30.098196029663086, 31.97307777404785, 33.84796142578125, 35.722843170166016, 37.59772491455078, 39.47260665893555, 41.34748840332031, 43.22237014770508, 45.097251892089844, 46.97213363647461, 48.847015380859375, 50.72189712524414, 52.596778869628906, 54.47166442871094, 56.3465461730957, 58.22142791748047]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 8.0, 7.0, 8.0, 22.0, 24.0, 27.0, 62.0, 81.0, 150.0, 211.0, 334.0, 571.0, 1127.0, 2251.0, 5414.0, 14749.0, 50452.0, 240329.0, 547155.0, 135177.0, 32180.0, 10414.0, 3942.0, 1732.0, 879.0, 504.0, 245.0, 149.0, 116.0, 64.0, 58.0, 26.0, 30.0, 19.0, 19.0, 3.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.078125, -9.7093505859375, -9.340576171875, -8.9718017578125, -8.60302734375, -8.2342529296875, -7.865478515625, -7.4967041015625, -7.1279296875, -6.7591552734375, -6.390380859375, -6.0216064453125, -5.65283203125, -5.2840576171875, -4.915283203125, -4.5465087890625, -4.177734375, -3.8089599609375, -3.440185546875, -3.0714111328125, -2.70263671875, -2.3338623046875, -1.965087890625, -1.5963134765625, -1.2275390625, -0.8587646484375, -0.489990234375, -0.1212158203125, 0.24755859375, 0.6163330078125, 0.985107421875, 1.3538818359375, 1.72265625, 2.0914306640625, 2.460205078125, 2.8289794921875, 3.19775390625, 3.5665283203125, 3.935302734375, 4.3040771484375, 4.6728515625, 5.0416259765625, 5.410400390625, 5.7791748046875, 6.14794921875, 6.5167236328125, 6.885498046875, 7.2542724609375, 7.623046875, 7.9918212890625, 8.360595703125, 8.7293701171875, 9.09814453125, 9.4669189453125, 9.835693359375, 10.2044677734375, 10.5732421875, 10.9420166015625, 11.310791015625, 11.6795654296875, 12.04833984375, 12.4171142578125, 12.785888671875, 13.1546630859375, 13.5234375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 0.0, 3.0, 4.0, 13.0, 5.0, 12.0, 6.0, 11.0, 15.0, 20.0, 24.0, 24.0, 23.0, 27.0, 24.0, 42.0, 29.0, 34.0, 48.0, 51.0, 31.0, 43.0, 44.0, 33.0, 34.0, 39.0, 31.0, 32.0, 40.0, 26.0, 29.0, 35.0, 21.0, 18.0, 19.0, 21.0, 11.0, 8.0, 15.0, 11.0, 10.0, 9.0, 5.0, 3.0, 5.0, 4.0, 1.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-5.37890625, -5.2132568359375, -5.047607421875, -4.8819580078125, -4.71630859375, -4.5506591796875, -4.385009765625, -4.2193603515625, -4.0537109375, -3.8880615234375, -3.722412109375, -3.5567626953125, -3.39111328125, -3.2254638671875, -3.059814453125, -2.8941650390625, -2.728515625, -2.5628662109375, -2.397216796875, -2.2315673828125, -2.06591796875, -1.9002685546875, -1.734619140625, -1.5689697265625, -1.4033203125, -1.2376708984375, -1.072021484375, -0.9063720703125, -0.74072265625, -0.5750732421875, -0.409423828125, -0.2437744140625, -0.078125, 0.0875244140625, 0.253173828125, 0.4188232421875, 0.58447265625, 0.7501220703125, 0.915771484375, 1.0814208984375, 1.2470703125, 1.4127197265625, 1.578369140625, 1.7440185546875, 1.90966796875, 2.0753173828125, 2.240966796875, 2.4066162109375, 2.572265625, 2.7379150390625, 2.903564453125, 3.0692138671875, 3.23486328125, 3.4005126953125, 3.566162109375, 3.7318115234375, 3.8974609375, 4.0631103515625, 4.228759765625, 4.3944091796875, 4.56005859375, 4.7257080078125, 4.891357421875, 5.0570068359375, 5.22265625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 5.0, 3.0, 8.0, 15.0, 21.0, 22.0, 24.0, 36.0, 52.0, 91.0, 148.0, 205.0, 392.0, 684.0, 1345.0, 3041.0, 9112.0, 41949.0, 682019.0, 267833.0, 29159.0, 7227.0, 2548.0, 1078.0, 621.0, 296.0, 203.0, 123.0, 80.0, 66.0, 40.0, 21.0, 24.0, 13.0, 10.0, 13.0, 6.0, 3.0, 6.0, 5.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.0, -16.467041015625, -15.93408203125, -15.401123046875, -14.8681640625, -14.335205078125, -13.80224609375, -13.269287109375, -12.736328125, -12.203369140625, -11.67041015625, -11.137451171875, -10.6044921875, -10.071533203125, -9.53857421875, -9.005615234375, -8.47265625, -7.939697265625, -7.40673828125, -6.873779296875, -6.3408203125, -5.807861328125, -5.27490234375, -4.741943359375, -4.208984375, -3.676025390625, -3.14306640625, -2.610107421875, -2.0771484375, -1.544189453125, -1.01123046875, -0.478271484375, 0.0546875, 0.587646484375, 1.12060546875, 1.653564453125, 2.1865234375, 2.719482421875, 3.25244140625, 3.785400390625, 4.318359375, 4.851318359375, 5.38427734375, 5.917236328125, 6.4501953125, 6.983154296875, 7.51611328125, 8.049072265625, 8.58203125, 9.114990234375, 9.64794921875, 10.180908203125, 10.7138671875, 11.246826171875, 11.77978515625, 12.312744140625, 12.845703125, 13.378662109375, 13.91162109375, 14.444580078125, 14.9775390625, 15.510498046875, 16.04345703125, 16.576416015625, 17.109375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 5.0, 8.0, 4.0, 9.0, 7.0, 13.0, 14.0, 20.0, 16.0, 13.0, 34.0, 35.0, 41.0, 41.0, 42.0, 74.0, 65.0, 73.0, 60.0, 38.0, 57.0, 54.0, 44.0, 45.0, 36.0, 26.0, 29.0, 16.0, 17.0, 16.0, 15.0, 6.0, 8.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.109375, -24.284912109375, -23.46044921875, -22.635986328125, -21.8115234375, -20.987060546875, -20.16259765625, -19.338134765625, -18.513671875, -17.689208984375, -16.86474609375, -16.040283203125, -15.2158203125, -14.391357421875, -13.56689453125, -12.742431640625, -11.91796875, -11.093505859375, -10.26904296875, -9.444580078125, -8.6201171875, -7.795654296875, -6.97119140625, -6.146728515625, -5.322265625, -4.497802734375, -3.67333984375, -2.848876953125, -2.0244140625, -1.199951171875, -0.37548828125, 0.448974609375, 1.2734375, 2.097900390625, 2.92236328125, 3.746826171875, 4.5712890625, 5.395751953125, 6.22021484375, 7.044677734375, 7.869140625, 8.693603515625, 9.51806640625, 10.342529296875, 11.1669921875, 11.991455078125, 12.81591796875, 13.640380859375, 14.46484375, 15.289306640625, 16.11376953125, 16.938232421875, 17.7626953125, 18.587158203125, 19.41162109375, 20.236083984375, 21.060546875, 21.885009765625, 22.70947265625, 23.533935546875, 24.3583984375, 25.182861328125, 26.00732421875, 26.831787109375, 27.65625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 3.0, 4.0, 9.0, 11.0, 16.0, 20.0, 37.0, 53.0, 83.0, 152.0, 252.0, 435.0, 1061.0, 2349.0, 6800.0, 24057.0, 120552.0, 747297.0, 111670.0, 22797.0, 6544.0, 2367.0, 997.0, 430.0, 223.0, 122.0, 78.0, 43.0, 27.0, 19.0, 14.0, 11.0, 7.0, 3.0, 3.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.25, -4.126739501953125, -4.00347900390625, -3.880218505859375, -3.7569580078125, -3.633697509765625, -3.51043701171875, -3.387176513671875, -3.263916015625, -3.140655517578125, -3.01739501953125, -2.894134521484375, -2.7708740234375, -2.647613525390625, -2.52435302734375, -2.401092529296875, -2.27783203125, -2.154571533203125, -2.03131103515625, -1.908050537109375, -1.7847900390625, -1.661529541015625, -1.53826904296875, -1.415008544921875, -1.291748046875, -1.168487548828125, -1.04522705078125, -0.921966552734375, -0.7987060546875, -0.675445556640625, -0.55218505859375, -0.428924560546875, -0.3056640625, -0.182403564453125, -0.05914306640625, 0.064117431640625, 0.1873779296875, 0.310638427734375, 0.43389892578125, 0.557159423828125, 0.680419921875, 0.803680419921875, 0.92694091796875, 1.050201416015625, 1.1734619140625, 1.296722412109375, 1.41998291015625, 1.543243408203125, 1.66650390625, 1.789764404296875, 1.91302490234375, 2.036285400390625, 2.1595458984375, 2.282806396484375, 2.40606689453125, 2.529327392578125, 2.652587890625, 2.775848388671875, 2.89910888671875, 3.022369384765625, 3.1456298828125, 3.268890380859375, 3.39215087890625, 3.515411376953125, 3.638671875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 12.0, 7.0, 17.0, 17.0, 32.0, 56.0, 76.0, 181.0, 223.0, 154.0, 78.0, 53.0, 36.0, 22.0, 13.0, 5.0, 2.0, 4.0, 0.0, 2.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.003055572509765625, -0.0029868781566619873, -0.0029181838035583496, -0.002849489450454712, -0.0027807950973510742, -0.0027121007442474365, -0.002643406391143799, -0.002574712038040161, -0.0025060176849365234, -0.0024373233318328857, -0.002368628978729248, -0.0022999346256256104, -0.0022312402725219727, -0.002162545919418335, -0.0020938515663146973, -0.0020251572132110596, -0.001956462860107422, -0.0018877685070037842, -0.0018190741539001465, -0.0017503798007965088, -0.001681685447692871, -0.0016129910945892334, -0.0015442967414855957, -0.001475602388381958, -0.0014069080352783203, -0.0013382136821746826, -0.001269519329071045, -0.0012008249759674072, -0.0011321306228637695, -0.0010634362697601318, -0.0009947419166564941, -0.0009260475635528564, -0.0008573532104492188, -0.0007886588573455811, -0.0007199645042419434, -0.0006512701511383057, -0.000582575798034668, -0.0005138814449310303, -0.0004451870918273926, -0.0003764927387237549, -0.0003077983856201172, -0.0002391040325164795, -0.0001704096794128418, -0.0001017153263092041, -3.3020973205566406e-05, 3.567337989807129e-05, 0.00010436773300170898, 0.00017306208610534668, 0.00024175643920898438, 0.00031045079231262207, 0.00037914514541625977, 0.00044783949851989746, 0.0005165338516235352, 0.0005852282047271729, 0.0006539225578308105, 0.0007226169109344482, 0.0007913112640380859, 0.0008600056171417236, 0.0009286999702453613, 0.000997394323348999, 0.0010660886764526367, 0.0011347830295562744, 0.0012034773826599121, 0.0012721717357635498, 0.0013408660888671875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 9.0, 10.0, 5.0, 13.0, 21.0, 44.0, 57.0, 121.0, 188.0, 361.0, 613.0, 1162.0, 2749.0, 8040.0, 29845.0, 135788.0, 703271.0, 125623.0, 27800.0, 7549.0, 2738.0, 1172.0, 564.0, 357.0, 184.0, 104.0, 56.0, 32.0, 20.0, 27.0, 13.0, 5.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.638671875, -2.526275634765625, -2.41387939453125, -2.301483154296875, -2.1890869140625, -2.076690673828125, -1.96429443359375, -1.851898193359375, -1.739501953125, -1.627105712890625, -1.51470947265625, -1.402313232421875, -1.2899169921875, -1.177520751953125, -1.06512451171875, -0.952728271484375, -0.84033203125, -0.727935791015625, -0.61553955078125, -0.503143310546875, -0.3907470703125, -0.278350830078125, -0.16595458984375, -0.053558349609375, 0.058837890625, 0.171234130859375, 0.28363037109375, 0.396026611328125, 0.5084228515625, 0.620819091796875, 0.73321533203125, 0.845611572265625, 0.9580078125, 1.070404052734375, 1.18280029296875, 1.295196533203125, 1.4075927734375, 1.519989013671875, 1.63238525390625, 1.744781494140625, 1.857177734375, 1.969573974609375, 2.08197021484375, 2.194366455078125, 2.3067626953125, 2.419158935546875, 2.53155517578125, 2.643951416015625, 2.75634765625, 2.868743896484375, 2.98114013671875, 3.093536376953125, 3.2059326171875, 3.318328857421875, 3.43072509765625, 3.543121337890625, 3.655517578125, 3.767913818359375, 3.88031005859375, 3.992706298828125, 4.1051025390625, 4.217498779296875, 4.32989501953125, 4.442291259765625, 4.5546875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 8.0, 12.0, 6.0, 16.0, 12.0, 27.0, 31.0, 47.0, 61.0, 51.0, 81.0, 109.0, 122.0, 93.0, 58.0, 59.0, 46.0, 39.0, 31.0, 23.0, 14.0, 10.0, 10.0, 6.0, 6.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3671875, -4.2265625, -4.0859375, -3.9453125, -3.8046875, -3.6640625, -3.5234375, -3.3828125, -3.2421875, -3.1015625, -2.9609375, -2.8203125, -2.6796875, -2.5390625, -2.3984375, -2.2578125, -2.1171875, -1.9765625, -1.8359375, -1.6953125, -1.5546875, -1.4140625, -1.2734375, -1.1328125, -0.9921875, -0.8515625, -0.7109375, -0.5703125, -0.4296875, -0.2890625, -0.1484375, -0.0078125, 0.1328125, 0.2734375, 0.4140625, 0.5546875, 0.6953125, 0.8359375, 0.9765625, 1.1171875, 1.2578125, 1.3984375, 1.5390625, 1.6796875, 1.8203125, 1.9609375, 2.1015625, 2.2421875, 2.3828125, 2.5234375, 2.6640625, 2.8046875, 2.9453125, 3.0859375, 3.2265625, 3.3671875, 3.5078125, 3.6484375, 3.7890625, 3.9296875, 4.0703125, 4.2109375, 4.3515625, 4.4921875, 4.6328125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 18.0, 41.0, 107.0, 235.0, 386.0, 126.0, 46.0, 17.0, 10.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-167.78106689453125, -162.02047729492188, -156.2598876953125, -150.49929809570312, -144.73870849609375, -138.97811889648438, -133.217529296875, -127.45693969726562, -121.69635009765625, -115.93576049804688, -110.1751708984375, -104.41458129882812, -98.65399169921875, -92.89340209960938, -87.1328125, -81.37222290039062, -75.61162567138672, -69.85103607177734, -64.09044647216797, -58.329856872558594, -52.56926727294922, -46.808677673339844, -41.0480842590332, -35.28749465942383, -29.526905059814453, -23.766315460205078, -18.005725860595703, -12.245134353637695, -6.48454475402832, -0.7239551544189453, 5.0366363525390625, 10.797225952148438, 16.557815551757812, 22.318405151367188, 28.078994750976562, 33.83958435058594, 39.60017395019531, 45.36076354980469, 51.12135696411133, 56.8819465637207, 62.64253616333008, 68.40312957763672, 74.1637191772461, 79.92430877685547, 85.68489837646484, 91.44548797607422, 97.2060775756836, 102.96666717529297, 108.72725677490234, 114.48784637451172, 120.2484359741211, 126.00902557373047, 131.76962280273438, 137.53021240234375, 143.29080200195312, 149.0513916015625, 154.81198120117188, 160.57257080078125, 166.33316040039062, 172.09375, 177.85433959960938, 183.61492919921875, 189.37551879882812, 195.1361083984375, 200.89669799804688]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 8.0, 7.0, 6.0, 12.0, 24.0, 23.0, 21.0, 27.0, 20.0, 28.0, 33.0, 37.0, 61.0, 132.0, 170.0, 71.0, 51.0, 47.0, 38.0, 24.0, 35.0, 29.0, 22.0, 16.0, 14.0, 9.0, 8.0, 4.0, 9.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.37966918945312, -93.93621826171875, -90.49276733398438, -87.04931640625, -83.60586547851562, -80.16241455078125, -76.71895599365234, -73.27550506591797, -69.8320541381836, -66.38860321044922, -62.945152282714844, -59.5016975402832, -56.05824661254883, -52.61479568481445, -49.17134094238281, -45.72789001464844, -42.28443908691406, -38.84098815917969, -35.39753723144531, -31.954082489013672, -28.510631561279297, -25.067180633544922, -21.623727798461914, -18.180274963378906, -14.736824035644531, -11.29337215423584, -7.849920272827148, -4.406468391418457, -0.9630165100097656, 2.4804344177246094, 5.923887252807617, 9.367340087890625, 12.810791015625, 16.254241943359375, 19.697694778442383, 23.14114761352539, 26.584598541259766, 30.02804946899414, 33.47150421142578, 36.914955139160156, 40.35840606689453, 43.801856994628906, 47.24530792236328, 50.68876266479492, 54.1322135925293, 57.57566452026367, 61.01911926269531, 64.46257019042969, 67.90602111816406, 71.34947204589844, 74.79292297363281, 78.23637390136719, 81.67982482910156, 85.12327575683594, 88.56673431396484, 92.01018524169922, 95.4536361694336, 98.89708709716797, 102.34053802490234, 105.78398895263672, 109.22744750976562, 112.6708984375, 116.11434936523438, 119.55780029296875, 123.00125122070312]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 5.0, 6.0, 11.0, 14.0, 19.0, 28.0, 31.0, 45.0, 80.0, 112.0, 170.0, 219.0, 337.0, 496.0, 801.0, 1391.0, 2310.0, 4275.0, 8819.0, 21158.0, 63062.0, 234237.0, 859016.0, 1759419.0, 886389.0, 246259.0, 64431.0, 21317.0, 9111.0, 4351.0, 2402.0, 1402.0, 909.0, 547.0, 339.0, 233.0, 154.0, 117.0, 54.0, 51.0, 44.0, 27.0, 17.0, 13.0, 17.0, 11.0, 9.0, 6.0, 3.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.9609375, -7.7000732421875, -7.439208984375, -7.1783447265625, -6.91748046875, -6.6566162109375, -6.395751953125, -6.1348876953125, -5.8740234375, -5.6131591796875, -5.352294921875, -5.0914306640625, -4.83056640625, -4.5697021484375, -4.308837890625, -4.0479736328125, -3.787109375, -3.5262451171875, -3.265380859375, -3.0045166015625, -2.74365234375, -2.4827880859375, -2.221923828125, -1.9610595703125, -1.7001953125, -1.4393310546875, -1.178466796875, -0.9176025390625, -0.65673828125, -0.3958740234375, -0.135009765625, 0.1258544921875, 0.38671875, 0.6475830078125, 0.908447265625, 1.1693115234375, 1.43017578125, 1.6910400390625, 1.951904296875, 2.2127685546875, 2.4736328125, 2.7344970703125, 2.995361328125, 3.2562255859375, 3.51708984375, 3.7779541015625, 4.038818359375, 4.2996826171875, 4.560546875, 4.8214111328125, 5.082275390625, 5.3431396484375, 5.60400390625, 5.8648681640625, 6.125732421875, 6.3865966796875, 6.6474609375, 6.9083251953125, 7.169189453125, 7.4300537109375, 7.69091796875, 7.9517822265625, 8.212646484375, 8.4735107421875, 8.734375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 4.0, 5.0, 1.0, 5.0, 2.0, 5.0, 7.0, 9.0, 7.0, 13.0, 13.0, 26.0, 20.0, 21.0, 26.0, 24.0, 32.0, 27.0, 29.0, 27.0, 27.0, 29.0, 41.0, 38.0, 50.0, 52.0, 46.0, 45.0, 48.0, 30.0, 42.0, 40.0, 22.0, 35.0, 31.0, 22.0, 18.0, 15.0, 15.0, 12.0, 10.0, 10.0, 9.0, 9.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.83203125, -4.65838623046875, -4.4847412109375, -4.31109619140625, -4.137451171875, -3.96380615234375, -3.7901611328125, -3.61651611328125, -3.44287109375, -3.26922607421875, -3.0955810546875, -2.92193603515625, -2.748291015625, -2.57464599609375, -2.4010009765625, -2.22735595703125, -2.0537109375, -1.88006591796875, -1.7064208984375, -1.53277587890625, -1.359130859375, -1.18548583984375, -1.0118408203125, -0.83819580078125, -0.66455078125, -0.49090576171875, -0.3172607421875, -0.14361572265625, 0.030029296875, 0.20367431640625, 0.3773193359375, 0.55096435546875, 0.724609375, 0.89825439453125, 1.0718994140625, 1.24554443359375, 1.419189453125, 1.59283447265625, 1.7664794921875, 1.94012451171875, 2.11376953125, 2.28741455078125, 2.4610595703125, 2.63470458984375, 2.808349609375, 2.98199462890625, 3.1556396484375, 3.32928466796875, 3.5029296875, 3.67657470703125, 3.8502197265625, 4.02386474609375, 4.197509765625, 4.37115478515625, 4.5447998046875, 4.71844482421875, 4.89208984375, 5.06573486328125, 5.2393798828125, 5.41302490234375, 5.586669921875, 5.76031494140625, 5.9339599609375, 6.10760498046875, 6.28125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 4.0, 4.0, 8.0, 10.0, 16.0, 21.0, 26.0, 43.0, 74.0, 104.0, 205.0, 428.0, 895.0, 2505.0, 12052.0, 373561.0, 3751908.0, 44666.0, 4991.0, 1469.0, 607.0, 281.0, 150.0, 92.0, 54.0, 35.0, 23.0, 10.0, 10.0, 14.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-41.6875, -40.47021484375, -39.2529296875, -38.03564453125, -36.818359375, -35.60107421875, -34.3837890625, -33.16650390625, -31.94921875, -30.73193359375, -29.5146484375, -28.29736328125, -27.080078125, -25.86279296875, -24.6455078125, -23.42822265625, -22.2109375, -20.99365234375, -19.7763671875, -18.55908203125, -17.341796875, -16.12451171875, -14.9072265625, -13.68994140625, -12.47265625, -11.25537109375, -10.0380859375, -8.82080078125, -7.603515625, -6.38623046875, -5.1689453125, -3.95166015625, -2.734375, -1.51708984375, -0.2998046875, 0.91748046875, 2.134765625, 3.35205078125, 4.5693359375, 5.78662109375, 7.00390625, 8.22119140625, 9.4384765625, 10.65576171875, 11.873046875, 13.09033203125, 14.3076171875, 15.52490234375, 16.7421875, 17.95947265625, 19.1767578125, 20.39404296875, 21.611328125, 22.82861328125, 24.0458984375, 25.26318359375, 26.48046875, 27.69775390625, 28.9150390625, 30.13232421875, 31.349609375, 32.56689453125, 33.7841796875, 35.00146484375, 36.21875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 7.0, 3.0, 8.0, 9.0, 16.0, 26.0, 27.0, 31.0, 57.0, 61.0, 92.0, 121.0, 172.0, 214.0, 296.0, 399.0, 450.0, 476.0, 380.0, 313.0, 209.0, 154.0, 146.0, 107.0, 56.0, 63.0, 35.0, 33.0, 25.0, 19.0, 11.0, 13.0, 9.0, 8.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.25, -15.723876953125, -15.19775390625, -14.671630859375, -14.1455078125, -13.619384765625, -13.09326171875, -12.567138671875, -12.041015625, -11.514892578125, -10.98876953125, -10.462646484375, -9.9365234375, -9.410400390625, -8.88427734375, -8.358154296875, -7.83203125, -7.305908203125, -6.77978515625, -6.253662109375, -5.7275390625, -5.201416015625, -4.67529296875, -4.149169921875, -3.623046875, -3.096923828125, -2.57080078125, -2.044677734375, -1.5185546875, -0.992431640625, -0.46630859375, 0.059814453125, 0.5859375, 1.112060546875, 1.63818359375, 2.164306640625, 2.6904296875, 3.216552734375, 3.74267578125, 4.268798828125, 4.794921875, 5.321044921875, 5.84716796875, 6.373291015625, 6.8994140625, 7.425537109375, 7.95166015625, 8.477783203125, 9.00390625, 9.530029296875, 10.05615234375, 10.582275390625, 11.1083984375, 11.634521484375, 12.16064453125, 12.686767578125, 13.212890625, 13.739013671875, 14.26513671875, 14.791259765625, 15.3173828125, 15.843505859375, 16.36962890625, 16.895751953125, 17.421875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 5.0, 11.0, 18.0, 37.0, 65.0, 132.0, 201.0, 223.0, 112.0, 76.0, 39.0, 32.0, 16.0, 10.0, 3.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-289.8726806640625, -281.3412170410156, -272.8097839355469, -264.2783203125, -255.74688720703125, -247.21543884277344, -238.68399047851562, -230.15252685546875, -221.62109375, -213.0896453857422, -204.55819702148438, -196.02674865722656, -187.49530029296875, -178.96385192871094, -170.43240356445312, -161.90093994140625, -153.36949157714844, -144.83804321289062, -136.3065948486328, -127.775146484375, -119.24369812011719, -110.71224975585938, -102.18079376220703, -93.64934539794922, -85.1178970336914, -76.5864486694336, -68.05500030517578, -59.5235481262207, -50.99209976196289, -42.46065139770508, -33.92919921875, -25.397750854492188, -16.866302490234375, -8.334853172302246, 0.1965961456298828, 8.728046417236328, 17.25949478149414, 25.790943145751953, 34.32239532470703, 42.853843688964844, 51.385292053222656, 59.91674041748047, 68.44818878173828, 76.97964477539062, 85.51109313964844, 94.04254150390625, 102.57398986816406, 111.10543823242188, 119.63688659667969, 128.1683349609375, 136.6997833251953, 145.23123168945312, 153.76268005371094, 162.29412841796875, 170.82559204101562, 179.35702514648438, 187.88848876953125, 196.41993713378906, 204.95138549804688, 213.4828338623047, 222.0142822265625, 230.5457305908203, 239.07717895507812, 247.608642578125, 256.14007568359375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 1.0, 4.0, 7.0, 9.0, 12.0, 7.0, 13.0, 9.0, 8.0, 17.0, 15.0, 33.0, 21.0, 31.0, 35.0, 22.0, 28.0, 38.0, 34.0, 36.0, 34.0, 37.0, 49.0, 50.0, 54.0, 29.0, 50.0, 33.0, 38.0, 26.0, 30.0, 29.0, 22.0, 16.0, 17.0, 12.0, 25.0, 14.0, 20.0, 5.0, 6.0, 2.0, 3.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0], "bins": [-95.79580688476562, -92.85271453857422, -89.90962219238281, -86.96653747558594, -84.02344512939453, -81.08035278320312, -78.13726043701172, -75.19416809082031, -72.25108337402344, -69.30799102783203, -66.36489868164062, -63.421810150146484, -60.478721618652344, -57.53562927246094, -54.59253692626953, -51.649444580078125, -48.70635223388672, -45.76325988769531, -42.82017135620117, -39.877079010009766, -36.933990478515625, -33.99089813232422, -31.047805786132812, -28.10471534729004, -25.161624908447266, -22.218534469604492, -19.27544403076172, -16.332351684570312, -13.389261245727539, -10.446170806884766, -7.503078460693359, -4.559988021850586, -1.6169052124023438, 1.326185703277588, 4.2692766189575195, 7.212368011474609, 10.155458450317383, 13.098548889160156, 16.041641235351562, 18.984731674194336, 21.92782211303711, 24.870912551879883, 27.814002990722656, 30.757095336914062, 33.70018768310547, 36.64327621459961, 39.586368560791016, 42.529457092285156, 45.47254943847656, 48.41564178466797, 51.35873031616211, 54.301822662353516, 57.244911193847656, 60.18800354003906, 63.13109588623047, 66.07418823242188, 69.01727294921875, 71.96036529541016, 74.90345764160156, 77.84654235839844, 80.78963470458984, 83.73272705078125, 86.67581939697266, 89.61891174316406, 92.56200408935547]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 11.0, 11.0, 15.0, 24.0, 44.0, 75.0, 137.0, 238.0, 418.0, 991.0, 2155.0, 5542.0, 17532.0, 71923.0, 408673.0, 435862.0, 76839.0, 18227.0, 5652.0, 2169.0, 954.0, 493.0, 267.0, 112.0, 57.0, 42.0, 20.0, 14.0, 20.0, 10.0, 7.0, 6.0, 2.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.234375, -9.8555908203125, -9.476806640625, -9.0980224609375, -8.71923828125, -8.3404541015625, -7.961669921875, -7.5828857421875, -7.2041015625, -6.8253173828125, -6.446533203125, -6.0677490234375, -5.68896484375, -5.3101806640625, -4.931396484375, -4.5526123046875, -4.173828125, -3.7950439453125, -3.416259765625, -3.0374755859375, -2.65869140625, -2.2799072265625, -1.901123046875, -1.5223388671875, -1.1435546875, -0.7647705078125, -0.385986328125, -0.0072021484375, 0.37158203125, 0.7503662109375, 1.129150390625, 1.5079345703125, 1.88671875, 2.2655029296875, 2.644287109375, 3.0230712890625, 3.40185546875, 3.7806396484375, 4.159423828125, 4.5382080078125, 4.9169921875, 5.2957763671875, 5.674560546875, 6.0533447265625, 6.43212890625, 6.8109130859375, 7.189697265625, 7.5684814453125, 7.947265625, 8.3260498046875, 8.704833984375, 9.0836181640625, 9.46240234375, 9.8411865234375, 10.219970703125, 10.5987548828125, 10.9775390625, 11.3563232421875, 11.735107421875, 12.1138916015625, 12.49267578125, 12.8714599609375, 13.250244140625, 13.6290283203125, 14.0078125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 8.0, 5.0, 5.0, 11.0, 19.0, 17.0, 36.0, 31.0, 30.0, 53.0, 57.0, 58.0, 40.0, 65.0, 78.0, 78.0, 74.0, 66.0, 46.0, 42.0, 35.0, 31.0, 42.0, 19.0, 22.0, 16.0, 5.0, 5.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.375, -9.021484375, -8.66796875, -8.314453125, -7.9609375, -7.607421875, -7.25390625, -6.900390625, -6.546875, -6.193359375, -5.83984375, -5.486328125, -5.1328125, -4.779296875, -4.42578125, -4.072265625, -3.71875, -3.365234375, -3.01171875, -2.658203125, -2.3046875, -1.951171875, -1.59765625, -1.244140625, -0.890625, -0.537109375, -0.18359375, 0.169921875, 0.5234375, 0.876953125, 1.23046875, 1.583984375, 1.9375, 2.291015625, 2.64453125, 2.998046875, 3.3515625, 3.705078125, 4.05859375, 4.412109375, 4.765625, 5.119140625, 5.47265625, 5.826171875, 6.1796875, 6.533203125, 6.88671875, 7.240234375, 7.59375, 7.947265625, 8.30078125, 8.654296875, 9.0078125, 9.361328125, 9.71484375, 10.068359375, 10.421875, 10.775390625, 11.12890625, 11.482421875, 11.8359375, 12.189453125, 12.54296875, 12.896484375, 13.25]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 7.0, 10.0, 18.0, 21.0, 35.0, 65.0, 139.0, 311.0, 699.0, 2349.0, 16177.0, 846503.0, 171031.0, 8441.0, 1665.0, 579.0, 238.0, 110.0, 54.0, 43.0, 25.0, 10.0, 10.0, 4.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.21875, -25.4873046875, -24.755859375, -24.0244140625, -23.29296875, -22.5615234375, -21.830078125, -21.0986328125, -20.3671875, -19.6357421875, -18.904296875, -18.1728515625, -17.44140625, -16.7099609375, -15.978515625, -15.2470703125, -14.515625, -13.7841796875, -13.052734375, -12.3212890625, -11.58984375, -10.8583984375, -10.126953125, -9.3955078125, -8.6640625, -7.9326171875, -7.201171875, -6.4697265625, -5.73828125, -5.0068359375, -4.275390625, -3.5439453125, -2.8125, -2.0810546875, -1.349609375, -0.6181640625, 0.11328125, 0.8447265625, 1.576171875, 2.3076171875, 3.0390625, 3.7705078125, 4.501953125, 5.2333984375, 5.96484375, 6.6962890625, 7.427734375, 8.1591796875, 8.890625, 9.6220703125, 10.353515625, 11.0849609375, 11.81640625, 12.5478515625, 13.279296875, 14.0107421875, 14.7421875, 15.4736328125, 16.205078125, 16.9365234375, 17.66796875, 18.3994140625, 19.130859375, 19.8623046875, 20.59375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 2.0, 4.0, 5.0, 9.0, 8.0, 10.0, 11.0, 19.0, 23.0, 26.0, 26.0, 36.0, 43.0, 59.0, 57.0, 81.0, 87.0, 93.0, 59.0, 55.0, 51.0, 46.0, 38.0, 24.0, 17.0, 15.0, 16.0, 14.0, 7.0, 4.0, 18.0, 11.0, 5.0, 4.0, 3.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-32.9375, -31.826171875, -30.71484375, -29.603515625, -28.4921875, -27.380859375, -26.26953125, -25.158203125, -24.046875, -22.935546875, -21.82421875, -20.712890625, -19.6015625, -18.490234375, -17.37890625, -16.267578125, -15.15625, -14.044921875, -12.93359375, -11.822265625, -10.7109375, -9.599609375, -8.48828125, -7.376953125, -6.265625, -5.154296875, -4.04296875, -2.931640625, -1.8203125, -0.708984375, 0.40234375, 1.513671875, 2.625, 3.736328125, 4.84765625, 5.958984375, 7.0703125, 8.181640625, 9.29296875, 10.404296875, 11.515625, 12.626953125, 13.73828125, 14.849609375, 15.9609375, 17.072265625, 18.18359375, 19.294921875, 20.40625, 21.517578125, 22.62890625, 23.740234375, 24.8515625, 25.962890625, 27.07421875, 28.185546875, 29.296875, 30.408203125, 31.51953125, 32.630859375, 33.7421875, 34.853515625, 35.96484375, 37.076171875, 38.1875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 5.0, 5.0, 4.0, 8.0, 7.0, 17.0, 18.0, 20.0, 35.0, 30.0, 44.0, 51.0, 70.0, 115.0, 166.0, 254.0, 400.0, 609.0, 963.0, 1791.0, 3289.0, 6822.0, 15580.0, 43051.0, 315726.0, 583784.0, 44581.0, 16284.0, 6900.0, 3352.0, 1743.0, 1006.0, 655.0, 355.0, 241.0, 148.0, 111.0, 71.0, 47.0, 48.0, 30.0, 28.0, 20.0, 16.0, 12.0, 13.0, 8.0, 7.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.8193359375, -1.7658538818359375, -1.712371826171875, -1.6588897705078125, -1.60540771484375, -1.5519256591796875, -1.498443603515625, -1.4449615478515625, -1.3914794921875, -1.3379974365234375, -1.284515380859375, -1.2310333251953125, -1.17755126953125, -1.1240692138671875, -1.070587158203125, -1.0171051025390625, -0.963623046875, -0.9101409912109375, -0.856658935546875, -0.8031768798828125, -0.74969482421875, -0.6962127685546875, -0.642730712890625, -0.5892486572265625, -0.5357666015625, -0.4822845458984375, -0.428802490234375, -0.3753204345703125, -0.32183837890625, -0.2683563232421875, -0.214874267578125, -0.1613922119140625, -0.10791015625, -0.0544281005859375, -0.000946044921875, 0.0525360107421875, 0.10601806640625, 0.1595001220703125, 0.212982177734375, 0.2664642333984375, 0.3199462890625, 0.3734283447265625, 0.426910400390625, 0.4803924560546875, 0.53387451171875, 0.5873565673828125, 0.640838623046875, 0.6943206787109375, 0.747802734375, 0.8012847900390625, 0.854766845703125, 0.9082489013671875, 0.96173095703125, 1.0152130126953125, 1.068695068359375, 1.1221771240234375, 1.1756591796875, 1.2291412353515625, 1.282623291015625, 1.3361053466796875, 1.38958740234375, 1.4430694580078125, 1.496551513671875, 1.5500335693359375, 1.603515625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 6.0, 2.0, 3.0, 3.0, 3.0, 4.0, 3.0, 8.0, 7.0, 7.0, 8.0, 14.0, 10.0, 20.0, 23.0, 32.0, 38.0, 41.0, 51.0, 75.0, 104.0, 92.0, 98.0, 71.0, 67.0, 42.0, 38.0, 26.0, 25.0, 10.0, 8.0, 12.0, 14.0, 10.0, 4.0, 9.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0004456043243408203, -0.0004304759204387665, -0.00041534751653671265, -0.0004002191126346588, -0.000385090708732605, -0.00036996230483055115, -0.0003548339009284973, -0.0003397054970264435, -0.00032457709312438965, -0.0003094486892223358, -0.000294320285320282, -0.00027919188141822815, -0.0002640634775161743, -0.0002489350736141205, -0.00023380666971206665, -0.00021867826581001282, -0.00020354986190795898, -0.00018842145800590515, -0.00017329305410385132, -0.00015816465020179749, -0.00014303624629974365, -0.00012790784239768982, -0.00011277943849563599, -9.765103459358215e-05, -8.252263069152832e-05, -6.739422678947449e-05, -5.2265822887420654e-05, -3.713741898536682e-05, -2.2009015083312988e-05, -6.880611181259155e-06, 8.247792720794678e-06, 2.337619662284851e-05, 3.8504600524902344e-05, 5.363300442695618e-05, 6.876140832901001e-05, 8.388981223106384e-05, 9.901821613311768e-05, 0.00011414662003517151, 0.00012927502393722534, 0.00014440342783927917, 0.000159531831741333, 0.00017466023564338684, 0.00018978863954544067, 0.0002049170434474945, 0.00022004544734954834, 0.00023517385125160217, 0.000250302255153656, 0.00026543065905570984, 0.00028055906295776367, 0.0002956874668598175, 0.00031081587076187134, 0.00032594427466392517, 0.000341072678565979, 0.00035620108246803284, 0.00037132948637008667, 0.0003864578902721405, 0.00040158629417419434, 0.00041671469807624817, 0.000431843101978302, 0.00044697150588035583, 0.00046209990978240967, 0.0004772283136844635, 0.0004923567175865173, 0.0005074851214885712, 0.000522613525390625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 9.0, 15.0, 12.0, 20.0, 39.0, 54.0, 66.0, 91.0, 156.0, 282.0, 452.0, 798.0, 1680.0, 3719.0, 9187.0, 27073.0, 116566.0, 778919.0, 75450.0, 20398.0, 7430.0, 2947.0, 1457.0, 703.0, 413.0, 235.0, 140.0, 89.0, 46.0, 44.0, 19.0, 16.0, 8.0, 4.0, 8.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.0625, -2.9847259521484375, -2.906951904296875, -2.8291778564453125, -2.75140380859375, -2.6736297607421875, -2.595855712890625, -2.5180816650390625, -2.4403076171875, -2.3625335693359375, -2.284759521484375, -2.2069854736328125, -2.12921142578125, -2.0514373779296875, -1.973663330078125, -1.8958892822265625, -1.818115234375, -1.7403411865234375, -1.662567138671875, -1.5847930908203125, -1.50701904296875, -1.4292449951171875, -1.351470947265625, -1.2736968994140625, -1.1959228515625, -1.1181488037109375, -1.040374755859375, -0.9626007080078125, -0.88482666015625, -0.8070526123046875, -0.729278564453125, -0.6515045166015625, -0.57373046875, -0.4959564208984375, -0.418182373046875, -0.3404083251953125, -0.26263427734375, -0.1848602294921875, -0.107086181640625, -0.0293121337890625, 0.0484619140625, 0.1262359619140625, 0.204010009765625, 0.2817840576171875, 0.35955810546875, 0.4373321533203125, 0.515106201171875, 0.5928802490234375, 0.670654296875, 0.7484283447265625, 0.826202392578125, 0.9039764404296875, 0.98175048828125, 1.0595245361328125, 1.137298583984375, 1.2150726318359375, 1.2928466796875, 1.3706207275390625, 1.448394775390625, 1.5261688232421875, 1.60394287109375, 1.6817169189453125, 1.759490966796875, 1.8372650146484375, 1.9150390625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 6.0, 7.0, 9.0, 4.0, 6.0, 10.0, 14.0, 18.0, 36.0, 41.0, 49.0, 67.0, 129.0, 122.0, 119.0, 104.0, 62.0, 39.0, 29.0, 30.0, 21.0, 17.0, 13.0, 14.0, 8.0, 8.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.728515625, -3.61480712890625, -3.5010986328125, -3.38739013671875, -3.273681640625, -3.15997314453125, -3.0462646484375, -2.93255615234375, -2.81884765625, -2.70513916015625, -2.5914306640625, -2.47772216796875, -2.364013671875, -2.25030517578125, -2.1365966796875, -2.02288818359375, -1.9091796875, -1.79547119140625, -1.6817626953125, -1.56805419921875, -1.454345703125, -1.34063720703125, -1.2269287109375, -1.11322021484375, -0.99951171875, -0.88580322265625, -0.7720947265625, -0.65838623046875, -0.544677734375, -0.43096923828125, -0.3172607421875, -0.20355224609375, -0.08984375, 0.02386474609375, 0.1375732421875, 0.25128173828125, 0.364990234375, 0.47869873046875, 0.5924072265625, 0.70611572265625, 0.81982421875, 0.93353271484375, 1.0472412109375, 1.16094970703125, 1.274658203125, 1.38836669921875, 1.5020751953125, 1.61578369140625, 1.7294921875, 1.84320068359375, 1.9569091796875, 2.07061767578125, 2.184326171875, 2.29803466796875, 2.4117431640625, 2.52545166015625, 2.63916015625, 2.75286865234375, 2.8665771484375, 2.98028564453125, 3.093994140625, 3.20770263671875, 3.3214111328125, 3.43511962890625, 3.548828125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 11.0, 28.0, 95.0, 444.0, 278.0, 77.0, 29.0, 19.0, 16.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.42794036865234, -93.1633071899414, -86.89866638183594, -80.634033203125, -74.36939239501953, -68.1047592163086, -61.84012222290039, -55.57548522949219, -49.310848236083984, -43.04621124267578, -36.78157424926758, -30.516939163208008, -24.252302169799805, -17.9876651763916, -11.723030090332031, -5.458393096923828, 0.806243896484375, 7.07088041305542, 13.335516929626465, 19.60015296936035, 25.864789962768555, 32.129425048828125, 38.39406204223633, 44.65869903564453, 50.923336029052734, 57.18797302246094, 63.45261001586914, 69.71724700927734, 75.98188018798828, 82.24652099609375, 88.51115417480469, 94.77578735351562, 101.04042053222656, 107.3050537109375, 113.56969451904297, 119.8343276977539, 126.09896850585938, 132.3636016845703, 138.62823486328125, 144.89288330078125, 151.1575164794922, 157.42214965820312, 163.68678283691406, 169.95143127441406, 176.216064453125, 182.48069763183594, 188.74533081054688, 195.00997924804688, 201.27459716796875, 207.5392303466797, 213.80386352539062, 220.06851196289062, 226.33314514160156, 232.5977783203125, 238.86241149902344, 245.12704467773438, 251.39169311523438, 257.6563415527344, 263.92095947265625, 270.18560791015625, 276.4502258300781, 282.7148742675781, 288.9795227050781, 295.244140625, 301.5087890625]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 3.0, 5.0, 6.0, 3.0, 5.0, 4.0, 8.0, 9.0, 14.0, 6.0, 9.0, 13.0, 15.0, 20.0, 29.0, 20.0, 22.0, 44.0, 109.0, 113.0, 56.0, 93.0, 103.0, 61.0, 40.0, 27.0, 12.0, 20.0, 14.0, 13.0, 11.0, 7.0, 10.0, 11.0, 9.0, 7.0, 10.0, 7.0, 6.0, 6.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-82.41512298583984, -79.95773315429688, -77.50035095214844, -75.04296112060547, -72.5855712890625, -70.12818145751953, -67.67079162597656, -65.21340942382812, -62.756019592285156, -60.29862976074219, -57.841243743896484, -55.38385772705078, -52.92646789550781, -50.469078063964844, -48.01169204711914, -45.55430603027344, -43.09691619873047, -40.6395263671875, -38.1821403503418, -35.724754333496094, -33.267364501953125, -30.80997657775879, -28.352588653564453, -25.895200729370117, -23.43781280517578, -20.980424880981445, -18.52303695678711, -16.065649032592773, -13.608261108398438, -11.150873184204102, -8.693485260009766, -6.23609733581543, -3.778717041015625, -1.321329116821289, 1.1360588073730469, 3.593446731567383, 6.050834655761719, 8.508222579956055, 10.96561050415039, 13.422998428344727, 15.880386352539062, 18.3377742767334, 20.795162200927734, 23.25255012512207, 25.709938049316406, 28.167325973510742, 30.624713897705078, 33.08209991455078, 35.53948974609375, 37.99687957763672, 40.45426559448242, 42.911651611328125, 45.369041442871094, 47.82643127441406, 50.283817291259766, 52.74120330810547, 55.19859313964844, 57.655982971191406, 60.11336898803711, 62.57075500488281, 65.02814483642578, 67.48553466796875, 69.94291687011719, 72.40030670166016, 74.85769653320312]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 6.0, 3.0, 0.0, 1.0, 6.0, 7.0, 8.0, 12.0, 15.0, 17.0, 15.0, 9.0, 19.0, 26.0, 33.0, 28.0, 44.0, 63.0, 108.0, 179.0, 92.0, 53.0, 24.0, 30.0, 30.0, 26.0, 26.0, 27.0, 20.0, 19.0, 10.0, 11.0, 7.0, 10.0, 8.0, 4.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.9453125, -8.6861572265625, -8.427001953125, -8.1678466796875, -7.90869140625, -7.6495361328125, -7.390380859375, -7.1312255859375, -6.8720703125, -6.6129150390625, -6.353759765625, -6.0946044921875, -5.83544921875, -5.5762939453125, -5.317138671875, -5.0579833984375, -4.798828125, -4.5396728515625, -4.280517578125, -4.0213623046875, -3.76220703125, -3.5030517578125, -3.243896484375, -2.9847412109375, -2.7255859375, -2.4664306640625, -2.207275390625, -1.9481201171875, -1.68896484375, -1.4298095703125, -1.170654296875, -0.9114990234375, -0.65234375, -0.3931884765625, -0.134033203125, 0.1251220703125, 0.38427734375, 0.6434326171875, 0.902587890625, 1.1617431640625, 1.4208984375, 1.6800537109375, 1.939208984375, 2.1983642578125, 2.45751953125, 2.7166748046875, 2.975830078125, 3.2349853515625, 3.494140625, 3.7532958984375, 4.012451171875, 4.2716064453125, 4.53076171875, 4.7899169921875, 5.049072265625, 5.3082275390625, 5.5673828125, 5.8265380859375, 6.085693359375, 6.3448486328125, 6.60400390625, 6.8631591796875, 7.122314453125, 7.3814697265625, 7.640625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 0.0, 1.0, 1.0, 1.0, 14.0, 13.0, 4.0, 15.0, 27.0, 20.0, 26.0, 64.0, 75.0, 213.0, 599.0, 2003.0, 8852.0, 8319103.0, 51246.0, 4360.0, 1161.0, 362.0, 174.0, 92.0, 52.0, 25.0, 14.0, 9.0, 11.0, 9.0, 5.0, 4.0, 0.0, 2.0, 4.0, 8.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.04344940185547, -73.85832214355469, -71.67318725585938, -69.4880599975586, -67.30293273925781, -65.1177978515625, -62.93267059326172, -60.74754333496094, -58.56241226196289, -56.377281188964844, -54.19215393066406, -52.007022857666016, -49.82189178466797, -47.63676452636719, -45.45163345336914, -43.266502380371094, -41.08137512207031, -38.896244049072266, -36.711116790771484, -34.52598571777344, -32.340858459472656, -30.15572738647461, -27.970596313476562, -25.78546714782715, -23.600337982177734, -21.41520881652832, -19.230079650878906, -17.04494857788086, -14.859819412231445, -12.674690246582031, -10.4895601272583, -8.30443000793457, -6.119304656982422, -3.9341750144958496, -1.7490453720092773, 0.4360842704772949, 2.621213912963867, 4.806343078613281, 6.991473197937012, 9.176603317260742, 11.361732482910156, 13.54686164855957, 15.7319917678833, 17.91712188720703, 20.102251052856445, 22.28738021850586, 24.472511291503906, 26.65764045715332, 28.842769622802734, 31.02789878845215, 33.21302795410156, 35.39815902709961, 37.583290100097656, 39.76841735839844, 41.953548431396484, 44.13867950439453, 46.32380676269531, 48.50893783569336, 50.69406509399414, 52.87919616699219, 55.06432342529297, 57.249454498291016, 59.43458557128906, 61.619712829589844, 63.80484390258789]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 3.0, 8.0, 2.0, 1.0, 3.0, 6.0, 4.0, 7.0, 1.0, 11.0, 8.0, 4.0, 8.0, 5.0, 4.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.25323486328125, -94.98501586914062, -91.71680450439453, -88.4485855102539, -85.18037414550781, -81.91215515136719, -78.64393615722656, -75.37571716308594, -72.10750579833984, -68.83928680419922, -65.57107543945312, -62.3028564453125, -59.03464126586914, -55.76642608642578, -52.498207092285156, -49.2299919128418, -45.96177673339844, -42.69356155395508, -39.42534637451172, -36.157127380371094, -32.888912200927734, -29.620697021484375, -26.352479934692383, -23.08426284790039, -19.81604766845703, -16.547832489013672, -13.27961540222168, -10.011399269104004, -6.743183135986328, -3.4749679565429688, -0.20675086975097656, 3.0614662170410156, 6.329673767089844, 9.59788990020752, 12.866106033325195, 16.134323120117188, 19.402538299560547, 22.670753479003906, 25.9389705657959, 29.20718765258789, 32.47540283203125, 35.74361801147461, 39.01183319091797, 42.280052185058594, 45.54826736450195, 48.81648254394531, 52.08470153808594, 55.3529167175293, 58.621131896972656, 61.889347076416016, 65.15756225585938, 68.42578125, 71.69400024414062, 74.96221160888672, 78.23043060302734, 81.49864196777344, 84.76686096191406, 88.03507995605469, 91.30329132080078, 94.5715103149414, 97.8397216796875, 101.10794067382812, 104.37615966796875, 107.64437866210938, 110.91259002685547]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 6.0, 7.0, 5.0, 5.0, 5.0, 8.0, 7.0, 15.0, 17.0, 23.0, 24.0, 34.0, 38.0, 36.0, 43.0, 48.0, 53.0, 43.0, 63.0, 51.0, 63.0, 62.0, 47.0, 42.0, 44.0, 33.0, 28.0, 33.0, 15.0, 21.0, 15.0, 15.0, 13.0, 9.0, 3.0, 5.0, 5.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.29296875, -5.11566162109375, -4.9383544921875, -4.76104736328125, -4.583740234375, -4.40643310546875, -4.2291259765625, -4.05181884765625, -3.87451171875, -3.69720458984375, -3.5198974609375, -3.34259033203125, -3.165283203125, -2.98797607421875, -2.8106689453125, -2.63336181640625, -2.4560546875, -2.27874755859375, -2.1014404296875, -1.92413330078125, -1.746826171875, -1.56951904296875, -1.3922119140625, -1.21490478515625, -1.03759765625, -0.86029052734375, -0.6829833984375, -0.50567626953125, -0.328369140625, -0.15106201171875, 0.0262451171875, 0.20355224609375, 0.380859375, 0.55816650390625, 0.7354736328125, 0.91278076171875, 1.090087890625, 1.26739501953125, 1.4447021484375, 1.62200927734375, 1.79931640625, 1.97662353515625, 2.1539306640625, 2.33123779296875, 2.508544921875, 2.68585205078125, 2.8631591796875, 3.04046630859375, 3.2177734375, 3.39508056640625, 3.5723876953125, 3.74969482421875, 3.927001953125, 4.10430908203125, 4.2816162109375, 4.45892333984375, 4.63623046875, 4.81353759765625, 4.9908447265625, 5.16815185546875, 5.345458984375, 5.52276611328125, 5.7000732421875, 5.87738037109375, 6.0546875]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 12.0, 3.0, 11.0, 5.0, 14.0, 16.0, 20.0, 30.0, 53.0, 78.0, 108.0, 211.0, 404.0, 820.0, 2055.0, 5694.0, 18873.0, 65536.0, 196423.0, 162829.0, 48974.0, 14213.0, 4657.0, 1682.0, 690.0, 344.0, 197.0, 105.0, 74.0, 44.0, 28.0, 19.0, 11.0, 14.0, 7.0, 6.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-65.375, -63.5537109375, -61.732421875, -59.9111328125, -58.08984375, -56.2685546875, -54.447265625, -52.6259765625, -50.8046875, -48.9833984375, -47.162109375, -45.3408203125, -43.51953125, -41.6982421875, -39.876953125, -38.0556640625, -36.234375, -34.4130859375, -32.591796875, -30.7705078125, -28.94921875, -27.1279296875, -25.306640625, -23.4853515625, -21.6640625, -19.8427734375, -18.021484375, -16.2001953125, -14.37890625, -12.5576171875, -10.736328125, -8.9150390625, -7.09375, -5.2724609375, -3.451171875, -1.6298828125, 0.19140625, 2.0126953125, 3.833984375, 5.6552734375, 7.4765625, 9.2978515625, 11.119140625, 12.9404296875, 14.76171875, 16.5830078125, 18.404296875, 20.2255859375, 22.046875, 23.8681640625, 25.689453125, 27.5107421875, 29.33203125, 31.1533203125, 32.974609375, 34.7958984375, 36.6171875, 38.4384765625, 40.259765625, 42.0810546875, 43.90234375, 45.7236328125, 47.544921875, 49.3662109375, 51.1875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 6.0, 8.0, 10.0, 8.0, 19.0, 26.0, 30.0, 31.0, 39.0, 52.0, 58.0, 59.0, 75.0, 80.0, 73.0, 82.0, 82.0, 46.0, 59.0, 42.0, 34.0, 17.0, 14.0, 13.0, 9.0, 10.0, 4.0, 7.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3984375, -9.0953369140625, -8.792236328125, -8.4891357421875, -8.18603515625, -7.8829345703125, -7.579833984375, -7.2767333984375, -6.9736328125, -6.6705322265625, -6.367431640625, -6.0643310546875, -5.76123046875, -5.4581298828125, -5.155029296875, -4.8519287109375, -4.548828125, -4.2457275390625, -3.942626953125, -3.6395263671875, -3.33642578125, -3.0333251953125, -2.730224609375, -2.4271240234375, -2.1240234375, -1.8209228515625, -1.517822265625, -1.2147216796875, -0.91162109375, -0.6085205078125, -0.305419921875, -0.0023193359375, 0.30078125, 0.6038818359375, 0.906982421875, 1.2100830078125, 1.51318359375, 1.8162841796875, 2.119384765625, 2.4224853515625, 2.7255859375, 3.0286865234375, 3.331787109375, 3.6348876953125, 3.93798828125, 4.2410888671875, 4.544189453125, 4.8472900390625, 5.150390625, 5.4534912109375, 5.756591796875, 6.0596923828125, 6.36279296875, 6.6658935546875, 6.968994140625, 7.2720947265625, 7.5751953125, 7.8782958984375, 8.181396484375, 8.4844970703125, 8.78759765625, 9.0906982421875, 9.393798828125, 9.6968994140625, 10.0]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 1.0, 8.0, 9.0, 14.0, 20.0, 53.0, 69.0, 78.0, 85.0, 45.0, 22.0, 21.0, 3.0, 6.0, 12.0, 4.0, 1.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-50.4355354309082, -48.931541442871094, -47.427547454833984, -45.923553466796875, -44.41956329345703, -42.91556930541992, -41.41157531738281, -39.9075813293457, -38.403587341308594, -36.899593353271484, -35.395599365234375, -33.89160919189453, -32.38761520385742, -30.883621215820312, -29.379627227783203, -27.875633239746094, -26.37164306640625, -24.86764907836914, -23.363656997680664, -21.859663009643555, -20.355670928955078, -18.85167694091797, -17.34768295288086, -15.843689918518066, -14.339696884155273, -12.83570384979248, -11.331710815429688, -9.827716827392578, -8.323723793029785, -6.819730758666992, -5.315736770629883, -3.81174373626709, -2.3077545166015625, -0.8037612438201904, 0.7002320289611816, 2.204225540161133, 3.708218574523926, 5.212211608886719, 6.716205596923828, 8.220198631286621, 9.724191665649414, 11.228184700012207, 12.732177734375, 14.23617172241211, 15.740164756774902, 17.244157791137695, 18.748151779174805, 20.25214385986328, 21.75613784790039, 23.2601318359375, 24.764123916625977, 26.268117904663086, 27.772109985351562, 29.276103973388672, 30.78009796142578, 32.28409194946289, 33.7880859375, 35.29207992553711, 36.79607391357422, 38.30006408691406, 39.80405807495117, 41.30805206298828, 42.81204605102539, 44.3160400390625, 45.820030212402344]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 8.0, 12.0, 11.0, 21.0, 52.0, 70.0, 88.0, 81.0, 47.0, 25.0, 14.0, 6.0, 2.0, 7.0, 4.0, 5.0, 4.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.54945373535156, -59.01248550415039, -57.47551727294922, -55.93854522705078, -54.40157699584961, -52.86460876464844, -51.327640533447266, -49.790672302246094, -48.25370407104492, -46.71673583984375, -45.17976760864258, -43.642799377441406, -42.10582733154297, -40.5688591003418, -39.031890869140625, -37.49492263793945, -35.95795440673828, -34.42098617553711, -32.88401794433594, -31.347047805786133, -29.81007957458496, -28.273109436035156, -26.736141204833984, -25.199172973632812, -23.662200927734375, -22.125232696533203, -20.5882625579834, -19.051294326782227, -17.514326095581055, -15.977356910705566, -14.440387725830078, -12.903419494628906, -11.366451263427734, -9.829482078552246, -8.292513847351074, -6.755544662475586, -5.218575954437256, -3.681607246398926, -2.1446380615234375, -0.6076698303222656, 0.9292993545532227, 2.4662680625915527, 4.003236770629883, 5.540205955505371, 7.077174663543701, 8.614143371582031, 10.15111255645752, 11.688080787658691, 13.22504997253418, 14.762019157409668, 16.298988342285156, 17.835956573486328, 19.3729248046875, 20.909893035888672, 22.446863174438477, 23.98383140563965, 25.520801544189453, 27.057769775390625, 28.59473991394043, 30.1317081451416, 31.668676376342773, 33.20564651489258, 34.74261474609375, 36.27958297729492, 37.816551208496094]}, "eval/loss": 0.7061182856559753, "eval/wer": 0.12633875446251489, "eval/runtime": 638.826, "eval/samples_per_second": 4.136, "eval/steps_per_second": 0.518} \ No newline at end of file +{"train/loss": 0.2602, "train/learning_rate": 1.8408450704225354e-06, "train/epoch": 23.54, "train/global_step": 21000, "_runtime": 127314, "_timestamp": 1648268658, "_step": 21013, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 1.0, 6.0, 6.0, 5.0, 1.0, 5.0, 5.0, 9.0, 13.0, 17.0, 12.0, 19.0, 16.0, 34.0, 28.0, 25.0, 30.0, 37.0, 37.0, 35.0, 45.0, 46.0, 45.0, 44.0, 40.0, 41.0, 41.0, 33.0, 42.0, 30.0, 31.0, 28.0, 24.0, 31.0, 24.0, 17.0, 18.0, 18.0, 11.0, 14.0, 8.0, 7.0, 8.0, 6.0, 7.0, 5.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-44.89548873901367, -43.69374465942383, -42.49199676513672, -41.290252685546875, -40.088504791259766, -38.88676071166992, -37.68501281738281, -36.48326873779297, -35.281524658203125, -34.07978057861328, -32.87803268432617, -31.676286697387695, -30.47454071044922, -29.272796630859375, -28.0710506439209, -26.869304656982422, -25.667556762695312, -24.465810775756836, -23.26406478881836, -22.062318801879883, -20.860572814941406, -19.658828735351562, -18.457082748413086, -17.25533676147461, -16.053590774536133, -14.851844787597656, -13.65009880065918, -12.44835376739502, -11.246607780456543, -10.044861793518066, -8.843116760253906, -7.64137077331543, -6.439628601074219, -5.237882614135742, -4.036137104034424, -2.8343913555145264, -1.632645606994629, -0.43089962005615234, 0.770845890045166, 1.9725914001464844, 3.174337387084961, 4.3760833740234375, 5.577828884124756, 6.779574394226074, 7.981320381164551, 9.183066368103027, 10.384811401367188, 11.586557388305664, 12.78830337524414, 13.990049362182617, 15.191795349121094, 16.39354133605957, 17.595287322998047, 18.79703140258789, 19.998777389526367, 21.200523376464844, 22.40226936340332, 23.604015350341797, 24.805761337280273, 26.00750732421875, 27.209251403808594, 28.410999298095703, 29.612743377685547, 30.814489364624023, 32.0162353515625]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 8.0, 8.0, 5.0, 15.0, 17.0, 14.0, 10.0, 19.0, 19.0, 20.0, 35.0, 34.0, 33.0, 28.0, 31.0, 43.0, 28.0, 41.0, 33.0, 37.0, 45.0, 37.0, 40.0, 39.0, 43.0, 32.0, 43.0, 33.0, 32.0, 36.0, 29.0, 20.0, 15.0, 14.0, 9.0, 8.0, 14.0, 8.0, 4.0, 8.0, 2.0, 0.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.66038131713867, -35.51462173461914, -34.36886215209961, -33.22310256958008, -32.07734298706055, -30.931583404541016, -29.78582191467285, -28.64006233215332, -27.49430274963379, -26.348543167114258, -25.202783584594727, -24.057024002075195, -22.91126251220703, -21.7655029296875, -20.61974334716797, -19.473983764648438, -18.328224182128906, -17.182464599609375, -16.036705017089844, -14.890944480895996, -13.745184898376465, -12.599425315856934, -11.453664779663086, -10.307905197143555, -9.162145614624023, -8.016386032104492, -6.870625972747803, -5.724865913391113, -4.579106330871582, -3.433346748352051, -2.2875866889953613, -1.1418266296386719, 0.003932952880859375, 1.1496927738189697, 2.29545259475708, 3.4412124156951904, 4.586972236633301, 5.732731819152832, 6.8784918785095215, 8.024251937866211, 9.170011520385742, 10.315771102905273, 11.461530685424805, 12.607291221618652, 13.753050804138184, 14.898810386657715, 16.044570922851562, 17.190330505371094, 18.336090087890625, 19.481849670410156, 20.627609252929688, 21.77336883544922, 22.91912841796875, 24.06488800048828, 25.210649490356445, 26.356409072875977, 27.502168655395508, 28.64792823791504, 29.79368782043457, 30.9394474029541, 32.085208892822266, 33.2309684753418, 34.37672805786133, 35.52248764038086, 36.66824722290039]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 6.0, 7.0, 5.0, 20.0, 25.0, 54.0, 70.0, 111.0, 183.0, 306.0, 535.0, 881.0, 1461.0, 2393.0, 4077.0, 6590.0, 11257.0, 18929.0, 31295.0, 52555.0, 87366.0, 146278.0, 241882.0, 390815.0, 590865.0, 731247.0, 663770.0, 468594.0, 294610.0, 179111.0, 107093.0, 65001.0, 38540.0, 23214.0, 14009.0, 8512.0, 4935.0, 2941.0, 1865.0, 1120.0, 699.0, 433.0, 248.0, 143.0, 90.0, 53.0, 44.0, 22.0, 8.0, 13.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-52.0, -50.24951171875, -48.4990234375, -46.74853515625, -44.998046875, -43.24755859375, -41.4970703125, -39.74658203125, -37.99609375, -36.24560546875, -34.4951171875, -32.74462890625, -30.994140625, -29.24365234375, -27.4931640625, -25.74267578125, -23.9921875, -22.24169921875, -20.4912109375, -18.74072265625, -16.990234375, -15.23974609375, -13.4892578125, -11.73876953125, -9.98828125, -8.23779296875, -6.4873046875, -4.73681640625, -2.986328125, -1.23583984375, 0.5146484375, 2.26513671875, 4.015625, 5.76611328125, 7.5166015625, 9.26708984375, 11.017578125, 12.76806640625, 14.5185546875, 16.26904296875, 18.01953125, 19.77001953125, 21.5205078125, 23.27099609375, 25.021484375, 26.77197265625, 28.5224609375, 30.27294921875, 32.0234375, 33.77392578125, 35.5244140625, 37.27490234375, 39.025390625, 40.77587890625, 42.5263671875, 44.27685546875, 46.02734375, 47.77783203125, 49.5283203125, 51.27880859375, 53.029296875, 54.77978515625, 56.5302734375, 58.28076171875, 60.03125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 0.0, 4.0, 7.0, 4.0, 7.0, 15.0, 19.0, 13.0, 12.0, 15.0, 15.0, 24.0, 11.0, 19.0, 15.0, 31.0, 35.0, 25.0, 29.0, 23.0, 44.0, 29.0, 25.0, 41.0, 41.0, 30.0, 30.0, 41.0, 29.0, 31.0, 42.0, 31.0, 42.0, 25.0, 28.0, 24.0, 21.0, 14.0, 26.0, 10.0, 15.0, 11.0, 6.0, 6.0, 7.0, 6.0, 5.0, 5.0, 3.0, 1.0, 2.0, 6.0, 4.0, 0.0, 1.0, 1.0, 3.0], "bins": [-33.46875, -32.41650390625, -31.3642578125, -30.31201171875, -29.259765625, -28.20751953125, -27.1552734375, -26.10302734375, -25.05078125, -23.99853515625, -22.9462890625, -21.89404296875, -20.841796875, -19.78955078125, -18.7373046875, -17.68505859375, -16.6328125, -15.58056640625, -14.5283203125, -13.47607421875, -12.423828125, -11.37158203125, -10.3193359375, -9.26708984375, -8.21484375, -7.16259765625, -6.1103515625, -5.05810546875, -4.005859375, -2.95361328125, -1.9013671875, -0.84912109375, 0.203125, 1.25537109375, 2.3076171875, 3.35986328125, 4.412109375, 5.46435546875, 6.5166015625, 7.56884765625, 8.62109375, 9.67333984375, 10.7255859375, 11.77783203125, 12.830078125, 13.88232421875, 14.9345703125, 15.98681640625, 17.0390625, 18.09130859375, 19.1435546875, 20.19580078125, 21.248046875, 22.30029296875, 23.3525390625, 24.40478515625, 25.45703125, 26.50927734375, 27.5615234375, 28.61376953125, 29.666015625, 30.71826171875, 31.7705078125, 32.82275390625, 33.875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 9.0, 15.0, 31.0, 52.0, 91.0, 134.0, 216.0, 402.0, 586.0, 1007.0, 1586.0, 2564.0, 4071.0, 6386.0, 9980.0, 16250.0, 25408.0, 40242.0, 63500.0, 98799.0, 151581.0, 227236.0, 326761.0, 446952.0, 549747.0, 572537.0, 496073.0, 376962.0, 266616.0, 180197.0, 118743.0, 77018.0, 48851.0, 31070.0, 19543.0, 12429.0, 7715.0, 4807.0, 3134.0, 1959.0, 1176.0, 703.0, 427.0, 305.0, 177.0, 99.0, 59.0, 34.0, 24.0, 12.0, 5.0, 5.0, 2.0, 1.0, 1.0], "bins": [-44.46875, -43.1689453125, -41.869140625, -40.5693359375, -39.26953125, -37.9697265625, -36.669921875, -35.3701171875, -34.0703125, -32.7705078125, -31.470703125, -30.1708984375, -28.87109375, -27.5712890625, -26.271484375, -24.9716796875, -23.671875, -22.3720703125, -21.072265625, -19.7724609375, -18.47265625, -17.1728515625, -15.873046875, -14.5732421875, -13.2734375, -11.9736328125, -10.673828125, -9.3740234375, -8.07421875, -6.7744140625, -5.474609375, -4.1748046875, -2.875, -1.5751953125, -0.275390625, 1.0244140625, 2.32421875, 3.6240234375, 4.923828125, 6.2236328125, 7.5234375, 8.8232421875, 10.123046875, 11.4228515625, 12.72265625, 14.0224609375, 15.322265625, 16.6220703125, 17.921875, 19.2216796875, 20.521484375, 21.8212890625, 23.12109375, 24.4208984375, 25.720703125, 27.0205078125, 28.3203125, 29.6201171875, 30.919921875, 32.2197265625, 33.51953125, 34.8193359375, 36.119140625, 37.4189453125, 38.71875]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 7.0, 3.0, 3.0, 9.0, 16.0, 14.0, 15.0, 22.0, 29.0, 32.0, 57.0, 63.0, 90.0, 85.0, 105.0, 130.0, 135.0, 159.0, 191.0, 197.0, 218.0, 261.0, 231.0, 223.0, 214.0, 224.0, 198.0, 166.0, 144.0, 135.0, 102.0, 101.0, 88.0, 82.0, 62.0, 59.0, 38.0, 31.0, 29.0, 24.0, 19.0, 11.0, 15.0, 14.0, 9.0, 5.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.125, -16.55029296875, -15.9755859375, -15.40087890625, -14.826171875, -14.25146484375, -13.6767578125, -13.10205078125, -12.52734375, -11.95263671875, -11.3779296875, -10.80322265625, -10.228515625, -9.65380859375, -9.0791015625, -8.50439453125, -7.9296875, -7.35498046875, -6.7802734375, -6.20556640625, -5.630859375, -5.05615234375, -4.4814453125, -3.90673828125, -3.33203125, -2.75732421875, -2.1826171875, -1.60791015625, -1.033203125, -0.45849609375, 0.1162109375, 0.69091796875, 1.265625, 1.84033203125, 2.4150390625, 2.98974609375, 3.564453125, 4.13916015625, 4.7138671875, 5.28857421875, 5.86328125, 6.43798828125, 7.0126953125, 7.58740234375, 8.162109375, 8.73681640625, 9.3115234375, 9.88623046875, 10.4609375, 11.03564453125, 11.6103515625, 12.18505859375, 12.759765625, 13.33447265625, 13.9091796875, 14.48388671875, 15.05859375, 15.63330078125, 16.2080078125, 16.78271484375, 17.357421875, 17.93212890625, 18.5068359375, 19.08154296875, 19.65625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 5.0, 4.0, 7.0, 10.0, 12.0, 10.0, 19.0, 17.0, 9.0, 18.0, 22.0, 34.0, 34.0, 29.0, 36.0, 36.0, 45.0, 39.0, 50.0, 34.0, 46.0, 34.0, 42.0, 57.0, 43.0, 33.0, 34.0, 35.0, 37.0, 33.0, 19.0, 30.0, 15.0, 15.0, 7.0, 9.0, 10.0, 11.0, 7.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.735687255859375, -43.22833251953125, -41.72098159790039, -40.213626861572266, -38.706275939941406, -37.19892120361328, -35.691566467285156, -34.1842155456543, -32.67686462402344, -31.169511795043945, -29.662158966064453, -28.154804229736328, -26.64745330810547, -25.140098571777344, -23.63274574279785, -22.12539291381836, -20.618038177490234, -19.110685348510742, -17.60333251953125, -16.095977783203125, -14.58862590789795, -13.081273078918457, -11.573919296264648, -10.066566467285156, -8.559213638305664, -7.051860809326172, -5.5445075035095215, -4.037154197692871, -2.529801368713379, -1.0224485397338867, 0.4849052429199219, 1.992258071899414, 3.499614715576172, 5.006967544555664, 6.5143208503723145, 8.021674156188965, 9.529026985168457, 11.03637981414795, 12.543733596801758, 14.05108642578125, 15.558439254760742, 17.065792083740234, 18.573144912719727, 20.08049774169922, 21.587852478027344, 23.095203399658203, 24.602558135986328, 26.10991096496582, 27.617263793945312, 29.124616622924805, 30.631969451904297, 32.13932418823242, 33.64667510986328, 35.154029846191406, 36.66138458251953, 38.16873550415039, 39.67608642578125, 41.183441162109375, 42.690792083740234, 44.19814682006836, 45.70549774169922, 47.212852478027344, 48.72020721435547, 50.22755813598633, 51.73491287231445]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 7.0, 7.0, 5.0, 11.0, 16.0, 9.0, 16.0, 15.0, 21.0, 23.0, 31.0, 18.0, 29.0, 28.0, 28.0, 25.0, 36.0, 39.0, 42.0, 36.0, 25.0, 42.0, 35.0, 45.0, 47.0, 37.0, 46.0, 29.0, 36.0, 28.0, 22.0, 30.0, 15.0, 22.0, 19.0, 21.0, 14.0, 9.0, 7.0, 6.0, 8.0, 8.0, 4.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-41.88594055175781, -40.551082611083984, -39.216224670410156, -37.88136672973633, -36.5465087890625, -35.211647033691406, -33.87678909301758, -32.54193115234375, -31.207073211669922, -29.872215270996094, -28.537357330322266, -27.202497482299805, -25.867639541625977, -24.53278160095215, -23.197921752929688, -21.86306381225586, -20.52820587158203, -19.193347930908203, -17.858489990234375, -16.523630142211914, -15.188772201538086, -13.853914260864258, -12.519055366516113, -11.184196472167969, -9.84933853149414, -8.514480590820312, -7.179621696472168, -5.844763278961182, -4.509904861450195, -3.175046443939209, -1.8401880264282227, -0.5053291320800781, 0.8295326232910156, 2.164391040802002, 3.4992494583129883, 4.834107875823975, 6.168966293334961, 7.503824710845947, 8.838683128356934, 10.173542022705078, 11.508399963378906, 12.843257904052734, 14.178116798400879, 15.512975692749023, 16.84783363342285, 18.18269157409668, 19.51755142211914, 20.85240936279297, 22.187267303466797, 23.522125244140625, 24.856983184814453, 26.191843032836914, 27.526700973510742, 28.86155891418457, 30.19641876220703, 31.53127670288086, 32.86613464355469, 34.200992584228516, 35.535850524902344, 36.87070846557617, 38.20556640625, 39.540428161621094, 40.87528610229492, 42.21014404296875, 43.54500198364258]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 8.0, 12.0, 21.0, 46.0, 65.0, 89.0, 165.0, 243.0, 385.0, 594.0, 980.0, 1501.0, 2298.0, 3597.0, 5189.0, 7964.0, 12068.0, 18326.0, 26508.0, 38911.0, 55060.0, 75003.0, 96890.0, 115257.0, 122612.0, 115548.0, 97279.0, 75425.0, 55421.0, 39369.0, 27604.0, 18229.0, 12541.0, 8117.0, 5420.0, 3489.0, 2248.0, 1479.0, 973.0, 597.0, 368.0, 232.0, 148.0, 109.0, 73.0, 34.0, 19.0, 10.0, 11.0, 6.0, 4.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-49.75, -48.17138671875, -46.5927734375, -45.01416015625, -43.435546875, -41.85693359375, -40.2783203125, -38.69970703125, -37.12109375, -35.54248046875, -33.9638671875, -32.38525390625, -30.806640625, -29.22802734375, -27.6494140625, -26.07080078125, -24.4921875, -22.91357421875, -21.3349609375, -19.75634765625, -18.177734375, -16.59912109375, -15.0205078125, -13.44189453125, -11.86328125, -10.28466796875, -8.7060546875, -7.12744140625, -5.548828125, -3.97021484375, -2.3916015625, -0.81298828125, 0.765625, 2.34423828125, 3.9228515625, 5.50146484375, 7.080078125, 8.65869140625, 10.2373046875, 11.81591796875, 13.39453125, 14.97314453125, 16.5517578125, 18.13037109375, 19.708984375, 21.28759765625, 22.8662109375, 24.44482421875, 26.0234375, 27.60205078125, 29.1806640625, 30.75927734375, 32.337890625, 33.91650390625, 35.4951171875, 37.07373046875, 38.65234375, 40.23095703125, 41.8095703125, 43.38818359375, 44.966796875, 46.54541015625, 48.1240234375, 49.70263671875, 51.28125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 5.0, 9.0, 7.0, 8.0, 13.0, 13.0, 15.0, 23.0, 20.0, 20.0, 23.0, 30.0, 30.0, 38.0, 28.0, 28.0, 42.0, 37.0, 35.0, 31.0, 31.0, 40.0, 54.0, 32.0, 39.0, 29.0, 28.0, 42.0, 24.0, 34.0, 27.0, 31.0, 17.0, 17.0, 17.0, 15.0, 11.0, 12.0, 13.0, 6.0, 6.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-39.0625, -37.83154296875, -36.6005859375, -35.36962890625, -34.138671875, -32.90771484375, -31.6767578125, -30.44580078125, -29.21484375, -27.98388671875, -26.7529296875, -25.52197265625, -24.291015625, -23.06005859375, -21.8291015625, -20.59814453125, -19.3671875, -18.13623046875, -16.9052734375, -15.67431640625, -14.443359375, -13.21240234375, -11.9814453125, -10.75048828125, -9.51953125, -8.28857421875, -7.0576171875, -5.82666015625, -4.595703125, -3.36474609375, -2.1337890625, -0.90283203125, 0.328125, 1.55908203125, 2.7900390625, 4.02099609375, 5.251953125, 6.48291015625, 7.7138671875, 8.94482421875, 10.17578125, 11.40673828125, 12.6376953125, 13.86865234375, 15.099609375, 16.33056640625, 17.5615234375, 18.79248046875, 20.0234375, 21.25439453125, 22.4853515625, 23.71630859375, 24.947265625, 26.17822265625, 27.4091796875, 28.64013671875, 29.87109375, 31.10205078125, 32.3330078125, 33.56396484375, 34.794921875, 36.02587890625, 37.2568359375, 38.48779296875, 39.71875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 1.0, 6.0, 4.0, 6.0, 26.0, 32.0, 42.0, 58.0, 92.0, 123.0, 216.0, 347.0, 567.0, 852.0, 1347.0, 2286.0, 3684.0, 6174.0, 10486.0, 18001.0, 31370.0, 55237.0, 97262.0, 161436.0, 212436.0, 180240.0, 113248.0, 64446.0, 36831.0, 20963.0, 12333.0, 7303.0, 4263.0, 2594.0, 1619.0, 942.0, 595.0, 387.0, 248.0, 172.0, 89.0, 69.0, 44.0, 40.0, 19.0, 14.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-94.9375, -91.9365234375, -88.935546875, -85.9345703125, -82.93359375, -79.9326171875, -76.931640625, -73.9306640625, -70.9296875, -67.9287109375, -64.927734375, -61.9267578125, -58.92578125, -55.9248046875, -52.923828125, -49.9228515625, -46.921875, -43.9208984375, -40.919921875, -37.9189453125, -34.91796875, -31.9169921875, -28.916015625, -25.9150390625, -22.9140625, -19.9130859375, -16.912109375, -13.9111328125, -10.91015625, -7.9091796875, -4.908203125, -1.9072265625, 1.09375, 4.0947265625, 7.095703125, 10.0966796875, 13.09765625, 16.0986328125, 19.099609375, 22.1005859375, 25.1015625, 28.1025390625, 31.103515625, 34.1044921875, 37.10546875, 40.1064453125, 43.107421875, 46.1083984375, 49.109375, 52.1103515625, 55.111328125, 58.1123046875, 61.11328125, 64.1142578125, 67.115234375, 70.1162109375, 73.1171875, 76.1181640625, 79.119140625, 82.1201171875, 85.12109375, 88.1220703125, 91.123046875, 94.1240234375, 97.125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 3.0, 7.0, 5.0, 6.0, 7.0, 14.0, 14.0, 11.0, 16.0, 19.0, 21.0, 30.0, 20.0, 35.0, 30.0, 39.0, 37.0, 28.0, 39.0, 33.0, 35.0, 52.0, 37.0, 26.0, 44.0, 36.0, 43.0, 31.0, 32.0, 19.0, 21.0, 36.0, 17.0, 24.0, 23.0, 18.0, 21.0, 22.0, 11.0, 5.0, 7.0, 7.0, 8.0, 0.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.484375, -27.574462890625, -26.66455078125, -25.754638671875, -24.8447265625, -23.934814453125, -23.02490234375, -22.114990234375, -21.205078125, -20.295166015625, -19.38525390625, -18.475341796875, -17.5654296875, -16.655517578125, -15.74560546875, -14.835693359375, -13.92578125, -13.015869140625, -12.10595703125, -11.196044921875, -10.2861328125, -9.376220703125, -8.46630859375, -7.556396484375, -6.646484375, -5.736572265625, -4.82666015625, -3.916748046875, -3.0068359375, -2.096923828125, -1.18701171875, -0.277099609375, 0.6328125, 1.542724609375, 2.45263671875, 3.362548828125, 4.2724609375, 5.182373046875, 6.09228515625, 7.002197265625, 7.912109375, 8.822021484375, 9.73193359375, 10.641845703125, 11.5517578125, 12.461669921875, 13.37158203125, 14.281494140625, 15.19140625, 16.101318359375, 17.01123046875, 17.921142578125, 18.8310546875, 19.740966796875, 20.65087890625, 21.560791015625, 22.470703125, 23.380615234375, 24.29052734375, 25.200439453125, 26.1103515625, 27.020263671875, 27.93017578125, 28.840087890625, 29.75]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 5.0, 10.0, 27.0, 24.0, 38.0, 32.0, 61.0, 118.0, 151.0, 231.0, 337.0, 518.0, 790.0, 1360.0, 2033.0, 3538.0, 6297.0, 11463.0, 22830.0, 47217.0, 102316.0, 209058.0, 281411.0, 185647.0, 88017.0, 40878.0, 20021.0, 10212.0, 5461.0, 3195.0, 1902.0, 1171.0, 736.0, 472.0, 333.0, 203.0, 136.0, 97.0, 62.0, 42.0, 32.0, 30.0, 8.0, 14.0, 6.0, 8.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-55.0, -53.4013671875, -51.802734375, -50.2041015625, -48.60546875, -47.0068359375, -45.408203125, -43.8095703125, -42.2109375, -40.6123046875, -39.013671875, -37.4150390625, -35.81640625, -34.2177734375, -32.619140625, -31.0205078125, -29.421875, -27.8232421875, -26.224609375, -24.6259765625, -23.02734375, -21.4287109375, -19.830078125, -18.2314453125, -16.6328125, -15.0341796875, -13.435546875, -11.8369140625, -10.23828125, -8.6396484375, -7.041015625, -5.4423828125, -3.84375, -2.2451171875, -0.646484375, 0.9521484375, 2.55078125, 4.1494140625, 5.748046875, 7.3466796875, 8.9453125, 10.5439453125, 12.142578125, 13.7412109375, 15.33984375, 16.9384765625, 18.537109375, 20.1357421875, 21.734375, 23.3330078125, 24.931640625, 26.5302734375, 28.12890625, 29.7275390625, 31.326171875, 32.9248046875, 34.5234375, 36.1220703125, 37.720703125, 39.3193359375, 40.91796875, 42.5166015625, 44.115234375, 45.7138671875, 47.3125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 4.0, 3.0, 13.0, 11.0, 14.0, 14.0, 18.0, 27.0, 27.0, 31.0, 36.0, 48.0, 51.0, 56.0, 61.0, 69.0, 61.0, 73.0, 60.0, 62.0, 37.0, 43.0, 37.0, 27.0, 26.0, 13.0, 12.0, 17.0, 11.0, 9.0, 4.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.003437042236328125, -0.0033233165740966797, -0.0032095909118652344, -0.003095865249633789, -0.0029821395874023438, -0.0028684139251708984, -0.002754688262939453, -0.002640962600708008, -0.0025272369384765625, -0.002413511276245117, -0.002299785614013672, -0.0021860599517822266, -0.0020723342895507812, -0.001958608627319336, -0.0018448829650878906, -0.0017311573028564453, -0.001617431640625, -0.0015037059783935547, -0.0013899803161621094, -0.001276254653930664, -0.0011625289916992188, -0.0010488033294677734, -0.0009350776672363281, -0.0008213520050048828, -0.0007076263427734375, -0.0005939006805419922, -0.0004801750183105469, -0.00036644935607910156, -0.00025272369384765625, -0.00013899803161621094, -2.5272369384765625e-05, 8.845329284667969e-05, 0.000202178955078125, 0.0003159046173095703, 0.0004296302795410156, 0.0005433559417724609, 0.0006570816040039062, 0.0007708072662353516, 0.0008845329284667969, 0.0009982585906982422, 0.0011119842529296875, 0.0012257099151611328, 0.0013394355773925781, 0.0014531612396240234, 0.0015668869018554688, 0.001680612564086914, 0.0017943382263183594, 0.0019080638885498047, 0.00202178955078125, 0.0021355152130126953, 0.0022492408752441406, 0.002362966537475586, 0.0024766921997070312, 0.0025904178619384766, 0.002704143524169922, 0.002817869186401367, 0.0029315948486328125, 0.003045320510864258, 0.003159046173095703, 0.0032727718353271484, 0.0033864974975585938, 0.003500223159790039, 0.0036139488220214844, 0.0037276744842529297, 0.003841400146484375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 11.0, 10.0, 11.0, 10.0, 22.0, 26.0, 37.0, 50.0, 86.0, 92.0, 177.0, 263.0, 441.0, 677.0, 991.0, 1523.0, 2475.0, 4184.0, 6557.0, 11163.0, 18536.0, 31886.0, 55422.0, 95045.0, 148518.0, 189540.0, 175980.0, 123741.0, 74909.0, 42997.0, 25166.0, 14805.0, 8858.0, 5342.0, 3251.0, 2080.0, 1289.0, 830.0, 537.0, 327.0, 213.0, 151.0, 95.0, 68.0, 53.0, 31.0, 23.0, 26.0, 12.0, 11.0, 4.0, 1.0, 6.0, 4.0, 1.0, 1.0, 2.0], "bins": [-48.78125, -47.29296875, -45.8046875, -44.31640625, -42.828125, -41.33984375, -39.8515625, -38.36328125, -36.875, -35.38671875, -33.8984375, -32.41015625, -30.921875, -29.43359375, -27.9453125, -26.45703125, -24.96875, -23.48046875, -21.9921875, -20.50390625, -19.015625, -17.52734375, -16.0390625, -14.55078125, -13.0625, -11.57421875, -10.0859375, -8.59765625, -7.109375, -5.62109375, -4.1328125, -2.64453125, -1.15625, 0.33203125, 1.8203125, 3.30859375, 4.796875, 6.28515625, 7.7734375, 9.26171875, 10.75, 12.23828125, 13.7265625, 15.21484375, 16.703125, 18.19140625, 19.6796875, 21.16796875, 22.65625, 24.14453125, 25.6328125, 27.12109375, 28.609375, 30.09765625, 31.5859375, 33.07421875, 34.5625, 36.05078125, 37.5390625, 39.02734375, 40.515625, 42.00390625, 43.4921875, 44.98046875, 46.46875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 1.0, 6.0, 10.0, 4.0, 5.0, 9.0, 9.0, 11.0, 20.0, 22.0, 24.0, 30.0, 38.0, 32.0, 43.0, 54.0, 44.0, 54.0, 48.0, 57.0, 45.0, 51.0, 48.0, 57.0, 32.0, 41.0, 50.0, 18.0, 30.0, 21.0, 10.0, 15.0, 12.0, 8.0, 11.0, 7.0, 5.0, 7.0, 3.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-18.03125, -17.527099609375, -17.02294921875, -16.518798828125, -16.0146484375, -15.510498046875, -15.00634765625, -14.502197265625, -13.998046875, -13.493896484375, -12.98974609375, -12.485595703125, -11.9814453125, -11.477294921875, -10.97314453125, -10.468994140625, -9.96484375, -9.460693359375, -8.95654296875, -8.452392578125, -7.9482421875, -7.444091796875, -6.93994140625, -6.435791015625, -5.931640625, -5.427490234375, -4.92333984375, -4.419189453125, -3.9150390625, -3.410888671875, -2.90673828125, -2.402587890625, -1.8984375, -1.394287109375, -0.89013671875, -0.385986328125, 0.1181640625, 0.622314453125, 1.12646484375, 1.630615234375, 2.134765625, 2.638916015625, 3.14306640625, 3.647216796875, 4.1513671875, 4.655517578125, 5.15966796875, 5.663818359375, 6.16796875, 6.672119140625, 7.17626953125, 7.680419921875, 8.1845703125, 8.688720703125, 9.19287109375, 9.697021484375, 10.201171875, 10.705322265625, 11.20947265625, 11.713623046875, 12.2177734375, 12.721923828125, 13.22607421875, 13.730224609375, 14.234375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 5.0, 6.0, 4.0, 6.0, 4.0, 6.0, 15.0, 8.0, 16.0, 21.0, 23.0, 30.0, 32.0, 25.0, 37.0, 46.0, 44.0, 40.0, 44.0, 43.0, 40.0, 39.0, 50.0, 40.0, 48.0, 45.0, 30.0, 32.0, 39.0, 34.0, 27.0, 15.0, 22.0, 16.0, 13.0, 18.0, 11.0, 9.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.12483596801758, -44.69575500488281, -43.26667785644531, -41.83759689331055, -40.40851593017578, -38.979434967041016, -37.55035400390625, -36.12127685546875, -34.692195892333984, -33.26311492919922, -31.834035873413086, -30.404956817626953, -28.975875854492188, -27.546794891357422, -26.11771583557129, -24.688636779785156, -23.25955581665039, -21.830474853515625, -20.401395797729492, -18.97231674194336, -17.543235778808594, -16.114154815673828, -14.685075759887695, -13.255995750427246, -11.826915740966797, -10.397835731506348, -8.968755722045898, -7.539675712585449, -6.110595703125, -4.681515693664551, -3.2524356842041016, -1.8233556747436523, -0.3942756652832031, 1.034804344177246, 2.4638843536376953, 3.8929643630981445, 5.322044372558594, 6.751124382019043, 8.180204391479492, 9.609284400939941, 11.03836441040039, 12.46744441986084, 13.896524429321289, 15.325604438781738, 16.754684448242188, 18.183765411376953, 19.612844467163086, 21.04192352294922, 22.471004486083984, 23.90008544921875, 25.329164505004883, 26.758243560791016, 28.18732452392578, 29.616405487060547, 31.04548454284668, 32.47456359863281, 33.90364456176758, 35.332725524902344, 36.761802673339844, 38.19088363647461, 39.619964599609375, 41.04904556274414, 42.478126525878906, 43.907203674316406, 45.33628463745117]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 8.0, 6.0, 7.0, 6.0, 9.0, 7.0, 17.0, 17.0, 25.0, 18.0, 18.0, 32.0, 28.0, 32.0, 32.0, 23.0, 33.0, 49.0, 42.0, 53.0, 40.0, 43.0, 49.0, 38.0, 48.0, 39.0, 36.0, 31.0, 32.0, 30.0, 28.0, 26.0, 16.0, 16.0, 16.0, 9.0, 14.0, 12.0, 14.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-46.6157341003418, -45.24986267089844, -43.883995056152344, -42.518123626708984, -41.15225601196289, -39.78638458251953, -38.42051696777344, -37.05464553833008, -35.68877410888672, -34.32290267944336, -32.957035064697266, -31.591163635253906, -30.225296020507812, -28.859424591064453, -27.493555068969727, -26.127685546875, -24.761817932128906, -23.39594841003418, -22.030078887939453, -20.664207458496094, -19.29833984375, -17.93246841430664, -16.566598892211914, -15.200729370117188, -13.834859848022461, -12.468990325927734, -11.103120803833008, -9.737250328063965, -8.371380805969238, -7.005511283874512, -5.639640808105469, -4.273771286010742, -2.9079017639160156, -1.54203200340271, -0.1761622428894043, 1.1897077560424805, 2.555577278137207, 3.9214468002319336, 5.287317276000977, 6.653186798095703, 8.01905632019043, 9.384925842285156, 10.750795364379883, 12.116665840148926, 13.482535362243652, 14.848404884338379, 16.214275360107422, 17.58014488220215, 18.946014404296875, 20.3118839263916, 21.677753448486328, 23.043624877929688, 24.40949249267578, 25.77536392211914, 27.141233444213867, 28.507102966308594, 29.87297248840332, 31.238842010498047, 32.604713439941406, 33.9705810546875, 35.33645248413086, 36.70232009887695, 38.06819152832031, 39.434059143066406, 40.799930572509766]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 15.0, 21.0, 25.0, 33.0, 71.0, 119.0, 151.0, 267.0, 400.0, 661.0, 950.0, 1601.0, 2401.0, 3778.0, 5804.0, 8618.0, 12979.0, 18839.0, 26613.0, 36642.0, 48376.0, 61852.0, 75271.0, 87101.0, 95008.0, 97186.0, 93409.0, 85003.0, 71995.0, 58255.0, 45051.0, 33737.0, 24487.0, 17353.0, 11813.0, 7891.0, 5201.0, 3439.0, 2224.0, 1404.0, 919.0, 612.0, 362.0, 228.0, 155.0, 83.0, 60.0, 41.0, 21.0, 14.0, 9.0, 10.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-32.15625, -31.1630859375, -30.169921875, -29.1767578125, -28.18359375, -27.1904296875, -26.197265625, -25.2041015625, -24.2109375, -23.2177734375, -22.224609375, -21.2314453125, -20.23828125, -19.2451171875, -18.251953125, -17.2587890625, -16.265625, -15.2724609375, -14.279296875, -13.2861328125, -12.29296875, -11.2998046875, -10.306640625, -9.3134765625, -8.3203125, -7.3271484375, -6.333984375, -5.3408203125, -4.34765625, -3.3544921875, -2.361328125, -1.3681640625, -0.375, 0.6181640625, 1.611328125, 2.6044921875, 3.59765625, 4.5908203125, 5.583984375, 6.5771484375, 7.5703125, 8.5634765625, 9.556640625, 10.5498046875, 11.54296875, 12.5361328125, 13.529296875, 14.5224609375, 15.515625, 16.5087890625, 17.501953125, 18.4951171875, 19.48828125, 20.4814453125, 21.474609375, 22.4677734375, 23.4609375, 24.4541015625, 25.447265625, 26.4404296875, 27.43359375, 28.4267578125, 29.419921875, 30.4130859375, 31.40625]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 4.0, 3.0, 8.0, 11.0, 13.0, 12.0, 17.0, 17.0, 20.0, 20.0, 23.0, 24.0, 27.0, 29.0, 28.0, 14.0, 45.0, 40.0, 44.0, 51.0, 46.0, 37.0, 43.0, 49.0, 43.0, 35.0, 29.0, 30.0, 36.0, 32.0, 18.0, 32.0, 23.0, 19.0, 14.0, 10.0, 12.0, 8.0, 7.0, 13.0, 4.0, 9.0, 2.0, 9.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.28125, -43.9560546875, -42.630859375, -41.3056640625, -39.98046875, -38.6552734375, -37.330078125, -36.0048828125, -34.6796875, -33.3544921875, -32.029296875, -30.7041015625, -29.37890625, -28.0537109375, -26.728515625, -25.4033203125, -24.078125, -22.7529296875, -21.427734375, -20.1025390625, -18.77734375, -17.4521484375, -16.126953125, -14.8017578125, -13.4765625, -12.1513671875, -10.826171875, -9.5009765625, -8.17578125, -6.8505859375, -5.525390625, -4.2001953125, -2.875, -1.5498046875, -0.224609375, 1.1005859375, 2.42578125, 3.7509765625, 5.076171875, 6.4013671875, 7.7265625, 9.0517578125, 10.376953125, 11.7021484375, 13.02734375, 14.3525390625, 15.677734375, 17.0029296875, 18.328125, 19.6533203125, 20.978515625, 22.3037109375, 23.62890625, 24.9541015625, 26.279296875, 27.6044921875, 28.9296875, 30.2548828125, 31.580078125, 32.9052734375, 34.23046875, 35.5556640625, 36.880859375, 38.2060546875, 39.53125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 4.0, 8.0, 17.0, 27.0, 38.0, 69.0, 96.0, 151.0, 250.0, 378.0, 654.0, 959.0, 1404.0, 2202.0, 3226.0, 4831.0, 7241.0, 10437.0, 14701.0, 20613.0, 28701.0, 38952.0, 50582.0, 63513.0, 76727.0, 87438.0, 93176.0, 95148.0, 90099.0, 80182.0, 68313.0, 55750.0, 42941.0, 32448.0, 23769.0, 16874.0, 11871.0, 8281.0, 5417.0, 3740.0, 2533.0, 1695.0, 1125.0, 708.0, 442.0, 343.0, 198.0, 120.0, 65.0, 41.0, 27.0, 13.0, 10.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-34.59375, -33.44775390625, -32.3017578125, -31.15576171875, -30.009765625, -28.86376953125, -27.7177734375, -26.57177734375, -25.42578125, -24.27978515625, -23.1337890625, -21.98779296875, -20.841796875, -19.69580078125, -18.5498046875, -17.40380859375, -16.2578125, -15.11181640625, -13.9658203125, -12.81982421875, -11.673828125, -10.52783203125, -9.3818359375, -8.23583984375, -7.08984375, -5.94384765625, -4.7978515625, -3.65185546875, -2.505859375, -1.35986328125, -0.2138671875, 0.93212890625, 2.078125, 3.22412109375, 4.3701171875, 5.51611328125, 6.662109375, 7.80810546875, 8.9541015625, 10.10009765625, 11.24609375, 12.39208984375, 13.5380859375, 14.68408203125, 15.830078125, 16.97607421875, 18.1220703125, 19.26806640625, 20.4140625, 21.56005859375, 22.7060546875, 23.85205078125, 24.998046875, 26.14404296875, 27.2900390625, 28.43603515625, 29.58203125, 30.72802734375, 31.8740234375, 33.02001953125, 34.166015625, 35.31201171875, 36.4580078125, 37.60400390625, 38.75]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 8.0, 2.0, 7.0, 3.0, 13.0, 9.0, 8.0, 16.0, 13.0, 22.0, 22.0, 21.0, 24.0, 28.0, 30.0, 30.0, 35.0, 46.0, 40.0, 25.0, 29.0, 50.0, 51.0, 44.0, 53.0, 31.0, 39.0, 33.0, 46.0, 24.0, 24.0, 22.0, 24.0, 24.0, 22.0, 18.0, 15.0, 14.0, 6.0, 9.0, 7.0, 4.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0], "bins": [-33.375, -32.478271484375, -31.58154296875, -30.684814453125, -29.7880859375, -28.891357421875, -27.99462890625, -27.097900390625, -26.201171875, -25.304443359375, -24.40771484375, -23.510986328125, -22.6142578125, -21.717529296875, -20.82080078125, -19.924072265625, -19.02734375, -18.130615234375, -17.23388671875, -16.337158203125, -15.4404296875, -14.543701171875, -13.64697265625, -12.750244140625, -11.853515625, -10.956787109375, -10.06005859375, -9.163330078125, -8.2666015625, -7.369873046875, -6.47314453125, -5.576416015625, -4.6796875, -3.782958984375, -2.88623046875, -1.989501953125, -1.0927734375, -0.196044921875, 0.70068359375, 1.597412109375, 2.494140625, 3.390869140625, 4.28759765625, 5.184326171875, 6.0810546875, 6.977783203125, 7.87451171875, 8.771240234375, 9.66796875, 10.564697265625, 11.46142578125, 12.358154296875, 13.2548828125, 14.151611328125, 15.04833984375, 15.945068359375, 16.841796875, 17.738525390625, 18.63525390625, 19.531982421875, 20.4287109375, 21.325439453125, 22.22216796875, 23.118896484375, 24.015625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 4.0, 5.0, 13.0, 17.0, 26.0, 34.0, 72.0, 104.0, 171.0, 256.0, 342.0, 541.0, 827.0, 1351.0, 2034.0, 3337.0, 5252.0, 8327.0, 13072.0, 20199.0, 31060.0, 45747.0, 65613.0, 87161.0, 107070.0, 120321.0, 120986.0, 110523.0, 90793.0, 69289.0, 49288.0, 33620.0, 22026.0, 14302.0, 9084.0, 5814.0, 3587.0, 2284.0, 1483.0, 926.0, 551.0, 353.0, 241.0, 140.0, 104.0, 68.0, 46.0, 35.0, 24.0, 16.0, 10.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-13.3203125, -12.9052734375, -12.490234375, -12.0751953125, -11.66015625, -11.2451171875, -10.830078125, -10.4150390625, -10.0, -9.5849609375, -9.169921875, -8.7548828125, -8.33984375, -7.9248046875, -7.509765625, -7.0947265625, -6.6796875, -6.2646484375, -5.849609375, -5.4345703125, -5.01953125, -4.6044921875, -4.189453125, -3.7744140625, -3.359375, -2.9443359375, -2.529296875, -2.1142578125, -1.69921875, -1.2841796875, -0.869140625, -0.4541015625, -0.0390625, 0.3759765625, 0.791015625, 1.2060546875, 1.62109375, 2.0361328125, 2.451171875, 2.8662109375, 3.28125, 3.6962890625, 4.111328125, 4.5263671875, 4.94140625, 5.3564453125, 5.771484375, 6.1865234375, 6.6015625, 7.0166015625, 7.431640625, 7.8466796875, 8.26171875, 8.6767578125, 9.091796875, 9.5068359375, 9.921875, 10.3369140625, 10.751953125, 11.1669921875, 11.58203125, 11.9970703125, 12.412109375, 12.8271484375, 13.2421875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 3.0, 11.0, 5.0, 6.0, 11.0, 12.0, 26.0, 23.0, 36.0, 38.0, 43.0, 50.0, 52.0, 52.0, 63.0, 63.0, 63.0, 70.0, 51.0, 59.0, 51.0, 39.0, 30.0, 35.0, 17.0, 18.0, 14.0, 16.0, 9.0, 7.0, 8.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020351409912109375, -0.0019670426845550537, -0.00189894437789917, -0.0018308460712432861, -0.0017627477645874023, -0.0016946494579315186, -0.0016265511512756348, -0.001558452844619751, -0.0014903545379638672, -0.0014222562313079834, -0.0013541579246520996, -0.0012860596179962158, -0.001217961311340332, -0.0011498630046844482, -0.0010817646980285645, -0.0010136663913726807, -0.0009455680847167969, -0.0008774697780609131, -0.0008093714714050293, -0.0007412731647491455, -0.0006731748580932617, -0.0006050765514373779, -0.0005369782447814941, -0.00046887993812561035, -0.00040078163146972656, -0.0003326833248138428, -0.000264585018157959, -0.0001964867115020752, -0.0001283884048461914, -6.029009819030762e-05, 7.808208465576172e-06, 7.590651512145996e-05, 0.00014400482177734375, 0.00021210312843322754, 0.00028020143508911133, 0.0003482997417449951, 0.0004163980484008789, 0.0004844963550567627, 0.0005525946617126465, 0.0006206929683685303, 0.0006887912750244141, 0.0007568895816802979, 0.0008249878883361816, 0.0008930861949920654, 0.0009611845016479492, 0.001029282808303833, 0.0010973811149597168, 0.0011654794216156006, 0.0012335777282714844, 0.0013016760349273682, 0.001369774341583252, 0.0014378726482391357, 0.0015059709548950195, 0.0015740692615509033, 0.0016421675682067871, 0.001710265874862671, 0.0017783641815185547, 0.0018464624881744385, 0.0019145607948303223, 0.001982659101486206, 0.00205075740814209, 0.0021188557147979736, 0.0021869540214538574, 0.002255052328109741, 0.002323150634765625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 7.0, 7.0, 7.0, 12.0, 17.0, 23.0, 46.0, 61.0, 108.0, 140.0, 240.0, 346.0, 508.0, 862.0, 1320.0, 2022.0, 3352.0, 5280.0, 8755.0, 13878.0, 21283.0, 32484.0, 48107.0, 66730.0, 87568.0, 107845.0, 119170.0, 119452.0, 107581.0, 89966.0, 68389.0, 49154.0, 33283.0, 22209.0, 14162.0, 9043.0, 5683.0, 3449.0, 2197.0, 1361.0, 878.0, 561.0, 352.0, 203.0, 159.0, 113.0, 77.0, 34.0, 36.0, 14.0, 13.0, 11.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-13.3671875, -12.949951171875, -12.53271484375, -12.115478515625, -11.6982421875, -11.281005859375, -10.86376953125, -10.446533203125, -10.029296875, -9.612060546875, -9.19482421875, -8.777587890625, -8.3603515625, -7.943115234375, -7.52587890625, -7.108642578125, -6.69140625, -6.274169921875, -5.85693359375, -5.439697265625, -5.0224609375, -4.605224609375, -4.18798828125, -3.770751953125, -3.353515625, -2.936279296875, -2.51904296875, -2.101806640625, -1.6845703125, -1.267333984375, -0.85009765625, -0.432861328125, -0.015625, 0.401611328125, 0.81884765625, 1.236083984375, 1.6533203125, 2.070556640625, 2.48779296875, 2.905029296875, 3.322265625, 3.739501953125, 4.15673828125, 4.573974609375, 4.9912109375, 5.408447265625, 5.82568359375, 6.242919921875, 6.66015625, 7.077392578125, 7.49462890625, 7.911865234375, 8.3291015625, 8.746337890625, 9.16357421875, 9.580810546875, 9.998046875, 10.415283203125, 10.83251953125, 11.249755859375, 11.6669921875, 12.084228515625, 12.50146484375, 12.918701171875, 13.3359375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 5.0, 5.0, 7.0, 6.0, 8.0, 11.0, 11.0, 16.0, 22.0, 23.0, 15.0, 27.0, 34.0, 40.0, 51.0, 50.0, 44.0, 60.0, 53.0, 47.0, 56.0, 58.0, 42.0, 42.0, 38.0, 43.0, 30.0, 25.0, 22.0, 17.0, 19.0, 9.0, 15.0, 15.0, 12.0, 9.0, 5.0, 3.0, 7.0, 3.0, 1.0, 1.0, 0.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2109375, -6.01531982421875, -5.8197021484375, -5.62408447265625, -5.428466796875, -5.23284912109375, -5.0372314453125, -4.84161376953125, -4.64599609375, -4.45037841796875, -4.2547607421875, -4.05914306640625, -3.863525390625, -3.66790771484375, -3.4722900390625, -3.27667236328125, -3.0810546875, -2.88543701171875, -2.6898193359375, -2.49420166015625, -2.298583984375, -2.10296630859375, -1.9073486328125, -1.71173095703125, -1.51611328125, -1.32049560546875, -1.1248779296875, -0.92926025390625, -0.733642578125, -0.53802490234375, -0.3424072265625, -0.14678955078125, 0.048828125, 0.24444580078125, 0.4400634765625, 0.63568115234375, 0.831298828125, 1.02691650390625, 1.2225341796875, 1.41815185546875, 1.61376953125, 1.80938720703125, 2.0050048828125, 2.20062255859375, 2.396240234375, 2.59185791015625, 2.7874755859375, 2.98309326171875, 3.1787109375, 3.37432861328125, 3.5699462890625, 3.76556396484375, 3.961181640625, 4.15679931640625, 4.3524169921875, 4.54803466796875, 4.74365234375, 4.93927001953125, 5.1348876953125, 5.33050537109375, 5.526123046875, 5.72174072265625, 5.9173583984375, 6.11297607421875, 6.30859375]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 5.0, 2.0, 7.0, 8.0, 6.0, 8.0, 12.0, 16.0, 18.0, 22.0, 20.0, 29.0, 29.0, 29.0, 34.0, 37.0, 31.0, 47.0, 42.0, 47.0, 36.0, 40.0, 39.0, 44.0, 50.0, 38.0, 35.0, 38.0, 36.0, 27.0, 27.0, 28.0, 22.0, 15.0, 8.0, 11.0, 5.0, 11.0, 13.0, 5.0, 10.0, 6.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.402565002441406, -40.03293991088867, -38.66331481933594, -37.29368591308594, -35.9240608215332, -34.55443572998047, -33.18480682373047, -31.815181732177734, -30.445556640625, -29.075931549072266, -27.7063045501709, -26.33667755126953, -24.967052459716797, -23.597427368164062, -22.227800369262695, -20.858173370361328, -19.488548278808594, -18.11892318725586, -16.749296188354492, -15.379670143127441, -14.01004409790039, -12.64041805267334, -11.270792007446289, -9.901165962219238, -8.531539916992188, -7.161913871765137, -5.792287826538086, -4.422661781311035, -3.0530357360839844, -1.6834096908569336, -0.3137836456298828, 1.055842399597168, 2.4254684448242188, 3.7950944900512695, 5.16472053527832, 6.534346580505371, 7.903972625732422, 9.273598670959473, 10.643224716186523, 12.012850761413574, 13.382476806640625, 14.752102851867676, 16.121728897094727, 17.491355895996094, 18.860980987548828, 20.230606079101562, 21.60023307800293, 22.969860076904297, 24.33948516845703, 25.709110260009766, 27.078737258911133, 28.4483642578125, 29.817989349365234, 31.18761444091797, 32.55724334716797, 33.9268684387207, 35.29649353027344, 36.66611862182617, 38.035743713378906, 39.405372619628906, 40.77499771118164, 42.144622802734375, 43.514251708984375, 44.88387680053711, 46.253501892089844]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 6.0, 4.0, 8.0, 9.0, 12.0, 5.0, 8.0, 13.0, 15.0, 18.0, 28.0, 24.0, 21.0, 25.0, 26.0, 35.0, 32.0, 29.0, 29.0, 42.0, 33.0, 38.0, 35.0, 36.0, 45.0, 31.0, 41.0, 26.0, 37.0, 47.0, 24.0, 20.0, 16.0, 22.0, 17.0, 25.0, 24.0, 14.0, 20.0, 21.0, 12.0, 16.0, 8.0, 3.0, 3.0, 1.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-38.50913619995117, -37.23678207397461, -35.96442794799805, -34.69207763671875, -33.41972351074219, -32.147369384765625, -30.875015258789062, -29.6026611328125, -28.33030891418457, -27.057954788208008, -25.785602569580078, -24.513248443603516, -23.240894317626953, -21.968542098999023, -20.69618797302246, -19.42383575439453, -18.15148162841797, -16.879127502441406, -15.606775283813477, -14.334421157836914, -13.062067985534668, -11.789714813232422, -10.51736068725586, -9.245007514953613, -7.972654342651367, -6.700301170349121, -5.427947521209717, -4.1555938720703125, -2.8832406997680664, -1.6108875274658203, -0.338533878326416, 0.9338197708129883, 2.2061729431152344, 3.4785263538360596, 4.750879764556885, 6.023233413696289, 7.295586585998535, 8.567939758300781, 9.840293884277344, 11.11264705657959, 12.385000228881836, 13.657353401184082, 14.929706573486328, 16.20206069946289, 17.474414825439453, 18.746767044067383, 20.019121170043945, 21.291473388671875, 22.563827514648438, 23.836181640625, 25.10853385925293, 26.380887985229492, 27.653240203857422, 28.925594329833984, 30.197948455810547, 31.47030258178711, 32.742652893066406, 34.01500701904297, 35.28736114501953, 36.55971145629883, 37.83206558227539, 39.10441970825195, 40.376773834228516, 41.64912796020508, 42.92148208618164]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 9.0, 10.0, 20.0, 33.0, 43.0, 70.0, 136.0, 218.0, 370.0, 646.0, 1143.0, 1959.0, 3337.0, 5799.0, 9902.0, 16897.0, 29108.0, 50645.0, 88685.0, 153649.0, 266462.0, 440401.0, 644543.0, 748397.0, 649137.0, 446081.0, 269300.0, 155793.0, 89312.0, 51183.0, 29522.0, 17052.0, 9918.0, 5848.0, 3527.0, 2072.0, 1250.0, 725.0, 427.0, 269.0, 166.0, 83.0, 48.0, 29.0, 21.0, 16.0, 12.0, 5.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.21875, -44.751953125, -43.28515625, -41.818359375, -40.3515625, -38.884765625, -37.41796875, -35.951171875, -34.484375, -33.017578125, -31.55078125, -30.083984375, -28.6171875, -27.150390625, -25.68359375, -24.216796875, -22.75, -21.283203125, -19.81640625, -18.349609375, -16.8828125, -15.416015625, -13.94921875, -12.482421875, -11.015625, -9.548828125, -8.08203125, -6.615234375, -5.1484375, -3.681640625, -2.21484375, -0.748046875, 0.71875, 2.185546875, 3.65234375, 5.119140625, 6.5859375, 8.052734375, 9.51953125, 10.986328125, 12.453125, 13.919921875, 15.38671875, 16.853515625, 18.3203125, 19.787109375, 21.25390625, 22.720703125, 24.1875, 25.654296875, 27.12109375, 28.587890625, 30.0546875, 31.521484375, 32.98828125, 34.455078125, 35.921875, 37.388671875, 38.85546875, 40.322265625, 41.7890625, 43.255859375, 44.72265625, 46.189453125, 47.65625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 7.0, 8.0, 4.0, 9.0, 15.0, 9.0, 15.0, 19.0, 19.0, 26.0, 31.0, 19.0, 33.0, 26.0, 42.0, 25.0, 25.0, 37.0, 28.0, 41.0, 26.0, 45.0, 36.0, 45.0, 34.0, 31.0, 27.0, 31.0, 25.0, 35.0, 30.0, 23.0, 23.0, 21.0, 28.0, 11.0, 21.0, 14.0, 15.0, 13.0, 12.0, 5.0, 3.0, 6.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.984375, -30.938232421875, -29.89208984375, -28.845947265625, -27.7998046875, -26.753662109375, -25.70751953125, -24.661376953125, -23.615234375, -22.569091796875, -21.52294921875, -20.476806640625, -19.4306640625, -18.384521484375, -17.33837890625, -16.292236328125, -15.24609375, -14.199951171875, -13.15380859375, -12.107666015625, -11.0615234375, -10.015380859375, -8.96923828125, -7.923095703125, -6.876953125, -5.830810546875, -4.78466796875, -3.738525390625, -2.6923828125, -1.646240234375, -0.60009765625, 0.446044921875, 1.4921875, 2.538330078125, 3.58447265625, 4.630615234375, 5.6767578125, 6.722900390625, 7.76904296875, 8.815185546875, 9.861328125, 10.907470703125, 11.95361328125, 12.999755859375, 14.0458984375, 15.092041015625, 16.13818359375, 17.184326171875, 18.23046875, 19.276611328125, 20.32275390625, 21.368896484375, 22.4150390625, 23.461181640625, 24.50732421875, 25.553466796875, 26.599609375, 27.645751953125, 28.69189453125, 29.738037109375, 30.7841796875, 31.830322265625, 32.87646484375, 33.922607421875, 34.96875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 6.0, 4.0, 13.0, 26.0, 52.0, 60.0, 95.0, 130.0, 227.0, 392.0, 577.0, 996.0, 1525.0, 2539.0, 4137.0, 6642.0, 10864.0, 17673.0, 28992.0, 46956.0, 74857.0, 120429.0, 187498.0, 283549.0, 405363.0, 532817.0, 597306.0, 555694.0, 438641.0, 311419.0, 209106.0, 134074.0, 84761.0, 52311.0, 32424.0, 20147.0, 12318.0, 7533.0, 4723.0, 2839.0, 1756.0, 1092.0, 680.0, 400.0, 228.0, 145.0, 84.0, 61.0, 51.0, 24.0, 19.0, 11.0, 12.0, 6.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-34.65625, -33.486328125, -32.31640625, -31.146484375, -29.9765625, -28.806640625, -27.63671875, -26.466796875, -25.296875, -24.126953125, -22.95703125, -21.787109375, -20.6171875, -19.447265625, -18.27734375, -17.107421875, -15.9375, -14.767578125, -13.59765625, -12.427734375, -11.2578125, -10.087890625, -8.91796875, -7.748046875, -6.578125, -5.408203125, -4.23828125, -3.068359375, -1.8984375, -0.728515625, 0.44140625, 1.611328125, 2.78125, 3.951171875, 5.12109375, 6.291015625, 7.4609375, 8.630859375, 9.80078125, 10.970703125, 12.140625, 13.310546875, 14.48046875, 15.650390625, 16.8203125, 17.990234375, 19.16015625, 20.330078125, 21.5, 22.669921875, 23.83984375, 25.009765625, 26.1796875, 27.349609375, 28.51953125, 29.689453125, 30.859375, 32.029296875, 33.19921875, 34.369140625, 35.5390625, 36.708984375, 37.87890625, 39.048828125, 40.21875]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 6.0, 1.0, 6.0, 6.0, 2.0, 9.0, 6.0, 16.0, 13.0, 16.0, 20.0, 29.0, 35.0, 44.0, 47.0, 45.0, 68.0, 69.0, 78.0, 98.0, 99.0, 130.0, 138.0, 144.0, 164.0, 172.0, 199.0, 184.0, 209.0, 229.0, 217.0, 186.0, 171.0, 159.0, 155.0, 141.0, 128.0, 101.0, 101.0, 79.0, 65.0, 60.0, 43.0, 51.0, 41.0, 29.0, 12.0, 19.0, 12.0, 8.0, 3.0, 5.0, 3.0, 3.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0], "bins": [-14.9375, -14.4820556640625, -14.026611328125, -13.5711669921875, -13.11572265625, -12.6602783203125, -12.204833984375, -11.7493896484375, -11.2939453125, -10.8385009765625, -10.383056640625, -9.9276123046875, -9.47216796875, -9.0167236328125, -8.561279296875, -8.1058349609375, -7.650390625, -7.1949462890625, -6.739501953125, -6.2840576171875, -5.82861328125, -5.3731689453125, -4.917724609375, -4.4622802734375, -4.0068359375, -3.5513916015625, -3.095947265625, -2.6405029296875, -2.18505859375, -1.7296142578125, -1.274169921875, -0.8187255859375, -0.36328125, 0.0921630859375, 0.547607421875, 1.0030517578125, 1.45849609375, 1.9139404296875, 2.369384765625, 2.8248291015625, 3.2802734375, 3.7357177734375, 4.191162109375, 4.6466064453125, 5.10205078125, 5.5574951171875, 6.012939453125, 6.4683837890625, 6.923828125, 7.3792724609375, 7.834716796875, 8.2901611328125, 8.74560546875, 9.2010498046875, 9.656494140625, 10.1119384765625, 10.5673828125, 11.0228271484375, 11.478271484375, 11.9337158203125, 12.38916015625, 12.8446044921875, 13.300048828125, 13.7554931640625, 14.2109375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 2.0, 6.0, 7.0, 3.0, 9.0, 11.0, 12.0, 14.0, 14.0, 23.0, 16.0, 18.0, 34.0, 41.0, 31.0, 45.0, 44.0, 36.0, 41.0, 38.0, 46.0, 52.0, 51.0, 55.0, 47.0, 36.0, 28.0, 51.0, 23.0, 26.0, 27.0, 24.0, 16.0, 16.0, 8.0, 11.0, 9.0, 8.0, 6.0, 7.0, 7.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.242271423339844, -43.82782745361328, -42.41338348388672, -40.998939514160156, -39.584495544433594, -38.17005157470703, -36.75560760498047, -35.341163635253906, -33.926719665527344, -32.51227569580078, -31.09783172607422, -29.683387756347656, -28.268943786621094, -26.85449981689453, -25.44005584716797, -24.025611877441406, -22.611167907714844, -21.19672393798828, -19.78227996826172, -18.367835998535156, -16.953392028808594, -15.538948059082031, -14.124504089355469, -12.710060119628906, -11.295616149902344, -9.881172180175781, -8.466728210449219, -7.052284240722656, -5.637840270996094, -4.223396301269531, -2.8089523315429688, -1.3945083618164062, 0.01993560791015625, 1.4343795776367188, 2.8488235473632812, 4.263267517089844, 5.677711486816406, 7.092155456542969, 8.506599426269531, 9.921043395996094, 11.335487365722656, 12.749931335449219, 14.164375305175781, 15.578819274902344, 16.993263244628906, 18.40770721435547, 19.82215118408203, 21.236595153808594, 22.651039123535156, 24.06548309326172, 25.47992706298828, 26.894371032714844, 28.308815002441406, 29.72325897216797, 31.13770294189453, 32.552146911621094, 33.966590881347656, 35.38103485107422, 36.79547882080078, 38.209922790527344, 39.624366760253906, 41.03881072998047, 42.45325469970703, 43.867698669433594, 45.282142639160156]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 7.0, 7.0, 9.0, 10.0, 10.0, 12.0, 13.0, 17.0, 21.0, 13.0, 22.0, 30.0, 26.0, 32.0, 39.0, 31.0, 43.0, 54.0, 39.0, 31.0, 39.0, 41.0, 37.0, 46.0, 41.0, 22.0, 30.0, 34.0, 30.0, 38.0, 25.0, 30.0, 18.0, 14.0, 15.0, 19.0, 8.0, 13.0, 5.0, 13.0, 9.0, 8.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.3831672668457, -38.076507568359375, -36.76984405517578, -35.46318054199219, -34.15652084350586, -32.84986114501953, -31.543197631835938, -30.236536026000977, -28.929874420166016, -27.623212814331055, -26.316551208496094, -25.009889602661133, -23.703227996826172, -22.39656639099121, -21.08990478515625, -19.78324317932129, -18.476581573486328, -17.169919967651367, -15.863258361816406, -14.556596755981445, -13.249935150146484, -11.943273544311523, -10.636611938476562, -9.329950332641602, -8.02328872680664, -6.71662712097168, -5.409965515136719, -4.103303909301758, -2.796642303466797, -1.489980697631836, -0.183319091796875, 1.123342514038086, 2.4300003051757812, 3.736661911010742, 5.043323516845703, 6.349985122680664, 7.656646728515625, 8.963308334350586, 10.269969940185547, 11.576631546020508, 12.883293151855469, 14.18995475769043, 15.49661636352539, 16.80327796936035, 18.109939575195312, 19.416601181030273, 20.723262786865234, 22.029924392700195, 23.336585998535156, 24.643247604370117, 25.949909210205078, 27.25657081604004, 28.563232421875, 29.86989402770996, 31.176555633544922, 32.48321533203125, 33.789878845214844, 35.09654235839844, 36.403202056884766, 37.709861755371094, 39.01652526855469, 40.32318878173828, 41.62984848022461, 42.93650817871094, 44.24317169189453]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 10.0, 16.0, 14.0, 23.0, 42.0, 57.0, 131.0, 177.0, 271.0, 433.0, 637.0, 1075.0, 1546.0, 2571.0, 3914.0, 6004.0, 9421.0, 14349.0, 21475.0, 30636.0, 43349.0, 58393.0, 76033.0, 94725.0, 108627.0, 113394.0, 106863.0, 92919.0, 74427.0, 57251.0, 41381.0, 29552.0, 20165.0, 13495.0, 8965.0, 5800.0, 3747.0, 2443.0, 1518.0, 990.0, 659.0, 391.0, 238.0, 180.0, 92.0, 70.0, 39.0, 24.0, 15.0, 4.0, 6.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-55.40625, -53.64404296875, -51.8818359375, -50.11962890625, -48.357421875, -46.59521484375, -44.8330078125, -43.07080078125, -41.30859375, -39.54638671875, -37.7841796875, -36.02197265625, -34.259765625, -32.49755859375, -30.7353515625, -28.97314453125, -27.2109375, -25.44873046875, -23.6865234375, -21.92431640625, -20.162109375, -18.39990234375, -16.6376953125, -14.87548828125, -13.11328125, -11.35107421875, -9.5888671875, -7.82666015625, -6.064453125, -4.30224609375, -2.5400390625, -0.77783203125, 0.984375, 2.74658203125, 4.5087890625, 6.27099609375, 8.033203125, 9.79541015625, 11.5576171875, 13.31982421875, 15.08203125, 16.84423828125, 18.6064453125, 20.36865234375, 22.130859375, 23.89306640625, 25.6552734375, 27.41748046875, 29.1796875, 30.94189453125, 32.7041015625, 34.46630859375, 36.228515625, 37.99072265625, 39.7529296875, 41.51513671875, 43.27734375, 45.03955078125, 46.8017578125, 48.56396484375, 50.326171875, 52.08837890625, 53.8505859375, 55.61279296875, 57.375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 5.0, 7.0, 6.0, 13.0, 13.0, 20.0, 16.0, 31.0, 14.0, 24.0, 28.0, 40.0, 34.0, 29.0, 40.0, 47.0, 32.0, 55.0, 43.0, 32.0, 40.0, 31.0, 39.0, 39.0, 38.0, 35.0, 31.0, 20.0, 35.0, 23.0, 18.0, 19.0, 20.0, 15.0, 17.0, 11.0, 6.0, 12.0, 6.0, 7.0, 6.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.03125, -25.08740234375, -24.1435546875, -23.19970703125, -22.255859375, -21.31201171875, -20.3681640625, -19.42431640625, -18.48046875, -17.53662109375, -16.5927734375, -15.64892578125, -14.705078125, -13.76123046875, -12.8173828125, -11.87353515625, -10.9296875, -9.98583984375, -9.0419921875, -8.09814453125, -7.154296875, -6.21044921875, -5.2666015625, -4.32275390625, -3.37890625, -2.43505859375, -1.4912109375, -0.54736328125, 0.396484375, 1.34033203125, 2.2841796875, 3.22802734375, 4.171875, 5.11572265625, 6.0595703125, 7.00341796875, 7.947265625, 8.89111328125, 9.8349609375, 10.77880859375, 11.72265625, 12.66650390625, 13.6103515625, 14.55419921875, 15.498046875, 16.44189453125, 17.3857421875, 18.32958984375, 19.2734375, 20.21728515625, 21.1611328125, 22.10498046875, 23.048828125, 23.99267578125, 24.9365234375, 25.88037109375, 26.82421875, 27.76806640625, 28.7119140625, 29.65576171875, 30.599609375, 31.54345703125, 32.4873046875, 33.43115234375, 34.375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 11.0, 7.0, 15.0, 22.0, 37.0, 50.0, 79.0, 128.0, 223.0, 292.0, 464.0, 777.0, 1143.0, 1819.0, 2750.0, 4344.0, 6612.0, 10814.0, 16995.0, 26953.0, 42048.0, 64987.0, 97695.0, 137685.0, 164287.0, 148626.0, 110822.0, 74907.0, 48298.0, 31388.0, 19962.0, 12480.0, 7887.0, 4999.0, 3335.0, 1971.0, 1270.0, 844.0, 514.0, 337.0, 235.0, 154.0, 111.0, 61.0, 41.0, 31.0, 19.0, 10.0, 7.0, 7.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-85.8125, -83.013671875, -80.21484375, -77.416015625, -74.6171875, -71.818359375, -69.01953125, -66.220703125, -63.421875, -60.623046875, -57.82421875, -55.025390625, -52.2265625, -49.427734375, -46.62890625, -43.830078125, -41.03125, -38.232421875, -35.43359375, -32.634765625, -29.8359375, -27.037109375, -24.23828125, -21.439453125, -18.640625, -15.841796875, -13.04296875, -10.244140625, -7.4453125, -4.646484375, -1.84765625, 0.951171875, 3.75, 6.548828125, 9.34765625, 12.146484375, 14.9453125, 17.744140625, 20.54296875, 23.341796875, 26.140625, 28.939453125, 31.73828125, 34.537109375, 37.3359375, 40.134765625, 42.93359375, 45.732421875, 48.53125, 51.330078125, 54.12890625, 56.927734375, 59.7265625, 62.525390625, 65.32421875, 68.123046875, 70.921875, 73.720703125, 76.51953125, 79.318359375, 82.1171875, 84.916015625, 87.71484375, 90.513671875, 93.3125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 6.0, 6.0, 4.0, 6.0, 12.0, 9.0, 10.0, 15.0, 23.0, 21.0, 22.0, 31.0, 39.0, 28.0, 27.0, 32.0, 32.0, 43.0, 32.0, 40.0, 36.0, 53.0, 39.0, 34.0, 39.0, 25.0, 45.0, 37.0, 34.0, 37.0, 32.0, 19.0, 33.0, 14.0, 18.0, 14.0, 18.0, 7.0, 6.0, 5.0, 5.0, 2.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.90625, -24.120849609375, -23.33544921875, -22.550048828125, -21.7646484375, -20.979248046875, -20.19384765625, -19.408447265625, -18.623046875, -17.837646484375, -17.05224609375, -16.266845703125, -15.4814453125, -14.696044921875, -13.91064453125, -13.125244140625, -12.33984375, -11.554443359375, -10.76904296875, -9.983642578125, -9.1982421875, -8.412841796875, -7.62744140625, -6.842041015625, -6.056640625, -5.271240234375, -4.48583984375, -3.700439453125, -2.9150390625, -2.129638671875, -1.34423828125, -0.558837890625, 0.2265625, 1.011962890625, 1.79736328125, 2.582763671875, 3.3681640625, 4.153564453125, 4.93896484375, 5.724365234375, 6.509765625, 7.295166015625, 8.08056640625, 8.865966796875, 9.6513671875, 10.436767578125, 11.22216796875, 12.007568359375, 12.79296875, 13.578369140625, 14.36376953125, 15.149169921875, 15.9345703125, 16.719970703125, 17.50537109375, 18.290771484375, 19.076171875, 19.861572265625, 20.64697265625, 21.432373046875, 22.2177734375, 23.003173828125, 23.78857421875, 24.573974609375, 25.359375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 9.0, 3.0, 21.0, 19.0, 31.0, 47.0, 72.0, 116.0, 203.0, 257.0, 406.0, 705.0, 1071.0, 1913.0, 3293.0, 5575.0, 10386.0, 20794.0, 42230.0, 92834.0, 200315.0, 296512.0, 195698.0, 90666.0, 41582.0, 19846.0, 10468.0, 5587.0, 3062.0, 1796.0, 1095.0, 682.0, 417.0, 322.0, 165.0, 126.0, 75.0, 47.0, 36.0, 24.0, 15.0, 12.0, 6.0, 9.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.5, -40.04296875, -38.5859375, -37.12890625, -35.671875, -34.21484375, -32.7578125, -31.30078125, -29.84375, -28.38671875, -26.9296875, -25.47265625, -24.015625, -22.55859375, -21.1015625, -19.64453125, -18.1875, -16.73046875, -15.2734375, -13.81640625, -12.359375, -10.90234375, -9.4453125, -7.98828125, -6.53125, -5.07421875, -3.6171875, -2.16015625, -0.703125, 0.75390625, 2.2109375, 3.66796875, 5.125, 6.58203125, 8.0390625, 9.49609375, 10.953125, 12.41015625, 13.8671875, 15.32421875, 16.78125, 18.23828125, 19.6953125, 21.15234375, 22.609375, 24.06640625, 25.5234375, 26.98046875, 28.4375, 29.89453125, 31.3515625, 32.80859375, 34.265625, 35.72265625, 37.1796875, 38.63671875, 40.09375, 41.55078125, 43.0078125, 44.46484375, 45.921875, 47.37890625, 48.8359375, 50.29296875, 51.75]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 5.0, 0.0, 5.0, 1.0, 4.0, 1.0, 3.0, 3.0, 7.0, 2.0, 6.0, 9.0, 8.0, 12.0, 13.0, 15.0, 19.0, 24.0, 35.0, 44.0, 50.0, 62.0, 51.0, 71.0, 74.0, 71.0, 66.0, 56.0, 48.0, 50.0, 32.0, 34.0, 25.0, 16.0, 20.0, 9.0, 13.0, 6.0, 8.0, 11.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.003421783447265625, -0.003303706645965576, -0.0031856298446655273, -0.0030675530433654785, -0.0029494762420654297, -0.002831399440765381, -0.002713322639465332, -0.002595245838165283, -0.0024771690368652344, -0.0023590922355651855, -0.0022410154342651367, -0.002122938632965088, -0.002004861831665039, -0.0018867850303649902, -0.0017687082290649414, -0.0016506314277648926, -0.0015325546264648438, -0.001414477825164795, -0.001296401023864746, -0.0011783242225646973, -0.0010602474212646484, -0.0009421706199645996, -0.0008240938186645508, -0.000706017017364502, -0.0005879402160644531, -0.0004698634147644043, -0.00035178661346435547, -0.00023370981216430664, -0.00011563301086425781, 2.4437904357910156e-06, 0.00012052059173583984, 0.00023859739303588867, 0.0003566741943359375, 0.00047475099563598633, 0.0005928277969360352, 0.000710904598236084, 0.0008289813995361328, 0.0009470582008361816, 0.0010651350021362305, 0.0011832118034362793, 0.0013012886047363281, 0.001419365406036377, 0.0015374422073364258, 0.0016555190086364746, 0.0017735958099365234, 0.0018916726112365723, 0.002009749412536621, 0.00212782621383667, 0.0022459030151367188, 0.0023639798164367676, 0.0024820566177368164, 0.0026001334190368652, 0.002718210220336914, 0.002836287021636963, 0.0029543638229370117, 0.0030724406242370605, 0.0031905174255371094, 0.003308594226837158, 0.003426671028137207, 0.003544747829437256, 0.0036628246307373047, 0.0037809014320373535, 0.0038989782333374023, 0.004017055034637451, 0.0041351318359375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 11.0, 14.0, 21.0, 15.0, 29.0, 48.0, 80.0, 123.0, 126.0, 183.0, 256.0, 447.0, 644.0, 953.0, 1603.0, 2326.0, 3756.0, 6031.0, 10112.0, 16767.0, 27515.0, 46265.0, 75687.0, 115679.0, 159103.0, 174306.0, 145375.0, 100308.0, 63155.0, 38271.0, 23132.0, 13623.0, 8346.0, 5139.0, 3155.0, 2095.0, 1297.0, 864.0, 540.0, 362.0, 239.0, 158.0, 135.0, 78.0, 69.0, 30.0, 34.0, 23.0, 12.0, 6.0, 6.0, 2.0, 6.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-28.3125, -27.408447265625, -26.50439453125, -25.600341796875, -24.6962890625, -23.792236328125, -22.88818359375, -21.984130859375, -21.080078125, -20.176025390625, -19.27197265625, -18.367919921875, -17.4638671875, -16.559814453125, -15.65576171875, -14.751708984375, -13.84765625, -12.943603515625, -12.03955078125, -11.135498046875, -10.2314453125, -9.327392578125, -8.42333984375, -7.519287109375, -6.615234375, -5.711181640625, -4.80712890625, -3.903076171875, -2.9990234375, -2.094970703125, -1.19091796875, -0.286865234375, 0.6171875, 1.521240234375, 2.42529296875, 3.329345703125, 4.2333984375, 5.137451171875, 6.04150390625, 6.945556640625, 7.849609375, 8.753662109375, 9.65771484375, 10.561767578125, 11.4658203125, 12.369873046875, 13.27392578125, 14.177978515625, 15.08203125, 15.986083984375, 16.89013671875, 17.794189453125, 18.6982421875, 19.602294921875, 20.50634765625, 21.410400390625, 22.314453125, 23.218505859375, 24.12255859375, 25.026611328125, 25.9306640625, 26.834716796875, 27.73876953125, 28.642822265625, 29.546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 5.0, 7.0, 8.0, 8.0, 14.0, 17.0, 9.0, 25.0, 24.0, 19.0, 32.0, 25.0, 24.0, 47.0, 47.0, 40.0, 50.0, 54.0, 60.0, 55.0, 50.0, 48.0, 42.0, 35.0, 37.0, 35.0, 23.0, 25.0, 20.0, 25.0, 22.0, 12.0, 5.0, 11.0, 12.0, 1.0, 6.0, 2.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.6796875, -9.3359375, -8.9921875, -8.6484375, -8.3046875, -7.9609375, -7.6171875, -7.2734375, -6.9296875, -6.5859375, -6.2421875, -5.8984375, -5.5546875, -5.2109375, -4.8671875, -4.5234375, -4.1796875, -3.8359375, -3.4921875, -3.1484375, -2.8046875, -2.4609375, -2.1171875, -1.7734375, -1.4296875, -1.0859375, -0.7421875, -0.3984375, -0.0546875, 0.2890625, 0.6328125, 0.9765625, 1.3203125, 1.6640625, 2.0078125, 2.3515625, 2.6953125, 3.0390625, 3.3828125, 3.7265625, 4.0703125, 4.4140625, 4.7578125, 5.1015625, 5.4453125, 5.7890625, 6.1328125, 6.4765625, 6.8203125, 7.1640625, 7.5078125, 7.8515625, 8.1953125, 8.5390625, 8.8828125, 9.2265625, 9.5703125, 9.9140625, 10.2578125, 10.6015625, 10.9453125, 11.2890625, 11.6328125, 11.9765625, 12.3203125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 1.0, 3.0, 5.0, 4.0, 2.0, 7.0, 14.0, 9.0, 16.0, 22.0, 27.0, 22.0, 24.0, 28.0, 35.0, 31.0, 45.0, 45.0, 34.0, 51.0, 45.0, 36.0, 54.0, 49.0, 46.0, 40.0, 47.0, 35.0, 41.0, 26.0, 23.0, 20.0, 19.0, 14.0, 22.0, 15.0, 8.0, 8.0, 6.0, 6.0, 9.0, 5.0, 0.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-32.449039459228516, -31.454389572143555, -30.459739685058594, -29.465089797973633, -28.470439910888672, -27.475788116455078, -26.481138229370117, -25.486488342285156, -24.491838455200195, -23.497188568115234, -22.502538681030273, -21.507888793945312, -20.51323699951172, -19.51858901977539, -18.523937225341797, -17.529287338256836, -16.534637451171875, -15.539987564086914, -14.545337677001953, -13.550686836242676, -12.556036949157715, -11.561387062072754, -10.566736221313477, -9.572086334228516, -8.577436447143555, -7.582786560058594, -6.588136196136475, -5.5934858322143555, -4.5988359451293945, -3.6041860580444336, -2.6095356941223145, -1.6148853302001953, -0.6202354431152344, 0.37441468238830566, 1.3690648078918457, 2.3637149333953857, 3.358365058898926, 4.353014945983887, 5.347665309906006, 6.342315673828125, 7.336965560913086, 8.331615447998047, 9.326265335083008, 10.320916175842285, 11.315566062927246, 12.310215950012207, 13.304866790771484, 14.299516677856445, 15.294166564941406, 16.288816452026367, 17.283466339111328, 18.27811622619629, 19.27276611328125, 20.267417907714844, 21.262067794799805, 22.256717681884766, 23.251367568969727, 24.246017456054688, 25.24066734313965, 26.23531723022461, 27.229969024658203, 28.22461700439453, 29.219268798828125, 30.213918685913086, 31.208568572998047]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 9.0, 8.0, 14.0, 10.0, 13.0, 13.0, 28.0, 31.0, 35.0, 29.0, 34.0, 42.0, 31.0, 35.0, 48.0, 41.0, 47.0, 37.0, 46.0, 44.0, 38.0, 64.0, 36.0, 30.0, 27.0, 33.0, 25.0, 26.0, 18.0, 14.0, 21.0, 13.0, 15.0, 14.0, 7.0, 5.0, 7.0, 7.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.86933135986328, -29.865570068359375, -28.861806869506836, -27.85804557800293, -26.85428237915039, -25.850521087646484, -24.846759796142578, -23.842998504638672, -22.839235305786133, -21.835474014282227, -20.831710815429688, -19.82794952392578, -18.824188232421875, -17.820425033569336, -16.81666374206543, -15.812901496887207, -14.809139251708984, -13.805377006530762, -12.801614761352539, -11.797853469848633, -10.79409122467041, -9.790328979492188, -8.786567687988281, -7.782805442810059, -6.779043197631836, -5.775280952453613, -4.771519184112549, -3.7677571773529053, -2.7639951705932617, -1.760232925415039, -0.7564711570739746, 0.24729061126708984, 1.2510566711425781, 2.2548186779022217, 3.2585806846618652, 4.26234245300293, 5.266104698181152, 6.269866943359375, 7.2736287117004395, 8.277390480041504, 9.281152725219727, 10.28491497039795, 11.288677215576172, 12.292438507080078, 13.2962007522583, 14.299962997436523, 15.30372428894043, 16.30748748779297, 17.311248779296875, 18.31501007080078, 19.31877326965332, 20.322534561157227, 21.326297760009766, 22.330059051513672, 23.333820343017578, 24.337581634521484, 25.341344833374023, 26.34510612487793, 27.34886932373047, 28.352630615234375, 29.35639190673828, 30.36015510559082, 31.363916397094727, 32.367679595947266, 33.37144088745117]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 9.0, 13.0, 11.0, 19.0, 29.0, 51.0, 82.0, 139.0, 252.0, 378.0, 594.0, 988.0, 1430.0, 2298.0, 3675.0, 5595.0, 8562.0, 12993.0, 19067.0, 27908.0, 39533.0, 53390.0, 68524.0, 84518.0, 96979.0, 104412.0, 103304.0, 95312.0, 82581.0, 67093.0, 51134.0, 37387.0, 26728.0, 18386.0, 12350.0, 8219.0, 5337.0, 3422.0, 2187.0, 1373.0, 876.0, 560.0, 317.0, 221.0, 150.0, 57.0, 52.0, 23.0, 26.0, 15.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.796875, -18.189208984375, -17.58154296875, -16.973876953125, -16.3662109375, -15.758544921875, -15.15087890625, -14.543212890625, -13.935546875, -13.327880859375, -12.72021484375, -12.112548828125, -11.5048828125, -10.897216796875, -10.28955078125, -9.681884765625, -9.07421875, -8.466552734375, -7.85888671875, -7.251220703125, -6.6435546875, -6.035888671875, -5.42822265625, -4.820556640625, -4.212890625, -3.605224609375, -2.99755859375, -2.389892578125, -1.7822265625, -1.174560546875, -0.56689453125, 0.040771484375, 0.6484375, 1.256103515625, 1.86376953125, 2.471435546875, 3.0791015625, 3.686767578125, 4.29443359375, 4.902099609375, 5.509765625, 6.117431640625, 6.72509765625, 7.332763671875, 7.9404296875, 8.548095703125, 9.15576171875, 9.763427734375, 10.37109375, 10.978759765625, 11.58642578125, 12.194091796875, 12.8017578125, 13.409423828125, 14.01708984375, 14.624755859375, 15.232421875, 15.840087890625, 16.44775390625, 17.055419921875, 17.6630859375, 18.270751953125, 18.87841796875, 19.486083984375, 20.09375]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 7.0, 5.0, 14.0, 5.0, 7.0, 16.0, 14.0, 32.0, 25.0, 26.0, 35.0, 26.0, 30.0, 32.0, 40.0, 28.0, 43.0, 40.0, 47.0, 49.0, 44.0, 35.0, 39.0, 40.0, 28.0, 27.0, 32.0, 31.0, 28.0, 29.0, 25.0, 14.0, 16.0, 18.0, 17.0, 10.0, 11.0, 8.0, 9.0, 3.0, 7.0, 6.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-33.5625, -32.642822265625, -31.72314453125, -30.803466796875, -29.8837890625, -28.964111328125, -28.04443359375, -27.124755859375, -26.205078125, -25.285400390625, -24.36572265625, -23.446044921875, -22.5263671875, -21.606689453125, -20.68701171875, -19.767333984375, -18.84765625, -17.927978515625, -17.00830078125, -16.088623046875, -15.1689453125, -14.249267578125, -13.32958984375, -12.409912109375, -11.490234375, -10.570556640625, -9.65087890625, -8.731201171875, -7.8115234375, -6.891845703125, -5.97216796875, -5.052490234375, -4.1328125, -3.213134765625, -2.29345703125, -1.373779296875, -0.4541015625, 0.465576171875, 1.38525390625, 2.304931640625, 3.224609375, 4.144287109375, 5.06396484375, 5.983642578125, 6.9033203125, 7.822998046875, 8.74267578125, 9.662353515625, 10.58203125, 11.501708984375, 12.42138671875, 13.341064453125, 14.2607421875, 15.180419921875, 16.10009765625, 17.019775390625, 17.939453125, 18.859130859375, 19.77880859375, 20.698486328125, 21.6181640625, 22.537841796875, 23.45751953125, 24.377197265625, 25.296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 11.0, 12.0, 14.0, 23.0, 48.0, 80.0, 90.0, 176.0, 287.0, 501.0, 861.0, 1479.0, 2534.0, 4447.0, 7921.0, 13654.0, 23380.0, 38900.0, 62012.0, 91532.0, 123579.0, 144055.0, 146011.0, 126048.0, 95189.0, 65286.0, 41283.0, 24831.0, 14522.0, 8346.0, 4764.0, 2830.0, 1579.0, 934.0, 525.0, 339.0, 192.0, 104.0, 65.0, 44.0, 35.0, 13.0, 7.0, 6.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.25, -33.244384765625, -32.23876953125, -31.233154296875, -30.2275390625, -29.221923828125, -28.21630859375, -27.210693359375, -26.205078125, -25.199462890625, -24.19384765625, -23.188232421875, -22.1826171875, -21.177001953125, -20.17138671875, -19.165771484375, -18.16015625, -17.154541015625, -16.14892578125, -15.143310546875, -14.1376953125, -13.132080078125, -12.12646484375, -11.120849609375, -10.115234375, -9.109619140625, -8.10400390625, -7.098388671875, -6.0927734375, -5.087158203125, -4.08154296875, -3.075927734375, -2.0703125, -1.064697265625, -0.05908203125, 0.946533203125, 1.9521484375, 2.957763671875, 3.96337890625, 4.968994140625, 5.974609375, 6.980224609375, 7.98583984375, 8.991455078125, 9.9970703125, 11.002685546875, 12.00830078125, 13.013916015625, 14.01953125, 15.025146484375, 16.03076171875, 17.036376953125, 18.0419921875, 19.047607421875, 20.05322265625, 21.058837890625, 22.064453125, 23.070068359375, 24.07568359375, 25.081298828125, 26.0869140625, 27.092529296875, 28.09814453125, 29.103759765625, 30.109375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 1.0, 4.0, 7.0, 11.0, 8.0, 20.0, 23.0, 19.0, 35.0, 22.0, 24.0, 36.0, 31.0, 37.0, 45.0, 55.0, 40.0, 41.0, 46.0, 53.0, 60.0, 39.0, 51.0, 53.0, 37.0, 31.0, 32.0, 26.0, 31.0, 24.0, 11.0, 16.0, 9.0, 9.0, 5.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.390625, -22.652099609375, -21.91357421875, -21.175048828125, -20.4365234375, -19.697998046875, -18.95947265625, -18.220947265625, -17.482421875, -16.743896484375, -16.00537109375, -15.266845703125, -14.5283203125, -13.789794921875, -13.05126953125, -12.312744140625, -11.57421875, -10.835693359375, -10.09716796875, -9.358642578125, -8.6201171875, -7.881591796875, -7.14306640625, -6.404541015625, -5.666015625, -4.927490234375, -4.18896484375, -3.450439453125, -2.7119140625, -1.973388671875, -1.23486328125, -0.496337890625, 0.2421875, 0.980712890625, 1.71923828125, 2.457763671875, 3.1962890625, 3.934814453125, 4.67333984375, 5.411865234375, 6.150390625, 6.888916015625, 7.62744140625, 8.365966796875, 9.1044921875, 9.843017578125, 10.58154296875, 11.320068359375, 12.05859375, 12.797119140625, 13.53564453125, 14.274169921875, 15.0126953125, 15.751220703125, 16.48974609375, 17.228271484375, 17.966796875, 18.705322265625, 19.44384765625, 20.182373046875, 20.9208984375, 21.659423828125, 22.39794921875, 23.136474609375, 23.875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 8.0, 5.0, 10.0, 9.0, 24.0, 33.0, 64.0, 64.0, 95.0, 140.0, 200.0, 289.0, 472.0, 780.0, 1257.0, 2137.0, 3434.0, 6301.0, 11060.0, 20265.0, 37428.0, 67418.0, 110845.0, 159219.0, 183895.0, 163585.0, 117354.0, 71685.0, 40245.0, 21997.0, 11828.0, 6771.0, 3719.0, 2219.0, 1307.0, 841.0, 553.0, 349.0, 195.0, 141.0, 89.0, 76.0, 50.0, 28.0, 18.0, 19.0, 15.0, 10.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.0234375, -12.5972900390625, -12.171142578125, -11.7449951171875, -11.31884765625, -10.8927001953125, -10.466552734375, -10.0404052734375, -9.6142578125, -9.1881103515625, -8.761962890625, -8.3358154296875, -7.90966796875, -7.4835205078125, -7.057373046875, -6.6312255859375, -6.205078125, -5.7789306640625, -5.352783203125, -4.9266357421875, -4.50048828125, -4.0743408203125, -3.648193359375, -3.2220458984375, -2.7958984375, -2.3697509765625, -1.943603515625, -1.5174560546875, -1.09130859375, -0.6651611328125, -0.239013671875, 0.1871337890625, 0.61328125, 1.0394287109375, 1.465576171875, 1.8917236328125, 2.31787109375, 2.7440185546875, 3.170166015625, 3.5963134765625, 4.0224609375, 4.4486083984375, 4.874755859375, 5.3009033203125, 5.72705078125, 6.1531982421875, 6.579345703125, 7.0054931640625, 7.431640625, 7.8577880859375, 8.283935546875, 8.7100830078125, 9.13623046875, 9.5623779296875, 9.988525390625, 10.4146728515625, 10.8408203125, 11.2669677734375, 11.693115234375, 12.1192626953125, 12.54541015625, 12.9715576171875, 13.397705078125, 13.8238525390625, 14.25]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 5.0, 5.0, 16.0, 17.0, 34.0, 45.0, 40.0, 47.0, 64.0, 76.0, 76.0, 89.0, 97.0, 81.0, 56.0, 59.0, 49.0, 39.0, 27.0, 24.0, 15.0, 12.0, 8.0, 8.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022945404052734375, -0.002235323190689087, -0.0021761059761047363, -0.0021168887615203857, -0.002057671546936035, -0.0019984543323516846, -0.001939237117767334, -0.0018800199031829834, -0.0018208026885986328, -0.0017615854740142822, -0.0017023682594299316, -0.001643151044845581, -0.0015839338302612305, -0.0015247166156768799, -0.0014654994010925293, -0.0014062821865081787, -0.0013470649719238281, -0.0012878477573394775, -0.001228630542755127, -0.0011694133281707764, -0.0011101961135864258, -0.0010509788990020752, -0.0009917616844177246, -0.000932544469833374, -0.0008733272552490234, -0.0008141100406646729, -0.0007548928260803223, -0.0006956756114959717, -0.0006364583969116211, -0.0005772411823272705, -0.0005180239677429199, -0.00045880675315856934, -0.00039958953857421875, -0.00034037232398986816, -0.0002811551094055176, -0.000221937894821167, -0.0001627206802368164, -0.00010350346565246582, -4.4286251068115234e-05, 1.4930963516235352e-05, 7.414817810058594e-05, 0.00013336539268493652, 0.0001925826072692871, 0.0002517998218536377, 0.0003110170364379883, 0.00037023425102233887, 0.00042945146560668945, 0.00048866868019104, 0.0005478858947753906, 0.0006071031093597412, 0.0006663203239440918, 0.0007255375385284424, 0.000784754753112793, 0.0008439719676971436, 0.0009031891822814941, 0.0009624063968658447, 0.0010216236114501953, 0.001080840826034546, 0.0011400580406188965, 0.001199275255203247, 0.0012584924697875977, 0.0013177096843719482, 0.0013769268989562988, 0.0014361441135406494, 0.001495361328125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 6.0, 9.0, 6.0, 9.0, 12.0, 22.0, 25.0, 43.0, 54.0, 83.0, 121.0, 205.0, 277.0, 489.0, 825.0, 1342.0, 2457.0, 4381.0, 7627.0, 13770.0, 24327.0, 41871.0, 69422.0, 105987.0, 141734.0, 161545.0, 152891.0, 119377.0, 81015.0, 50568.0, 29659.0, 16586.0, 9407.0, 5178.0, 2904.0, 1651.0, 1022.0, 583.0, 342.0, 242.0, 154.0, 108.0, 61.0, 52.0, 39.0, 31.0, 15.0, 9.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0], "bins": [-11.546875, -11.1934814453125, -10.840087890625, -10.4866943359375, -10.13330078125, -9.7799072265625, -9.426513671875, -9.0731201171875, -8.7197265625, -8.3663330078125, -8.012939453125, -7.6595458984375, -7.30615234375, -6.9527587890625, -6.599365234375, -6.2459716796875, -5.892578125, -5.5391845703125, -5.185791015625, -4.8323974609375, -4.47900390625, -4.1256103515625, -3.772216796875, -3.4188232421875, -3.0654296875, -2.7120361328125, -2.358642578125, -2.0052490234375, -1.65185546875, -1.2984619140625, -0.945068359375, -0.5916748046875, -0.23828125, 0.1151123046875, 0.468505859375, 0.8218994140625, 1.17529296875, 1.5286865234375, 1.882080078125, 2.2354736328125, 2.5888671875, 2.9422607421875, 3.295654296875, 3.6490478515625, 4.00244140625, 4.3558349609375, 4.709228515625, 5.0626220703125, 5.416015625, 5.7694091796875, 6.122802734375, 6.4761962890625, 6.82958984375, 7.1829833984375, 7.536376953125, 7.8897705078125, 8.2431640625, 8.5965576171875, 8.949951171875, 9.3033447265625, 9.65673828125, 10.0101318359375, 10.363525390625, 10.7169189453125, 11.0703125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 5.0, 1.0, 4.0, 3.0, 4.0, 6.0, 8.0, 8.0, 9.0, 17.0, 8.0, 16.0, 30.0, 27.0, 27.0, 44.0, 27.0, 40.0, 50.0, 54.0, 45.0, 49.0, 57.0, 44.0, 53.0, 46.0, 52.0, 37.0, 34.0, 30.0, 25.0, 28.0, 26.0, 16.0, 14.0, 10.0, 5.0, 6.0, 3.0, 6.0, 7.0, 9.0, 4.0, 3.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.783203125, -2.673553466796875, -2.56390380859375, -2.454254150390625, -2.3446044921875, -2.234954833984375, -2.12530517578125, -2.015655517578125, -1.906005859375, -1.796356201171875, -1.68670654296875, -1.577056884765625, -1.4674072265625, -1.357757568359375, -1.24810791015625, -1.138458251953125, -1.02880859375, -0.919158935546875, -0.80950927734375, -0.699859619140625, -0.5902099609375, -0.480560302734375, -0.37091064453125, -0.261260986328125, -0.151611328125, -0.041961669921875, 0.06768798828125, 0.177337646484375, 0.2869873046875, 0.396636962890625, 0.50628662109375, 0.615936279296875, 0.7255859375, 0.835235595703125, 0.94488525390625, 1.054534912109375, 1.1641845703125, 1.273834228515625, 1.38348388671875, 1.493133544921875, 1.602783203125, 1.712432861328125, 1.82208251953125, 1.931732177734375, 2.0413818359375, 2.151031494140625, 2.26068115234375, 2.370330810546875, 2.47998046875, 2.589630126953125, 2.69927978515625, 2.808929443359375, 2.9185791015625, 3.028228759765625, 3.13787841796875, 3.247528076171875, 3.357177734375, 3.466827392578125, 3.57647705078125, 3.686126708984375, 3.7957763671875, 3.905426025390625, 4.01507568359375, 4.124725341796875, 4.234375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 9.0, 13.0, 8.0, 9.0, 19.0, 21.0, 26.0, 21.0, 28.0, 27.0, 39.0, 39.0, 40.0, 43.0, 54.0, 41.0, 47.0, 46.0, 49.0, 42.0, 31.0, 36.0, 47.0, 31.0, 22.0, 30.0, 31.0, 22.0, 21.0, 22.0, 18.0, 11.0, 5.0, 11.0, 5.0, 5.0, 5.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-33.03375244140625, -32.07163619995117, -31.10952377319336, -30.147409439086914, -29.18529510498047, -28.223180770874023, -27.261066436767578, -26.2989501953125, -25.336837768554688, -24.374723434448242, -23.412609100341797, -22.45049476623535, -21.488380432128906, -20.52626609802246, -19.564151763916016, -18.602035522460938, -17.639921188354492, -16.677806854248047, -15.715692520141602, -14.753578186035156, -13.791463851928711, -12.829349517822266, -11.867234230041504, -10.905119895935059, -9.943005561828613, -8.980891227722168, -8.018776893615723, -7.056662082672119, -6.094547748565674, -5.1324334144592285, -4.170318603515625, -3.2082042694091797, -2.2460899353027344, -1.2839754819869995, -0.32186102867126465, 0.6402535438537598, 1.602367877960205, 2.5644822120666504, 3.526597023010254, 4.488711357116699, 5.4508256912231445, 6.41294002532959, 7.375054359436035, 8.337169647216797, 9.299283981323242, 10.261398315429688, 11.223512649536133, 12.185626983642578, 13.147741317749023, 14.109855651855469, 15.071969985961914, 16.03408432006836, 16.996198654174805, 17.95831298828125, 18.920429229736328, 19.88254165649414, 20.84465789794922, 21.806772232055664, 22.76888656616211, 23.731000900268555, 24.693115234375, 25.655229568481445, 26.61734390258789, 27.57946014404297, 28.54157257080078]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 4.0, 4.0, 1.0, 8.0, 3.0, 5.0, 6.0, 10.0, 15.0, 16.0, 9.0, 12.0, 21.0, 15.0, 24.0, 20.0, 21.0, 17.0, 25.0, 31.0, 34.0, 39.0, 47.0, 45.0, 40.0, 37.0, 28.0, 34.0, 37.0, 32.0, 30.0, 28.0, 32.0, 32.0, 27.0, 32.0, 28.0, 23.0, 22.0, 17.0, 15.0, 8.0, 14.0, 17.0, 4.0, 7.0, 5.0, 7.0, 6.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.801513671875, -23.95681381225586, -23.112112045288086, -22.267412185668945, -21.422712326049805, -20.57801055908203, -19.73331069946289, -18.88861083984375, -18.043909072875977, -17.199209213256836, -16.354507446289062, -15.509807586669922, -14.665106773376465, -13.820405960083008, -12.975706100463867, -12.13100528717041, -11.28630542755127, -10.441604614257812, -9.596904754638672, -8.752203941345215, -7.907503128051758, -7.062802791595459, -6.21810245513916, -5.373401641845703, -4.528701305389404, -3.6840007305145264, -2.8393001556396484, -1.9945998191833496, -1.1498992443084717, -0.30519866943359375, 0.5395016670227051, 1.384202480316162, 2.228902816772461, 3.073603391647339, 3.918303966522217, 4.763004302978516, 5.607705116271973, 6.4524054527282715, 7.29710578918457, 8.141806602478027, 8.986507415771484, 9.831208229064941, 10.675908088684082, 11.520608901977539, 12.365309715270996, 13.210010528564453, 14.054710388183594, 14.89941120147705, 15.744111061096191, 16.58881187438965, 17.43351173400879, 18.278213500976562, 19.122913360595703, 19.967613220214844, 20.812313079833984, 21.657014846801758, 22.5017147064209, 23.34641456604004, 24.191116333007812, 25.035816192626953, 25.880516052246094, 26.725217819213867, 27.569917678833008, 28.41461944580078, 29.259319305419922]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 9.0, 7.0, 18.0, 30.0, 45.0, 87.0, 120.0, 202.0, 325.0, 594.0, 1104.0, 2123.0, 4023.0, 7329.0, 13809.0, 26628.0, 52139.0, 100010.0, 190312.0, 345753.0, 559487.0, 740565.0, 756360.0, 589646.0, 370827.0, 205812.0, 108361.0, 56410.0, 28868.0, 15437.0, 8123.0, 4317.0, 2284.0, 1275.0, 810.0, 439.0, 227.0, 138.0, 97.0, 58.0, 31.0, 12.0, 17.0, 11.0, 3.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.0625, -31.148193359375, -30.23388671875, -29.319580078125, -28.4052734375, -27.490966796875, -26.57666015625, -25.662353515625, -24.748046875, -23.833740234375, -22.91943359375, -22.005126953125, -21.0908203125, -20.176513671875, -19.26220703125, -18.347900390625, -17.43359375, -16.519287109375, -15.60498046875, -14.690673828125, -13.7763671875, -12.862060546875, -11.94775390625, -11.033447265625, -10.119140625, -9.204833984375, -8.29052734375, -7.376220703125, -6.4619140625, -5.547607421875, -4.63330078125, -3.718994140625, -2.8046875, -1.890380859375, -0.97607421875, -0.061767578125, 0.8525390625, 1.766845703125, 2.68115234375, 3.595458984375, 4.509765625, 5.424072265625, 6.33837890625, 7.252685546875, 8.1669921875, 9.081298828125, 9.99560546875, 10.909912109375, 11.82421875, 12.738525390625, 13.65283203125, 14.567138671875, 15.4814453125, 16.395751953125, 17.31005859375, 18.224365234375, 19.138671875, 20.052978515625, 20.96728515625, 21.881591796875, 22.7958984375, 23.710205078125, 24.62451171875, 25.538818359375, 26.453125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 9.0, 8.0, 5.0, 4.0, 13.0, 8.0, 22.0, 9.0, 18.0, 10.0, 19.0, 16.0, 19.0, 34.0, 46.0, 21.0, 34.0, 25.0, 42.0, 31.0, 47.0, 33.0, 32.0, 29.0, 30.0, 37.0, 30.0, 33.0, 37.0, 32.0, 30.0, 20.0, 23.0, 26.0, 16.0, 20.0, 21.0, 18.0, 18.0, 9.0, 9.0, 7.0, 7.0, 7.0, 7.0, 8.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0], "bins": [-22.796875, -22.106201171875, -21.41552734375, -20.724853515625, -20.0341796875, -19.343505859375, -18.65283203125, -17.962158203125, -17.271484375, -16.580810546875, -15.89013671875, -15.199462890625, -14.5087890625, -13.818115234375, -13.12744140625, -12.436767578125, -11.74609375, -11.055419921875, -10.36474609375, -9.674072265625, -8.9833984375, -8.292724609375, -7.60205078125, -6.911376953125, -6.220703125, -5.530029296875, -4.83935546875, -4.148681640625, -3.4580078125, -2.767333984375, -2.07666015625, -1.385986328125, -0.6953125, -0.004638671875, 0.68603515625, 1.376708984375, 2.0673828125, 2.758056640625, 3.44873046875, 4.139404296875, 4.830078125, 5.520751953125, 6.21142578125, 6.902099609375, 7.5927734375, 8.283447265625, 8.97412109375, 9.664794921875, 10.35546875, 11.046142578125, 11.73681640625, 12.427490234375, 13.1181640625, 13.808837890625, 14.49951171875, 15.190185546875, 15.880859375, 16.571533203125, 17.26220703125, 17.952880859375, 18.6435546875, 19.334228515625, 20.02490234375, 20.715576171875, 21.40625]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 8.0, 2.0, 9.0, 17.0, 17.0, 37.0, 40.0, 73.0, 106.0, 197.0, 316.0, 529.0, 994.0, 1729.0, 2889.0, 5316.0, 9505.0, 17268.0, 31521.0, 56822.0, 100768.0, 175142.0, 288372.0, 440116.0, 594245.0, 667275.0, 607229.0, 458223.0, 304731.0, 186368.0, 107804.0, 61001.0, 33591.0, 18732.0, 10375.0, 5579.0, 3150.0, 1732.0, 1018.0, 603.0, 350.0, 211.0, 111.0, 67.0, 31.0, 26.0, 17.0, 11.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.1875, -25.2705078125, -24.353515625, -23.4365234375, -22.51953125, -21.6025390625, -20.685546875, -19.7685546875, -18.8515625, -17.9345703125, -17.017578125, -16.1005859375, -15.18359375, -14.2666015625, -13.349609375, -12.4326171875, -11.515625, -10.5986328125, -9.681640625, -8.7646484375, -7.84765625, -6.9306640625, -6.013671875, -5.0966796875, -4.1796875, -3.2626953125, -2.345703125, -1.4287109375, -0.51171875, 0.4052734375, 1.322265625, 2.2392578125, 3.15625, 4.0732421875, 4.990234375, 5.9072265625, 6.82421875, 7.7412109375, 8.658203125, 9.5751953125, 10.4921875, 11.4091796875, 12.326171875, 13.2431640625, 14.16015625, 15.0771484375, 15.994140625, 16.9111328125, 17.828125, 18.7451171875, 19.662109375, 20.5791015625, 21.49609375, 22.4130859375, 23.330078125, 24.2470703125, 25.1640625, 26.0810546875, 26.998046875, 27.9150390625, 28.83203125, 29.7490234375, 30.666015625, 31.5830078125, 32.5]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 9.0, 5.0, 6.0, 14.0, 8.0, 5.0, 15.0, 24.0, 31.0, 35.0, 41.0, 48.0, 60.0, 65.0, 92.0, 117.0, 121.0, 133.0, 184.0, 194.0, 196.0, 214.0, 230.0, 216.0, 226.0, 211.0, 206.0, 171.0, 179.0, 123.0, 157.0, 139.0, 118.0, 75.0, 80.0, 71.0, 67.0, 43.0, 33.0, 29.0, 26.0, 21.0, 9.0, 9.0, 8.0, 6.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.1640625, -10.825927734375, -10.48779296875, -10.149658203125, -9.8115234375, -9.473388671875, -9.13525390625, -8.797119140625, -8.458984375, -8.120849609375, -7.78271484375, -7.444580078125, -7.1064453125, -6.768310546875, -6.43017578125, -6.092041015625, -5.75390625, -5.415771484375, -5.07763671875, -4.739501953125, -4.4013671875, -4.063232421875, -3.72509765625, -3.386962890625, -3.048828125, -2.710693359375, -2.37255859375, -2.034423828125, -1.6962890625, -1.358154296875, -1.02001953125, -0.681884765625, -0.34375, -0.005615234375, 0.33251953125, 0.670654296875, 1.0087890625, 1.346923828125, 1.68505859375, 2.023193359375, 2.361328125, 2.699462890625, 3.03759765625, 3.375732421875, 3.7138671875, 4.052001953125, 4.39013671875, 4.728271484375, 5.06640625, 5.404541015625, 5.74267578125, 6.080810546875, 6.4189453125, 6.757080078125, 7.09521484375, 7.433349609375, 7.771484375, 8.109619140625, 8.44775390625, 8.785888671875, 9.1240234375, 9.462158203125, 9.80029296875, 10.138427734375, 10.4765625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 7.0, 3.0, 3.0, 8.0, 8.0, 7.0, 10.0, 18.0, 18.0, 16.0, 14.0, 20.0, 19.0, 28.0, 29.0, 29.0, 28.0, 36.0, 38.0, 37.0, 51.0, 31.0, 42.0, 39.0, 38.0, 41.0, 45.0, 31.0, 32.0, 33.0, 29.0, 27.0, 26.0, 27.0, 29.0, 14.0, 13.0, 17.0, 12.0, 4.0, 7.0, 10.0, 8.0, 9.0, 3.0, 5.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.756084442138672, -23.90727424621582, -23.0584659576416, -22.20965576171875, -21.36084747314453, -20.51203727722168, -19.663227081298828, -18.81441879272461, -17.965608596801758, -17.116798400878906, -16.267990112304688, -15.419179916381836, -14.5703706741333, -13.721561431884766, -12.872751235961914, -12.023941993713379, -11.175132751464844, -10.326323509216309, -9.477514266967773, -8.628704071044922, -7.779894828796387, -6.931085586547852, -6.082275867462158, -5.233466148376465, -4.38465690612793, -3.5358474254608154, -2.687037944793701, -1.838228464126587, -0.9894189834594727, -0.1406097412109375, 0.7081999778747559, 1.5570096969604492, 2.4058170318603516, 3.254626512527466, 4.10343599319458, 4.952245712280273, 5.801054954528809, 6.649864196777344, 7.498673915863037, 8.34748363494873, 9.196292877197266, 10.0451021194458, 10.893911361694336, 11.742721557617188, 12.591530799865723, 13.440340042114258, 14.28915023803711, 15.137959480285645, 15.98676872253418, 16.83557891845703, 17.68438720703125, 18.5331974029541, 19.382007598876953, 20.230815887451172, 21.079626083374023, 21.928436279296875, 22.777244567871094, 23.626054763793945, 24.474863052368164, 25.323673248291016, 26.172481536865234, 27.021291732788086, 27.870101928710938, 28.718910217285156, 29.567720413208008]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 7.0, 8.0, 1.0, 7.0, 8.0, 6.0, 6.0, 15.0, 13.0, 13.0, 20.0, 15.0, 22.0, 20.0, 30.0, 24.0, 24.0, 28.0, 33.0, 24.0, 33.0, 28.0, 47.0, 38.0, 31.0, 41.0, 20.0, 43.0, 27.0, 44.0, 25.0, 29.0, 26.0, 27.0, 16.0, 30.0, 26.0, 19.0, 15.0, 18.0, 19.0, 5.0, 14.0, 6.0, 10.0, 10.0, 4.0, 6.0, 6.0, 2.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-24.25715446472168, -23.493690490722656, -22.730226516723633, -21.96676254272461, -21.203298568725586, -20.439834594726562, -19.676368713378906, -18.912906646728516, -18.14944076538086, -17.385976791381836, -16.622512817382812, -15.859048843383789, -15.095584869384766, -14.332120895385742, -13.568655967712402, -12.805191993713379, -12.041728973388672, -11.278264999389648, -10.514801025390625, -9.751337051391602, -8.987873077392578, -8.224409103393555, -7.460944175720215, -6.697480201721191, -5.934016227722168, -5.1705522537231445, -4.407088279724121, -3.6436238288879395, -2.880159854888916, -2.1166958808898926, -1.353231430053711, -0.5897674560546875, 0.17369651794433594, 0.9371606111526489, 1.700624704360962, 2.4640889167785645, 3.227552890777588, 3.9910168647766113, 4.754481315612793, 5.517945289611816, 6.28140926361084, 7.044873237609863, 7.808337211608887, 8.571802139282227, 9.33526611328125, 10.098730087280273, 10.862194061279297, 11.62565803527832, 12.389122009277344, 13.152585983276367, 13.91604995727539, 14.679513931274414, 15.442977905273438, 16.20644187927246, 16.969905853271484, 17.73337173461914, 18.49683380126953, 19.260297775268555, 20.023761749267578, 20.7872257232666, 21.550689697265625, 22.31415367126465, 23.077617645263672, 23.841083526611328, 24.60454750061035]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 14.0, 17.0, 29.0, 43.0, 53.0, 81.0, 123.0, 159.0, 282.0, 393.0, 594.0, 833.0, 1275.0, 1854.0, 2745.0, 3865.0, 5683.0, 8205.0, 11625.0, 17106.0, 25578.0, 38783.0, 60526.0, 93438.0, 135092.0, 161952.0, 150534.0, 111621.0, 73596.0, 46933.0, 30738.0, 20449.0, 13612.0, 9306.0, 6557.0, 4571.0, 3223.0, 2280.0, 1523.0, 1048.0, 728.0, 520.0, 318.0, 232.0, 150.0, 101.0, 67.0, 34.0, 23.0, 16.0, 12.0, 6.0, 3.0, 6.0, 3.0, 2.0, 2.0], "bins": [-43.375, -42.04931640625, -40.7236328125, -39.39794921875, -38.072265625, -36.74658203125, -35.4208984375, -34.09521484375, -32.76953125, -31.44384765625, -30.1181640625, -28.79248046875, -27.466796875, -26.14111328125, -24.8154296875, -23.48974609375, -22.1640625, -20.83837890625, -19.5126953125, -18.18701171875, -16.861328125, -15.53564453125, -14.2099609375, -12.88427734375, -11.55859375, -10.23291015625, -8.9072265625, -7.58154296875, -6.255859375, -4.93017578125, -3.6044921875, -2.27880859375, -0.953125, 0.37255859375, 1.6982421875, 3.02392578125, 4.349609375, 5.67529296875, 7.0009765625, 8.32666015625, 9.65234375, 10.97802734375, 12.3037109375, 13.62939453125, 14.955078125, 16.28076171875, 17.6064453125, 18.93212890625, 20.2578125, 21.58349609375, 22.9091796875, 24.23486328125, 25.560546875, 26.88623046875, 28.2119140625, 29.53759765625, 30.86328125, 32.18896484375, 33.5146484375, 34.84033203125, 36.166015625, 37.49169921875, 38.8173828125, 40.14306640625, 41.46875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 5.0, 8.0, 7.0, 12.0, 10.0, 6.0, 11.0, 11.0, 20.0, 23.0, 23.0, 27.0, 29.0, 20.0, 46.0, 38.0, 37.0, 39.0, 33.0, 40.0, 35.0, 36.0, 34.0, 33.0, 44.0, 41.0, 31.0, 33.0, 34.0, 35.0, 21.0, 25.0, 22.0, 21.0, 19.0, 10.0, 18.0, 14.0, 10.0, 4.0, 4.0, 6.0, 4.0, 8.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-23.90625, -23.14208984375, -22.3779296875, -21.61376953125, -20.849609375, -20.08544921875, -19.3212890625, -18.55712890625, -17.79296875, -17.02880859375, -16.2646484375, -15.50048828125, -14.736328125, -13.97216796875, -13.2080078125, -12.44384765625, -11.6796875, -10.91552734375, -10.1513671875, -9.38720703125, -8.623046875, -7.85888671875, -7.0947265625, -6.33056640625, -5.56640625, -4.80224609375, -4.0380859375, -3.27392578125, -2.509765625, -1.74560546875, -0.9814453125, -0.21728515625, 0.546875, 1.31103515625, 2.0751953125, 2.83935546875, 3.603515625, 4.36767578125, 5.1318359375, 5.89599609375, 6.66015625, 7.42431640625, 8.1884765625, 8.95263671875, 9.716796875, 10.48095703125, 11.2451171875, 12.00927734375, 12.7734375, 13.53759765625, 14.3017578125, 15.06591796875, 15.830078125, 16.59423828125, 17.3583984375, 18.12255859375, 18.88671875, 19.65087890625, 20.4150390625, 21.17919921875, 21.943359375, 22.70751953125, 23.4716796875, 24.23583984375, 25.0]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 4.0, 11.0, 7.0, 17.0, 31.0, 50.0, 90.0, 109.0, 190.0, 263.0, 476.0, 699.0, 1177.0, 1790.0, 2912.0, 4752.0, 7779.0, 12707.0, 20913.0, 36419.0, 66457.0, 129119.0, 237475.0, 237352.0, 130019.0, 66781.0, 36457.0, 21224.0, 12769.0, 7752.0, 4858.0, 2948.0, 1822.0, 1109.0, 744.0, 481.0, 285.0, 185.0, 113.0, 78.0, 53.0, 27.0, 17.0, 15.0, 8.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.6875, -63.498046875, -61.30859375, -59.119140625, -56.9296875, -54.740234375, -52.55078125, -50.361328125, -48.171875, -45.982421875, -43.79296875, -41.603515625, -39.4140625, -37.224609375, -35.03515625, -32.845703125, -30.65625, -28.466796875, -26.27734375, -24.087890625, -21.8984375, -19.708984375, -17.51953125, -15.330078125, -13.140625, -10.951171875, -8.76171875, -6.572265625, -4.3828125, -2.193359375, -0.00390625, 2.185546875, 4.375, 6.564453125, 8.75390625, 10.943359375, 13.1328125, 15.322265625, 17.51171875, 19.701171875, 21.890625, 24.080078125, 26.26953125, 28.458984375, 30.6484375, 32.837890625, 35.02734375, 37.216796875, 39.40625, 41.595703125, 43.78515625, 45.974609375, 48.1640625, 50.353515625, 52.54296875, 54.732421875, 56.921875, 59.111328125, 61.30078125, 63.490234375, 65.6796875, 67.869140625, 70.05859375, 72.248046875, 74.4375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 7.0, 14.0, 19.0, 18.0, 14.0, 24.0, 27.0, 35.0, 36.0, 34.0, 43.0, 37.0, 35.0, 40.0, 61.0, 51.0, 38.0, 56.0, 40.0, 54.0, 43.0, 41.0, 30.0, 28.0, 25.0, 31.0, 29.0, 22.0, 13.0, 16.0, 9.0, 7.0, 9.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.46875, -23.748046875, -23.02734375, -22.306640625, -21.5859375, -20.865234375, -20.14453125, -19.423828125, -18.703125, -17.982421875, -17.26171875, -16.541015625, -15.8203125, -15.099609375, -14.37890625, -13.658203125, -12.9375, -12.216796875, -11.49609375, -10.775390625, -10.0546875, -9.333984375, -8.61328125, -7.892578125, -7.171875, -6.451171875, -5.73046875, -5.009765625, -4.2890625, -3.568359375, -2.84765625, -2.126953125, -1.40625, -0.685546875, 0.03515625, 0.755859375, 1.4765625, 2.197265625, 2.91796875, 3.638671875, 4.359375, 5.080078125, 5.80078125, 6.521484375, 7.2421875, 7.962890625, 8.68359375, 9.404296875, 10.125, 10.845703125, 11.56640625, 12.287109375, 13.0078125, 13.728515625, 14.44921875, 15.169921875, 15.890625, 16.611328125, 17.33203125, 18.052734375, 18.7734375, 19.494140625, 20.21484375, 20.935546875, 21.65625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 5.0, 10.0, 10.0, 10.0, 22.0, 23.0, 38.0, 38.0, 55.0, 65.0, 82.0, 121.0, 179.0, 228.0, 352.0, 524.0, 804.0, 1264.0, 2199.0, 3868.0, 7647.0, 17102.0, 41175.0, 112340.0, 292150.0, 333060.0, 143216.0, 51240.0, 20256.0, 9089.0, 4536.0, 2505.0, 1484.0, 897.0, 607.0, 380.0, 269.0, 212.0, 114.0, 104.0, 77.0, 65.0, 42.0, 30.0, 19.0, 15.0, 12.0, 7.0, 7.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.0625, -38.77490234375, -37.4873046875, -36.19970703125, -34.912109375, -33.62451171875, -32.3369140625, -31.04931640625, -29.76171875, -28.47412109375, -27.1865234375, -25.89892578125, -24.611328125, -23.32373046875, -22.0361328125, -20.74853515625, -19.4609375, -18.17333984375, -16.8857421875, -15.59814453125, -14.310546875, -13.02294921875, -11.7353515625, -10.44775390625, -9.16015625, -7.87255859375, -6.5849609375, -5.29736328125, -4.009765625, -2.72216796875, -1.4345703125, -0.14697265625, 1.140625, 2.42822265625, 3.7158203125, 5.00341796875, 6.291015625, 7.57861328125, 8.8662109375, 10.15380859375, 11.44140625, 12.72900390625, 14.0166015625, 15.30419921875, 16.591796875, 17.87939453125, 19.1669921875, 20.45458984375, 21.7421875, 23.02978515625, 24.3173828125, 25.60498046875, 26.892578125, 28.18017578125, 29.4677734375, 30.75537109375, 32.04296875, 33.33056640625, 34.6181640625, 35.90576171875, 37.193359375, 38.48095703125, 39.7685546875, 41.05615234375, 42.34375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 14.0, 9.0, 9.0, 23.0, 30.0, 51.0, 80.0, 132.0, 210.0, 165.0, 102.0, 61.0, 39.0, 14.0, 11.0, 12.0, 6.0, 2.0, 2.0, 6.0, 6.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006015777587890625, -0.005842745304107666, -0.005669713020324707, -0.005496680736541748, -0.005323648452758789, -0.00515061616897583, -0.004977583885192871, -0.004804551601409912, -0.004631519317626953, -0.004458487033843994, -0.004285454750061035, -0.004112422466278076, -0.003939390182495117, -0.003766357898712158, -0.0035933256149291992, -0.0034202933311462402, -0.0032472610473632812, -0.0030742287635803223, -0.0029011964797973633, -0.0027281641960144043, -0.0025551319122314453, -0.0023820996284484863, -0.0022090673446655273, -0.0020360350608825684, -0.0018630027770996094, -0.0016899704933166504, -0.0015169382095336914, -0.0013439059257507324, -0.0011708736419677734, -0.0009978413581848145, -0.0008248090744018555, -0.0006517767906188965, -0.0004787445068359375, -0.0003057122230529785, -0.00013267993927001953, 4.035234451293945e-05, 0.00021338462829589844, 0.0003864169120788574, 0.0005594491958618164, 0.0007324814796447754, 0.0009055137634277344, 0.0010785460472106934, 0.0012515783309936523, 0.0014246106147766113, 0.0015976428985595703, 0.0017706751823425293, 0.0019437074661254883, 0.0021167397499084473, 0.0022897720336914062, 0.0024628043174743652, 0.0026358366012573242, 0.002808868885040283, 0.002981901168823242, 0.003154933452606201, 0.00332796573638916, 0.003500998020172119, 0.003674030303955078, 0.003847062587738037, 0.004020094871520996, 0.004193127155303955, 0.004366159439086914, 0.004539191722869873, 0.004712224006652832, 0.004885256290435791, 0.00505828857421875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 7.0, 9.0, 17.0, 12.0, 18.0, 24.0, 37.0, 48.0, 63.0, 113.0, 133.0, 233.0, 289.0, 489.0, 824.0, 1387.0, 2209.0, 3677.0, 6462.0, 12362.0, 24904.0, 51652.0, 103560.0, 182574.0, 235642.0, 193034.0, 113546.0, 56998.0, 27318.0, 13691.0, 7103.0, 3864.0, 2336.0, 1348.0, 828.0, 561.0, 372.0, 231.0, 170.0, 107.0, 96.0, 64.0, 40.0, 33.0, 25.0, 10.0, 12.0, 5.0, 7.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-26.84375, -25.965576171875, -25.08740234375, -24.209228515625, -23.3310546875, -22.452880859375, -21.57470703125, -20.696533203125, -19.818359375, -18.940185546875, -18.06201171875, -17.183837890625, -16.3056640625, -15.427490234375, -14.54931640625, -13.671142578125, -12.79296875, -11.914794921875, -11.03662109375, -10.158447265625, -9.2802734375, -8.402099609375, -7.52392578125, -6.645751953125, -5.767578125, -4.889404296875, -4.01123046875, -3.133056640625, -2.2548828125, -1.376708984375, -0.49853515625, 0.379638671875, 1.2578125, 2.135986328125, 3.01416015625, 3.892333984375, 4.7705078125, 5.648681640625, 6.52685546875, 7.405029296875, 8.283203125, 9.161376953125, 10.03955078125, 10.917724609375, 11.7958984375, 12.674072265625, 13.55224609375, 14.430419921875, 15.30859375, 16.186767578125, 17.06494140625, 17.943115234375, 18.8212890625, 19.699462890625, 20.57763671875, 21.455810546875, 22.333984375, 23.212158203125, 24.09033203125, 24.968505859375, 25.8466796875, 26.724853515625, 27.60302734375, 28.481201171875, 29.359375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 5.0, 7.0, 5.0, 17.0, 15.0, 19.0, 13.0, 26.0, 29.0, 46.0, 37.0, 48.0, 57.0, 64.0, 57.0, 58.0, 63.0, 63.0, 65.0, 46.0, 60.0, 32.0, 27.0, 19.0, 27.0, 11.0, 12.0, 13.0, 9.0, 14.0, 9.0, 5.0, 5.0, 8.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0234375, -7.745361328125, -7.46728515625, -7.189208984375, -6.9111328125, -6.633056640625, -6.35498046875, -6.076904296875, -5.798828125, -5.520751953125, -5.24267578125, -4.964599609375, -4.6865234375, -4.408447265625, -4.13037109375, -3.852294921875, -3.57421875, -3.296142578125, -3.01806640625, -2.739990234375, -2.4619140625, -2.183837890625, -1.90576171875, -1.627685546875, -1.349609375, -1.071533203125, -0.79345703125, -0.515380859375, -0.2373046875, 0.040771484375, 0.31884765625, 0.596923828125, 0.875, 1.153076171875, 1.43115234375, 1.709228515625, 1.9873046875, 2.265380859375, 2.54345703125, 2.821533203125, 3.099609375, 3.377685546875, 3.65576171875, 3.933837890625, 4.2119140625, 4.489990234375, 4.76806640625, 5.046142578125, 5.32421875, 5.602294921875, 5.88037109375, 6.158447265625, 6.4365234375, 6.714599609375, 6.99267578125, 7.270751953125, 7.548828125, 7.826904296875, 8.10498046875, 8.383056640625, 8.6611328125, 8.939208984375, 9.21728515625, 9.495361328125, 9.7734375]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 5.0, 8.0, 4.0, 16.0, 16.0, 19.0, 24.0, 24.0, 28.0, 30.0, 33.0, 36.0, 39.0, 45.0, 50.0, 39.0, 45.0, 44.0, 57.0, 55.0, 49.0, 43.0, 40.0, 46.0, 31.0, 22.0, 18.0, 31.0, 18.0, 16.0, 15.0, 6.0, 14.0, 7.0, 7.0, 3.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.85295867919922, -23.94821548461914, -23.043472290039062, -22.138729095458984, -21.233985900878906, -20.329242706298828, -19.424497604370117, -18.51975440979004, -17.61501121520996, -16.710268020629883, -15.805524826049805, -14.90078067779541, -13.996037483215332, -13.091294288635254, -12.18655014038086, -11.281806945800781, -10.377063751220703, -9.472320556640625, -8.567577362060547, -7.662833213806152, -6.758090019226074, -5.853346824645996, -4.94860315322876, -4.043859481811523, -3.1391162872314453, -2.234372854232788, -1.3296294212341309, -0.42488598823547363, 0.4798574447631836, 1.3846006393432617, 2.289344310760498, 3.1940879821777344, 4.0988311767578125, 5.003574371337891, 5.908318042755127, 6.813061714172363, 7.717804908752441, 8.62254810333252, 9.527292251586914, 10.432035446166992, 11.33677864074707, 12.241521835327148, 13.146265029907227, 14.051009178161621, 14.9557523727417, 15.860495567321777, 16.765239715576172, 17.66998291015625, 18.574726104736328, 19.479469299316406, 20.384212493896484, 21.288955688476562, 22.19369888305664, 23.09844207763672, 24.00318717956543, 24.907930374145508, 25.812673568725586, 26.717416763305664, 27.622159957885742, 28.52690315246582, 29.43164825439453, 30.33639144897461, 31.241134643554688, 32.145877838134766, 33.050621032714844]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 2.0, 5.0, 7.0, 3.0, 2.0, 6.0, 7.0, 6.0, 11.0, 9.0, 12.0, 7.0, 19.0, 20.0, 15.0, 28.0, 20.0, 21.0, 30.0, 29.0, 24.0, 30.0, 36.0, 35.0, 37.0, 34.0, 36.0, 42.0, 31.0, 36.0, 37.0, 32.0, 30.0, 24.0, 28.0, 32.0, 15.0, 35.0, 20.0, 19.0, 22.0, 20.0, 14.0, 13.0, 12.0, 11.0, 11.0, 8.0, 6.0, 7.0, 3.0, 2.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.898344039916992, -20.2132511138916, -19.52815818786621, -18.843063354492188, -18.157970428466797, -17.472877502441406, -16.787784576416016, -16.102691650390625, -15.417598724365234, -14.732505798339844, -14.047411918640137, -13.362318992614746, -12.677226066589355, -11.992132186889648, -11.307039260864258, -10.621946334838867, -9.93685245513916, -9.25175952911377, -8.566665649414062, -7.881572723388672, -7.196479797363281, -6.511386394500732, -5.826292991638184, -5.141200065612793, -4.456106662750244, -3.7710134983062744, -3.0859203338623047, -2.400826930999756, -1.7157337665557861, -1.0306406021118164, -0.3455471992492676, 0.33954572677612305, 1.0246391296386719, 1.7097322940826416, 2.3948254585266113, 3.07991886138916, 3.76501202583313, 4.4501051902771, 5.135198593139648, 5.820291519165039, 6.505384922027588, 7.190478324890137, 7.875571250915527, 8.560665130615234, 9.245758056640625, 9.930850982666016, 10.615943908691406, 11.301036834716797, 11.986130714416504, 12.671223640441895, 13.356317520141602, 14.041410446166992, 14.726503372192383, 15.411596298217773, 16.096691131591797, 16.781784057617188, 17.466876983642578, 18.15196990966797, 18.83706283569336, 19.52215576171875, 20.207250595092773, 20.892343521118164, 21.577436447143555, 22.262529373168945, 22.947622299194336]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 2.0, 4.0, 10.0, 10.0, 19.0, 20.0, 27.0, 44.0, 68.0, 114.0, 170.0, 276.0, 486.0, 733.0, 1186.0, 1797.0, 2699.0, 4052.0, 6171.0, 9308.0, 14219.0, 20868.0, 30101.0, 42394.0, 57308.0, 74096.0, 90735.0, 103175.0, 108048.0, 104701.0, 93728.0, 77473.0, 60651.0, 45199.0, 31941.0, 22033.0, 15192.0, 9982.0, 6777.0, 4372.0, 2931.0, 1953.0, 1217.0, 810.0, 538.0, 343.0, 208.0, 148.0, 71.0, 71.0, 31.0, 22.0, 14.0, 7.0, 4.0, 4.0, 4.0, 0.0, 1.0, 2.0], "bins": [-18.890625, -18.31103515625, -17.7314453125, -17.15185546875, -16.572265625, -15.99267578125, -15.4130859375, -14.83349609375, -14.25390625, -13.67431640625, -13.0947265625, -12.51513671875, -11.935546875, -11.35595703125, -10.7763671875, -10.19677734375, -9.6171875, -9.03759765625, -8.4580078125, -7.87841796875, -7.298828125, -6.71923828125, -6.1396484375, -5.56005859375, -4.98046875, -4.40087890625, -3.8212890625, -3.24169921875, -2.662109375, -2.08251953125, -1.5029296875, -0.92333984375, -0.34375, 0.23583984375, 0.8154296875, 1.39501953125, 1.974609375, 2.55419921875, 3.1337890625, 3.71337890625, 4.29296875, 4.87255859375, 5.4521484375, 6.03173828125, 6.611328125, 7.19091796875, 7.7705078125, 8.35009765625, 8.9296875, 9.50927734375, 10.0888671875, 10.66845703125, 11.248046875, 11.82763671875, 12.4072265625, 12.98681640625, 13.56640625, 14.14599609375, 14.7255859375, 15.30517578125, 15.884765625, 16.46435546875, 17.0439453125, 17.62353515625, 18.203125]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 6.0, 7.0, 5.0, 4.0, 10.0, 8.0, 10.0, 18.0, 9.0, 17.0, 18.0, 21.0, 19.0, 12.0, 25.0, 34.0, 27.0, 31.0, 39.0, 35.0, 37.0, 46.0, 33.0, 34.0, 41.0, 43.0, 31.0, 37.0, 26.0, 29.0, 29.0, 30.0, 27.0, 25.0, 25.0, 27.0, 12.0, 18.0, 13.0, 18.0, 12.0, 9.0, 12.0, 5.0, 8.0, 8.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.03125, -21.316650390625, -20.60205078125, -19.887451171875, -19.1728515625, -18.458251953125, -17.74365234375, -17.029052734375, -16.314453125, -15.599853515625, -14.88525390625, -14.170654296875, -13.4560546875, -12.741455078125, -12.02685546875, -11.312255859375, -10.59765625, -9.883056640625, -9.16845703125, -8.453857421875, -7.7392578125, -7.024658203125, -6.31005859375, -5.595458984375, -4.880859375, -4.166259765625, -3.45166015625, -2.737060546875, -2.0224609375, -1.307861328125, -0.59326171875, 0.121337890625, 0.8359375, 1.550537109375, 2.26513671875, 2.979736328125, 3.6943359375, 4.408935546875, 5.12353515625, 5.838134765625, 6.552734375, 7.267333984375, 7.98193359375, 8.696533203125, 9.4111328125, 10.125732421875, 10.84033203125, 11.554931640625, 12.26953125, 12.984130859375, 13.69873046875, 14.413330078125, 15.1279296875, 15.842529296875, 16.55712890625, 17.271728515625, 17.986328125, 18.700927734375, 19.41552734375, 20.130126953125, 20.8447265625, 21.559326171875, 22.27392578125, 22.988525390625, 23.703125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 8.0, 5.0, 9.0, 13.0, 24.0, 37.0, 50.0, 88.0, 130.0, 196.0, 284.0, 408.0, 598.0, 985.0, 1490.0, 2278.0, 3346.0, 5005.0, 7648.0, 11157.0, 16809.0, 24074.0, 34290.0, 47410.0, 62793.0, 78861.0, 93102.0, 102523.0, 104871.0, 99923.0, 87258.0, 71955.0, 55763.0, 41519.0, 30099.0, 20841.0, 14211.0, 9478.0, 6501.0, 4251.0, 2819.0, 1873.0, 1195.0, 790.0, 521.0, 366.0, 251.0, 153.0, 114.0, 77.0, 34.0, 25.0, 19.0, 14.0, 10.0, 7.0, 3.0, 2.0, 0.0, 5.0], "bins": [-19.96875, -19.350341796875, -18.73193359375, -18.113525390625, -17.4951171875, -16.876708984375, -16.25830078125, -15.639892578125, -15.021484375, -14.403076171875, -13.78466796875, -13.166259765625, -12.5478515625, -11.929443359375, -11.31103515625, -10.692626953125, -10.07421875, -9.455810546875, -8.83740234375, -8.218994140625, -7.6005859375, -6.982177734375, -6.36376953125, -5.745361328125, -5.126953125, -4.508544921875, -3.89013671875, -3.271728515625, -2.6533203125, -2.034912109375, -1.41650390625, -0.798095703125, -0.1796875, 0.438720703125, 1.05712890625, 1.675537109375, 2.2939453125, 2.912353515625, 3.53076171875, 4.149169921875, 4.767578125, 5.385986328125, 6.00439453125, 6.622802734375, 7.2412109375, 7.859619140625, 8.47802734375, 9.096435546875, 9.71484375, 10.333251953125, 10.95166015625, 11.570068359375, 12.1884765625, 12.806884765625, 13.42529296875, 14.043701171875, 14.662109375, 15.280517578125, 15.89892578125, 16.517333984375, 17.1357421875, 17.754150390625, 18.37255859375, 18.990966796875, 19.609375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 9.0, 9.0, 11.0, 13.0, 8.0, 15.0, 12.0, 13.0, 20.0, 24.0, 29.0, 27.0, 21.0, 26.0, 31.0, 35.0, 31.0, 36.0, 41.0, 34.0, 31.0, 33.0, 38.0, 29.0, 36.0, 37.0, 42.0, 38.0, 37.0, 26.0, 28.0, 25.0, 21.0, 23.0, 17.0, 10.0, 14.0, 8.0, 9.0, 9.0, 12.0, 7.0, 4.0, 10.0, 4.0, 2.0, 1.0, 0.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.796875, -14.319580078125, -13.84228515625, -13.364990234375, -12.8876953125, -12.410400390625, -11.93310546875, -11.455810546875, -10.978515625, -10.501220703125, -10.02392578125, -9.546630859375, -9.0693359375, -8.592041015625, -8.11474609375, -7.637451171875, -7.16015625, -6.682861328125, -6.20556640625, -5.728271484375, -5.2509765625, -4.773681640625, -4.29638671875, -3.819091796875, -3.341796875, -2.864501953125, -2.38720703125, -1.909912109375, -1.4326171875, -0.955322265625, -0.47802734375, -0.000732421875, 0.4765625, 0.953857421875, 1.43115234375, 1.908447265625, 2.3857421875, 2.863037109375, 3.34033203125, 3.817626953125, 4.294921875, 4.772216796875, 5.24951171875, 5.726806640625, 6.2041015625, 6.681396484375, 7.15869140625, 7.635986328125, 8.11328125, 8.590576171875, 9.06787109375, 9.545166015625, 10.0224609375, 10.499755859375, 10.97705078125, 11.454345703125, 11.931640625, 12.408935546875, 12.88623046875, 13.363525390625, 13.8408203125, 14.318115234375, 14.79541015625, 15.272705078125, 15.75]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 4.0, 14.0, 11.0, 20.0, 27.0, 37.0, 53.0, 74.0, 101.0, 138.0, 200.0, 304.0, 415.0, 567.0, 808.0, 1253.0, 2127.0, 3753.0, 8023.0, 20649.0, 63546.0, 183668.0, 335125.0, 262921.0, 105824.0, 34209.0, 12090.0, 5089.0, 2604.0, 1598.0, 1020.0, 680.0, 474.0, 339.0, 248.0, 131.0, 126.0, 87.0, 61.0, 38.0, 37.0, 22.0, 11.0, 9.0, 11.0, 2.0, 8.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-27.46875, -26.654296875, -25.83984375, -25.025390625, -24.2109375, -23.396484375, -22.58203125, -21.767578125, -20.953125, -20.138671875, -19.32421875, -18.509765625, -17.6953125, -16.880859375, -16.06640625, -15.251953125, -14.4375, -13.623046875, -12.80859375, -11.994140625, -11.1796875, -10.365234375, -9.55078125, -8.736328125, -7.921875, -7.107421875, -6.29296875, -5.478515625, -4.6640625, -3.849609375, -3.03515625, -2.220703125, -1.40625, -0.591796875, 0.22265625, 1.037109375, 1.8515625, 2.666015625, 3.48046875, 4.294921875, 5.109375, 5.923828125, 6.73828125, 7.552734375, 8.3671875, 9.181640625, 9.99609375, 10.810546875, 11.625, 12.439453125, 13.25390625, 14.068359375, 14.8828125, 15.697265625, 16.51171875, 17.326171875, 18.140625, 18.955078125, 19.76953125, 20.583984375, 21.3984375, 22.212890625, 23.02734375, 23.841796875, 24.65625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 10.0, 11.0, 10.0, 12.0, 23.0, 27.0, 48.0, 54.0, 85.0, 91.0, 105.0, 92.0, 77.0, 85.0, 70.0, 44.0, 39.0, 30.0, 16.0, 16.0, 16.0, 4.0, 4.0, 7.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002071380615234375, -0.0019976794719696045, -0.001923978328704834, -0.0018502771854400635, -0.001776576042175293, -0.0017028748989105225, -0.001629173755645752, -0.0015554726123809814, -0.001481771469116211, -0.0014080703258514404, -0.00133436918258667, -0.0012606680393218994, -0.001186966896057129, -0.0011132657527923584, -0.0010395646095275879, -0.0009658634662628174, -0.0008921623229980469, -0.0008184611797332764, -0.0007447600364685059, -0.0006710588932037354, -0.0005973577499389648, -0.0005236566066741943, -0.00044995546340942383, -0.0003762543201446533, -0.0003025531768798828, -0.0002288520336151123, -0.0001551508903503418, -8.144974708557129e-05, -7.748603820800781e-06, 6.595253944396973e-05, 0.00013965368270874023, 0.00021335482597351074, 0.00028705596923828125, 0.00036075711250305176, 0.00043445825576782227, 0.0005081593990325928, 0.0005818605422973633, 0.0006555616855621338, 0.0007292628288269043, 0.0008029639720916748, 0.0008766651153564453, 0.0009503662586212158, 0.0010240674018859863, 0.0010977685451507568, 0.0011714696884155273, 0.0012451708316802979, 0.0013188719749450684, 0.0013925731182098389, 0.0014662742614746094, 0.0015399754047393799, 0.0016136765480041504, 0.001687377691268921, 0.0017610788345336914, 0.001834779977798462, 0.0019084811210632324, 0.001982182264328003, 0.0020558834075927734, 0.002129584550857544, 0.0022032856941223145, 0.002276986837387085, 0.0023506879806518555, 0.002424389123916626, 0.0024980902671813965, 0.002571791410446167, 0.0026454925537109375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 9.0, 15.0, 16.0, 15.0, 33.0, 54.0, 83.0, 118.0, 187.0, 247.0, 368.0, 590.0, 1036.0, 1908.0, 3963.0, 9315.0, 26392.0, 74511.0, 181526.0, 288908.0, 253144.0, 128151.0, 48123.0, 16941.0, 6287.0, 2861.0, 1417.0, 827.0, 539.0, 300.0, 226.0, 145.0, 102.0, 70.0, 56.0, 22.0, 16.0, 12.0, 8.0, 7.0, 2.0, 2.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.859375, -20.203125, -19.546875, -18.890625, -18.234375, -17.578125, -16.921875, -16.265625, -15.609375, -14.953125, -14.296875, -13.640625, -12.984375, -12.328125, -11.671875, -11.015625, -10.359375, -9.703125, -9.046875, -8.390625, -7.734375, -7.078125, -6.421875, -5.765625, -5.109375, -4.453125, -3.796875, -3.140625, -2.484375, -1.828125, -1.171875, -0.515625, 0.140625, 0.796875, 1.453125, 2.109375, 2.765625, 3.421875, 4.078125, 4.734375, 5.390625, 6.046875, 6.703125, 7.359375, 8.015625, 8.671875, 9.328125, 9.984375, 10.640625, 11.296875, 11.953125, 12.609375, 13.265625, 13.921875, 14.578125, 15.234375, 15.890625, 16.546875, 17.203125, 17.859375, 18.515625, 19.171875, 19.828125, 20.484375, 21.140625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 8.0, 9.0, 17.0, 25.0, 27.0, 35.0, 47.0, 57.0, 71.0, 76.0, 79.0, 94.0, 87.0, 78.0, 60.0, 46.0, 53.0, 34.0, 25.0, 16.0, 13.0, 7.0, 4.0, 5.0, 5.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.9765625, -5.801025390625, -5.62548828125, -5.449951171875, -5.2744140625, -5.098876953125, -4.92333984375, -4.747802734375, -4.572265625, -4.396728515625, -4.22119140625, -4.045654296875, -3.8701171875, -3.694580078125, -3.51904296875, -3.343505859375, -3.16796875, -2.992431640625, -2.81689453125, -2.641357421875, -2.4658203125, -2.290283203125, -2.11474609375, -1.939208984375, -1.763671875, -1.588134765625, -1.41259765625, -1.237060546875, -1.0615234375, -0.885986328125, -0.71044921875, -0.534912109375, -0.359375, -0.183837890625, -0.00830078125, 0.167236328125, 0.3427734375, 0.518310546875, 0.69384765625, 0.869384765625, 1.044921875, 1.220458984375, 1.39599609375, 1.571533203125, 1.7470703125, 1.922607421875, 2.09814453125, 2.273681640625, 2.44921875, 2.624755859375, 2.80029296875, 2.975830078125, 3.1513671875, 3.326904296875, 3.50244140625, 3.677978515625, 3.853515625, 4.029052734375, 4.20458984375, 4.380126953125, 4.5556640625, 4.731201171875, 4.90673828125, 5.082275390625, 5.2578125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 3.0, 7.0, 3.0, 14.0, 13.0, 21.0, 14.0, 22.0, 30.0, 30.0, 29.0, 18.0, 43.0, 47.0, 31.0, 36.0, 42.0, 46.0, 45.0, 47.0, 42.0, 40.0, 43.0, 50.0, 47.0, 34.0, 39.0, 10.0, 26.0, 21.0, 13.0, 13.0, 12.0, 12.0, 5.0, 13.0, 5.0, 6.0, 8.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.16592025756836, -23.354825973510742, -22.543731689453125, -21.732637405395508, -20.92154312133789, -20.11044692993164, -19.299352645874023, -18.488258361816406, -17.67716407775879, -16.866069793701172, -16.054975509643555, -15.243880271911621, -14.432785987854004, -13.621691703796387, -12.810596466064453, -11.999502182006836, -11.188407897949219, -10.377313613891602, -9.566219329833984, -8.75512409210205, -7.944029808044434, -7.132935523986816, -6.321840763092041, -5.510746002197266, -4.699651718139648, -3.888557195663452, -3.077462673187256, -2.2663681507110596, -1.4552736282348633, -0.6441793441772461, 0.1669154167175293, 0.9780101776123047, 1.789102554321289, 2.6001970767974854, 3.4112915992736816, 4.222386360168457, 5.033480644226074, 5.844574928283691, 6.655669689178467, 7.466764450073242, 8.27785873413086, 9.088953018188477, 9.900047302246094, 10.711142539978027, 11.522236824035645, 12.333331108093262, 13.144426345825195, 13.955520629882812, 14.76661491394043, 15.577709197998047, 16.388803482055664, 17.19989776611328, 18.01099395751953, 18.822086334228516, 19.633182525634766, 20.444276809692383, 21.25537109375, 22.066465377807617, 22.877559661865234, 23.68865394592285, 24.49974822998047, 25.31084442138672, 26.121938705444336, 26.933032989501953, 27.74412727355957]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 6.0, 7.0, 11.0, 11.0, 15.0, 15.0, 18.0, 22.0, 20.0, 17.0, 17.0, 29.0, 37.0, 38.0, 37.0, 37.0, 30.0, 46.0, 37.0, 34.0, 47.0, 45.0, 45.0, 42.0, 36.0, 35.0, 38.0, 27.0, 28.0, 31.0, 16.0, 23.0, 16.0, 16.0, 12.0, 15.0, 14.0, 11.0, 3.0, 8.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-27.236860275268555, -26.4128360748291, -25.588809967041016, -24.764785766601562, -23.94076156616211, -23.116737365722656, -22.29271125793457, -21.468687057495117, -20.64466094970703, -19.820636749267578, -18.996610641479492, -18.17258644104004, -17.348562240600586, -16.5245361328125, -15.700511932373047, -14.876487731933594, -14.05246353149414, -13.228438377380371, -12.404414176940918, -11.580389022827148, -10.756364822387695, -9.932339668273926, -9.108314514160156, -8.284290313720703, -7.460265159606934, -6.636240482330322, -5.812215805053711, -4.988190650939941, -4.16416597366333, -3.3401412963867188, -2.516116142272949, -1.692091464996338, -0.8680667877197266, -0.044041991233825684, 0.7799828052520752, 1.6040077209472656, 2.428032398223877, 3.2520570755004883, 4.076082229614258, 4.900106906890869, 5.7241315841674805, 6.548156261444092, 7.372180938720703, 8.196206092834473, 9.020231246948242, 9.844255447387695, 10.668280601501465, 11.492305755615234, 12.316329956054688, 13.140355110168457, 13.96437931060791, 14.78840446472168, 15.612428665161133, 16.43645477294922, 17.260478973388672, 18.084503173828125, 18.908527374267578, 19.73255157470703, 20.556577682495117, 21.38060188293457, 22.204626083374023, 23.02865219116211, 23.852676391601562, 24.676700592041016, 25.5007266998291]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 9.0, 19.0, 29.0, 58.0, 70.0, 121.0, 167.0, 332.0, 574.0, 995.0, 1555.0, 2638.0, 4492.0, 7874.0, 13407.0, 23532.0, 40860.0, 72894.0, 127632.0, 221480.0, 362476.0, 532182.0, 657062.0, 663211.0, 543861.0, 375245.0, 230213.0, 132729.0, 75911.0, 43043.0, 24478.0, 14472.0, 8343.0, 5015.0, 2844.0, 1755.0, 1106.0, 613.0, 364.0, 222.0, 146.0, 98.0, 70.0, 35.0, 23.0, 9.0, 12.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.765625, -19.107666015625, -18.44970703125, -17.791748046875, -17.1337890625, -16.475830078125, -15.81787109375, -15.159912109375, -14.501953125, -13.843994140625, -13.18603515625, -12.528076171875, -11.8701171875, -11.212158203125, -10.55419921875, -9.896240234375, -9.23828125, -8.580322265625, -7.92236328125, -7.264404296875, -6.6064453125, -5.948486328125, -5.29052734375, -4.632568359375, -3.974609375, -3.316650390625, -2.65869140625, -2.000732421875, -1.3427734375, -0.684814453125, -0.02685546875, 0.631103515625, 1.2890625, 1.947021484375, 2.60498046875, 3.262939453125, 3.9208984375, 4.578857421875, 5.23681640625, 5.894775390625, 6.552734375, 7.210693359375, 7.86865234375, 8.526611328125, 9.1845703125, 9.842529296875, 10.50048828125, 11.158447265625, 11.81640625, 12.474365234375, 13.13232421875, 13.790283203125, 14.4482421875, 15.106201171875, 15.76416015625, 16.422119140625, 17.080078125, 17.738037109375, 18.39599609375, 19.053955078125, 19.7119140625, 20.369873046875, 21.02783203125, 21.685791015625, 22.34375]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 10.0, 10.0, 12.0, 10.0, 8.0, 13.0, 15.0, 22.0, 24.0, 23.0, 23.0, 37.0, 33.0, 40.0, 24.0, 44.0, 37.0, 34.0, 36.0, 64.0, 44.0, 48.0, 37.0, 40.0, 51.0, 33.0, 28.0, 28.0, 29.0, 24.0, 19.0, 18.0, 15.0, 18.0, 13.0, 7.0, 12.0, 5.0, 5.0, 12.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-26.421875, -25.6806640625, -24.939453125, -24.1982421875, -23.45703125, -22.7158203125, -21.974609375, -21.2333984375, -20.4921875, -19.7509765625, -19.009765625, -18.2685546875, -17.52734375, -16.7861328125, -16.044921875, -15.3037109375, -14.5625, -13.8212890625, -13.080078125, -12.3388671875, -11.59765625, -10.8564453125, -10.115234375, -9.3740234375, -8.6328125, -7.8916015625, -7.150390625, -6.4091796875, -5.66796875, -4.9267578125, -4.185546875, -3.4443359375, -2.703125, -1.9619140625, -1.220703125, -0.4794921875, 0.26171875, 1.0029296875, 1.744140625, 2.4853515625, 3.2265625, 3.9677734375, 4.708984375, 5.4501953125, 6.19140625, 6.9326171875, 7.673828125, 8.4150390625, 9.15625, 9.8974609375, 10.638671875, 11.3798828125, 12.12109375, 12.8623046875, 13.603515625, 14.3447265625, 15.0859375, 15.8271484375, 16.568359375, 17.3095703125, 18.05078125, 18.7919921875, 19.533203125, 20.2744140625, 21.015625]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 6.0, 4.0, 13.0, 19.0, 41.0, 42.0, 115.0, 158.0, 291.0, 512.0, 852.0, 1551.0, 2731.0, 4886.0, 8984.0, 16455.0, 30622.0, 54682.0, 98273.0, 174592.0, 294325.0, 459663.0, 623123.0, 696672.0, 615902.0, 446152.0, 283698.0, 168222.0, 94836.0, 52351.0, 29294.0, 15770.0, 8554.0, 4797.0, 2711.0, 1457.0, 824.0, 456.0, 269.0, 162.0, 94.0, 56.0, 30.0, 12.0, 16.0, 8.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.296875, -24.492919921875, -23.68896484375, -22.885009765625, -22.0810546875, -21.277099609375, -20.47314453125, -19.669189453125, -18.865234375, -18.061279296875, -17.25732421875, -16.453369140625, -15.6494140625, -14.845458984375, -14.04150390625, -13.237548828125, -12.43359375, -11.629638671875, -10.82568359375, -10.021728515625, -9.2177734375, -8.413818359375, -7.60986328125, -6.805908203125, -6.001953125, -5.197998046875, -4.39404296875, -3.590087890625, -2.7861328125, -1.982177734375, -1.17822265625, -0.374267578125, 0.4296875, 1.233642578125, 2.03759765625, 2.841552734375, 3.6455078125, 4.449462890625, 5.25341796875, 6.057373046875, 6.861328125, 7.665283203125, 8.46923828125, 9.273193359375, 10.0771484375, 10.881103515625, 11.68505859375, 12.489013671875, 13.29296875, 14.096923828125, 14.90087890625, 15.704833984375, 16.5087890625, 17.312744140625, 18.11669921875, 18.920654296875, 19.724609375, 20.528564453125, 21.33251953125, 22.136474609375, 22.9404296875, 23.744384765625, 24.54833984375, 25.352294921875, 26.15625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 7.0, 2.0, 7.0, 8.0, 7.0, 9.0, 15.0, 21.0, 28.0, 32.0, 45.0, 50.0, 54.0, 67.0, 80.0, 87.0, 107.0, 116.0, 144.0, 161.0, 165.0, 186.0, 179.0, 215.0, 197.0, 214.0, 220.0, 193.0, 196.0, 194.0, 168.0, 129.0, 121.0, 135.0, 101.0, 76.0, 75.0, 46.0, 46.0, 36.0, 31.0, 24.0, 29.0, 10.0, 12.0, 14.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0], "bins": [-9.6484375, -9.3719482421875, -9.095458984375, -8.8189697265625, -8.54248046875, -8.2659912109375, -7.989501953125, -7.7130126953125, -7.4365234375, -7.1600341796875, -6.883544921875, -6.6070556640625, -6.33056640625, -6.0540771484375, -5.777587890625, -5.5010986328125, -5.224609375, -4.9481201171875, -4.671630859375, -4.3951416015625, -4.11865234375, -3.8421630859375, -3.565673828125, -3.2891845703125, -3.0126953125, -2.7362060546875, -2.459716796875, -2.1832275390625, -1.90673828125, -1.6302490234375, -1.353759765625, -1.0772705078125, -0.80078125, -0.5242919921875, -0.247802734375, 0.0286865234375, 0.30517578125, 0.5816650390625, 0.858154296875, 1.1346435546875, 1.4111328125, 1.6876220703125, 1.964111328125, 2.2406005859375, 2.51708984375, 2.7935791015625, 3.070068359375, 3.3465576171875, 3.623046875, 3.8995361328125, 4.176025390625, 4.4525146484375, 4.72900390625, 5.0054931640625, 5.281982421875, 5.5584716796875, 5.8349609375, 6.1114501953125, 6.387939453125, 6.6644287109375, 6.94091796875, 7.2174072265625, 7.493896484375, 7.7703857421875, 8.046875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 2.0, 2.0, 4.0, 6.0, 8.0, 13.0, 9.0, 12.0, 11.0, 11.0, 25.0, 17.0, 40.0, 26.0, 31.0, 31.0, 32.0, 43.0, 50.0, 35.0, 54.0, 44.0, 44.0, 35.0, 39.0, 46.0, 37.0, 37.0, 44.0, 26.0, 21.0, 29.0, 24.0, 25.0, 14.0, 10.0, 9.0, 11.0, 9.0, 8.0, 9.0, 6.0, 3.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0], "bins": [-27.20257568359375, -26.402612686157227, -25.60264778137207, -24.802684783935547, -24.00271987915039, -23.202756881713867, -22.402793884277344, -21.602828979492188, -20.802865982055664, -20.00290298461914, -19.202938079833984, -18.40297508239746, -17.603012084960938, -16.80304718017578, -16.003084182739258, -15.203120231628418, -14.403156280517578, -13.603192329406738, -12.803228378295898, -12.003265380859375, -11.203301429748535, -10.403337478637695, -9.603374481201172, -8.803410530090332, -8.003446578979492, -7.203482627868652, -6.403519153594971, -5.603555679321289, -4.803591728210449, -4.003627777099609, -3.2036643028259277, -2.403700828552246, -1.6037349700927734, -0.8037712574005127, -0.003807544708251953, 0.7961561679840088, 1.5961198806762695, 2.3960835933685303, 3.196047306060791, 3.9960107803344727, 4.7959747314453125, 5.595938682556152, 6.395902156829834, 7.195865631103516, 7.9958295822143555, 8.795793533325195, 9.595756530761719, 10.395720481872559, 11.195684432983398, 11.995648384094238, 12.795612335205078, 13.595575332641602, 14.395539283752441, 15.195503234863281, 15.995466232299805, 16.795429229736328, 17.595394134521484, 18.395357131958008, 19.195322036743164, 19.995285034179688, 20.795249938964844, 21.595212936401367, 22.39517593383789, 23.195140838623047, 23.99510383605957]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 9.0, 9.0, 13.0, 15.0, 19.0, 20.0, 13.0, 20.0, 22.0, 27.0, 29.0, 21.0, 37.0, 32.0, 25.0, 45.0, 39.0, 37.0, 42.0, 54.0, 34.0, 49.0, 29.0, 35.0, 50.0, 22.0, 41.0, 29.0, 33.0, 25.0, 20.0, 18.0, 21.0, 13.0, 9.0, 9.0, 6.0, 7.0, 5.0, 6.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.329103469848633, -23.54814338684082, -22.76718521118164, -21.986225128173828, -21.205265045166016, -20.424304962158203, -19.64334487915039, -18.86238670349121, -18.0814266204834, -17.300466537475586, -16.519508361816406, -15.738548278808594, -14.957588195800781, -14.176628112792969, -13.395668983459473, -12.614709854125977, -11.833749771118164, -11.052789688110352, -10.271830558776855, -9.49087142944336, -8.709911346435547, -7.928951740264893, -7.147992134094238, -6.367032527923584, -5.58607292175293, -4.805113315582275, -4.024153709411621, -3.243194103240967, -2.4622344970703125, -1.6812748908996582, -0.9003152847290039, -0.11935567855834961, 0.6616039276123047, 1.442563533782959, 2.2235231399536133, 3.0044827461242676, 3.785442352294922, 4.566401958465576, 5.3473615646362305, 6.128321170806885, 6.909280776977539, 7.690240383148193, 8.471199989318848, 9.252159118652344, 10.033119201660156, 10.814079284667969, 11.595038414001465, 12.375997543334961, 13.156957626342773, 13.937917709350586, 14.718876838684082, 15.499835968017578, 16.28079605102539, 17.061756134033203, 17.842716217041016, 18.623674392700195, 19.404634475708008, 20.18559455871582, 20.966552734375, 21.747512817382812, 22.528472900390625, 23.309432983398438, 24.09039306640625, 24.87135124206543, 25.652311325073242]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [7.0, 3.0, 5.0, 4.0, 11.0, 9.0, 19.0, 20.0, 31.0, 42.0, 57.0, 73.0, 108.0, 180.0, 252.0, 356.0, 548.0, 862.0, 1295.0, 1939.0, 3033.0, 4801.0, 7691.0, 12189.0, 20041.0, 34276.0, 61134.0, 109712.0, 182394.0, 216846.0, 164497.0, 95131.0, 53089.0, 30385.0, 17733.0, 10708.0, 6793.0, 4167.0, 2784.0, 1798.0, 1204.0, 791.0, 500.0, 325.0, 236.0, 155.0, 103.0, 69.0, 46.0, 45.0, 17.0, 16.0, 13.0, 13.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-39.9375, -38.578125, -37.21875, -35.859375, -34.5, -33.140625, -31.78125, -30.421875, -29.0625, -27.703125, -26.34375, -24.984375, -23.625, -22.265625, -20.90625, -19.546875, -18.1875, -16.828125, -15.46875, -14.109375, -12.75, -11.390625, -10.03125, -8.671875, -7.3125, -5.953125, -4.59375, -3.234375, -1.875, -0.515625, 0.84375, 2.203125, 3.5625, 4.921875, 6.28125, 7.640625, 9.0, 10.359375, 11.71875, 13.078125, 14.4375, 15.796875, 17.15625, 18.515625, 19.875, 21.234375, 22.59375, 23.953125, 25.3125, 26.671875, 28.03125, 29.390625, 30.75, 32.109375, 33.46875, 34.828125, 36.1875, 37.546875, 38.90625, 40.265625, 41.625, 42.984375, 44.34375, 45.703125, 47.0625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 7.0, 10.0, 7.0, 11.0, 4.0, 12.0, 8.0, 10.0, 23.0, 16.0, 20.0, 25.0, 21.0, 41.0, 20.0, 40.0, 35.0, 31.0, 38.0, 51.0, 32.0, 41.0, 47.0, 43.0, 33.0, 29.0, 36.0, 31.0, 31.0, 31.0, 24.0, 25.0, 33.0, 27.0, 10.0, 18.0, 16.0, 12.0, 13.0, 8.0, 7.0, 8.0, 4.0, 2.0, 1.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.28125, -22.5517578125, -21.822265625, -21.0927734375, -20.36328125, -19.6337890625, -18.904296875, -18.1748046875, -17.4453125, -16.7158203125, -15.986328125, -15.2568359375, -14.52734375, -13.7978515625, -13.068359375, -12.3388671875, -11.609375, -10.8798828125, -10.150390625, -9.4208984375, -8.69140625, -7.9619140625, -7.232421875, -6.5029296875, -5.7734375, -5.0439453125, -4.314453125, -3.5849609375, -2.85546875, -2.1259765625, -1.396484375, -0.6669921875, 0.0625, 0.7919921875, 1.521484375, 2.2509765625, 2.98046875, 3.7099609375, 4.439453125, 5.1689453125, 5.8984375, 6.6279296875, 7.357421875, 8.0869140625, 8.81640625, 9.5458984375, 10.275390625, 11.0048828125, 11.734375, 12.4638671875, 13.193359375, 13.9228515625, 14.65234375, 15.3818359375, 16.111328125, 16.8408203125, 17.5703125, 18.2998046875, 19.029296875, 19.7587890625, 20.48828125, 21.2177734375, 21.947265625, 22.6767578125, 23.40625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 11.0, 16.0, 10.0, 14.0, 20.0, 27.0, 45.0, 70.0, 94.0, 166.0, 259.0, 366.0, 515.0, 792.0, 1168.0, 1755.0, 2731.0, 4096.0, 6161.0, 9539.0, 14999.0, 23615.0, 39375.0, 69151.0, 126797.0, 209494.0, 215275.0, 136141.0, 73775.0, 41694.0, 25231.0, 15674.0, 10120.0, 6570.0, 4409.0, 2799.0, 1862.0, 1247.0, 762.0, 564.0, 377.0, 257.0, 175.0, 101.0, 84.0, 57.0, 35.0, 23.0, 16.0, 15.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-44.40625, -42.9765625, -41.546875, -40.1171875, -38.6875, -37.2578125, -35.828125, -34.3984375, -32.96875, -31.5390625, -30.109375, -28.6796875, -27.25, -25.8203125, -24.390625, -22.9609375, -21.53125, -20.1015625, -18.671875, -17.2421875, -15.8125, -14.3828125, -12.953125, -11.5234375, -10.09375, -8.6640625, -7.234375, -5.8046875, -4.375, -2.9453125, -1.515625, -0.0859375, 1.34375, 2.7734375, 4.203125, 5.6328125, 7.0625, 8.4921875, 9.921875, 11.3515625, 12.78125, 14.2109375, 15.640625, 17.0703125, 18.5, 19.9296875, 21.359375, 22.7890625, 24.21875, 25.6484375, 27.078125, 28.5078125, 29.9375, 31.3671875, 32.796875, 34.2265625, 35.65625, 37.0859375, 38.515625, 39.9453125, 41.375, 42.8046875, 44.234375, 45.6640625, 47.09375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 1.0, 8.0, 5.0, 9.0, 4.0, 10.0, 7.0, 10.0, 9.0, 14.0, 17.0, 20.0, 23.0, 32.0, 29.0, 26.0, 36.0, 35.0, 44.0, 41.0, 37.0, 43.0, 45.0, 44.0, 43.0, 32.0, 40.0, 34.0, 40.0, 33.0, 27.0, 32.0, 26.0, 21.0, 17.0, 13.0, 12.0, 16.0, 12.0, 14.0, 10.0, 6.0, 5.0, 8.0, 5.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-17.5, -16.9837646484375, -16.467529296875, -15.9512939453125, -15.43505859375, -14.9188232421875, -14.402587890625, -13.8863525390625, -13.3701171875, -12.8538818359375, -12.337646484375, -11.8214111328125, -11.30517578125, -10.7889404296875, -10.272705078125, -9.7564697265625, -9.240234375, -8.7239990234375, -8.207763671875, -7.6915283203125, -7.17529296875, -6.6590576171875, -6.142822265625, -5.6265869140625, -5.1103515625, -4.5941162109375, -4.077880859375, -3.5616455078125, -3.04541015625, -2.5291748046875, -2.012939453125, -1.4967041015625, -0.98046875, -0.4642333984375, 0.052001953125, 0.5682373046875, 1.08447265625, 1.6007080078125, 2.116943359375, 2.6331787109375, 3.1494140625, 3.6656494140625, 4.181884765625, 4.6981201171875, 5.21435546875, 5.7305908203125, 6.246826171875, 6.7630615234375, 7.279296875, 7.7955322265625, 8.311767578125, 8.8280029296875, 9.34423828125, 9.8604736328125, 10.376708984375, 10.8929443359375, 11.4091796875, 11.9254150390625, 12.441650390625, 12.9578857421875, 13.47412109375, 13.9903564453125, 14.506591796875, 15.0228271484375, 15.5390625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 4.0, 3.0, 11.0, 6.0, 9.0, 20.0, 18.0, 25.0, 39.0, 43.0, 57.0, 63.0, 86.0, 120.0, 147.0, 213.0, 299.0, 448.0, 619.0, 880.0, 1270.0, 1864.0, 2960.0, 4725.0, 7527.0, 13001.0, 23131.0, 42606.0, 81659.0, 154316.0, 232670.0, 210323.0, 123709.0, 64563.0, 33501.0, 18558.0, 10656.0, 6440.0, 3914.0, 2571.0, 1620.0, 1127.0, 761.0, 569.0, 387.0, 307.0, 181.0, 117.0, 105.0, 86.0, 52.0, 57.0, 30.0, 20.0, 23.0, 14.0, 9.0, 12.0, 5.0, 6.0, 5.0, 3.0], "bins": [-18.8125, -18.2392578125, -17.666015625, -17.0927734375, -16.51953125, -15.9462890625, -15.373046875, -14.7998046875, -14.2265625, -13.6533203125, -13.080078125, -12.5068359375, -11.93359375, -11.3603515625, -10.787109375, -10.2138671875, -9.640625, -9.0673828125, -8.494140625, -7.9208984375, -7.34765625, -6.7744140625, -6.201171875, -5.6279296875, -5.0546875, -4.4814453125, -3.908203125, -3.3349609375, -2.76171875, -2.1884765625, -1.615234375, -1.0419921875, -0.46875, 0.1044921875, 0.677734375, 1.2509765625, 1.82421875, 2.3974609375, 2.970703125, 3.5439453125, 4.1171875, 4.6904296875, 5.263671875, 5.8369140625, 6.41015625, 6.9833984375, 7.556640625, 8.1298828125, 8.703125, 9.2763671875, 9.849609375, 10.4228515625, 10.99609375, 11.5693359375, 12.142578125, 12.7158203125, 13.2890625, 13.8623046875, 14.435546875, 15.0087890625, 15.58203125, 16.1552734375, 16.728515625, 17.3017578125, 17.875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 9.0, 8.0, 17.0, 16.0, 28.0, 48.0, 56.0, 130.0, 146.0, 157.0, 129.0, 82.0, 56.0, 27.0, 29.0, 16.0, 9.0, 8.0, 2.0, 8.0, 8.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002162933349609375, -0.002069026231765747, -0.001975119113922119, -0.0018812119960784912, -0.0017873048782348633, -0.0016933977603912354, -0.0015994906425476074, -0.0015055835247039795, -0.0014116764068603516, -0.0013177692890167236, -0.0012238621711730957, -0.0011299550533294678, -0.0010360479354858398, -0.0009421408176422119, -0.000848233699798584, -0.0007543265819549561, -0.0006604194641113281, -0.0005665123462677002, -0.00047260522842407227, -0.00037869811058044434, -0.0002847909927368164, -0.00019088387489318848, -9.697675704956055e-05, -3.069639205932617e-06, 9.083747863769531e-05, 0.00018474459648132324, 0.00027865171432495117, 0.0003725588321685791, 0.00046646595001220703, 0.000560373067855835, 0.0006542801856994629, 0.0007481873035430908, 0.0008420944213867188, 0.0009360015392303467, 0.0010299086570739746, 0.0011238157749176025, 0.0012177228927612305, 0.0013116300106048584, 0.0014055371284484863, 0.0014994442462921143, 0.0015933513641357422, 0.0016872584819793701, 0.001781165599822998, 0.001875072717666626, 0.001968979835510254, 0.002062886953353882, 0.0021567940711975098, 0.0022507011890411377, 0.0023446083068847656, 0.0024385154247283936, 0.0025324225425720215, 0.0026263296604156494, 0.0027202367782592773, 0.0028141438961029053, 0.002908051013946533, 0.003001958131790161, 0.003095865249633789, 0.003189772367477417, 0.003283679485321045, 0.003377586603164673, 0.0034714937210083008, 0.0035654008388519287, 0.0036593079566955566, 0.0037532150745391846, 0.0038471221923828125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 11.0, 10.0, 15.0, 18.0, 23.0, 40.0, 65.0, 69.0, 127.0, 183.0, 250.0, 411.0, 594.0, 1012.0, 1447.0, 2134.0, 3466.0, 5529.0, 8975.0, 14538.0, 23166.0, 37613.0, 58615.0, 86660.0, 118968.0, 144049.0, 146199.0, 125335.0, 94547.0, 64000.0, 41586.0, 26048.0, 15998.0, 9779.0, 6247.0, 3681.0, 2445.0, 1594.0, 1037.0, 697.0, 468.0, 312.0, 173.0, 136.0, 107.0, 61.0, 39.0, 34.0, 19.0, 8.0, 12.0, 7.0, 3.0, 1.0, 4.0, 4.0], "bins": [-13.5703125, -13.1724853515625, -12.774658203125, -12.3768310546875, -11.97900390625, -11.5811767578125, -11.183349609375, -10.7855224609375, -10.3876953125, -9.9898681640625, -9.592041015625, -9.1942138671875, -8.79638671875, -8.3985595703125, -8.000732421875, -7.6029052734375, -7.205078125, -6.8072509765625, -6.409423828125, -6.0115966796875, -5.61376953125, -5.2159423828125, -4.818115234375, -4.4202880859375, -4.0224609375, -3.6246337890625, -3.226806640625, -2.8289794921875, -2.43115234375, -2.0333251953125, -1.635498046875, -1.2376708984375, -0.83984375, -0.4420166015625, -0.044189453125, 0.3536376953125, 0.75146484375, 1.1492919921875, 1.547119140625, 1.9449462890625, 2.3427734375, 2.7406005859375, 3.138427734375, 3.5362548828125, 3.93408203125, 4.3319091796875, 4.729736328125, 5.1275634765625, 5.525390625, 5.9232177734375, 6.321044921875, 6.7188720703125, 7.11669921875, 7.5145263671875, 7.912353515625, 8.3101806640625, 8.7080078125, 9.1058349609375, 9.503662109375, 9.9014892578125, 10.29931640625, 10.6971435546875, 11.094970703125, 11.4927978515625, 11.890625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 0.0, 3.0, 5.0, 5.0, 5.0, 5.0, 8.0, 9.0, 10.0, 15.0, 19.0, 16.0, 23.0, 24.0, 29.0, 41.0, 40.0, 55.0, 65.0, 45.0, 56.0, 52.0, 58.0, 57.0, 53.0, 41.0, 45.0, 35.0, 37.0, 39.0, 27.0, 21.0, 13.0, 15.0, 8.0, 5.0, 8.0, 2.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.6328125, -5.44964599609375, -5.2664794921875, -5.08331298828125, -4.900146484375, -4.71697998046875, -4.5338134765625, -4.35064697265625, -4.16748046875, -3.98431396484375, -3.8011474609375, -3.61798095703125, -3.434814453125, -3.25164794921875, -3.0684814453125, -2.88531494140625, -2.7021484375, -2.51898193359375, -2.3358154296875, -2.15264892578125, -1.969482421875, -1.78631591796875, -1.6031494140625, -1.41998291015625, -1.23681640625, -1.05364990234375, -0.8704833984375, -0.68731689453125, -0.504150390625, -0.32098388671875, -0.1378173828125, 0.04534912109375, 0.228515625, 0.41168212890625, 0.5948486328125, 0.77801513671875, 0.961181640625, 1.14434814453125, 1.3275146484375, 1.51068115234375, 1.69384765625, 1.87701416015625, 2.0601806640625, 2.24334716796875, 2.426513671875, 2.60968017578125, 2.7928466796875, 2.97601318359375, 3.1591796875, 3.34234619140625, 3.5255126953125, 3.70867919921875, 3.891845703125, 4.07501220703125, 4.2581787109375, 4.44134521484375, 4.62451171875, 4.80767822265625, 4.9908447265625, 5.17401123046875, 5.357177734375, 5.54034423828125, 5.7235107421875, 5.90667724609375, 6.08984375]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 8.0, 10.0, 10.0, 7.0, 16.0, 12.0, 17.0, 18.0, 22.0, 21.0, 32.0, 19.0, 36.0, 43.0, 37.0, 38.0, 36.0, 32.0, 53.0, 43.0, 41.0, 42.0, 41.0, 41.0, 33.0, 45.0, 33.0, 28.0, 25.0, 35.0, 22.0, 19.0, 19.0, 7.0, 14.0, 8.0, 7.0, 8.0, 2.0, 3.0, 6.0, 2.0, 6.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.85923194885254, -22.121984481811523, -21.384735107421875, -20.64748764038086, -19.91023826599121, -19.172990798950195, -18.435741424560547, -17.69849395751953, -16.961244583129883, -16.223997116088867, -15.486747741699219, -14.749499320983887, -14.012250900268555, -13.275002479553223, -12.53775405883789, -11.800506591796875, -11.063258171081543, -10.326009750366211, -9.588761329650879, -8.851512908935547, -8.114264488220215, -7.377016067504883, -6.639768123626709, -5.902519702911377, -5.165271282196045, -4.428022861480713, -3.690774440765381, -2.953526258468628, -2.216277837753296, -1.4790294170379639, -0.7417812347412109, -0.004532814025878906, 0.7327156066894531, 1.4699640274047852, 2.207212448120117, 2.94446063041687, 3.681709051132202, 4.418957710266113, 5.156205654144287, 5.893454074859619, 6.630702495574951, 7.367950916290283, 8.105198860168457, 8.842447280883789, 9.579695701599121, 10.316944122314453, 11.054192543029785, 11.791440963745117, 12.52868938446045, 13.265937805175781, 14.003186225891113, 14.740434646606445, 15.477683067321777, 16.21493148803711, 16.952178955078125, 17.689428329467773, 18.42667579650879, 19.163923263549805, 19.901172637939453, 20.63842010498047, 21.375669479370117, 22.112916946411133, 22.85016632080078, 23.587413787841797, 24.324663162231445]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 7.0, 12.0, 13.0, 16.0, 17.0, 19.0, 20.0, 24.0, 30.0, 21.0, 28.0, 37.0, 36.0, 29.0, 34.0, 43.0, 41.0, 49.0, 39.0, 46.0, 40.0, 35.0, 37.0, 40.0, 41.0, 26.0, 42.0, 24.0, 28.0, 20.0, 22.0, 16.0, 18.0, 5.0, 6.0, 8.0, 5.0, 6.0, 7.0, 2.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.105548858642578, -22.346323013305664, -21.587095260620117, -20.827869415283203, -20.06864356994629, -19.309417724609375, -18.550189971923828, -17.790964126586914, -17.03173828125, -16.272512435913086, -15.513285636901855, -14.754058837890625, -13.994832992553711, -13.23560619354248, -12.47637939453125, -11.717153549194336, -10.957925796508789, -10.198698997497559, -9.439473152160645, -8.680246353149414, -7.921020030975342, -7.1617937088012695, -6.402566909790039, -5.643340587615967, -4.8841142654418945, -4.124887943267822, -3.365661382675171, -2.6064348220825195, -1.8472084999084473, -1.087982177734375, -0.32875537872314453, 0.43047094345092773, 1.1896953582763672, 1.948921799659729, 2.708148241043091, 3.467374801635742, 4.2266011238098145, 4.985827445983887, 5.745054244995117, 6.5042805671691895, 7.263506889343262, 8.022733688354492, 8.781959533691406, 9.541186332702637, 10.300413131713867, 11.059638977050781, 11.818865776062012, 12.578092575073242, 13.337318420410156, 14.096545219421387, 14.8557710647583, 15.614997863769531, 16.374223709106445, 17.13344955444336, 17.892677307128906, 18.65190315246582, 19.411128997802734, 20.17035484313965, 20.929582595825195, 21.68880844116211, 22.448034286499023, 23.207260131835938, 23.966487884521484, 24.7257137298584, 25.484941482543945]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 7.0, 12.0, 13.0, 28.0, 26.0, 56.0, 81.0, 113.0, 189.0, 313.0, 459.0, 718.0, 1211.0, 1812.0, 2888.0, 4438.0, 6930.0, 10713.0, 16073.0, 23439.0, 33893.0, 46363.0, 62971.0, 79695.0, 95225.0, 105823.0, 107891.0, 101915.0, 88455.0, 72586.0, 55877.0, 40915.0, 29145.0, 19957.0, 13401.0, 8728.0, 5836.0, 3780.0, 2365.0, 1515.0, 997.0, 611.0, 360.0, 261.0, 177.0, 106.0, 68.0, 48.0, 31.0, 15.0, 16.0, 12.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.296875, -15.7587890625, -15.220703125, -14.6826171875, -14.14453125, -13.6064453125, -13.068359375, -12.5302734375, -11.9921875, -11.4541015625, -10.916015625, -10.3779296875, -9.83984375, -9.3017578125, -8.763671875, -8.2255859375, -7.6875, -7.1494140625, -6.611328125, -6.0732421875, -5.53515625, -4.9970703125, -4.458984375, -3.9208984375, -3.3828125, -2.8447265625, -2.306640625, -1.7685546875, -1.23046875, -0.6923828125, -0.154296875, 0.3837890625, 0.921875, 1.4599609375, 1.998046875, 2.5361328125, 3.07421875, 3.6123046875, 4.150390625, 4.6884765625, 5.2265625, 5.7646484375, 6.302734375, 6.8408203125, 7.37890625, 7.9169921875, 8.455078125, 8.9931640625, 9.53125, 10.0693359375, 10.607421875, 11.1455078125, 11.68359375, 12.2216796875, 12.759765625, 13.2978515625, 13.8359375, 14.3740234375, 14.912109375, 15.4501953125, 15.98828125, 16.5263671875, 17.064453125, 17.6025390625, 18.140625]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 7.0, 3.0, 6.0, 9.0, 9.0, 10.0, 19.0, 19.0, 7.0, 16.0, 25.0, 26.0, 15.0, 31.0, 23.0, 40.0, 39.0, 44.0, 32.0, 30.0, 33.0, 44.0, 33.0, 50.0, 36.0, 22.0, 24.0, 44.0, 48.0, 39.0, 20.0, 28.0, 26.0, 19.0, 18.0, 21.0, 13.0, 11.0, 15.0, 8.0, 8.0, 10.0, 5.0, 7.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-21.46875, -20.787109375, -20.10546875, -19.423828125, -18.7421875, -18.060546875, -17.37890625, -16.697265625, -16.015625, -15.333984375, -14.65234375, -13.970703125, -13.2890625, -12.607421875, -11.92578125, -11.244140625, -10.5625, -9.880859375, -9.19921875, -8.517578125, -7.8359375, -7.154296875, -6.47265625, -5.791015625, -5.109375, -4.427734375, -3.74609375, -3.064453125, -2.3828125, -1.701171875, -1.01953125, -0.337890625, 0.34375, 1.025390625, 1.70703125, 2.388671875, 3.0703125, 3.751953125, 4.43359375, 5.115234375, 5.796875, 6.478515625, 7.16015625, 7.841796875, 8.5234375, 9.205078125, 9.88671875, 10.568359375, 11.25, 11.931640625, 12.61328125, 13.294921875, 13.9765625, 14.658203125, 15.33984375, 16.021484375, 16.703125, 17.384765625, 18.06640625, 18.748046875, 19.4296875, 20.111328125, 20.79296875, 21.474609375, 22.15625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 8.0, 13.0, 24.0, 38.0, 48.0, 70.0, 156.0, 218.0, 351.0, 605.0, 978.0, 1602.0, 2802.0, 4385.0, 7274.0, 12096.0, 19114.0, 29899.0, 45505.0, 65159.0, 87656.0, 109626.0, 123952.0, 124609.0, 113518.0, 92765.0, 69921.0, 48775.0, 32535.0, 21064.0, 13036.0, 8139.0, 5017.0, 2969.0, 1807.0, 1119.0, 650.0, 409.0, 265.0, 158.0, 85.0, 57.0, 26.0, 16.0, 14.0, 13.0, 9.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-22.265625, -21.572021484375, -20.87841796875, -20.184814453125, -19.4912109375, -18.797607421875, -18.10400390625, -17.410400390625, -16.716796875, -16.023193359375, -15.32958984375, -14.635986328125, -13.9423828125, -13.248779296875, -12.55517578125, -11.861572265625, -11.16796875, -10.474365234375, -9.78076171875, -9.087158203125, -8.3935546875, -7.699951171875, -7.00634765625, -6.312744140625, -5.619140625, -4.925537109375, -4.23193359375, -3.538330078125, -2.8447265625, -2.151123046875, -1.45751953125, -0.763916015625, -0.0703125, 0.623291015625, 1.31689453125, 2.010498046875, 2.7041015625, 3.397705078125, 4.09130859375, 4.784912109375, 5.478515625, 6.172119140625, 6.86572265625, 7.559326171875, 8.2529296875, 8.946533203125, 9.64013671875, 10.333740234375, 11.02734375, 11.720947265625, 12.41455078125, 13.108154296875, 13.8017578125, 14.495361328125, 15.18896484375, 15.882568359375, 16.576171875, 17.269775390625, 17.96337890625, 18.656982421875, 19.3505859375, 20.044189453125, 20.73779296875, 21.431396484375, 22.125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 7.0, 5.0, 6.0, 7.0, 5.0, 14.0, 9.0, 9.0, 17.0, 20.0, 22.0, 24.0, 15.0, 23.0, 30.0, 28.0, 30.0, 32.0, 37.0, 39.0, 40.0, 40.0, 34.0, 34.0, 47.0, 39.0, 39.0, 39.0, 47.0, 29.0, 34.0, 23.0, 34.0, 23.0, 17.0, 13.0, 11.0, 10.0, 12.0, 12.0, 11.0, 14.0, 2.0, 3.0, 4.0, 1.0, 6.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.5703125, -13.1170654296875, -12.663818359375, -12.2105712890625, -11.75732421875, -11.3040771484375, -10.850830078125, -10.3975830078125, -9.9443359375, -9.4910888671875, -9.037841796875, -8.5845947265625, -8.13134765625, -7.6781005859375, -7.224853515625, -6.7716064453125, -6.318359375, -5.8651123046875, -5.411865234375, -4.9586181640625, -4.50537109375, -4.0521240234375, -3.598876953125, -3.1456298828125, -2.6923828125, -2.2391357421875, -1.785888671875, -1.3326416015625, -0.87939453125, -0.4261474609375, 0.027099609375, 0.4803466796875, 0.93359375, 1.3868408203125, 1.840087890625, 2.2933349609375, 2.74658203125, 3.1998291015625, 3.653076171875, 4.1063232421875, 4.5595703125, 5.0128173828125, 5.466064453125, 5.9193115234375, 6.37255859375, 6.8258056640625, 7.279052734375, 7.7322998046875, 8.185546875, 8.6387939453125, 9.092041015625, 9.5452880859375, 9.99853515625, 10.4517822265625, 10.905029296875, 11.3582763671875, 11.8115234375, 12.2647705078125, 12.718017578125, 13.1712646484375, 13.62451171875, 14.0777587890625, 14.531005859375, 14.9842529296875, 15.4375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 14.0, 14.0, 41.0, 48.0, 47.0, 103.0, 161.0, 217.0, 362.0, 547.0, 896.0, 1416.0, 2377.0, 3864.0, 6530.0, 10873.0, 18535.0, 31636.0, 52702.0, 84133.0, 121639.0, 154434.0, 161013.0, 137766.0, 99337.0, 63874.0, 38970.0, 23269.0, 13335.0, 8096.0, 4770.0, 2815.0, 1761.0, 1056.0, 714.0, 420.0, 256.0, 179.0, 115.0, 74.0, 51.0, 40.0, 27.0, 12.0, 4.0, 4.0, 8.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.75, -11.3961181640625, -11.042236328125, -10.6883544921875, -10.33447265625, -9.9805908203125, -9.626708984375, -9.2728271484375, -8.9189453125, -8.5650634765625, -8.211181640625, -7.8572998046875, -7.50341796875, -7.1495361328125, -6.795654296875, -6.4417724609375, -6.087890625, -5.7340087890625, -5.380126953125, -5.0262451171875, -4.67236328125, -4.3184814453125, -3.964599609375, -3.6107177734375, -3.2568359375, -2.9029541015625, -2.549072265625, -2.1951904296875, -1.84130859375, -1.4874267578125, -1.133544921875, -0.7796630859375, -0.42578125, -0.0718994140625, 0.281982421875, 0.6358642578125, 0.98974609375, 1.3436279296875, 1.697509765625, 2.0513916015625, 2.4052734375, 2.7591552734375, 3.113037109375, 3.4669189453125, 3.82080078125, 4.1746826171875, 4.528564453125, 4.8824462890625, 5.236328125, 5.5902099609375, 5.944091796875, 6.2979736328125, 6.65185546875, 7.0057373046875, 7.359619140625, 7.7135009765625, 8.0673828125, 8.4212646484375, 8.775146484375, 9.1290283203125, 9.48291015625, 9.8367919921875, 10.190673828125, 10.5445556640625, 10.8984375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 9.0, 9.0, 14.0, 14.0, 19.0, 23.0, 33.0, 30.0, 39.0, 55.0, 48.0, 37.0, 45.0, 58.0, 58.0, 59.0, 54.0, 56.0, 43.0, 44.0, 38.0, 38.0, 29.0, 25.0, 26.0, 22.0, 14.0, 15.0, 9.0, 7.0, 3.0, 4.0, 2.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0013380050659179688, -0.0012992173433303833, -0.0012604296207427979, -0.0012216418981552124, -0.001182854175567627, -0.0011440664529800415, -0.001105278730392456, -0.0010664910078048706, -0.0010277032852172852, -0.0009889155626296997, -0.0009501278400421143, -0.0009113401174545288, -0.0008725523948669434, -0.0008337646722793579, -0.0007949769496917725, -0.000756189227104187, -0.0007174015045166016, -0.0006786137819290161, -0.0006398260593414307, -0.0006010383367538452, -0.0005622506141662598, -0.0005234628915786743, -0.00048467516899108887, -0.0004458874464035034, -0.00040709972381591797, -0.0003683120012283325, -0.00032952427864074707, -0.0002907365560531616, -0.00025194883346557617, -0.00021316111087799072, -0.00017437338829040527, -0.00013558566570281982, -9.679794311523438e-05, -5.8010220527648926e-05, -1.9222497940063477e-05, 1.9565224647521973e-05, 5.835294723510742e-05, 9.714066982269287e-05, 0.00013592839241027832, 0.00017471611499786377, 0.00021350383758544922, 0.00025229156017303467, 0.0002910792827606201, 0.00032986700534820557, 0.000368654727935791, 0.00040744245052337646, 0.0004462301731109619, 0.00048501789569854736, 0.0005238056182861328, 0.0005625933408737183, 0.0006013810634613037, 0.0006401687860488892, 0.0006789565086364746, 0.0007177442312240601, 0.0007565319538116455, 0.000795319676399231, 0.0008341073989868164, 0.0008728951215744019, 0.0009116828441619873, 0.0009504705667495728, 0.0009892582893371582, 0.0010280460119247437, 0.001066833734512329, 0.0011056214570999146, 0.0011444091796875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 10.0, 11.0, 26.0, 29.0, 33.0, 42.0, 86.0, 139.0, 204.0, 317.0, 482.0, 853.0, 1323.0, 2366.0, 3808.0, 6448.0, 10776.0, 17910.0, 29129.0, 46797.0, 70743.0, 98910.0, 126711.0, 141479.0, 136309.0, 114335.0, 85071.0, 58143.0, 37791.0, 23077.0, 14068.0, 8374.0, 5172.0, 2973.0, 1790.0, 1067.0, 665.0, 392.0, 233.0, 163.0, 107.0, 54.0, 38.0, 28.0, 28.0, 19.0, 8.0, 8.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.265625, -8.973876953125, -8.68212890625, -8.390380859375, -8.0986328125, -7.806884765625, -7.51513671875, -7.223388671875, -6.931640625, -6.639892578125, -6.34814453125, -6.056396484375, -5.7646484375, -5.472900390625, -5.18115234375, -4.889404296875, -4.59765625, -4.305908203125, -4.01416015625, -3.722412109375, -3.4306640625, -3.138916015625, -2.84716796875, -2.555419921875, -2.263671875, -1.971923828125, -1.68017578125, -1.388427734375, -1.0966796875, -0.804931640625, -0.51318359375, -0.221435546875, 0.0703125, 0.362060546875, 0.65380859375, 0.945556640625, 1.2373046875, 1.529052734375, 1.82080078125, 2.112548828125, 2.404296875, 2.696044921875, 2.98779296875, 3.279541015625, 3.5712890625, 3.863037109375, 4.15478515625, 4.446533203125, 4.73828125, 5.030029296875, 5.32177734375, 5.613525390625, 5.9052734375, 6.197021484375, 6.48876953125, 6.780517578125, 7.072265625, 7.364013671875, 7.65576171875, 7.947509765625, 8.2392578125, 8.531005859375, 8.82275390625, 9.114501953125, 9.40625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 9.0, 10.0, 10.0, 8.0, 8.0, 24.0, 12.0, 23.0, 18.0, 27.0, 32.0, 37.0, 35.0, 38.0, 35.0, 56.0, 48.0, 54.0, 52.0, 45.0, 58.0, 46.0, 41.0, 41.0, 26.0, 38.0, 26.0, 31.0, 18.0, 18.0, 9.0, 12.0, 14.0, 12.0, 7.0, 3.0, 11.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.078125, -3.960205078125, -3.84228515625, -3.724365234375, -3.6064453125, -3.488525390625, -3.37060546875, -3.252685546875, -3.134765625, -3.016845703125, -2.89892578125, -2.781005859375, -2.6630859375, -2.545166015625, -2.42724609375, -2.309326171875, -2.19140625, -2.073486328125, -1.95556640625, -1.837646484375, -1.7197265625, -1.601806640625, -1.48388671875, -1.365966796875, -1.248046875, -1.130126953125, -1.01220703125, -0.894287109375, -0.7763671875, -0.658447265625, -0.54052734375, -0.422607421875, -0.3046875, -0.186767578125, -0.06884765625, 0.049072265625, 0.1669921875, 0.284912109375, 0.40283203125, 0.520751953125, 0.638671875, 0.756591796875, 0.87451171875, 0.992431640625, 1.1103515625, 1.228271484375, 1.34619140625, 1.464111328125, 1.58203125, 1.699951171875, 1.81787109375, 1.935791015625, 2.0537109375, 2.171630859375, 2.28955078125, 2.407470703125, 2.525390625, 2.643310546875, 2.76123046875, 2.879150390625, 2.9970703125, 3.114990234375, 3.23291015625, 3.350830078125, 3.46875]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 11.0, 5.0, 13.0, 17.0, 17.0, 17.0, 20.0, 28.0, 20.0, 31.0, 25.0, 43.0, 41.0, 35.0, 53.0, 47.0, 48.0, 44.0, 40.0, 50.0, 46.0, 39.0, 32.0, 42.0, 27.0, 37.0, 35.0, 27.0, 18.0, 16.0, 15.0, 7.0, 14.0, 13.0, 5.0, 5.0, 0.0, 4.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.80634307861328, -21.02112579345703, -20.23590850830078, -19.45069122314453, -18.66547393798828, -17.880258560180664, -17.095041275024414, -16.309823989868164, -15.524606704711914, -14.739389419555664, -13.954172134399414, -13.16895580291748, -12.38373851776123, -11.59852123260498, -10.813304901123047, -10.028087615966797, -9.242870330810547, -8.457653045654297, -7.672436237335205, -6.887219429016113, -6.102002143859863, -5.316784858703613, -4.5315680503845215, -3.7463512420654297, -2.9611339569091797, -2.175916910171509, -1.390699863433838, -0.605482816696167, 0.1797342300415039, 0.9649512767791748, 1.7501683235168457, 2.5353851318359375, 3.3206043243408203, 4.10582160949707, 4.891038417816162, 5.676255226135254, 6.461472511291504, 7.246689796447754, 8.031906127929688, 8.817123413085938, 9.602340698242188, 10.387557983398438, 11.172775268554688, 11.957991600036621, 12.743208885192871, 13.528426170349121, 14.313642501831055, 15.098859786987305, 15.884077072143555, 16.669294357299805, 17.454511642456055, 18.239728927612305, 19.024944305419922, 19.810161590576172, 20.595378875732422, 21.380596160888672, 22.165813446044922, 22.951030731201172, 23.736248016357422, 24.521465301513672, 25.306682586669922, 26.09189796447754, 26.87711524963379, 27.66233253479004, 28.44754981994629]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 2.0, 6.0, 13.0, 6.0, 16.0, 18.0, 10.0, 23.0, 22.0, 17.0, 30.0, 24.0, 38.0, 34.0, 36.0, 36.0, 38.0, 40.0, 40.0, 55.0, 38.0, 44.0, 41.0, 34.0, 37.0, 40.0, 47.0, 32.0, 23.0, 22.0, 20.0, 21.0, 21.0, 14.0, 12.0, 12.0, 9.0, 4.0, 5.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.896875381469727, -22.11444854736328, -21.332019805908203, -20.549592971801758, -19.767166137695312, -18.984737396240234, -18.20231056213379, -17.419883728027344, -16.637454986572266, -15.855027198791504, -15.072599411010742, -14.290172576904297, -13.507744789123535, -12.725317001342773, -11.942890167236328, -11.160462379455566, -10.378034591674805, -9.595606803894043, -8.813179016113281, -8.030752182006836, -7.248324394226074, -6.4658966064453125, -5.683469295501709, -4.9010419845581055, -4.118614196777344, -3.336186647415161, -2.5537590980529785, -1.771331548690796, -0.9889039993286133, -0.20647644996643066, 0.575951099395752, 1.3583784103393555, 2.14080810546875, 2.9232356548309326, 3.7056632041931152, 4.488090515136719, 5.2705183029174805, 6.052946090698242, 6.835373401641846, 7.617800712585449, 8.400228500366211, 9.182656288146973, 9.965084075927734, 10.74751091003418, 11.529938697814941, 12.312366485595703, 13.094793319702148, 13.87722110748291, 14.659648895263672, 15.442076683044434, 16.224504470825195, 17.00693130493164, 17.78936004638672, 18.571786880493164, 19.35421371459961, 20.136642456054688, 20.919069290161133, 21.701496124267578, 22.483924865722656, 23.2663516998291, 24.048778533935547, 24.831207275390625, 25.61363410949707, 26.396060943603516, 27.178489685058594]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 11.0, 12.0, 27.0, 33.0, 68.0, 94.0, 138.0, 244.0, 356.0, 520.0, 856.0, 1344.0, 2245.0, 3606.0, 5966.0, 9744.0, 16857.0, 28156.0, 49147.0, 84316.0, 145256.0, 245899.0, 386338.0, 540275.0, 644264.0, 630110.0, 511904.0, 352876.0, 220749.0, 130128.0, 74969.0, 42990.0, 25588.0, 15304.0, 9112.0, 5616.0, 3419.0, 2143.0, 1366.0, 846.0, 500.0, 314.0, 208.0, 135.0, 91.0, 66.0, 31.0, 16.0, 18.0, 7.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.296875, -16.737060546875, -16.17724609375, -15.617431640625, -15.0576171875, -14.497802734375, -13.93798828125, -13.378173828125, -12.818359375, -12.258544921875, -11.69873046875, -11.138916015625, -10.5791015625, -10.019287109375, -9.45947265625, -8.899658203125, -8.33984375, -7.780029296875, -7.22021484375, -6.660400390625, -6.1005859375, -5.540771484375, -4.98095703125, -4.421142578125, -3.861328125, -3.301513671875, -2.74169921875, -2.181884765625, -1.6220703125, -1.062255859375, -0.50244140625, 0.057373046875, 0.6171875, 1.177001953125, 1.73681640625, 2.296630859375, 2.8564453125, 3.416259765625, 3.97607421875, 4.535888671875, 5.095703125, 5.655517578125, 6.21533203125, 6.775146484375, 7.3349609375, 7.894775390625, 8.45458984375, 9.014404296875, 9.57421875, 10.134033203125, 10.69384765625, 11.253662109375, 11.8134765625, 12.373291015625, 12.93310546875, 13.492919921875, 14.052734375, 14.612548828125, 15.17236328125, 15.732177734375, 16.2919921875, 16.851806640625, 17.41162109375, 17.971435546875, 18.53125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 8.0, 2.0, 5.0, 6.0, 6.0, 14.0, 15.0, 17.0, 16.0, 22.0, 16.0, 21.0, 29.0, 33.0, 36.0, 42.0, 42.0, 37.0, 40.0, 48.0, 42.0, 38.0, 47.0, 41.0, 46.0, 39.0, 40.0, 43.0, 34.0, 25.0, 12.0, 22.0, 21.0, 22.0, 15.0, 2.0, 16.0, 14.0, 7.0, 5.0, 8.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.40625, -19.733154296875, -19.06005859375, -18.386962890625, -17.7138671875, -17.040771484375, -16.36767578125, -15.694580078125, -15.021484375, -14.348388671875, -13.67529296875, -13.002197265625, -12.3291015625, -11.656005859375, -10.98291015625, -10.309814453125, -9.63671875, -8.963623046875, -8.29052734375, -7.617431640625, -6.9443359375, -6.271240234375, -5.59814453125, -4.925048828125, -4.251953125, -3.578857421875, -2.90576171875, -2.232666015625, -1.5595703125, -0.886474609375, -0.21337890625, 0.459716796875, 1.1328125, 1.805908203125, 2.47900390625, 3.152099609375, 3.8251953125, 4.498291015625, 5.17138671875, 5.844482421875, 6.517578125, 7.190673828125, 7.86376953125, 8.536865234375, 9.2099609375, 9.883056640625, 10.55615234375, 11.229248046875, 11.90234375, 12.575439453125, 13.24853515625, 13.921630859375, 14.5947265625, 15.267822265625, 15.94091796875, 16.614013671875, 17.287109375, 17.960205078125, 18.63330078125, 19.306396484375, 19.9794921875, 20.652587890625, 21.32568359375, 21.998779296875, 22.671875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 7.0, 15.0, 20.0, 41.0, 78.0, 148.0, 250.0, 526.0, 1060.0, 2171.0, 4316.0, 8876.0, 18822.0, 38680.0, 80748.0, 162258.0, 312285.0, 543674.0, 781145.0, 826575.0, 629516.0, 381933.0, 204177.0, 101348.0, 49509.0, 24036.0, 11338.0, 5357.0, 2717.0, 1324.0, 635.0, 318.0, 177.0, 92.0, 46.0, 23.0, 16.0, 8.0, 10.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.34375, -25.470458984375, -24.59716796875, -23.723876953125, -22.8505859375, -21.977294921875, -21.10400390625, -20.230712890625, -19.357421875, -18.484130859375, -17.61083984375, -16.737548828125, -15.8642578125, -14.990966796875, -14.11767578125, -13.244384765625, -12.37109375, -11.497802734375, -10.62451171875, -9.751220703125, -8.8779296875, -8.004638671875, -7.13134765625, -6.258056640625, -5.384765625, -4.511474609375, -3.63818359375, -2.764892578125, -1.8916015625, -1.018310546875, -0.14501953125, 0.728271484375, 1.6015625, 2.474853515625, 3.34814453125, 4.221435546875, 5.0947265625, 5.968017578125, 6.84130859375, 7.714599609375, 8.587890625, 9.461181640625, 10.33447265625, 11.207763671875, 12.0810546875, 12.954345703125, 13.82763671875, 14.700927734375, 15.57421875, 16.447509765625, 17.32080078125, 18.194091796875, 19.0673828125, 19.940673828125, 20.81396484375, 21.687255859375, 22.560546875, 23.433837890625, 24.30712890625, 25.180419921875, 26.0537109375, 26.927001953125, 27.80029296875, 28.673583984375, 29.546875]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 5.0, 5.0, 7.0, 11.0, 13.0, 10.0, 17.0, 22.0, 26.0, 37.0, 48.0, 57.0, 53.0, 81.0, 101.0, 138.0, 117.0, 144.0, 167.0, 165.0, 179.0, 218.0, 215.0, 225.0, 208.0, 220.0, 204.0, 185.0, 153.0, 140.0, 140.0, 127.0, 126.0, 104.0, 77.0, 66.0, 51.0, 53.0, 33.0, 28.0, 30.0, 21.0, 14.0, 8.0, 5.0, 5.0, 6.0, 2.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0], "bins": [-8.328125, -8.0731201171875, -7.818115234375, -7.5631103515625, -7.30810546875, -7.0531005859375, -6.798095703125, -6.5430908203125, -6.2880859375, -6.0330810546875, -5.778076171875, -5.5230712890625, -5.26806640625, -5.0130615234375, -4.758056640625, -4.5030517578125, -4.248046875, -3.9930419921875, -3.738037109375, -3.4830322265625, -3.22802734375, -2.9730224609375, -2.718017578125, -2.4630126953125, -2.2080078125, -1.9530029296875, -1.697998046875, -1.4429931640625, -1.18798828125, -0.9329833984375, -0.677978515625, -0.4229736328125, -0.16796875, 0.0870361328125, 0.342041015625, 0.5970458984375, 0.85205078125, 1.1070556640625, 1.362060546875, 1.6170654296875, 1.8720703125, 2.1270751953125, 2.382080078125, 2.6370849609375, 2.89208984375, 3.1470947265625, 3.402099609375, 3.6571044921875, 3.912109375, 4.1671142578125, 4.422119140625, 4.6771240234375, 4.93212890625, 5.1871337890625, 5.442138671875, 5.6971435546875, 5.9521484375, 6.2071533203125, 6.462158203125, 6.7171630859375, 6.97216796875, 7.2271728515625, 7.482177734375, 7.7371826171875, 7.9921875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 5.0, 9.0, 7.0, 5.0, 10.0, 14.0, 13.0, 16.0, 16.0, 22.0, 19.0, 26.0, 28.0, 33.0, 29.0, 36.0, 39.0, 48.0, 44.0, 46.0, 51.0, 44.0, 36.0, 43.0, 42.0, 31.0, 33.0, 40.0, 25.0, 28.0, 32.0, 21.0, 20.0, 19.0, 20.0, 12.0, 5.0, 11.0, 6.0, 5.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.309255599975586, -18.591999053955078, -17.87474250793457, -17.157485961914062, -16.440229415893555, -15.722972869873047, -15.005716323852539, -14.288459777832031, -13.571203231811523, -12.853946685791016, -12.136690139770508, -11.41943359375, -10.702177047729492, -9.984920501708984, -9.267663955688477, -8.550407409667969, -7.833150863647461, -7.115894317626953, -6.398637771606445, -5.6813812255859375, -4.96412467956543, -4.246868133544922, -3.529611587524414, -2.8123550415039062, -2.0950984954833984, -1.3778419494628906, -0.6605854034423828, 0.056671142578125, 0.7739276885986328, 1.4911842346191406, 2.2084407806396484, 2.9256973266601562, 3.642953872680664, 4.360210418701172, 5.07746696472168, 5.7947235107421875, 6.511980056762695, 7.229236602783203, 7.946493148803711, 8.663749694824219, 9.381006240844727, 10.098262786865234, 10.815519332885742, 11.53277587890625, 12.250032424926758, 12.967288970947266, 13.684545516967773, 14.401802062988281, 15.119058609008789, 15.836315155029297, 16.553571701049805, 17.270828247070312, 17.98808479309082, 18.705341339111328, 19.422597885131836, 20.139854431152344, 20.85711097717285, 21.57436752319336, 22.291624069213867, 23.008880615234375, 23.726137161254883, 24.44339370727539, 25.1606502532959, 25.877906799316406, 26.595163345336914]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 5.0, 5.0, 4.0, 6.0, 8.0, 2.0, 17.0, 9.0, 17.0, 23.0, 27.0, 20.0, 26.0, 22.0, 23.0, 23.0, 23.0, 34.0, 38.0, 34.0, 50.0, 44.0, 42.0, 51.0, 44.0, 45.0, 30.0, 29.0, 35.0, 23.0, 34.0, 22.0, 31.0, 22.0, 23.0, 18.0, 16.0, 15.0, 8.0, 10.0, 12.0, 6.0, 9.0, 7.0, 4.0, 1.0, 7.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-22.487255096435547, -21.808433532714844, -21.12961196899414, -20.45079231262207, -19.771970748901367, -19.093149185180664, -18.414329528808594, -17.73550796508789, -17.056686401367188, -16.377864837646484, -15.699044227600098, -15.020223617553711, -14.341402053833008, -13.662580490112305, -12.983759880065918, -12.304939270019531, -11.626117706298828, -10.947296142578125, -10.268475532531738, -9.589654922485352, -8.910833358764648, -8.232011795043945, -7.553191184997559, -6.874370098114014, -6.195549011230469, -5.516727924346924, -4.837906837463379, -4.159085750579834, -3.480264663696289, -2.801443576812744, -2.122622489929199, -1.4438014030456543, -0.7649784088134766, -0.08615732192993164, 0.5926637649536133, 1.2714848518371582, 1.9503059387207031, 2.629127025604248, 3.307948112487793, 3.986769199371338, 4.665590286254883, 5.344411373138428, 6.023232460021973, 6.702053546905518, 7.3808746337890625, 8.059696197509766, 8.738516807556152, 9.417337417602539, 10.096158981323242, 10.774980545043945, 11.453801155090332, 12.132621765136719, 12.811443328857422, 13.490264892578125, 14.169085502624512, 14.847906112670898, 15.526727676391602, 16.205549240112305, 16.884368896484375, 17.563190460205078, 18.24201202392578, 18.920833587646484, 19.599655151367188, 20.278474807739258, 20.95729637145996]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 8.0, 9.0, 11.0, 14.0, 15.0, 32.0, 37.0, 56.0, 91.0, 129.0, 161.0, 316.0, 443.0, 684.0, 959.0, 1469.0, 2210.0, 3355.0, 4946.0, 7741.0, 12306.0, 21076.0, 39832.0, 80800.0, 160083.0, 242061.0, 213414.0, 121339.0, 59052.0, 30175.0, 16835.0, 10031.0, 6398.0, 4097.0, 2768.0, 1910.0, 1187.0, 851.0, 550.0, 366.0, 256.0, 167.0, 109.0, 68.0, 51.0, 36.0, 17.0, 22.0, 8.0, 5.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.71875, -32.54736328125, -31.3759765625, -30.20458984375, -29.033203125, -27.86181640625, -26.6904296875, -25.51904296875, -24.34765625, -23.17626953125, -22.0048828125, -20.83349609375, -19.662109375, -18.49072265625, -17.3193359375, -16.14794921875, -14.9765625, -13.80517578125, -12.6337890625, -11.46240234375, -10.291015625, -9.11962890625, -7.9482421875, -6.77685546875, -5.60546875, -4.43408203125, -3.2626953125, -2.09130859375, -0.919921875, 0.25146484375, 1.4228515625, 2.59423828125, 3.765625, 4.93701171875, 6.1083984375, 7.27978515625, 8.451171875, 9.62255859375, 10.7939453125, 11.96533203125, 13.13671875, 14.30810546875, 15.4794921875, 16.65087890625, 17.822265625, 18.99365234375, 20.1650390625, 21.33642578125, 22.5078125, 23.67919921875, 24.8505859375, 26.02197265625, 27.193359375, 28.36474609375, 29.5361328125, 30.70751953125, 31.87890625, 33.05029296875, 34.2216796875, 35.39306640625, 36.564453125, 37.73583984375, 38.9072265625, 40.07861328125, 41.25]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0, 4.0, 10.0, 8.0, 5.0, 5.0, 21.0, 13.0, 5.0, 25.0, 23.0, 26.0, 28.0, 29.0, 33.0, 25.0, 27.0, 37.0, 40.0, 50.0, 41.0, 40.0, 42.0, 47.0, 52.0, 28.0, 39.0, 29.0, 27.0, 32.0, 27.0, 27.0, 27.0, 24.0, 18.0, 16.0, 13.0, 9.0, 8.0, 11.0, 8.0, 7.0, 5.0, 4.0, 1.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0], "bins": [-23.8125, -23.116455078125, -22.42041015625, -21.724365234375, -21.0283203125, -20.332275390625, -19.63623046875, -18.940185546875, -18.244140625, -17.548095703125, -16.85205078125, -16.156005859375, -15.4599609375, -14.763916015625, -14.06787109375, -13.371826171875, -12.67578125, -11.979736328125, -11.28369140625, -10.587646484375, -9.8916015625, -9.195556640625, -8.49951171875, -7.803466796875, -7.107421875, -6.411376953125, -5.71533203125, -5.019287109375, -4.3232421875, -3.627197265625, -2.93115234375, -2.235107421875, -1.5390625, -0.843017578125, -0.14697265625, 0.549072265625, 1.2451171875, 1.941162109375, 2.63720703125, 3.333251953125, 4.029296875, 4.725341796875, 5.42138671875, 6.117431640625, 6.8134765625, 7.509521484375, 8.20556640625, 8.901611328125, 9.59765625, 10.293701171875, 10.98974609375, 11.685791015625, 12.3818359375, 13.077880859375, 13.77392578125, 14.469970703125, 15.166015625, 15.862060546875, 16.55810546875, 17.254150390625, 17.9501953125, 18.646240234375, 19.34228515625, 20.038330078125, 20.734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 7.0, 6.0, 27.0, 30.0, 43.0, 73.0, 95.0, 144.0, 217.0, 331.0, 498.0, 717.0, 1076.0, 1594.0, 2352.0, 3640.0, 5269.0, 8286.0, 12868.0, 20117.0, 33737.0, 58812.0, 106365.0, 178647.0, 219284.0, 164027.0, 94540.0, 52524.0, 30738.0, 18359.0, 11636.0, 7590.0, 4897.0, 3349.0, 2183.0, 1516.0, 1001.0, 678.0, 436.0, 271.0, 180.0, 150.0, 86.0, 49.0, 30.0, 25.0, 26.0, 13.0, 4.0, 5.0, 4.0, 2.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-32.03125, -30.9775390625, -29.923828125, -28.8701171875, -27.81640625, -26.7626953125, -25.708984375, -24.6552734375, -23.6015625, -22.5478515625, -21.494140625, -20.4404296875, -19.38671875, -18.3330078125, -17.279296875, -16.2255859375, -15.171875, -14.1181640625, -13.064453125, -12.0107421875, -10.95703125, -9.9033203125, -8.849609375, -7.7958984375, -6.7421875, -5.6884765625, -4.634765625, -3.5810546875, -2.52734375, -1.4736328125, -0.419921875, 0.6337890625, 1.6875, 2.7412109375, 3.794921875, 4.8486328125, 5.90234375, 6.9560546875, 8.009765625, 9.0634765625, 10.1171875, 11.1708984375, 12.224609375, 13.2783203125, 14.33203125, 15.3857421875, 16.439453125, 17.4931640625, 18.546875, 19.6005859375, 20.654296875, 21.7080078125, 22.76171875, 23.8154296875, 24.869140625, 25.9228515625, 26.9765625, 28.0302734375, 29.083984375, 30.1376953125, 31.19140625, 32.2451171875, 33.298828125, 34.3525390625, 35.40625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 7.0, 3.0, 5.0, 3.0, 9.0, 20.0, 17.0, 11.0, 22.0, 15.0, 19.0, 29.0, 26.0, 28.0, 32.0, 30.0, 33.0, 44.0, 50.0, 33.0, 28.0, 37.0, 43.0, 48.0, 45.0, 34.0, 45.0, 31.0, 36.0, 25.0, 18.0, 27.0, 17.0, 17.0, 21.0, 20.0, 9.0, 12.0, 6.0, 8.0, 3.0, 11.0, 11.0, 4.0, 1.0, 6.0, 3.0, 2.0, 1.0, 3.0], "bins": [-16.453125, -15.99462890625, -15.5361328125, -15.07763671875, -14.619140625, -14.16064453125, -13.7021484375, -13.24365234375, -12.78515625, -12.32666015625, -11.8681640625, -11.40966796875, -10.951171875, -10.49267578125, -10.0341796875, -9.57568359375, -9.1171875, -8.65869140625, -8.2001953125, -7.74169921875, -7.283203125, -6.82470703125, -6.3662109375, -5.90771484375, -5.44921875, -4.99072265625, -4.5322265625, -4.07373046875, -3.615234375, -3.15673828125, -2.6982421875, -2.23974609375, -1.78125, -1.32275390625, -0.8642578125, -0.40576171875, 0.052734375, 0.51123046875, 0.9697265625, 1.42822265625, 1.88671875, 2.34521484375, 2.8037109375, 3.26220703125, 3.720703125, 4.17919921875, 4.6376953125, 5.09619140625, 5.5546875, 6.01318359375, 6.4716796875, 6.93017578125, 7.388671875, 7.84716796875, 8.3056640625, 8.76416015625, 9.22265625, 9.68115234375, 10.1396484375, 10.59814453125, 11.056640625, 11.51513671875, 11.9736328125, 12.43212890625, 12.890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 8.0, 5.0, 15.0, 14.0, 28.0, 31.0, 63.0, 76.0, 114.0, 174.0, 247.0, 389.0, 582.0, 904.0, 1380.0, 2120.0, 3399.0, 5850.0, 10181.0, 18845.0, 38489.0, 81884.0, 173060.0, 273137.0, 219579.0, 110692.0, 50635.0, 24977.0, 12968.0, 7194.0, 4203.0, 2566.0, 1646.0, 1095.0, 675.0, 442.0, 290.0, 201.0, 138.0, 89.0, 59.0, 35.0, 26.0, 22.0, 8.0, 11.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-17.8125, -17.25048828125, -16.6884765625, -16.12646484375, -15.564453125, -15.00244140625, -14.4404296875, -13.87841796875, -13.31640625, -12.75439453125, -12.1923828125, -11.63037109375, -11.068359375, -10.50634765625, -9.9443359375, -9.38232421875, -8.8203125, -8.25830078125, -7.6962890625, -7.13427734375, -6.572265625, -6.01025390625, -5.4482421875, -4.88623046875, -4.32421875, -3.76220703125, -3.2001953125, -2.63818359375, -2.076171875, -1.51416015625, -0.9521484375, -0.39013671875, 0.171875, 0.73388671875, 1.2958984375, 1.85791015625, 2.419921875, 2.98193359375, 3.5439453125, 4.10595703125, 4.66796875, 5.22998046875, 5.7919921875, 6.35400390625, 6.916015625, 7.47802734375, 8.0400390625, 8.60205078125, 9.1640625, 9.72607421875, 10.2880859375, 10.85009765625, 11.412109375, 11.97412109375, 12.5361328125, 13.09814453125, 13.66015625, 14.22216796875, 14.7841796875, 15.34619140625, 15.908203125, 16.47021484375, 17.0322265625, 17.59423828125, 18.15625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 5.0, 8.0, 6.0, 9.0, 14.0, 23.0, 28.0, 43.0, 62.0, 80.0, 90.0, 111.0, 91.0, 99.0, 92.0, 54.0, 38.0, 20.0, 22.0, 15.0, 17.0, 9.0, 10.0, 8.0, 6.0, 9.0, 1.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015077590942382812, -0.0014591217041015625, -0.0014104843139648438, -0.001361846923828125, -0.0013132095336914062, -0.0012645721435546875, -0.0012159347534179688, -0.00116729736328125, -0.0011186599731445312, -0.0010700225830078125, -0.0010213851928710938, -0.000972747802734375, -0.0009241104125976562, -0.0008754730224609375, -0.0008268356323242188, -0.0007781982421875, -0.0007295608520507812, -0.0006809234619140625, -0.0006322860717773438, -0.000583648681640625, -0.0005350112915039062, -0.0004863739013671875, -0.00043773651123046875, -0.00038909912109375, -0.00034046173095703125, -0.0002918243408203125, -0.00024318695068359375, -0.000194549560546875, -0.00014591217041015625, -9.72747802734375e-05, -4.863739013671875e-05, 0.0, 4.863739013671875e-05, 9.72747802734375e-05, 0.00014591217041015625, 0.000194549560546875, 0.00024318695068359375, 0.0002918243408203125, 0.00034046173095703125, 0.00038909912109375, 0.00043773651123046875, 0.0004863739013671875, 0.0005350112915039062, 0.000583648681640625, 0.0006322860717773438, 0.0006809234619140625, 0.0007295608520507812, 0.0007781982421875, 0.0008268356323242188, 0.0008754730224609375, 0.0009241104125976562, 0.000972747802734375, 0.0010213851928710938, 0.0010700225830078125, 0.0011186599731445312, 0.00116729736328125, 0.0012159347534179688, 0.0012645721435546875, 0.0013132095336914062, 0.001361846923828125, 0.0014104843139648438, 0.0014591217041015625, 0.0015077590942382812, 0.001556396484375, 0.0016050338745117188]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 6.0, 4.0, 9.0, 6.0, 21.0, 30.0, 34.0, 84.0, 84.0, 138.0, 242.0, 335.0, 530.0, 892.0, 1523.0, 2662.0, 4880.0, 9145.0, 17679.0, 35278.0, 69995.0, 129472.0, 201296.0, 221061.0, 162301.0, 92698.0, 47580.0, 23940.0, 12092.0, 6190.0, 3369.0, 2019.0, 1092.0, 690.0, 405.0, 268.0, 184.0, 107.0, 80.0, 43.0, 37.0, 21.0, 13.0, 10.0, 7.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.4375, -16.896240234375, -16.35498046875, -15.813720703125, -15.2724609375, -14.731201171875, -14.18994140625, -13.648681640625, -13.107421875, -12.566162109375, -12.02490234375, -11.483642578125, -10.9423828125, -10.401123046875, -9.85986328125, -9.318603515625, -8.77734375, -8.236083984375, -7.69482421875, -7.153564453125, -6.6123046875, -6.071044921875, -5.52978515625, -4.988525390625, -4.447265625, -3.906005859375, -3.36474609375, -2.823486328125, -2.2822265625, -1.740966796875, -1.19970703125, -0.658447265625, -0.1171875, 0.424072265625, 0.96533203125, 1.506591796875, 2.0478515625, 2.589111328125, 3.13037109375, 3.671630859375, 4.212890625, 4.754150390625, 5.29541015625, 5.836669921875, 6.3779296875, 6.919189453125, 7.46044921875, 8.001708984375, 8.54296875, 9.084228515625, 9.62548828125, 10.166748046875, 10.7080078125, 11.249267578125, 11.79052734375, 12.331787109375, 12.873046875, 13.414306640625, 13.95556640625, 14.496826171875, 15.0380859375, 15.579345703125, 16.12060546875, 16.661865234375, 17.203125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 8.0, 5.0, 12.0, 10.0, 13.0, 12.0, 23.0, 25.0, 33.0, 40.0, 40.0, 40.0, 51.0, 66.0, 79.0, 70.0, 77.0, 59.0, 65.0, 41.0, 45.0, 36.0, 32.0, 19.0, 20.0, 20.0, 6.0, 8.0, 13.0, 7.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-6.671875, -6.4896240234375, -6.307373046875, -6.1251220703125, -5.94287109375, -5.7606201171875, -5.578369140625, -5.3961181640625, -5.2138671875, -5.0316162109375, -4.849365234375, -4.6671142578125, -4.48486328125, -4.3026123046875, -4.120361328125, -3.9381103515625, -3.755859375, -3.5736083984375, -3.391357421875, -3.2091064453125, -3.02685546875, -2.8446044921875, -2.662353515625, -2.4801025390625, -2.2978515625, -2.1156005859375, -1.933349609375, -1.7510986328125, -1.56884765625, -1.3865966796875, -1.204345703125, -1.0220947265625, -0.83984375, -0.6575927734375, -0.475341796875, -0.2930908203125, -0.11083984375, 0.0714111328125, 0.253662109375, 0.4359130859375, 0.6181640625, 0.8004150390625, 0.982666015625, 1.1649169921875, 1.34716796875, 1.5294189453125, 1.711669921875, 1.8939208984375, 2.076171875, 2.2584228515625, 2.440673828125, 2.6229248046875, 2.80517578125, 2.9874267578125, 3.169677734375, 3.3519287109375, 3.5341796875, 3.7164306640625, 3.898681640625, 4.0809326171875, 4.26318359375, 4.4454345703125, 4.627685546875, 4.8099365234375, 4.9921875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 5.0, 3.0, 2.0, 3.0, 7.0, 3.0, 6.0, 9.0, 15.0, 11.0, 20.0, 23.0, 21.0, 25.0, 25.0, 35.0, 35.0, 52.0, 41.0, 43.0, 53.0, 47.0, 44.0, 48.0, 53.0, 42.0, 43.0, 41.0, 46.0, 35.0, 33.0, 19.0, 26.0, 15.0, 21.0, 17.0, 12.0, 11.0, 4.0, 7.0, 3.0, 0.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.835206985473633, -18.094234466552734, -17.35326385498047, -16.61229133605957, -15.871318817138672, -15.13034725189209, -14.389375686645508, -13.64840316772461, -12.907431602478027, -12.166460037231445, -11.425487518310547, -10.684515953063965, -9.943544387817383, -9.202571868896484, -8.461600303649902, -7.720628261566162, -6.979656219482422, -6.238684177398682, -5.497712135314941, -4.756740570068359, -4.015768527984619, -3.274796485900879, -2.533824920654297, -1.7928528785705566, -1.0518808364868164, -0.3109089136123657, 0.43006300926208496, 1.171034812927246, 1.9120068550109863, 2.6529788970947266, 3.3939504623413086, 4.134922504425049, 4.875894546508789, 5.616866588592529, 6.3578386306762695, 7.098810195922852, 7.839782238006592, 8.580754280090332, 9.321725845336914, 10.062698364257812, 10.803669929504395, 11.544641494750977, 12.285614013671875, 13.026585578918457, 13.767557144165039, 14.508529663085938, 15.24950122833252, 15.990472793579102, 16.7314453125, 17.4724178314209, 18.213388442993164, 18.954360961914062, 19.69533348083496, 20.43630599975586, 21.177276611328125, 21.918249130249023, 22.659221649169922, 23.40019416809082, 24.141164779663086, 24.882137298583984, 25.623109817504883, 26.36408233642578, 27.105052947998047, 27.846025466918945, 28.58699607849121]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 4.0, 6.0, 2.0, 5.0, 8.0, 13.0, 11.0, 7.0, 15.0, 21.0, 25.0, 22.0, 28.0, 29.0, 20.0, 34.0, 33.0, 33.0, 37.0, 43.0, 34.0, 45.0, 53.0, 46.0, 33.0, 40.0, 41.0, 37.0, 34.0, 22.0, 28.0, 27.0, 20.0, 28.0, 22.0, 19.0, 11.0, 16.0, 6.0, 14.0, 6.0, 6.0, 7.0, 5.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-22.401037216186523, -21.73367691040039, -21.066314697265625, -20.398954391479492, -19.73159408569336, -19.064233779907227, -18.396873474121094, -17.729511260986328, -17.062150955200195, -16.394790649414062, -15.727429389953613, -15.060068130493164, -14.392707824707031, -13.725347518920898, -13.05798625946045, -12.390625, -11.723264694213867, -11.055904388427734, -10.388543128967285, -9.721181869506836, -9.053821563720703, -8.38646125793457, -7.719099998474121, -7.05173921585083, -6.384378433227539, -5.717017650604248, -5.049656867980957, -4.382296085357666, -3.714935302734375, -3.047574520111084, -2.380213737487793, -1.712852954864502, -1.045492172241211, -0.3781313896179199, 0.2892293930053711, 0.9565901756286621, 1.6239509582519531, 2.291311740875244, 2.958672523498535, 3.626033306121826, 4.293394088745117, 4.960754871368408, 5.628115653991699, 6.29547643661499, 6.962837219238281, 7.630198001861572, 8.297558784484863, 8.964920043945312, 9.632280349731445, 10.299640655517578, 10.967001914978027, 11.634363174438477, 12.30172348022461, 12.969083786010742, 13.636445045471191, 14.30380630493164, 14.971166610717773, 15.638526916503906, 16.305889129638672, 16.973249435424805, 17.640609741210938, 18.30797004699707, 18.975330352783203, 19.64269256591797, 20.3100528717041]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 0.0, 3.0, 9.0, 13.0, 25.0, 42.0, 66.0, 111.0, 205.0, 326.0, 456.0, 784.0, 1244.0, 2022.0, 3365.0, 5427.0, 8735.0, 13675.0, 20771.0, 31196.0, 44752.0, 61385.0, 80027.0, 96494.0, 108949.0, 112842.0, 106634.0, 93116.0, 75662.0, 57570.0, 41599.0, 28781.0, 19281.0, 12419.0, 7739.0, 4966.0, 2998.0, 1889.0, 1140.0, 728.0, 435.0, 250.0, 159.0, 86.0, 79.0, 47.0, 20.0, 16.0, 12.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-15.5546875, -15.0888671875, -14.623046875, -14.1572265625, -13.69140625, -13.2255859375, -12.759765625, -12.2939453125, -11.828125, -11.3623046875, -10.896484375, -10.4306640625, -9.96484375, -9.4990234375, -9.033203125, -8.5673828125, -8.1015625, -7.6357421875, -7.169921875, -6.7041015625, -6.23828125, -5.7724609375, -5.306640625, -4.8408203125, -4.375, -3.9091796875, -3.443359375, -2.9775390625, -2.51171875, -2.0458984375, -1.580078125, -1.1142578125, -0.6484375, -0.1826171875, 0.283203125, 0.7490234375, 1.21484375, 1.6806640625, 2.146484375, 2.6123046875, 3.078125, 3.5439453125, 4.009765625, 4.4755859375, 4.94140625, 5.4072265625, 5.873046875, 6.3388671875, 6.8046875, 7.2705078125, 7.736328125, 8.2021484375, 8.66796875, 9.1337890625, 9.599609375, 10.0654296875, 10.53125, 10.9970703125, 11.462890625, 11.9287109375, 12.39453125, 12.8603515625, 13.326171875, 13.7919921875, 14.2578125]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 5.0, 5.0, 7.0, 10.0, 12.0, 13.0, 16.0, 25.0, 21.0, 27.0, 33.0, 23.0, 35.0, 42.0, 25.0, 35.0, 40.0, 50.0, 53.0, 32.0, 38.0, 46.0, 47.0, 38.0, 25.0, 43.0, 34.0, 31.0, 30.0, 23.0, 16.0, 23.0, 17.0, 15.0, 15.0, 8.0, 10.0, 6.0, 6.0, 8.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.71875, -21.03271484375, -20.3466796875, -19.66064453125, -18.974609375, -18.28857421875, -17.6025390625, -16.91650390625, -16.23046875, -15.54443359375, -14.8583984375, -14.17236328125, -13.486328125, -12.80029296875, -12.1142578125, -11.42822265625, -10.7421875, -10.05615234375, -9.3701171875, -8.68408203125, -7.998046875, -7.31201171875, -6.6259765625, -5.93994140625, -5.25390625, -4.56787109375, -3.8818359375, -3.19580078125, -2.509765625, -1.82373046875, -1.1376953125, -0.45166015625, 0.234375, 0.92041015625, 1.6064453125, 2.29248046875, 2.978515625, 3.66455078125, 4.3505859375, 5.03662109375, 5.72265625, 6.40869140625, 7.0947265625, 7.78076171875, 8.466796875, 9.15283203125, 9.8388671875, 10.52490234375, 11.2109375, 11.89697265625, 12.5830078125, 13.26904296875, 13.955078125, 14.64111328125, 15.3271484375, 16.01318359375, 16.69921875, 17.38525390625, 18.0712890625, 18.75732421875, 19.443359375, 20.12939453125, 20.8154296875, 21.50146484375, 22.1875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 4.0, 13.0, 13.0, 34.0, 40.0, 55.0, 76.0, 135.0, 205.0, 301.0, 453.0, 663.0, 1097.0, 1739.0, 2671.0, 4218.0, 6807.0, 10762.0, 16657.0, 25109.0, 37904.0, 54530.0, 73889.0, 92937.0, 109375.0, 116967.0, 114192.0, 101085.0, 82363.0, 62332.0, 44793.0, 30916.0, 20142.0, 13089.0, 8437.0, 5280.0, 3350.0, 2116.0, 1364.0, 863.0, 578.0, 344.0, 216.0, 150.0, 92.0, 60.0, 45.0, 33.0, 26.0, 15.0, 10.0, 7.0, 4.0, 2.0, 0.0, 3.0, 2.0], "bins": [-16.90625, -16.3896484375, -15.873046875, -15.3564453125, -14.83984375, -14.3232421875, -13.806640625, -13.2900390625, -12.7734375, -12.2568359375, -11.740234375, -11.2236328125, -10.70703125, -10.1904296875, -9.673828125, -9.1572265625, -8.640625, -8.1240234375, -7.607421875, -7.0908203125, -6.57421875, -6.0576171875, -5.541015625, -5.0244140625, -4.5078125, -3.9912109375, -3.474609375, -2.9580078125, -2.44140625, -1.9248046875, -1.408203125, -0.8916015625, -0.375, 0.1416015625, 0.658203125, 1.1748046875, 1.69140625, 2.2080078125, 2.724609375, 3.2412109375, 3.7578125, 4.2744140625, 4.791015625, 5.3076171875, 5.82421875, 6.3408203125, 6.857421875, 7.3740234375, 7.890625, 8.4072265625, 8.923828125, 9.4404296875, 9.95703125, 10.4736328125, 10.990234375, 11.5068359375, 12.0234375, 12.5400390625, 13.056640625, 13.5732421875, 14.08984375, 14.6064453125, 15.123046875, 15.6396484375, 16.15625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 4.0, 3.0, 6.0, 4.0, 7.0, 5.0, 8.0, 11.0, 14.0, 15.0, 25.0, 30.0, 18.0, 35.0, 23.0, 27.0, 40.0, 22.0, 31.0, 26.0, 32.0, 34.0, 42.0, 39.0, 42.0, 32.0, 38.0, 45.0, 39.0, 33.0, 31.0, 38.0, 19.0, 20.0, 15.0, 21.0, 22.0, 18.0, 20.0, 13.0, 12.0, 10.0, 6.0, 5.0, 3.0, 4.0, 3.0, 2.0, 4.0, 6.0, 0.0, 4.0, 0.0, 1.0], "bins": [-12.90625, -12.5198974609375, -12.133544921875, -11.7471923828125, -11.36083984375, -10.9744873046875, -10.588134765625, -10.2017822265625, -9.8154296875, -9.4290771484375, -9.042724609375, -8.6563720703125, -8.27001953125, -7.8836669921875, -7.497314453125, -7.1109619140625, -6.724609375, -6.3382568359375, -5.951904296875, -5.5655517578125, -5.17919921875, -4.7928466796875, -4.406494140625, -4.0201416015625, -3.6337890625, -3.2474365234375, -2.861083984375, -2.4747314453125, -2.08837890625, -1.7020263671875, -1.315673828125, -0.9293212890625, -0.54296875, -0.1566162109375, 0.229736328125, 0.6160888671875, 1.00244140625, 1.3887939453125, 1.775146484375, 2.1614990234375, 2.5478515625, 2.9342041015625, 3.320556640625, 3.7069091796875, 4.09326171875, 4.4796142578125, 4.865966796875, 5.2523193359375, 5.638671875, 6.0250244140625, 6.411376953125, 6.7977294921875, 7.18408203125, 7.5704345703125, 7.956787109375, 8.3431396484375, 8.7294921875, 9.1158447265625, 9.502197265625, 9.8885498046875, 10.27490234375, 10.6612548828125, 11.047607421875, 11.4339599609375, 11.8203125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 6.0, 4.0, 14.0, 21.0, 34.0, 48.0, 86.0, 152.0, 223.0, 388.0, 615.0, 1037.0, 1796.0, 3053.0, 4993.0, 8547.0, 14239.0, 23974.0, 39212.0, 60616.0, 89661.0, 119760.0, 141035.0, 143189.0, 125228.0, 95909.0, 66234.0, 42858.0, 26293.0, 15909.0, 9464.0, 5717.0, 3335.0, 1945.0, 1204.0, 715.0, 416.0, 256.0, 161.0, 88.0, 52.0, 33.0, 13.0, 11.0, 10.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.046875, -7.79620361328125, -7.5455322265625, -7.29486083984375, -7.044189453125, -6.79351806640625, -6.5428466796875, -6.29217529296875, -6.04150390625, -5.79083251953125, -5.5401611328125, -5.28948974609375, -5.038818359375, -4.78814697265625, -4.5374755859375, -4.28680419921875, -4.0361328125, -3.78546142578125, -3.5347900390625, -3.28411865234375, -3.033447265625, -2.78277587890625, -2.5321044921875, -2.28143310546875, -2.03076171875, -1.78009033203125, -1.5294189453125, -1.27874755859375, -1.028076171875, -0.77740478515625, -0.5267333984375, -0.27606201171875, -0.025390625, 0.22528076171875, 0.4759521484375, 0.72662353515625, 0.977294921875, 1.22796630859375, 1.4786376953125, 1.72930908203125, 1.97998046875, 2.23065185546875, 2.4813232421875, 2.73199462890625, 2.982666015625, 3.23333740234375, 3.4840087890625, 3.73468017578125, 3.9853515625, 4.23602294921875, 4.4866943359375, 4.73736572265625, 4.988037109375, 5.23870849609375, 5.4893798828125, 5.74005126953125, 5.99072265625, 6.24139404296875, 6.4920654296875, 6.74273681640625, 6.993408203125, 7.24407958984375, 7.4947509765625, 7.74542236328125, 7.99609375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 9.0, 8.0, 10.0, 17.0, 12.0, 16.0, 22.0, 23.0, 33.0, 40.0, 31.0, 38.0, 47.0, 56.0, 53.0, 52.0, 49.0, 48.0, 51.0, 57.0, 54.0, 39.0, 35.0, 38.0, 33.0, 18.0, 27.0, 17.0, 11.0, 15.0, 8.0, 9.0, 8.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007271766662597656, -0.0006975308060646057, -0.0006678849458694458, -0.0006382390856742859, -0.000608593225479126, -0.0005789473652839661, -0.0005493015050888062, -0.0005196556448936462, -0.0004900097846984863, -0.0004603639245033264, -0.0004307180643081665, -0.0004010722041130066, -0.0003714263439178467, -0.00034178048372268677, -0.00031213462352752686, -0.00028248876333236694, -0.00025284290313720703, -0.00022319704294204712, -0.0001935511827468872, -0.0001639053225517273, -0.00013425946235656738, -0.00010461360216140747, -7.496774196624756e-05, -4.5321881771087646e-05, -1.5676021575927734e-05, 1.3969838619232178e-05, 4.361569881439209e-05, 7.3261559009552e-05, 0.00010290741920471191, 0.00013255327939987183, 0.00016219913959503174, 0.00019184499979019165, 0.00022149085998535156, 0.0002511367201805115, 0.0002807825803756714, 0.0003104284405708313, 0.0003400743007659912, 0.0003697201609611511, 0.00039936602115631104, 0.00042901188135147095, 0.00045865774154663086, 0.0004883036017417908, 0.0005179494619369507, 0.0005475953221321106, 0.0005772411823272705, 0.0006068870425224304, 0.0006365329027175903, 0.0006661787629127502, 0.0006958246231079102, 0.0007254704833030701, 0.00075511634349823, 0.0007847622036933899, 0.0008144080638885498, 0.0008440539240837097, 0.0008736997842788696, 0.0009033456444740295, 0.0009329915046691895, 0.0009626373648643494, 0.0009922832250595093, 0.0010219290852546692, 0.001051574945449829, 0.001081220805644989, 0.001110866665840149, 0.0011405125260353088, 0.0011701583862304688]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 6.0, 10.0, 15.0, 24.0, 22.0, 51.0, 58.0, 107.0, 152.0, 265.0, 431.0, 761.0, 1341.0, 2258.0, 3922.0, 7142.0, 12678.0, 21715.0, 35810.0, 57630.0, 85680.0, 115920.0, 138994.0, 144600.0, 130304.0, 102630.0, 71731.0, 46674.0, 28634.0, 16594.0, 9622.0, 5443.0, 3057.0, 1749.0, 1030.0, 569.0, 383.0, 222.0, 116.0, 71.0, 49.0, 29.0, 15.0, 13.0, 8.0, 9.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.03125, -7.7823486328125, -7.533447265625, -7.2845458984375, -7.03564453125, -6.7867431640625, -6.537841796875, -6.2889404296875, -6.0400390625, -5.7911376953125, -5.542236328125, -5.2933349609375, -5.04443359375, -4.7955322265625, -4.546630859375, -4.2977294921875, -4.048828125, -3.7999267578125, -3.551025390625, -3.3021240234375, -3.05322265625, -2.8043212890625, -2.555419921875, -2.3065185546875, -2.0576171875, -1.8087158203125, -1.559814453125, -1.3109130859375, -1.06201171875, -0.8131103515625, -0.564208984375, -0.3153076171875, -0.06640625, 0.1824951171875, 0.431396484375, 0.6802978515625, 0.92919921875, 1.1781005859375, 1.427001953125, 1.6759033203125, 1.9248046875, 2.1737060546875, 2.422607421875, 2.6715087890625, 2.92041015625, 3.1693115234375, 3.418212890625, 3.6671142578125, 3.916015625, 4.1649169921875, 4.413818359375, 4.6627197265625, 4.91162109375, 5.1605224609375, 5.409423828125, 5.6583251953125, 5.9072265625, 6.1561279296875, 6.405029296875, 6.6539306640625, 6.90283203125, 7.1517333984375, 7.400634765625, 7.6495361328125, 7.8984375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 6.0, 4.0, 10.0, 9.0, 8.0, 12.0, 16.0, 16.0, 18.0, 28.0, 31.0, 48.0, 45.0, 43.0, 40.0, 45.0, 48.0, 52.0, 39.0, 55.0, 50.0, 40.0, 51.0, 45.0, 36.0, 24.0, 20.0, 20.0, 28.0, 18.0, 21.0, 14.0, 12.0, 6.0, 8.0, 9.0, 6.0, 2.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.408203125, -2.32293701171875, -2.2376708984375, -2.15240478515625, -2.067138671875, -1.98187255859375, -1.8966064453125, -1.81134033203125, -1.72607421875, -1.64080810546875, -1.5555419921875, -1.47027587890625, -1.385009765625, -1.29974365234375, -1.2144775390625, -1.12921142578125, -1.0439453125, -0.95867919921875, -0.8734130859375, -0.78814697265625, -0.702880859375, -0.61761474609375, -0.5323486328125, -0.44708251953125, -0.36181640625, -0.27655029296875, -0.1912841796875, -0.10601806640625, -0.020751953125, 0.06451416015625, 0.1497802734375, 0.23504638671875, 0.3203125, 0.40557861328125, 0.4908447265625, 0.57611083984375, 0.661376953125, 0.74664306640625, 0.8319091796875, 0.91717529296875, 1.00244140625, 1.08770751953125, 1.1729736328125, 1.25823974609375, 1.343505859375, 1.42877197265625, 1.5140380859375, 1.59930419921875, 1.6845703125, 1.76983642578125, 1.8551025390625, 1.94036865234375, 2.025634765625, 2.11090087890625, 2.1961669921875, 2.28143310546875, 2.36669921875, 2.45196533203125, 2.5372314453125, 2.62249755859375, 2.707763671875, 2.79302978515625, 2.8782958984375, 2.96356201171875, 3.048828125]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 4.0, 4.0, 10.0, 12.0, 17.0, 12.0, 22.0, 18.0, 17.0, 33.0, 32.0, 30.0, 33.0, 40.0, 44.0, 38.0, 45.0, 50.0, 43.0, 44.0, 41.0, 41.0, 43.0, 41.0, 35.0, 38.0, 36.0, 30.0, 27.0, 17.0, 24.0, 22.0, 11.0, 8.0, 8.0, 8.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.8098087310791, -21.138233184814453, -20.466657638549805, -19.795082092285156, -19.12350845336914, -18.451932907104492, -17.780357360839844, -17.108781814575195, -16.437206268310547, -15.765630722045898, -15.094056129455566, -14.422480583190918, -13.750905990600586, -13.079330444335938, -12.407754898071289, -11.73617935180664, -11.064605712890625, -10.393030166625977, -9.721455574035645, -9.049880027770996, -8.378305435180664, -7.706729888916016, -7.035154342651367, -6.363579273223877, -5.692004203796387, -5.0204291343688965, -4.348854064941406, -3.677278518676758, -3.0057034492492676, -2.3341283798217773, -1.662552833557129, -0.9909777641296387, -0.31940460205078125, 0.35217058658599854, 1.0237457752227783, 1.6953210830688477, 2.366896152496338, 3.038471221923828, 3.7100467681884766, 4.381621837615967, 5.053196907043457, 5.724771976470947, 6.3963470458984375, 7.067922592163086, 7.739497661590576, 8.411072731018066, 9.082648277282715, 9.754222869873047, 10.425798416137695, 11.097373962402344, 11.768948554992676, 12.440524101257324, 13.112098693847656, 13.783674240112305, 14.455249786376953, 15.126825332641602, 15.798399925231934, 16.469974517822266, 17.141550064086914, 17.813125610351562, 18.48470115661621, 19.15627670288086, 19.827850341796875, 20.499425888061523, 21.171001434326172]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 4.0, 5.0, 7.0, 17.0, 8.0, 6.0, 9.0, 17.0, 13.0, 23.0, 24.0, 19.0, 32.0, 33.0, 23.0, 31.0, 35.0, 47.0, 58.0, 28.0, 48.0, 43.0, 46.0, 25.0, 39.0, 35.0, 35.0, 40.0, 44.0, 21.0, 23.0, 16.0, 26.0, 22.0, 19.0, 8.0, 11.0, 10.0, 11.0, 6.0, 10.0, 7.0, 6.0, 2.0, 5.0, 2.0, 1.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-21.029443740844727, -20.367202758789062, -19.7049617767334, -19.042720794677734, -18.38047981262207, -17.718238830566406, -17.05599594116211, -16.393754959106445, -15.731513977050781, -15.069272994995117, -14.407032012939453, -13.744791030883789, -13.082549095153809, -12.420308113098145, -11.75806713104248, -11.0958251953125, -10.433585166931152, -9.771344184875488, -9.109103202819824, -8.446861267089844, -7.78462028503418, -7.122379302978516, -6.460138320922852, -5.797896862030029, -5.135655879974365, -4.473414897918701, -3.811173439025879, -3.148932456970215, -2.4866912364959717, -1.8244500160217285, -1.1622090339660645, -0.4999675750732422, 0.16227340698242188, 0.8245145678520203, 1.4867557287216187, 2.1489968299865723, 2.8112380504608154, 3.4734792709350586, 4.135720252990723, 4.797961711883545, 5.460202693939209, 6.122443675994873, 6.784685134887695, 7.446926116943359, 8.109167098999023, 8.771408081054688, 9.433649063110352, 10.095890998840332, 10.758131980895996, 11.42037296295166, 12.082613945007324, 12.744855880737305, 13.407096862792969, 14.069337844848633, 14.731578826904297, 15.393819808959961, 16.056060791015625, 16.71830177307129, 17.380542755126953, 18.042783737182617, 18.70502471923828, 19.367267608642578, 20.02950668334961, 20.691749572753906, 21.35399055480957]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 8.0, 13.0, 9.0, 23.0, 37.0, 35.0, 57.0, 88.0, 134.0, 202.0, 297.0, 529.0, 908.0, 1342.0, 2239.0, 3789.0, 6367.0, 10961.0, 19143.0, 33886.0, 61417.0, 112748.0, 201629.0, 342803.0, 521297.0, 669180.0, 691780.0, 573551.0, 393460.0, 238562.0, 135125.0, 74692.0, 41494.0, 23387.0, 13412.0, 7821.0, 4742.0, 2753.0, 1694.0, 994.0, 645.0, 397.0, 243.0, 147.0, 99.0, 50.0, 37.0, 26.0, 19.0, 15.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.953125, -17.394775390625, -16.83642578125, -16.278076171875, -15.7197265625, -15.161376953125, -14.60302734375, -14.044677734375, -13.486328125, -12.927978515625, -12.36962890625, -11.811279296875, -11.2529296875, -10.694580078125, -10.13623046875, -9.577880859375, -9.01953125, -8.461181640625, -7.90283203125, -7.344482421875, -6.7861328125, -6.227783203125, -5.66943359375, -5.111083984375, -4.552734375, -3.994384765625, -3.43603515625, -2.877685546875, -2.3193359375, -1.760986328125, -1.20263671875, -0.644287109375, -0.0859375, 0.472412109375, 1.03076171875, 1.589111328125, 2.1474609375, 2.705810546875, 3.26416015625, 3.822509765625, 4.380859375, 4.939208984375, 5.49755859375, 6.055908203125, 6.6142578125, 7.172607421875, 7.73095703125, 8.289306640625, 8.84765625, 9.406005859375, 9.96435546875, 10.522705078125, 11.0810546875, 11.639404296875, 12.19775390625, 12.756103515625, 13.314453125, 13.872802734375, 14.43115234375, 14.989501953125, 15.5478515625, 16.106201171875, 16.66455078125, 17.222900390625, 17.78125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 6.0, 10.0, 11.0, 14.0, 14.0, 17.0, 18.0, 22.0, 34.0, 31.0, 36.0, 38.0, 34.0, 36.0, 48.0, 35.0, 54.0, 49.0, 51.0, 47.0, 37.0, 45.0, 38.0, 35.0, 39.0, 22.0, 26.0, 15.0, 27.0, 22.0, 15.0, 15.0, 7.0, 12.0, 13.0, 6.0, 4.0, 7.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.03125, -20.39208984375, -19.7529296875, -19.11376953125, -18.474609375, -17.83544921875, -17.1962890625, -16.55712890625, -15.91796875, -15.27880859375, -14.6396484375, -14.00048828125, -13.361328125, -12.72216796875, -12.0830078125, -11.44384765625, -10.8046875, -10.16552734375, -9.5263671875, -8.88720703125, -8.248046875, -7.60888671875, -6.9697265625, -6.33056640625, -5.69140625, -5.05224609375, -4.4130859375, -3.77392578125, -3.134765625, -2.49560546875, -1.8564453125, -1.21728515625, -0.578125, 0.06103515625, 0.7001953125, 1.33935546875, 1.978515625, 2.61767578125, 3.2568359375, 3.89599609375, 4.53515625, 5.17431640625, 5.8134765625, 6.45263671875, 7.091796875, 7.73095703125, 8.3701171875, 9.00927734375, 9.6484375, 10.28759765625, 10.9267578125, 11.56591796875, 12.205078125, 12.84423828125, 13.4833984375, 14.12255859375, 14.76171875, 15.40087890625, 16.0400390625, 16.67919921875, 17.318359375, 17.95751953125, 18.5966796875, 19.23583984375, 19.875]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 7.0, 4.0, 8.0, 17.0, 59.0, 57.0, 108.0, 184.0, 310.0, 497.0, 843.0, 1510.0, 2626.0, 4738.0, 8520.0, 15014.0, 26996.0, 48792.0, 87159.0, 152838.0, 259024.0, 409223.0, 579404.0, 683271.0, 642734.0, 489873.0, 323748.0, 196655.0, 114308.0, 64509.0, 36105.0, 19693.0, 10961.0, 6219.0, 3561.0, 1920.0, 1115.0, 703.0, 403.0, 242.0, 130.0, 79.0, 62.0, 26.0, 13.0, 10.0, 9.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-21.875, -21.2265625, -20.578125, -19.9296875, -19.28125, -18.6328125, -17.984375, -17.3359375, -16.6875, -16.0390625, -15.390625, -14.7421875, -14.09375, -13.4453125, -12.796875, -12.1484375, -11.5, -10.8515625, -10.203125, -9.5546875, -8.90625, -8.2578125, -7.609375, -6.9609375, -6.3125, -5.6640625, -5.015625, -4.3671875, -3.71875, -3.0703125, -2.421875, -1.7734375, -1.125, -0.4765625, 0.171875, 0.8203125, 1.46875, 2.1171875, 2.765625, 3.4140625, 4.0625, 4.7109375, 5.359375, 6.0078125, 6.65625, 7.3046875, 7.953125, 8.6015625, 9.25, 9.8984375, 10.546875, 11.1953125, 11.84375, 12.4921875, 13.140625, 13.7890625, 14.4375, 15.0859375, 15.734375, 16.3828125, 17.03125, 17.6796875, 18.328125, 18.9765625, 19.625]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 7.0, 10.0, 5.0, 15.0, 15.0, 23.0, 24.0, 37.0, 45.0, 70.0, 59.0, 82.0, 96.0, 123.0, 144.0, 150.0, 157.0, 178.0, 201.0, 216.0, 257.0, 218.0, 238.0, 226.0, 212.0, 204.0, 196.0, 139.0, 123.0, 131.0, 91.0, 81.0, 72.0, 50.0, 42.0, 39.0, 33.0, 25.0, 13.0, 7.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-8.71875, -8.4659423828125, -8.213134765625, -7.9603271484375, -7.70751953125, -7.4547119140625, -7.201904296875, -6.9490966796875, -6.6962890625, -6.4434814453125, -6.190673828125, -5.9378662109375, -5.68505859375, -5.4322509765625, -5.179443359375, -4.9266357421875, -4.673828125, -4.4210205078125, -4.168212890625, -3.9154052734375, -3.66259765625, -3.4097900390625, -3.156982421875, -2.9041748046875, -2.6513671875, -2.3985595703125, -2.145751953125, -1.8929443359375, -1.64013671875, -1.3873291015625, -1.134521484375, -0.8817138671875, -0.62890625, -0.3760986328125, -0.123291015625, 0.1295166015625, 0.38232421875, 0.6351318359375, 0.887939453125, 1.1407470703125, 1.3935546875, 1.6463623046875, 1.899169921875, 2.1519775390625, 2.40478515625, 2.6575927734375, 2.910400390625, 3.1632080078125, 3.416015625, 3.6688232421875, 3.921630859375, 4.1744384765625, 4.42724609375, 4.6800537109375, 4.932861328125, 5.1856689453125, 5.4384765625, 5.6912841796875, 5.944091796875, 6.1968994140625, 6.44970703125, 6.7025146484375, 6.955322265625, 7.2081298828125, 7.4609375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 6.0, 4.0, 10.0, 12.0, 9.0, 9.0, 11.0, 14.0, 17.0, 20.0, 22.0, 23.0, 22.0, 43.0, 38.0, 35.0, 36.0, 38.0, 56.0, 46.0, 38.0, 43.0, 30.0, 29.0, 37.0, 37.0, 37.0, 31.0, 32.0, 38.0, 28.0, 26.0, 22.0, 22.0, 13.0, 10.0, 11.0, 7.0, 10.0, 9.0, 3.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.29783821105957, -19.682409286499023, -19.06698226928711, -18.451553344726562, -17.836124420166016, -17.22069549560547, -16.605266571044922, -15.989839553833008, -15.374410629272461, -14.758981704711914, -14.143553733825684, -13.528125762939453, -12.912696838378906, -12.29726791381836, -11.681839942932129, -11.066411972045898, -10.450983047485352, -9.835554122924805, -9.220126152038574, -8.604698181152344, -7.989269256591797, -7.373840808868408, -6.7584123611450195, -6.142983913421631, -5.527555465698242, -4.9121270179748535, -4.296698570251465, -3.681270122528076, -3.0658416748046875, -2.450413227081299, -1.8349847793579102, -1.2195563316345215, -0.6041259765625, 0.011302471160888672, 0.6267309188842773, 1.242159366607666, 1.8575878143310547, 2.4730162620544434, 3.088444709777832, 3.7038731575012207, 4.319301605224609, 4.934730052947998, 5.550158500671387, 6.165586948394775, 6.781015396118164, 7.396443843841553, 8.011872291564941, 8.627300262451172, 9.242729187011719, 9.858158111572266, 10.473586082458496, 11.089014053344727, 11.704442977905273, 12.31987190246582, 12.93529987335205, 13.550727844238281, 14.166156768798828, 14.781585693359375, 15.397013664245605, 16.012441635131836, 16.627870559692383, 17.24329948425293, 17.858726501464844, 18.47415542602539, 19.089584350585938]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 3.0, 7.0, 3.0, 2.0, 9.0, 11.0, 12.0, 18.0, 15.0, 14.0, 16.0, 23.0, 23.0, 26.0, 28.0, 30.0, 23.0, 26.0, 36.0, 37.0, 53.0, 49.0, 43.0, 32.0, 29.0, 40.0, 32.0, 34.0, 39.0, 25.0, 29.0, 32.0, 28.0, 27.0, 22.0, 21.0, 9.0, 15.0, 10.0, 9.0, 14.0, 14.0, 8.0, 7.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.31538200378418, -17.731037139892578, -17.146692276000977, -16.562347412109375, -15.97800350189209, -15.393658638000488, -14.809314727783203, -14.224969863891602, -13.640625, -13.056280136108398, -12.471935272216797, -11.887591361999512, -11.30324649810791, -10.718901634216309, -10.134557723999023, -9.550212860107422, -8.96586799621582, -8.381523132324219, -7.797178745269775, -7.212834358215332, -6.6284894943237305, -6.044144630432129, -5.4598002433776855, -4.875455856323242, -4.291110992431641, -3.706766366958618, -3.1224217414855957, -2.5380771160125732, -1.9537324905395508, -1.3693878650665283, -0.7850432395935059, -0.2006988525390625, 0.3836479187011719, 0.9679925441741943, 1.5523371696472168, 2.1366817951202393, 2.7210264205932617, 3.305371046066284, 3.8897156715393066, 4.47406005859375, 5.058404922485352, 5.642749786376953, 6.2270941734313965, 6.81143856048584, 7.395783424377441, 7.980128288269043, 8.564472198486328, 9.14881706237793, 9.733161926269531, 10.317506790161133, 10.901851654052734, 11.48619556427002, 12.070540428161621, 12.654885292053223, 13.239229202270508, 13.82357406616211, 14.407918930053711, 14.992263793945312, 15.576608657836914, 16.160953521728516, 16.745296478271484, 17.329641342163086, 17.913986206054688, 18.49833106994629, 19.08267593383789]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 7.0, 11.0, 24.0, 32.0, 51.0, 90.0, 129.0, 223.0, 301.0, 508.0, 863.0, 1525.0, 2671.0, 4689.0, 8256.0, 14678.0, 25957.0, 44806.0, 74717.0, 114477.0, 152410.0, 167564.0, 150147.0, 111159.0, 72111.0, 43289.0, 25124.0, 14040.0, 7967.0, 4556.0, 2508.0, 1445.0, 884.0, 545.0, 294.0, 203.0, 106.0, 83.0, 40.0, 20.0, 18.0, 8.0, 11.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.953125, -17.400146484375, -16.84716796875, -16.294189453125, -15.7412109375, -15.188232421875, -14.63525390625, -14.082275390625, -13.529296875, -12.976318359375, -12.42333984375, -11.870361328125, -11.3173828125, -10.764404296875, -10.21142578125, -9.658447265625, -9.10546875, -8.552490234375, -7.99951171875, -7.446533203125, -6.8935546875, -6.340576171875, -5.78759765625, -5.234619140625, -4.681640625, -4.128662109375, -3.57568359375, -3.022705078125, -2.4697265625, -1.916748046875, -1.36376953125, -0.810791015625, -0.2578125, 0.295166015625, 0.84814453125, 1.401123046875, 1.9541015625, 2.507080078125, 3.06005859375, 3.613037109375, 4.166015625, 4.718994140625, 5.27197265625, 5.824951171875, 6.3779296875, 6.930908203125, 7.48388671875, 8.036865234375, 8.58984375, 9.142822265625, 9.69580078125, 10.248779296875, 10.8017578125, 11.354736328125, 11.90771484375, 12.460693359375, 13.013671875, 13.566650390625, 14.11962890625, 14.672607421875, 15.2255859375, 15.778564453125, 16.33154296875, 16.884521484375, 17.4375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 2.0, 5.0, 4.0, 5.0, 5.0, 7.0, 6.0, 17.0, 16.0, 17.0, 21.0, 14.0, 22.0, 24.0, 29.0, 34.0, 32.0, 28.0, 37.0, 35.0, 35.0, 27.0, 40.0, 40.0, 44.0, 43.0, 34.0, 36.0, 35.0, 32.0, 41.0, 32.0, 25.0, 19.0, 23.0, 16.0, 27.0, 17.0, 13.0, 8.0, 15.0, 4.0, 5.0, 12.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 6.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.8125, -19.20849609375, -18.6044921875, -18.00048828125, -17.396484375, -16.79248046875, -16.1884765625, -15.58447265625, -14.98046875, -14.37646484375, -13.7724609375, -13.16845703125, -12.564453125, -11.96044921875, -11.3564453125, -10.75244140625, -10.1484375, -9.54443359375, -8.9404296875, -8.33642578125, -7.732421875, -7.12841796875, -6.5244140625, -5.92041015625, -5.31640625, -4.71240234375, -4.1083984375, -3.50439453125, -2.900390625, -2.29638671875, -1.6923828125, -1.08837890625, -0.484375, 0.11962890625, 0.7236328125, 1.32763671875, 1.931640625, 2.53564453125, 3.1396484375, 3.74365234375, 4.34765625, 4.95166015625, 5.5556640625, 6.15966796875, 6.763671875, 7.36767578125, 7.9716796875, 8.57568359375, 9.1796875, 9.78369140625, 10.3876953125, 10.99169921875, 11.595703125, 12.19970703125, 12.8037109375, 13.40771484375, 14.01171875, 14.61572265625, 15.2197265625, 15.82373046875, 16.427734375, 17.03173828125, 17.6357421875, 18.23974609375, 18.84375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 4.0, 6.0, 16.0, 30.0, 27.0, 49.0, 65.0, 101.0, 145.0, 244.0, 361.0, 502.0, 765.0, 1172.0, 1827.0, 2957.0, 4943.0, 8407.0, 14994.0, 27279.0, 51419.0, 96055.0, 164995.0, 219600.0, 191173.0, 118531.0, 64575.0, 34017.0, 18428.0, 10333.0, 5896.0, 3448.0, 2178.0, 1337.0, 898.0, 622.0, 387.0, 261.0, 174.0, 116.0, 75.0, 58.0, 35.0, 23.0, 9.0, 6.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.5, -23.701416015625, -22.90283203125, -22.104248046875, -21.3056640625, -20.507080078125, -19.70849609375, -18.909912109375, -18.111328125, -17.312744140625, -16.51416015625, -15.715576171875, -14.9169921875, -14.118408203125, -13.31982421875, -12.521240234375, -11.72265625, -10.924072265625, -10.12548828125, -9.326904296875, -8.5283203125, -7.729736328125, -6.93115234375, -6.132568359375, -5.333984375, -4.535400390625, -3.73681640625, -2.938232421875, -2.1396484375, -1.341064453125, -0.54248046875, 0.256103515625, 1.0546875, 1.853271484375, 2.65185546875, 3.450439453125, 4.2490234375, 5.047607421875, 5.84619140625, 6.644775390625, 7.443359375, 8.241943359375, 9.04052734375, 9.839111328125, 10.6376953125, 11.436279296875, 12.23486328125, 13.033447265625, 13.83203125, 14.630615234375, 15.42919921875, 16.227783203125, 17.0263671875, 17.824951171875, 18.62353515625, 19.422119140625, 20.220703125, 21.019287109375, 21.81787109375, 22.616455078125, 23.4150390625, 24.213623046875, 25.01220703125, 25.810791015625, 26.609375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 6.0, 9.0, 8.0, 9.0, 8.0, 12.0, 11.0, 12.0, 11.0, 28.0, 22.0, 24.0, 32.0, 43.0, 31.0, 29.0, 30.0, 41.0, 35.0, 40.0, 42.0, 47.0, 37.0, 32.0, 40.0, 34.0, 27.0, 29.0, 25.0, 30.0, 28.0, 23.0, 22.0, 24.0, 24.0, 20.0, 16.0, 11.0, 14.0, 9.0, 9.0, 4.0, 9.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-13.671875, -13.2803955078125, -12.888916015625, -12.4974365234375, -12.10595703125, -11.7144775390625, -11.322998046875, -10.9315185546875, -10.5400390625, -10.1485595703125, -9.757080078125, -9.3656005859375, -8.97412109375, -8.5826416015625, -8.191162109375, -7.7996826171875, -7.408203125, -7.0167236328125, -6.625244140625, -6.2337646484375, -5.84228515625, -5.4508056640625, -5.059326171875, -4.6678466796875, -4.2763671875, -3.8848876953125, -3.493408203125, -3.1019287109375, -2.71044921875, -2.3189697265625, -1.927490234375, -1.5360107421875, -1.14453125, -0.7530517578125, -0.361572265625, 0.0299072265625, 0.42138671875, 0.8128662109375, 1.204345703125, 1.5958251953125, 1.9873046875, 2.3787841796875, 2.770263671875, 3.1617431640625, 3.55322265625, 3.9447021484375, 4.336181640625, 4.7276611328125, 5.119140625, 5.5106201171875, 5.902099609375, 6.2935791015625, 6.68505859375, 7.0765380859375, 7.468017578125, 7.8594970703125, 8.2509765625, 8.6424560546875, 9.033935546875, 9.4254150390625, 9.81689453125, 10.2083740234375, 10.599853515625, 10.9913330078125, 11.3828125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 11.0, 11.0, 14.0, 15.0, 15.0, 19.0, 35.0, 36.0, 60.0, 98.0, 130.0, 183.0, 300.0, 448.0, 789.0, 1266.0, 2399.0, 4583.0, 9584.0, 21539.0, 50672.0, 118650.0, 234241.0, 280066.0, 177611.0, 81607.0, 34651.0, 14770.0, 6915.0, 3404.0, 1769.0, 917.0, 564.0, 368.0, 221.0, 140.0, 124.0, 80.0, 61.0, 53.0, 35.0, 22.0, 17.0, 13.0, 10.0, 13.0, 9.0, 8.0, 8.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.671875, -12.239013671875, -11.80615234375, -11.373291015625, -10.9404296875, -10.507568359375, -10.07470703125, -9.641845703125, -9.208984375, -8.776123046875, -8.34326171875, -7.910400390625, -7.4775390625, -7.044677734375, -6.61181640625, -6.178955078125, -5.74609375, -5.313232421875, -4.88037109375, -4.447509765625, -4.0146484375, -3.581787109375, -3.14892578125, -2.716064453125, -2.283203125, -1.850341796875, -1.41748046875, -0.984619140625, -0.5517578125, -0.118896484375, 0.31396484375, 0.746826171875, 1.1796875, 1.612548828125, 2.04541015625, 2.478271484375, 2.9111328125, 3.343994140625, 3.77685546875, 4.209716796875, 4.642578125, 5.075439453125, 5.50830078125, 5.941162109375, 6.3740234375, 6.806884765625, 7.23974609375, 7.672607421875, 8.10546875, 8.538330078125, 8.97119140625, 9.404052734375, 9.8369140625, 10.269775390625, 10.70263671875, 11.135498046875, 11.568359375, 12.001220703125, 12.43408203125, 12.866943359375, 13.2998046875, 13.732666015625, 14.16552734375, 14.598388671875, 15.03125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 7.0, 12.0, 17.0, 23.0, 25.0, 45.0, 67.0, 70.0, 91.0, 110.0, 99.0, 98.0, 97.0, 69.0, 47.0, 36.0, 25.0, 27.0, 7.0, 7.0, 9.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0014801025390625, -0.0014474540948867798, -0.0014148056507110596, -0.0013821572065353394, -0.0013495087623596191, -0.001316860318183899, -0.0012842118740081787, -0.0012515634298324585, -0.0012189149856567383, -0.001186266541481018, -0.0011536180973052979, -0.0011209696531295776, -0.0010883212089538574, -0.0010556727647781372, -0.001023024320602417, -0.0009903758764266968, -0.0009577274322509766, -0.0009250789880752563, -0.0008924305438995361, -0.0008597820997238159, -0.0008271336555480957, -0.0007944852113723755, -0.0007618367671966553, -0.0007291883230209351, -0.0006965398788452148, -0.0006638914346694946, -0.0006312429904937744, -0.0005985945463180542, -0.000565946102142334, -0.0005332976579666138, -0.0005006492137908936, -0.00046800076961517334, -0.0004353523254394531, -0.0004027038812637329, -0.0003700554370880127, -0.0003374069929122925, -0.00030475854873657227, -0.00027211010456085205, -0.00023946166038513184, -0.00020681321620941162, -0.0001741647720336914, -0.0001415163278579712, -0.00010886788368225098, -7.621943950653076e-05, -4.357099533081055e-05, -1.0922551155090332e-05, 2.1725893020629883e-05, 5.43743371963501e-05, 8.702278137207031e-05, 0.00011967122554779053, 0.00015231966972351074, 0.00018496811389923096, 0.00021761655807495117, 0.0002502650022506714, 0.0002829134464263916, 0.0003155618906021118, 0.00034821033477783203, 0.00038085877895355225, 0.00041350722312927246, 0.0004461556673049927, 0.0004788041114807129, 0.0005114525556564331, 0.0005441009998321533, 0.0005767494440078735, 0.0006093978881835938]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 5.0, 9.0, 20.0, 28.0, 27.0, 40.0, 60.0, 75.0, 138.0, 238.0, 364.0, 543.0, 1009.0, 1716.0, 3012.0, 5486.0, 10271.0, 19542.0, 37078.0, 68026.0, 114821.0, 165041.0, 188782.0, 166105.0, 116008.0, 68772.0, 37992.0, 19718.0, 10542.0, 5534.0, 3084.0, 1743.0, 1013.0, 618.0, 374.0, 242.0, 137.0, 106.0, 72.0, 53.0, 35.0, 21.0, 17.0, 14.0, 6.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0], "bins": [-12.109375, -11.748046875, -11.38671875, -11.025390625, -10.6640625, -10.302734375, -9.94140625, -9.580078125, -9.21875, -8.857421875, -8.49609375, -8.134765625, -7.7734375, -7.412109375, -7.05078125, -6.689453125, -6.328125, -5.966796875, -5.60546875, -5.244140625, -4.8828125, -4.521484375, -4.16015625, -3.798828125, -3.4375, -3.076171875, -2.71484375, -2.353515625, -1.9921875, -1.630859375, -1.26953125, -0.908203125, -0.546875, -0.185546875, 0.17578125, 0.537109375, 0.8984375, 1.259765625, 1.62109375, 1.982421875, 2.34375, 2.705078125, 3.06640625, 3.427734375, 3.7890625, 4.150390625, 4.51171875, 4.873046875, 5.234375, 5.595703125, 5.95703125, 6.318359375, 6.6796875, 7.041015625, 7.40234375, 7.763671875, 8.125, 8.486328125, 8.84765625, 9.208984375, 9.5703125, 9.931640625, 10.29296875, 10.654296875, 11.015625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 5.0, 7.0, 6.0, 7.0, 4.0, 14.0, 10.0, 15.0, 20.0, 23.0, 18.0, 30.0, 31.0, 36.0, 44.0, 42.0, 39.0, 60.0, 56.0, 50.0, 29.0, 42.0, 47.0, 47.0, 34.0, 42.0, 29.0, 30.0, 31.0, 29.0, 26.0, 19.0, 15.0, 11.0, 14.0, 12.0, 4.0, 2.0, 7.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-3.375, -3.2701416015625, -3.165283203125, -3.0604248046875, -2.95556640625, -2.8507080078125, -2.745849609375, -2.6409912109375, -2.5361328125, -2.4312744140625, -2.326416015625, -2.2215576171875, -2.11669921875, -2.0118408203125, -1.906982421875, -1.8021240234375, -1.697265625, -1.5924072265625, -1.487548828125, -1.3826904296875, -1.27783203125, -1.1729736328125, -1.068115234375, -0.9632568359375, -0.8583984375, -0.7535400390625, -0.648681640625, -0.5438232421875, -0.43896484375, -0.3341064453125, -0.229248046875, -0.1243896484375, -0.01953125, 0.0853271484375, 0.190185546875, 0.2950439453125, 0.39990234375, 0.5047607421875, 0.609619140625, 0.7144775390625, 0.8193359375, 0.9241943359375, 1.029052734375, 1.1339111328125, 1.23876953125, 1.3436279296875, 1.448486328125, 1.5533447265625, 1.658203125, 1.7630615234375, 1.867919921875, 1.9727783203125, 2.07763671875, 2.1824951171875, 2.287353515625, 2.3922119140625, 2.4970703125, 2.6019287109375, 2.706787109375, 2.8116455078125, 2.91650390625, 3.0213623046875, 3.126220703125, 3.2310791015625, 3.3359375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 4.0, 5.0, 8.0, 9.0, 6.0, 4.0, 3.0, 13.0, 16.0, 19.0, 17.0, 16.0, 27.0, 21.0, 34.0, 30.0, 32.0, 30.0, 32.0, 39.0, 40.0, 43.0, 52.0, 33.0, 37.0, 39.0, 36.0, 35.0, 41.0, 35.0, 28.0, 30.0, 28.0, 23.0, 21.0, 24.0, 20.0, 17.0, 10.0, 15.0, 5.0, 5.0, 9.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-19.37145233154297, -18.785348892211914, -18.199243545532227, -17.613140106201172, -17.027034759521484, -16.44093132019043, -15.854826927185059, -15.268722534179688, -14.682618141174316, -14.096513748168945, -13.510409355163574, -12.924304962158203, -12.338201522827148, -11.752096176147461, -11.165992736816406, -10.579888343811035, -9.993783950805664, -9.407679557800293, -8.821575164794922, -8.23547077178955, -7.649366855621338, -7.063262462615967, -6.477158546447754, -5.891054153442383, -5.304949760437012, -4.718845367431641, -4.1327409744262695, -3.5466370582580566, -2.9605326652526855, -2.3744282722473145, -1.7883241176605225, -1.2022199630737305, -0.6161174774169922, -0.030013203620910645, 0.5560910701751709, 1.1421953439712524, 1.728299617767334, 2.314404010772705, 2.900508165359497, 3.486612319946289, 4.07271671295166, 4.658821105957031, 5.244925498962402, 5.831029415130615, 6.417133808135986, 7.003238201141357, 7.58934211730957, 8.175446510314941, 8.761550903320312, 9.347655296325684, 9.933759689331055, 10.519864082336426, 11.105968475341797, 11.692071914672852, 12.278176307678223, 12.864280700683594, 13.450385093688965, 14.036489486694336, 14.622593879699707, 15.208698272705078, 15.794801712036133, 16.38090705871582, 16.967010498046875, 17.553115844726562, 18.139219284057617]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 4.0, 3.0, 3.0, 3.0, 4.0, 11.0, 14.0, 13.0, 17.0, 13.0, 22.0, 23.0, 15.0, 25.0, 31.0, 25.0, 29.0, 31.0, 39.0, 43.0, 54.0, 39.0, 43.0, 34.0, 33.0, 40.0, 38.0, 34.0, 38.0, 26.0, 36.0, 30.0, 18.0, 31.0, 24.0, 17.0, 10.0, 15.0, 13.0, 8.0, 15.0, 11.0, 6.0, 4.0, 4.0, 7.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.518085479736328, -17.92317771911621, -17.32826805114746, -16.733360290527344, -16.138450622558594, -15.543542861938477, -14.948634147644043, -14.35372543334961, -13.758816719055176, -13.163908004760742, -12.568999290466309, -11.974090576171875, -11.379182815551758, -10.784273147583008, -10.18936538696289, -9.594456672668457, -8.999547958374023, -8.40463924407959, -7.809730529785156, -7.214822292327881, -6.619913578033447, -6.025004863739014, -5.430096626281738, -4.835187911987305, -4.240279197692871, -3.6453704833984375, -3.050462007522583, -2.4555535316467285, -1.860644817352295, -1.2657361030578613, -0.6708276271820068, -0.07591915130615234, 0.5189895629882812, 1.1138981580734253, 1.7088067531585693, 2.303715229034424, 2.8986239433288574, 3.493532657623291, 4.088440895080566, 4.683349609375, 5.278258323669434, 5.873167037963867, 6.468075752258301, 7.062983989715576, 7.65789270401001, 8.252801895141602, 8.847709655761719, 9.442618370056152, 10.037527084350586, 10.63243579864502, 11.227344512939453, 11.822253227233887, 12.41716194152832, 13.012069702148438, 13.606978416442871, 14.201887130737305, 14.796795845031738, 15.391704559326172, 15.986613273620605, 16.58152198791504, 17.176429748535156, 17.771339416503906, 18.366247177124023, 18.96115493774414, 19.55606460571289]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 9.0, 9.0, 5.0, 7.0, 18.0, 37.0, 58.0, 93.0, 154.0, 250.0, 359.0, 622.0, 896.0, 1452.0, 2230.0, 3558.0, 5665.0, 8499.0, 12962.0, 18995.0, 27319.0, 37657.0, 50852.0, 65358.0, 79088.0, 91487.0, 98748.0, 100022.0, 94893.0, 84147.0, 70648.0, 55604.0, 42006.0, 30569.0, 21305.0, 15006.0, 9967.0, 6336.0, 4236.0, 2733.0, 1697.0, 1104.0, 698.0, 443.0, 283.0, 180.0, 118.0, 76.0, 46.0, 33.0, 14.0, 5.0, 2.0, 3.0, 3.0, 3.0], "bins": [-12.890625, -12.524169921875, -12.15771484375, -11.791259765625, -11.4248046875, -11.058349609375, -10.69189453125, -10.325439453125, -9.958984375, -9.592529296875, -9.22607421875, -8.859619140625, -8.4931640625, -8.126708984375, -7.76025390625, -7.393798828125, -7.02734375, -6.660888671875, -6.29443359375, -5.927978515625, -5.5615234375, -5.195068359375, -4.82861328125, -4.462158203125, -4.095703125, -3.729248046875, -3.36279296875, -2.996337890625, -2.6298828125, -2.263427734375, -1.89697265625, -1.530517578125, -1.1640625, -0.797607421875, -0.43115234375, -0.064697265625, 0.3017578125, 0.668212890625, 1.03466796875, 1.401123046875, 1.767578125, 2.134033203125, 2.50048828125, 2.866943359375, 3.2333984375, 3.599853515625, 3.96630859375, 4.332763671875, 4.69921875, 5.065673828125, 5.43212890625, 5.798583984375, 6.1650390625, 6.531494140625, 6.89794921875, 7.264404296875, 7.630859375, 7.997314453125, 8.36376953125, 8.730224609375, 9.0966796875, 9.463134765625, 9.82958984375, 10.196044921875, 10.5625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 6.0, 6.0, 4.0, 5.0, 13.0, 15.0, 17.0, 17.0, 14.0, 17.0, 21.0, 24.0, 21.0, 33.0, 35.0, 36.0, 32.0, 40.0, 41.0, 46.0, 43.0, 52.0, 43.0, 44.0, 27.0, 46.0, 46.0, 32.0, 35.0, 19.0, 25.0, 17.0, 22.0, 17.0, 16.0, 10.0, 17.0, 9.0, 4.0, 12.0, 2.0, 7.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.15625, -20.51318359375, -19.8701171875, -19.22705078125, -18.583984375, -17.94091796875, -17.2978515625, -16.65478515625, -16.01171875, -15.36865234375, -14.7255859375, -14.08251953125, -13.439453125, -12.79638671875, -12.1533203125, -11.51025390625, -10.8671875, -10.22412109375, -9.5810546875, -8.93798828125, -8.294921875, -7.65185546875, -7.0087890625, -6.36572265625, -5.72265625, -5.07958984375, -4.4365234375, -3.79345703125, -3.150390625, -2.50732421875, -1.8642578125, -1.22119140625, -0.578125, 0.06494140625, 0.7080078125, 1.35107421875, 1.994140625, 2.63720703125, 3.2802734375, 3.92333984375, 4.56640625, 5.20947265625, 5.8525390625, 6.49560546875, 7.138671875, 7.78173828125, 8.4248046875, 9.06787109375, 9.7109375, 10.35400390625, 10.9970703125, 11.64013671875, 12.283203125, 12.92626953125, 13.5693359375, 14.21240234375, 14.85546875, 15.49853515625, 16.1416015625, 16.78466796875, 17.427734375, 18.07080078125, 18.7138671875, 19.35693359375, 20.0]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 8.0, 8.0, 12.0, 15.0, 29.0, 37.0, 77.0, 132.0, 179.0, 308.0, 478.0, 788.0, 1295.0, 2062.0, 3356.0, 5230.0, 8353.0, 13357.0, 20718.0, 30946.0, 45040.0, 62648.0, 82297.0, 100138.0, 112466.0, 115761.0, 109417.0, 92871.0, 73649.0, 55149.0, 38543.0, 26096.0, 17199.0, 11216.0, 6918.0, 4509.0, 2750.0, 1648.0, 1069.0, 673.0, 416.0, 265.0, 157.0, 99.0, 65.0, 52.0, 24.0, 22.0, 5.0, 4.0, 5.0, 3.0, 2.0], "bins": [-16.078125, -15.6351318359375, -15.192138671875, -14.7491455078125, -14.30615234375, -13.8631591796875, -13.420166015625, -12.9771728515625, -12.5341796875, -12.0911865234375, -11.648193359375, -11.2052001953125, -10.76220703125, -10.3192138671875, -9.876220703125, -9.4332275390625, -8.990234375, -8.5472412109375, -8.104248046875, -7.6612548828125, -7.21826171875, -6.7752685546875, -6.332275390625, -5.8892822265625, -5.4462890625, -5.0032958984375, -4.560302734375, -4.1173095703125, -3.67431640625, -3.2313232421875, -2.788330078125, -2.3453369140625, -1.90234375, -1.4593505859375, -1.016357421875, -0.5733642578125, -0.13037109375, 0.3126220703125, 0.755615234375, 1.1986083984375, 1.6416015625, 2.0845947265625, 2.527587890625, 2.9705810546875, 3.41357421875, 3.8565673828125, 4.299560546875, 4.7425537109375, 5.185546875, 5.6285400390625, 6.071533203125, 6.5145263671875, 6.95751953125, 7.4005126953125, 7.843505859375, 8.2864990234375, 8.7294921875, 9.1724853515625, 9.615478515625, 10.0584716796875, 10.50146484375, 10.9444580078125, 11.387451171875, 11.8304443359375, 12.2734375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 2.0, 9.0, 4.0, 8.0, 8.0, 12.0, 15.0, 15.0, 14.0, 22.0, 32.0, 19.0, 28.0, 30.0, 29.0, 33.0, 38.0, 44.0, 43.0, 35.0, 39.0, 40.0, 48.0, 33.0, 38.0, 35.0, 40.0, 25.0, 29.0, 33.0, 35.0, 29.0, 19.0, 19.0, 16.0, 18.0, 18.0, 11.0, 5.0, 8.0, 8.0, 4.0, 1.0, 3.0, 1.0, 2.0, 4.0, 0.0, 2.0, 3.0], "bins": [-14.40625, -13.9954833984375, -13.584716796875, -13.1739501953125, -12.76318359375, -12.3524169921875, -11.941650390625, -11.5308837890625, -11.1201171875, -10.7093505859375, -10.298583984375, -9.8878173828125, -9.47705078125, -9.0662841796875, -8.655517578125, -8.2447509765625, -7.833984375, -7.4232177734375, -7.012451171875, -6.6016845703125, -6.19091796875, -5.7801513671875, -5.369384765625, -4.9586181640625, -4.5478515625, -4.1370849609375, -3.726318359375, -3.3155517578125, -2.90478515625, -2.4940185546875, -2.083251953125, -1.6724853515625, -1.26171875, -0.8509521484375, -0.440185546875, -0.0294189453125, 0.38134765625, 0.7921142578125, 1.202880859375, 1.6136474609375, 2.0244140625, 2.4351806640625, 2.845947265625, 3.2567138671875, 3.66748046875, 4.0782470703125, 4.489013671875, 4.8997802734375, 5.310546875, 5.7213134765625, 6.132080078125, 6.5428466796875, 6.95361328125, 7.3643798828125, 7.775146484375, 8.1859130859375, 8.5966796875, 9.0074462890625, 9.418212890625, 9.8289794921875, 10.23974609375, 10.6505126953125, 11.061279296875, 11.4720458984375, 11.8828125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 13.0, 18.0, 25.0, 31.0, 55.0, 81.0, 113.0, 213.0, 388.0, 615.0, 950.0, 1711.0, 3022.0, 5408.0, 9319.0, 16251.0, 28101.0, 46684.0, 72907.0, 104587.0, 132440.0, 147421.0, 140793.0, 116196.0, 84468.0, 55372.0, 34389.0, 20085.0, 11506.0, 6491.0, 3749.0, 2056.0, 1265.0, 720.0, 441.0, 240.0, 154.0, 92.0, 66.0, 38.0, 29.0, 22.0, 14.0, 4.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.71484375, -6.49603271484375, -6.2772216796875, -6.05841064453125, -5.839599609375, -5.62078857421875, -5.4019775390625, -5.18316650390625, -4.96435546875, -4.74554443359375, -4.5267333984375, -4.30792236328125, -4.089111328125, -3.87030029296875, -3.6514892578125, -3.43267822265625, -3.2138671875, -2.99505615234375, -2.7762451171875, -2.55743408203125, -2.338623046875, -2.11981201171875, -1.9010009765625, -1.68218994140625, -1.46337890625, -1.24456787109375, -1.0257568359375, -0.80694580078125, -0.588134765625, -0.36932373046875, -0.1505126953125, 0.06829833984375, 0.287109375, 0.50592041015625, 0.7247314453125, 0.94354248046875, 1.162353515625, 1.38116455078125, 1.5999755859375, 1.81878662109375, 2.03759765625, 2.25640869140625, 2.4752197265625, 2.69403076171875, 2.912841796875, 3.13165283203125, 3.3504638671875, 3.56927490234375, 3.7880859375, 4.00689697265625, 4.2257080078125, 4.44451904296875, 4.663330078125, 4.88214111328125, 5.1009521484375, 5.31976318359375, 5.53857421875, 5.75738525390625, 5.9761962890625, 6.19500732421875, 6.413818359375, 6.63262939453125, 6.8514404296875, 7.07025146484375, 7.2890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 3.0, 11.0, 12.0, 6.0, 9.0, 14.0, 14.0, 21.0, 20.0, 26.0, 21.0, 26.0, 46.0, 36.0, 38.0, 48.0, 34.0, 41.0, 44.0, 45.0, 44.0, 38.0, 45.0, 41.0, 35.0, 34.0, 45.0, 21.0, 29.0, 22.0, 25.0, 25.0, 12.0, 16.0, 13.0, 10.0, 6.0, 11.0, 7.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0007143020629882812, -0.0006935968995094299, -0.0006728917360305786, -0.0006521865725517273, -0.000631481409072876, -0.0006107762455940247, -0.0005900710821151733, -0.000569365918636322, -0.0005486607551574707, -0.0005279555916786194, -0.0005072504281997681, -0.00048654526472091675, -0.00046584010124206543, -0.0004451349377632141, -0.0004244297742843628, -0.0004037246108055115, -0.00038301944732666016, -0.00036231428384780884, -0.0003416091203689575, -0.0003209039568901062, -0.0003001987934112549, -0.00027949362993240356, -0.00025878846645355225, -0.00023808330297470093, -0.0002173781394958496, -0.0001966729760169983, -0.00017596781253814697, -0.00015526264905929565, -0.00013455748558044434, -0.00011385232210159302, -9.31471586227417e-05, -7.244199514389038e-05, -5.173683166503906e-05, -3.1031668186187744e-05, -1.0326504707336426e-05, 1.0378658771514893e-05, 3.108382225036621e-05, 5.178898572921753e-05, 7.249414920806885e-05, 9.319931268692017e-05, 0.00011390447616577148, 0.0001346096396446228, 0.00015531480312347412, 0.00017601996660232544, 0.00019672513008117676, 0.00021743029356002808, 0.0002381354570388794, 0.0002588406205177307, 0.00027954578399658203, 0.00030025094747543335, 0.00032095611095428467, 0.000341661274433136, 0.0003623664379119873, 0.0003830716013908386, 0.00040377676486968994, 0.00042448192834854126, 0.0004451870918273926, 0.0004658922553062439, 0.0004865974187850952, 0.0005073025822639465, 0.0005280077457427979, 0.0005487129092216492, 0.0005694180727005005, 0.0005901232361793518, 0.0006108283996582031]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 4.0, 9.0, 24.0, 26.0, 35.0, 72.0, 112.0, 144.0, 271.0, 460.0, 712.0, 1167.0, 1907.0, 3113.0, 5311.0, 8603.0, 13405.0, 21509.0, 33518.0, 49506.0, 69459.0, 92897.0, 111757.0, 122884.0, 121686.0, 108175.0, 88043.0, 65511.0, 46097.0, 30355.0, 19739.0, 12290.0, 7670.0, 4709.0, 2887.0, 1734.0, 1037.0, 662.0, 380.0, 270.0, 146.0, 102.0, 62.0, 24.0, 25.0, 23.0, 11.0, 8.0, 1.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.6953125, -5.510986328125, -5.32666015625, -5.142333984375, -4.9580078125, -4.773681640625, -4.58935546875, -4.405029296875, -4.220703125, -4.036376953125, -3.85205078125, -3.667724609375, -3.4833984375, -3.299072265625, -3.11474609375, -2.930419921875, -2.74609375, -2.561767578125, -2.37744140625, -2.193115234375, -2.0087890625, -1.824462890625, -1.64013671875, -1.455810546875, -1.271484375, -1.087158203125, -0.90283203125, -0.718505859375, -0.5341796875, -0.349853515625, -0.16552734375, 0.018798828125, 0.203125, 0.387451171875, 0.57177734375, 0.756103515625, 0.9404296875, 1.124755859375, 1.30908203125, 1.493408203125, 1.677734375, 1.862060546875, 2.04638671875, 2.230712890625, 2.4150390625, 2.599365234375, 2.78369140625, 2.968017578125, 3.15234375, 3.336669921875, 3.52099609375, 3.705322265625, 3.8896484375, 4.073974609375, 4.25830078125, 4.442626953125, 4.626953125, 4.811279296875, 4.99560546875, 5.179931640625, 5.3642578125, 5.548583984375, 5.73291015625, 5.917236328125, 6.1015625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 6.0, 4.0, 21.0, 17.0, 27.0, 15.0, 21.0, 36.0, 40.0, 44.0, 52.0, 50.0, 58.0, 57.0, 56.0, 70.0, 66.0, 46.0, 45.0, 40.0, 47.0, 26.0, 30.0, 26.0, 22.0, 16.0, 17.0, 9.0, 11.0, 7.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.810546875, -2.70953369140625, -2.6085205078125, -2.50750732421875, -2.406494140625, -2.30548095703125, -2.2044677734375, -2.10345458984375, -2.00244140625, -1.90142822265625, -1.8004150390625, -1.69940185546875, -1.598388671875, -1.49737548828125, -1.3963623046875, -1.29534912109375, -1.1943359375, -1.09332275390625, -0.9923095703125, -0.89129638671875, -0.790283203125, -0.68927001953125, -0.5882568359375, -0.48724365234375, -0.38623046875, -0.28521728515625, -0.1842041015625, -0.08319091796875, 0.017822265625, 0.11883544921875, 0.2198486328125, 0.32086181640625, 0.421875, 0.52288818359375, 0.6239013671875, 0.72491455078125, 0.825927734375, 0.92694091796875, 1.0279541015625, 1.12896728515625, 1.22998046875, 1.33099365234375, 1.4320068359375, 1.53302001953125, 1.634033203125, 1.73504638671875, 1.8360595703125, 1.93707275390625, 2.0380859375, 2.13909912109375, 2.2401123046875, 2.34112548828125, 2.442138671875, 2.54315185546875, 2.6441650390625, 2.74517822265625, 2.84619140625, 2.94720458984375, 3.0482177734375, 3.14923095703125, 3.250244140625, 3.35125732421875, 3.4522705078125, 3.55328369140625, 3.654296875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 6.0, 8.0, 7.0, 3.0, 10.0, 9.0, 11.0, 13.0, 15.0, 21.0, 21.0, 33.0, 30.0, 36.0, 46.0, 36.0, 41.0, 45.0, 44.0, 46.0, 46.0, 43.0, 42.0, 41.0, 40.0, 42.0, 35.0, 41.0, 27.0, 28.0, 27.0, 22.0, 20.0, 10.0, 17.0, 13.0, 7.0, 3.0, 6.0, 3.0, 3.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.684804916381836, -20.044353485107422, -19.40390396118164, -18.763452529907227, -18.123001098632812, -17.48255157470703, -16.842100143432617, -16.201648712158203, -15.561198234558105, -14.920747756958008, -14.280296325683594, -13.639845848083496, -12.999395370483398, -12.358943939208984, -11.718493461608887, -11.078042984008789, -10.437591552734375, -9.797141075134277, -9.156689643859863, -8.516239166259766, -7.87578821182251, -7.235337257385254, -6.594886779785156, -5.9544358253479, -5.3139848709106445, -4.673533916473389, -4.033082962036133, -3.392632484436035, -2.7521815299987793, -2.1117305755615234, -1.4712798595428467, -0.8308291435241699, -0.19037818908691406, 0.45007264614105225, 1.0905234813690186, 1.7309743165969849, 2.371425151824951, 3.011876106262207, 3.652326822280884, 4.2927775382995605, 4.933228492736816, 5.573679447174072, 6.214130401611328, 6.854580879211426, 7.495031833648682, 8.135482788085938, 8.775933265686035, 9.416383743286133, 10.056835174560547, 10.697285652160645, 11.337737083435059, 11.978187561035156, 12.61863899230957, 13.259089469909668, 13.899539947509766, 14.53999137878418, 15.180441856384277, 15.820892333984375, 16.46134376525879, 17.101795196533203, 17.742244720458984, 18.3826961517334, 19.023147583007812, 19.663597106933594, 20.304048538208008]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 6.0, 6.0, 1.0, 6.0, 2.0, 12.0, 7.0, 10.0, 4.0, 12.0, 12.0, 18.0, 27.0, 16.0, 23.0, 17.0, 36.0, 35.0, 27.0, 26.0, 24.0, 33.0, 32.0, 30.0, 35.0, 34.0, 39.0, 42.0, 36.0, 40.0, 34.0, 27.0, 22.0, 32.0, 25.0, 20.0, 21.0, 18.0, 23.0, 18.0, 24.0, 9.0, 11.0, 14.0, 13.0, 9.0, 4.0, 8.0, 12.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 4.0, 3.0], "bins": [-18.1922550201416, -17.644514083862305, -17.096773147583008, -16.549034118652344, -16.001293182373047, -15.45355224609375, -14.905811309814453, -14.358071327209473, -13.810331344604492, -13.262590408325195, -12.714850425720215, -12.167109489440918, -11.619369506835938, -11.07162857055664, -10.523887634277344, -9.976147651672363, -9.428406715393066, -8.88066577911377, -8.332925796508789, -7.785184860229492, -7.237444877624512, -6.689703941345215, -6.141963481903076, -5.5942230224609375, -5.046482563018799, -4.49874210357666, -3.9510016441345215, -3.4032609462738037, -2.855520486831665, -2.3077800273895264, -1.7600393295288086, -1.21229887008667, -0.6645584106445312, -0.1168178915977478, 0.43092262744903564, 0.9786632061004639, 1.5264036655426025, 2.074144124984741, 2.621884822845459, 3.1696252822875977, 3.7173657417297363, 4.265106201171875, 4.812846660614014, 5.360587120056152, 5.908328056335449, 6.45606803894043, 7.003808975219727, 7.551549434661865, 8.099289894104004, 8.6470308303833, 9.194770812988281, 9.742511749267578, 10.290251731872559, 10.837992668151855, 11.385732650756836, 11.933473587036133, 12.48121452331543, 13.028955459594727, 13.576695442199707, 14.124436378479004, 14.672176361083984, 15.219917297363281, 15.767658233642578, 16.315399169921875, 16.86313819885254]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [5.0, 3.0, 6.0, 3.0, 7.0, 12.0, 21.0, 31.0, 42.0, 42.0, 75.0, 134.0, 176.0, 300.0, 454.0, 605.0, 1071.0, 1754.0, 2932.0, 4875.0, 8463.0, 14297.0, 24930.0, 44612.0, 81004.0, 146377.0, 257791.0, 424279.0, 608296.0, 709087.0, 654612.0, 488808.0, 310605.0, 179712.0, 100695.0, 55392.0, 30786.0, 17541.0, 10132.0, 5765.0, 3273.0, 2025.0, 1301.0, 694.0, 455.0, 277.0, 174.0, 130.0, 71.0, 49.0, 33.0, 22.0, 22.0, 14.0, 10.0, 8.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-16.25, -15.702392578125, -15.15478515625, -14.607177734375, -14.0595703125, -13.511962890625, -12.96435546875, -12.416748046875, -11.869140625, -11.321533203125, -10.77392578125, -10.226318359375, -9.6787109375, -9.131103515625, -8.58349609375, -8.035888671875, -7.48828125, -6.940673828125, -6.39306640625, -5.845458984375, -5.2978515625, -4.750244140625, -4.20263671875, -3.655029296875, -3.107421875, -2.559814453125, -2.01220703125, -1.464599609375, -0.9169921875, -0.369384765625, 0.17822265625, 0.725830078125, 1.2734375, 1.821044921875, 2.36865234375, 2.916259765625, 3.4638671875, 4.011474609375, 4.55908203125, 5.106689453125, 5.654296875, 6.201904296875, 6.74951171875, 7.297119140625, 7.8447265625, 8.392333984375, 8.93994140625, 9.487548828125, 10.03515625, 10.582763671875, 11.13037109375, 11.677978515625, 12.2255859375, 12.773193359375, 13.32080078125, 13.868408203125, 14.416015625, 14.963623046875, 15.51123046875, 16.058837890625, 16.6064453125, 17.154052734375, 17.70166015625, 18.249267578125, 18.796875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 9.0, 4.0, 9.0, 6.0, 8.0, 6.0, 6.0, 10.0, 7.0, 15.0, 16.0, 9.0, 20.0, 18.0, 20.0, 27.0, 39.0, 24.0, 27.0, 31.0, 40.0, 30.0, 36.0, 33.0, 29.0, 39.0, 35.0, 37.0, 29.0, 39.0, 25.0, 29.0, 36.0, 21.0, 33.0, 23.0, 24.0, 14.0, 19.0, 16.0, 21.0, 11.0, 15.0, 9.0, 5.0, 15.0, 5.0, 5.0, 8.0, 1.0, 3.0, 2.0, 5.0, 4.0, 1.0, 1.0, 1.0], "bins": [-15.1796875, -14.712158203125, -14.24462890625, -13.777099609375, -13.3095703125, -12.842041015625, -12.37451171875, -11.906982421875, -11.439453125, -10.971923828125, -10.50439453125, -10.036865234375, -9.5693359375, -9.101806640625, -8.63427734375, -8.166748046875, -7.69921875, -7.231689453125, -6.76416015625, -6.296630859375, -5.8291015625, -5.361572265625, -4.89404296875, -4.426513671875, -3.958984375, -3.491455078125, -3.02392578125, -2.556396484375, -2.0888671875, -1.621337890625, -1.15380859375, -0.686279296875, -0.21875, 0.248779296875, 0.71630859375, 1.183837890625, 1.6513671875, 2.118896484375, 2.58642578125, 3.053955078125, 3.521484375, 3.989013671875, 4.45654296875, 4.924072265625, 5.3916015625, 5.859130859375, 6.32666015625, 6.794189453125, 7.26171875, 7.729248046875, 8.19677734375, 8.664306640625, 9.1318359375, 9.599365234375, 10.06689453125, 10.534423828125, 11.001953125, 11.469482421875, 11.93701171875, 12.404541015625, 12.8720703125, 13.339599609375, 13.80712890625, 14.274658203125, 14.7421875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 9.0, 6.0, 7.0, 19.0, 25.0, 25.0, 55.0, 77.0, 128.0, 208.0, 360.0, 526.0, 991.0, 1551.0, 2611.0, 4601.0, 8057.0, 13929.0, 24518.0, 42949.0, 75780.0, 130674.0, 219840.0, 351080.0, 510467.0, 638458.0, 652883.0, 541545.0, 384106.0, 244037.0, 146687.0, 84562.0, 48585.0, 27630.0, 15597.0, 8944.0, 5064.0, 3035.0, 1803.0, 1060.0, 675.0, 431.0, 279.0, 155.0, 101.0, 66.0, 35.0, 17.0, 12.0, 10.0, 9.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.125, -17.52294921875, -16.9208984375, -16.31884765625, -15.716796875, -15.11474609375, -14.5126953125, -13.91064453125, -13.30859375, -12.70654296875, -12.1044921875, -11.50244140625, -10.900390625, -10.29833984375, -9.6962890625, -9.09423828125, -8.4921875, -7.89013671875, -7.2880859375, -6.68603515625, -6.083984375, -5.48193359375, -4.8798828125, -4.27783203125, -3.67578125, -3.07373046875, -2.4716796875, -1.86962890625, -1.267578125, -0.66552734375, -0.0634765625, 0.53857421875, 1.140625, 1.74267578125, 2.3447265625, 2.94677734375, 3.548828125, 4.15087890625, 4.7529296875, 5.35498046875, 5.95703125, 6.55908203125, 7.1611328125, 7.76318359375, 8.365234375, 8.96728515625, 9.5693359375, 10.17138671875, 10.7734375, 11.37548828125, 11.9775390625, 12.57958984375, 13.181640625, 13.78369140625, 14.3857421875, 14.98779296875, 15.58984375, 16.19189453125, 16.7939453125, 17.39599609375, 17.998046875, 18.60009765625, 19.2021484375, 19.80419921875, 20.40625]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 4.0, 3.0, 2.0, 8.0, 11.0, 22.0, 24.0, 25.0, 34.0, 28.0, 43.0, 54.0, 65.0, 82.0, 101.0, 126.0, 158.0, 159.0, 171.0, 199.0, 200.0, 212.0, 224.0, 229.0, 214.0, 221.0, 204.0, 189.0, 168.0, 172.0, 121.0, 120.0, 93.0, 78.0, 66.0, 61.0, 53.0, 30.0, 20.0, 22.0, 13.0, 14.0, 7.0, 6.0, 8.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-7.8046875, -7.56939697265625, -7.3341064453125, -7.09881591796875, -6.863525390625, -6.62823486328125, -6.3929443359375, -6.15765380859375, -5.92236328125, -5.68707275390625, -5.4517822265625, -5.21649169921875, -4.981201171875, -4.74591064453125, -4.5106201171875, -4.27532958984375, -4.0400390625, -3.80474853515625, -3.5694580078125, -3.33416748046875, -3.098876953125, -2.86358642578125, -2.6282958984375, -2.39300537109375, -2.15771484375, -1.92242431640625, -1.6871337890625, -1.45184326171875, -1.216552734375, -0.98126220703125, -0.7459716796875, -0.51068115234375, -0.275390625, -0.04010009765625, 0.1951904296875, 0.43048095703125, 0.665771484375, 0.90106201171875, 1.1363525390625, 1.37164306640625, 1.60693359375, 1.84222412109375, 2.0775146484375, 2.31280517578125, 2.548095703125, 2.78338623046875, 3.0186767578125, 3.25396728515625, 3.4892578125, 3.72454833984375, 3.9598388671875, 4.19512939453125, 4.430419921875, 4.66571044921875, 4.9010009765625, 5.13629150390625, 5.37158203125, 5.60687255859375, 5.8421630859375, 6.07745361328125, 6.312744140625, 6.54803466796875, 6.7833251953125, 7.01861572265625, 7.25390625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 5.0, 5.0, 3.0, 8.0, 9.0, 12.0, 12.0, 16.0, 19.0, 27.0, 20.0, 31.0, 25.0, 41.0, 41.0, 34.0, 45.0, 35.0, 49.0, 48.0, 47.0, 45.0, 35.0, 38.0, 41.0, 42.0, 43.0, 34.0, 45.0, 22.0, 17.0, 21.0, 10.0, 12.0, 10.0, 11.0, 7.0, 9.0, 8.0, 6.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.348783493041992, -18.72844123840332, -18.10809898376465, -17.487756729125977, -16.867414474487305, -16.247074127197266, -15.626730918884277, -15.006389617919922, -14.38604736328125, -13.765705108642578, -13.145362854003906, -12.525020599365234, -11.904679298400879, -11.284337043762207, -10.663994789123535, -10.04365348815918, -9.423310279846191, -8.80296802520752, -8.182625770568848, -7.562283992767334, -6.94194221496582, -6.321599960327148, -5.701257705688477, -5.080915927886963, -4.460573673248291, -3.8402316570281982, -3.2198896408081055, -2.5995473861694336, -1.9792053699493408, -1.358863353729248, -0.7385210990905762, -0.1181793212890625, 0.5021629333496094, 1.1225049495697021, 1.7428470849990845, 2.363189220428467, 2.9835312366485596, 3.6038732528686523, 4.224215507507324, 4.844557285308838, 5.46489953994751, 6.085241794586182, 6.705583572387695, 7.325925827026367, 7.946268081665039, 8.566610336303711, 9.186952590942383, 9.807293891906738, 10.42763614654541, 11.047978401184082, 11.668320655822754, 12.28866195678711, 12.909004211425781, 13.529346466064453, 14.149688720703125, 14.770030975341797, 15.390373229980469, 16.01071548461914, 16.631057739257812, 17.251399993896484, 17.871742248535156, 18.492084503173828, 19.1124267578125, 19.73276710510254, 20.35310935974121]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 4.0, 5.0, 9.0, 7.0, 10.0, 17.0, 14.0, 16.0, 21.0, 29.0, 22.0, 27.0, 18.0, 22.0, 39.0, 38.0, 34.0, 39.0, 28.0, 35.0, 45.0, 48.0, 29.0, 36.0, 37.0, 28.0, 32.0, 33.0, 29.0, 30.0, 25.0, 18.0, 25.0, 15.0, 25.0, 14.0, 13.0, 20.0, 13.0, 6.0, 8.0, 6.0, 12.0, 5.0, 2.0, 4.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-18.243106842041016, -17.684803009033203, -17.126497268676758, -16.568193435668945, -16.0098876953125, -15.451583862304688, -14.893280029296875, -14.334975242614746, -13.776670455932617, -13.218365669250488, -12.66006088256836, -12.101757049560547, -11.543452262878418, -10.985147476196289, -10.426843643188477, -9.868538856506348, -9.310234069824219, -8.75192928314209, -8.193624496459961, -7.635320663452148, -7.0770158767700195, -6.518711090087891, -5.96040678024292, -5.402102470397949, -4.84379768371582, -4.285492897033691, -3.7271885871887207, -3.168884038925171, -2.610579490661621, -2.0522749423980713, -1.4939703941345215, -0.9356658458709717, -0.3773632049560547, 0.18094134330749512, 0.7392458915710449, 1.2975504398345947, 1.8558549880981445, 2.4141595363616943, 2.972464084625244, 3.530768632888794, 4.089073181152344, 4.647377967834473, 5.205682277679443, 5.763986587524414, 6.322291374206543, 6.880596160888672, 7.438900470733643, 7.997204780578613, 8.555509567260742, 9.113814353942871, 9.672119140625, 10.230422973632812, 10.788727760314941, 11.34703254699707, 11.905336380004883, 12.463641166687012, 13.02194595336914, 13.58025074005127, 14.138555526733398, 14.696859359741211, 15.25516414642334, 15.813468933105469, 16.37177276611328, 16.930078506469727, 17.48838233947754]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 7.0, 6.0, 8.0, 10.0, 25.0, 36.0, 52.0, 78.0, 120.0, 215.0, 270.0, 399.0, 644.0, 992.0, 1527.0, 2510.0, 3855.0, 6334.0, 9978.0, 15828.0, 24411.0, 36783.0, 54774.0, 76475.0, 99715.0, 119583.0, 126929.0, 120479.0, 102054.0, 78598.0, 56756.0, 38787.0, 25580.0, 16264.0, 10288.0, 6728.0, 4170.0, 2596.0, 1665.0, 1054.0, 663.0, 434.0, 303.0, 198.0, 130.0, 84.0, 63.0, 42.0, 26.0, 14.0, 5.0, 5.0, 5.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-10.0390625, -9.6993408203125, -9.359619140625, -9.0198974609375, -8.68017578125, -8.3404541015625, -8.000732421875, -7.6610107421875, -7.3212890625, -6.9815673828125, -6.641845703125, -6.3021240234375, -5.96240234375, -5.6226806640625, -5.282958984375, -4.9432373046875, -4.603515625, -4.2637939453125, -3.924072265625, -3.5843505859375, -3.24462890625, -2.9049072265625, -2.565185546875, -2.2254638671875, -1.8857421875, -1.5460205078125, -1.206298828125, -0.8665771484375, -0.52685546875, -0.1871337890625, 0.152587890625, 0.4923095703125, 0.83203125, 1.1717529296875, 1.511474609375, 1.8511962890625, 2.19091796875, 2.5306396484375, 2.870361328125, 3.2100830078125, 3.5498046875, 3.8895263671875, 4.229248046875, 4.5689697265625, 4.90869140625, 5.2484130859375, 5.588134765625, 5.9278564453125, 6.267578125, 6.6072998046875, 6.947021484375, 7.2867431640625, 7.62646484375, 7.9661865234375, 8.305908203125, 8.6456298828125, 8.9853515625, 9.3250732421875, 9.664794921875, 10.0045166015625, 10.34423828125, 10.6839599609375, 11.023681640625, 11.3634033203125, 11.703125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 12.0, 4.0, 6.0, 9.0, 19.0, 22.0, 19.0, 16.0, 29.0, 27.0, 24.0, 30.0, 36.0, 34.0, 38.0, 40.0, 29.0, 41.0, 32.0, 44.0, 38.0, 41.0, 35.0, 32.0, 24.0, 26.0, 31.0, 28.0, 27.0, 21.0, 25.0, 16.0, 22.0, 12.0, 18.0, 14.0, 16.0, 11.0, 12.0, 6.0, 11.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-19.046875, -18.4677734375, -17.888671875, -17.3095703125, -16.73046875, -16.1513671875, -15.572265625, -14.9931640625, -14.4140625, -13.8349609375, -13.255859375, -12.6767578125, -12.09765625, -11.5185546875, -10.939453125, -10.3603515625, -9.78125, -9.2021484375, -8.623046875, -8.0439453125, -7.46484375, -6.8857421875, -6.306640625, -5.7275390625, -5.1484375, -4.5693359375, -3.990234375, -3.4111328125, -2.83203125, -2.2529296875, -1.673828125, -1.0947265625, -0.515625, 0.0634765625, 0.642578125, 1.2216796875, 1.80078125, 2.3798828125, 2.958984375, 3.5380859375, 4.1171875, 4.6962890625, 5.275390625, 5.8544921875, 6.43359375, 7.0126953125, 7.591796875, 8.1708984375, 8.75, 9.3291015625, 9.908203125, 10.4873046875, 11.06640625, 11.6455078125, 12.224609375, 12.8037109375, 13.3828125, 13.9619140625, 14.541015625, 15.1201171875, 15.69921875, 16.2783203125, 16.857421875, 17.4365234375, 18.015625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 8.0, 8.0, 19.0, 24.0, 38.0, 55.0, 68.0, 98.0, 163.0, 270.0, 380.0, 652.0, 1200.0, 1896.0, 3379.0, 6312.0, 11527.0, 21728.0, 41422.0, 77417.0, 135917.0, 199172.0, 207410.0, 150265.0, 87673.0, 47248.0, 24755.0, 12941.0, 7103.0, 3864.0, 2234.0, 1253.0, 768.0, 473.0, 274.0, 179.0, 139.0, 73.0, 46.0, 40.0, 20.0, 19.0, 6.0, 9.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-22.40625, -21.749267578125, -21.09228515625, -20.435302734375, -19.7783203125, -19.121337890625, -18.46435546875, -17.807373046875, -17.150390625, -16.493408203125, -15.83642578125, -15.179443359375, -14.5224609375, -13.865478515625, -13.20849609375, -12.551513671875, -11.89453125, -11.237548828125, -10.58056640625, -9.923583984375, -9.2666015625, -8.609619140625, -7.95263671875, -7.295654296875, -6.638671875, -5.981689453125, -5.32470703125, -4.667724609375, -4.0107421875, -3.353759765625, -2.69677734375, -2.039794921875, -1.3828125, -0.725830078125, -0.06884765625, 0.588134765625, 1.2451171875, 1.902099609375, 2.55908203125, 3.216064453125, 3.873046875, 4.530029296875, 5.18701171875, 5.843994140625, 6.5009765625, 7.157958984375, 7.81494140625, 8.471923828125, 9.12890625, 9.785888671875, 10.44287109375, 11.099853515625, 11.7568359375, 12.413818359375, 13.07080078125, 13.727783203125, 14.384765625, 15.041748046875, 15.69873046875, 16.355712890625, 17.0126953125, 17.669677734375, 18.32666015625, 18.983642578125, 19.640625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 8.0, 5.0, 5.0, 7.0, 14.0, 17.0, 21.0, 24.0, 24.0, 35.0, 24.0, 33.0, 27.0, 40.0, 32.0, 37.0, 52.0, 39.0, 40.0, 41.0, 59.0, 42.0, 44.0, 39.0, 45.0, 34.0, 36.0, 22.0, 27.0, 35.0, 23.0, 13.0, 11.0, 4.0, 13.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9296875, -12.4833984375, -12.037109375, -11.5908203125, -11.14453125, -10.6982421875, -10.251953125, -9.8056640625, -9.359375, -8.9130859375, -8.466796875, -8.0205078125, -7.57421875, -7.1279296875, -6.681640625, -6.2353515625, -5.7890625, -5.3427734375, -4.896484375, -4.4501953125, -4.00390625, -3.5576171875, -3.111328125, -2.6650390625, -2.21875, -1.7724609375, -1.326171875, -0.8798828125, -0.43359375, 0.0126953125, 0.458984375, 0.9052734375, 1.3515625, 1.7978515625, 2.244140625, 2.6904296875, 3.13671875, 3.5830078125, 4.029296875, 4.4755859375, 4.921875, 5.3681640625, 5.814453125, 6.2607421875, 6.70703125, 7.1533203125, 7.599609375, 8.0458984375, 8.4921875, 8.9384765625, 9.384765625, 9.8310546875, 10.27734375, 10.7236328125, 11.169921875, 11.6162109375, 12.0625, 12.5087890625, 12.955078125, 13.4013671875, 13.84765625, 14.2939453125, 14.740234375, 15.1865234375, 15.6328125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 9.0, 6.0, 9.0, 13.0, 32.0, 31.0, 49.0, 88.0, 117.0, 188.0, 256.0, 371.0, 514.0, 756.0, 1131.0, 1735.0, 2682.0, 4214.0, 6791.0, 11057.0, 18085.0, 30351.0, 51383.0, 84966.0, 131749.0, 175347.0, 175052.0, 133830.0, 85964.0, 51801.0, 30699.0, 18409.0, 11279.0, 6829.0, 4318.0, 2855.0, 1783.0, 1211.0, 807.0, 580.0, 389.0, 243.0, 174.0, 130.0, 67.0, 72.0, 54.0, 35.0, 15.0, 7.0, 10.0, 5.0, 2.0, 6.0, 2.0, 1.0, 3.0, 2.0], "bins": [-8.015625, -7.7652587890625, -7.514892578125, -7.2645263671875, -7.01416015625, -6.7637939453125, -6.513427734375, -6.2630615234375, -6.0126953125, -5.7623291015625, -5.511962890625, -5.2615966796875, -5.01123046875, -4.7608642578125, -4.510498046875, -4.2601318359375, -4.009765625, -3.7593994140625, -3.509033203125, -3.2586669921875, -3.00830078125, -2.7579345703125, -2.507568359375, -2.2572021484375, -2.0068359375, -1.7564697265625, -1.506103515625, -1.2557373046875, -1.00537109375, -0.7550048828125, -0.504638671875, -0.2542724609375, -0.00390625, 0.2464599609375, 0.496826171875, 0.7471923828125, 0.99755859375, 1.2479248046875, 1.498291015625, 1.7486572265625, 1.9990234375, 2.2493896484375, 2.499755859375, 2.7501220703125, 3.00048828125, 3.2508544921875, 3.501220703125, 3.7515869140625, 4.001953125, 4.2523193359375, 4.502685546875, 4.7530517578125, 5.00341796875, 5.2537841796875, 5.504150390625, 5.7545166015625, 6.0048828125, 6.2552490234375, 6.505615234375, 6.7559814453125, 7.00634765625, 7.2567138671875, 7.507080078125, 7.7574462890625, 8.0078125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 4.0, 14.0, 16.0, 29.0, 25.0, 21.0, 52.0, 50.0, 66.0, 84.0, 91.0, 79.0, 76.0, 69.0, 68.0, 63.0, 43.0, 29.0, 27.0, 24.0, 13.0, 12.0, 10.0, 9.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005860328674316406, -0.0005631521344184875, -0.0005402714014053345, -0.0005173906683921814, -0.0004945099353790283, -0.00047162920236587524, -0.00044874846935272217, -0.0004258677363395691, -0.000402987003326416, -0.00038010627031326294, -0.00035722553730010986, -0.0003343448042869568, -0.0003114640712738037, -0.00028858333826065063, -0.00026570260524749756, -0.00024282187223434448, -0.0002199411392211914, -0.00019706040620803833, -0.00017417967319488525, -0.00015129894018173218, -0.0001284182071685791, -0.00010553747415542603, -8.265674114227295e-05, -5.977600812911987e-05, -3.68952751159668e-05, -1.401454210281372e-05, 8.866190910339355e-06, 3.174692392349243e-05, 5.462765693664551e-05, 7.750838994979858e-05, 0.00010038912296295166, 0.00012326985597610474, 0.0001461505889892578, 0.0001690313220024109, 0.00019191205501556396, 0.00021479278802871704, 0.00023767352104187012, 0.0002605542540550232, 0.00028343498706817627, 0.00030631572008132935, 0.0003291964530944824, 0.0003520771861076355, 0.0003749579191207886, 0.00039783865213394165, 0.0004207193851470947, 0.0004436001181602478, 0.0004664808511734009, 0.000489361584186554, 0.000512242317199707, 0.0005351230502128601, 0.0005580037832260132, 0.0005808845162391663, 0.0006037652492523193, 0.0006266459822654724, 0.0006495267152786255, 0.0006724074482917786, 0.0006952881813049316, 0.0007181689143180847, 0.0007410496473312378, 0.0007639303803443909, 0.0007868111133575439, 0.000809691846370697, 0.0008325725793838501, 0.0008554533123970032, 0.0008783340454101562]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 6.0, 5.0, 6.0, 12.0, 19.0, 34.0, 47.0, 69.0, 92.0, 162.0, 198.0, 281.0, 463.0, 694.0, 1036.0, 1655.0, 2579.0, 3967.0, 5947.0, 9320.0, 14539.0, 22579.0, 34524.0, 52966.0, 76847.0, 106097.0, 131333.0, 140475.0, 127398.0, 101021.0, 73010.0, 49359.0, 32525.0, 20972.0, 13681.0, 8512.0, 5376.0, 3635.0, 2376.0, 1623.0, 1106.0, 688.0, 384.0, 283.0, 217.0, 149.0, 86.0, 71.0, 40.0, 39.0, 20.0, 15.0, 6.0, 6.0, 6.0, 5.0, 6.0, 1.0, 0.0, 1.0], "bins": [-7.609375, -7.3671875, -7.125, -6.8828125, -6.640625, -6.3984375, -6.15625, -5.9140625, -5.671875, -5.4296875, -5.1875, -4.9453125, -4.703125, -4.4609375, -4.21875, -3.9765625, -3.734375, -3.4921875, -3.25, -3.0078125, -2.765625, -2.5234375, -2.28125, -2.0390625, -1.796875, -1.5546875, -1.3125, -1.0703125, -0.828125, -0.5859375, -0.34375, -0.1015625, 0.140625, 0.3828125, 0.625, 0.8671875, 1.109375, 1.3515625, 1.59375, 1.8359375, 2.078125, 2.3203125, 2.5625, 2.8046875, 3.046875, 3.2890625, 3.53125, 3.7734375, 4.015625, 4.2578125, 4.5, 4.7421875, 4.984375, 5.2265625, 5.46875, 5.7109375, 5.953125, 6.1953125, 6.4375, 6.6796875, 6.921875, 7.1640625, 7.40625, 7.6484375, 7.890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 7.0, 8.0, 5.0, 13.0, 13.0, 16.0, 25.0, 24.0, 27.0, 32.0, 46.0, 57.0, 54.0, 49.0, 69.0, 58.0, 64.0, 55.0, 48.0, 56.0, 44.0, 44.0, 26.0, 19.0, 21.0, 21.0, 18.0, 15.0, 13.0, 11.0, 6.0, 5.0, 8.0, 3.0, 6.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.4765625, -4.348785400390625, -4.22100830078125, -4.093231201171875, -3.9654541015625, -3.837677001953125, -3.70989990234375, -3.582122802734375, -3.454345703125, -3.326568603515625, -3.19879150390625, -3.071014404296875, -2.9432373046875, -2.815460205078125, -2.68768310546875, -2.559906005859375, -2.43212890625, -2.304351806640625, -2.17657470703125, -2.048797607421875, -1.9210205078125, -1.793243408203125, -1.66546630859375, -1.537689208984375, -1.409912109375, -1.282135009765625, -1.15435791015625, -1.026580810546875, -0.8988037109375, -0.771026611328125, -0.64324951171875, -0.515472412109375, -0.3876953125, -0.259918212890625, -0.13214111328125, -0.004364013671875, 0.1234130859375, 0.251190185546875, 0.37896728515625, 0.506744384765625, 0.634521484375, 0.762298583984375, 0.89007568359375, 1.017852783203125, 1.1456298828125, 1.273406982421875, 1.40118408203125, 1.528961181640625, 1.65673828125, 1.784515380859375, 1.91229248046875, 2.040069580078125, 2.1678466796875, 2.295623779296875, 2.42340087890625, 2.551177978515625, 2.678955078125, 2.806732177734375, 2.93450927734375, 3.062286376953125, 3.1900634765625, 3.317840576171875, 3.44561767578125, 3.573394775390625, 3.701171875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 6.0, 4.0, 4.0, 9.0, 9.0, 13.0, 11.0, 13.0, 15.0, 19.0, 22.0, 33.0, 38.0, 28.0, 46.0, 38.0, 39.0, 46.0, 41.0, 53.0, 46.0, 40.0, 45.0, 47.0, 41.0, 51.0, 24.0, 35.0, 28.0, 28.0, 23.0, 10.0, 20.0, 12.0, 7.0, 11.0, 10.0, 11.0, 10.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-19.86770248413086, -19.252059936523438, -18.636415481567383, -18.02077293395996, -17.40513038635254, -16.789485931396484, -16.173843383789062, -15.55820083618164, -14.942557334899902, -14.326913833618164, -13.711271286010742, -13.095627784729004, -12.479984283447266, -11.864341735839844, -11.248698234558105, -10.633054733276367, -10.017412185668945, -9.401768684387207, -8.786126136779785, -8.170482635498047, -7.554839611053467, -6.939196586608887, -6.323553085327148, -5.707910060882568, -5.092267036437988, -4.476624011993408, -3.860980749130249, -3.24533748626709, -2.6296944618225098, -2.0140514373779297, -1.3984081745147705, -0.7827649116516113, -0.16712379455566406, 0.44851934909820557, 1.0641624927520752, 1.6798056364059448, 2.2954487800598145, 2.9110918045043945, 3.5267350673675537, 4.142378330230713, 4.758021354675293, 5.373664379119873, 5.989307403564453, 6.604950904846191, 7.2205939292907715, 7.836236953735352, 8.45188045501709, 9.067523956298828, 9.68316650390625, 10.298810005187988, 10.91445255279541, 11.530096054077148, 12.14573860168457, 12.761382102966309, 13.377025604248047, 13.992668151855469, 14.608311653137207, 15.223955154418945, 15.839597702026367, 16.45524024963379, 17.070884704589844, 17.686527252197266, 18.302169799804688, 18.917814254760742, 19.533456802368164]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 3.0, 7.0, 5.0, 14.0, 17.0, 14.0, 14.0, 11.0, 17.0, 29.0, 24.0, 26.0, 25.0, 20.0, 37.0, 31.0, 44.0, 32.0, 31.0, 42.0, 37.0, 41.0, 37.0, 33.0, 34.0, 33.0, 29.0, 25.0, 32.0, 30.0, 23.0, 19.0, 22.0, 18.0, 21.0, 13.0, 20.0, 15.0, 12.0, 11.0, 9.0, 14.0, 5.0, 7.0, 1.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-17.9410343170166, -17.404281616210938, -16.867530822753906, -16.330778121948242, -15.794025421142578, -15.25727367401123, -14.720521926879883, -14.183769226074219, -13.647016525268555, -13.110264778137207, -12.573512077331543, -12.036760330200195, -11.500007629394531, -10.963255882263184, -10.426504135131836, -9.889751434326172, -9.352999687194824, -8.816247940063477, -8.279495239257812, -7.742743492126465, -7.205990791320801, -6.669239044189453, -6.132486820220947, -5.595734596252441, -5.0589823722839355, -4.52223014831543, -3.985477924346924, -3.448725938796997, -2.911973714828491, -2.3752214908599854, -1.8384695053100586, -1.3017172813415527, -0.7649650573730469, -0.2282128930091858, 0.3085392713546753, 0.8452913761138916, 1.3820436000823975, 1.9187958240509033, 2.45554780960083, 2.992300033569336, 3.529052257537842, 4.065804481506348, 4.6025567054748535, 5.139308929443359, 5.676060676574707, 6.212813377380371, 6.749565124511719, 7.286317348480225, 7.8230695724487305, 8.359821319580078, 8.896574020385742, 9.43332576751709, 9.970078468322754, 10.506830215454102, 11.043582916259766, 11.580334663391113, 12.117086410522461, 12.653838157653809, 13.190590858459473, 13.72734260559082, 14.264095306396484, 14.800847053527832, 15.33759880065918, 15.874351501464844, 16.411104202270508]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 5.0, 12.0, 21.0, 48.0, 57.0, 102.0, 171.0, 298.0, 559.0, 1003.0, 1694.0, 2881.0, 5080.0, 8678.0, 14678.0, 24133.0, 38742.0, 58674.0, 83941.0, 108720.0, 127583.0, 133103.0, 124203.0, 101643.0, 75942.0, 52127.0, 33621.0, 20861.0, 12605.0, 7411.0, 4169.0, 2444.0, 1405.0, 837.0, 472.0, 263.0, 159.0, 77.0, 50.0, 37.0, 13.0, 12.0, 6.0, 6.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.453125, -14.98974609375, -14.5263671875, -14.06298828125, -13.599609375, -13.13623046875, -12.6728515625, -12.20947265625, -11.74609375, -11.28271484375, -10.8193359375, -10.35595703125, -9.892578125, -9.42919921875, -8.9658203125, -8.50244140625, -8.0390625, -7.57568359375, -7.1123046875, -6.64892578125, -6.185546875, -5.72216796875, -5.2587890625, -4.79541015625, -4.33203125, -3.86865234375, -3.4052734375, -2.94189453125, -2.478515625, -2.01513671875, -1.5517578125, -1.08837890625, -0.625, -0.16162109375, 0.3017578125, 0.76513671875, 1.228515625, 1.69189453125, 2.1552734375, 2.61865234375, 3.08203125, 3.54541015625, 4.0087890625, 4.47216796875, 4.935546875, 5.39892578125, 5.8623046875, 6.32568359375, 6.7890625, 7.25244140625, 7.7158203125, 8.17919921875, 8.642578125, 9.10595703125, 9.5693359375, 10.03271484375, 10.49609375, 10.95947265625, 11.4228515625, 11.88623046875, 12.349609375, 12.81298828125, 13.2763671875, 13.73974609375, 14.203125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 2.0, 1.0, 7.0, 5.0, 8.0, 6.0, 16.0, 12.0, 11.0, 17.0, 12.0, 22.0, 24.0, 19.0, 26.0, 33.0, 31.0, 31.0, 36.0, 31.0, 25.0, 34.0, 35.0, 44.0, 28.0, 38.0, 42.0, 23.0, 36.0, 41.0, 26.0, 34.0, 22.0, 26.0, 15.0, 25.0, 22.0, 14.0, 13.0, 11.0, 21.0, 15.0, 12.0, 14.0, 7.0, 3.0, 7.0, 5.0, 6.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-17.71875, -17.177978515625, -16.63720703125, -16.096435546875, -15.5556640625, -15.014892578125, -14.47412109375, -13.933349609375, -13.392578125, -12.851806640625, -12.31103515625, -11.770263671875, -11.2294921875, -10.688720703125, -10.14794921875, -9.607177734375, -9.06640625, -8.525634765625, -7.98486328125, -7.444091796875, -6.9033203125, -6.362548828125, -5.82177734375, -5.281005859375, -4.740234375, -4.199462890625, -3.65869140625, -3.117919921875, -2.5771484375, -2.036376953125, -1.49560546875, -0.954833984375, -0.4140625, 0.126708984375, 0.66748046875, 1.208251953125, 1.7490234375, 2.289794921875, 2.83056640625, 3.371337890625, 3.912109375, 4.452880859375, 4.99365234375, 5.534423828125, 6.0751953125, 6.615966796875, 7.15673828125, 7.697509765625, 8.23828125, 8.779052734375, 9.31982421875, 9.860595703125, 10.4013671875, 10.942138671875, 11.48291015625, 12.023681640625, 12.564453125, 13.105224609375, 13.64599609375, 14.186767578125, 14.7275390625, 15.268310546875, 15.80908203125, 16.349853515625, 16.890625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 2.0, 3.0, 10.0, 18.0, 20.0, 30.0, 50.0, 75.0, 125.0, 191.0, 307.0, 506.0, 762.0, 1160.0, 1749.0, 2755.0, 4333.0, 6612.0, 10169.0, 15319.0, 23216.0, 33163.0, 46830.0, 62148.0, 78324.0, 93730.0, 104400.0, 106741.0, 102072.0, 90312.0, 74180.0, 57683.0, 42280.0, 29903.0, 20506.0, 13631.0, 8910.0, 5797.0, 3739.0, 2449.0, 1506.0, 1024.0, 682.0, 395.0, 271.0, 176.0, 110.0, 74.0, 45.0, 34.0, 14.0, 11.0, 9.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.734375, -11.3477783203125, -10.961181640625, -10.5745849609375, -10.18798828125, -9.8013916015625, -9.414794921875, -9.0281982421875, -8.6416015625, -8.2550048828125, -7.868408203125, -7.4818115234375, -7.09521484375, -6.7086181640625, -6.322021484375, -5.9354248046875, -5.548828125, -5.1622314453125, -4.775634765625, -4.3890380859375, -4.00244140625, -3.6158447265625, -3.229248046875, -2.8426513671875, -2.4560546875, -2.0694580078125, -1.682861328125, -1.2962646484375, -0.90966796875, -0.5230712890625, -0.136474609375, 0.2501220703125, 0.63671875, 1.0233154296875, 1.409912109375, 1.7965087890625, 2.18310546875, 2.5697021484375, 2.956298828125, 3.3428955078125, 3.7294921875, 4.1160888671875, 4.502685546875, 4.8892822265625, 5.27587890625, 5.6624755859375, 6.049072265625, 6.4356689453125, 6.822265625, 7.2088623046875, 7.595458984375, 7.9820556640625, 8.36865234375, 8.7552490234375, 9.141845703125, 9.5284423828125, 9.9150390625, 10.3016357421875, 10.688232421875, 11.0748291015625, 11.46142578125, 11.8480224609375, 12.234619140625, 12.6212158203125, 13.0078125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 3.0, 4.0, 8.0, 5.0, 12.0, 6.0, 16.0, 13.0, 11.0, 15.0, 18.0, 19.0, 25.0, 28.0, 30.0, 31.0, 51.0, 33.0, 51.0, 36.0, 44.0, 47.0, 35.0, 43.0, 50.0, 29.0, 28.0, 33.0, 35.0, 36.0, 25.0, 22.0, 30.0, 25.0, 14.0, 21.0, 13.0, 15.0, 16.0, 8.0, 4.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-12.1796875, -11.7880859375, -11.396484375, -11.0048828125, -10.61328125, -10.2216796875, -9.830078125, -9.4384765625, -9.046875, -8.6552734375, -8.263671875, -7.8720703125, -7.48046875, -7.0888671875, -6.697265625, -6.3056640625, -5.9140625, -5.5224609375, -5.130859375, -4.7392578125, -4.34765625, -3.9560546875, -3.564453125, -3.1728515625, -2.78125, -2.3896484375, -1.998046875, -1.6064453125, -1.21484375, -0.8232421875, -0.431640625, -0.0400390625, 0.3515625, 0.7431640625, 1.134765625, 1.5263671875, 1.91796875, 2.3095703125, 2.701171875, 3.0927734375, 3.484375, 3.8759765625, 4.267578125, 4.6591796875, 5.05078125, 5.4423828125, 5.833984375, 6.2255859375, 6.6171875, 7.0087890625, 7.400390625, 7.7919921875, 8.18359375, 8.5751953125, 8.966796875, 9.3583984375, 9.75, 10.1416015625, 10.533203125, 10.9248046875, 11.31640625, 11.7080078125, 12.099609375, 12.4912109375, 12.8828125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 8.0, 13.0, 23.0, 23.0, 45.0, 68.0, 110.0, 219.0, 366.0, 694.0, 1126.0, 2002.0, 3420.0, 6234.0, 10721.0, 18547.0, 30973.0, 49694.0, 74866.0, 103842.0, 129700.0, 141543.0, 134997.0, 112594.0, 83144.0, 56563.0, 35895.0, 21373.0, 12771.0, 7334.0, 4151.0, 2348.0, 1315.0, 734.0, 455.0, 237.0, 154.0, 107.0, 51.0, 33.0, 16.0, 16.0, 8.0, 5.0, 4.0, 9.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.859375, -5.6617431640625, -5.464111328125, -5.2664794921875, -5.06884765625, -4.8712158203125, -4.673583984375, -4.4759521484375, -4.2783203125, -4.0806884765625, -3.883056640625, -3.6854248046875, -3.48779296875, -3.2901611328125, -3.092529296875, -2.8948974609375, -2.697265625, -2.4996337890625, -2.302001953125, -2.1043701171875, -1.90673828125, -1.7091064453125, -1.511474609375, -1.3138427734375, -1.1162109375, -0.9185791015625, -0.720947265625, -0.5233154296875, -0.32568359375, -0.1280517578125, 0.069580078125, 0.2672119140625, 0.46484375, 0.6624755859375, 0.860107421875, 1.0577392578125, 1.25537109375, 1.4530029296875, 1.650634765625, 1.8482666015625, 2.0458984375, 2.2435302734375, 2.441162109375, 2.6387939453125, 2.83642578125, 3.0340576171875, 3.231689453125, 3.4293212890625, 3.626953125, 3.8245849609375, 4.022216796875, 4.2198486328125, 4.41748046875, 4.6151123046875, 4.812744140625, 5.0103759765625, 5.2080078125, 5.4056396484375, 5.603271484375, 5.8009033203125, 5.99853515625, 6.1961669921875, 6.393798828125, 6.5914306640625, 6.7890625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 4.0, 5.0, 10.0, 11.0, 11.0, 18.0, 16.0, 28.0, 23.0, 30.0, 33.0, 35.0, 41.0, 57.0, 42.0, 50.0, 53.0, 70.0, 57.0, 48.0, 53.0, 41.0, 37.0, 23.0, 35.0, 29.0, 21.0, 19.0, 17.0, 11.0, 14.0, 7.0, 6.0, 6.0, 7.0, 9.0, 7.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.0006823539733886719, -0.0006611272692680359, -0.0006399005651473999, -0.0006186738610267639, -0.0005974471569061279, -0.0005762204527854919, -0.000554993748664856, -0.00053376704454422, -0.000512540340423584, -0.000491313636302948, -0.000470086932182312, -0.000448860228061676, -0.00042763352394104004, -0.00040640681982040405, -0.00038518011569976807, -0.0003639534115791321, -0.0003427267074584961, -0.0003215000033378601, -0.0003002732992172241, -0.00027904659509658813, -0.00025781989097595215, -0.00023659318685531616, -0.00021536648273468018, -0.0001941397786140442, -0.0001729130744934082, -0.00015168637037277222, -0.00013045966625213623, -0.00010923296213150024, -8.800625801086426e-05, -6.677955389022827e-05, -4.5552849769592285e-05, -2.43261456489563e-05, -3.0994415283203125e-06, 1.8127262592315674e-05, 3.935396671295166e-05, 6.0580670833587646e-05, 8.180737495422363e-05, 0.00010303407907485962, 0.0001242607831954956, 0.0001454874873161316, 0.00016671419143676758, 0.00018794089555740356, 0.00020916759967803955, 0.00023039430379867554, 0.0002516210079193115, 0.0002728477120399475, 0.0002940744161605835, 0.0003153011202812195, 0.00033652782440185547, 0.00035775452852249146, 0.00037898123264312744, 0.00040020793676376343, 0.0004214346408843994, 0.0004426613450050354, 0.0004638880491256714, 0.0004851147532463074, 0.0005063414573669434, 0.0005275681614875793, 0.0005487948656082153, 0.0005700215697288513, 0.0005912482738494873, 0.0006124749779701233, 0.0006337016820907593, 0.0006549283862113953, 0.0006761550903320312]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 7.0, 17.0, 27.0, 48.0, 68.0, 112.0, 172.0, 272.0, 401.0, 661.0, 1096.0, 1687.0, 2645.0, 4155.0, 6653.0, 10432.0, 15586.0, 23692.0, 34667.0, 49094.0, 66114.0, 83943.0, 99681.0, 109315.0, 109929.0, 102336.0, 88694.0, 70025.0, 53127.0, 37970.0, 26432.0, 17613.0, 11527.0, 7371.0, 4819.0, 3034.0, 1878.0, 1211.0, 724.0, 492.0, 301.0, 185.0, 122.0, 74.0, 54.0, 33.0, 24.0, 12.0, 11.0, 6.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.71484375, -4.558349609375, -4.40185546875, -4.245361328125, -4.0888671875, -3.932373046875, -3.77587890625, -3.619384765625, -3.462890625, -3.306396484375, -3.14990234375, -2.993408203125, -2.8369140625, -2.680419921875, -2.52392578125, -2.367431640625, -2.2109375, -2.054443359375, -1.89794921875, -1.741455078125, -1.5849609375, -1.428466796875, -1.27197265625, -1.115478515625, -0.958984375, -0.802490234375, -0.64599609375, -0.489501953125, -0.3330078125, -0.176513671875, -0.02001953125, 0.136474609375, 0.29296875, 0.449462890625, 0.60595703125, 0.762451171875, 0.9189453125, 1.075439453125, 1.23193359375, 1.388427734375, 1.544921875, 1.701416015625, 1.85791015625, 2.014404296875, 2.1708984375, 2.327392578125, 2.48388671875, 2.640380859375, 2.796875, 2.953369140625, 3.10986328125, 3.266357421875, 3.4228515625, 3.579345703125, 3.73583984375, 3.892333984375, 4.048828125, 4.205322265625, 4.36181640625, 4.518310546875, 4.6748046875, 4.831298828125, 4.98779296875, 5.144287109375, 5.30078125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 8.0, 10.0, 14.0, 8.0, 12.0, 13.0, 10.0, 21.0, 16.0, 12.0, 31.0, 25.0, 27.0, 33.0, 39.0, 43.0, 43.0, 30.0, 42.0, 45.0, 40.0, 43.0, 36.0, 41.0, 37.0, 35.0, 37.0, 34.0, 28.0, 33.0, 23.0, 20.0, 22.0, 17.0, 20.0, 10.0, 14.0, 10.0, 3.0, 10.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.763671875, -1.698211669921875, -1.63275146484375, -1.567291259765625, -1.5018310546875, -1.436370849609375, -1.37091064453125, -1.305450439453125, -1.239990234375, -1.174530029296875, -1.10906982421875, -1.043609619140625, -0.9781494140625, -0.912689208984375, -0.84722900390625, -0.781768798828125, -0.71630859375, -0.650848388671875, -0.58538818359375, -0.519927978515625, -0.4544677734375, -0.389007568359375, -0.32354736328125, -0.258087158203125, -0.192626953125, -0.127166748046875, -0.06170654296875, 0.003753662109375, 0.0692138671875, 0.134674072265625, 0.20013427734375, 0.265594482421875, 0.3310546875, 0.396514892578125, 0.46197509765625, 0.527435302734375, 0.5928955078125, 0.658355712890625, 0.72381591796875, 0.789276123046875, 0.854736328125, 0.920196533203125, 0.98565673828125, 1.051116943359375, 1.1165771484375, 1.182037353515625, 1.24749755859375, 1.312957763671875, 1.37841796875, 1.443878173828125, 1.50933837890625, 1.574798583984375, 1.6402587890625, 1.705718994140625, 1.77117919921875, 1.836639404296875, 1.902099609375, 1.967559814453125, 2.03302001953125, 2.098480224609375, 2.1639404296875, 2.229400634765625, 2.29486083984375, 2.360321044921875, 2.42578125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 1.0, 7.0, 6.0, 4.0, 8.0, 14.0, 6.0, 14.0, 13.0, 13.0, 27.0, 34.0, 34.0, 25.0, 30.0, 33.0, 49.0, 33.0, 33.0, 48.0, 46.0, 43.0, 37.0, 39.0, 46.0, 39.0, 31.0, 30.0, 29.0, 30.0, 20.0, 25.0, 31.0, 21.0, 13.0, 17.0, 11.0, 12.0, 6.0, 12.0, 8.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-16.721254348754883, -16.153564453125, -15.5858736038208, -15.018182754516602, -14.450492858886719, -13.88280200958252, -13.31511116027832, -12.747421264648438, -12.179730415344238, -11.612039566040039, -11.044349670410156, -10.476658821105957, -9.908967971801758, -9.341278076171875, -8.773587226867676, -8.205896377563477, -7.638206481933594, -7.070516109466553, -6.502825736999512, -5.9351348876953125, -5.3674445152282715, -4.7997541427612305, -4.232063293457031, -3.6643729209899902, -3.096682548522949, -2.528992176055908, -1.961301565170288, -1.3936110734939575, -0.825920581817627, -0.25823020935058594, 0.3094604015350342, 0.8771510124206543, 1.4448394775390625, 2.0125298500061035, 2.5802204608917236, 3.1479110717773438, 3.7156014442443848, 4.283291816711426, 4.850982666015625, 5.418673038482666, 5.986363410949707, 6.554053783416748, 7.121744155883789, 7.689435005187988, 8.257125854492188, 8.82481575012207, 9.39250659942627, 9.960197448730469, 10.527887344360352, 11.09557819366455, 11.663268089294434, 12.230958938598633, 12.798648834228516, 13.366339683532715, 13.934030532836914, 14.501720428466797, 15.069411277770996, 15.637102127075195, 16.204792022705078, 16.77248191833496, 17.340173721313477, 17.90786361694336, 18.475553512573242, 19.043245315551758, 19.61093521118164]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 14.0, 11.0, 15.0, 10.0, 19.0, 14.0, 25.0, 18.0, 24.0, 26.0, 20.0, 35.0, 33.0, 39.0, 33.0, 34.0, 37.0, 47.0, 39.0, 33.0, 45.0, 35.0, 36.0, 38.0, 42.0, 32.0, 21.0, 32.0, 21.0, 29.0, 20.0, 15.0, 21.0, 18.0, 13.0, 10.0, 9.0, 8.0, 6.0, 7.0, 9.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.333984375, -17.72174835205078, -17.109512329101562, -16.497278213500977, -15.885042190551758, -15.272806167602539, -14.660571098327637, -14.048336029052734, -13.436100006103516, -12.823863983154297, -12.211628913879395, -11.599393844604492, -10.987157821655273, -10.374921798706055, -9.762686729431152, -9.15045166015625, -8.538215637207031, -7.925980091094971, -7.31374454498291, -6.70150899887085, -6.089273452758789, -5.4770379066467285, -4.864802360534668, -4.252566814422607, -3.640331268310547, -3.0280957221984863, -2.415860176086426, -1.8036246299743652, -1.1913890838623047, -0.5791535377502441, 0.033082008361816406, 0.645317554473877, 1.2575550079345703, 1.8697905540466309, 2.4820261001586914, 3.094261646270752, 3.7064971923828125, 4.318732738494873, 4.930968284606934, 5.543203830718994, 6.155439376831055, 6.767674922943115, 7.379910469055176, 7.992146015167236, 8.604381561279297, 9.216617584228516, 9.828852653503418, 10.44108772277832, 11.053323745727539, 11.665559768676758, 12.27779483795166, 12.890029907226562, 13.502265930175781, 14.114501953125, 14.726737022399902, 15.338972091674805, 15.951208114624023, 16.563444137573242, 17.175678253173828, 17.787914276123047, 18.400150299072266, 19.012386322021484, 19.624622344970703, 20.23685646057129, 20.849092483520508]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 7.0, 7.0, 4.0, 15.0, 24.0, 37.0, 36.0, 51.0, 107.0, 163.0, 234.0, 341.0, 511.0, 808.0, 1277.0, 1985.0, 3091.0, 5096.0, 8472.0, 13963.0, 23471.0, 39766.0, 68711.0, 118121.0, 199324.0, 321115.0, 473163.0, 603713.0, 643699.0, 566150.0, 420068.0, 276055.0, 166761.0, 98567.0, 57147.0, 33648.0, 19303.0, 11493.0, 6834.0, 4143.0, 2505.0, 1601.0, 998.0, 645.0, 377.0, 250.0, 154.0, 108.0, 53.0, 52.0, 32.0, 18.0, 5.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0], "bins": [-16.28125, -15.792724609375, -15.30419921875, -14.815673828125, -14.3271484375, -13.838623046875, -13.35009765625, -12.861572265625, -12.373046875, -11.884521484375, -11.39599609375, -10.907470703125, -10.4189453125, -9.930419921875, -9.44189453125, -8.953369140625, -8.46484375, -7.976318359375, -7.48779296875, -6.999267578125, -6.5107421875, -6.022216796875, -5.53369140625, -5.045166015625, -4.556640625, -4.068115234375, -3.57958984375, -3.091064453125, -2.6025390625, -2.114013671875, -1.62548828125, -1.136962890625, -0.6484375, -0.159912109375, 0.32861328125, 0.817138671875, 1.3056640625, 1.794189453125, 2.28271484375, 2.771240234375, 3.259765625, 3.748291015625, 4.23681640625, 4.725341796875, 5.2138671875, 5.702392578125, 6.19091796875, 6.679443359375, 7.16796875, 7.656494140625, 8.14501953125, 8.633544921875, 9.1220703125, 9.610595703125, 10.09912109375, 10.587646484375, 11.076171875, 11.564697265625, 12.05322265625, 12.541748046875, 13.0302734375, 13.518798828125, 14.00732421875, 14.495849609375, 14.984375]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 6.0, 4.0, 3.0, 9.0, 17.0, 16.0, 7.0, 16.0, 23.0, 23.0, 27.0, 22.0, 29.0, 28.0, 33.0, 17.0, 28.0, 34.0, 38.0, 25.0, 41.0, 38.0, 42.0, 35.0, 39.0, 30.0, 34.0, 37.0, 27.0, 20.0, 27.0, 23.0, 22.0, 20.0, 18.0, 24.0, 17.0, 17.0, 15.0, 17.0, 6.0, 4.0, 10.0, 9.0, 4.0, 1.0, 3.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-15.265625, -14.7884521484375, -14.311279296875, -13.8341064453125, -13.35693359375, -12.8797607421875, -12.402587890625, -11.9254150390625, -11.4482421875, -10.9710693359375, -10.493896484375, -10.0167236328125, -9.53955078125, -9.0623779296875, -8.585205078125, -8.1080322265625, -7.630859375, -7.1536865234375, -6.676513671875, -6.1993408203125, -5.72216796875, -5.2449951171875, -4.767822265625, -4.2906494140625, -3.8134765625, -3.3363037109375, -2.859130859375, -2.3819580078125, -1.90478515625, -1.4276123046875, -0.950439453125, -0.4732666015625, 0.00390625, 0.4810791015625, 0.958251953125, 1.4354248046875, 1.91259765625, 2.3897705078125, 2.866943359375, 3.3441162109375, 3.8212890625, 4.2984619140625, 4.775634765625, 5.2528076171875, 5.72998046875, 6.2071533203125, 6.684326171875, 7.1614990234375, 7.638671875, 8.1158447265625, 8.593017578125, 9.0701904296875, 9.54736328125, 10.0245361328125, 10.501708984375, 10.9788818359375, 11.4560546875, 11.9332275390625, 12.410400390625, 12.8875732421875, 13.36474609375, 13.8419189453125, 14.319091796875, 14.7962646484375, 15.2734375]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 12.0, 14.0, 23.0, 43.0, 65.0, 111.0, 145.0, 295.0, 430.0, 676.0, 1115.0, 1908.0, 3232.0, 5587.0, 9589.0, 16428.0, 29192.0, 50770.0, 87417.0, 149491.0, 246541.0, 382415.0, 533270.0, 637130.0, 624706.0, 507071.0, 355091.0, 227089.0, 136787.0, 79250.0, 45905.0, 26083.0, 14930.0, 8789.0, 5116.0, 3043.0, 1772.0, 1074.0, 677.0, 387.0, 220.0, 137.0, 94.0, 59.0, 35.0, 32.0, 12.0, 14.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-18.1875, -17.59912109375, -17.0107421875, -16.42236328125, -15.833984375, -15.24560546875, -14.6572265625, -14.06884765625, -13.48046875, -12.89208984375, -12.3037109375, -11.71533203125, -11.126953125, -10.53857421875, -9.9501953125, -9.36181640625, -8.7734375, -8.18505859375, -7.5966796875, -7.00830078125, -6.419921875, -5.83154296875, -5.2431640625, -4.65478515625, -4.06640625, -3.47802734375, -2.8896484375, -2.30126953125, -1.712890625, -1.12451171875, -0.5361328125, 0.05224609375, 0.640625, 1.22900390625, 1.8173828125, 2.40576171875, 2.994140625, 3.58251953125, 4.1708984375, 4.75927734375, 5.34765625, 5.93603515625, 6.5244140625, 7.11279296875, 7.701171875, 8.28955078125, 8.8779296875, 9.46630859375, 10.0546875, 10.64306640625, 11.2314453125, 11.81982421875, 12.408203125, 12.99658203125, 13.5849609375, 14.17333984375, 14.76171875, 15.35009765625, 15.9384765625, 16.52685546875, 17.115234375, 17.70361328125, 18.2919921875, 18.88037109375, 19.46875]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 5.0, 9.0, 11.0, 26.0, 21.0, 27.0, 38.0, 41.0, 58.0, 60.0, 80.0, 110.0, 127.0, 151.0, 170.0, 210.0, 237.0, 231.0, 256.0, 234.0, 262.0, 238.0, 226.0, 200.0, 203.0, 149.0, 142.0, 126.0, 103.0, 87.0, 61.0, 50.0, 39.0, 25.0, 21.0, 11.0, 11.0, 8.0, 7.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.78515625, -7.52044677734375, -7.2557373046875, -6.99102783203125, -6.726318359375, -6.46160888671875, -6.1968994140625, -5.93218994140625, -5.66748046875, -5.40277099609375, -5.1380615234375, -4.87335205078125, -4.608642578125, -4.34393310546875, -4.0792236328125, -3.81451416015625, -3.5498046875, -3.28509521484375, -3.0203857421875, -2.75567626953125, -2.490966796875, -2.22625732421875, -1.9615478515625, -1.69683837890625, -1.43212890625, -1.16741943359375, -0.9027099609375, -0.63800048828125, -0.373291015625, -0.10858154296875, 0.1561279296875, 0.42083740234375, 0.685546875, 0.95025634765625, 1.2149658203125, 1.47967529296875, 1.744384765625, 2.00909423828125, 2.2738037109375, 2.53851318359375, 2.80322265625, 3.06793212890625, 3.3326416015625, 3.59735107421875, 3.862060546875, 4.12677001953125, 4.3914794921875, 4.65618896484375, 4.9208984375, 5.18560791015625, 5.4503173828125, 5.71502685546875, 5.979736328125, 6.24444580078125, 6.5091552734375, 6.77386474609375, 7.03857421875, 7.30328369140625, 7.5679931640625, 7.83270263671875, 8.097412109375, 8.36212158203125, 8.6268310546875, 8.89154052734375, 9.15625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 14.0, 12.0, 18.0, 22.0, 16.0, 30.0, 29.0, 30.0, 33.0, 39.0, 39.0, 51.0, 50.0, 46.0, 47.0, 46.0, 40.0, 47.0, 61.0, 41.0, 42.0, 40.0, 31.0, 18.0, 21.0, 23.0, 26.0, 23.0, 10.0, 16.0, 6.0, 8.0, 4.0, 0.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.351669311523438, -19.65229606628418, -18.952922821044922, -18.253549575805664, -17.554176330566406, -16.85480308532715, -16.15542984008789, -15.456056594848633, -14.756683349609375, -14.057310104370117, -13.35793685913086, -12.658563613891602, -11.959190368652344, -11.259817123413086, -10.560443878173828, -9.86107063293457, -9.161697387695312, -8.462324142456055, -7.762950897216797, -7.063577651977539, -6.364204406738281, -5.664831161499023, -4.965457916259766, -4.266084671020508, -3.56671142578125, -2.867338180541992, -2.1679649353027344, -1.4685916900634766, -0.7692184448242188, -0.06984519958496094, 0.6295280456542969, 1.3289012908935547, 2.0282764434814453, 2.727649688720703, 3.427022933959961, 4.126396179199219, 4.825769424438477, 5.525142669677734, 6.224515914916992, 6.92388916015625, 7.623262405395508, 8.322635650634766, 9.022008895874023, 9.721382141113281, 10.420755386352539, 11.120128631591797, 11.819501876831055, 12.518875122070312, 13.21824836730957, 13.917621612548828, 14.616994857788086, 15.316368103027344, 16.0157413482666, 16.71511459350586, 17.414487838745117, 18.113861083984375, 18.813234329223633, 19.51260757446289, 20.21198081970215, 20.911354064941406, 21.610727310180664, 22.310100555419922, 23.00947380065918, 23.708847045898438, 24.408220291137695]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 7.0, 5.0, 3.0, 4.0, 6.0, 11.0, 11.0, 17.0, 20.0, 18.0, 21.0, 24.0, 25.0, 29.0, 38.0, 36.0, 25.0, 46.0, 47.0, 43.0, 46.0, 39.0, 39.0, 51.0, 40.0, 40.0, 42.0, 34.0, 28.0, 23.0, 25.0, 28.0, 24.0, 22.0, 15.0, 12.0, 19.0, 16.0, 11.0, 6.0, 6.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.457382202148438, -17.819278717041016, -17.181175231933594, -16.543071746826172, -15.90496826171875, -15.266864776611328, -14.628761291503906, -13.990657806396484, -13.352554321289062, -12.71445083618164, -12.076347351074219, -11.438243865966797, -10.800140380859375, -10.162036895751953, -9.523933410644531, -8.88582992553711, -8.247726440429688, -7.609622955322266, -6.971519470214844, -6.333415985107422, -5.6953125, -5.057209014892578, -4.419105529785156, -3.7810020446777344, -3.1428985595703125, -2.5047950744628906, -1.8666915893554688, -1.2285881042480469, -0.590484619140625, 0.047618865966796875, 0.6857223510742188, 1.3238258361816406, 1.9619293212890625, 2.6000328063964844, 3.2381362915039062, 3.876239776611328, 4.51434326171875, 5.152446746826172, 5.790550231933594, 6.428653717041016, 7.0667572021484375, 7.704860687255859, 8.342964172363281, 8.981067657470703, 9.619171142578125, 10.257274627685547, 10.895378112792969, 11.53348159790039, 12.171585083007812, 12.809688568115234, 13.447792053222656, 14.085895538330078, 14.7239990234375, 15.362102508544922, 16.000205993652344, 16.638309478759766, 17.276412963867188, 17.91451644897461, 18.55261993408203, 19.190723419189453, 19.828826904296875, 20.466930389404297, 21.10503387451172, 21.74313735961914, 22.381240844726562]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 6.0, 10.0, 8.0, 18.0, 31.0, 33.0, 54.0, 80.0, 149.0, 234.0, 375.0, 592.0, 962.0, 1550.0, 2508.0, 3945.0, 6426.0, 10275.0, 16883.0, 26479.0, 41017.0, 60650.0, 85096.0, 109059.0, 127331.0, 130225.0, 119083.0, 96159.0, 71876.0, 49278.0, 33179.0, 20884.0, 12985.0, 8067.0, 4974.0, 3016.0, 1947.0, 1144.0, 711.0, 451.0, 297.0, 184.0, 121.0, 79.0, 48.0, 26.0, 16.0, 12.0, 12.0, 8.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-10.5078125, -10.17138671875, -9.8349609375, -9.49853515625, -9.162109375, -8.82568359375, -8.4892578125, -8.15283203125, -7.81640625, -7.47998046875, -7.1435546875, -6.80712890625, -6.470703125, -6.13427734375, -5.7978515625, -5.46142578125, -5.125, -4.78857421875, -4.4521484375, -4.11572265625, -3.779296875, -3.44287109375, -3.1064453125, -2.77001953125, -2.43359375, -2.09716796875, -1.7607421875, -1.42431640625, -1.087890625, -0.75146484375, -0.4150390625, -0.07861328125, 0.2578125, 0.59423828125, 0.9306640625, 1.26708984375, 1.603515625, 1.93994140625, 2.2763671875, 2.61279296875, 2.94921875, 3.28564453125, 3.6220703125, 3.95849609375, 4.294921875, 4.63134765625, 4.9677734375, 5.30419921875, 5.640625, 5.97705078125, 6.3134765625, 6.64990234375, 6.986328125, 7.32275390625, 7.6591796875, 7.99560546875, 8.33203125, 8.66845703125, 9.0048828125, 9.34130859375, 9.677734375, 10.01416015625, 10.3505859375, 10.68701171875, 11.0234375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 4.0, 7.0, 12.0, 11.0, 12.0, 12.0, 10.0, 22.0, 16.0, 20.0, 19.0, 27.0, 33.0, 31.0, 33.0, 28.0, 27.0, 49.0, 42.0, 31.0, 48.0, 41.0, 35.0, 48.0, 36.0, 38.0, 39.0, 23.0, 23.0, 20.0, 31.0, 22.0, 23.0, 16.0, 16.0, 25.0, 12.0, 10.0, 14.0, 3.0, 12.0, 11.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.625, -18.03125, -17.4375, -16.84375, -16.25, -15.65625, -15.0625, -14.46875, -13.875, -13.28125, -12.6875, -12.09375, -11.5, -10.90625, -10.3125, -9.71875, -9.125, -8.53125, -7.9375, -7.34375, -6.75, -6.15625, -5.5625, -4.96875, -4.375, -3.78125, -3.1875, -2.59375, -2.0, -1.40625, -0.8125, -0.21875, 0.375, 0.96875, 1.5625, 2.15625, 2.75, 3.34375, 3.9375, 4.53125, 5.125, 5.71875, 6.3125, 6.90625, 7.5, 8.09375, 8.6875, 9.28125, 9.875, 10.46875, 11.0625, 11.65625, 12.25, 12.84375, 13.4375, 14.03125, 14.625, 15.21875, 15.8125, 16.40625, 17.0, 17.59375, 18.1875, 18.78125, 19.375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 13.0, 13.0, 24.0, 30.0, 48.0, 76.0, 128.0, 188.0, 294.0, 399.0, 658.0, 1026.0, 1695.0, 2778.0, 4642.0, 7849.0, 13339.0, 23199.0, 39968.0, 67060.0, 104994.0, 149002.0, 171532.0, 157067.0, 116240.0, 75849.0, 45854.0, 26479.0, 15553.0, 9113.0, 5269.0, 3078.0, 1977.0, 1142.0, 703.0, 428.0, 302.0, 163.0, 120.0, 90.0, 54.0, 37.0, 28.0, 14.0, 13.0, 10.0, 7.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.65625, -16.129638671875, -15.60302734375, -15.076416015625, -14.5498046875, -14.023193359375, -13.49658203125, -12.969970703125, -12.443359375, -11.916748046875, -11.39013671875, -10.863525390625, -10.3369140625, -9.810302734375, -9.28369140625, -8.757080078125, -8.23046875, -7.703857421875, -7.17724609375, -6.650634765625, -6.1240234375, -5.597412109375, -5.07080078125, -4.544189453125, -4.017578125, -3.490966796875, -2.96435546875, -2.437744140625, -1.9111328125, -1.384521484375, -0.85791015625, -0.331298828125, 0.1953125, 0.721923828125, 1.24853515625, 1.775146484375, 2.3017578125, 2.828369140625, 3.35498046875, 3.881591796875, 4.408203125, 4.934814453125, 5.46142578125, 5.988037109375, 6.5146484375, 7.041259765625, 7.56787109375, 8.094482421875, 8.62109375, 9.147705078125, 9.67431640625, 10.200927734375, 10.7275390625, 11.254150390625, 11.78076171875, 12.307373046875, 12.833984375, 13.360595703125, 13.88720703125, 14.413818359375, 14.9404296875, 15.467041015625, 15.99365234375, 16.520263671875, 17.046875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 6.0, 4.0, 9.0, 14.0, 6.0, 13.0, 27.0, 19.0, 16.0, 21.0, 16.0, 33.0, 23.0, 25.0, 31.0, 41.0, 40.0, 36.0, 44.0, 31.0, 42.0, 33.0, 28.0, 37.0, 40.0, 25.0, 38.0, 36.0, 28.0, 28.0, 30.0, 15.0, 20.0, 19.0, 19.0, 15.0, 18.0, 9.0, 12.0, 9.0, 9.0, 9.0, 6.0, 2.0, 3.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-11.8125, -11.4539794921875, -11.095458984375, -10.7369384765625, -10.37841796875, -10.0198974609375, -9.661376953125, -9.3028564453125, -8.9443359375, -8.5858154296875, -8.227294921875, -7.8687744140625, -7.51025390625, -7.1517333984375, -6.793212890625, -6.4346923828125, -6.076171875, -5.7176513671875, -5.359130859375, -5.0006103515625, -4.64208984375, -4.2835693359375, -3.925048828125, -3.5665283203125, -3.2080078125, -2.8494873046875, -2.490966796875, -2.1324462890625, -1.77392578125, -1.4154052734375, -1.056884765625, -0.6983642578125, -0.33984375, 0.0186767578125, 0.377197265625, 0.7357177734375, 1.09423828125, 1.4527587890625, 1.811279296875, 2.1697998046875, 2.5283203125, 2.8868408203125, 3.245361328125, 3.6038818359375, 3.96240234375, 4.3209228515625, 4.679443359375, 5.0379638671875, 5.396484375, 5.7550048828125, 6.113525390625, 6.4720458984375, 6.83056640625, 7.1890869140625, 7.547607421875, 7.9061279296875, 8.2646484375, 8.6231689453125, 8.981689453125, 9.3402099609375, 9.69873046875, 10.0572509765625, 10.415771484375, 10.7742919921875, 11.1328125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 12.0, 20.0, 27.0, 36.0, 68.0, 86.0, 167.0, 208.0, 304.0, 488.0, 739.0, 1094.0, 1719.0, 2685.0, 4196.0, 6817.0, 10731.0, 17258.0, 27542.0, 43282.0, 67099.0, 97967.0, 131682.0, 151988.0, 143752.0, 114291.0, 79670.0, 52837.0, 33878.0, 21431.0, 13350.0, 8299.0, 5268.0, 3315.0, 2132.0, 1405.0, 876.0, 635.0, 401.0, 249.0, 175.0, 138.0, 71.0, 42.0, 40.0, 25.0, 18.0, 14.0, 12.0, 7.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.30859375, -6.1097412109375, -5.910888671875, -5.7120361328125, -5.51318359375, -5.3143310546875, -5.115478515625, -4.9166259765625, -4.7177734375, -4.5189208984375, -4.320068359375, -4.1212158203125, -3.92236328125, -3.7235107421875, -3.524658203125, -3.3258056640625, -3.126953125, -2.9281005859375, -2.729248046875, -2.5303955078125, -2.33154296875, -2.1326904296875, -1.933837890625, -1.7349853515625, -1.5361328125, -1.3372802734375, -1.138427734375, -0.9395751953125, -0.74072265625, -0.5418701171875, -0.343017578125, -0.1441650390625, 0.0546875, 0.2535400390625, 0.452392578125, 0.6512451171875, 0.85009765625, 1.0489501953125, 1.247802734375, 1.4466552734375, 1.6455078125, 1.8443603515625, 2.043212890625, 2.2420654296875, 2.44091796875, 2.6397705078125, 2.838623046875, 3.0374755859375, 3.236328125, 3.4351806640625, 3.634033203125, 3.8328857421875, 4.03173828125, 4.2305908203125, 4.429443359375, 4.6282958984375, 4.8271484375, 5.0260009765625, 5.224853515625, 5.4237060546875, 5.62255859375, 5.8214111328125, 6.020263671875, 6.2191162109375, 6.41796875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 8.0, 2.0, 5.0, 7.0, 4.0, 13.0, 13.0, 9.0, 21.0, 27.0, 28.0, 29.0, 37.0, 45.0, 29.0, 42.0, 61.0, 50.0, 47.0, 43.0, 52.0, 46.0, 42.0, 38.0, 48.0, 32.0, 29.0, 31.0, 29.0, 25.0, 15.0, 25.0, 14.0, 10.0, 10.0, 8.0, 8.0, 8.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0], "bins": [-0.0005035400390625, -0.0004904791712760925, -0.00047741830348968506, -0.0004643574357032776, -0.0004512965679168701, -0.00043823570013046265, -0.0004251748323440552, -0.0004121139645576477, -0.00039905309677124023, -0.00038599222898483276, -0.0003729313611984253, -0.0003598704934120178, -0.00034680962562561035, -0.0003337487578392029, -0.0003206878900527954, -0.00030762702226638794, -0.00029456615447998047, -0.000281505286693573, -0.00026844441890716553, -0.00025538355112075806, -0.00024232268333435059, -0.00022926181554794312, -0.00021620094776153564, -0.00020314007997512817, -0.0001900792121887207, -0.00017701834440231323, -0.00016395747661590576, -0.0001508966088294983, -0.00013783574104309082, -0.00012477487325668335, -0.00011171400547027588, -9.865313768386841e-05, -8.559226989746094e-05, -7.253140211105347e-05, -5.9470534324645996e-05, -4.6409666538238525e-05, -3.3348798751831055e-05, -2.0287930965423584e-05, -7.227063179016113e-06, 5.833804607391357e-06, 1.8894672393798828e-05, 3.19555401802063e-05, 4.501640796661377e-05, 5.807727575302124e-05, 7.113814353942871e-05, 8.419901132583618e-05, 9.725987911224365e-05, 0.00011032074689865112, 0.0001233816146850586, 0.00013644248247146606, 0.00014950335025787354, 0.000162564218044281, 0.00017562508583068848, 0.00018868595361709595, 0.00020174682140350342, 0.0002148076891899109, 0.00022786855697631836, 0.00024092942476272583, 0.0002539902925491333, 0.00026705116033554077, 0.00028011202812194824, 0.0002931728959083557, 0.0003062337636947632, 0.00031929463148117065, 0.0003323554992675781]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 10.0, 13.0, 14.0, 14.0, 30.0, 52.0, 79.0, 92.0, 160.0, 215.0, 354.0, 544.0, 766.0, 1192.0, 1808.0, 2924.0, 4550.0, 7190.0, 11440.0, 17748.0, 27551.0, 41517.0, 60367.0, 83916.0, 107285.0, 124562.0, 127615.0, 116803.0, 95481.0, 71248.0, 49642.0, 33045.0, 21815.0, 13912.0, 8869.0, 5549.0, 3655.0, 2350.0, 1423.0, 967.0, 614.0, 428.0, 235.0, 182.0, 113.0, 83.0, 53.0, 33.0, 16.0, 14.0, 13.0, 5.0, 6.0, 1.0, 1.0, 1.0, 3.0], "bins": [-6.96484375, -6.7552490234375, -6.545654296875, -6.3360595703125, -6.12646484375, -5.9168701171875, -5.707275390625, -5.4976806640625, -5.2880859375, -5.0784912109375, -4.868896484375, -4.6593017578125, -4.44970703125, -4.2401123046875, -4.030517578125, -3.8209228515625, -3.611328125, -3.4017333984375, -3.192138671875, -2.9825439453125, -2.77294921875, -2.5633544921875, -2.353759765625, -2.1441650390625, -1.9345703125, -1.7249755859375, -1.515380859375, -1.3057861328125, -1.09619140625, -0.8865966796875, -0.677001953125, -0.4674072265625, -0.2578125, -0.0482177734375, 0.161376953125, 0.3709716796875, 0.58056640625, 0.7901611328125, 0.999755859375, 1.2093505859375, 1.4189453125, 1.6285400390625, 1.838134765625, 2.0477294921875, 2.25732421875, 2.4669189453125, 2.676513671875, 2.8861083984375, 3.095703125, 3.3052978515625, 3.514892578125, 3.7244873046875, 3.93408203125, 4.1436767578125, 4.353271484375, 4.5628662109375, 4.7724609375, 4.9820556640625, 5.191650390625, 5.4012451171875, 5.61083984375, 5.8204345703125, 6.030029296875, 6.2396240234375, 6.44921875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 8.0, 5.0, 7.0, 10.0, 11.0, 13.0, 8.0, 20.0, 17.0, 21.0, 29.0, 35.0, 50.0, 48.0, 46.0, 43.0, 53.0, 60.0, 51.0, 63.0, 48.0, 48.0, 39.0, 39.0, 51.0, 30.0, 37.0, 24.0, 21.0, 15.0, 7.0, 11.0, 6.0, 5.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.998046875, -2.90325927734375, -2.8084716796875, -2.71368408203125, -2.618896484375, -2.52410888671875, -2.4293212890625, -2.33453369140625, -2.23974609375, -2.14495849609375, -2.0501708984375, -1.95538330078125, -1.860595703125, -1.76580810546875, -1.6710205078125, -1.57623291015625, -1.4814453125, -1.38665771484375, -1.2918701171875, -1.19708251953125, -1.102294921875, -1.00750732421875, -0.9127197265625, -0.81793212890625, -0.72314453125, -0.62835693359375, -0.5335693359375, -0.43878173828125, -0.343994140625, -0.24920654296875, -0.1544189453125, -0.05963134765625, 0.03515625, 0.12994384765625, 0.2247314453125, 0.31951904296875, 0.414306640625, 0.50909423828125, 0.6038818359375, 0.69866943359375, 0.79345703125, 0.88824462890625, 0.9830322265625, 1.07781982421875, 1.172607421875, 1.26739501953125, 1.3621826171875, 1.45697021484375, 1.5517578125, 1.64654541015625, 1.7413330078125, 1.83612060546875, 1.930908203125, 2.02569580078125, 2.1204833984375, 2.21527099609375, 2.31005859375, 2.40484619140625, 2.4996337890625, 2.59442138671875, 2.689208984375, 2.78399658203125, 2.8787841796875, 2.97357177734375, 3.068359375]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 6.0, 2.0, 4.0, 10.0, 9.0, 12.0, 21.0, 21.0, 37.0, 27.0, 39.0, 24.0, 31.0, 44.0, 47.0, 54.0, 49.0, 45.0, 52.0, 53.0, 53.0, 51.0, 44.0, 51.0, 33.0, 26.0, 23.0, 21.0, 17.0, 27.0, 26.0, 12.0, 15.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.15675163269043, -19.442813873291016, -18.728878021240234, -18.01494026184082, -17.301002502441406, -16.587064743041992, -15.873127937316895, -15.159191131591797, -14.445253372192383, -13.731315612792969, -13.017378807067871, -12.303442001342773, -11.58950424194336, -10.875566482543945, -10.161629676818848, -9.44769287109375, -8.733755111694336, -8.019817352294922, -7.305880546569824, -6.591943264007568, -5.8780059814453125, -5.164068698883057, -4.450131416320801, -3.736194133758545, -3.022256851196289, -2.308319568634033, -1.5943822860717773, -0.8804450035095215, -0.16650772094726562, 0.5474295616149902, 1.261366844177246, 1.975304126739502, 2.6892433166503906, 3.4031805992126465, 4.117117881774902, 4.831055164337158, 5.544992446899414, 6.25892972946167, 6.972867012023926, 7.686804294586182, 8.400741577148438, 9.114679336547852, 9.82861614227295, 10.542552947998047, 11.256490707397461, 11.970428466796875, 12.684365272521973, 13.39830207824707, 14.112239837646484, 14.826177597045898, 15.540114402770996, 16.254051208496094, 16.967988967895508, 17.681926727294922, 18.395862579345703, 19.109800338745117, 19.82373809814453, 20.537675857543945, 21.25161361694336, 21.96554946899414, 22.679487228393555, 23.39342498779297, 24.10736083984375, 24.821298599243164, 25.535236358642578]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 8.0, 1.0, 3.0, 8.0, 13.0, 12.0, 11.0, 19.0, 16.0, 19.0, 27.0, 25.0, 25.0, 38.0, 35.0, 26.0, 42.0, 39.0, 44.0, 39.0, 49.0, 49.0, 45.0, 40.0, 34.0, 38.0, 45.0, 27.0, 30.0, 20.0, 26.0, 23.0, 21.0, 23.0, 18.0, 12.0, 17.0, 13.0, 9.0, 8.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.175724029541016, -17.55483055114746, -16.933937072753906, -16.313045501708984, -15.69215202331543, -15.071258544921875, -14.45036506652832, -13.829471588134766, -13.208579063415527, -12.587685585021973, -11.966793060302734, -11.34589958190918, -10.725006103515625, -10.104113578796387, -9.483220100402832, -8.862327575683594, -8.241434097290039, -7.620541095733643, -6.999648094177246, -6.378754615783691, -5.757861614227295, -5.136968612670898, -4.516075134277344, -3.8951821327209473, -3.274289131164551, -2.6533961296081543, -2.0325028896331787, -1.4116097688674927, -0.7907166481018066, -0.16982364654541016, 0.45106959342956543, 1.071962833404541, 1.6928539276123047, 2.313746929168701, 2.9346401691436768, 3.5555334091186523, 4.176426410675049, 4.797319412231445, 5.418212890625, 6.0391058921813965, 6.659998893737793, 7.2808918952941895, 7.901784896850586, 8.52267837524414, 9.143571853637695, 9.764464378356934, 10.385357856750488, 11.006250381469727, 11.627143859863281, 12.248037338256836, 12.868929862976074, 13.489823341369629, 14.110715866088867, 14.731609344482422, 15.352502822875977, 15.973396301269531, 16.594287872314453, 17.215181350708008, 17.836074829101562, 18.456966400146484, 19.07785987854004, 19.698753356933594, 20.31964683532715, 20.940540313720703, 21.561433792114258]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 2.0, 6.0, 8.0, 12.0, 16.0, 24.0, 52.0, 61.0, 91.0, 138.0, 251.0, 346.0, 590.0, 906.0, 1479.0, 2362.0, 3617.0, 5746.0, 8909.0, 13522.0, 20726.0, 30548.0, 42404.0, 58020.0, 74451.0, 90422.0, 102069.0, 107495.0, 104884.0, 94055.0, 78497.0, 62061.0, 46027.0, 33000.0, 22880.0, 15333.0, 9984.0, 6383.0, 4085.0, 2637.0, 1618.0, 1054.0, 665.0, 405.0, 263.0, 160.0, 101.0, 63.0, 48.0, 32.0, 17.0, 18.0, 5.0, 5.0, 7.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.3984375, -11.0262451171875, -10.654052734375, -10.2818603515625, -9.90966796875, -9.5374755859375, -9.165283203125, -8.7930908203125, -8.4208984375, -8.0487060546875, -7.676513671875, -7.3043212890625, -6.93212890625, -6.5599365234375, -6.187744140625, -5.8155517578125, -5.443359375, -5.0711669921875, -4.698974609375, -4.3267822265625, -3.95458984375, -3.5823974609375, -3.210205078125, -2.8380126953125, -2.4658203125, -2.0936279296875, -1.721435546875, -1.3492431640625, -0.97705078125, -0.6048583984375, -0.232666015625, 0.1395263671875, 0.51171875, 0.8839111328125, 1.256103515625, 1.6282958984375, 2.00048828125, 2.3726806640625, 2.744873046875, 3.1170654296875, 3.4892578125, 3.8614501953125, 4.233642578125, 4.6058349609375, 4.97802734375, 5.3502197265625, 5.722412109375, 6.0946044921875, 6.466796875, 6.8389892578125, 7.211181640625, 7.5833740234375, 7.95556640625, 8.3277587890625, 8.699951171875, 9.0721435546875, 9.4443359375, 9.8165283203125, 10.188720703125, 10.5609130859375, 10.93310546875, 11.3052978515625, 11.677490234375, 12.0496826171875, 12.421875]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 9.0, 4.0, 11.0, 19.0, 9.0, 23.0, 27.0, 18.0, 29.0, 36.0, 29.0, 36.0, 34.0, 42.0, 45.0, 35.0, 41.0, 44.0, 56.0, 50.0, 36.0, 52.0, 40.0, 41.0, 29.0, 34.0, 34.0, 28.0, 20.0, 8.0, 17.0, 21.0, 14.0, 7.0, 10.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.53125, -18.836669921875, -18.14208984375, -17.447509765625, -16.7529296875, -16.058349609375, -15.36376953125, -14.669189453125, -13.974609375, -13.280029296875, -12.58544921875, -11.890869140625, -11.1962890625, -10.501708984375, -9.80712890625, -9.112548828125, -8.41796875, -7.723388671875, -7.02880859375, -6.334228515625, -5.6396484375, -4.945068359375, -4.25048828125, -3.555908203125, -2.861328125, -2.166748046875, -1.47216796875, -0.777587890625, -0.0830078125, 0.611572265625, 1.30615234375, 2.000732421875, 2.6953125, 3.389892578125, 4.08447265625, 4.779052734375, 5.4736328125, 6.168212890625, 6.86279296875, 7.557373046875, 8.251953125, 8.946533203125, 9.64111328125, 10.335693359375, 11.0302734375, 11.724853515625, 12.41943359375, 13.114013671875, 13.80859375, 14.503173828125, 15.19775390625, 15.892333984375, 16.5869140625, 17.281494140625, 17.97607421875, 18.670654296875, 19.365234375, 20.059814453125, 20.75439453125, 21.448974609375, 22.1435546875, 22.838134765625, 23.53271484375, 24.227294921875, 24.921875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 8.0, 10.0, 18.0, 35.0, 70.0, 72.0, 116.0, 235.0, 351.0, 467.0, 805.0, 1270.0, 2030.0, 3087.0, 4705.0, 7160.0, 11480.0, 17361.0, 26060.0, 37469.0, 52682.0, 69850.0, 87747.0, 102608.0, 110087.0, 109776.0, 99985.0, 84010.0, 66037.0, 49234.0, 34756.0, 23758.0, 16018.0, 10478.0, 6789.0, 4206.0, 2684.0, 1795.0, 1164.0, 726.0, 493.0, 313.0, 194.0, 126.0, 72.0, 55.0, 31.0, 27.0, 12.0, 11.0, 7.0, 6.0, 4.0, 3.0, 3.0], "bins": [-13.6953125, -13.291259765625, -12.88720703125, -12.483154296875, -12.0791015625, -11.675048828125, -11.27099609375, -10.866943359375, -10.462890625, -10.058837890625, -9.65478515625, -9.250732421875, -8.8466796875, -8.442626953125, -8.03857421875, -7.634521484375, -7.23046875, -6.826416015625, -6.42236328125, -6.018310546875, -5.6142578125, -5.210205078125, -4.80615234375, -4.402099609375, -3.998046875, -3.593994140625, -3.18994140625, -2.785888671875, -2.3818359375, -1.977783203125, -1.57373046875, -1.169677734375, -0.765625, -0.361572265625, 0.04248046875, 0.446533203125, 0.8505859375, 1.254638671875, 1.65869140625, 2.062744140625, 2.466796875, 2.870849609375, 3.27490234375, 3.678955078125, 4.0830078125, 4.487060546875, 4.89111328125, 5.295166015625, 5.69921875, 6.103271484375, 6.50732421875, 6.911376953125, 7.3154296875, 7.719482421875, 8.12353515625, 8.527587890625, 8.931640625, 9.335693359375, 9.73974609375, 10.143798828125, 10.5478515625, 10.951904296875, 11.35595703125, 11.760009765625, 12.1640625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 2.0, 6.0, 7.0, 10.0, 8.0, 20.0, 8.0, 16.0, 13.0, 20.0, 26.0, 24.0, 36.0, 19.0, 35.0, 38.0, 24.0, 37.0, 30.0, 35.0, 50.0, 46.0, 41.0, 48.0, 39.0, 43.0, 34.0, 31.0, 42.0, 33.0, 34.0, 17.0, 24.0, 13.0, 14.0, 14.0, 8.0, 12.0, 8.0, 10.0, 11.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-12.6796875, -12.296142578125, -11.91259765625, -11.529052734375, -11.1455078125, -10.761962890625, -10.37841796875, -9.994873046875, -9.611328125, -9.227783203125, -8.84423828125, -8.460693359375, -8.0771484375, -7.693603515625, -7.31005859375, -6.926513671875, -6.54296875, -6.159423828125, -5.77587890625, -5.392333984375, -5.0087890625, -4.625244140625, -4.24169921875, -3.858154296875, -3.474609375, -3.091064453125, -2.70751953125, -2.323974609375, -1.9404296875, -1.556884765625, -1.17333984375, -0.789794921875, -0.40625, -0.022705078125, 0.36083984375, 0.744384765625, 1.1279296875, 1.511474609375, 1.89501953125, 2.278564453125, 2.662109375, 3.045654296875, 3.42919921875, 3.812744140625, 4.1962890625, 4.579833984375, 4.96337890625, 5.346923828125, 5.73046875, 6.114013671875, 6.49755859375, 6.881103515625, 7.2646484375, 7.648193359375, 8.03173828125, 8.415283203125, 8.798828125, 9.182373046875, 9.56591796875, 9.949462890625, 10.3330078125, 10.716552734375, 11.10009765625, 11.483642578125, 11.8671875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 7.0, 13.0, 34.0, 39.0, 76.0, 101.0, 154.0, 266.0, 420.0, 672.0, 1039.0, 1728.0, 2711.0, 4305.0, 6800.0, 10900.0, 17019.0, 25818.0, 38347.0, 54479.0, 73463.0, 92835.0, 108410.0, 115567.0, 113601.0, 100482.0, 82255.0, 63117.0, 45733.0, 30875.0, 20802.0, 13420.0, 8683.0, 5537.0, 3328.0, 2071.0, 1292.0, 837.0, 462.0, 327.0, 195.0, 123.0, 78.0, 54.0, 30.0, 19.0, 22.0, 9.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.71484375, -4.57080078125, -4.4267578125, -4.28271484375, -4.138671875, -3.99462890625, -3.8505859375, -3.70654296875, -3.5625, -3.41845703125, -3.2744140625, -3.13037109375, -2.986328125, -2.84228515625, -2.6982421875, -2.55419921875, -2.41015625, -2.26611328125, -2.1220703125, -1.97802734375, -1.833984375, -1.68994140625, -1.5458984375, -1.40185546875, -1.2578125, -1.11376953125, -0.9697265625, -0.82568359375, -0.681640625, -0.53759765625, -0.3935546875, -0.24951171875, -0.10546875, 0.03857421875, 0.1826171875, 0.32666015625, 0.470703125, 0.61474609375, 0.7587890625, 0.90283203125, 1.046875, 1.19091796875, 1.3349609375, 1.47900390625, 1.623046875, 1.76708984375, 1.9111328125, 2.05517578125, 2.19921875, 2.34326171875, 2.4873046875, 2.63134765625, 2.775390625, 2.91943359375, 3.0634765625, 3.20751953125, 3.3515625, 3.49560546875, 3.6396484375, 3.78369140625, 3.927734375, 4.07177734375, 4.2158203125, 4.35986328125, 4.50390625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 9.0, 3.0, 5.0, 14.0, 9.0, 15.0, 12.0, 20.0, 17.0, 27.0, 26.0, 30.0, 33.0, 46.0, 32.0, 59.0, 43.0, 59.0, 46.0, 50.0, 50.0, 47.0, 33.0, 46.0, 33.0, 31.0, 36.0, 30.0, 26.0, 19.0, 18.0, 19.0, 9.0, 10.0, 8.0, 2.0, 6.0, 4.0, 0.0, 1.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0006513595581054688, -0.0006326362490653992, -0.0006139129400253296, -0.00059518963098526, -0.0005764663219451904, -0.0005577430129051208, -0.0005390197038650513, -0.0005202963948249817, -0.0005015730857849121, -0.00048284977674484253, -0.00046412646770477295, -0.00044540315866470337, -0.0004266798496246338, -0.0004079565405845642, -0.00038923323154449463, -0.00037050992250442505, -0.00035178661346435547, -0.0003330633044242859, -0.0003143399953842163, -0.00029561668634414673, -0.00027689337730407715, -0.00025817006826400757, -0.000239446759223938, -0.0002207234501838684, -0.00020200014114379883, -0.00018327683210372925, -0.00016455352306365967, -0.0001458302140235901, -0.0001271069049835205, -0.00010838359594345093, -8.966028690338135e-05, -7.093697786331177e-05, -5.221366882324219e-05, -3.349035978317261e-05, -1.4767050743103027e-05, 3.956258296966553e-06, 2.2679567337036133e-05, 4.140287637710571e-05, 6.012618541717529e-05, 7.884949445724487e-05, 9.757280349731445e-05, 0.00011629611253738403, 0.0001350194215774536, 0.0001537427306175232, 0.00017246603965759277, 0.00019118934869766235, 0.00020991265773773193, 0.00022863596677780151, 0.0002473592758178711, 0.0002660825848579407, 0.00028480589389801025, 0.00030352920293807983, 0.0003222525119781494, 0.000340975821018219, 0.0003596991300582886, 0.00037842243909835815, 0.00039714574813842773, 0.0004158690571784973, 0.0004345923662185669, 0.0004533156752586365, 0.00047203898429870605, 0.0004907622933387756, 0.0005094856023788452, 0.0005282089114189148, 0.0005469322204589844]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 6.0, 8.0, 15.0, 16.0, 43.0, 66.0, 69.0, 136.0, 184.0, 297.0, 428.0, 637.0, 974.0, 1552.0, 2324.0, 3375.0, 5107.0, 7508.0, 11014.0, 15795.0, 22678.0, 31452.0, 42251.0, 55128.0, 69354.0, 82251.0, 92109.0, 97585.0, 95765.0, 89448.0, 77447.0, 64147.0, 49945.0, 38477.0, 27752.0, 20023.0, 13884.0, 9604.0, 6541.0, 4478.0, 2963.0, 1952.0, 1266.0, 872.0, 567.0, 363.0, 261.0, 163.0, 99.0, 66.0, 44.0, 28.0, 15.0, 20.0, 6.0, 4.0, 5.0], "bins": [-4.4296875, -4.302459716796875, -4.17523193359375, -4.048004150390625, -3.9207763671875, -3.793548583984375, -3.66632080078125, -3.539093017578125, -3.411865234375, -3.284637451171875, -3.15740966796875, -3.030181884765625, -2.9029541015625, -2.775726318359375, -2.64849853515625, -2.521270751953125, -2.39404296875, -2.266815185546875, -2.13958740234375, -2.012359619140625, -1.8851318359375, -1.757904052734375, -1.63067626953125, -1.503448486328125, -1.376220703125, -1.248992919921875, -1.12176513671875, -0.994537353515625, -0.8673095703125, -0.740081787109375, -0.61285400390625, -0.485626220703125, -0.3583984375, -0.231170654296875, -0.10394287109375, 0.023284912109375, 0.1505126953125, 0.277740478515625, 0.40496826171875, 0.532196044921875, 0.659423828125, 0.786651611328125, 0.91387939453125, 1.041107177734375, 1.1683349609375, 1.295562744140625, 1.42279052734375, 1.550018310546875, 1.67724609375, 1.804473876953125, 1.93170166015625, 2.058929443359375, 2.1861572265625, 2.313385009765625, 2.44061279296875, 2.567840576171875, 2.695068359375, 2.822296142578125, 2.94952392578125, 3.076751708984375, 3.2039794921875, 3.331207275390625, 3.45843505859375, 3.585662841796875, 3.712890625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 3.0, 0.0, 2.0, 4.0, 6.0, 5.0, 11.0, 10.0, 9.0, 14.0, 14.0, 26.0, 24.0, 19.0, 38.0, 30.0, 37.0, 32.0, 30.0, 38.0, 46.0, 39.0, 45.0, 48.0, 39.0, 47.0, 37.0, 44.0, 26.0, 42.0, 28.0, 34.0, 26.0, 26.0, 16.0, 17.0, 15.0, 12.0, 13.0, 7.0, 13.0, 8.0, 7.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.001953125, -1.94000244140625, -1.8780517578125, -1.81610107421875, -1.754150390625, -1.69219970703125, -1.6302490234375, -1.56829833984375, -1.50634765625, -1.44439697265625, -1.3824462890625, -1.32049560546875, -1.258544921875, -1.19659423828125, -1.1346435546875, -1.07269287109375, -1.0107421875, -0.94879150390625, -0.8868408203125, -0.82489013671875, -0.762939453125, -0.70098876953125, -0.6390380859375, -0.57708740234375, -0.51513671875, -0.45318603515625, -0.3912353515625, -0.32928466796875, -0.267333984375, -0.20538330078125, -0.1434326171875, -0.08148193359375, -0.01953125, 0.04241943359375, 0.1043701171875, 0.16632080078125, 0.228271484375, 0.29022216796875, 0.3521728515625, 0.41412353515625, 0.47607421875, 0.53802490234375, 0.5999755859375, 0.66192626953125, 0.723876953125, 0.78582763671875, 0.8477783203125, 0.90972900390625, 0.9716796875, 1.03363037109375, 1.0955810546875, 1.15753173828125, 1.219482421875, 1.28143310546875, 1.3433837890625, 1.40533447265625, 1.46728515625, 1.52923583984375, 1.5911865234375, 1.65313720703125, 1.715087890625, 1.77703857421875, 1.8389892578125, 1.90093994140625, 1.962890625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 9.0, 8.0, 12.0, 15.0, 19.0, 32.0, 28.0, 26.0, 33.0, 31.0, 26.0, 38.0, 44.0, 48.0, 46.0, 52.0, 42.0, 61.0, 46.0, 45.0, 52.0, 35.0, 36.0, 31.0, 29.0, 29.0, 26.0, 27.0, 9.0, 20.0, 16.0, 7.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.49630355834961, -18.811979293823242, -18.127655029296875, -17.443328857421875, -16.759004592895508, -16.07468032836914, -15.390355110168457, -14.706029891967773, -14.021705627441406, -13.337381362915039, -12.653056144714355, -11.968730926513672, -11.284406661987305, -10.600082397460938, -9.915757179260254, -9.23143196105957, -8.547107696533203, -7.862782955169678, -7.178458213806152, -6.494133472442627, -5.809808731079102, -5.125483989715576, -4.441159248352051, -3.7568345069885254, -3.072509765625, -2.3881850242614746, -1.7038602828979492, -1.0195355415344238, -0.33521080017089844, 0.34911394119262695, 1.0334386825561523, 1.7177634239196777, 2.402090072631836, 3.0864148139953613, 3.7707395553588867, 4.455064296722412, 5.1393890380859375, 5.823713779449463, 6.508038520812988, 7.192363262176514, 7.876688003540039, 8.561012268066406, 9.24533748626709, 9.929662704467773, 10.61398696899414, 11.298311233520508, 11.982636451721191, 12.666961669921875, 13.351285934448242, 14.03561019897461, 14.719935417175293, 15.404260635375977, 16.088584899902344, 16.77290916442871, 17.457233428955078, 18.141559600830078, 18.825883865356445, 19.510208129882812, 20.194534301757812, 20.87885856628418, 21.563182830810547, 22.247507095336914, 22.93183135986328, 23.61615753173828, 24.30048179626465]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 2.0, 6.0, 7.0, 12.0, 11.0, 7.0, 19.0, 17.0, 15.0, 22.0, 20.0, 19.0, 30.0, 25.0, 36.0, 39.0, 41.0, 38.0, 40.0, 39.0, 43.0, 42.0, 45.0, 36.0, 45.0, 33.0, 33.0, 36.0, 26.0, 38.0, 17.0, 23.0, 25.0, 20.0, 14.0, 18.0, 17.0, 14.0, 7.0, 8.0, 6.0, 6.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.404924392700195, -18.76725959777832, -18.129594802856445, -17.491928100585938, -16.854263305664062, -16.216598510742188, -15.578933715820312, -14.941268920898438, -14.303603172302246, -13.665938377380371, -13.02827262878418, -12.390607833862305, -11.75294303894043, -11.115277290344238, -10.477612495422363, -9.839946746826172, -9.202281951904297, -8.564617156982422, -7.9269514083862305, -7.2892866134643555, -6.651621341705322, -6.013956069946289, -5.376291275024414, -4.738626003265381, -4.100960731506348, -3.4632954597473145, -2.8256304264068604, -2.1879653930664062, -1.550300121307373, -0.9126348495483398, -0.27496981620788574, 0.36269521713256836, 1.0003585815429688, 1.6380237340927124, 2.275688886642456, 2.91335391998291, 3.5510191917419434, 4.188684463500977, 4.826349258422852, 5.464014530181885, 6.101679801940918, 6.739345073699951, 7.377010345458984, 8.01467514038086, 8.652339935302734, 9.290005683898926, 9.9276704788208, 10.565336227416992, 11.203001022338867, 11.840665817260742, 12.478331565856934, 13.115996360778809, 13.753662109375, 14.391326904296875, 15.02899169921875, 15.666656494140625, 16.3043212890625, 16.941986083984375, 17.57965087890625, 18.217317581176758, 18.854982376098633, 19.492647171020508, 20.130311965942383, 20.767976760864258, 21.405643463134766]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 6.0, 13.0, 9.0, 22.0, 29.0, 48.0, 49.0, 102.0, 143.0, 242.0, 375.0, 580.0, 934.0, 1360.0, 2137.0, 3470.0, 5717.0, 9620.0, 16175.0, 27708.0, 48613.0, 84915.0, 149224.0, 254459.0, 402727.0, 563536.0, 663521.0, 633712.0, 498406.0, 337504.0, 206370.0, 118650.0, 68271.0, 39046.0, 22877.0, 13205.0, 7970.0, 4795.0, 2943.0, 1714.0, 1068.0, 719.0, 450.0, 302.0, 196.0, 112.0, 84.0, 56.0, 39.0, 27.0, 8.0, 8.0, 11.0, 5.0, 4.0, 4.0], "bins": [-17.5, -16.9970703125, -16.494140625, -15.9912109375, -15.48828125, -14.9853515625, -14.482421875, -13.9794921875, -13.4765625, -12.9736328125, -12.470703125, -11.9677734375, -11.46484375, -10.9619140625, -10.458984375, -9.9560546875, -9.453125, -8.9501953125, -8.447265625, -7.9443359375, -7.44140625, -6.9384765625, -6.435546875, -5.9326171875, -5.4296875, -4.9267578125, -4.423828125, -3.9208984375, -3.41796875, -2.9150390625, -2.412109375, -1.9091796875, -1.40625, -0.9033203125, -0.400390625, 0.1025390625, 0.60546875, 1.1083984375, 1.611328125, 2.1142578125, 2.6171875, 3.1201171875, 3.623046875, 4.1259765625, 4.62890625, 5.1318359375, 5.634765625, 6.1376953125, 6.640625, 7.1435546875, 7.646484375, 8.1494140625, 8.65234375, 9.1552734375, 9.658203125, 10.1611328125, 10.6640625, 11.1669921875, 11.669921875, 12.1728515625, 12.67578125, 13.1787109375, 13.681640625, 14.1845703125, 14.6875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 6.0, 14.0, 6.0, 9.0, 6.0, 13.0, 16.0, 19.0, 22.0, 19.0, 31.0, 22.0, 35.0, 25.0, 23.0, 34.0, 54.0, 43.0, 52.0, 38.0, 37.0, 40.0, 46.0, 40.0, 33.0, 33.0, 33.0, 35.0, 24.0, 32.0, 20.0, 15.0, 16.0, 24.0, 24.0, 12.0, 7.0, 8.0, 11.0, 8.0, 2.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.125, -15.568603515625, -15.01220703125, -14.455810546875, -13.8994140625, -13.343017578125, -12.78662109375, -12.230224609375, -11.673828125, -11.117431640625, -10.56103515625, -10.004638671875, -9.4482421875, -8.891845703125, -8.33544921875, -7.779052734375, -7.22265625, -6.666259765625, -6.10986328125, -5.553466796875, -4.9970703125, -4.440673828125, -3.88427734375, -3.327880859375, -2.771484375, -2.215087890625, -1.65869140625, -1.102294921875, -0.5458984375, 0.010498046875, 0.56689453125, 1.123291015625, 1.6796875, 2.236083984375, 2.79248046875, 3.348876953125, 3.9052734375, 4.461669921875, 5.01806640625, 5.574462890625, 6.130859375, 6.687255859375, 7.24365234375, 7.800048828125, 8.3564453125, 8.912841796875, 9.46923828125, 10.025634765625, 10.58203125, 11.138427734375, 11.69482421875, 12.251220703125, 12.8076171875, 13.364013671875, 13.92041015625, 14.476806640625, 15.033203125, 15.589599609375, 16.14599609375, 16.702392578125, 17.2587890625, 17.815185546875, 18.37158203125, 18.927978515625, 19.484375]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 11.0, 3.0, 12.0, 17.0, 27.0, 49.0, 75.0, 130.0, 265.0, 378.0, 640.0, 1080.0, 1761.0, 3057.0, 5127.0, 8402.0, 14273.0, 24067.0, 40580.0, 68832.0, 115492.0, 190819.0, 301629.0, 440631.0, 569435.0, 625889.0, 568999.0, 438436.0, 300954.0, 190374.0, 115369.0, 68146.0, 40408.0, 23816.0, 14209.0, 8294.0, 4974.0, 2988.0, 1868.0, 1088.0, 659.0, 390.0, 269.0, 155.0, 93.0, 44.0, 41.0, 14.0, 12.0, 4.0, 1.0, 5.0, 3.0, 1.0], "bins": [-20.3125, -19.740234375, -19.16796875, -18.595703125, -18.0234375, -17.451171875, -16.87890625, -16.306640625, -15.734375, -15.162109375, -14.58984375, -14.017578125, -13.4453125, -12.873046875, -12.30078125, -11.728515625, -11.15625, -10.583984375, -10.01171875, -9.439453125, -8.8671875, -8.294921875, -7.72265625, -7.150390625, -6.578125, -6.005859375, -5.43359375, -4.861328125, -4.2890625, -3.716796875, -3.14453125, -2.572265625, -2.0, -1.427734375, -0.85546875, -0.283203125, 0.2890625, 0.861328125, 1.43359375, 2.005859375, 2.578125, 3.150390625, 3.72265625, 4.294921875, 4.8671875, 5.439453125, 6.01171875, 6.583984375, 7.15625, 7.728515625, 8.30078125, 8.873046875, 9.4453125, 10.017578125, 10.58984375, 11.162109375, 11.734375, 12.306640625, 12.87890625, 13.451171875, 14.0234375, 14.595703125, 15.16796875, 15.740234375, 16.3125]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 7.0, 12.0, 11.0, 10.0, 8.0, 19.0, 16.0, 31.0, 37.0, 41.0, 37.0, 37.0, 71.0, 87.0, 120.0, 115.0, 104.0, 134.0, 167.0, 165.0, 189.0, 190.0, 170.0, 201.0, 201.0, 200.0, 196.0, 204.0, 193.0, 166.0, 142.0, 118.0, 110.0, 108.0, 71.0, 62.0, 64.0, 49.0, 45.0, 29.0, 40.0, 26.0, 11.0, 17.0, 9.0, 9.0, 11.0, 7.0, 3.0, 3.0, 5.0, 2.0, 3.0], "bins": [-7.46875, -7.25555419921875, -7.0423583984375, -6.82916259765625, -6.615966796875, -6.40277099609375, -6.1895751953125, -5.97637939453125, -5.76318359375, -5.54998779296875, -5.3367919921875, -5.12359619140625, -4.910400390625, -4.69720458984375, -4.4840087890625, -4.27081298828125, -4.0576171875, -3.84442138671875, -3.6312255859375, -3.41802978515625, -3.204833984375, -2.99163818359375, -2.7784423828125, -2.56524658203125, -2.35205078125, -2.13885498046875, -1.9256591796875, -1.71246337890625, -1.499267578125, -1.28607177734375, -1.0728759765625, -0.85968017578125, -0.646484375, -0.43328857421875, -0.2200927734375, -0.00689697265625, 0.206298828125, 0.41949462890625, 0.6326904296875, 0.84588623046875, 1.05908203125, 1.27227783203125, 1.4854736328125, 1.69866943359375, 1.911865234375, 2.12506103515625, 2.3382568359375, 2.55145263671875, 2.7646484375, 2.97784423828125, 3.1910400390625, 3.40423583984375, 3.617431640625, 3.83062744140625, 4.0438232421875, 4.25701904296875, 4.47021484375, 4.68341064453125, 4.8966064453125, 5.10980224609375, 5.322998046875, 5.53619384765625, 5.7493896484375, 5.96258544921875, 6.17578125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 10.0, 10.0, 9.0, 16.0, 18.0, 17.0, 18.0, 22.0, 31.0, 43.0, 28.0, 39.0, 34.0, 44.0, 55.0, 64.0, 52.0, 41.0, 50.0, 49.0, 50.0, 46.0, 37.0, 32.0, 28.0, 33.0, 24.0, 20.0, 16.0, 11.0, 14.0, 9.0, 4.0, 7.0, 4.0, 8.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-23.23534393310547, -22.53009033203125, -21.82483673095703, -21.119583129882812, -20.41432762145996, -19.709074020385742, -19.003820419311523, -18.298566818237305, -17.593311309814453, -16.888057708740234, -16.182804107666016, -15.47754955291748, -14.772294998168945, -14.067041397094727, -13.361787796020508, -12.656534194946289, -11.95128059387207, -11.246026992797852, -10.540772438049316, -9.835518836975098, -9.130264282226562, -8.425010681152344, -7.719757080078125, -7.014503002166748, -6.309248924255371, -5.603994846343994, -4.898740768432617, -4.193487167358398, -3.4882330894470215, -2.7829790115356445, -2.077725410461426, -1.3724713325500488, -0.6672191619873047, 0.038034796714782715, 0.7432887554168701, 1.448542594909668, 2.153796672821045, 2.859050750732422, 3.5643043518066406, 4.269558429718018, 4.9748125076293945, 5.6800665855407715, 6.385320663452148, 7.090574264526367, 7.795828342437744, 8.501082420349121, 9.20633602142334, 9.911590576171875, 10.616844177246094, 11.322097778320312, 12.027352333068848, 12.732605934143066, 13.437860488891602, 14.14311408996582, 14.848367691040039, 15.553621292114258, 16.25887680053711, 16.964130401611328, 17.669384002685547, 18.374637603759766, 19.079893112182617, 19.785146713256836, 20.490400314331055, 21.195653915405273, 21.900907516479492]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 6.0, 5.0, 9.0, 9.0, 6.0, 7.0, 9.0, 10.0, 15.0, 15.0, 17.0, 21.0, 29.0, 26.0, 28.0, 37.0, 29.0, 46.0, 42.0, 34.0, 47.0, 42.0, 36.0, 36.0, 41.0, 36.0, 41.0, 34.0, 35.0, 40.0, 33.0, 29.0, 14.0, 23.0, 12.0, 16.0, 19.0, 10.0, 16.0, 17.0, 8.0, 5.0, 2.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.522321701049805, -16.929426193237305, -16.336528778076172, -15.743633270263672, -15.150737762451172, -14.557841300964355, -13.964944839477539, -13.372049331665039, -12.779152870178223, -12.186256408691406, -11.593360900878906, -11.00046443939209, -10.407567977905273, -9.814672470092773, -9.221776008605957, -8.62887954711914, -8.03598403930664, -7.443088054656982, -6.850192070007324, -6.257295608520508, -5.66439962387085, -5.071503639221191, -4.478607177734375, -3.885711193084717, -3.2928152084350586, -2.6999192237854004, -2.107023000717163, -1.5141268968582153, -0.9212307929992676, -0.3283348083496094, 0.26456141471862793, 0.8574576377868652, 1.4503555297851562, 2.0432515144348145, 2.6361477375030518, 3.229043960571289, 3.8219399452209473, 4.4148359298706055, 5.007732391357422, 5.60062837600708, 6.193524360656738, 6.7864203453063965, 7.379316329956055, 7.972212791442871, 8.565109252929688, 9.158004760742188, 9.750901222229004, 10.34379768371582, 10.93669319152832, 11.529589653015137, 12.122485160827637, 12.715381622314453, 13.308277130126953, 13.90117359161377, 14.494070053100586, 15.086965560913086, 15.679862022399902, 16.27275848388672, 16.86565399169922, 17.45854949951172, 18.05144691467285, 18.64434242248535, 19.23723793029785, 19.830135345458984, 20.423030853271484]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 8.0, 9.0, 12.0, 22.0, 28.0, 54.0, 79.0, 133.0, 246.0, 484.0, 756.0, 1511.0, 2634.0, 4838.0, 8799.0, 15653.0, 27235.0, 45227.0, 72365.0, 104643.0, 134951.0, 150277.0, 143370.0, 117483.0, 84722.0, 55192.0, 33924.0, 19122.0, 11073.0, 6163.0, 3333.0, 1818.0, 1048.0, 565.0, 330.0, 174.0, 111.0, 74.0, 32.0, 23.0, 18.0, 9.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.328125, -11.939208984375, -11.55029296875, -11.161376953125, -10.7724609375, -10.383544921875, -9.99462890625, -9.605712890625, -9.216796875, -8.827880859375, -8.43896484375, -8.050048828125, -7.6611328125, -7.272216796875, -6.88330078125, -6.494384765625, -6.10546875, -5.716552734375, -5.32763671875, -4.938720703125, -4.5498046875, -4.160888671875, -3.77197265625, -3.383056640625, -2.994140625, -2.605224609375, -2.21630859375, -1.827392578125, -1.4384765625, -1.049560546875, -0.66064453125, -0.271728515625, 0.1171875, 0.506103515625, 0.89501953125, 1.283935546875, 1.6728515625, 2.061767578125, 2.45068359375, 2.839599609375, 3.228515625, 3.617431640625, 4.00634765625, 4.395263671875, 4.7841796875, 5.173095703125, 5.56201171875, 5.950927734375, 6.33984375, 6.728759765625, 7.11767578125, 7.506591796875, 7.8955078125, 8.284423828125, 8.67333984375, 9.062255859375, 9.451171875, 9.840087890625, 10.22900390625, 10.617919921875, 11.0068359375, 11.395751953125, 11.78466796875, 12.173583984375, 12.5625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 4.0, 1.0, 5.0, 5.0, 6.0, 6.0, 7.0, 4.0, 12.0, 10.0, 15.0, 9.0, 17.0, 22.0, 25.0, 25.0, 30.0, 23.0, 35.0, 42.0, 45.0, 33.0, 40.0, 37.0, 43.0, 40.0, 45.0, 47.0, 31.0, 27.0, 38.0, 33.0, 34.0, 30.0, 27.0, 28.0, 18.0, 15.0, 11.0, 14.0, 14.0, 13.0, 12.0, 10.0, 6.0, 5.0, 7.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.046875, -16.439697265625, -15.83251953125, -15.225341796875, -14.6181640625, -14.010986328125, -13.40380859375, -12.796630859375, -12.189453125, -11.582275390625, -10.97509765625, -10.367919921875, -9.7607421875, -9.153564453125, -8.54638671875, -7.939208984375, -7.33203125, -6.724853515625, -6.11767578125, -5.510498046875, -4.9033203125, -4.296142578125, -3.68896484375, -3.081787109375, -2.474609375, -1.867431640625, -1.26025390625, -0.653076171875, -0.0458984375, 0.561279296875, 1.16845703125, 1.775634765625, 2.3828125, 2.989990234375, 3.59716796875, 4.204345703125, 4.8115234375, 5.418701171875, 6.02587890625, 6.633056640625, 7.240234375, 7.847412109375, 8.45458984375, 9.061767578125, 9.6689453125, 10.276123046875, 10.88330078125, 11.490478515625, 12.09765625, 12.704833984375, 13.31201171875, 13.919189453125, 14.5263671875, 15.133544921875, 15.74072265625, 16.347900390625, 16.955078125, 17.562255859375, 18.16943359375, 18.776611328125, 19.3837890625, 19.990966796875, 20.59814453125, 21.205322265625, 21.8125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 8.0, 16.0, 28.0, 37.0, 52.0, 81.0, 135.0, 188.0, 282.0, 466.0, 646.0, 1130.0, 1863.0, 2970.0, 5122.0, 8502.0, 14723.0, 25482.0, 42466.0, 69447.0, 107016.0, 146469.0, 166748.0, 151508.0, 114133.0, 75065.0, 47028.0, 27489.0, 16180.0, 9380.0, 5563.0, 3181.0, 2027.0, 1132.0, 690.0, 456.0, 276.0, 190.0, 120.0, 76.0, 54.0, 42.0, 29.0, 17.0, 12.0, 17.0, 6.0, 2.0, 0.0, 5.0, 1.0, 2.0, 3.0], "bins": [-16.5, -16.0086669921875, -15.517333984375, -15.0260009765625, -14.53466796875, -14.0433349609375, -13.552001953125, -13.0606689453125, -12.5693359375, -12.0780029296875, -11.586669921875, -11.0953369140625, -10.60400390625, -10.1126708984375, -9.621337890625, -9.1300048828125, -8.638671875, -8.1473388671875, -7.656005859375, -7.1646728515625, -6.67333984375, -6.1820068359375, -5.690673828125, -5.1993408203125, -4.7080078125, -4.2166748046875, -3.725341796875, -3.2340087890625, -2.74267578125, -2.2513427734375, -1.760009765625, -1.2686767578125, -0.77734375, -0.2860107421875, 0.205322265625, 0.6966552734375, 1.18798828125, 1.6793212890625, 2.170654296875, 2.6619873046875, 3.1533203125, 3.6446533203125, 4.135986328125, 4.6273193359375, 5.11865234375, 5.6099853515625, 6.101318359375, 6.5926513671875, 7.083984375, 7.5753173828125, 8.066650390625, 8.5579833984375, 9.04931640625, 9.5406494140625, 10.031982421875, 10.5233154296875, 11.0146484375, 11.5059814453125, 11.997314453125, 12.4886474609375, 12.97998046875, 13.4713134765625, 13.962646484375, 14.4539794921875, 14.9453125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 6.0, 7.0, 6.0, 6.0, 5.0, 4.0, 11.0, 13.0, 14.0, 16.0, 24.0, 18.0, 17.0, 30.0, 35.0, 28.0, 35.0, 31.0, 38.0, 28.0, 48.0, 44.0, 45.0, 31.0, 38.0, 37.0, 45.0, 41.0, 38.0, 34.0, 31.0, 29.0, 26.0, 21.0, 24.0, 19.0, 14.0, 12.0, 4.0, 14.0, 6.0, 8.0, 9.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 4.0], "bins": [-14.0546875, -13.669921875, -13.28515625, -12.900390625, -12.515625, -12.130859375, -11.74609375, -11.361328125, -10.9765625, -10.591796875, -10.20703125, -9.822265625, -9.4375, -9.052734375, -8.66796875, -8.283203125, -7.8984375, -7.513671875, -7.12890625, -6.744140625, -6.359375, -5.974609375, -5.58984375, -5.205078125, -4.8203125, -4.435546875, -4.05078125, -3.666015625, -3.28125, -2.896484375, -2.51171875, -2.126953125, -1.7421875, -1.357421875, -0.97265625, -0.587890625, -0.203125, 0.181640625, 0.56640625, 0.951171875, 1.3359375, 1.720703125, 2.10546875, 2.490234375, 2.875, 3.259765625, 3.64453125, 4.029296875, 4.4140625, 4.798828125, 5.18359375, 5.568359375, 5.953125, 6.337890625, 6.72265625, 7.107421875, 7.4921875, 7.876953125, 8.26171875, 8.646484375, 9.03125, 9.416015625, 9.80078125, 10.185546875, 10.5703125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 7.0, 9.0, 21.0, 35.0, 42.0, 55.0, 94.0, 153.0, 264.0, 434.0, 709.0, 1224.0, 2132.0, 3802.0, 7023.0, 12474.0, 23085.0, 41969.0, 76966.0, 130251.0, 184257.0, 197246.0, 152361.0, 95382.0, 53789.0, 29130.0, 15839.0, 8549.0, 4789.0, 2686.0, 1552.0, 868.0, 554.0, 309.0, 173.0, 108.0, 70.0, 54.0, 36.0, 19.0, 15.0, 5.0, 8.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.5, -8.2359619140625, -7.971923828125, -7.7078857421875, -7.44384765625, -7.1798095703125, -6.915771484375, -6.6517333984375, -6.3876953125, -6.1236572265625, -5.859619140625, -5.5955810546875, -5.33154296875, -5.0675048828125, -4.803466796875, -4.5394287109375, -4.275390625, -4.0113525390625, -3.747314453125, -3.4832763671875, -3.21923828125, -2.9552001953125, -2.691162109375, -2.4271240234375, -2.1630859375, -1.8990478515625, -1.635009765625, -1.3709716796875, -1.10693359375, -0.8428955078125, -0.578857421875, -0.3148193359375, -0.05078125, 0.2132568359375, 0.477294921875, 0.7413330078125, 1.00537109375, 1.2694091796875, 1.533447265625, 1.7974853515625, 2.0615234375, 2.3255615234375, 2.589599609375, 2.8536376953125, 3.11767578125, 3.3817138671875, 3.645751953125, 3.9097900390625, 4.173828125, 4.4378662109375, 4.701904296875, 4.9659423828125, 5.22998046875, 5.4940185546875, 5.758056640625, 6.0220947265625, 6.2861328125, 6.5501708984375, 6.814208984375, 7.0782470703125, 7.34228515625, 7.6063232421875, 7.870361328125, 8.1343994140625, 8.3984375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 2.0, 6.0, 11.0, 11.0, 21.0, 22.0, 23.0, 31.0, 34.0, 25.0, 46.0, 48.0, 44.0, 52.0, 47.0, 66.0, 50.0, 58.0, 60.0, 55.0, 52.0, 58.0, 27.0, 28.0, 19.0, 17.0, 20.0, 9.0, 6.0, 13.0, 4.0, 6.0, 6.0, 5.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.0005269050598144531, -0.0005116760730743408, -0.0004964470863342285, -0.0004812180995941162, -0.0004659891128540039, -0.0004507601261138916, -0.0004355311393737793, -0.000420302152633667, -0.0004050731658935547, -0.0003898441791534424, -0.0003746151924133301, -0.0003593862056732178, -0.00034415721893310547, -0.00032892823219299316, -0.00031369924545288086, -0.00029847025871276855, -0.00028324127197265625, -0.00026801228523254395, -0.00025278329849243164, -0.00023755431175231934, -0.00022232532501220703, -0.00020709633827209473, -0.00019186735153198242, -0.00017663836479187012, -0.0001614093780517578, -0.0001461803913116455, -0.0001309514045715332, -0.0001157224178314209, -0.0001004934310913086, -8.526444435119629e-05, -7.003545761108398e-05, -5.480647087097168e-05, -3.9577484130859375e-05, -2.434849739074707e-05, -9.119510650634766e-06, 6.109476089477539e-06, 2.1338462829589844e-05, 3.656744956970215e-05, 5.179643630981445e-05, 6.702542304992676e-05, 8.225440979003906e-05, 9.748339653015137e-05, 0.00011271238327026367, 0.00012794137001037598, 0.00014317035675048828, 0.00015839934349060059, 0.0001736283302307129, 0.0001888573169708252, 0.0002040863037109375, 0.0002193152904510498, 0.0002345442771911621, 0.0002497732639312744, 0.0002650022506713867, 0.000280231237411499, 0.00029546022415161133, 0.00031068921089172363, 0.00032591819763183594, 0.00034114718437194824, 0.00035637617111206055, 0.00037160515785217285, 0.00038683414459228516, 0.00040206313133239746, 0.00041729211807250977, 0.00043252110481262207, 0.0004477500915527344]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 5.0, 8.0, 6.0, 19.0, 25.0, 43.0, 46.0, 84.0, 138.0, 201.0, 321.0, 517.0, 811.0, 1308.0, 2116.0, 3136.0, 5075.0, 8131.0, 13041.0, 20542.0, 32404.0, 49078.0, 71487.0, 96968.0, 120694.0, 133987.0, 128883.0, 109048.0, 82948.0, 58821.0, 39576.0, 25590.0, 16153.0, 10246.0, 6288.0, 4038.0, 2538.0, 1500.0, 987.0, 643.0, 393.0, 258.0, 146.0, 113.0, 76.0, 37.0, 23.0, 17.0, 10.0, 11.0, 7.0, 8.0, 4.0, 2.0, 3.0, 0.0, 1.0], "bins": [-7.58203125, -7.35040283203125, -7.1187744140625, -6.88714599609375, -6.655517578125, -6.42388916015625, -6.1922607421875, -5.96063232421875, -5.72900390625, -5.49737548828125, -5.2657470703125, -5.03411865234375, -4.802490234375, -4.57086181640625, -4.3392333984375, -4.10760498046875, -3.8759765625, -3.64434814453125, -3.4127197265625, -3.18109130859375, -2.949462890625, -2.71783447265625, -2.4862060546875, -2.25457763671875, -2.02294921875, -1.79132080078125, -1.5596923828125, -1.32806396484375, -1.096435546875, -0.86480712890625, -0.6331787109375, -0.40155029296875, -0.169921875, 0.06170654296875, 0.2933349609375, 0.52496337890625, 0.756591796875, 0.98822021484375, 1.2198486328125, 1.45147705078125, 1.68310546875, 1.91473388671875, 2.1463623046875, 2.37799072265625, 2.609619140625, 2.84124755859375, 3.0728759765625, 3.30450439453125, 3.5361328125, 3.76776123046875, 3.9993896484375, 4.23101806640625, 4.462646484375, 4.69427490234375, 4.9259033203125, 5.15753173828125, 5.38916015625, 5.62078857421875, 5.8524169921875, 6.08404541015625, 6.315673828125, 6.54730224609375, 6.7789306640625, 7.01055908203125, 7.2421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 10.0, 12.0, 5.0, 13.0, 10.0, 10.0, 18.0, 33.0, 21.0, 34.0, 34.0, 47.0, 40.0, 43.0, 61.0, 55.0, 52.0, 60.0, 55.0, 54.0, 44.0, 38.0, 41.0, 34.0, 45.0, 29.0, 17.0, 27.0, 11.0, 9.0, 8.0, 4.0, 8.0, 0.0, 5.0, 1.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.255859375, -3.15716552734375, -3.0584716796875, -2.95977783203125, -2.861083984375, -2.76239013671875, -2.6636962890625, -2.56500244140625, -2.46630859375, -2.36761474609375, -2.2689208984375, -2.17022705078125, -2.071533203125, -1.97283935546875, -1.8741455078125, -1.77545166015625, -1.6767578125, -1.57806396484375, -1.4793701171875, -1.38067626953125, -1.281982421875, -1.18328857421875, -1.0845947265625, -0.98590087890625, -0.88720703125, -0.78851318359375, -0.6898193359375, -0.59112548828125, -0.492431640625, -0.39373779296875, -0.2950439453125, -0.19635009765625, -0.09765625, 0.00103759765625, 0.0997314453125, 0.19842529296875, 0.297119140625, 0.39581298828125, 0.4945068359375, 0.59320068359375, 0.69189453125, 0.79058837890625, 0.8892822265625, 0.98797607421875, 1.086669921875, 1.18536376953125, 1.2840576171875, 1.38275146484375, 1.4814453125, 1.58013916015625, 1.6788330078125, 1.77752685546875, 1.876220703125, 1.97491455078125, 2.0736083984375, 2.17230224609375, 2.27099609375, 2.36968994140625, 2.4683837890625, 2.56707763671875, 2.665771484375, 2.76446533203125, 2.8631591796875, 2.96185302734375, 3.060546875]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 9.0, 5.0, 11.0, 15.0, 20.0, 10.0, 17.0, 21.0, 23.0, 23.0, 24.0, 39.0, 40.0, 41.0, 35.0, 51.0, 67.0, 42.0, 45.0, 44.0, 54.0, 44.0, 46.0, 43.0, 33.0, 32.0, 22.0, 18.0, 21.0, 22.0, 15.0, 20.0, 12.0, 9.0, 9.0, 1.0, 7.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-21.479982376098633, -20.81294059753418, -20.145898818969727, -19.478857040405273, -18.811817169189453, -18.144775390625, -17.477733612060547, -16.810691833496094, -16.14365005493164, -15.476608276367188, -14.809566497802734, -14.142525672912598, -13.475483894348145, -12.808442115783691, -12.141401290893555, -11.474359512329102, -10.807317733764648, -10.140275955200195, -9.473234176635742, -8.806193351745605, -8.139151573181152, -7.472109794616699, -6.805068492889404, -6.138027191162109, -5.470985412597656, -4.803943634033203, -4.136902332305908, -3.469860792160034, -2.80281925201416, -2.135777711868286, -1.468736171722412, -0.8016948699951172, -0.13465309143066406, 0.53238844871521, 1.199429988861084, 1.866471529006958, 2.533513069152832, 3.200554609298706, 3.86759614944458, 4.534637451171875, 5.201679229736328, 5.868721008300781, 6.535762310028076, 7.202803611755371, 7.869845390319824, 8.536887168884277, 9.203927993774414, 9.870969772338867, 10.53801155090332, 11.205053329467773, 11.872095108032227, 12.539135932922363, 13.206177711486816, 13.87321949005127, 14.540260314941406, 15.20730209350586, 15.874343872070312, 16.541385650634766, 17.20842742919922, 17.875469207763672, 18.542510986328125, 19.209550857543945, 19.8765926361084, 20.54363441467285, 21.210676193237305]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 6.0, 3.0, 5.0, 4.0, 6.0, 10.0, 9.0, 4.0, 8.0, 10.0, 18.0, 17.0, 22.0, 18.0, 25.0, 30.0, 32.0, 34.0, 38.0, 43.0, 41.0, 39.0, 44.0, 40.0, 43.0, 39.0, 38.0, 38.0, 40.0, 44.0, 28.0, 45.0, 21.0, 21.0, 18.0, 20.0, 15.0, 19.0, 14.0, 15.0, 14.0, 10.0, 7.0, 2.0, 4.0, 4.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.20357894897461, -16.610828399658203, -16.018075942993164, -15.425325393676758, -14.832573890686035, -14.239822387695312, -13.647071838378906, -13.054320335388184, -12.461568832397461, -11.868817329406738, -11.276065826416016, -10.68331527709961, -10.090563774108887, -9.497812271118164, -8.905061721801758, -8.312310218811035, -7.7195587158203125, -7.12680721282959, -6.534056186676025, -5.941305160522461, -5.348553657531738, -4.755802154541016, -4.163051128387451, -3.5703001022338867, -2.977548599243164, -2.3847973346710205, -1.792046070098877, -1.1992948055267334, -0.6065435409545898, -0.013792276382446289, 0.5789589881896973, 1.1717100143432617, 1.7644615173339844, 2.357212781906128, 2.9499640464782715, 3.542715311050415, 4.135466575622559, 4.728218078613281, 5.320969104766846, 5.91372013092041, 6.506471633911133, 7.0992231369018555, 7.69197416305542, 8.284725189208984, 8.877476692199707, 9.47022819519043, 10.062978744506836, 10.655730247497559, 11.248481750488281, 11.841233253479004, 12.433984756469727, 13.026735305786133, 13.619486808776855, 14.212238311767578, 14.804988861083984, 15.397740364074707, 15.99049186706543, 16.583242416381836, 17.175994873046875, 17.76874542236328, 18.361495971679688, 18.954248428344727, 19.546998977661133, 20.139751434326172, 20.732501983642578]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 2.0, 10.0, 12.0, 19.0, 37.0, 55.0, 79.0, 114.0, 176.0, 282.0, 421.0, 670.0, 992.0, 1490.0, 2371.0, 3664.0, 5334.0, 7989.0, 11682.0, 17289.0, 24537.0, 34229.0, 45124.0, 58536.0, 72549.0, 85496.0, 94294.0, 98321.0, 95686.0, 86905.0, 74661.0, 60824.0, 47711.0, 35163.0, 25898.0, 17977.0, 12590.0, 8636.0, 5715.0, 3741.0, 2553.0, 1605.0, 1089.0, 745.0, 461.0, 292.0, 182.0, 128.0, 80.0, 49.0, 36.0, 17.0, 19.0, 11.0, 7.0, 1.0, 4.0, 1.0], "bins": [-10.984375, -10.6572265625, -10.330078125, -10.0029296875, -9.67578125, -9.3486328125, -9.021484375, -8.6943359375, -8.3671875, -8.0400390625, -7.712890625, -7.3857421875, -7.05859375, -6.7314453125, -6.404296875, -6.0771484375, -5.75, -5.4228515625, -5.095703125, -4.7685546875, -4.44140625, -4.1142578125, -3.787109375, -3.4599609375, -3.1328125, -2.8056640625, -2.478515625, -2.1513671875, -1.82421875, -1.4970703125, -1.169921875, -0.8427734375, -0.515625, -0.1884765625, 0.138671875, 0.4658203125, 0.79296875, 1.1201171875, 1.447265625, 1.7744140625, 2.1015625, 2.4287109375, 2.755859375, 3.0830078125, 3.41015625, 3.7373046875, 4.064453125, 4.3916015625, 4.71875, 5.0458984375, 5.373046875, 5.7001953125, 6.02734375, 6.3544921875, 6.681640625, 7.0087890625, 7.3359375, 7.6630859375, 7.990234375, 8.3173828125, 8.64453125, 8.9716796875, 9.298828125, 9.6259765625, 9.953125]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 6.0, 7.0, 4.0, 3.0, 8.0, 10.0, 8.0, 15.0, 16.0, 20.0, 24.0, 20.0, 29.0, 25.0, 31.0, 30.0, 34.0, 40.0, 50.0, 38.0, 45.0, 35.0, 47.0, 49.0, 26.0, 42.0, 44.0, 38.0, 39.0, 29.0, 22.0, 33.0, 22.0, 17.0, 13.0, 15.0, 16.0, 15.0, 10.0, 9.0, 6.0, 6.0, 6.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.75, -18.128173828125, -17.50634765625, -16.884521484375, -16.2626953125, -15.640869140625, -15.01904296875, -14.397216796875, -13.775390625, -13.153564453125, -12.53173828125, -11.909912109375, -11.2880859375, -10.666259765625, -10.04443359375, -9.422607421875, -8.80078125, -8.178955078125, -7.55712890625, -6.935302734375, -6.3134765625, -5.691650390625, -5.06982421875, -4.447998046875, -3.826171875, -3.204345703125, -2.58251953125, -1.960693359375, -1.3388671875, -0.717041015625, -0.09521484375, 0.526611328125, 1.1484375, 1.770263671875, 2.39208984375, 3.013916015625, 3.6357421875, 4.257568359375, 4.87939453125, 5.501220703125, 6.123046875, 6.744873046875, 7.36669921875, 7.988525390625, 8.6103515625, 9.232177734375, 9.85400390625, 10.475830078125, 11.09765625, 11.719482421875, 12.34130859375, 12.963134765625, 13.5849609375, 14.206787109375, 14.82861328125, 15.450439453125, 16.072265625, 16.694091796875, 17.31591796875, 17.937744140625, 18.5595703125, 19.181396484375, 19.80322265625, 20.425048828125, 21.046875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 7.0, 3.0, 5.0, 8.0, 17.0, 17.0, 43.0, 66.0, 74.0, 141.0, 209.0, 318.0, 511.0, 754.0, 1216.0, 1834.0, 2858.0, 4329.0, 6487.0, 9818.0, 14903.0, 21790.0, 31500.0, 44212.0, 59248.0, 75600.0, 90758.0, 101903.0, 106474.0, 102277.0, 91495.0, 76564.0, 59497.0, 44600.0, 32361.0, 22398.0, 15033.0, 10144.0, 6611.0, 4302.0, 2818.0, 1823.0, 1187.0, 820.0, 563.0, 327.0, 208.0, 172.0, 87.0, 51.0, 46.0, 33.0, 19.0, 12.0, 3.0, 7.0, 4.0, 3.0, 2.0, 1.0], "bins": [-12.390625, -12.0096435546875, -11.628662109375, -11.2476806640625, -10.86669921875, -10.4857177734375, -10.104736328125, -9.7237548828125, -9.3427734375, -8.9617919921875, -8.580810546875, -8.1998291015625, -7.81884765625, -7.4378662109375, -7.056884765625, -6.6759033203125, -6.294921875, -5.9139404296875, -5.532958984375, -5.1519775390625, -4.77099609375, -4.3900146484375, -4.009033203125, -3.6280517578125, -3.2470703125, -2.8660888671875, -2.485107421875, -2.1041259765625, -1.72314453125, -1.3421630859375, -0.961181640625, -0.5802001953125, -0.19921875, 0.1817626953125, 0.562744140625, 0.9437255859375, 1.32470703125, 1.7056884765625, 2.086669921875, 2.4676513671875, 2.8486328125, 3.2296142578125, 3.610595703125, 3.9915771484375, 4.37255859375, 4.7535400390625, 5.134521484375, 5.5155029296875, 5.896484375, 6.2774658203125, 6.658447265625, 7.0394287109375, 7.42041015625, 7.8013916015625, 8.182373046875, 8.5633544921875, 8.9443359375, 9.3253173828125, 9.706298828125, 10.0872802734375, 10.46826171875, 10.8492431640625, 11.230224609375, 11.6112060546875, 11.9921875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 5.0, 6.0, 6.0, 7.0, 9.0, 10.0, 10.0, 12.0, 8.0, 9.0, 16.0, 20.0, 17.0, 17.0, 21.0, 20.0, 27.0, 28.0, 30.0, 43.0, 36.0, 44.0, 34.0, 33.0, 28.0, 35.0, 30.0, 32.0, 36.0, 44.0, 27.0, 40.0, 31.0, 39.0, 32.0, 15.0, 18.0, 20.0, 11.0, 20.0, 9.0, 14.0, 14.0, 7.0, 4.0, 7.0, 11.0, 4.0, 2.0, 6.0, 0.0, 4.0, 0.0, 1.0, 1.0], "bins": [-11.3046875, -10.97119140625, -10.6376953125, -10.30419921875, -9.970703125, -9.63720703125, -9.3037109375, -8.97021484375, -8.63671875, -8.30322265625, -7.9697265625, -7.63623046875, -7.302734375, -6.96923828125, -6.6357421875, -6.30224609375, -5.96875, -5.63525390625, -5.3017578125, -4.96826171875, -4.634765625, -4.30126953125, -3.9677734375, -3.63427734375, -3.30078125, -2.96728515625, -2.6337890625, -2.30029296875, -1.966796875, -1.63330078125, -1.2998046875, -0.96630859375, -0.6328125, -0.29931640625, 0.0341796875, 0.36767578125, 0.701171875, 1.03466796875, 1.3681640625, 1.70166015625, 2.03515625, 2.36865234375, 2.7021484375, 3.03564453125, 3.369140625, 3.70263671875, 4.0361328125, 4.36962890625, 4.703125, 5.03662109375, 5.3701171875, 5.70361328125, 6.037109375, 6.37060546875, 6.7041015625, 7.03759765625, 7.37109375, 7.70458984375, 8.0380859375, 8.37158203125, 8.705078125, 9.03857421875, 9.3720703125, 9.70556640625, 10.0390625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 9.0, 4.0, 4.0, 5.0, 8.0, 11.0, 28.0, 25.0, 29.0, 39.0, 57.0, 78.0, 129.0, 145.0, 195.0, 324.0, 515.0, 890.0, 1440.0, 2358.0, 4018.0, 6918.0, 11719.0, 20481.0, 34139.0, 54149.0, 80280.0, 109212.0, 133122.0, 142113.0, 131400.0, 106879.0, 77250.0, 51634.0, 32152.0, 19270.0, 11108.0, 6631.0, 3755.0, 2212.0, 1367.0, 807.0, 522.0, 343.0, 237.0, 152.0, 106.0, 85.0, 61.0, 34.0, 30.0, 29.0, 12.0, 16.0, 14.0, 8.0, 5.0, 3.0, 4.0, 2.0, 1.0], "bins": [-5.51953125, -5.34942626953125, -5.1793212890625, -5.00921630859375, -4.839111328125, -4.66900634765625, -4.4989013671875, -4.32879638671875, -4.15869140625, -3.98858642578125, -3.8184814453125, -3.64837646484375, -3.478271484375, -3.30816650390625, -3.1380615234375, -2.96795654296875, -2.7978515625, -2.62774658203125, -2.4576416015625, -2.28753662109375, -2.117431640625, -1.94732666015625, -1.7772216796875, -1.60711669921875, -1.43701171875, -1.26690673828125, -1.0968017578125, -0.92669677734375, -0.756591796875, -0.58648681640625, -0.4163818359375, -0.24627685546875, -0.076171875, 0.09393310546875, 0.2640380859375, 0.43414306640625, 0.604248046875, 0.77435302734375, 0.9444580078125, 1.11456298828125, 1.28466796875, 1.45477294921875, 1.6248779296875, 1.79498291015625, 1.965087890625, 2.13519287109375, 2.3052978515625, 2.47540283203125, 2.6455078125, 2.81561279296875, 2.9857177734375, 3.15582275390625, 3.325927734375, 3.49603271484375, 3.6661376953125, 3.83624267578125, 4.00634765625, 4.17645263671875, 4.3465576171875, 4.51666259765625, 4.686767578125, 4.85687255859375, 5.0269775390625, 5.19708251953125, 5.3671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 6.0, 13.0, 6.0, 19.0, 23.0, 20.0, 28.0, 42.0, 54.0, 46.0, 62.0, 63.0, 72.0, 63.0, 66.0, 59.0, 60.0, 42.0, 48.0, 42.0, 40.0, 29.0, 22.0, 22.0, 21.0, 12.0, 7.0, 7.0, 4.0, 4.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008058547973632812, -0.0007820576429367065, -0.0007582604885101318, -0.0007344633340835571, -0.0007106661796569824, -0.0006868690252304077, -0.000663071870803833, -0.0006392747163772583, -0.0006154775619506836, -0.0005916804075241089, -0.0005678832530975342, -0.0005440860986709595, -0.0005202889442443848, -0.0004964917898178101, -0.00047269463539123535, -0.00044889748096466064, -0.00042510032653808594, -0.00040130317211151123, -0.0003775060176849365, -0.0003537088632583618, -0.0003299117088317871, -0.0003061145544052124, -0.0002823173999786377, -0.000258520245552063, -0.00023472309112548828, -0.00021092593669891357, -0.00018712878227233887, -0.00016333162784576416, -0.00013953447341918945, -0.00011573731899261475, -9.194016456604004e-05, -6.814301013946533e-05, -4.4345855712890625e-05, -2.0548701286315918e-05, 3.248453140258789e-06, 2.7045607566833496e-05, 5.08427619934082e-05, 7.463991641998291e-05, 9.843707084655762e-05, 0.00012223422527313232, 0.00014603137969970703, 0.00016982853412628174, 0.00019362568855285645, 0.00021742284297943115, 0.00024121999740600586, 0.00026501715183258057, 0.0002888143062591553, 0.00031261146068573, 0.0003364086151123047, 0.0003602057695388794, 0.0003840029239654541, 0.0004078000783920288, 0.0004315972328186035, 0.0004553943872451782, 0.00047919154167175293, 0.0005029886960983276, 0.0005267858505249023, 0.000550583004951477, 0.0005743801593780518, 0.0005981773138046265, 0.0006219744682312012, 0.0006457716226577759, 0.0006695687770843506, 0.0006933659315109253, 0.0007171630859375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 9.0, 7.0, 11.0, 17.0, 33.0, 50.0, 84.0, 143.0, 241.0, 449.0, 914.0, 1830.0, 4061.0, 9376.0, 21553.0, 48686.0, 96879.0, 162618.0, 210624.0, 200987.0, 141957.0, 79695.0, 38132.0, 16703.0, 7252.0, 3139.0, 1486.0, 714.0, 408.0, 195.0, 109.0, 65.0, 42.0, 23.0, 19.0, 18.0, 12.0, 4.0, 3.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5234375, -9.2420654296875, -8.960693359375, -8.6793212890625, -8.39794921875, -8.1165771484375, -7.835205078125, -7.5538330078125, -7.2724609375, -6.9910888671875, -6.709716796875, -6.4283447265625, -6.14697265625, -5.8656005859375, -5.584228515625, -5.3028564453125, -5.021484375, -4.7401123046875, -4.458740234375, -4.1773681640625, -3.89599609375, -3.6146240234375, -3.333251953125, -3.0518798828125, -2.7705078125, -2.4891357421875, -2.207763671875, -1.9263916015625, -1.64501953125, -1.3636474609375, -1.082275390625, -0.8009033203125, -0.51953125, -0.2381591796875, 0.043212890625, 0.3245849609375, 0.60595703125, 0.8873291015625, 1.168701171875, 1.4500732421875, 1.7314453125, 2.0128173828125, 2.294189453125, 2.5755615234375, 2.85693359375, 3.1383056640625, 3.419677734375, 3.7010498046875, 3.982421875, 4.2637939453125, 4.545166015625, 4.8265380859375, 5.10791015625, 5.3892822265625, 5.670654296875, 5.9520263671875, 6.2333984375, 6.5147705078125, 6.796142578125, 7.0775146484375, 7.35888671875, 7.6402587890625, 7.921630859375, 8.2030029296875, 8.484375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 6.0, 1.0, 3.0, 6.0, 13.0, 12.0, 11.0, 19.0, 20.0, 20.0, 28.0, 17.0, 29.0, 37.0, 35.0, 37.0, 38.0, 44.0, 38.0, 36.0, 49.0, 46.0, 42.0, 53.0, 42.0, 46.0, 36.0, 26.0, 19.0, 21.0, 30.0, 24.0, 15.0, 22.0, 14.0, 12.0, 13.0, 10.0, 6.0, 5.0, 5.0, 3.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.03515625, -1.971221923828125, -1.90728759765625, -1.843353271484375, -1.7794189453125, -1.715484619140625, -1.65155029296875, -1.587615966796875, -1.523681640625, -1.459747314453125, -1.39581298828125, -1.331878662109375, -1.2679443359375, -1.204010009765625, -1.14007568359375, -1.076141357421875, -1.01220703125, -0.948272705078125, -0.88433837890625, -0.820404052734375, -0.7564697265625, -0.692535400390625, -0.62860107421875, -0.564666748046875, -0.500732421875, -0.436798095703125, -0.37286376953125, -0.308929443359375, -0.2449951171875, -0.181060791015625, -0.11712646484375, -0.053192138671875, 0.0107421875, 0.074676513671875, 0.13861083984375, 0.202545166015625, 0.2664794921875, 0.330413818359375, 0.39434814453125, 0.458282470703125, 0.522216796875, 0.586151123046875, 0.65008544921875, 0.714019775390625, 0.7779541015625, 0.841888427734375, 0.90582275390625, 0.969757080078125, 1.03369140625, 1.097625732421875, 1.16156005859375, 1.225494384765625, 1.2894287109375, 1.353363037109375, 1.41729736328125, 1.481231689453125, 1.545166015625, 1.609100341796875, 1.67303466796875, 1.736968994140625, 1.8009033203125, 1.864837646484375, 1.92877197265625, 1.992706298828125, 2.056640625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 7.0, 5.0, 4.0, 7.0, 13.0, 18.0, 16.0, 15.0, 25.0, 26.0, 21.0, 39.0, 32.0, 35.0, 55.0, 40.0, 51.0, 59.0, 51.0, 46.0, 55.0, 59.0, 43.0, 47.0, 42.0, 32.0, 24.0, 27.0, 19.0, 21.0, 18.0, 12.0, 12.0, 11.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-23.590105056762695, -22.868511199951172, -22.14691734313965, -21.425323486328125, -20.703731536865234, -19.98213768005371, -19.260543823242188, -18.538949966430664, -17.81735610961914, -17.095762252807617, -16.374168395996094, -15.652575492858887, -14.93098258972168, -14.209388732910156, -13.487794876098633, -12.76620101928711, -12.044609069824219, -11.323015213012695, -10.601422309875488, -9.879828453063965, -9.158235549926758, -8.436641693115234, -7.715047836303711, -6.993454456329346, -6.2718610763549805, -5.550267696380615, -4.82867431640625, -4.107080459594727, -3.3854870796203613, -2.663893699645996, -1.9422998428344727, -1.2207064628601074, -0.4991111755371094, 0.2224823236465454, 0.9440758228302002, 1.6656694412231445, 2.3872628211975098, 3.108856201171875, 3.8304500579833984, 4.552043437957764, 5.273636817932129, 5.995230197906494, 6.716823577880859, 7.438417434692383, 8.160011291503906, 8.881604194641113, 9.603198051452637, 10.324790954589844, 11.046384811401367, 11.76797866821289, 12.489571571350098, 13.211165428161621, 13.932758331298828, 14.654352188110352, 15.375946044921875, 16.0975399017334, 16.819133758544922, 17.540727615356445, 18.26232147216797, 18.98391342163086, 19.705507278442383, 20.427101135253906, 21.14869499206543, 21.870288848876953, 22.591880798339844]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 5.0, 3.0, 8.0, 9.0, 13.0, 17.0, 15.0, 19.0, 22.0, 23.0, 23.0, 23.0, 32.0, 30.0, 33.0, 35.0, 36.0, 31.0, 52.0, 41.0, 40.0, 37.0, 42.0, 33.0, 27.0, 37.0, 43.0, 31.0, 31.0, 27.0, 28.0, 22.0, 26.0, 16.0, 13.0, 11.0, 10.0, 10.0, 12.0, 5.0, 3.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.025646209716797, -19.424264907836914, -18.822885513305664, -18.22150421142578, -17.6201229095459, -17.018741607666016, -16.417362213134766, -15.815980911254883, -15.214600563049316, -14.61322021484375, -14.011838912963867, -13.4104585647583, -12.809078216552734, -12.207696914672852, -11.606316566467285, -11.004936218261719, -10.403554916381836, -9.80217456817627, -9.200793266296387, -8.59941291809082, -7.998032093048096, -7.396651268005371, -6.795270919799805, -6.19389009475708, -5.5925092697143555, -4.991128444671631, -4.389747619628906, -3.78836727142334, -3.1869864463806152, -2.5856056213378906, -1.9842250347137451, -1.3828444480895996, -0.7814655303955078, -0.18008482456207275, 0.4212958812713623, 1.0226765871047974, 1.6240572929382324, 2.225438117980957, 2.8268187046051025, 3.428199291229248, 4.029580116271973, 4.630960941314697, 5.232341766357422, 5.833722114562988, 6.435102939605713, 7.0364837646484375, 7.637864112854004, 8.23924446105957, 8.840625762939453, 9.44200611114502, 10.043387413024902, 10.644767761230469, 11.246149063110352, 11.847529411315918, 12.448909759521484, 13.050291061401367, 13.651671409606934, 14.2530517578125, 14.854433059692383, 15.45581340789795, 16.057193756103516, 16.6585750579834, 17.25995635986328, 17.86133575439453, 18.462717056274414]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 8.0, 16.0, 17.0, 24.0, 50.0, 73.0, 96.0, 180.0, 314.0, 509.0, 802.0, 1433.0, 2259.0, 3906.0, 6950.0, 12280.0, 22274.0, 39845.0, 74017.0, 138748.0, 255226.0, 437647.0, 644232.0, 753910.0, 680457.0, 481907.0, 289734.0, 159228.0, 85117.0, 46216.0, 24997.0, 13652.0, 7635.0, 4411.0, 2524.0, 1450.0, 816.0, 491.0, 339.0, 204.0, 111.0, 69.0, 43.0, 32.0, 17.0, 10.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-20.765625, -20.16552734375, -19.5654296875, -18.96533203125, -18.365234375, -17.76513671875, -17.1650390625, -16.56494140625, -15.96484375, -15.36474609375, -14.7646484375, -14.16455078125, -13.564453125, -12.96435546875, -12.3642578125, -11.76416015625, -11.1640625, -10.56396484375, -9.9638671875, -9.36376953125, -8.763671875, -8.16357421875, -7.5634765625, -6.96337890625, -6.36328125, -5.76318359375, -5.1630859375, -4.56298828125, -3.962890625, -3.36279296875, -2.7626953125, -2.16259765625, -1.5625, -0.96240234375, -0.3623046875, 0.23779296875, 0.837890625, 1.43798828125, 2.0380859375, 2.63818359375, 3.23828125, 3.83837890625, 4.4384765625, 5.03857421875, 5.638671875, 6.23876953125, 6.8388671875, 7.43896484375, 8.0390625, 8.63916015625, 9.2392578125, 9.83935546875, 10.439453125, 11.03955078125, 11.6396484375, 12.23974609375, 12.83984375, 13.43994140625, 14.0400390625, 14.64013671875, 15.240234375, 15.84033203125, 16.4404296875, 17.04052734375, 17.640625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 3.0, 4.0, 5.0, 5.0, 10.0, 18.0, 11.0, 15.0, 13.0, 16.0, 25.0, 28.0, 29.0, 22.0, 36.0, 36.0, 42.0, 41.0, 35.0, 28.0, 41.0, 36.0, 48.0, 26.0, 42.0, 42.0, 42.0, 32.0, 38.0, 27.0, 26.0, 23.0, 27.0, 27.0, 19.0, 11.0, 15.0, 10.0, 12.0, 8.0, 8.0, 1.0, 3.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.75, -17.20556640625, -16.6611328125, -16.11669921875, -15.572265625, -15.02783203125, -14.4833984375, -13.93896484375, -13.39453125, -12.85009765625, -12.3056640625, -11.76123046875, -11.216796875, -10.67236328125, -10.1279296875, -9.58349609375, -9.0390625, -8.49462890625, -7.9501953125, -7.40576171875, -6.861328125, -6.31689453125, -5.7724609375, -5.22802734375, -4.68359375, -4.13916015625, -3.5947265625, -3.05029296875, -2.505859375, -1.96142578125, -1.4169921875, -0.87255859375, -0.328125, 0.21630859375, 0.7607421875, 1.30517578125, 1.849609375, 2.39404296875, 2.9384765625, 3.48291015625, 4.02734375, 4.57177734375, 5.1162109375, 5.66064453125, 6.205078125, 6.74951171875, 7.2939453125, 7.83837890625, 8.3828125, 8.92724609375, 9.4716796875, 10.01611328125, 10.560546875, 11.10498046875, 11.6494140625, 12.19384765625, 12.73828125, 13.28271484375, 13.8271484375, 14.37158203125, 14.916015625, 15.46044921875, 16.0048828125, 16.54931640625, 17.09375]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 12.0, 13.0, 17.0, 20.0, 31.0, 43.0, 66.0, 111.0, 225.0, 359.0, 554.0, 833.0, 1445.0, 2456.0, 4222.0, 6995.0, 12300.0, 21802.0, 38619.0, 67962.0, 121255.0, 207646.0, 340937.0, 503460.0, 641292.0, 667034.0, 562486.0, 396834.0, 251241.0, 148556.0, 84699.0, 47378.0, 26882.0, 15239.0, 8817.0, 4945.0, 3026.0, 1720.0, 1043.0, 634.0, 398.0, 240.0, 152.0, 109.0, 60.0, 38.0, 34.0, 14.0, 8.0, 9.0, 6.0, 6.0, 3.0, 3.0], "bins": [-23.3125, -22.64990234375, -21.9873046875, -21.32470703125, -20.662109375, -19.99951171875, -19.3369140625, -18.67431640625, -18.01171875, -17.34912109375, -16.6865234375, -16.02392578125, -15.361328125, -14.69873046875, -14.0361328125, -13.37353515625, -12.7109375, -12.04833984375, -11.3857421875, -10.72314453125, -10.060546875, -9.39794921875, -8.7353515625, -8.07275390625, -7.41015625, -6.74755859375, -6.0849609375, -5.42236328125, -4.759765625, -4.09716796875, -3.4345703125, -2.77197265625, -2.109375, -1.44677734375, -0.7841796875, -0.12158203125, 0.541015625, 1.20361328125, 1.8662109375, 2.52880859375, 3.19140625, 3.85400390625, 4.5166015625, 5.17919921875, 5.841796875, 6.50439453125, 7.1669921875, 7.82958984375, 8.4921875, 9.15478515625, 9.8173828125, 10.47998046875, 11.142578125, 11.80517578125, 12.4677734375, 13.13037109375, 13.79296875, 14.45556640625, 15.1181640625, 15.78076171875, 16.443359375, 17.10595703125, 17.7685546875, 18.43115234375, 19.09375]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 7.0, 22.0, 16.0, 24.0, 29.0, 46.0, 35.0, 53.0, 53.0, 66.0, 77.0, 103.0, 121.0, 162.0, 150.0, 174.0, 194.0, 199.0, 189.0, 210.0, 215.0, 220.0, 187.0, 190.0, 156.0, 169.0, 186.0, 137.0, 97.0, 91.0, 81.0, 91.0, 61.0, 54.0, 45.0, 26.0, 34.0, 25.0, 18.0, 20.0, 11.0, 6.0, 7.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.97265625, -7.73333740234375, -7.4940185546875, -7.25469970703125, -7.015380859375, -6.77606201171875, -6.5367431640625, -6.29742431640625, -6.05810546875, -5.81878662109375, -5.5794677734375, -5.34014892578125, -5.100830078125, -4.86151123046875, -4.6221923828125, -4.38287353515625, -4.1435546875, -3.90423583984375, -3.6649169921875, -3.42559814453125, -3.186279296875, -2.94696044921875, -2.7076416015625, -2.46832275390625, -2.22900390625, -1.98968505859375, -1.7503662109375, -1.51104736328125, -1.271728515625, -1.03240966796875, -0.7930908203125, -0.55377197265625, -0.314453125, -0.07513427734375, 0.1641845703125, 0.40350341796875, 0.642822265625, 0.88214111328125, 1.1214599609375, 1.36077880859375, 1.60009765625, 1.83941650390625, 2.0787353515625, 2.31805419921875, 2.557373046875, 2.79669189453125, 3.0360107421875, 3.27532958984375, 3.5146484375, 3.75396728515625, 3.9932861328125, 4.23260498046875, 4.471923828125, 4.71124267578125, 4.9505615234375, 5.18988037109375, 5.42919921875, 5.66851806640625, 5.9078369140625, 6.14715576171875, 6.386474609375, 6.62579345703125, 6.8651123046875, 7.10443115234375, 7.34375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 8.0, 7.0, 3.0, 6.0, 13.0, 12.0, 24.0, 23.0, 13.0, 27.0, 24.0, 36.0, 36.0, 42.0, 43.0, 33.0, 40.0, 45.0, 37.0, 47.0, 44.0, 32.0, 47.0, 43.0, 39.0, 49.0, 37.0, 30.0, 22.0, 17.0, 21.0, 22.0, 12.0, 14.0, 10.0, 8.0, 8.0, 5.0, 9.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-21.688480377197266, -21.00305938720703, -20.317638397216797, -19.632217407226562, -18.946796417236328, -18.261375427246094, -17.57595443725586, -16.890533447265625, -16.20511245727539, -15.519691467285156, -14.834270477294922, -14.148849487304688, -13.463428497314453, -12.778007507324219, -12.092586517333984, -11.40716552734375, -10.721744537353516, -10.036323547363281, -9.350902557373047, -8.665481567382812, -7.980060577392578, -7.294639587402344, -6.609218597412109, -5.923797607421875, -5.238376617431641, -4.552955627441406, -3.867534637451172, -3.1821136474609375, -2.496692657470703, -1.8112716674804688, -1.1258506774902344, -0.4404296875, 0.2449932098388672, 0.9304141998291016, 1.615835189819336, 2.3012561798095703, 2.9866771697998047, 3.672098159790039, 4.357519149780273, 5.042940139770508, 5.728361129760742, 6.413782119750977, 7.099203109741211, 7.784624099731445, 8.47004508972168, 9.155466079711914, 9.840887069702148, 10.526308059692383, 11.211729049682617, 11.897150039672852, 12.582571029663086, 13.26799201965332, 13.953413009643555, 14.638833999633789, 15.324254989624023, 16.009675979614258, 16.695096969604492, 17.380517959594727, 18.06593894958496, 18.751359939575195, 19.43678092956543, 20.122201919555664, 20.8076229095459, 21.493043899536133, 22.178464889526367]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 3.0, 10.0, 1.0, 9.0, 11.0, 6.0, 11.0, 20.0, 18.0, 17.0, 23.0, 30.0, 31.0, 29.0, 25.0, 35.0, 20.0, 39.0, 44.0, 42.0, 42.0, 41.0, 38.0, 44.0, 37.0, 33.0, 29.0, 38.0, 28.0, 39.0, 31.0, 29.0, 20.0, 20.0, 21.0, 18.0, 8.0, 22.0, 12.0, 6.0, 5.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-21.586881637573242, -20.977073669433594, -20.367265701293945, -19.75745964050293, -19.14765167236328, -18.537843704223633, -17.928035736083984, -17.318227767944336, -16.708419799804688, -16.09861183166504, -15.488804817199707, -14.878996849060059, -14.269189834594727, -13.659381866455078, -13.04957389831543, -12.439765930175781, -11.829959869384766, -11.220151901245117, -10.610344886779785, -10.000536918640137, -9.390729904174805, -8.780921936035156, -8.171113967895508, -7.561306476593018, -6.951498985290527, -6.341691493988037, -5.731884002685547, -5.122076034545898, -4.512268543243408, -3.902461051940918, -3.2926533222198486, -2.6828455924987793, -2.0730361938476562, -1.4632285833358765, -0.8534209728240967, -0.2436133623123169, 0.3661942481994629, 0.9760017395019531, 1.5858094692230225, 2.195617198944092, 2.805424690246582, 3.4152321815490723, 4.0250396728515625, 4.634847640991211, 5.244655132293701, 5.854462623596191, 6.46427059173584, 7.07407808303833, 7.68388557434082, 8.293693542480469, 8.9035005569458, 9.51330852508545, 10.123115539550781, 10.73292350769043, 11.342731475830078, 11.952539443969727, 12.562346458435059, 13.172154426574707, 13.781961441040039, 14.391769409179688, 15.001577377319336, 15.611384391784668, 16.22119140625, 16.83099937438965, 17.440807342529297]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 5.0, 11.0, 15.0, 17.0, 32.0, 42.0, 59.0, 103.0, 189.0, 287.0, 433.0, 840.0, 1281.0, 2132.0, 3450.0, 5807.0, 9425.0, 15380.0, 24199.0, 37753.0, 56445.0, 78767.0, 103510.0, 122143.0, 129642.0, 122266.0, 102189.0, 77753.0, 55303.0, 36906.0, 23439.0, 15006.0, 9273.0, 5704.0, 3398.0, 2071.0, 1292.0, 780.0, 434.0, 293.0, 186.0, 96.0, 75.0, 52.0, 27.0, 13.0, 15.0, 9.0, 9.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.0703125, -9.7503662109375, -9.430419921875, -9.1104736328125, -8.79052734375, -8.4705810546875, -8.150634765625, -7.8306884765625, -7.5107421875, -7.1907958984375, -6.870849609375, -6.5509033203125, -6.23095703125, -5.9110107421875, -5.591064453125, -5.2711181640625, -4.951171875, -4.6312255859375, -4.311279296875, -3.9913330078125, -3.67138671875, -3.3514404296875, -3.031494140625, -2.7115478515625, -2.3916015625, -2.0716552734375, -1.751708984375, -1.4317626953125, -1.11181640625, -0.7918701171875, -0.471923828125, -0.1519775390625, 0.16796875, 0.4879150390625, 0.807861328125, 1.1278076171875, 1.44775390625, 1.7677001953125, 2.087646484375, 2.4075927734375, 2.7275390625, 3.0474853515625, 3.367431640625, 3.6873779296875, 4.00732421875, 4.3272705078125, 4.647216796875, 4.9671630859375, 5.287109375, 5.6070556640625, 5.927001953125, 6.2469482421875, 6.56689453125, 6.8868408203125, 7.206787109375, 7.5267333984375, 7.8466796875, 8.1666259765625, 8.486572265625, 8.8065185546875, 9.12646484375, 9.4464111328125, 9.766357421875, 10.0863037109375, 10.40625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 6.0, 11.0, 13.0, 9.0, 15.0, 11.0, 15.0, 21.0, 22.0, 18.0, 29.0, 31.0, 33.0, 40.0, 36.0, 46.0, 35.0, 39.0, 31.0, 54.0, 45.0, 57.0, 29.0, 28.0, 43.0, 40.0, 27.0, 37.0, 16.0, 27.0, 22.0, 22.0, 17.0, 17.0, 20.0, 8.0, 8.0, 9.0, 0.0, 8.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.453125, -21.779541015625, -21.10595703125, -20.432373046875, -19.7587890625, -19.085205078125, -18.41162109375, -17.738037109375, -17.064453125, -16.390869140625, -15.71728515625, -15.043701171875, -14.3701171875, -13.696533203125, -13.02294921875, -12.349365234375, -11.67578125, -11.002197265625, -10.32861328125, -9.655029296875, -8.9814453125, -8.307861328125, -7.63427734375, -6.960693359375, -6.287109375, -5.613525390625, -4.93994140625, -4.266357421875, -3.5927734375, -2.919189453125, -2.24560546875, -1.572021484375, -0.8984375, -0.224853515625, 0.44873046875, 1.122314453125, 1.7958984375, 2.469482421875, 3.14306640625, 3.816650390625, 4.490234375, 5.163818359375, 5.83740234375, 6.510986328125, 7.1845703125, 7.858154296875, 8.53173828125, 9.205322265625, 9.87890625, 10.552490234375, 11.22607421875, 11.899658203125, 12.5732421875, 13.246826171875, 13.92041015625, 14.593994140625, 15.267578125, 15.941162109375, 16.61474609375, 17.288330078125, 17.9619140625, 18.635498046875, 19.30908203125, 19.982666015625, 20.65625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 6.0, 9.0, 14.0, 30.0, 62.0, 63.0, 136.0, 162.0, 329.0, 558.0, 989.0, 1690.0, 3396.0, 6341.0, 12459.0, 24826.0, 48642.0, 91478.0, 152537.0, 204233.0, 196676.0, 138537.0, 79905.0, 41582.0, 21276.0, 10573.0, 5522.0, 2854.0, 1552.0, 866.0, 507.0, 299.0, 156.0, 122.0, 54.0, 47.0, 28.0, 22.0, 8.0, 8.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.09375, -19.482666015625, -18.87158203125, -18.260498046875, -17.6494140625, -17.038330078125, -16.42724609375, -15.816162109375, -15.205078125, -14.593994140625, -13.98291015625, -13.371826171875, -12.7607421875, -12.149658203125, -11.53857421875, -10.927490234375, -10.31640625, -9.705322265625, -9.09423828125, -8.483154296875, -7.8720703125, -7.260986328125, -6.64990234375, -6.038818359375, -5.427734375, -4.816650390625, -4.20556640625, -3.594482421875, -2.9833984375, -2.372314453125, -1.76123046875, -1.150146484375, -0.5390625, 0.072021484375, 0.68310546875, 1.294189453125, 1.9052734375, 2.516357421875, 3.12744140625, 3.738525390625, 4.349609375, 4.960693359375, 5.57177734375, 6.182861328125, 6.7939453125, 7.405029296875, 8.01611328125, 8.627197265625, 9.23828125, 9.849365234375, 10.46044921875, 11.071533203125, 11.6826171875, 12.293701171875, 12.90478515625, 13.515869140625, 14.126953125, 14.738037109375, 15.34912109375, 15.960205078125, 16.5712890625, 17.182373046875, 17.79345703125, 18.404541015625, 19.015625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 9.0, 7.0, 6.0, 10.0, 19.0, 17.0, 19.0, 17.0, 23.0, 22.0, 28.0, 22.0, 32.0, 31.0, 27.0, 27.0, 31.0, 36.0, 36.0, 37.0, 38.0, 44.0, 39.0, 38.0, 34.0, 40.0, 32.0, 29.0, 29.0, 25.0, 23.0, 28.0, 24.0, 25.0, 13.0, 15.0, 12.0, 14.0, 6.0, 3.0, 4.0, 5.0, 5.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-11.828125, -11.44921875, -11.0703125, -10.69140625, -10.3125, -9.93359375, -9.5546875, -9.17578125, -8.796875, -8.41796875, -8.0390625, -7.66015625, -7.28125, -6.90234375, -6.5234375, -6.14453125, -5.765625, -5.38671875, -5.0078125, -4.62890625, -4.25, -3.87109375, -3.4921875, -3.11328125, -2.734375, -2.35546875, -1.9765625, -1.59765625, -1.21875, -0.83984375, -0.4609375, -0.08203125, 0.296875, 0.67578125, 1.0546875, 1.43359375, 1.8125, 2.19140625, 2.5703125, 2.94921875, 3.328125, 3.70703125, 4.0859375, 4.46484375, 4.84375, 5.22265625, 5.6015625, 5.98046875, 6.359375, 6.73828125, 7.1171875, 7.49609375, 7.875, 8.25390625, 8.6328125, 9.01171875, 9.390625, 9.76953125, 10.1484375, 10.52734375, 10.90625, 11.28515625, 11.6640625, 12.04296875, 12.421875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 5.0, 6.0, 9.0, 7.0, 16.0, 17.0, 21.0, 48.0, 47.0, 68.0, 102.0, 129.0, 192.0, 292.0, 430.0, 708.0, 1079.0, 1927.0, 3060.0, 5277.0, 9241.0, 16200.0, 28533.0, 49199.0, 84148.0, 130772.0, 174071.0, 179076.0, 140652.0, 92088.0, 55373.0, 31978.0, 18212.0, 10494.0, 5984.0, 3488.0, 2079.0, 1245.0, 769.0, 485.0, 335.0, 214.0, 150.0, 105.0, 65.0, 59.0, 28.0, 23.0, 19.0, 13.0, 7.0, 8.0, 7.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-6.75390625, -6.5367431640625, -6.319580078125, -6.1024169921875, -5.88525390625, -5.6680908203125, -5.450927734375, -5.2337646484375, -5.0166015625, -4.7994384765625, -4.582275390625, -4.3651123046875, -4.14794921875, -3.9307861328125, -3.713623046875, -3.4964599609375, -3.279296875, -3.0621337890625, -2.844970703125, -2.6278076171875, -2.41064453125, -2.1934814453125, -1.976318359375, -1.7591552734375, -1.5419921875, -1.3248291015625, -1.107666015625, -0.8905029296875, -0.67333984375, -0.4561767578125, -0.239013671875, -0.0218505859375, 0.1953125, 0.4124755859375, 0.629638671875, 0.8468017578125, 1.06396484375, 1.2811279296875, 1.498291015625, 1.7154541015625, 1.9326171875, 2.1497802734375, 2.366943359375, 2.5841064453125, 2.80126953125, 3.0184326171875, 3.235595703125, 3.4527587890625, 3.669921875, 3.8870849609375, 4.104248046875, 4.3214111328125, 4.53857421875, 4.7557373046875, 4.972900390625, 5.1900634765625, 5.4072265625, 5.6243896484375, 5.841552734375, 6.0587158203125, 6.27587890625, 6.4930419921875, 6.710205078125, 6.9273681640625, 7.14453125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 10.0, 3.0, 11.0, 18.0, 18.0, 29.0, 25.0, 35.0, 38.0, 45.0, 45.0, 53.0, 49.0, 49.0, 44.0, 65.0, 50.0, 56.0, 58.0, 47.0, 37.0, 40.0, 27.0, 27.0, 28.0, 21.0, 17.0, 12.0, 8.0, 9.0, 8.0, 0.0, 2.0, 3.0, 6.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004208087921142578, -0.0004077740013599396, -0.00039473921060562134, -0.0003817044198513031, -0.00036866962909698486, -0.0003556348383426666, -0.0003426000475883484, -0.00032956525683403015, -0.0003165304660797119, -0.0003034956753253937, -0.00029046088457107544, -0.0002774260938167572, -0.00026439130306243896, -0.00025135651230812073, -0.0002383217215538025, -0.00022528693079948425, -0.00021225214004516602, -0.00019921734929084778, -0.00018618255853652954, -0.0001731477677822113, -0.00016011297702789307, -0.00014707818627357483, -0.0001340433955192566, -0.00012100860476493835, -0.00010797381401062012, -9.493902325630188e-05, -8.190423250198364e-05, -6.88694417476654e-05, -5.583465099334717e-05, -4.279986023902893e-05, -2.9765069484710693e-05, -1.6730278730392456e-05, -3.6954879760742188e-06, 9.339302778244019e-06, 2.2374093532562256e-05, 3.540888428688049e-05, 4.844367504119873e-05, 6.147846579551697e-05, 7.45132565498352e-05, 8.754804730415344e-05, 0.00010058283805847168, 0.00011361762881278992, 0.00012665241956710815, 0.0001396872103214264, 0.00015272200107574463, 0.00016575679183006287, 0.0001787915825843811, 0.00019182637333869934, 0.00020486116409301758, 0.00021789595484733582, 0.00023093074560165405, 0.0002439655363559723, 0.00025700032711029053, 0.00027003511786460876, 0.000283069908618927, 0.00029610469937324524, 0.0003091394901275635, 0.0003221742808818817, 0.00033520907163619995, 0.0003482438623905182, 0.0003612786531448364, 0.00037431344389915466, 0.0003873482346534729, 0.00040038302540779114, 0.0004134178161621094]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 9.0, 8.0, 13.0, 21.0, 26.0, 42.0, 64.0, 64.0, 100.0, 154.0, 224.0, 353.0, 586.0, 1007.0, 1733.0, 3073.0, 5429.0, 9823.0, 18024.0, 32560.0, 56556.0, 93091.0, 136079.0, 168510.0, 167969.0, 134410.0, 91669.0, 55616.0, 31531.0, 17348.0, 9627.0, 5407.0, 3018.0, 1676.0, 1029.0, 602.0, 365.0, 255.0, 139.0, 98.0, 73.0, 49.0, 44.0, 28.0, 16.0, 16.0, 14.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-9.3828125, -9.106689453125, -8.83056640625, -8.554443359375, -8.2783203125, -8.002197265625, -7.72607421875, -7.449951171875, -7.173828125, -6.897705078125, -6.62158203125, -6.345458984375, -6.0693359375, -5.793212890625, -5.51708984375, -5.240966796875, -4.96484375, -4.688720703125, -4.41259765625, -4.136474609375, -3.8603515625, -3.584228515625, -3.30810546875, -3.031982421875, -2.755859375, -2.479736328125, -2.20361328125, -1.927490234375, -1.6513671875, -1.375244140625, -1.09912109375, -0.822998046875, -0.546875, -0.270751953125, 0.00537109375, 0.281494140625, 0.5576171875, 0.833740234375, 1.10986328125, 1.385986328125, 1.662109375, 1.938232421875, 2.21435546875, 2.490478515625, 2.7666015625, 3.042724609375, 3.31884765625, 3.594970703125, 3.87109375, 4.147216796875, 4.42333984375, 4.699462890625, 4.9755859375, 5.251708984375, 5.52783203125, 5.803955078125, 6.080078125, 6.356201171875, 6.63232421875, 6.908447265625, 7.1845703125, 7.460693359375, 7.73681640625, 8.012939453125, 8.2890625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 4.0, 5.0, 11.0, 9.0, 14.0, 14.0, 12.0, 26.0, 23.0, 28.0, 32.0, 27.0, 27.0, 50.0, 53.0, 52.0, 67.0, 69.0, 52.0, 78.0, 49.0, 51.0, 36.0, 40.0, 33.0, 27.0, 13.0, 14.0, 16.0, 11.0, 16.0, 8.0, 10.0, 7.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.671875, -3.570220947265625, -3.46856689453125, -3.366912841796875, -3.2652587890625, -3.163604736328125, -3.06195068359375, -2.960296630859375, -2.858642578125, -2.756988525390625, -2.65533447265625, -2.553680419921875, -2.4520263671875, -2.350372314453125, -2.24871826171875, -2.147064208984375, -2.04541015625, -1.943756103515625, -1.84210205078125, -1.740447998046875, -1.6387939453125, -1.537139892578125, -1.43548583984375, -1.333831787109375, -1.232177734375, -1.130523681640625, -1.02886962890625, -0.927215576171875, -0.8255615234375, -0.723907470703125, -0.62225341796875, -0.520599365234375, -0.4189453125, -0.317291259765625, -0.21563720703125, -0.113983154296875, -0.0123291015625, 0.089324951171875, 0.19097900390625, 0.292633056640625, 0.394287109375, 0.495941162109375, 0.59759521484375, 0.699249267578125, 0.8009033203125, 0.902557373046875, 1.00421142578125, 1.105865478515625, 1.20751953125, 1.309173583984375, 1.41082763671875, 1.512481689453125, 1.6141357421875, 1.715789794921875, 1.81744384765625, 1.919097900390625, 2.020751953125, 2.122406005859375, 2.22406005859375, 2.325714111328125, 2.4273681640625, 2.529022216796875, 2.63067626953125, 2.732330322265625, 2.833984375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 4.0, 8.0, 7.0, 2.0, 10.0, 19.0, 17.0, 18.0, 20.0, 35.0, 34.0, 23.0, 28.0, 46.0, 43.0, 37.0, 44.0, 35.0, 44.0, 42.0, 39.0, 43.0, 48.0, 43.0, 36.0, 37.0, 41.0, 27.0, 24.0, 26.0, 21.0, 13.0, 19.0, 10.0, 10.0, 9.0, 9.0, 5.0, 6.0, 6.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-21.88576316833496, -21.210844039916992, -20.535926818847656, -19.861007690429688, -19.18609046936035, -18.511171340942383, -17.836254119873047, -17.161334991455078, -16.48641586303711, -15.811497688293457, -15.136579513549805, -14.461660385131836, -13.7867431640625, -13.111824035644531, -12.436905860900879, -11.761987686157227, -11.08707046508789, -10.412152290344238, -9.737234115600586, -9.062314987182617, -8.387397766113281, -7.712479114532471, -7.03756046295166, -6.362642288208008, -5.6877241134643555, -5.012805938720703, -4.337887763977051, -3.6629691123962402, -2.988050937652588, -2.3131327629089355, -1.638214111328125, -0.9632959365844727, -0.2883777618408203, 0.3865405321121216, 1.0614588260650635, 1.736377239227295, 2.4112954139709473, 3.0862135887145996, 3.76113224029541, 4.4360504150390625, 5.110968589782715, 5.785886764526367, 6.4608049392700195, 7.13572359085083, 7.810641765594482, 8.485559463500977, 9.160478591918945, 9.835396766662598, 10.51031494140625, 11.185233116149902, 11.860151290893555, 12.535070419311523, 13.20998764038086, 13.884906768798828, 14.55982494354248, 15.234743118286133, 15.909661293029785, 16.584579467773438, 17.259498596191406, 17.934415817260742, 18.60933494567871, 19.284252166748047, 19.959171295166016, 20.634090423583984, 21.30900764465332]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 5.0, 3.0, 3.0, 7.0, 4.0, 11.0, 11.0, 8.0, 19.0, 14.0, 15.0, 21.0, 27.0, 26.0, 21.0, 33.0, 31.0, 21.0, 34.0, 43.0, 41.0, 49.0, 41.0, 35.0, 42.0, 42.0, 31.0, 41.0, 31.0, 33.0, 40.0, 32.0, 29.0, 20.0, 18.0, 22.0, 23.0, 16.0, 14.0, 12.0, 15.0, 4.0, 2.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-21.122201919555664, -20.521953582763672, -19.92170524597168, -19.321456909179688, -18.721210479736328, -18.120962142944336, -17.520713806152344, -16.92046546936035, -16.32021713256836, -15.719968795776367, -15.119721412658691, -14.5194730758667, -13.919224739074707, -13.318977355957031, -12.718729019165039, -12.118480682373047, -11.518233299255371, -10.917984962463379, -10.317737579345703, -9.717489242553711, -9.117240905761719, -8.516992568969727, -7.916745185852051, -7.316496849060059, -6.716248989105225, -6.116001129150391, -5.515752792358398, -4.9155049324035645, -4.3152570724487305, -3.7150087356567383, -3.1147608757019043, -2.514512538909912, -1.9142646789550781, -1.314016580581665, -0.7137686014175415, -0.11352062225341797, 0.4867274761199951, 1.0869755744934082, 1.6872234344482422, 2.2874717712402344, 2.8877196311950684, 3.4879677295684814, 4.0882158279418945, 4.6884636878967285, 5.2887115478515625, 5.888959884643555, 6.489207744598389, 7.089456081390381, 7.689703941345215, 8.289952278137207, 8.890199661254883, 9.490447998046875, 10.090696334838867, 10.69094467163086, 11.291192054748535, 11.891440391540527, 12.491687774658203, 13.091936111450195, 13.692183494567871, 14.292431831359863, 14.892680168151855, 15.492927551269531, 16.093175888061523, 16.693424224853516, 17.293672561645508]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 11.0, 21.0, 29.0, 25.0, 58.0, 75.0, 163.0, 214.0, 379.0, 491.0, 826.0, 1330.0, 2145.0, 3132.0, 5358.0, 8335.0, 12538.0, 19612.0, 28761.0, 41414.0, 57207.0, 74622.0, 91105.0, 103862.0, 109405.0, 106779.0, 96323.0, 80235.0, 62089.0, 46279.0, 32464.0, 22269.0, 14863.0, 9374.0, 6197.0, 3832.0, 2424.0, 1553.0, 968.0, 634.0, 432.0, 247.0, 146.0, 118.0, 81.0, 41.0, 31.0, 28.0, 15.0, 8.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-11.9140625, -11.537841796875, -11.16162109375, -10.785400390625, -10.4091796875, -10.032958984375, -9.65673828125, -9.280517578125, -8.904296875, -8.528076171875, -8.15185546875, -7.775634765625, -7.3994140625, -7.023193359375, -6.64697265625, -6.270751953125, -5.89453125, -5.518310546875, -5.14208984375, -4.765869140625, -4.3896484375, -4.013427734375, -3.63720703125, -3.260986328125, -2.884765625, -2.508544921875, -2.13232421875, -1.756103515625, -1.3798828125, -1.003662109375, -0.62744140625, -0.251220703125, 0.125, 0.501220703125, 0.87744140625, 1.253662109375, 1.6298828125, 2.006103515625, 2.38232421875, 2.758544921875, 3.134765625, 3.510986328125, 3.88720703125, 4.263427734375, 4.6396484375, 5.015869140625, 5.39208984375, 5.768310546875, 6.14453125, 6.520751953125, 6.89697265625, 7.273193359375, 7.6494140625, 8.025634765625, 8.40185546875, 8.778076171875, 9.154296875, 9.530517578125, 9.90673828125, 10.282958984375, 10.6591796875, 11.035400390625, 11.41162109375, 11.787841796875, 12.1640625]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 0.0, 3.0, 4.0, 3.0, 6.0, 4.0, 4.0, 9.0, 7.0, 12.0, 20.0, 20.0, 20.0, 21.0, 28.0, 27.0, 20.0, 34.0, 16.0, 31.0, 28.0, 36.0, 40.0, 45.0, 48.0, 36.0, 43.0, 33.0, 46.0, 34.0, 32.0, 43.0, 30.0, 30.0, 28.0, 27.0, 22.0, 15.0, 18.0, 20.0, 17.0, 9.0, 7.0, 5.0, 10.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0], "bins": [-21.6875, -21.07275390625, -20.4580078125, -19.84326171875, -19.228515625, -18.61376953125, -17.9990234375, -17.38427734375, -16.76953125, -16.15478515625, -15.5400390625, -14.92529296875, -14.310546875, -13.69580078125, -13.0810546875, -12.46630859375, -11.8515625, -11.23681640625, -10.6220703125, -10.00732421875, -9.392578125, -8.77783203125, -8.1630859375, -7.54833984375, -6.93359375, -6.31884765625, -5.7041015625, -5.08935546875, -4.474609375, -3.85986328125, -3.2451171875, -2.63037109375, -2.015625, -1.40087890625, -0.7861328125, -0.17138671875, 0.443359375, 1.05810546875, 1.6728515625, 2.28759765625, 2.90234375, 3.51708984375, 4.1318359375, 4.74658203125, 5.361328125, 5.97607421875, 6.5908203125, 7.20556640625, 7.8203125, 8.43505859375, 9.0498046875, 9.66455078125, 10.279296875, 10.89404296875, 11.5087890625, 12.12353515625, 12.73828125, 13.35302734375, 13.9677734375, 14.58251953125, 15.197265625, 15.81201171875, 16.4267578125, 17.04150390625, 17.65625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 7.0, 5.0, 12.0, 16.0, 28.0, 38.0, 63.0, 86.0, 150.0, 240.0, 368.0, 584.0, 926.0, 1378.0, 2022.0, 3180.0, 4875.0, 7592.0, 11614.0, 17454.0, 25653.0, 36966.0, 51042.0, 67242.0, 83563.0, 97712.0, 105939.0, 106969.0, 99330.0, 84981.0, 68460.0, 52067.0, 38047.0, 26941.0, 18287.0, 12085.0, 7871.0, 5245.0, 3416.0, 2208.0, 1429.0, 881.0, 560.0, 369.0, 258.0, 155.0, 108.0, 63.0, 30.0, 23.0, 14.0, 8.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.796875, -12.3975830078125, -11.998291015625, -11.5989990234375, -11.19970703125, -10.8004150390625, -10.401123046875, -10.0018310546875, -9.6025390625, -9.2032470703125, -8.803955078125, -8.4046630859375, -8.00537109375, -7.6060791015625, -7.206787109375, -6.8074951171875, -6.408203125, -6.0089111328125, -5.609619140625, -5.2103271484375, -4.81103515625, -4.4117431640625, -4.012451171875, -3.6131591796875, -3.2138671875, -2.8145751953125, -2.415283203125, -2.0159912109375, -1.61669921875, -1.2174072265625, -0.818115234375, -0.4188232421875, -0.01953125, 0.3797607421875, 0.779052734375, 1.1783447265625, 1.57763671875, 1.9769287109375, 2.376220703125, 2.7755126953125, 3.1748046875, 3.5740966796875, 3.973388671875, 4.3726806640625, 4.77197265625, 5.1712646484375, 5.570556640625, 5.9698486328125, 6.369140625, 6.7684326171875, 7.167724609375, 7.5670166015625, 7.96630859375, 8.3656005859375, 8.764892578125, 9.1641845703125, 9.5634765625, 9.9627685546875, 10.362060546875, 10.7613525390625, 11.16064453125, 11.5599365234375, 11.959228515625, 12.3585205078125, 12.7578125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 9.0, 7.0, 7.0, 10.0, 14.0, 14.0, 12.0, 27.0, 19.0, 26.0, 11.0, 22.0, 23.0, 15.0, 33.0, 35.0, 48.0, 32.0, 34.0, 31.0, 45.0, 36.0, 45.0, 46.0, 30.0, 38.0, 31.0, 44.0, 20.0, 38.0, 25.0, 28.0, 22.0, 16.0, 24.0, 17.0, 9.0, 12.0, 9.0, 8.0, 5.0, 6.0, 5.0, 4.0, 5.0, 5.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.2421875, -11.8603515625, -11.478515625, -11.0966796875, -10.71484375, -10.3330078125, -9.951171875, -9.5693359375, -9.1875, -8.8056640625, -8.423828125, -8.0419921875, -7.66015625, -7.2783203125, -6.896484375, -6.5146484375, -6.1328125, -5.7509765625, -5.369140625, -4.9873046875, -4.60546875, -4.2236328125, -3.841796875, -3.4599609375, -3.078125, -2.6962890625, -2.314453125, -1.9326171875, -1.55078125, -1.1689453125, -0.787109375, -0.4052734375, -0.0234375, 0.3583984375, 0.740234375, 1.1220703125, 1.50390625, 1.8857421875, 2.267578125, 2.6494140625, 3.03125, 3.4130859375, 3.794921875, 4.1767578125, 4.55859375, 4.9404296875, 5.322265625, 5.7041015625, 6.0859375, 6.4677734375, 6.849609375, 7.2314453125, 7.61328125, 7.9951171875, 8.376953125, 8.7587890625, 9.140625, 9.5224609375, 9.904296875, 10.2861328125, 10.66796875, 11.0498046875, 11.431640625, 11.8134765625, 12.1953125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 8.0, 4.0, 4.0, 12.0, 15.0, 18.0, 31.0, 48.0, 60.0, 105.0, 156.0, 273.0, 455.0, 727.0, 1197.0, 1954.0, 3421.0, 5565.0, 9178.0, 14777.0, 23457.0, 35998.0, 53429.0, 74801.0, 96580.0, 115589.0, 123643.0, 119849.0, 104981.0, 83598.0, 61885.0, 42746.0, 27858.0, 17945.0, 11140.0, 6711.0, 4072.0, 2326.0, 1487.0, 923.0, 586.0, 358.0, 215.0, 133.0, 75.0, 52.0, 42.0, 21.0, 20.0, 13.0, 7.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0], "bins": [-5.26171875, -5.1055908203125, -4.949462890625, -4.7933349609375, -4.63720703125, -4.4810791015625, -4.324951171875, -4.1688232421875, -4.0126953125, -3.8565673828125, -3.700439453125, -3.5443115234375, -3.38818359375, -3.2320556640625, -3.075927734375, -2.9197998046875, -2.763671875, -2.6075439453125, -2.451416015625, -2.2952880859375, -2.13916015625, -1.9830322265625, -1.826904296875, -1.6707763671875, -1.5146484375, -1.3585205078125, -1.202392578125, -1.0462646484375, -0.89013671875, -0.7340087890625, -0.577880859375, -0.4217529296875, -0.265625, -0.1094970703125, 0.046630859375, 0.2027587890625, 0.35888671875, 0.5150146484375, 0.671142578125, 0.8272705078125, 0.9833984375, 1.1395263671875, 1.295654296875, 1.4517822265625, 1.60791015625, 1.7640380859375, 1.920166015625, 2.0762939453125, 2.232421875, 2.3885498046875, 2.544677734375, 2.7008056640625, 2.85693359375, 3.0130615234375, 3.169189453125, 3.3253173828125, 3.4814453125, 3.6375732421875, 3.793701171875, 3.9498291015625, 4.10595703125, 4.2620849609375, 4.418212890625, 4.5743408203125, 4.73046875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 6.0, 13.0, 12.0, 14.0, 20.0, 20.0, 26.0, 35.0, 47.0, 39.0, 47.0, 58.0, 55.0, 54.0, 76.0, 64.0, 59.0, 44.0, 54.0, 41.0, 45.0, 38.0, 35.0, 26.0, 19.0, 7.0, 11.0, 9.0, 6.0, 4.0, 5.0, 3.0, 5.0, 1.0, 3.0, 0.0, 4.0], "bins": [-0.0009446144104003906, -0.0009220317006111145, -0.0008994489908218384, -0.0008768662810325623, -0.0008542835712432861, -0.00083170086145401, -0.0008091181516647339, -0.0007865354418754578, -0.0007639527320861816, -0.0007413700222969055, -0.0007187873125076294, -0.0006962046027183533, -0.0006736218929290771, -0.000651039183139801, -0.0006284564733505249, -0.0006058737635612488, -0.0005832910537719727, -0.0005607083439826965, -0.0005381256341934204, -0.0005155429244041443, -0.0004929602146148682, -0.00047037750482559204, -0.0004477947950363159, -0.0004252120852470398, -0.00040262937545776367, -0.00038004666566848755, -0.0003574639558792114, -0.0003348812460899353, -0.0003122985363006592, -0.00028971582651138306, -0.00026713311672210693, -0.0002445504069328308, -0.0002219676971435547, -0.00019938498735427856, -0.00017680227756500244, -0.00015421956777572632, -0.0001316368579864502, -0.00010905414819717407, -8.647143840789795e-05, -6.388872861862183e-05, -4.13060188293457e-05, -1.872330904006958e-05, 3.859400749206543e-06, 2.6442110538482666e-05, 4.902482032775879e-05, 7.160753011703491e-05, 9.419023990631104e-05, 0.00011677294969558716, 0.00013935565948486328, 0.0001619383692741394, 0.00018452107906341553, 0.00020710378885269165, 0.00022968649864196777, 0.0002522692084312439, 0.00027485191822052, 0.00029743462800979614, 0.00032001733779907227, 0.0003426000475883484, 0.0003651827573776245, 0.00038776546716690063, 0.00041034817695617676, 0.0004329308867454529, 0.000455513596534729, 0.0004780963063240051, 0.0005006790161132812]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 7.0, 4.0, 5.0, 15.0, 23.0, 36.0, 49.0, 89.0, 132.0, 212.0, 355.0, 538.0, 893.0, 1385.0, 2345.0, 3903.0, 6233.0, 9958.0, 15447.0, 24215.0, 36396.0, 52171.0, 71662.0, 91304.0, 107826.0, 116725.0, 114352.0, 103639.0, 85936.0, 65325.0, 47221.0, 32350.0, 21490.0, 13735.0, 8676.0, 5395.0, 3272.0, 2009.0, 1211.0, 755.0, 495.0, 276.0, 184.0, 119.0, 71.0, 49.0, 28.0, 26.0, 10.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.03515625, -4.8770751953125, -4.718994140625, -4.5609130859375, -4.40283203125, -4.2447509765625, -4.086669921875, -3.9285888671875, -3.7705078125, -3.6124267578125, -3.454345703125, -3.2962646484375, -3.13818359375, -2.9801025390625, -2.822021484375, -2.6639404296875, -2.505859375, -2.3477783203125, -2.189697265625, -2.0316162109375, -1.87353515625, -1.7154541015625, -1.557373046875, -1.3992919921875, -1.2412109375, -1.0831298828125, -0.925048828125, -0.7669677734375, -0.60888671875, -0.4508056640625, -0.292724609375, -0.1346435546875, 0.0234375, 0.1815185546875, 0.339599609375, 0.4976806640625, 0.65576171875, 0.8138427734375, 0.971923828125, 1.1300048828125, 1.2880859375, 1.4461669921875, 1.604248046875, 1.7623291015625, 1.92041015625, 2.0784912109375, 2.236572265625, 2.3946533203125, 2.552734375, 2.7108154296875, 2.868896484375, 3.0269775390625, 3.18505859375, 3.3431396484375, 3.501220703125, 3.6593017578125, 3.8173828125, 3.9754638671875, 4.133544921875, 4.2916259765625, 4.44970703125, 4.6077880859375, 4.765869140625, 4.9239501953125, 5.08203125]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 4.0, 8.0, 15.0, 11.0, 9.0, 17.0, 17.0, 17.0, 28.0, 27.0, 33.0, 33.0, 39.0, 33.0, 57.0, 50.0, 36.0, 37.0, 38.0, 49.0, 60.0, 47.0, 45.0, 39.0, 36.0, 39.0, 23.0, 25.0, 19.0, 24.0, 20.0, 15.0, 11.0, 11.0, 9.0, 1.0, 5.0, 4.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.095703125, -2.028167724609375, -1.96063232421875, -1.893096923828125, -1.8255615234375, -1.758026123046875, -1.69049072265625, -1.622955322265625, -1.555419921875, -1.487884521484375, -1.42034912109375, -1.352813720703125, -1.2852783203125, -1.217742919921875, -1.15020751953125, -1.082672119140625, -1.01513671875, -0.947601318359375, -0.88006591796875, -0.812530517578125, -0.7449951171875, -0.677459716796875, -0.60992431640625, -0.542388916015625, -0.474853515625, -0.407318115234375, -0.33978271484375, -0.272247314453125, -0.2047119140625, -0.137176513671875, -0.06964111328125, -0.002105712890625, 0.0654296875, 0.132965087890625, 0.20050048828125, 0.268035888671875, 0.3355712890625, 0.403106689453125, 0.47064208984375, 0.538177490234375, 0.605712890625, 0.673248291015625, 0.74078369140625, 0.808319091796875, 0.8758544921875, 0.943389892578125, 1.01092529296875, 1.078460693359375, 1.14599609375, 1.213531494140625, 1.28106689453125, 1.348602294921875, 1.4161376953125, 1.483673095703125, 1.55120849609375, 1.618743896484375, 1.686279296875, 1.753814697265625, 1.82135009765625, 1.888885498046875, 1.9564208984375, 2.023956298828125, 2.09149169921875, 2.159027099609375, 2.2265625]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 0.0, 4.0, 2.0, 4.0, 6.0, 9.0, 7.0, 14.0, 15.0, 20.0, 18.0, 27.0, 31.0, 30.0, 26.0, 24.0, 37.0, 53.0, 36.0, 36.0, 34.0, 39.0, 52.0, 40.0, 40.0, 56.0, 43.0, 40.0, 36.0, 21.0, 30.0, 24.0, 25.0, 21.0, 19.0, 16.0, 11.0, 12.0, 6.0, 6.0, 6.0, 4.0, 7.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-20.727628707885742, -20.070180892944336, -19.41273307800293, -18.755285263061523, -18.09783935546875, -17.440391540527344, -16.782943725585938, -16.12549591064453, -15.468048095703125, -14.810600280761719, -14.153152465820312, -13.495705604553223, -12.838257789611816, -12.18080997467041, -11.52336311340332, -10.865915298461914, -10.208467483520508, -9.551019668579102, -8.893571853637695, -8.236124992370605, -7.578677177429199, -6.921229362487793, -6.263782024383545, -5.606334686279297, -4.948886871337891, -4.291439056396484, -3.6339917182922363, -2.976544141769409, -2.319096565246582, -1.6616489887237549, -1.0042014122009277, -0.3467540740966797, 0.3106956481933594, 0.9681432247161865, 1.6255908012390137, 2.283038377761841, 2.940485954284668, 3.597933530807495, 4.255381107330322, 4.91282844543457, 5.570276260375977, 6.227724075317383, 6.885171413421631, 7.542618751525879, 8.200066566467285, 8.857514381408691, 9.514961242675781, 10.172409057617188, 10.829856872558594, 11.4873046875, 12.144752502441406, 12.802199363708496, 13.459647178649902, 14.117094993591309, 14.774541854858398, 15.431989669799805, 16.08943748474121, 16.746885299682617, 17.404333114624023, 18.06178092956543, 18.719226837158203, 19.37667465209961, 20.034122467041016, 20.691570281982422, 21.349018096923828]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 9.0, 6.0, 6.0, 12.0, 11.0, 14.0, 15.0, 15.0, 26.0, 27.0, 19.0, 30.0, 34.0, 32.0, 39.0, 33.0, 34.0, 29.0, 40.0, 34.0, 33.0, 28.0, 30.0, 50.0, 40.0, 37.0, 33.0, 33.0, 36.0, 27.0, 18.0, 21.0, 22.0, 12.0, 15.0, 12.0, 19.0, 10.0, 17.0, 9.0, 8.0, 9.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.596355438232422, -20.969160079956055, -20.341964721679688, -19.714767456054688, -19.08757209777832, -18.460376739501953, -17.833179473876953, -17.205984115600586, -16.57878875732422, -15.951593399047852, -15.324397087097168, -14.697200775146484, -14.070005416870117, -13.44281005859375, -12.815613746643066, -12.188417434692383, -11.561222076416016, -10.934026718139648, -10.306830406188965, -9.679634094238281, -9.052438735961914, -8.425243377685547, -7.798047065734863, -7.170851230621338, -6.5436553955078125, -5.916459560394287, -5.289263725280762, -4.662067890167236, -4.034872055053711, -3.4076762199401855, -2.78048038482666, -2.1532845497131348, -1.5260868072509766, -0.8988909721374512, -0.2716951370239258, 0.3555006980895996, 0.982696533203125, 1.6098923683166504, 2.237088203430176, 2.864284038543701, 3.4914798736572266, 4.118675708770752, 4.745871543884277, 5.373067378997803, 6.000263214111328, 6.6274590492248535, 7.254654884338379, 7.881850719451904, 8.50904655456543, 9.136241912841797, 9.76343822479248, 10.390634536743164, 11.017829895019531, 11.645025253295898, 12.272221565246582, 12.899417877197266, 13.526613235473633, 14.15380859375, 14.781004905700684, 15.408201217651367, 16.035396575927734, 16.6625919342041, 17.28978729248047, 17.91698455810547, 18.544179916381836]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 4.0, 5.0, 7.0, 9.0, 17.0, 16.0, 41.0, 45.0, 74.0, 144.0, 175.0, 302.0, 447.0, 737.0, 1130.0, 1705.0, 2674.0, 4270.0, 6748.0, 10890.0, 17787.0, 29001.0, 47579.0, 79475.0, 131882.0, 215017.0, 335535.0, 479274.0, 592116.0, 616369.0, 535782.0, 400085.0, 265338.0, 165332.0, 99960.0, 60027.0, 36303.0, 22064.0, 13511.0, 8430.0, 5130.0, 3284.0, 1967.0, 1249.0, 800.0, 539.0, 357.0, 237.0, 155.0, 101.0, 62.0, 46.0, 17.0, 10.0, 14.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0], "bins": [-16.890625, -16.366455078125, -15.84228515625, -15.318115234375, -14.7939453125, -14.269775390625, -13.74560546875, -13.221435546875, -12.697265625, -12.173095703125, -11.64892578125, -11.124755859375, -10.6005859375, -10.076416015625, -9.55224609375, -9.028076171875, -8.50390625, -7.979736328125, -7.45556640625, -6.931396484375, -6.4072265625, -5.883056640625, -5.35888671875, -4.834716796875, -4.310546875, -3.786376953125, -3.26220703125, -2.738037109375, -2.2138671875, -1.689697265625, -1.16552734375, -0.641357421875, -0.1171875, 0.406982421875, 0.93115234375, 1.455322265625, 1.9794921875, 2.503662109375, 3.02783203125, 3.552001953125, 4.076171875, 4.600341796875, 5.12451171875, 5.648681640625, 6.1728515625, 6.697021484375, 7.22119140625, 7.745361328125, 8.26953125, 8.793701171875, 9.31787109375, 9.842041015625, 10.3662109375, 10.890380859375, 11.41455078125, 11.938720703125, 12.462890625, 12.987060546875, 13.51123046875, 14.035400390625, 14.5595703125, 15.083740234375, 15.60791015625, 16.132080078125, 16.65625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 5.0, 5.0, 2.0, 4.0, 5.0, 6.0, 12.0, 15.0, 11.0, 11.0, 17.0, 22.0, 19.0, 26.0, 32.0, 27.0, 27.0, 32.0, 35.0, 26.0, 38.0, 41.0, 38.0, 43.0, 40.0, 37.0, 36.0, 37.0, 43.0, 30.0, 37.0, 25.0, 26.0, 23.0, 16.0, 28.0, 25.0, 10.0, 13.0, 12.0, 16.0, 11.0, 14.0, 10.0, 5.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.109375, -19.531494140625, -18.95361328125, -18.375732421875, -17.7978515625, -17.219970703125, -16.64208984375, -16.064208984375, -15.486328125, -14.908447265625, -14.33056640625, -13.752685546875, -13.1748046875, -12.596923828125, -12.01904296875, -11.441162109375, -10.86328125, -10.285400390625, -9.70751953125, -9.129638671875, -8.5517578125, -7.973876953125, -7.39599609375, -6.818115234375, -6.240234375, -5.662353515625, -5.08447265625, -4.506591796875, -3.9287109375, -3.350830078125, -2.77294921875, -2.195068359375, -1.6171875, -1.039306640625, -0.46142578125, 0.116455078125, 0.6943359375, 1.272216796875, 1.85009765625, 2.427978515625, 3.005859375, 3.583740234375, 4.16162109375, 4.739501953125, 5.3173828125, 5.895263671875, 6.47314453125, 7.051025390625, 7.62890625, 8.206787109375, 8.78466796875, 9.362548828125, 9.9404296875, 10.518310546875, 11.09619140625, 11.674072265625, 12.251953125, 12.829833984375, 13.40771484375, 13.985595703125, 14.5634765625, 15.141357421875, 15.71923828125, 16.297119140625, 16.875]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 5.0, 8.0, 8.0, 16.0, 18.0, 40.0, 52.0, 88.0, 123.0, 216.0, 350.0, 499.0, 744.0, 1226.0, 1973.0, 3094.0, 4941.0, 7989.0, 12677.0, 20922.0, 34789.0, 56383.0, 92603.0, 148635.0, 232955.0, 345432.0, 469421.0, 564385.0, 576920.0, 506943.0, 387521.0, 268122.0, 173769.0, 109144.0, 66776.0, 40837.0, 24626.0, 15097.0, 9155.0, 5844.0, 3677.0, 2271.0, 1493.0, 944.0, 597.0, 356.0, 215.0, 156.0, 91.0, 53.0, 39.0, 26.0, 12.0, 6.0, 7.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-19.4375, -18.833251953125, -18.22900390625, -17.624755859375, -17.0205078125, -16.416259765625, -15.81201171875, -15.207763671875, -14.603515625, -13.999267578125, -13.39501953125, -12.790771484375, -12.1865234375, -11.582275390625, -10.97802734375, -10.373779296875, -9.76953125, -9.165283203125, -8.56103515625, -7.956787109375, -7.3525390625, -6.748291015625, -6.14404296875, -5.539794921875, -4.935546875, -4.331298828125, -3.72705078125, -3.122802734375, -2.5185546875, -1.914306640625, -1.31005859375, -0.705810546875, -0.1015625, 0.502685546875, 1.10693359375, 1.711181640625, 2.3154296875, 2.919677734375, 3.52392578125, 4.128173828125, 4.732421875, 5.336669921875, 5.94091796875, 6.545166015625, 7.1494140625, 7.753662109375, 8.35791015625, 8.962158203125, 9.56640625, 10.170654296875, 10.77490234375, 11.379150390625, 11.9833984375, 12.587646484375, 13.19189453125, 13.796142578125, 14.400390625, 15.004638671875, 15.60888671875, 16.213134765625, 16.8173828125, 17.421630859375, 18.02587890625, 18.630126953125, 19.234375]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 7.0, 15.0, 9.0, 16.0, 21.0, 31.0, 33.0, 32.0, 45.0, 74.0, 85.0, 96.0, 121.0, 127.0, 148.0, 181.0, 181.0, 209.0, 215.0, 220.0, 225.0, 257.0, 197.0, 238.0, 212.0, 195.0, 162.0, 132.0, 100.0, 107.0, 75.0, 75.0, 51.0, 38.0, 30.0, 21.0, 24.0, 16.0, 8.0, 13.0, 7.0, 10.0, 4.0, 1.0, 6.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.859375, -8.577880859375, -8.29638671875, -8.014892578125, -7.7333984375, -7.451904296875, -7.17041015625, -6.888916015625, -6.607421875, -6.325927734375, -6.04443359375, -5.762939453125, -5.4814453125, -5.199951171875, -4.91845703125, -4.636962890625, -4.35546875, -4.073974609375, -3.79248046875, -3.510986328125, -3.2294921875, -2.947998046875, -2.66650390625, -2.385009765625, -2.103515625, -1.822021484375, -1.54052734375, -1.259033203125, -0.9775390625, -0.696044921875, -0.41455078125, -0.133056640625, 0.1484375, 0.429931640625, 0.71142578125, 0.992919921875, 1.2744140625, 1.555908203125, 1.83740234375, 2.118896484375, 2.400390625, 2.681884765625, 2.96337890625, 3.244873046875, 3.5263671875, 3.807861328125, 4.08935546875, 4.370849609375, 4.65234375, 4.933837890625, 5.21533203125, 5.496826171875, 5.7783203125, 6.059814453125, 6.34130859375, 6.622802734375, 6.904296875, 7.185791015625, 7.46728515625, 7.748779296875, 8.0302734375, 8.311767578125, 8.59326171875, 8.874755859375, 9.15625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 6.0, 4.0, 3.0, 5.0, 2.0, 1.0, 4.0, 9.0, 11.0, 11.0, 5.0, 12.0, 19.0, 21.0, 24.0, 20.0, 24.0, 24.0, 29.0, 33.0, 20.0, 44.0, 51.0, 42.0, 46.0, 40.0, 45.0, 35.0, 41.0, 34.0, 39.0, 33.0, 26.0, 24.0, 33.0, 23.0, 25.0, 25.0, 19.0, 12.0, 16.0, 14.0, 9.0, 10.0, 10.0, 3.0, 7.0, 7.0, 2.0, 0.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.27958106994629, -18.638505935668945, -17.9974308013916, -17.35635757446289, -16.715282440185547, -16.074207305908203, -15.43313217163086, -14.792057037353516, -14.150982856750488, -13.509907722473145, -12.868833541870117, -12.227758407592773, -11.58668327331543, -10.945609092712402, -10.304533958435059, -9.663459777832031, -9.022384643554688, -8.381309509277344, -7.740235328674316, -7.099160194396973, -6.458085536956787, -5.817010879516602, -5.175935745239258, -4.534861087799072, -3.8937864303588867, -3.252711772918701, -2.6116368770599365, -1.9705621004104614, -1.3294873237609863, -0.6884126663208008, -0.04733777046203613, 0.5937371253967285, 1.2348098754882812, 1.8758846521377563, 2.5169594287872314, 3.158034324645996, 3.7991089820861816, 4.440183639526367, 5.081258773803711, 5.7223334312438965, 6.363408088684082, 7.004482746124268, 7.645557403564453, 8.286632537841797, 8.92770767211914, 9.568781852722168, 10.209856986999512, 10.850931167602539, 11.492006301879883, 12.133081436157227, 12.774155616760254, 13.415230751037598, 14.056304931640625, 14.697380065917969, 15.338455200195312, 15.979530334472656, 16.62060546875, 17.261680603027344, 17.902755737304688, 18.5438289642334, 19.184904098510742, 19.825979232788086, 20.46705436706543, 21.108129501342773, 21.749202728271484]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 3.0, 7.0, 3.0, 5.0, 4.0, 6.0, 9.0, 11.0, 8.0, 19.0, 11.0, 11.0, 16.0, 16.0, 25.0, 21.0, 17.0, 22.0, 21.0, 37.0, 29.0, 22.0, 31.0, 27.0, 33.0, 32.0, 40.0, 39.0, 41.0, 41.0, 35.0, 42.0, 34.0, 24.0, 31.0, 32.0, 19.0, 13.0, 21.0, 20.0, 10.0, 21.0, 11.0, 9.0, 20.0, 13.0, 12.0, 5.0, 5.0, 7.0, 3.0, 4.0, 2.0, 1.0, 4.0, 2.0], "bins": [-19.8543701171875, -19.280012130737305, -18.70565414428711, -18.131298065185547, -17.55694007873535, -16.982582092285156, -16.40822410583496, -15.833866119384766, -15.259509086608887, -14.685151100158691, -14.110794067382812, -13.536436080932617, -12.962078094482422, -12.387721061706543, -11.813363075256348, -11.239006042480469, -10.664648056030273, -10.090290069580078, -9.5159330368042, -8.941575050354004, -8.367218017578125, -7.79286003112793, -7.218502044677734, -6.644144535064697, -6.06978702545166, -5.495429515838623, -4.921072006225586, -4.346714019775391, -3.7723565101623535, -3.1979990005493164, -2.6236412525177, -2.049283504486084, -1.4749279022216797, -0.900570273399353, -0.32621264457702637, 0.2481449842453003, 0.822502613067627, 1.396860122680664, 1.9712178707122803, 2.5455756187438965, 3.1199331283569336, 3.6942906379699707, 4.268648147583008, 4.843006134033203, 5.41736364364624, 5.991721153259277, 6.566079139709473, 7.14043664932251, 7.714794158935547, 8.289152145385742, 8.863509178161621, 9.437867164611816, 10.012224197387695, 10.58658218383789, 11.160940170288086, 11.735298156738281, 12.30965518951416, 12.884013175964355, 13.458370208740234, 14.03272819519043, 14.607086181640625, 15.181443214416504, 15.7558012008667, 16.330158233642578, 16.904516220092773]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 9.0, 8.0, 10.0, 21.0, 29.0, 48.0, 71.0, 113.0, 205.0, 322.0, 433.0, 762.0, 1167.0, 1809.0, 2929.0, 4560.0, 7132.0, 11027.0, 17291.0, 25917.0, 38524.0, 55133.0, 75573.0, 95747.0, 112182.0, 119437.0, 114857.0, 100399.0, 80031.0, 59581.0, 41883.0, 28666.0, 19050.0, 12155.0, 7922.0, 5033.0, 3176.0, 1943.0, 1242.0, 761.0, 485.0, 321.0, 193.0, 135.0, 102.0, 66.0, 43.0, 27.0, 15.0, 10.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-9.9296875, -9.63427734375, -9.3388671875, -9.04345703125, -8.748046875, -8.45263671875, -8.1572265625, -7.86181640625, -7.56640625, -7.27099609375, -6.9755859375, -6.68017578125, -6.384765625, -6.08935546875, -5.7939453125, -5.49853515625, -5.203125, -4.90771484375, -4.6123046875, -4.31689453125, -4.021484375, -3.72607421875, -3.4306640625, -3.13525390625, -2.83984375, -2.54443359375, -2.2490234375, -1.95361328125, -1.658203125, -1.36279296875, -1.0673828125, -0.77197265625, -0.4765625, -0.18115234375, 0.1142578125, 0.40966796875, 0.705078125, 1.00048828125, 1.2958984375, 1.59130859375, 1.88671875, 2.18212890625, 2.4775390625, 2.77294921875, 3.068359375, 3.36376953125, 3.6591796875, 3.95458984375, 4.25, 4.54541015625, 4.8408203125, 5.13623046875, 5.431640625, 5.72705078125, 6.0224609375, 6.31787109375, 6.61328125, 6.90869140625, 7.2041015625, 7.49951171875, 7.794921875, 8.09033203125, 8.3857421875, 8.68115234375, 8.9765625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 4.0, 6.0, 8.0, 11.0, 7.0, 10.0, 12.0, 12.0, 13.0, 17.0, 17.0, 21.0, 21.0, 17.0, 17.0, 31.0, 37.0, 37.0, 22.0, 32.0, 38.0, 33.0, 34.0, 48.0, 33.0, 37.0, 40.0, 33.0, 40.0, 37.0, 20.0, 30.0, 19.0, 25.0, 25.0, 18.0, 18.0, 20.0, 16.0, 14.0, 9.0, 9.0, 14.0, 8.0, 4.0, 4.0, 3.0, 5.0, 1.0, 4.0, 2.0, 1.0, 2.0], "bins": [-21.09375, -20.477783203125, -19.86181640625, -19.245849609375, -18.6298828125, -18.013916015625, -17.39794921875, -16.781982421875, -16.166015625, -15.550048828125, -14.93408203125, -14.318115234375, -13.7021484375, -13.086181640625, -12.47021484375, -11.854248046875, -11.23828125, -10.622314453125, -10.00634765625, -9.390380859375, -8.7744140625, -8.158447265625, -7.54248046875, -6.926513671875, -6.310546875, -5.694580078125, -5.07861328125, -4.462646484375, -3.8466796875, -3.230712890625, -2.61474609375, -1.998779296875, -1.3828125, -0.766845703125, -0.15087890625, 0.465087890625, 1.0810546875, 1.697021484375, 2.31298828125, 2.928955078125, 3.544921875, 4.160888671875, 4.77685546875, 5.392822265625, 6.0087890625, 6.624755859375, 7.24072265625, 7.856689453125, 8.47265625, 9.088623046875, 9.70458984375, 10.320556640625, 10.9365234375, 11.552490234375, 12.16845703125, 12.784423828125, 13.400390625, 14.016357421875, 14.63232421875, 15.248291015625, 15.8642578125, 16.480224609375, 17.09619140625, 17.712158203125, 18.328125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 12.0, 16.0, 25.0, 34.0, 63.0, 89.0, 148.0, 216.0, 319.0, 518.0, 815.0, 1227.0, 2065.0, 3450.0, 5522.0, 9096.0, 15294.0, 25120.0, 42439.0, 68167.0, 103790.0, 141304.0, 162339.0, 150405.0, 115429.0, 77399.0, 48721.0, 29390.0, 17724.0, 10750.0, 6469.0, 3924.0, 2387.0, 1401.0, 951.0, 610.0, 354.0, 214.0, 113.0, 78.0, 64.0, 40.0, 20.0, 21.0, 12.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-15.6015625, -15.12353515625, -14.6455078125, -14.16748046875, -13.689453125, -13.21142578125, -12.7333984375, -12.25537109375, -11.77734375, -11.29931640625, -10.8212890625, -10.34326171875, -9.865234375, -9.38720703125, -8.9091796875, -8.43115234375, -7.953125, -7.47509765625, -6.9970703125, -6.51904296875, -6.041015625, -5.56298828125, -5.0849609375, -4.60693359375, -4.12890625, -3.65087890625, -3.1728515625, -2.69482421875, -2.216796875, -1.73876953125, -1.2607421875, -0.78271484375, -0.3046875, 0.17333984375, 0.6513671875, 1.12939453125, 1.607421875, 2.08544921875, 2.5634765625, 3.04150390625, 3.51953125, 3.99755859375, 4.4755859375, 4.95361328125, 5.431640625, 5.90966796875, 6.3876953125, 6.86572265625, 7.34375, 7.82177734375, 8.2998046875, 8.77783203125, 9.255859375, 9.73388671875, 10.2119140625, 10.68994140625, 11.16796875, 11.64599609375, 12.1240234375, 12.60205078125, 13.080078125, 13.55810546875, 14.0361328125, 14.51416015625, 14.9921875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 5.0, 7.0, 8.0, 8.0, 15.0, 13.0, 15.0, 20.0, 15.0, 25.0, 20.0, 35.0, 33.0, 38.0, 29.0, 28.0, 36.0, 41.0, 42.0, 39.0, 44.0, 53.0, 44.0, 36.0, 31.0, 44.0, 32.0, 37.0, 33.0, 23.0, 28.0, 20.0, 18.0, 18.0, 9.0, 15.0, 9.0, 9.0, 11.0, 9.0, 5.0, 2.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3984375, -11.9527587890625, -11.507080078125, -11.0614013671875, -10.61572265625, -10.1700439453125, -9.724365234375, -9.2786865234375, -8.8330078125, -8.3873291015625, -7.941650390625, -7.4959716796875, -7.05029296875, -6.6046142578125, -6.158935546875, -5.7132568359375, -5.267578125, -4.8218994140625, -4.376220703125, -3.9305419921875, -3.48486328125, -3.0391845703125, -2.593505859375, -2.1478271484375, -1.7021484375, -1.2564697265625, -0.810791015625, -0.3651123046875, 0.08056640625, 0.5262451171875, 0.971923828125, 1.4176025390625, 1.86328125, 2.3089599609375, 2.754638671875, 3.2003173828125, 3.64599609375, 4.0916748046875, 4.537353515625, 4.9830322265625, 5.4287109375, 5.8743896484375, 6.320068359375, 6.7657470703125, 7.21142578125, 7.6571044921875, 8.102783203125, 8.5484619140625, 8.994140625, 9.4398193359375, 9.885498046875, 10.3311767578125, 10.77685546875, 11.2225341796875, 11.668212890625, 12.1138916015625, 12.5595703125, 13.0052490234375, 13.450927734375, 13.8966064453125, 14.34228515625, 14.7879638671875, 15.233642578125, 15.6793212890625, 16.125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 8.0, 9.0, 18.0, 24.0, 22.0, 42.0, 40.0, 71.0, 103.0, 160.0, 246.0, 379.0, 637.0, 1096.0, 1930.0, 3486.0, 6456.0, 12233.0, 23451.0, 44520.0, 82758.0, 139284.0, 194460.0, 198845.0, 147069.0, 88808.0, 48543.0, 25034.0, 13071.0, 7013.0, 3698.0, 2018.0, 1204.0, 642.0, 402.0, 258.0, 169.0, 96.0, 90.0, 36.0, 22.0, 20.0, 28.0, 12.0, 9.0, 9.0, 9.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.98046875, -7.72357177734375, -7.4666748046875, -7.20977783203125, -6.952880859375, -6.69598388671875, -6.4390869140625, -6.18218994140625, -5.92529296875, -5.66839599609375, -5.4114990234375, -5.15460205078125, -4.897705078125, -4.64080810546875, -4.3839111328125, -4.12701416015625, -3.8701171875, -3.61322021484375, -3.3563232421875, -3.09942626953125, -2.842529296875, -2.58563232421875, -2.3287353515625, -2.07183837890625, -1.81494140625, -1.55804443359375, -1.3011474609375, -1.04425048828125, -0.787353515625, -0.53045654296875, -0.2735595703125, -0.01666259765625, 0.240234375, 0.49713134765625, 0.7540283203125, 1.01092529296875, 1.267822265625, 1.52471923828125, 1.7816162109375, 2.03851318359375, 2.29541015625, 2.55230712890625, 2.8092041015625, 3.06610107421875, 3.322998046875, 3.57989501953125, 3.8367919921875, 4.09368896484375, 4.3505859375, 4.60748291015625, 4.8643798828125, 5.12127685546875, 5.378173828125, 5.63507080078125, 5.8919677734375, 6.14886474609375, 6.40576171875, 6.66265869140625, 6.9195556640625, 7.17645263671875, 7.433349609375, 7.69024658203125, 7.9471435546875, 8.20404052734375, 8.4609375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 2.0, 7.0, 7.0, 2.0, 12.0, 9.0, 17.0, 22.0, 26.0, 26.0, 35.0, 49.0, 44.0, 43.0, 57.0, 56.0, 62.0, 62.0, 55.0, 51.0, 51.0, 52.0, 38.0, 35.0, 24.0, 37.0, 16.0, 15.0, 27.0, 13.0, 7.0, 9.0, 9.0, 4.0, 3.0, 4.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.00049591064453125, -0.0004831776022911072, -0.00047044456005096436, -0.00045771151781082153, -0.0004449784755706787, -0.0004322454333305359, -0.00041951239109039307, -0.00040677934885025024, -0.0003940463066101074, -0.0003813132643699646, -0.0003685802221298218, -0.00035584717988967896, -0.00034311413764953613, -0.0003303810954093933, -0.0003176480531692505, -0.00030491501092910767, -0.00029218196868896484, -0.000279448926448822, -0.0002667158842086792, -0.0002539828419685364, -0.00024124979972839355, -0.00022851675748825073, -0.0002157837152481079, -0.0002030506730079651, -0.00019031763076782227, -0.00017758458852767944, -0.00016485154628753662, -0.0001521185040473938, -0.00013938546180725098, -0.00012665241956710815, -0.00011391937732696533, -0.00010118633508682251, -8.845329284667969e-05, -7.572025060653687e-05, -6.298720836639404e-05, -5.025416612625122e-05, -3.75211238861084e-05, -2.4788081645965576e-05, -1.2055039405822754e-05, 6.780028343200684e-07, 1.341104507446289e-05, 2.6144087314605713e-05, 3.8877129554748535e-05, 5.161017179489136e-05, 6.434321403503418e-05, 7.7076256275177e-05, 8.980929851531982e-05, 0.00010254234075546265, 0.00011527538299560547, 0.0001280084252357483, 0.0001407414674758911, 0.00015347450971603394, 0.00016620755195617676, 0.00017894059419631958, 0.0001916736364364624, 0.00020440667867660522, 0.00021713972091674805, 0.00022987276315689087, 0.0002426058053970337, 0.0002553388476371765, 0.00026807188987731934, 0.00028080493211746216, 0.000293537974357605, 0.0003062710165977478, 0.0003190040588378906]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 10.0, 5.0, 11.0, 13.0, 26.0, 28.0, 45.0, 64.0, 87.0, 137.0, 163.0, 247.0, 358.0, 598.0, 813.0, 1308.0, 2035.0, 3419.0, 5545.0, 9307.0, 15840.0, 26860.0, 44827.0, 71412.0, 105177.0, 137797.0, 154016.0, 144651.0, 114348.0, 80418.0, 51410.0, 31214.0, 18420.0, 10998.0, 6430.0, 3858.0, 2279.0, 1477.0, 912.0, 603.0, 401.0, 313.0, 221.0, 125.0, 101.0, 70.0, 48.0, 37.0, 28.0, 17.0, 14.0, 12.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.359375, -8.103271484375, -7.84716796875, -7.591064453125, -7.3349609375, -7.078857421875, -6.82275390625, -6.566650390625, -6.310546875, -6.054443359375, -5.79833984375, -5.542236328125, -5.2861328125, -5.030029296875, -4.77392578125, -4.517822265625, -4.26171875, -4.005615234375, -3.74951171875, -3.493408203125, -3.2373046875, -2.981201171875, -2.72509765625, -2.468994140625, -2.212890625, -1.956787109375, -1.70068359375, -1.444580078125, -1.1884765625, -0.932373046875, -0.67626953125, -0.420166015625, -0.1640625, 0.092041015625, 0.34814453125, 0.604248046875, 0.8603515625, 1.116455078125, 1.37255859375, 1.628662109375, 1.884765625, 2.140869140625, 2.39697265625, 2.653076171875, 2.9091796875, 3.165283203125, 3.42138671875, 3.677490234375, 3.93359375, 4.189697265625, 4.44580078125, 4.701904296875, 4.9580078125, 5.214111328125, 5.47021484375, 5.726318359375, 5.982421875, 6.238525390625, 6.49462890625, 6.750732421875, 7.0068359375, 7.262939453125, 7.51904296875, 7.775146484375, 8.03125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 4.0, 3.0, 1.0, 6.0, 3.0, 5.0, 16.0, 8.0, 8.0, 16.0, 13.0, 19.0, 27.0, 26.0, 27.0, 39.0, 36.0, 57.0, 59.0, 44.0, 57.0, 51.0, 40.0, 49.0, 58.0, 45.0, 42.0, 41.0, 37.0, 34.0, 28.0, 17.0, 17.0, 10.0, 12.0, 13.0, 8.0, 4.0, 6.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.71484375, -2.623443603515625, -2.53204345703125, -2.440643310546875, -2.3492431640625, -2.257843017578125, -2.16644287109375, -2.075042724609375, -1.983642578125, -1.892242431640625, -1.80084228515625, -1.709442138671875, -1.6180419921875, -1.526641845703125, -1.43524169921875, -1.343841552734375, -1.25244140625, -1.161041259765625, -1.06964111328125, -0.978240966796875, -0.8868408203125, -0.795440673828125, -0.70404052734375, -0.612640380859375, -0.521240234375, -0.429840087890625, -0.33843994140625, -0.247039794921875, -0.1556396484375, -0.064239501953125, 0.02716064453125, 0.118560791015625, 0.2099609375, 0.301361083984375, 0.39276123046875, 0.484161376953125, 0.5755615234375, 0.666961669921875, 0.75836181640625, 0.849761962890625, 0.941162109375, 1.032562255859375, 1.12396240234375, 1.215362548828125, 1.3067626953125, 1.398162841796875, 1.48956298828125, 1.580963134765625, 1.67236328125, 1.763763427734375, 1.85516357421875, 1.946563720703125, 2.0379638671875, 2.129364013671875, 2.22076416015625, 2.312164306640625, 2.403564453125, 2.494964599609375, 2.58636474609375, 2.677764892578125, 2.7691650390625, 2.860565185546875, 2.95196533203125, 3.043365478515625, 3.134765625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 7.0, 2.0, 5.0, 1.0, 4.0, 7.0, 8.0, 9.0, 15.0, 13.0, 12.0, 17.0, 27.0, 24.0, 15.0, 27.0, 23.0, 38.0, 38.0, 34.0, 37.0, 39.0, 38.0, 47.0, 45.0, 46.0, 47.0, 35.0, 35.0, 28.0, 31.0, 23.0, 31.0, 21.0, 27.0, 19.0, 19.0, 17.0, 9.0, 17.0, 10.0, 10.0, 7.0, 12.0, 2.0, 8.0, 4.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0], "bins": [-19.51545524597168, -18.891408920288086, -18.267362594604492, -17.643314361572266, -17.019268035888672, -16.395221710205078, -15.771175384521484, -15.14712905883789, -14.52308177947998, -13.899035453796387, -13.274988174438477, -12.650941848754883, -12.026895523071289, -11.402848243713379, -10.778801918029785, -10.154754638671875, -9.530708312988281, -8.906661987304688, -8.282614707946777, -7.658568382263184, -7.034521579742432, -6.41047477722168, -5.786428451538086, -5.162381649017334, -4.538334846496582, -3.91428804397583, -3.2902414798736572, -2.6661949157714844, -2.0421481132507324, -1.4181013107299805, -0.7940547466278076, -0.17000818252563477, 0.45404052734375, 1.0780872106552124, 1.7021338939666748, 2.3261804580688477, 2.9502272605895996, 3.5742740631103516, 4.198320388793945, 4.822367191314697, 5.446413993835449, 6.070460796356201, 6.694507598876953, 7.318553924560547, 7.942600727081299, 8.56664752960205, 9.190693855285645, 9.814741134643555, 10.438787460327148, 11.062833786010742, 11.686881065368652, 12.310927391052246, 12.934974670410156, 13.55902099609375, 14.183067321777344, 14.807113647460938, 15.431160926818848, 16.055208206176758, 16.67925453186035, 17.303300857543945, 17.92734718322754, 18.551395416259766, 19.17544174194336, 19.799488067626953, 20.423534393310547]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 1.0, 2.0, 5.0, 2.0, 4.0, 7.0, 5.0, 9.0, 13.0, 7.0, 13.0, 14.0, 12.0, 17.0, 13.0, 16.0, 25.0, 27.0, 20.0, 23.0, 26.0, 40.0, 31.0, 20.0, 33.0, 33.0, 35.0, 42.0, 39.0, 30.0, 43.0, 32.0, 45.0, 26.0, 39.0, 26.0, 27.0, 25.0, 20.0, 17.0, 13.0, 15.0, 20.0, 13.0, 12.0, 16.0, 12.0, 9.0, 7.0, 6.0, 6.0, 5.0, 2.0, 2.0, 0.0, 4.0, 2.0], "bins": [-20.018753051757812, -19.439897537231445, -18.86104393005371, -18.282188415527344, -17.703332901000977, -17.124479293823242, -16.545623779296875, -15.966769218444824, -15.387914657592773, -14.809060096740723, -14.230204582214355, -13.651350021362305, -13.072495460510254, -12.493640899658203, -11.914785385131836, -11.335930824279785, -10.757075309753418, -10.178220748901367, -9.599365234375, -9.02051067352295, -8.441656112670898, -7.8628010749816895, -7.2839460372924805, -6.70509147644043, -6.126236438751221, -5.547381401062012, -4.968526840209961, -4.389671802520752, -3.810817003250122, -3.231962203979492, -2.653107166290283, -2.0742526054382324, -1.4953975677490234, -0.9165427088737488, -0.3376878499984741, 0.2411670684814453, 0.8200218677520752, 1.398876667022705, 1.977731704711914, 2.556586265563965, 3.135441303253174, 3.7142961025238037, 4.293150901794434, 4.872005939483643, 5.450860977172852, 6.029715538024902, 6.608570575714111, 7.187425136566162, 7.766280174255371, 8.345134735107422, 8.923990249633789, 9.50284481048584, 10.08169937133789, 10.660554885864258, 11.239409446716309, 11.81826400756836, 12.397119522094727, 12.975974082946777, 13.554829597473145, 14.133684158325195, 14.712538719177246, 15.291393280029297, 15.870248794555664, 16.44910430908203, 17.027957916259766]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 11.0, 14.0, 26.0, 46.0, 49.0, 108.0, 181.0, 307.0, 489.0, 850.0, 1372.0, 2363.0, 3842.0, 6286.0, 9956.0, 15668.0, 24462.0, 36565.0, 53368.0, 72962.0, 93622.0, 110575.0, 119520.0, 116930.0, 103155.0, 83288.0, 63385.0, 45237.0, 30547.0, 20001.0, 12554.0, 8068.0, 5033.0, 3056.0, 1879.0, 1105.0, 705.0, 390.0, 230.0, 150.0, 91.0, 52.0, 23.0, 11.0, 10.0, 6.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9453125, -13.4920654296875, -13.038818359375, -12.5855712890625, -12.13232421875, -11.6790771484375, -11.225830078125, -10.7725830078125, -10.3193359375, -9.8660888671875, -9.412841796875, -8.9595947265625, -8.50634765625, -8.0531005859375, -7.599853515625, -7.1466064453125, -6.693359375, -6.2401123046875, -5.786865234375, -5.3336181640625, -4.88037109375, -4.4271240234375, -3.973876953125, -3.5206298828125, -3.0673828125, -2.6141357421875, -2.160888671875, -1.7076416015625, -1.25439453125, -0.8011474609375, -0.347900390625, 0.1053466796875, 0.55859375, 1.0118408203125, 1.465087890625, 1.9183349609375, 2.37158203125, 2.8248291015625, 3.278076171875, 3.7313232421875, 4.1845703125, 4.6378173828125, 5.091064453125, 5.5443115234375, 5.99755859375, 6.4508056640625, 6.904052734375, 7.3572998046875, 7.810546875, 8.2637939453125, 8.717041015625, 9.1702880859375, 9.62353515625, 10.0767822265625, 10.530029296875, 10.9832763671875, 11.4365234375, 11.8897705078125, 12.343017578125, 12.7962646484375, 13.24951171875, 13.7027587890625, 14.156005859375, 14.6092529296875, 15.0625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 0.0, 6.0, 3.0, 6.0, 5.0, 8.0, 4.0, 3.0, 10.0, 11.0, 20.0, 11.0, 15.0, 19.0, 18.0, 27.0, 23.0, 27.0, 25.0, 32.0, 30.0, 37.0, 38.0, 31.0, 36.0, 54.0, 49.0, 39.0, 43.0, 33.0, 44.0, 34.0, 44.0, 17.0, 24.0, 18.0, 21.0, 14.0, 27.0, 14.0, 18.0, 12.0, 16.0, 11.0, 3.0, 9.0, 5.0, 3.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.671875, -21.025634765625, -20.37939453125, -19.733154296875, -19.0869140625, -18.440673828125, -17.79443359375, -17.148193359375, -16.501953125, -15.855712890625, -15.20947265625, -14.563232421875, -13.9169921875, -13.270751953125, -12.62451171875, -11.978271484375, -11.33203125, -10.685791015625, -10.03955078125, -9.393310546875, -8.7470703125, -8.100830078125, -7.45458984375, -6.808349609375, -6.162109375, -5.515869140625, -4.86962890625, -4.223388671875, -3.5771484375, -2.930908203125, -2.28466796875, -1.638427734375, -0.9921875, -0.345947265625, 0.30029296875, 0.946533203125, 1.5927734375, 2.239013671875, 2.88525390625, 3.531494140625, 4.177734375, 4.823974609375, 5.47021484375, 6.116455078125, 6.7626953125, 7.408935546875, 8.05517578125, 8.701416015625, 9.34765625, 9.993896484375, 10.64013671875, 11.286376953125, 11.9326171875, 12.578857421875, 13.22509765625, 13.871337890625, 14.517578125, 15.163818359375, 15.81005859375, 16.456298828125, 17.1025390625, 17.748779296875, 18.39501953125, 19.041259765625, 19.6875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 10.0, 4.0, 11.0, 15.0, 30.0, 55.0, 78.0, 125.0, 193.0, 323.0, 562.0, 822.0, 1475.0, 2215.0, 3533.0, 5694.0, 9035.0, 13956.0, 21543.0, 31749.0, 45492.0, 62618.0, 80861.0, 97713.0, 109519.0, 112944.0, 106514.0, 92483.0, 74089.0, 56215.0, 40206.0, 27434.0, 18253.0, 12032.0, 7807.0, 4989.0, 3121.0, 1848.0, 1156.0, 724.0, 420.0, 280.0, 172.0, 91.0, 59.0, 37.0, 23.0, 16.0, 10.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-15.6640625, -15.1939697265625, -14.723876953125, -14.2537841796875, -13.78369140625, -13.3135986328125, -12.843505859375, -12.3734130859375, -11.9033203125, -11.4332275390625, -10.963134765625, -10.4930419921875, -10.02294921875, -9.5528564453125, -9.082763671875, -8.6126708984375, -8.142578125, -7.6724853515625, -7.202392578125, -6.7322998046875, -6.26220703125, -5.7921142578125, -5.322021484375, -4.8519287109375, -4.3818359375, -3.9117431640625, -3.441650390625, -2.9715576171875, -2.50146484375, -2.0313720703125, -1.561279296875, -1.0911865234375, -0.62109375, -0.1510009765625, 0.319091796875, 0.7891845703125, 1.25927734375, 1.7293701171875, 2.199462890625, 2.6695556640625, 3.1396484375, 3.6097412109375, 4.079833984375, 4.5499267578125, 5.02001953125, 5.4901123046875, 5.960205078125, 6.4302978515625, 6.900390625, 7.3704833984375, 7.840576171875, 8.3106689453125, 8.78076171875, 9.2508544921875, 9.720947265625, 10.1910400390625, 10.6611328125, 11.1312255859375, 11.601318359375, 12.0714111328125, 12.54150390625, 13.0115966796875, 13.481689453125, 13.9517822265625, 14.421875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 7.0, 7.0, 9.0, 13.0, 15.0, 9.0, 18.0, 16.0, 22.0, 20.0, 28.0, 22.0, 24.0, 32.0, 36.0, 33.0, 38.0, 31.0, 46.0, 39.0, 43.0, 33.0, 44.0, 48.0, 41.0, 35.0, 38.0, 34.0, 19.0, 23.0, 23.0, 26.0, 23.0, 10.0, 14.0, 12.0, 19.0, 7.0, 11.0, 4.0, 7.0, 4.0, 3.0, 3.0, 1.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9921875, -12.5660400390625, -12.139892578125, -11.7137451171875, -11.28759765625, -10.8614501953125, -10.435302734375, -10.0091552734375, -9.5830078125, -9.1568603515625, -8.730712890625, -8.3045654296875, -7.87841796875, -7.4522705078125, -7.026123046875, -6.5999755859375, -6.173828125, -5.7476806640625, -5.321533203125, -4.8953857421875, -4.46923828125, -4.0430908203125, -3.616943359375, -3.1907958984375, -2.7646484375, -2.3385009765625, -1.912353515625, -1.4862060546875, -1.06005859375, -0.6339111328125, -0.207763671875, 0.2183837890625, 0.64453125, 1.0706787109375, 1.496826171875, 1.9229736328125, 2.34912109375, 2.7752685546875, 3.201416015625, 3.6275634765625, 4.0537109375, 4.4798583984375, 4.906005859375, 5.3321533203125, 5.75830078125, 6.1844482421875, 6.610595703125, 7.0367431640625, 7.462890625, 7.8890380859375, 8.315185546875, 8.7413330078125, 9.16748046875, 9.5936279296875, 10.019775390625, 10.4459228515625, 10.8720703125, 11.2982177734375, 11.724365234375, 12.1505126953125, 12.57666015625, 13.0028076171875, 13.428955078125, 13.8551025390625, 14.28125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 6.0, 8.0, 8.0, 15.0, 29.0, 64.0, 77.0, 150.0, 243.0, 375.0, 680.0, 1018.0, 1830.0, 2989.0, 4889.0, 8126.0, 12700.0, 19978.0, 30676.0, 44841.0, 62925.0, 83437.0, 102933.0, 116243.0, 118591.0, 110149.0, 93623.0, 73800.0, 54065.0, 37189.0, 24929.0, 15888.0, 10081.0, 6198.0, 3946.0, 2329.0, 1396.0, 850.0, 484.0, 311.0, 208.0, 106.0, 60.0, 58.0, 27.0, 15.0, 13.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.06640625, -4.8870849609375, -4.707763671875, -4.5284423828125, -4.34912109375, -4.1697998046875, -3.990478515625, -3.8111572265625, -3.6318359375, -3.4525146484375, -3.273193359375, -3.0938720703125, -2.91455078125, -2.7352294921875, -2.555908203125, -2.3765869140625, -2.197265625, -2.0179443359375, -1.838623046875, -1.6593017578125, -1.47998046875, -1.3006591796875, -1.121337890625, -0.9420166015625, -0.7626953125, -0.5833740234375, -0.404052734375, -0.2247314453125, -0.04541015625, 0.1339111328125, 0.313232421875, 0.4925537109375, 0.671875, 0.8511962890625, 1.030517578125, 1.2098388671875, 1.38916015625, 1.5684814453125, 1.747802734375, 1.9271240234375, 2.1064453125, 2.2857666015625, 2.465087890625, 2.6444091796875, 2.82373046875, 3.0030517578125, 3.182373046875, 3.3616943359375, 3.541015625, 3.7203369140625, 3.899658203125, 4.0789794921875, 4.25830078125, 4.4376220703125, 4.616943359375, 4.7962646484375, 4.9755859375, 5.1549072265625, 5.334228515625, 5.5135498046875, 5.69287109375, 5.8721923828125, 6.051513671875, 6.2308349609375, 6.41015625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 7.0, 0.0, 5.0, 3.0, 3.0, 5.0, 6.0, 8.0, 11.0, 6.0, 17.0, 19.0, 17.0, 29.0, 36.0, 36.0, 24.0, 34.0, 44.0, 54.0, 44.0, 46.0, 54.0, 34.0, 48.0, 46.0, 30.0, 37.0, 42.0, 27.0, 28.0, 33.0, 18.0, 35.0, 16.0, 19.0, 12.0, 16.0, 17.0, 7.0, 9.0, 7.0, 6.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0006513595581054688, -0.0006301775574684143, -0.0006089955568313599, -0.0005878135561943054, -0.000566631555557251, -0.0005454495549201965, -0.0005242675542831421, -0.0005030855536460876, -0.0004819035530090332, -0.00046072155237197876, -0.0004395395517349243, -0.0004183575510978699, -0.00039717555046081543, -0.000375993549823761, -0.00035481154918670654, -0.0003336295485496521, -0.00031244754791259766, -0.0002912655472755432, -0.00027008354663848877, -0.0002489015460014343, -0.00022771954536437988, -0.00020653754472732544, -0.000185355544090271, -0.00016417354345321655, -0.0001429915428161621, -0.00012180954217910767, -0.00010062754154205322, -7.944554090499878e-05, -5.8263540267944336e-05, -3.708153963088989e-05, -1.589953899383545e-05, 5.282461643218994e-06, 2.6464462280273438e-05, 4.764646291732788e-05, 6.882846355438232e-05, 9.001046419143677e-05, 0.00011119246482849121, 0.00013237446546554565, 0.0001535564661026001, 0.00017473846673965454, 0.00019592046737670898, 0.00021710246801376343, 0.00023828446865081787, 0.0002594664692878723, 0.00028064846992492676, 0.0003018304705619812, 0.00032301247119903564, 0.0003441944718360901, 0.00036537647247314453, 0.000386558473110199, 0.0004077404737472534, 0.00042892247438430786, 0.0004501044750213623, 0.00047128647565841675, 0.0004924684762954712, 0.0005136504769325256, 0.0005348324775695801, 0.0005560144782066345, 0.000577196478843689, 0.0005983784794807434, 0.0006195604801177979, 0.0006407424807548523, 0.0006619244813919067, 0.0006831064820289612, 0.0007042884826660156]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 16.0, 18.0, 21.0, 28.0, 55.0, 98.0, 152.0, 216.0, 342.0, 619.0, 929.0, 1523.0, 2264.0, 3727.0, 5712.0, 8896.0, 13386.0, 20478.0, 30127.0, 42766.0, 58227.0, 75798.0, 92795.0, 105797.0, 110423.0, 105760.0, 94507.0, 77447.0, 59790.0, 44474.0, 31135.0, 21157.0, 14055.0, 9393.0, 5910.0, 3947.0, 2470.0, 1542.0, 967.0, 577.0, 368.0, 245.0, 151.0, 88.0, 64.0, 29.0, 28.0, 18.0, 9.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.46484375, -5.2916259765625, -5.118408203125, -4.9451904296875, -4.77197265625, -4.5987548828125, -4.425537109375, -4.2523193359375, -4.0791015625, -3.9058837890625, -3.732666015625, -3.5594482421875, -3.38623046875, -3.2130126953125, -3.039794921875, -2.8665771484375, -2.693359375, -2.5201416015625, -2.346923828125, -2.1737060546875, -2.00048828125, -1.8272705078125, -1.654052734375, -1.4808349609375, -1.3076171875, -1.1343994140625, -0.961181640625, -0.7879638671875, -0.61474609375, -0.4415283203125, -0.268310546875, -0.0950927734375, 0.078125, 0.2513427734375, 0.424560546875, 0.5977783203125, 0.77099609375, 0.9442138671875, 1.117431640625, 1.2906494140625, 1.4638671875, 1.6370849609375, 1.810302734375, 1.9835205078125, 2.15673828125, 2.3299560546875, 2.503173828125, 2.6763916015625, 2.849609375, 3.0228271484375, 3.196044921875, 3.3692626953125, 3.54248046875, 3.7156982421875, 3.888916015625, 4.0621337890625, 4.2353515625, 4.4085693359375, 4.581787109375, 4.7550048828125, 4.92822265625, 5.1014404296875, 5.274658203125, 5.4478759765625, 5.62109375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 5.0, 2.0, 9.0, 7.0, 9.0, 18.0, 16.0, 18.0, 19.0, 23.0, 29.0, 26.0, 23.0, 30.0, 34.0, 48.0, 44.0, 38.0, 52.0, 54.0, 55.0, 45.0, 40.0, 51.0, 45.0, 44.0, 34.0, 27.0, 27.0, 17.0, 19.0, 15.0, 19.0, 15.0, 9.0, 11.0, 4.0, 5.0, 8.0, 5.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.5, -2.42596435546875, -2.3519287109375, -2.27789306640625, -2.203857421875, -2.12982177734375, -2.0557861328125, -1.98175048828125, -1.90771484375, -1.83367919921875, -1.7596435546875, -1.68560791015625, -1.611572265625, -1.53753662109375, -1.4635009765625, -1.38946533203125, -1.3154296875, -1.24139404296875, -1.1673583984375, -1.09332275390625, -1.019287109375, -0.94525146484375, -0.8712158203125, -0.79718017578125, -0.72314453125, -0.64910888671875, -0.5750732421875, -0.50103759765625, -0.427001953125, -0.35296630859375, -0.2789306640625, -0.20489501953125, -0.130859375, -0.05682373046875, 0.0172119140625, 0.09124755859375, 0.165283203125, 0.23931884765625, 0.3133544921875, 0.38739013671875, 0.46142578125, 0.53546142578125, 0.6094970703125, 0.68353271484375, 0.757568359375, 0.83160400390625, 0.9056396484375, 0.97967529296875, 1.0537109375, 1.12774658203125, 1.2017822265625, 1.27581787109375, 1.349853515625, 1.42388916015625, 1.4979248046875, 1.57196044921875, 1.64599609375, 1.72003173828125, 1.7940673828125, 1.86810302734375, 1.942138671875, 2.01617431640625, 2.0902099609375, 2.16424560546875, 2.23828125]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 6.0, 7.0, 3.0, 7.0, 9.0, 10.0, 10.0, 14.0, 10.0, 16.0, 29.0, 12.0, 30.0, 24.0, 33.0, 29.0, 26.0, 42.0, 44.0, 50.0, 31.0, 52.0, 42.0, 44.0, 54.0, 35.0, 33.0, 36.0, 30.0, 34.0, 33.0, 22.0, 25.0, 16.0, 18.0, 6.0, 18.0, 12.0, 10.0, 6.0, 5.0, 8.0, 2.0, 5.0, 5.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.590803146362305, -19.92736053466797, -19.263916015625, -18.600473403930664, -17.937030792236328, -17.27358627319336, -16.610143661499023, -15.946701049804688, -15.283257484436035, -14.619813919067383, -13.956371307373047, -13.292927742004395, -12.629484176635742, -11.966041564941406, -11.302597999572754, -10.639154434204102, -9.975711822509766, -9.312268257141113, -8.648825645446777, -7.985382080078125, -7.321938991546631, -6.658495903015137, -5.995052337646484, -5.33160924911499, -4.668166160583496, -4.004723072052002, -3.3412797451019287, -2.6778364181518555, -2.0143933296203613, -1.3509502410888672, -0.687506914138794, -0.024063587188720703, 0.6393775939941406, 1.3028208017349243, 1.966264009475708, 2.6297073364257812, 3.2931504249572754, 3.9565935134887695, 4.620037078857422, 5.283480167388916, 5.94692325592041, 6.610366344451904, 7.273809432983398, 7.937252998352051, 8.600696563720703, 9.264139175415039, 9.927582740783691, 10.591026306152344, 11.25446891784668, 11.917912483215332, 12.581355094909668, 13.24479866027832, 13.908241271972656, 14.571684837341309, 15.235128402709961, 15.898571014404297, 16.562015533447266, 17.2254581451416, 17.88890266418457, 18.552345275878906, 19.215787887573242, 19.879230499267578, 20.542675018310547, 21.206117630004883, 21.86956024169922]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 5.0, 6.0, 7.0, 6.0, 11.0, 6.0, 15.0, 15.0, 9.0, 19.0, 22.0, 24.0, 25.0, 27.0, 39.0, 31.0, 31.0, 40.0, 34.0, 44.0, 38.0, 40.0, 46.0, 36.0, 35.0, 36.0, 39.0, 40.0, 41.0, 25.0, 30.0, 28.0, 21.0, 30.0, 10.0, 19.0, 15.0, 12.0, 9.0, 14.0, 5.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-27.00551986694336, -26.270401000976562, -25.535280227661133, -24.800161361694336, -24.06504249572754, -23.32992172241211, -22.594802856445312, -21.859683990478516, -21.124563217163086, -20.38944435119629, -19.65432357788086, -18.919204711914062, -18.184085845947266, -17.448965072631836, -16.71384620666504, -15.978726387023926, -15.243607521057129, -14.508487701416016, -13.773368835449219, -13.038249015808105, -12.303129196166992, -11.568010330200195, -10.832890510559082, -10.097770690917969, -9.362651824951172, -8.627532005310059, -7.8924126625061035, -7.157293319702148, -6.422173500061035, -5.68705415725708, -4.951934814453125, -4.216814994812012, -3.4816951751708984, -2.7465755939483643, -2.01145601272583, -1.276336669921875, -0.5412170886993408, 0.19390249252319336, 0.9290218353271484, 1.6641416549682617, 2.399260997772217, 3.134380578994751, 3.869500160217285, 4.60461950302124, 5.339738845825195, 6.074858665466309, 6.809978008270264, 7.545097827911377, 8.280217170715332, 9.015336990356445, 9.750455856323242, 10.485575675964355, 11.220695495605469, 11.955814361572266, 12.690934181213379, 13.426054000854492, 14.161172866821289, 14.896292686462402, 15.6314115524292, 16.366531372070312, 17.10165023803711, 17.83677101135254, 18.571889877319336, 19.307010650634766, 20.042129516601562]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 8.0, 14.0, 10.0, 20.0, 40.0, 47.0, 92.0, 128.0, 211.0, 269.0, 530.0, 789.0, 1307.0, 2133.0, 3686.0, 6347.0, 11826.0, 21783.0, 41220.0, 79851.0, 156247.0, 298798.0, 521158.0, 748789.0, 809105.0, 641556.0, 398323.0, 215609.0, 110678.0, 57137.0, 29572.0, 16137.0, 8744.0, 5010.0, 2834.0, 1623.0, 1002.0, 566.0, 383.0, 253.0, 146.0, 116.0, 69.0, 43.0, 28.0, 15.0, 11.0, 9.0, 6.0, 5.0, 5.0, 0.0, 1.0], "bins": [-28.5625, -27.751953125, -26.94140625, -26.130859375, -25.3203125, -24.509765625, -23.69921875, -22.888671875, -22.078125, -21.267578125, -20.45703125, -19.646484375, -18.8359375, -18.025390625, -17.21484375, -16.404296875, -15.59375, -14.783203125, -13.97265625, -13.162109375, -12.3515625, -11.541015625, -10.73046875, -9.919921875, -9.109375, -8.298828125, -7.48828125, -6.677734375, -5.8671875, -5.056640625, -4.24609375, -3.435546875, -2.625, -1.814453125, -1.00390625, -0.193359375, 0.6171875, 1.427734375, 2.23828125, 3.048828125, 3.859375, 4.669921875, 5.48046875, 6.291015625, 7.1015625, 7.912109375, 8.72265625, 9.533203125, 10.34375, 11.154296875, 11.96484375, 12.775390625, 13.5859375, 14.396484375, 15.20703125, 16.017578125, 16.828125, 17.638671875, 18.44921875, 19.259765625, 20.0703125, 20.880859375, 21.69140625, 22.501953125, 23.3125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 7.0, 7.0, 7.0, 5.0, 7.0, 13.0, 12.0, 18.0, 19.0, 23.0, 21.0, 21.0, 22.0, 22.0, 41.0, 44.0, 41.0, 43.0, 36.0, 46.0, 44.0, 36.0, 42.0, 41.0, 26.0, 49.0, 30.0, 29.0, 31.0, 27.0, 26.0, 23.0, 18.0, 23.0, 26.0, 15.0, 12.0, 8.0, 10.0, 5.0, 10.0, 6.0, 3.0, 3.0, 6.0, 0.0, 1.0, 2.0], "bins": [-25.609375, -24.91845703125, -24.2275390625, -23.53662109375, -22.845703125, -22.15478515625, -21.4638671875, -20.77294921875, -20.08203125, -19.39111328125, -18.7001953125, -18.00927734375, -17.318359375, -16.62744140625, -15.9365234375, -15.24560546875, -14.5546875, -13.86376953125, -13.1728515625, -12.48193359375, -11.791015625, -11.10009765625, -10.4091796875, -9.71826171875, -9.02734375, -8.33642578125, -7.6455078125, -6.95458984375, -6.263671875, -5.57275390625, -4.8818359375, -4.19091796875, -3.5, -2.80908203125, -2.1181640625, -1.42724609375, -0.736328125, -0.04541015625, 0.6455078125, 1.33642578125, 2.02734375, 2.71826171875, 3.4091796875, 4.10009765625, 4.791015625, 5.48193359375, 6.1728515625, 6.86376953125, 7.5546875, 8.24560546875, 8.9365234375, 9.62744140625, 10.318359375, 11.00927734375, 11.7001953125, 12.39111328125, 13.08203125, 13.77294921875, 14.4638671875, 15.15478515625, 15.845703125, 16.53662109375, 17.2275390625, 17.91845703125, 18.609375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 7.0, 13.0, 13.0, 25.0, 33.0, 71.0, 90.0, 171.0, 277.0, 459.0, 788.0, 1342.0, 2340.0, 4335.0, 7482.0, 13443.0, 23883.0, 42960.0, 77640.0, 136351.0, 234831.0, 375326.0, 537195.0, 655231.0, 652117.0, 528861.0, 368432.0, 227708.0, 133038.0, 74839.0, 41959.0, 23174.0, 12870.0, 7250.0, 4090.0, 2363.0, 1434.0, 747.0, 447.0, 288.0, 159.0, 83.0, 51.0, 31.0, 17.0, 11.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.5, -23.6826171875, -22.865234375, -22.0478515625, -21.23046875, -20.4130859375, -19.595703125, -18.7783203125, -17.9609375, -17.1435546875, -16.326171875, -15.5087890625, -14.69140625, -13.8740234375, -13.056640625, -12.2392578125, -11.421875, -10.6044921875, -9.787109375, -8.9697265625, -8.15234375, -7.3349609375, -6.517578125, -5.7001953125, -4.8828125, -4.0654296875, -3.248046875, -2.4306640625, -1.61328125, -0.7958984375, 0.021484375, 0.8388671875, 1.65625, 2.4736328125, 3.291015625, 4.1083984375, 4.92578125, 5.7431640625, 6.560546875, 7.3779296875, 8.1953125, 9.0126953125, 9.830078125, 10.6474609375, 11.46484375, 12.2822265625, 13.099609375, 13.9169921875, 14.734375, 15.5517578125, 16.369140625, 17.1865234375, 18.00390625, 18.8212890625, 19.638671875, 20.4560546875, 21.2734375, 22.0908203125, 22.908203125, 23.7255859375, 24.54296875, 25.3603515625, 26.177734375, 26.9951171875, 27.8125]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 5.0, 8.0, 9.0, 13.0, 14.0, 22.0, 25.0, 41.0, 47.0, 50.0, 55.0, 59.0, 84.0, 100.0, 103.0, 108.0, 129.0, 147.0, 179.0, 171.0, 182.0, 197.0, 204.0, 187.0, 200.0, 222.0, 197.0, 173.0, 159.0, 144.0, 134.0, 118.0, 112.0, 83.0, 79.0, 53.0, 61.0, 46.0, 33.0, 23.0, 21.0, 16.0, 19.0, 11.0, 6.0, 8.0, 5.0, 5.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-8.921875, -8.6368408203125, -8.351806640625, -8.0667724609375, -7.78173828125, -7.4967041015625, -7.211669921875, -6.9266357421875, -6.6416015625, -6.3565673828125, -6.071533203125, -5.7864990234375, -5.50146484375, -5.2164306640625, -4.931396484375, -4.6463623046875, -4.361328125, -4.0762939453125, -3.791259765625, -3.5062255859375, -3.22119140625, -2.9361572265625, -2.651123046875, -2.3660888671875, -2.0810546875, -1.7960205078125, -1.510986328125, -1.2259521484375, -0.94091796875, -0.6558837890625, -0.370849609375, -0.0858154296875, 0.19921875, 0.4842529296875, 0.769287109375, 1.0543212890625, 1.33935546875, 1.6243896484375, 1.909423828125, 2.1944580078125, 2.4794921875, 2.7645263671875, 3.049560546875, 3.3345947265625, 3.61962890625, 3.9046630859375, 4.189697265625, 4.4747314453125, 4.759765625, 5.0447998046875, 5.329833984375, 5.6148681640625, 5.89990234375, 6.1849365234375, 6.469970703125, 6.7550048828125, 7.0400390625, 7.3250732421875, 7.610107421875, 7.8951416015625, 8.18017578125, 8.4652099609375, 8.750244140625, 9.0352783203125, 9.3203125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 3.0, 5.0, 6.0, 3.0, 8.0, 7.0, 4.0, 12.0, 15.0, 15.0, 17.0, 19.0, 24.0, 42.0, 37.0, 46.0, 47.0, 35.0, 54.0, 45.0, 40.0, 40.0, 43.0, 41.0, 50.0, 47.0, 37.0, 31.0, 24.0, 29.0, 25.0, 22.0, 25.0, 17.0, 19.0, 20.0, 10.0, 11.0, 4.0, 8.0, 2.0, 8.0, 2.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.99365997314453, -27.18751335144043, -26.381364822387695, -25.575218200683594, -24.76906967163086, -23.962923049926758, -23.156776428222656, -22.350627899169922, -21.54448127746582, -20.73833465576172, -19.932186126708984, -19.126039505004883, -18.31989097595215, -17.513744354248047, -16.707595825195312, -15.901449203491211, -15.095301628112793, -14.289154052734375, -13.483006477355957, -12.676858901977539, -11.870712280273438, -11.06456470489502, -10.258417129516602, -9.4522705078125, -8.646121978759766, -7.839974403381348, -7.033827304840088, -6.22767972946167, -5.42153263092041, -4.615385055541992, -3.809237480163574, -3.0030903816223145, -2.1969432830810547, -1.3907959461212158, -0.5846484899520874, 0.22149896621704102, 1.0276463031768799, 1.8337936401367188, 2.6399412155151367, 3.4460883140563965, 4.2522358894348145, 5.058383464813232, 5.864530563354492, 6.67067813873291, 7.476825714111328, 8.28297233581543, 9.089120864868164, 9.895267486572266, 10.701415061950684, 11.507562637329102, 12.31371021270752, 13.119857788085938, 13.926004409790039, 14.732151985168457, 15.538299560546875, 16.344446182250977, 17.15059471130371, 17.956741333007812, 18.762889862060547, 19.56903648376465, 20.375185012817383, 21.181331634521484, 21.98748016357422, 22.79362678527832, 23.599773406982422]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 3.0, 5.0, 8.0, 7.0, 4.0, 14.0, 12.0, 17.0, 22.0, 21.0, 28.0, 27.0, 23.0, 22.0, 30.0, 31.0, 30.0, 40.0, 34.0, 48.0, 29.0, 43.0, 38.0, 46.0, 47.0, 38.0, 43.0, 36.0, 29.0, 41.0, 25.0, 30.0, 21.0, 18.0, 22.0, 14.0, 11.0, 9.0, 8.0, 6.0, 10.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-26.282615661621094, -25.497875213623047, -24.713136672973633, -23.928396224975586, -23.14365577697754, -22.358917236328125, -21.574176788330078, -20.78943634033203, -20.004695892333984, -19.219955444335938, -18.435216903686523, -17.650476455688477, -16.86573600769043, -16.080997467041016, -15.296257019042969, -14.511516571044922, -13.726778030395508, -12.942038536071777, -12.15729808807373, -11.37255859375, -10.587818145751953, -9.803078651428223, -9.018339157104492, -8.233598709106445, -7.448859214782715, -6.664119243621826, -5.8793792724609375, -5.094639778137207, -4.309899806976318, -3.5251598358154297, -2.740420341491699, -1.9556803703308105, -1.1709403991699219, -0.38620054721832275, 0.39853930473327637, 1.183279037475586, 1.9680190086364746, 2.7527589797973633, 3.5374984741210938, 4.322238445281982, 5.106978416442871, 5.89171838760376, 6.676458358764648, 7.461197853088379, 8.24593734741211, 9.030677795410156, 9.815417289733887, 10.600156784057617, 11.384897232055664, 12.169636726379395, 12.954377174377441, 13.739116668701172, 14.523857116699219, 15.30859661102295, 16.09333610534668, 16.878076553344727, 17.66281509399414, 18.447555541992188, 19.2322940826416, 20.01703453063965, 20.801774978637695, 21.58651351928711, 22.371253967285156, 23.155994415283203, 23.94073486328125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 8.0, 9.0, 24.0, 24.0, 42.0, 42.0, 58.0, 110.0, 170.0, 234.0, 367.0, 489.0, 813.0, 1267.0, 1933.0, 3086.0, 5074.0, 8365.0, 13275.0, 21123.0, 33835.0, 52420.0, 76324.0, 104311.0, 127190.0, 136386.0, 127937.0, 105800.0, 78800.0, 54103.0, 35460.0, 22378.0, 13925.0, 8509.0, 5440.0, 3348.0, 2101.0, 1303.0, 815.0, 564.0, 360.0, 244.0, 146.0, 111.0, 79.0, 45.0, 39.0, 23.0, 15.0, 12.0, 5.0, 10.0, 7.0, 1.0, 0.0, 1.0], "bins": [-13.3984375, -12.9990234375, -12.599609375, -12.2001953125, -11.80078125, -11.4013671875, -11.001953125, -10.6025390625, -10.203125, -9.8037109375, -9.404296875, -9.0048828125, -8.60546875, -8.2060546875, -7.806640625, -7.4072265625, -7.0078125, -6.6083984375, -6.208984375, -5.8095703125, -5.41015625, -5.0107421875, -4.611328125, -4.2119140625, -3.8125, -3.4130859375, -3.013671875, -2.6142578125, -2.21484375, -1.8154296875, -1.416015625, -1.0166015625, -0.6171875, -0.2177734375, 0.181640625, 0.5810546875, 0.98046875, 1.3798828125, 1.779296875, 2.1787109375, 2.578125, 2.9775390625, 3.376953125, 3.7763671875, 4.17578125, 4.5751953125, 4.974609375, 5.3740234375, 5.7734375, 6.1728515625, 6.572265625, 6.9716796875, 7.37109375, 7.7705078125, 8.169921875, 8.5693359375, 8.96875, 9.3681640625, 9.767578125, 10.1669921875, 10.56640625, 10.9658203125, 11.365234375, 11.7646484375, 12.1640625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 5.0, 2.0, 4.0, 7.0, 10.0, 10.0, 8.0, 13.0, 16.0, 20.0, 20.0, 28.0, 24.0, 27.0, 39.0, 26.0, 30.0, 28.0, 33.0, 39.0, 46.0, 42.0, 36.0, 43.0, 49.0, 48.0, 46.0, 33.0, 35.0, 21.0, 33.0, 20.0, 26.0, 24.0, 27.0, 16.0, 16.0, 13.0, 7.0, 6.0, 6.0, 3.0, 3.0, 4.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0], "bins": [-28.484375, -27.66845703125, -26.8525390625, -26.03662109375, -25.220703125, -24.40478515625, -23.5888671875, -22.77294921875, -21.95703125, -21.14111328125, -20.3251953125, -19.50927734375, -18.693359375, -17.87744140625, -17.0615234375, -16.24560546875, -15.4296875, -14.61376953125, -13.7978515625, -12.98193359375, -12.166015625, -11.35009765625, -10.5341796875, -9.71826171875, -8.90234375, -8.08642578125, -7.2705078125, -6.45458984375, -5.638671875, -4.82275390625, -4.0068359375, -3.19091796875, -2.375, -1.55908203125, -0.7431640625, 0.07275390625, 0.888671875, 1.70458984375, 2.5205078125, 3.33642578125, 4.15234375, 4.96826171875, 5.7841796875, 6.60009765625, 7.416015625, 8.23193359375, 9.0478515625, 9.86376953125, 10.6796875, 11.49560546875, 12.3115234375, 13.12744140625, 13.943359375, 14.75927734375, 15.5751953125, 16.39111328125, 17.20703125, 18.02294921875, 18.8388671875, 19.65478515625, 20.470703125, 21.28662109375, 22.1025390625, 22.91845703125, 23.734375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 9.0, 3.0, 6.0, 10.0, 13.0, 16.0, 28.0, 38.0, 68.0, 85.0, 142.0, 190.0, 312.0, 488.0, 833.0, 1290.0, 2261.0, 3908.0, 7212.0, 13401.0, 25124.0, 47375.0, 87754.0, 148690.0, 203232.0, 197630.0, 137954.0, 78929.0, 42149.0, 22359.0, 11772.0, 6454.0, 3568.0, 1998.0, 1176.0, 738.0, 444.0, 265.0, 229.0, 120.0, 95.0, 55.0, 41.0, 23.0, 21.0, 17.0, 10.0, 7.0, 4.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-25.375, -24.60400390625, -23.8330078125, -23.06201171875, -22.291015625, -21.52001953125, -20.7490234375, -19.97802734375, -19.20703125, -18.43603515625, -17.6650390625, -16.89404296875, -16.123046875, -15.35205078125, -14.5810546875, -13.81005859375, -13.0390625, -12.26806640625, -11.4970703125, -10.72607421875, -9.955078125, -9.18408203125, -8.4130859375, -7.64208984375, -6.87109375, -6.10009765625, -5.3291015625, -4.55810546875, -3.787109375, -3.01611328125, -2.2451171875, -1.47412109375, -0.703125, 0.06787109375, 0.8388671875, 1.60986328125, 2.380859375, 3.15185546875, 3.9228515625, 4.69384765625, 5.46484375, 6.23583984375, 7.0068359375, 7.77783203125, 8.548828125, 9.31982421875, 10.0908203125, 10.86181640625, 11.6328125, 12.40380859375, 13.1748046875, 13.94580078125, 14.716796875, 15.48779296875, 16.2587890625, 17.02978515625, 17.80078125, 18.57177734375, 19.3427734375, 20.11376953125, 20.884765625, 21.65576171875, 22.4267578125, 23.19775390625, 23.96875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 7.0, 5.0, 8.0, 8.0, 8.0, 7.0, 15.0, 16.0, 28.0, 29.0, 19.0, 34.0, 33.0, 35.0, 39.0, 39.0, 49.0, 30.0, 46.0, 32.0, 49.0, 41.0, 48.0, 51.0, 34.0, 41.0, 23.0, 37.0, 27.0, 25.0, 29.0, 13.0, 19.0, 14.0, 15.0, 7.0, 13.0, 10.0, 11.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.609375, -16.060302734375, -15.51123046875, -14.962158203125, -14.4130859375, -13.864013671875, -13.31494140625, -12.765869140625, -12.216796875, -11.667724609375, -11.11865234375, -10.569580078125, -10.0205078125, -9.471435546875, -8.92236328125, -8.373291015625, -7.82421875, -7.275146484375, -6.72607421875, -6.177001953125, -5.6279296875, -5.078857421875, -4.52978515625, -3.980712890625, -3.431640625, -2.882568359375, -2.33349609375, -1.784423828125, -1.2353515625, -0.686279296875, -0.13720703125, 0.411865234375, 0.9609375, 1.510009765625, 2.05908203125, 2.608154296875, 3.1572265625, 3.706298828125, 4.25537109375, 4.804443359375, 5.353515625, 5.902587890625, 6.45166015625, 7.000732421875, 7.5498046875, 8.098876953125, 8.64794921875, 9.197021484375, 9.74609375, 10.295166015625, 10.84423828125, 11.393310546875, 11.9423828125, 12.491455078125, 13.04052734375, 13.589599609375, 14.138671875, 14.687744140625, 15.23681640625, 15.785888671875, 16.3349609375, 16.884033203125, 17.43310546875, 17.982177734375, 18.53125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 6.0, 8.0, 6.0, 9.0, 11.0, 10.0, 20.0, 27.0, 34.0, 62.0, 86.0, 130.0, 183.0, 231.0, 395.0, 619.0, 1006.0, 1840.0, 3099.0, 6069.0, 12690.0, 27234.0, 59602.0, 121533.0, 207617.0, 243011.0, 178878.0, 96526.0, 45742.0, 20750.0, 9780.0, 4882.0, 2525.0, 1404.0, 832.0, 540.0, 360.0, 220.0, 161.0, 101.0, 89.0, 54.0, 46.0, 29.0, 30.0, 19.0, 13.0, 14.0, 6.0, 8.0, 7.0, 1.0, 0.0, 4.0, 0.0, 2.0], "bins": [-11.9453125, -11.5869140625, -11.228515625, -10.8701171875, -10.51171875, -10.1533203125, -9.794921875, -9.4365234375, -9.078125, -8.7197265625, -8.361328125, -8.0029296875, -7.64453125, -7.2861328125, -6.927734375, -6.5693359375, -6.2109375, -5.8525390625, -5.494140625, -5.1357421875, -4.77734375, -4.4189453125, -4.060546875, -3.7021484375, -3.34375, -2.9853515625, -2.626953125, -2.2685546875, -1.91015625, -1.5517578125, -1.193359375, -0.8349609375, -0.4765625, -0.1181640625, 0.240234375, 0.5986328125, 0.95703125, 1.3154296875, 1.673828125, 2.0322265625, 2.390625, 2.7490234375, 3.107421875, 3.4658203125, 3.82421875, 4.1826171875, 4.541015625, 4.8994140625, 5.2578125, 5.6162109375, 5.974609375, 6.3330078125, 6.69140625, 7.0498046875, 7.408203125, 7.7666015625, 8.125, 8.4833984375, 8.841796875, 9.2001953125, 9.55859375, 9.9169921875, 10.275390625, 10.6337890625, 10.9921875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 4.0, 7.0, 5.0, 4.0, 9.0, 11.0, 16.0, 22.0, 29.0, 44.0, 43.0, 57.0, 52.0, 55.0, 52.0, 66.0, 68.0, 62.0, 68.0, 62.0, 59.0, 50.0, 34.0, 28.0, 27.0, 19.0, 15.0, 15.0, 8.0, 4.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005707740783691406, -0.0005525946617126465, -0.0005344152450561523, -0.0005162358283996582, -0.0004980564117431641, -0.0004798769950866699, -0.0004616975784301758, -0.00044351816177368164, -0.0004253387451171875, -0.00040715932846069336, -0.0003889799118041992, -0.0003708004951477051, -0.00035262107849121094, -0.0003344416618347168, -0.00031626224517822266, -0.0002980828285217285, -0.0002799034118652344, -0.00026172399520874023, -0.0002435445785522461, -0.00022536516189575195, -0.0002071857452392578, -0.00018900632858276367, -0.00017082691192626953, -0.0001526474952697754, -0.00013446807861328125, -0.00011628866195678711, -9.810924530029297e-05, -7.992982864379883e-05, -6.175041198730469e-05, -4.357099533081055e-05, -2.5391578674316406e-05, -7.212162017822266e-06, 1.0967254638671875e-05, 2.9146671295166016e-05, 4.7326087951660156e-05, 6.55055046081543e-05, 8.368492126464844e-05, 0.00010186433792114258, 0.00012004375457763672, 0.00013822317123413086, 0.000156402587890625, 0.00017458200454711914, 0.00019276142120361328, 0.00021094083786010742, 0.00022912025451660156, 0.0002472996711730957, 0.00026547908782958984, 0.000283658504486084, 0.0003018379211425781, 0.00032001733779907227, 0.0003381967544555664, 0.00035637617111206055, 0.0003745555877685547, 0.00039273500442504883, 0.00041091442108154297, 0.0004290938377380371, 0.00044727325439453125, 0.0004654526710510254, 0.00048363208770751953, 0.0005018115043640137, 0.0005199909210205078, 0.000538170337677002, 0.0005563497543334961, 0.0005745291709899902, 0.0005927085876464844]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 5.0, 6.0, 8.0, 17.0, 15.0, 21.0, 27.0, 37.0, 65.0, 97.0, 111.0, 181.0, 286.0, 495.0, 782.0, 1436.0, 2784.0, 6036.0, 13986.0, 35078.0, 85025.0, 179470.0, 265619.0, 232787.0, 128516.0, 55467.0, 22312.0, 9052.0, 4180.0, 1940.0, 1036.0, 566.0, 334.0, 233.0, 160.0, 109.0, 90.0, 48.0, 34.0, 28.0, 21.0, 10.0, 11.0, 7.0, 6.0, 9.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.296875, -14.764892578125, -14.23291015625, -13.700927734375, -13.1689453125, -12.636962890625, -12.10498046875, -11.572998046875, -11.041015625, -10.509033203125, -9.97705078125, -9.445068359375, -8.9130859375, -8.381103515625, -7.84912109375, -7.317138671875, -6.78515625, -6.253173828125, -5.72119140625, -5.189208984375, -4.6572265625, -4.125244140625, -3.59326171875, -3.061279296875, -2.529296875, -1.997314453125, -1.46533203125, -0.933349609375, -0.4013671875, 0.130615234375, 0.66259765625, 1.194580078125, 1.7265625, 2.258544921875, 2.79052734375, 3.322509765625, 3.8544921875, 4.386474609375, 4.91845703125, 5.450439453125, 5.982421875, 6.514404296875, 7.04638671875, 7.578369140625, 8.1103515625, 8.642333984375, 9.17431640625, 9.706298828125, 10.23828125, 10.770263671875, 11.30224609375, 11.834228515625, 12.3662109375, 12.898193359375, 13.43017578125, 13.962158203125, 14.494140625, 15.026123046875, 15.55810546875, 16.090087890625, 16.6220703125, 17.154052734375, 17.68603515625, 18.218017578125, 18.75]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 10.0, 10.0, 15.0, 12.0, 19.0, 24.0, 30.0, 26.0, 48.0, 55.0, 67.0, 71.0, 66.0, 71.0, 70.0, 74.0, 54.0, 57.0, 49.0, 36.0, 30.0, 28.0, 24.0, 19.0, 6.0, 14.0, 5.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.234375, -4.069580078125, -3.90478515625, -3.739990234375, -3.5751953125, -3.410400390625, -3.24560546875, -3.080810546875, -2.916015625, -2.751220703125, -2.58642578125, -2.421630859375, -2.2568359375, -2.092041015625, -1.92724609375, -1.762451171875, -1.59765625, -1.432861328125, -1.26806640625, -1.103271484375, -0.9384765625, -0.773681640625, -0.60888671875, -0.444091796875, -0.279296875, -0.114501953125, 0.05029296875, 0.215087890625, 0.3798828125, 0.544677734375, 0.70947265625, 0.874267578125, 1.0390625, 1.203857421875, 1.36865234375, 1.533447265625, 1.6982421875, 1.863037109375, 2.02783203125, 2.192626953125, 2.357421875, 2.522216796875, 2.68701171875, 2.851806640625, 3.0166015625, 3.181396484375, 3.34619140625, 3.510986328125, 3.67578125, 3.840576171875, 4.00537109375, 4.170166015625, 4.3349609375, 4.499755859375, 4.66455078125, 4.829345703125, 4.994140625, 5.158935546875, 5.32373046875, 5.488525390625, 5.6533203125, 5.818115234375, 5.98291015625, 6.147705078125, 6.3125]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 2.0, 2.0, 5.0, 4.0, 6.0, 3.0, 9.0, 5.0, 11.0, 11.0, 13.0, 14.0, 19.0, 27.0, 24.0, 38.0, 31.0, 42.0, 42.0, 37.0, 43.0, 51.0, 37.0, 45.0, 45.0, 50.0, 47.0, 27.0, 36.0, 40.0, 23.0, 37.0, 17.0, 28.0, 24.0, 18.0, 13.0, 18.0, 14.0, 9.0, 15.0, 6.0, 8.0, 2.0, 4.0, 0.0, 1.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-26.167091369628906, -25.39385414123535, -24.62061882019043, -23.847381591796875, -23.074146270751953, -22.3009090423584, -21.527673721313477, -20.754436492919922, -19.981201171875, -19.207963943481445, -18.434728622436523, -17.66149139404297, -16.888256072998047, -16.115018844604492, -15.34178352355957, -14.568546295166016, -13.795310020446777, -13.022073745727539, -12.2488374710083, -11.475601196289062, -10.702364921569824, -9.929128646850586, -9.155891418457031, -8.38265609741211, -7.609419345855713, -6.836183071136475, -6.062946796417236, -5.28971004486084, -4.516473770141602, -3.7432377338409424, -2.970001220703125, -2.1967649459838867, -1.4235286712646484, -0.6502923369407654, 0.12294399738311768, 0.8961803913116455, 1.6694166660308838, 2.442652940750122, 3.2158894538879395, 3.9891257286071777, 4.762362003326416, 5.535598278045654, 6.308834552764893, 7.082071304321289, 7.855307579040527, 8.628543853759766, 9.401780128479004, 10.175016403198242, 10.94825267791748, 11.721488952636719, 12.494725227355957, 13.267961502075195, 14.041197776794434, 14.814434051513672, 15.587671279907227, 16.36090660095215, 17.134143829345703, 17.907381057739258, 18.68061637878418, 19.453853607177734, 20.227088928222656, 21.00032615661621, 21.773561477661133, 22.546798706054688, 23.32003402709961]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 8.0, 7.0, 7.0, 10.0, 16.0, 14.0, 15.0, 23.0, 20.0, 23.0, 30.0, 28.0, 28.0, 31.0, 31.0, 38.0, 45.0, 38.0, 32.0, 43.0, 41.0, 40.0, 40.0, 49.0, 37.0, 40.0, 41.0, 32.0, 33.0, 25.0, 20.0, 24.0, 17.0, 17.0, 9.0, 8.0, 11.0, 7.0, 8.0, 3.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-26.76115608215332, -25.968358993530273, -25.175559997558594, -24.382762908935547, -23.5899658203125, -22.79716682434082, -22.004369735717773, -21.211570739746094, -20.418773651123047, -19.6259765625, -18.83317756652832, -18.040380477905273, -17.247583389282227, -16.454784393310547, -15.6619873046875, -14.869189262390137, -14.07639217376709, -13.283594131469727, -12.49079704284668, -11.697999000549316, -10.905200958251953, -10.112403869628906, -9.319605827331543, -8.52680778503418, -7.734010219573975, -6.9412126541137695, -6.148414611816406, -5.355617046356201, -4.562819480895996, -3.770021438598633, -2.9772238731384277, -2.1844258308410645, -1.3916282653808594, -0.59883052110672, 0.19396722316741943, 0.9867649078369141, 1.7795627117156982, 2.5723605155944824, 3.3651580810546875, 4.157956123352051, 4.950753688812256, 5.743551254272461, 6.536349296569824, 7.329146862030029, 8.121944427490234, 8.914742469787598, 9.707540512084961, 10.500337600708008, 11.293135643005371, 12.085933685302734, 12.878730773925781, 13.671528816223145, 14.464326858520508, 15.257123947143555, 16.049922943115234, 16.84272003173828, 17.635517120361328, 18.428314208984375, 19.221113204956055, 20.0139102935791, 20.80670738220215, 21.599506378173828, 22.392303466796875, 23.185100555419922, 23.9778995513916]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 4.0, 14.0, 17.0, 29.0, 56.0, 95.0, 176.0, 232.0, 364.0, 582.0, 928.0, 1379.0, 2169.0, 3466.0, 5365.0, 8122.0, 12753.0, 19295.0, 28341.0, 40491.0, 56435.0, 73880.0, 90355.0, 104036.0, 109316.0, 106855.0, 96702.0, 80628.0, 62678.0, 46290.0, 32736.0, 22349.0, 14970.0, 9874.0, 6337.0, 4069.0, 2589.0, 1674.0, 1089.0, 664.0, 420.0, 258.0, 184.0, 113.0, 60.0, 42.0, 24.0, 26.0, 7.0, 12.0, 6.0, 1.0, 4.0, 1.0, 1.0], "bins": [-15.9296875, -15.4569091796875, -14.984130859375, -14.5113525390625, -14.03857421875, -13.5657958984375, -13.093017578125, -12.6202392578125, -12.1474609375, -11.6746826171875, -11.201904296875, -10.7291259765625, -10.25634765625, -9.7835693359375, -9.310791015625, -8.8380126953125, -8.365234375, -7.8924560546875, -7.419677734375, -6.9468994140625, -6.47412109375, -6.0013427734375, -5.528564453125, -5.0557861328125, -4.5830078125, -4.1102294921875, -3.637451171875, -3.1646728515625, -2.69189453125, -2.2191162109375, -1.746337890625, -1.2735595703125, -0.80078125, -0.3280029296875, 0.144775390625, 0.6175537109375, 1.09033203125, 1.5631103515625, 2.035888671875, 2.5086669921875, 2.9814453125, 3.4542236328125, 3.927001953125, 4.3997802734375, 4.87255859375, 5.3453369140625, 5.818115234375, 6.2908935546875, 6.763671875, 7.2364501953125, 7.709228515625, 8.1820068359375, 8.65478515625, 9.1275634765625, 9.600341796875, 10.0731201171875, 10.5458984375, 11.0186767578125, 11.491455078125, 11.9642333984375, 12.43701171875, 12.9097900390625, 13.382568359375, 13.8553466796875, 14.328125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 4.0, 3.0, 7.0, 7.0, 4.0, 7.0, 7.0, 11.0, 12.0, 22.0, 19.0, 24.0, 28.0, 29.0, 21.0, 29.0, 34.0, 36.0, 30.0, 39.0, 29.0, 40.0, 44.0, 42.0, 30.0, 40.0, 43.0, 52.0, 50.0, 30.0, 32.0, 26.0, 28.0, 23.0, 32.0, 14.0, 12.0, 13.0, 9.0, 14.0, 4.0, 7.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0], "bins": [-27.609375, -26.84326171875, -26.0771484375, -25.31103515625, -24.544921875, -23.77880859375, -23.0126953125, -22.24658203125, -21.48046875, -20.71435546875, -19.9482421875, -19.18212890625, -18.416015625, -17.64990234375, -16.8837890625, -16.11767578125, -15.3515625, -14.58544921875, -13.8193359375, -13.05322265625, -12.287109375, -11.52099609375, -10.7548828125, -9.98876953125, -9.22265625, -8.45654296875, -7.6904296875, -6.92431640625, -6.158203125, -5.39208984375, -4.6259765625, -3.85986328125, -3.09375, -2.32763671875, -1.5615234375, -0.79541015625, -0.029296875, 0.73681640625, 1.5029296875, 2.26904296875, 3.03515625, 3.80126953125, 4.5673828125, 5.33349609375, 6.099609375, 6.86572265625, 7.6318359375, 8.39794921875, 9.1640625, 9.93017578125, 10.6962890625, 11.46240234375, 12.228515625, 12.99462890625, 13.7607421875, 14.52685546875, 15.29296875, 16.05908203125, 16.8251953125, 17.59130859375, 18.357421875, 19.12353515625, 19.8896484375, 20.65576171875, 21.421875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 10.0, 7.0, 11.0, 21.0, 38.0, 58.0, 63.0, 97.0, 136.0, 247.0, 406.0, 589.0, 959.0, 1435.0, 2199.0, 3262.0, 5001.0, 7482.0, 10989.0, 16615.0, 23658.0, 33595.0, 45404.0, 59843.0, 75083.0, 88748.0, 99304.0, 101935.0, 98326.0, 88346.0, 74747.0, 59450.0, 45487.0, 32779.0, 23120.0, 16306.0, 11062.0, 7514.0, 4922.0, 3277.0, 2014.0, 1389.0, 928.0, 573.0, 388.0, 259.0, 170.0, 131.0, 63.0, 42.0, 26.0, 11.0, 15.0, 8.0, 8.0, 5.0, 2.0, 2.0, 3.0], "bins": [-16.265625, -15.764892578125, -15.26416015625, -14.763427734375, -14.2626953125, -13.761962890625, -13.26123046875, -12.760498046875, -12.259765625, -11.759033203125, -11.25830078125, -10.757568359375, -10.2568359375, -9.756103515625, -9.25537109375, -8.754638671875, -8.25390625, -7.753173828125, -7.25244140625, -6.751708984375, -6.2509765625, -5.750244140625, -5.24951171875, -4.748779296875, -4.248046875, -3.747314453125, -3.24658203125, -2.745849609375, -2.2451171875, -1.744384765625, -1.24365234375, -0.742919921875, -0.2421875, 0.258544921875, 0.75927734375, 1.260009765625, 1.7607421875, 2.261474609375, 2.76220703125, 3.262939453125, 3.763671875, 4.264404296875, 4.76513671875, 5.265869140625, 5.7666015625, 6.267333984375, 6.76806640625, 7.268798828125, 7.76953125, 8.270263671875, 8.77099609375, 9.271728515625, 9.7724609375, 10.273193359375, 10.77392578125, 11.274658203125, 11.775390625, 12.276123046875, 12.77685546875, 13.277587890625, 13.7783203125, 14.279052734375, 14.77978515625, 15.280517578125, 15.78125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 5.0, 9.0, 9.0, 21.0, 16.0, 24.0, 19.0, 27.0, 24.0, 40.0, 38.0, 48.0, 38.0, 48.0, 46.0, 38.0, 58.0, 50.0, 53.0, 42.0, 44.0, 45.0, 46.0, 32.0, 22.0, 29.0, 17.0, 25.0, 15.0, 17.0, 11.0, 10.0, 10.0, 3.0, 6.0, 10.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.6875, -17.077392578125, -16.46728515625, -15.857177734375, -15.2470703125, -14.636962890625, -14.02685546875, -13.416748046875, -12.806640625, -12.196533203125, -11.58642578125, -10.976318359375, -10.3662109375, -9.756103515625, -9.14599609375, -8.535888671875, -7.92578125, -7.315673828125, -6.70556640625, -6.095458984375, -5.4853515625, -4.875244140625, -4.26513671875, -3.655029296875, -3.044921875, -2.434814453125, -1.82470703125, -1.214599609375, -0.6044921875, 0.005615234375, 0.61572265625, 1.225830078125, 1.8359375, 2.446044921875, 3.05615234375, 3.666259765625, 4.2763671875, 4.886474609375, 5.49658203125, 6.106689453125, 6.716796875, 7.326904296875, 7.93701171875, 8.547119140625, 9.1572265625, 9.767333984375, 10.37744140625, 10.987548828125, 11.59765625, 12.207763671875, 12.81787109375, 13.427978515625, 14.0380859375, 14.648193359375, 15.25830078125, 15.868408203125, 16.478515625, 17.088623046875, 17.69873046875, 18.308837890625, 18.9189453125, 19.529052734375, 20.13916015625, 20.749267578125, 21.359375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 10.0, 22.0, 23.0, 31.0, 42.0, 79.0, 109.0, 170.0, 271.0, 392.0, 647.0, 979.0, 1663.0, 2726.0, 4753.0, 8136.0, 13809.0, 24188.0, 41177.0, 66845.0, 101558.0, 137965.0, 158019.0, 150663.0, 120611.0, 84273.0, 52846.0, 31834.0, 18514.0, 10666.0, 6214.0, 3748.0, 2045.0, 1279.0, 821.0, 462.0, 340.0, 201.0, 148.0, 99.0, 58.0, 44.0, 24.0, 18.0, 12.0, 14.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-11.1875, -10.8560791015625, -10.524658203125, -10.1932373046875, -9.86181640625, -9.5303955078125, -9.198974609375, -8.8675537109375, -8.5361328125, -8.2047119140625, -7.873291015625, -7.5418701171875, -7.21044921875, -6.8790283203125, -6.547607421875, -6.2161865234375, -5.884765625, -5.5533447265625, -5.221923828125, -4.8905029296875, -4.55908203125, -4.2276611328125, -3.896240234375, -3.5648193359375, -3.2333984375, -2.9019775390625, -2.570556640625, -2.2391357421875, -1.90771484375, -1.5762939453125, -1.244873046875, -0.9134521484375, -0.58203125, -0.2506103515625, 0.080810546875, 0.4122314453125, 0.74365234375, 1.0750732421875, 1.406494140625, 1.7379150390625, 2.0693359375, 2.4007568359375, 2.732177734375, 3.0635986328125, 3.39501953125, 3.7264404296875, 4.057861328125, 4.3892822265625, 4.720703125, 5.0521240234375, 5.383544921875, 5.7149658203125, 6.04638671875, 6.3778076171875, 6.709228515625, 7.0406494140625, 7.3720703125, 7.7034912109375, 8.034912109375, 8.3663330078125, 8.69775390625, 9.0291748046875, 9.360595703125, 9.6920166015625, 10.0234375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 6.0, 1.0, 8.0, 12.0, 16.0, 22.0, 23.0, 27.0, 42.0, 59.0, 52.0, 76.0, 72.0, 82.0, 73.0, 97.0, 57.0, 60.0, 60.0, 38.0, 40.0, 20.0, 17.0, 17.0, 6.0, 8.0, 3.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013017654418945312, -0.001253172755241394, -0.0012045800685882568, -0.0011559873819351196, -0.0011073946952819824, -0.0010588020086288452, -0.001010209321975708, -0.0009616166353225708, -0.0009130239486694336, -0.0008644312620162964, -0.0008158385753631592, -0.000767245888710022, -0.0007186532020568848, -0.0006700605154037476, -0.0006214678287506104, -0.0005728751420974731, -0.0005242824554443359, -0.00047568976879119873, -0.0004270970821380615, -0.0003785043954849243, -0.0003299117088317871, -0.0002813190221786499, -0.0002327263355255127, -0.0001841336488723755, -0.00013554096221923828, -8.694827556610107e-05, -3.835558891296387e-05, 1.023709774017334e-05, 5.882978439331055e-05, 0.00010742247104644775, 0.00015601515769958496, 0.00020460784435272217, 0.0002532005310058594, 0.0003017932176589966, 0.0003503859043121338, 0.000398978590965271, 0.0004475712776184082, 0.0004961639642715454, 0.0005447566509246826, 0.0005933493375778198, 0.000641942024230957, 0.0006905347108840942, 0.0007391273975372314, 0.0007877200841903687, 0.0008363127708435059, 0.0008849054574966431, 0.0009334981441497803, 0.0009820908308029175, 0.0010306835174560547, 0.001079276204109192, 0.001127868890762329, 0.0011764615774154663, 0.0012250542640686035, 0.0012736469507217407, 0.001322239637374878, 0.0013708323240280151, 0.0014194250106811523, 0.0014680176973342896, 0.0015166103839874268, 0.001565203070640564, 0.0016137957572937012, 0.0016623884439468384, 0.0017109811305999756, 0.0017595738172531128, 0.00180816650390625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 9.0, 8.0, 15.0, 20.0, 44.0, 41.0, 80.0, 112.0, 159.0, 224.0, 355.0, 580.0, 963.0, 1525.0, 2496.0, 4062.0, 6760.0, 11373.0, 18433.0, 30445.0, 48094.0, 72901.0, 102180.0, 129142.0, 142881.0, 135274.0, 111461.0, 82203.0, 55437.0, 35822.0, 21724.0, 13146.0, 8061.0, 4922.0, 2877.0, 1712.0, 1086.0, 668.0, 447.0, 276.0, 177.0, 122.0, 88.0, 47.0, 32.0, 28.0, 19.0, 14.0, 8.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3984375, -9.0919189453125, -8.785400390625, -8.4788818359375, -8.17236328125, -7.8658447265625, -7.559326171875, -7.2528076171875, -6.9462890625, -6.6397705078125, -6.333251953125, -6.0267333984375, -5.72021484375, -5.4136962890625, -5.107177734375, -4.8006591796875, -4.494140625, -4.1876220703125, -3.881103515625, -3.5745849609375, -3.26806640625, -2.9615478515625, -2.655029296875, -2.3485107421875, -2.0419921875, -1.7354736328125, -1.428955078125, -1.1224365234375, -0.81591796875, -0.5093994140625, -0.202880859375, 0.1036376953125, 0.41015625, 0.7166748046875, 1.023193359375, 1.3297119140625, 1.63623046875, 1.9427490234375, 2.249267578125, 2.5557861328125, 2.8623046875, 3.1688232421875, 3.475341796875, 3.7818603515625, 4.08837890625, 4.3948974609375, 4.701416015625, 5.0079345703125, 5.314453125, 5.6209716796875, 5.927490234375, 6.2340087890625, 6.54052734375, 6.8470458984375, 7.153564453125, 7.4600830078125, 7.7666015625, 8.0731201171875, 8.379638671875, 8.6861572265625, 8.99267578125, 9.2991943359375, 9.605712890625, 9.9122314453125, 10.21875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 5.0, 4.0, 6.0, 8.0, 10.0, 8.0, 15.0, 16.0, 18.0, 26.0, 34.0, 30.0, 26.0, 42.0, 47.0, 40.0, 47.0, 49.0, 62.0, 60.0, 54.0, 50.0, 47.0, 49.0, 45.0, 42.0, 35.0, 19.0, 20.0, 24.0, 10.0, 12.0, 7.0, 6.0, 6.0, 3.0, 3.0, 4.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.85546875, -3.734588623046875, -3.61370849609375, -3.492828369140625, -3.3719482421875, -3.251068115234375, -3.13018798828125, -3.009307861328125, -2.888427734375, -2.767547607421875, -2.64666748046875, -2.525787353515625, -2.4049072265625, -2.284027099609375, -2.16314697265625, -2.042266845703125, -1.92138671875, -1.800506591796875, -1.67962646484375, -1.558746337890625, -1.4378662109375, -1.316986083984375, -1.19610595703125, -1.075225830078125, -0.954345703125, -0.833465576171875, -0.71258544921875, -0.591705322265625, -0.4708251953125, -0.349945068359375, -0.22906494140625, -0.108184814453125, 0.0126953125, 0.133575439453125, 0.25445556640625, 0.375335693359375, 0.4962158203125, 0.617095947265625, 0.73797607421875, 0.858856201171875, 0.979736328125, 1.100616455078125, 1.22149658203125, 1.342376708984375, 1.4632568359375, 1.584136962890625, 1.70501708984375, 1.825897216796875, 1.94677734375, 2.067657470703125, 2.18853759765625, 2.309417724609375, 2.4302978515625, 2.551177978515625, 2.67205810546875, 2.792938232421875, 2.913818359375, 3.034698486328125, 3.15557861328125, 3.276458740234375, 3.3973388671875, 3.518218994140625, 3.63909912109375, 3.759979248046875, 3.880859375]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 0.0, 4.0, 5.0, 11.0, 9.0, 10.0, 9.0, 12.0, 12.0, 15.0, 23.0, 27.0, 20.0, 26.0, 37.0, 36.0, 36.0, 50.0, 32.0, 59.0, 46.0, 44.0, 56.0, 41.0, 44.0, 31.0, 31.0, 26.0, 35.0, 19.0, 31.0, 28.0, 26.0, 18.0, 15.0, 15.0, 18.0, 3.0, 14.0, 6.0, 7.0, 5.0, 2.0, 4.0, 0.0, 3.0, 3.0, 1.0, 1.0], "bins": [-28.57404899597168, -27.79125213623047, -27.008453369140625, -26.22565460205078, -25.44285774230957, -24.66006088256836, -23.877262115478516, -23.094463348388672, -22.31166648864746, -21.52886962890625, -20.746070861816406, -19.963272094726562, -19.18047523498535, -18.39767837524414, -17.614879608154297, -16.832080841064453, -16.049283981323242, -15.266486167907715, -14.483688354492188, -13.70089054107666, -12.918092727661133, -12.135294914245605, -11.352497100830078, -10.56969928741455, -9.786901473999023, -9.004103660583496, -8.221305847167969, -7.438508033752441, -6.655710220336914, -5.872912406921387, -5.090114593505859, -4.307316780090332, -3.5245189666748047, -2.7417211532592773, -1.95892333984375, -1.1761255264282227, -0.3933277130126953, 0.38947010040283203, 1.1722679138183594, 1.9550657272338867, 2.737863540649414, 3.5206613540649414, 4.303459167480469, 5.086256980895996, 5.869054794311523, 6.651852607727051, 7.434650421142578, 8.217448234558105, 9.000246047973633, 9.78304386138916, 10.565841674804688, 11.348639488220215, 12.131437301635742, 12.91423511505127, 13.697032928466797, 14.479830741882324, 15.262628555297852, 16.045425415039062, 16.828224182128906, 17.61102294921875, 18.39381980895996, 19.176616668701172, 19.959415435791016, 20.74221420288086, 21.52501106262207]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 10.0, 6.0, 12.0, 9.0, 13.0, 16.0, 20.0, 18.0, 32.0, 27.0, 31.0, 29.0, 35.0, 35.0, 40.0, 49.0, 34.0, 42.0, 47.0, 54.0, 41.0, 49.0, 45.0, 36.0, 29.0, 38.0, 30.0, 26.0, 24.0, 22.0, 12.0, 19.0, 15.0, 15.0, 8.0, 11.0, 2.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.14990997314453, -27.194936752319336, -26.239961624145508, -25.284988403320312, -24.330015182495117, -23.375041961669922, -22.420066833496094, -21.4650936126709, -20.510120391845703, -19.555147171020508, -18.60017204284668, -17.645198822021484, -16.69022560119629, -15.735251426696777, -14.780277252197266, -13.82530403137207, -12.870329856872559, -11.915355682373047, -10.960382461547852, -10.00540828704834, -9.050435066223145, -8.095460891723633, -7.140487194061279, -6.185513496398926, -5.230539798736572, -4.275566101074219, -3.3205924034118652, -2.3656184673309326, -1.410644769668579, -0.4556708335876465, 0.49930286407470703, 1.4542765617370605, 2.409250259399414, 3.3642239570617676, 4.319197654724121, 5.274171829223633, 6.229145050048828, 7.18411922454834, 8.139093399047852, 9.094066619873047, 10.049039840698242, 11.004014015197754, 11.95898723602295, 12.913961410522461, 13.868934631347656, 14.823908805847168, 15.77888298034668, 16.733856201171875, 17.688831329345703, 18.6438045501709, 19.598779678344727, 20.553752899169922, 21.508726119995117, 22.463699340820312, 23.41867446899414, 24.373647689819336, 25.32862091064453, 26.283594131469727, 27.238569259643555, 28.19354248046875, 29.148515701293945, 30.10348892211914, 31.05846405029297, 32.01343536376953, 32.96841049194336]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 3.0, 18.0, 8.0, 10.0, 17.0, 30.0, 31.0, 42.0, 41.0, 60.0, 89.0, 109.0, 182.0, 244.0, 316.0, 495.0, 735.0, 1209.0, 1933.0, 3269.0, 6173.0, 1017118.0, 8065.0, 3942.0, 2265.0, 1414.0, 877.0, 560.0, 363.0, 233.0, 191.0, 140.0, 90.0, 79.0, 52.0, 59.0, 30.0, 29.0, 21.0, 10.0, 17.0, 8.0, 9.0, 4.0, 4.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-386.8968811035156, -374.68023681640625, -362.4635925292969, -350.2469482421875, -338.0303039550781, -325.81365966796875, -313.59698486328125, -301.38037109375, -289.1636962890625, -276.9470520019531, -264.73040771484375, -252.51376342773438, -240.297119140625, -228.08047485351562, -215.8638153076172, -203.6471710205078, -191.4305419921875, -179.21389770507812, -166.99725341796875, -154.78060913085938, -142.56396484375, -130.34732055664062, -118.13066101074219, -105.91401672363281, -93.69737243652344, -81.48072814941406, -69.26408386230469, -57.04743194580078, -44.830787658691406, -32.61414337158203, -20.397491455078125, -8.18084716796875, 4.0357666015625, 16.252412796020508, 28.469058990478516, 40.685707092285156, 52.90235137939453, 65.1189956665039, 77.33564758300781, 89.55229187011719, 101.76893615722656, 113.98558044433594, 126.20222473144531, 138.41888427734375, 150.63552856445312, 162.8521728515625, 175.06881713867188, 187.28546142578125, 199.50210571289062, 211.71875, 223.93539428710938, 236.15203857421875, 248.36868286132812, 260.5853271484375, 272.802001953125, 285.01861572265625, 297.23529052734375, 309.4519348144531, 321.6685791015625, 333.8852233886719, 346.10186767578125, 358.3185119628906, 370.53515625, 382.7518310546875, 394.96844482421875]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 17.0, 19.0, 30.0, 35.0, 42.0, 83.0, 112.0, 164.0, 202.0, 300.0, 380.0, 493.0, 624.0, 850.0, 1029.0, 1300.0, 1680.0, 2176.0, 2896.0, 4299.0, 7145.0, 16449.0, 224087.0, 51163432.0, 18634.0, 7597.0, 4552.0, 3058.0, 2189.0, 1699.0, 1341.0, 1069.0, 871.0, 609.0, 495.0, 387.0, 268.0, 237.0, 171.0, 93.0, 95.0, 70.0, 43.0, 30.0, 25.0, 12.0, 9.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-537.3463134765625, -521.5675048828125, -505.78863525390625, -490.0097961425781, -474.23095703125, -458.4521179199219, -442.67327880859375, -426.89447021484375, -411.1156005859375, -395.3367614746094, -379.55792236328125, -363.7790832519531, -348.000244140625, -332.2214050292969, -316.44256591796875, -300.66375732421875, -284.8849182128906, -269.1060791015625, -253.32723999023438, -237.54840087890625, -221.76956176757812, -205.99072265625, -190.21189880371094, -174.4330596923828, -158.6542205810547, -142.87538146972656, -127.09654235839844, -111.31771087646484, -95.53887176513672, -79.7600326538086, -63.981201171875, -48.202362060546875, -32.423492431640625, -16.644655227661133, -0.8658180236816406, 14.913017272949219, 30.691856384277344, 46.47069549560547, 62.24952697753906, 78.02836608886719, 93.80720520019531, 109.58604431152344, 125.36488342285156, 141.14370727539062, 156.92254638671875, 172.70138549804688, 188.480224609375, 204.25906372070312, 220.03790283203125, 235.81674194335938, 251.5955810546875, 267.3744201660156, 283.15325927734375, 298.9320983886719, 314.7109375, 330.48974609375, 346.26861572265625, 362.0474548339844, 377.8262939453125, 393.6051330566406, 409.38397216796875, 425.1628112792969, 440.941650390625, 456.720458984375, 472.4992980957031]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 3.0, 11.0, 16.0, 24.0, 51.0, 48.0, 77.0, 122.0, 198.0, 294.0, 476.0, 760.0, 1215.0, 1902.0, 3002.0, 4863.0, 7764.0, 12456.0, 20614.0, 34024.0, 58659.0, 102562.0, 184849.0, 354541.0, 749986.0, 1615059.0, 1610177.0, 743795.0, 351989.0, 184271.0, 101824.0, 58280.0, 34259.0, 20373.0, 12402.0, 7658.0, 4692.0, 2864.0, 1939.0, 1216.0, 767.0, 459.0, 324.0, 179.0, 151.0, 99.0, 54.0, 41.0, 22.0, 16.0, 7.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.34375, -59.22802734375, -57.1123046875, -54.99658203125, -52.880859375, -50.76513671875, -48.6494140625, -46.53369140625, -44.41796875, -42.30224609375, -40.1865234375, -38.07080078125, -35.955078125, -33.83935546875, -31.7236328125, -29.60791015625, -27.4921875, -25.37646484375, -23.2607421875, -21.14501953125, -19.029296875, -16.91357421875, -14.7978515625, -12.68212890625, -10.56640625, -8.45068359375, -6.3349609375, -4.21923828125, -2.103515625, 0.01220703125, 2.1279296875, 4.24365234375, 6.359375, 8.47509765625, 10.5908203125, 12.70654296875, 14.822265625, 16.93798828125, 19.0537109375, 21.16943359375, 23.28515625, 25.40087890625, 27.5166015625, 29.63232421875, 31.748046875, 33.86376953125, 35.9794921875, 38.09521484375, 40.2109375, 42.32666015625, 44.4423828125, 46.55810546875, 48.673828125, 50.78955078125, 52.9052734375, 55.02099609375, 57.13671875, 59.25244140625, 61.3681640625, 63.48388671875, 65.599609375, 67.71533203125, 69.8310546875, 71.94677734375, 74.0625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 14.0, 2.0, 8.0, 13.0, 8.0, 12.0, 19.0, 17.0, 21.0, 33.0, 39.0, 46.0, 56.0, 55.0, 87.0, 103.0, 159.0, 196.0, 191.0, 176.0, 170.0, 139.0, 107.0, 74.0, 54.0, 44.0, 33.0, 25.0, 13.0, 20.0, 23.0, 15.0, 9.0, 4.0, 10.0, 8.0, 9.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.0625, -39.7646484375, -38.466796875, -37.1689453125, -35.87109375, -34.5732421875, -33.275390625, -31.9775390625, -30.6796875, -29.3818359375, -28.083984375, -26.7861328125, -25.48828125, -24.1904296875, -22.892578125, -21.5947265625, -20.296875, -18.9990234375, -17.701171875, -16.4033203125, -15.10546875, -13.8076171875, -12.509765625, -11.2119140625, -9.9140625, -8.6162109375, -7.318359375, -6.0205078125, -4.72265625, -3.4248046875, -2.126953125, -0.8291015625, 0.46875, 1.7666015625, 3.064453125, 4.3623046875, 5.66015625, 6.9580078125, 8.255859375, 9.5537109375, 10.8515625, 12.1494140625, 13.447265625, 14.7451171875, 16.04296875, 17.3408203125, 18.638671875, 19.9365234375, 21.234375, 22.5322265625, 23.830078125, 25.1279296875, 26.42578125, 27.7236328125, 29.021484375, 30.3193359375, 31.6171875, 32.9150390625, 34.212890625, 35.5107421875, 36.80859375, 38.1064453125, 39.404296875, 40.7021484375, 42.0]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 8.0, 12.0, 30.0, 54.0, 40.0, 86.0, 138.0, 164.0, 287.0, 403.0, 686.0, 1163.0, 1862.0, 3026.0, 4899.0, 8118.0, 12906.0, 21629.0, 35074.0, 56471.0, 91955.0, 148269.0, 242110.0, 428265.0, 1049957.0, 2172243.0, 988487.0, 413488.0, 233537.0, 144243.0, 88870.0, 55090.0, 34012.0, 20698.0, 12627.0, 7919.0, 4819.0, 2982.0, 1733.0, 1144.0, 719.0, 423.0, 280.0, 184.0, 116.0, 77.0, 47.0, 33.0, 21.0, 13.0, 12.0, 6.0, 5.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0], "bins": [-36.0625, -34.87890625, -33.6953125, -32.51171875, -31.328125, -30.14453125, -28.9609375, -27.77734375, -26.59375, -25.41015625, -24.2265625, -23.04296875, -21.859375, -20.67578125, -19.4921875, -18.30859375, -17.125, -15.94140625, -14.7578125, -13.57421875, -12.390625, -11.20703125, -10.0234375, -8.83984375, -7.65625, -6.47265625, -5.2890625, -4.10546875, -2.921875, -1.73828125, -0.5546875, 0.62890625, 1.8125, 2.99609375, 4.1796875, 5.36328125, 6.546875, 7.73046875, 8.9140625, 10.09765625, 11.28125, 12.46484375, 13.6484375, 14.83203125, 16.015625, 17.19921875, 18.3828125, 19.56640625, 20.75, 21.93359375, 23.1171875, 24.30078125, 25.484375, 26.66796875, 27.8515625, 29.03515625, 30.21875, 31.40234375, 32.5859375, 33.76953125, 34.953125, 36.13671875, 37.3203125, 38.50390625, 39.6875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 3.0, 8.0, 6.0, 8.0, 9.0, 9.0, 11.0, 18.0, 21.0, 23.0, 31.0, 47.0, 48.0, 60.0, 77.0, 116.0, 204.0, 326.0, 294.0, 193.0, 130.0, 77.0, 51.0, 49.0, 48.0, 23.0, 24.0, 21.0, 21.0, 11.0, 14.0, 12.0, 6.0, 7.0, 5.0, 0.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.90625, -57.90478515625, -55.9033203125, -53.90185546875, -51.900390625, -49.89892578125, -47.8974609375, -45.89599609375, -43.89453125, -41.89306640625, -39.8916015625, -37.89013671875, -35.888671875, -33.88720703125, -31.8857421875, -29.88427734375, -27.8828125, -25.88134765625, -23.8798828125, -21.87841796875, -19.876953125, -17.87548828125, -15.8740234375, -13.87255859375, -11.87109375, -9.86962890625, -7.8681640625, -5.86669921875, -3.865234375, -1.86376953125, 0.1376953125, 2.13916015625, 4.140625, 6.14208984375, 8.1435546875, 10.14501953125, 12.146484375, 14.14794921875, 16.1494140625, 18.15087890625, 20.15234375, 22.15380859375, 24.1552734375, 26.15673828125, 28.158203125, 30.15966796875, 32.1611328125, 34.16259765625, 36.1640625, 38.16552734375, 40.1669921875, 42.16845703125, 44.169921875, 46.17138671875, 48.1728515625, 50.17431640625, 52.17578125, 54.17724609375, 56.1787109375, 58.18017578125, 60.181640625, 62.18310546875, 64.1845703125, 66.18603515625, 68.1875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 13.0, 24.0, 32.0, 38.0, 66.0, 107.0, 135.0, 210.0, 344.0, 573.0, 913.0, 1640.0, 2976.0, 5554.0, 10394.0, 19349.0, 36654.0, 72488.0, 192352.0, 5591775.0, 202148.0, 73578.0, 37120.0, 19425.0, 10387.0, 5606.0, 3107.0, 1770.0, 1030.0, 584.0, 384.0, 249.0, 152.0, 94.0, 56.0, 31.0, 20.0, 17.0, 9.0, 9.0, 3.0, 2.0, 4.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-108.875, -105.720703125, -102.56640625, -99.412109375, -96.2578125, -93.103515625, -89.94921875, -86.794921875, -83.640625, -80.486328125, -77.33203125, -74.177734375, -71.0234375, -67.869140625, -64.71484375, -61.560546875, -58.40625, -55.251953125, -52.09765625, -48.943359375, -45.7890625, -42.634765625, -39.48046875, -36.326171875, -33.171875, -30.017578125, -26.86328125, -23.708984375, -20.5546875, -17.400390625, -14.24609375, -11.091796875, -7.9375, -4.783203125, -1.62890625, 1.525390625, 4.6796875, 7.833984375, 10.98828125, 14.142578125, 17.296875, 20.451171875, 23.60546875, 26.759765625, 29.9140625, 33.068359375, 36.22265625, 39.376953125, 42.53125, 45.685546875, 48.83984375, 51.994140625, 55.1484375, 58.302734375, 61.45703125, 64.611328125, 67.765625, 70.919921875, 74.07421875, 77.228515625, 80.3828125, 83.537109375, 86.69140625, 89.845703125, 93.0]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 4.0, 4.0, 8.0, 11.0, 11.0, 12.0, 10.0, 11.0, 15.0, 20.0, 28.0, 30.0, 35.0, 28.0, 46.0, 41.0, 46.0, 73.0, 166.0, 296.0, 330.0, 242.0, 114.0, 63.0, 58.0, 43.0, 39.0, 28.0, 33.0, 22.0, 23.0, 35.0, 17.0, 15.0, 11.0, 13.0, 8.0, 11.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.3125, -80.5615234375, -77.810546875, -75.0595703125, -72.30859375, -69.5576171875, -66.806640625, -64.0556640625, -61.3046875, -58.5537109375, -55.802734375, -53.0517578125, -50.30078125, -47.5498046875, -44.798828125, -42.0478515625, -39.296875, -36.5458984375, -33.794921875, -31.0439453125, -28.29296875, -25.5419921875, -22.791015625, -20.0400390625, -17.2890625, -14.5380859375, -11.787109375, -9.0361328125, -6.28515625, -3.5341796875, -0.783203125, 1.9677734375, 4.71875, 7.4697265625, 10.220703125, 12.9716796875, 15.72265625, 18.4736328125, 21.224609375, 23.9755859375, 26.7265625, 29.4775390625, 32.228515625, 34.9794921875, 37.73046875, 40.4814453125, 43.232421875, 45.9833984375, 48.734375, 51.4853515625, 54.236328125, 56.9873046875, 59.73828125, 62.4892578125, 65.240234375, 67.9912109375, 70.7421875, 73.4931640625, 76.244140625, 78.9951171875, 81.74609375, 84.4970703125, 87.248046875, 89.9990234375, 92.75]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 5.0, 13.0, 10.0, 18.0, 30.0, 43.0, 49.0, 61.0, 91.0, 135.0, 176.0, 113.0, 61.0, 51.0, 30.0, 29.0, 28.0, 13.0, 8.0, 11.0, 10.0, 3.0, 6.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2196.351318359375, -2126.36474609375, -2056.3779296875, -1986.391357421875, -1916.4046630859375, -1846.41796875, -1776.431396484375, -1706.4447021484375, -1636.4580078125, -1566.4713134765625, -1496.4847412109375, -1426.498046875, -1356.5113525390625, -1286.524658203125, -1216.5380859375, -1146.5513916015625, -1076.5648193359375, -1006.5781860351562, -936.5914916992188, -866.6048583984375, -796.6181640625, -726.6315307617188, -656.6448974609375, -586.658203125, -516.6715698242188, -446.6849060058594, -376.6982421875, -306.71160888671875, -236.72494506835938, -166.73828125, -96.75164794921875, -26.764984130859375, 43.2216796875, 113.20833587646484, 183.1949920654297, 253.181640625, 323.1683044433594, 393.15496826171875, 463.1416015625, 533.1282958984375, 603.1149291992188, 673.1015625, 743.0882568359375, 813.0748901367188, 883.0615234375, 953.0482177734375, 1023.0348510742188, 1093.021484375, 1163.0081787109375, 1232.994873046875, 1302.9814453125, 1372.9681396484375, 1442.954833984375, 1512.94140625, 1582.9281005859375, 1652.914794921875, 1722.9013671875, 1792.8880615234375, 1862.8746337890625, 1932.861328125, 2002.8480224609375, 2072.834716796875, 2142.8212890625, 2212.807861328125, 2282.794677734375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 4.0, 7.0, 5.0, 12.0, 14.0, 11.0, 14.0, 26.0, 23.0, 28.0, 32.0, 32.0, 42.0, 62.0, 99.0, 128.0, 97.0, 66.0, 56.0, 43.0, 37.0, 15.0, 22.0, 28.0, 21.0, 16.0, 14.0, 10.0, 15.0, 4.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2089.05224609375, -2023.41552734375, -1957.7786865234375, -1892.1419677734375, -1826.505126953125, -1760.868408203125, -1695.231689453125, -1629.594970703125, -1563.9581298828125, -1498.3214111328125, -1432.6845703125, -1367.0478515625, -1301.4111328125, -1235.7742919921875, -1170.1375732421875, -1104.500732421875, -1038.864013671875, -973.2272338867188, -907.5904541015625, -841.9537353515625, -776.3169555664062, -710.68017578125, -645.04345703125, -579.4066772460938, -513.7698974609375, -448.13311767578125, -382.4963684082031, -316.859619140625, -251.22283935546875, -185.5860595703125, -119.94931030273438, -54.31256103515625, 11.32421875, 76.96098327636719, 142.59774780273438, 208.23451232910156, 273.87127685546875, 339.508056640625, 405.1448059082031, 470.78155517578125, 536.4183349609375, 602.0551147460938, 667.69189453125, 733.32861328125, 798.9653930664062, 864.6021728515625, 930.2388916015625, 995.8756713867188, 1061.512451171875, 1127.149169921875, 1192.7860107421875, 1258.4227294921875, 1324.0595703125, 1389.6962890625, 1455.3330078125, 1520.9697265625, 1586.6065673828125, 1652.2432861328125, 1717.880126953125, 1783.516845703125, 1849.153564453125, 1914.7904052734375, 1980.4271240234375, 2046.06396484375, 2111.70068359375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 11.0, 14.0, 22.0, 32.0, 39.0, 43.0, 97.0, 137.0, 230.0, 360.0, 577.0, 984.0, 1763.0, 2949.0, 5569.0, 10788.0, 23874.0, 70588.0, 398752.0, 3289919.0, 285226.0, 57991.0, 21490.0, 10036.0, 5295.0, 2892.0, 1732.0, 1007.0, 656.0, 376.0, 247.0, 181.0, 130.0, 83.0, 70.0, 38.0, 21.0, 15.0, 14.0, 6.0, 6.0, 4.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-12.5234375, -12.1119384765625, -11.700439453125, -11.2889404296875, -10.87744140625, -10.4659423828125, -10.054443359375, -9.6429443359375, -9.2314453125, -8.8199462890625, -8.408447265625, -7.9969482421875, -7.58544921875, -7.1739501953125, -6.762451171875, -6.3509521484375, -5.939453125, -5.5279541015625, -5.116455078125, -4.7049560546875, -4.29345703125, -3.8819580078125, -3.470458984375, -3.0589599609375, -2.6474609375, -2.2359619140625, -1.824462890625, -1.4129638671875, -1.00146484375, -0.5899658203125, -0.178466796875, 0.2330322265625, 0.64453125, 1.0560302734375, 1.467529296875, 1.8790283203125, 2.29052734375, 2.7020263671875, 3.113525390625, 3.5250244140625, 3.9365234375, 4.3480224609375, 4.759521484375, 5.1710205078125, 5.58251953125, 5.9940185546875, 6.405517578125, 6.8170166015625, 7.228515625, 7.6400146484375, 8.051513671875, 8.4630126953125, 8.87451171875, 9.2860107421875, 9.697509765625, 10.1090087890625, 10.5205078125, 10.9320068359375, 11.343505859375, 11.7550048828125, 12.16650390625, 12.5780029296875, 12.989501953125, 13.4010009765625, 13.8125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 6.0, 4.0, 2.0, 9.0, 7.0, 8.0, 9.0, 15.0, 28.0, 50.0, 66.0, 98.0, 140.0, 169.0, 113.0, 83.0, 67.0, 37.0, 24.0, 8.0, 14.0, 6.0, 2.0, 1.0, 5.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.224609375, -2.15802001953125, -2.0914306640625, -2.02484130859375, -1.958251953125, -1.89166259765625, -1.8250732421875, -1.75848388671875, -1.69189453125, -1.62530517578125, -1.5587158203125, -1.49212646484375, -1.425537109375, -1.35894775390625, -1.2923583984375, -1.22576904296875, -1.1591796875, -1.09259033203125, -1.0260009765625, -0.95941162109375, -0.892822265625, -0.82623291015625, -0.7596435546875, -0.69305419921875, -0.62646484375, -0.55987548828125, -0.4932861328125, -0.42669677734375, -0.360107421875, -0.29351806640625, -0.2269287109375, -0.16033935546875, -0.09375, -0.02716064453125, 0.0394287109375, 0.10601806640625, 0.172607421875, 0.23919677734375, 0.3057861328125, 0.37237548828125, 0.43896484375, 0.50555419921875, 0.5721435546875, 0.63873291015625, 0.705322265625, 0.77191162109375, 0.8385009765625, 0.90509033203125, 0.9716796875, 1.03826904296875, 1.1048583984375, 1.17144775390625, 1.238037109375, 1.30462646484375, 1.3712158203125, 1.43780517578125, 1.50439453125, 1.57098388671875, 1.6375732421875, 1.70416259765625, 1.770751953125, 1.83734130859375, 1.9039306640625, 1.97052001953125, 2.037109375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 7.0, 8.0, 19.0, 11.0, 26.0, 35.0, 57.0, 96.0, 155.0, 208.0, 376.0, 653.0, 1028.0, 1993.0, 3505.0, 6813.0, 14246.0, 31626.0, 76637.0, 211754.0, 710720.0, 2104556.0, 688145.0, 206752.0, 75385.0, 30773.0, 13784.0, 6713.0, 3499.0, 1950.0, 1052.0, 620.0, 347.0, 253.0, 157.0, 93.0, 66.0, 42.0, 37.0, 29.0, 17.0, 11.0, 12.0, 5.0, 3.0, 4.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.046875, -8.7501220703125, -8.453369140625, -8.1566162109375, -7.85986328125, -7.5631103515625, -7.266357421875, -6.9696044921875, -6.6728515625, -6.3760986328125, -6.079345703125, -5.7825927734375, -5.48583984375, -5.1890869140625, -4.892333984375, -4.5955810546875, -4.298828125, -4.0020751953125, -3.705322265625, -3.4085693359375, -3.11181640625, -2.8150634765625, -2.518310546875, -2.2215576171875, -1.9248046875, -1.6280517578125, -1.331298828125, -1.0345458984375, -0.73779296875, -0.4410400390625, -0.144287109375, 0.1524658203125, 0.44921875, 0.7459716796875, 1.042724609375, 1.3394775390625, 1.63623046875, 1.9329833984375, 2.229736328125, 2.5264892578125, 2.8232421875, 3.1199951171875, 3.416748046875, 3.7135009765625, 4.01025390625, 4.3070068359375, 4.603759765625, 4.9005126953125, 5.197265625, 5.4940185546875, 5.790771484375, 6.0875244140625, 6.38427734375, 6.6810302734375, 6.977783203125, 7.2745361328125, 7.5712890625, 7.8680419921875, 8.164794921875, 8.4615478515625, 8.75830078125, 9.0550537109375, 9.351806640625, 9.6485595703125, 9.9453125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 2.0, 4.0, 4.0, 7.0, 7.0, 13.0, 15.0, 22.0, 35.0, 31.0, 52.0, 60.0, 88.0, 105.0, 151.0, 213.0, 324.0, 459.0, 764.0, 524.0, 332.0, 230.0, 154.0, 135.0, 89.0, 67.0, 49.0, 28.0, 25.0, 24.0, 21.0, 12.0, 12.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.83203125, -3.69287109375, -3.5537109375, -3.41455078125, -3.275390625, -3.13623046875, -2.9970703125, -2.85791015625, -2.71875, -2.57958984375, -2.4404296875, -2.30126953125, -2.162109375, -2.02294921875, -1.8837890625, -1.74462890625, -1.60546875, -1.46630859375, -1.3271484375, -1.18798828125, -1.048828125, -0.90966796875, -0.7705078125, -0.63134765625, -0.4921875, -0.35302734375, -0.2138671875, -0.07470703125, 0.064453125, 0.20361328125, 0.3427734375, 0.48193359375, 0.62109375, 0.76025390625, 0.8994140625, 1.03857421875, 1.177734375, 1.31689453125, 1.4560546875, 1.59521484375, 1.734375, 1.87353515625, 2.0126953125, 2.15185546875, 2.291015625, 2.43017578125, 2.5693359375, 2.70849609375, 2.84765625, 2.98681640625, 3.1259765625, 3.26513671875, 3.404296875, 3.54345703125, 3.6826171875, 3.82177734375, 3.9609375, 4.10009765625, 4.2392578125, 4.37841796875, 4.517578125, 4.65673828125, 4.7958984375, 4.93505859375, 5.07421875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 10.0, 11.0, 21.0, 33.0, 37.0, 79.0, 98.0, 135.0, 133.0, 149.0, 88.0, 78.0, 50.0, 27.0, 25.0, 5.0, 11.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-49.77008056640625, -48.440250396728516, -47.11042022705078, -45.78059387207031, -44.45076370239258, -43.120933532714844, -41.79110336303711, -40.461273193359375, -39.131446838378906, -37.80161666870117, -36.47178649902344, -35.14196014404297, -33.812129974365234, -32.4822998046875, -31.152469635009766, -29.82263946533203, -28.492809295654297, -27.162979125976562, -25.83315086364746, -24.503320693969727, -23.173492431640625, -21.84366226196289, -20.513832092285156, -19.184001922607422, -17.85417366027832, -16.524343490600586, -15.194515228271484, -13.86468505859375, -12.534855842590332, -11.205026626586914, -9.87519645690918, -8.545367240905762, -7.215541839599609, -5.885712623596191, -4.555882930755615, -3.226053476333618, -1.896224021911621, -0.5663948059082031, 0.763434886932373, 2.093264579772949, 3.423093795776367, 4.752923011779785, 6.082752704620361, 7.4125823974609375, 8.742411613464355, 10.072240829467773, 11.402070999145508, 12.731900215148926, 14.061729431152344, 15.391558647155762, 16.72138786315918, 18.051218032836914, 19.381046295166016, 20.71087646484375, 22.040706634521484, 23.37053680419922, 24.70036506652832, 26.030195236206055, 27.360023498535156, 28.68985366821289, 30.019683837890625, 31.349512100219727, 32.67934036254883, 34.00917053222656, 35.3390007019043]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 8.0, 6.0, 6.0, 8.0, 15.0, 16.0, 5.0, 12.0, 26.0, 27.0, 28.0, 42.0, 37.0, 40.0, 51.0, 52.0, 52.0, 53.0, 37.0, 42.0, 41.0, 53.0, 43.0, 31.0, 40.0, 28.0, 36.0, 25.0, 28.0, 20.0, 21.0, 17.0, 14.0, 8.0, 15.0, 8.0, 4.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.163835525512695, -23.426963806152344, -22.690092086791992, -21.95322036743164, -21.216346740722656, -20.479475021362305, -19.742603302001953, -19.0057315826416, -18.26885986328125, -17.5319881439209, -16.795116424560547, -16.058242797851562, -15.321371078491211, -14.58449935913086, -13.847627639770508, -13.110755920410156, -12.373882293701172, -11.63701057434082, -10.900137901306152, -10.1632661819458, -9.426393508911133, -8.689521789550781, -7.95265007019043, -7.21577787399292, -6.47890567779541, -5.7420334815979, -5.005161285400391, -4.268289566040039, -3.5314173698425293, -2.7945451736450195, -2.057673454284668, -1.3208012580871582, -0.5839309692382812, 0.15294110774993896, 0.8898131847381592, 1.6266851425170898, 2.3635573387145996, 3.1004295349121094, 3.837301254272461, 4.574173450469971, 5.3110456466674805, 6.04791784286499, 6.7847900390625, 7.521661758422852, 8.258533477783203, 8.995406150817871, 9.732277870178223, 10.46915054321289, 11.206022262573242, 11.942893981933594, 12.679766654968262, 13.416638374328613, 14.153511047363281, 14.890382766723633, 15.627254486083984, 16.364126205444336, 17.100997924804688, 17.83786964416504, 18.57474136352539, 19.311614990234375, 20.048486709594727, 20.785358428955078, 21.52223014831543, 22.25910186767578, 22.995975494384766]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 7.0, 12.0, 20.0, 18.0, 36.0, 50.0, 78.0, 116.0, 191.0, 234.0, 361.0, 570.0, 798.0, 1306.0, 2039.0, 3274.0, 5732.0, 11406.0, 25847.0, 73771.0, 295413.0, 444674.0, 113605.0, 35939.0, 14796.0, 7288.0, 4052.0, 2450.0, 1498.0, 968.0, 661.0, 415.0, 297.0, 195.0, 145.0, 104.0, 66.0, 33.0, 31.0, 12.0, 17.0, 14.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.375, -5.21771240234375, -5.0604248046875, -4.90313720703125, -4.745849609375, -4.58856201171875, -4.4312744140625, -4.27398681640625, -4.11669921875, -3.95941162109375, -3.8021240234375, -3.64483642578125, -3.487548828125, -3.33026123046875, -3.1729736328125, -3.01568603515625, -2.8583984375, -2.70111083984375, -2.5438232421875, -2.38653564453125, -2.229248046875, -2.07196044921875, -1.9146728515625, -1.75738525390625, -1.60009765625, -1.44281005859375, -1.2855224609375, -1.12823486328125, -0.970947265625, -0.81365966796875, -0.6563720703125, -0.49908447265625, -0.341796875, -0.18450927734375, -0.0272216796875, 0.13006591796875, 0.287353515625, 0.44464111328125, 0.6019287109375, 0.75921630859375, 0.91650390625, 1.07379150390625, 1.2310791015625, 1.38836669921875, 1.545654296875, 1.70294189453125, 1.8602294921875, 2.01751708984375, 2.1748046875, 2.33209228515625, 2.4893798828125, 2.64666748046875, 2.803955078125, 2.96124267578125, 3.1185302734375, 3.27581787109375, 3.43310546875, 3.59039306640625, 3.7476806640625, 3.90496826171875, 4.062255859375, 4.21954345703125, 4.3768310546875, 4.53411865234375, 4.69140625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 5.0, 6.0, 7.0, 8.0, 7.0, 24.0, 27.0, 43.0, 53.0, 67.0, 102.0, 116.0, 96.0, 108.0, 86.0, 60.0, 49.0, 33.0, 19.0, 20.0, 10.0, 10.0, 7.0, 5.0, 3.0, 2.0, 1.0, 5.0, 2.0, 3.0, 4.0, 0.0, 5.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.017578125, -1.95147705078125, -1.8853759765625, -1.81927490234375, -1.753173828125, -1.68707275390625, -1.6209716796875, -1.55487060546875, -1.48876953125, -1.42266845703125, -1.3565673828125, -1.29046630859375, -1.224365234375, -1.15826416015625, -1.0921630859375, -1.02606201171875, -0.9599609375, -0.89385986328125, -0.8277587890625, -0.76165771484375, -0.695556640625, -0.62945556640625, -0.5633544921875, -0.49725341796875, -0.43115234375, -0.36505126953125, -0.2989501953125, -0.23284912109375, -0.166748046875, -0.10064697265625, -0.0345458984375, 0.03155517578125, 0.09765625, 0.16375732421875, 0.2298583984375, 0.29595947265625, 0.362060546875, 0.42816162109375, 0.4942626953125, 0.56036376953125, 0.62646484375, 0.69256591796875, 0.7586669921875, 0.82476806640625, 0.890869140625, 0.95697021484375, 1.0230712890625, 1.08917236328125, 1.1552734375, 1.22137451171875, 1.2874755859375, 1.35357666015625, 1.419677734375, 1.48577880859375, 1.5518798828125, 1.61798095703125, 1.68408203125, 1.75018310546875, 1.8162841796875, 1.88238525390625, 1.948486328125, 2.01458740234375, 2.0806884765625, 2.14678955078125, 2.212890625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 5.0, 4.0, 6.0, 7.0, 17.0, 23.0, 38.0, 43.0, 75.0, 146.0, 225.0, 444.0, 810.0, 1809.0, 4006.0, 9711.0, 25965.0, 85299.0, 351550.0, 418175.0, 100910.0, 30342.0, 10612.0, 4368.0, 1927.0, 985.0, 475.0, 244.0, 115.0, 82.0, 53.0, 23.0, 25.0, 10.0, 10.0, 6.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.875, -8.6065673828125, -8.338134765625, -8.0697021484375, -7.80126953125, -7.5328369140625, -7.264404296875, -6.9959716796875, -6.7275390625, -6.4591064453125, -6.190673828125, -5.9222412109375, -5.65380859375, -5.3853759765625, -5.116943359375, -4.8485107421875, -4.580078125, -4.3116455078125, -4.043212890625, -3.7747802734375, -3.50634765625, -3.2379150390625, -2.969482421875, -2.7010498046875, -2.4326171875, -2.1641845703125, -1.895751953125, -1.6273193359375, -1.35888671875, -1.0904541015625, -0.822021484375, -0.5535888671875, -0.28515625, -0.0167236328125, 0.251708984375, 0.5201416015625, 0.78857421875, 1.0570068359375, 1.325439453125, 1.5938720703125, 1.8623046875, 2.1307373046875, 2.399169921875, 2.6676025390625, 2.93603515625, 3.2044677734375, 3.472900390625, 3.7413330078125, 4.009765625, 4.2781982421875, 4.546630859375, 4.8150634765625, 5.08349609375, 5.3519287109375, 5.620361328125, 5.8887939453125, 6.1572265625, 6.4256591796875, 6.694091796875, 6.9625244140625, 7.23095703125, 7.4993896484375, 7.767822265625, 8.0362548828125, 8.3046875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 6.0, 7.0, 5.0, 12.0, 7.0, 16.0, 13.0, 19.0, 20.0, 19.0, 22.0, 40.0, 31.0, 26.0, 40.0, 33.0, 37.0, 42.0, 30.0, 39.0, 48.0, 39.0, 50.0, 39.0, 35.0, 31.0, 41.0, 31.0, 30.0, 28.0, 25.0, 29.0, 18.0, 11.0, 8.0, 15.0, 15.0, 9.0, 4.0, 7.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-7.25390625, -7.01971435546875, -6.7855224609375, -6.55133056640625, -6.317138671875, -6.08294677734375, -5.8487548828125, -5.61456298828125, -5.38037109375, -5.14617919921875, -4.9119873046875, -4.67779541015625, -4.443603515625, -4.20941162109375, -3.9752197265625, -3.74102783203125, -3.5068359375, -3.27264404296875, -3.0384521484375, -2.80426025390625, -2.570068359375, -2.33587646484375, -2.1016845703125, -1.86749267578125, -1.63330078125, -1.39910888671875, -1.1649169921875, -0.93072509765625, -0.696533203125, -0.46234130859375, -0.2281494140625, 0.00604248046875, 0.240234375, 0.47442626953125, 0.7086181640625, 0.94281005859375, 1.177001953125, 1.41119384765625, 1.6453857421875, 1.87957763671875, 2.11376953125, 2.34796142578125, 2.5821533203125, 2.81634521484375, 3.050537109375, 3.28472900390625, 3.5189208984375, 3.75311279296875, 3.9873046875, 4.22149658203125, 4.4556884765625, 4.68988037109375, 4.924072265625, 5.15826416015625, 5.3924560546875, 5.62664794921875, 5.86083984375, 6.09503173828125, 6.3292236328125, 6.56341552734375, 6.797607421875, 7.03179931640625, 7.2659912109375, 7.50018310546875, 7.734375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 12.0, 16.0, 17.0, 24.0, 41.0, 63.0, 128.0, 197.0, 400.0, 1002.0, 2643.0, 9029.0, 44812.0, 429286.0, 494047.0, 51843.0, 10021.0, 2913.0, 1008.0, 449.0, 269.0, 126.0, 77.0, 43.0, 24.0, 28.0, 12.0, 10.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0625, -5.79931640625, -5.5361328125, -5.27294921875, -5.009765625, -4.74658203125, -4.4833984375, -4.22021484375, -3.95703125, -3.69384765625, -3.4306640625, -3.16748046875, -2.904296875, -2.64111328125, -2.3779296875, -2.11474609375, -1.8515625, -1.58837890625, -1.3251953125, -1.06201171875, -0.798828125, -0.53564453125, -0.2724609375, -0.00927734375, 0.25390625, 0.51708984375, 0.7802734375, 1.04345703125, 1.306640625, 1.56982421875, 1.8330078125, 2.09619140625, 2.359375, 2.62255859375, 2.8857421875, 3.14892578125, 3.412109375, 3.67529296875, 3.9384765625, 4.20166015625, 4.46484375, 4.72802734375, 4.9912109375, 5.25439453125, 5.517578125, 5.78076171875, 6.0439453125, 6.30712890625, 6.5703125, 6.83349609375, 7.0966796875, 7.35986328125, 7.623046875, 7.88623046875, 8.1494140625, 8.41259765625, 8.67578125, 8.93896484375, 9.2021484375, 9.46533203125, 9.728515625, 9.99169921875, 10.2548828125, 10.51806640625, 10.78125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 0.0, 1.0, 6.0, 9.0, 5.0, 9.0, 22.0, 18.0, 24.0, 35.0, 38.0, 51.0, 65.0, 69.0, 93.0, 103.0, 96.0, 68.0, 42.0, 70.0, 42.0, 35.0, 21.0, 22.0, 19.0, 17.0, 10.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.00034427642822265625, -0.00033511221408843994, -0.00032594799995422363, -0.0003167837858200073, -0.000307619571685791, -0.0002984553575515747, -0.0002892911434173584, -0.0002801269292831421, -0.0002709627151489258, -0.00026179850101470947, -0.00025263428688049316, -0.00024347007274627686, -0.00023430585861206055, -0.00022514164447784424, -0.00021597743034362793, -0.00020681321620941162, -0.0001976490020751953, -0.000188484787940979, -0.0001793205738067627, -0.0001701563596725464, -0.00016099214553833008, -0.00015182793140411377, -0.00014266371726989746, -0.00013349950313568115, -0.00012433528900146484, -0.00011517107486724854, -0.00010600686073303223, -9.684264659881592e-05, -8.767843246459961e-05, -7.85142183303833e-05, -6.935000419616699e-05, -6.0185790061950684e-05, -5.1021575927734375e-05, -4.1857361793518066e-05, -3.269314765930176e-05, -2.352893352508545e-05, -1.436471939086914e-05, -5.200505256652832e-06, 3.9637088775634766e-06, 1.3127923011779785e-05, 2.2292137145996094e-05, 3.14563512802124e-05, 4.062056541442871e-05, 4.978477954864502e-05, 5.894899368286133e-05, 6.811320781707764e-05, 7.727742195129395e-05, 8.644163608551025e-05, 9.560585021972656e-05, 0.00010477006435394287, 0.00011393427848815918, 0.0001230984926223755, 0.0001322627067565918, 0.0001414269208908081, 0.00015059113502502441, 0.00015975534915924072, 0.00016891956329345703, 0.00017808377742767334, 0.00018724799156188965, 0.00019641220569610596, 0.00020557641983032227, 0.00021474063396453857, 0.00022390484809875488, 0.0002330690622329712, 0.0002422332763671875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 6.0, 3.0, 10.0, 12.0, 25.0, 30.0, 51.0, 79.0, 120.0, 173.0, 316.0, 517.0, 931.0, 1768.0, 3520.0, 7702.0, 18932.0, 56234.0, 205305.0, 463074.0, 200860.0, 55350.0, 18446.0, 7540.0, 3505.0, 1776.0, 924.0, 521.0, 304.0, 206.0, 117.0, 71.0, 37.0, 24.0, 24.0, 10.0, 9.0, 11.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.9609375, -4.80340576171875, -4.6458740234375, -4.48834228515625, -4.330810546875, -4.17327880859375, -4.0157470703125, -3.85821533203125, -3.70068359375, -3.54315185546875, -3.3856201171875, -3.22808837890625, -3.070556640625, -2.91302490234375, -2.7554931640625, -2.59796142578125, -2.4404296875, -2.28289794921875, -2.1253662109375, -1.96783447265625, -1.810302734375, -1.65277099609375, -1.4952392578125, -1.33770751953125, -1.18017578125, -1.02264404296875, -0.8651123046875, -0.70758056640625, -0.550048828125, -0.39251708984375, -0.2349853515625, -0.07745361328125, 0.080078125, 0.23760986328125, 0.3951416015625, 0.55267333984375, 0.710205078125, 0.86773681640625, 1.0252685546875, 1.18280029296875, 1.34033203125, 1.49786376953125, 1.6553955078125, 1.81292724609375, 1.970458984375, 2.12799072265625, 2.2855224609375, 2.44305419921875, 2.6005859375, 2.75811767578125, 2.9156494140625, 3.07318115234375, 3.230712890625, 3.38824462890625, 3.5457763671875, 3.70330810546875, 3.86083984375, 4.01837158203125, 4.1759033203125, 4.33343505859375, 4.490966796875, 4.64849853515625, 4.8060302734375, 4.96356201171875, 5.12109375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 6.0, 2.0, 7.0, 10.0, 11.0, 12.0, 13.0, 26.0, 20.0, 28.0, 39.0, 45.0, 43.0, 46.0, 74.0, 69.0, 75.0, 63.0, 69.0, 46.0, 48.0, 43.0, 43.0, 37.0, 28.0, 19.0, 20.0, 12.0, 13.0, 7.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.880859375, -2.769989013671875, -2.65911865234375, -2.548248291015625, -2.4373779296875, -2.326507568359375, -2.21563720703125, -2.104766845703125, -1.993896484375, -1.883026123046875, -1.77215576171875, -1.661285400390625, -1.5504150390625, -1.439544677734375, -1.32867431640625, -1.217803955078125, -1.10693359375, -0.996063232421875, -0.88519287109375, -0.774322509765625, -0.6634521484375, -0.552581787109375, -0.44171142578125, -0.330841064453125, -0.219970703125, -0.109100341796875, 0.00177001953125, 0.112640380859375, 0.2235107421875, 0.334381103515625, 0.44525146484375, 0.556121826171875, 0.6669921875, 0.777862548828125, 0.88873291015625, 0.999603271484375, 1.1104736328125, 1.221343994140625, 1.33221435546875, 1.443084716796875, 1.553955078125, 1.664825439453125, 1.77569580078125, 1.886566162109375, 1.9974365234375, 2.108306884765625, 2.21917724609375, 2.330047607421875, 2.44091796875, 2.551788330078125, 2.66265869140625, 2.773529052734375, 2.8843994140625, 2.995269775390625, 3.10614013671875, 3.217010498046875, 3.327880859375, 3.438751220703125, 3.54962158203125, 3.660491943359375, 3.7713623046875, 3.882232666015625, 3.99310302734375, 4.103973388671875, 4.21484375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 2.0, 10.0, 11.0, 10.0, 40.0, 68.0, 218.0, 344.0, 151.0, 81.0, 25.0, 24.0, 6.0, 8.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.21674346923828, -59.088218688964844, -54.959693908691406, -50.83116912841797, -46.70264434814453, -42.574119567871094, -38.44559860229492, -34.317073822021484, -30.188549041748047, -26.06002426147461, -21.931499481201172, -17.802976608276367, -13.67445182800293, -9.545927047729492, -5.4174041748046875, -1.28887939453125, 2.8396453857421875, 6.968169689178467, 11.096693992614746, 15.225217819213867, 19.353742599487305, 23.482267379760742, 27.610790252685547, 31.739315032958984, 35.86783981323242, 39.99636459350586, 44.1248893737793, 48.25341033935547, 52.381935119628906, 56.510459899902344, 60.63898468017578, 64.76750946044922, 68.89604187011719, 73.02456665039062, 77.15309143066406, 81.2816162109375, 85.41014099121094, 89.53866577148438, 93.66719055175781, 97.79571533203125, 101.92424011230469, 106.05276489257812, 110.18128967285156, 114.309814453125, 118.43833923339844, 122.56686401367188, 126.69538879394531, 130.82391357421875, 134.95242309570312, 139.08094787597656, 143.20947265625, 147.33799743652344, 151.46652221679688, 155.5950469970703, 159.72357177734375, 163.8520965576172, 167.98062133789062, 172.10914611816406, 176.2376708984375, 180.36619567871094, 184.49472045898438, 188.6232452392578, 192.75177001953125, 196.8802947998047, 201.00881958007812]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 4.0, 5.0, 1.0, 4.0, 4.0, 8.0, 9.0, 22.0, 27.0, 69.0, 104.0, 154.0, 159.0, 124.0, 121.0, 60.0, 33.0, 22.0, 16.0, 6.0, 5.0, 5.0, 11.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.57891845703125, -139.5331573486328, -134.4873809814453, -129.44161987304688, -124.3958511352539, -119.35008239746094, -114.3043212890625, -109.25855255126953, -104.21278381347656, -99.1670150756836, -94.12124633789062, -89.07548522949219, -84.02971649169922, -78.98394775390625, -73.93818664550781, -68.89241790771484, -63.846649169921875, -58.800880432128906, -53.7551155090332, -48.7093505859375, -43.66358184814453, -38.61781311035156, -33.57204818725586, -28.526283264160156, -23.480514526367188, -18.43474769592285, -13.388980865478516, -8.34321403503418, -3.2974472045898438, 1.7483196258544922, 6.794086456298828, 11.839851379394531, 16.885635375976562, 21.9314022064209, 26.977169036865234, 32.02293395996094, 37.068702697753906, 42.114471435546875, 47.16023635864258, 52.20600128173828, 57.25177001953125, 62.29753875732422, 67.34330749511719, 72.38906860351562, 77.4348373413086, 82.48060607910156, 87.5263671875, 92.57213592529297, 97.61790466308594, 102.6636734008789, 107.70944213867188, 112.75520324707031, 117.80097198486328, 122.84674072265625, 127.89250183105469, 132.93826293945312, 137.98403930664062, 143.02980041503906, 148.07557678222656, 153.121337890625, 158.1671142578125, 163.21287536621094, 168.25863647460938, 173.30441284179688, 178.3501739501953]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 3.0, 8.0, 4.0, 5.0, 6.0, 14.0, 13.0, 21.0, 32.0, 50.0, 101.0, 191.0, 351.0, 680.0, 1523.0, 4169.0, 13335.0, 73131.0, 3603114.0, 447629.0, 35587.0, 8536.0, 2987.0, 1292.0, 627.0, 346.0, 215.0, 105.0, 68.0, 48.0, 31.0, 15.0, 12.0, 9.0, 6.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.359375, -23.291748046875, -22.22412109375, -21.156494140625, -20.0888671875, -19.021240234375, -17.95361328125, -16.885986328125, -15.818359375, -14.750732421875, -13.68310546875, -12.615478515625, -11.5478515625, -10.480224609375, -9.41259765625, -8.344970703125, -7.27734375, -6.209716796875, -5.14208984375, -4.074462890625, -3.0068359375, -1.939208984375, -0.87158203125, 0.196044921875, 1.263671875, 2.331298828125, 3.39892578125, 4.466552734375, 5.5341796875, 6.601806640625, 7.66943359375, 8.737060546875, 9.8046875, 10.872314453125, 11.93994140625, 13.007568359375, 14.0751953125, 15.142822265625, 16.21044921875, 17.278076171875, 18.345703125, 19.413330078125, 20.48095703125, 21.548583984375, 22.6162109375, 23.683837890625, 24.75146484375, 25.819091796875, 26.88671875, 27.954345703125, 29.02197265625, 30.089599609375, 31.1572265625, 32.224853515625, 33.29248046875, 34.360107421875, 35.427734375, 36.495361328125, 37.56298828125, 38.630615234375, 39.6982421875, 40.765869140625, 41.83349609375, 42.901123046875, 43.96875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 2.0, 9.0, 6.0, 11.0, 5.0, 15.0, 23.0, 28.0, 39.0, 41.0, 59.0, 74.0, 69.0, 87.0, 92.0, 78.0, 65.0, 58.0, 45.0, 44.0, 30.0, 33.0, 18.0, 20.0, 7.0, 11.0, 6.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3984375, -1.343658447265625, -1.28887939453125, -1.234100341796875, -1.1793212890625, -1.124542236328125, -1.06976318359375, -1.014984130859375, -0.960205078125, -0.905426025390625, -0.85064697265625, -0.795867919921875, -0.7410888671875, -0.686309814453125, -0.63153076171875, -0.576751708984375, -0.52197265625, -0.467193603515625, -0.41241455078125, -0.357635498046875, -0.3028564453125, -0.248077392578125, -0.19329833984375, -0.138519287109375, -0.083740234375, -0.028961181640625, 0.02581787109375, 0.080596923828125, 0.1353759765625, 0.190155029296875, 0.24493408203125, 0.299713134765625, 0.3544921875, 0.409271240234375, 0.46405029296875, 0.518829345703125, 0.5736083984375, 0.628387451171875, 0.68316650390625, 0.737945556640625, 0.792724609375, 0.847503662109375, 0.90228271484375, 0.957061767578125, 1.0118408203125, 1.066619873046875, 1.12139892578125, 1.176177978515625, 1.23095703125, 1.285736083984375, 1.34051513671875, 1.395294189453125, 1.4500732421875, 1.504852294921875, 1.55963134765625, 1.614410400390625, 1.669189453125, 1.723968505859375, 1.77874755859375, 1.833526611328125, 1.8883056640625, 1.943084716796875, 1.99786376953125, 2.052642822265625, 2.107421875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 6.0, 9.0, 21.0, 25.0, 41.0, 76.0, 89.0, 182.0, 289.0, 468.0, 877.0, 1750.0, 3766.0, 8902.0, 22183.0, 68441.0, 295146.0, 3023586.0, 603608.0, 109519.0, 32739.0, 12196.0, 5233.0, 2369.0, 1150.0, 637.0, 380.0, 194.0, 127.0, 91.0, 72.0, 32.0, 20.0, 21.0, 7.0, 11.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-17.765625, -17.1865234375, -16.607421875, -16.0283203125, -15.44921875, -14.8701171875, -14.291015625, -13.7119140625, -13.1328125, -12.5537109375, -11.974609375, -11.3955078125, -10.81640625, -10.2373046875, -9.658203125, -9.0791015625, -8.5, -7.9208984375, -7.341796875, -6.7626953125, -6.18359375, -5.6044921875, -5.025390625, -4.4462890625, -3.8671875, -3.2880859375, -2.708984375, -2.1298828125, -1.55078125, -0.9716796875, -0.392578125, 0.1865234375, 0.765625, 1.3447265625, 1.923828125, 2.5029296875, 3.08203125, 3.6611328125, 4.240234375, 4.8193359375, 5.3984375, 5.9775390625, 6.556640625, 7.1357421875, 7.71484375, 8.2939453125, 8.873046875, 9.4521484375, 10.03125, 10.6103515625, 11.189453125, 11.7685546875, 12.34765625, 12.9267578125, 13.505859375, 14.0849609375, 14.6640625, 15.2431640625, 15.822265625, 16.4013671875, 16.98046875, 17.5595703125, 18.138671875, 18.7177734375, 19.296875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 5.0, 6.0, 10.0, 12.0, 18.0, 22.0, 18.0, 45.0, 60.0, 89.0, 131.0, 253.0, 445.0, 1492.0, 626.0, 302.0, 158.0, 107.0, 72.0, 65.0, 39.0, 17.0, 18.0, 11.0, 13.0, 8.0, 14.0, 8.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.4453125, -3.339935302734375, -3.23455810546875, -3.129180908203125, -3.0238037109375, -2.918426513671875, -2.81304931640625, -2.707672119140625, -2.602294921875, -2.496917724609375, -2.39154052734375, -2.286163330078125, -2.1807861328125, -2.075408935546875, -1.97003173828125, -1.864654541015625, -1.75927734375, -1.653900146484375, -1.54852294921875, -1.443145751953125, -1.3377685546875, -1.232391357421875, -1.12701416015625, -1.021636962890625, -0.916259765625, -0.810882568359375, -0.70550537109375, -0.600128173828125, -0.4947509765625, -0.389373779296875, -0.28399658203125, -0.178619384765625, -0.0732421875, 0.032135009765625, 0.13751220703125, 0.242889404296875, 0.3482666015625, 0.453643798828125, 0.55902099609375, 0.664398193359375, 0.769775390625, 0.875152587890625, 0.98052978515625, 1.085906982421875, 1.1912841796875, 1.296661376953125, 1.40203857421875, 1.507415771484375, 1.61279296875, 1.718170166015625, 1.82354736328125, 1.928924560546875, 2.0343017578125, 2.139678955078125, 2.24505615234375, 2.350433349609375, 2.455810546875, 2.561187744140625, 2.66656494140625, 2.771942138671875, 2.8773193359375, 2.982696533203125, 3.08807373046875, 3.193450927734375, 3.298828125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 12.0, 24.0, 33.0, 83.0, 127.0, 197.0, 192.0, 130.0, 87.0, 49.0, 23.0, 13.0, 8.0, 7.0, 3.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.113744735717773, -17.041501998901367, -15.969259262084961, -14.897016525268555, -13.824773788452148, -12.752531051635742, -11.680288314819336, -10.60804557800293, -9.535802841186523, -8.463560104370117, -7.391317367553711, -6.319074630737305, -5.246831893920898, -4.174589157104492, -3.102346420288086, -2.0301036834716797, -0.9578609466552734, 0.11438179016113281, 1.186624526977539, 2.2588672637939453, 3.3311100006103516, 4.403352737426758, 5.475595474243164, 6.54783821105957, 7.620080947875977, 8.692323684692383, 9.764566421508789, 10.836809158325195, 11.909051895141602, 12.981294631958008, 14.053537368774414, 15.12578010559082, 16.19802474975586, 17.270267486572266, 18.342510223388672, 19.414752960205078, 20.486995697021484, 21.55923843383789, 22.631481170654297, 23.703723907470703, 24.77596664428711, 25.848209381103516, 26.920452117919922, 27.992694854736328, 29.064937591552734, 30.13718032836914, 31.209423065185547, 32.28166580200195, 33.35390853881836, 34.426151275634766, 35.49839401245117, 36.57063674926758, 37.642879486083984, 38.71512222290039, 39.7873649597168, 40.8596076965332, 41.93185043334961, 43.004093170166016, 44.07633590698242, 45.14857864379883, 46.220821380615234, 47.29306411743164, 48.36530685424805, 49.43754959106445, 50.50979232788086]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 4.0, 4.0, 7.0, 14.0, 15.0, 15.0, 22.0, 28.0, 26.0, 48.0, 31.0, 62.0, 62.0, 59.0, 58.0, 62.0, 64.0, 55.0, 67.0, 45.0, 45.0, 42.0, 39.0, 31.0, 20.0, 19.0, 16.0, 14.0, 8.0, 5.0, 3.0, 3.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.030752182006836, -21.472139358520508, -20.913524627685547, -20.35491180419922, -19.79629898071289, -19.237686157226562, -18.679073333740234, -18.120458602905273, -17.561845779418945, -17.003232955932617, -16.444618225097656, -15.886005401611328, -15.327392578125, -14.768779754638672, -14.210165977478027, -13.651552200317383, -13.092939376831055, -12.534326553344727, -11.975712776184082, -11.417098999023438, -10.85848617553711, -10.299873352050781, -9.741259574890137, -9.182645797729492, -8.624032974243164, -8.065420150756836, -7.506806373596191, -6.948193073272705, -6.389579772949219, -5.830966472625732, -5.272353172302246, -4.71373987197876, -4.155128479003906, -3.59651517868042, -3.0379018783569336, -2.4792885780334473, -1.920675277709961, -1.3620619773864746, -0.8034486770629883, -0.24483537673950195, 0.3137779235839844, 0.8723912239074707, 1.431004524230957, 1.9896178245544434, 2.5482311248779297, 3.106844425201416, 3.6654577255249023, 4.224071025848389, 4.782684326171875, 5.341297626495361, 5.899910926818848, 6.458524227142334, 7.01713752746582, 7.575750827789307, 8.134364128112793, 8.692977905273438, 9.251590728759766, 9.810203552246094, 10.368817329406738, 10.927431106567383, 11.486043930053711, 12.044656753540039, 12.603270530700684, 13.161884307861328, 13.720497131347656]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 7.0, 6.0, 9.0, 6.0, 17.0, 23.0, 20.0, 37.0, 34.0, 84.0, 108.0, 189.0, 283.0, 433.0, 708.0, 1379.0, 2628.0, 5434.0, 13108.0, 37763.0, 133118.0, 430730.0, 300114.0, 80003.0, 24387.0, 9306.0, 4053.0, 1898.0, 1026.0, 626.0, 339.0, 253.0, 139.0, 87.0, 54.0, 38.0, 30.0, 12.0, 16.0, 15.0, 7.0, 9.0, 2.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.1171875, -13.67333984375, -13.2294921875, -12.78564453125, -12.341796875, -11.89794921875, -11.4541015625, -11.01025390625, -10.56640625, -10.12255859375, -9.6787109375, -9.23486328125, -8.791015625, -8.34716796875, -7.9033203125, -7.45947265625, -7.015625, -6.57177734375, -6.1279296875, -5.68408203125, -5.240234375, -4.79638671875, -4.3525390625, -3.90869140625, -3.46484375, -3.02099609375, -2.5771484375, -2.13330078125, -1.689453125, -1.24560546875, -0.8017578125, -0.35791015625, 0.0859375, 0.52978515625, 0.9736328125, 1.41748046875, 1.861328125, 2.30517578125, 2.7490234375, 3.19287109375, 3.63671875, 4.08056640625, 4.5244140625, 4.96826171875, 5.412109375, 5.85595703125, 6.2998046875, 6.74365234375, 7.1875, 7.63134765625, 8.0751953125, 8.51904296875, 8.962890625, 9.40673828125, 9.8505859375, 10.29443359375, 10.73828125, 11.18212890625, 11.6259765625, 12.06982421875, 12.513671875, 12.95751953125, 13.4013671875, 13.84521484375, 14.2890625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 4.0, 7.0, 9.0, 13.0, 12.0, 19.0, 22.0, 29.0, 38.0, 51.0, 55.0, 42.0, 62.0, 81.0, 81.0, 68.0, 63.0, 69.0, 48.0, 46.0, 29.0, 26.0, 22.0, 21.0, 14.0, 17.0, 10.0, 10.0, 9.0, 7.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.35546875, -1.3050537109375, -1.254638671875, -1.2042236328125, -1.15380859375, -1.1033935546875, -1.052978515625, -1.0025634765625, -0.9521484375, -0.9017333984375, -0.851318359375, -0.8009033203125, -0.75048828125, -0.7000732421875, -0.649658203125, -0.5992431640625, -0.548828125, -0.4984130859375, -0.447998046875, -0.3975830078125, -0.34716796875, -0.2967529296875, -0.246337890625, -0.1959228515625, -0.1455078125, -0.0950927734375, -0.044677734375, 0.0057373046875, 0.05615234375, 0.1065673828125, 0.156982421875, 0.2073974609375, 0.2578125, 0.3082275390625, 0.358642578125, 0.4090576171875, 0.45947265625, 0.5098876953125, 0.560302734375, 0.6107177734375, 0.6611328125, 0.7115478515625, 0.761962890625, 0.8123779296875, 0.86279296875, 0.9132080078125, 0.963623046875, 1.0140380859375, 1.064453125, 1.1148681640625, 1.165283203125, 1.2156982421875, 1.26611328125, 1.3165283203125, 1.366943359375, 1.4173583984375, 1.4677734375, 1.5181884765625, 1.568603515625, 1.6190185546875, 1.66943359375, 1.7198486328125, 1.770263671875, 1.8206787109375, 1.87109375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 11.0, 11.0, 27.0, 26.0, 37.0, 70.0, 82.0, 167.0, 270.0, 424.0, 694.0, 1268.0, 2441.0, 5289.0, 14623.0, 59179.0, 357232.0, 488431.0, 86803.0, 19069.0, 6303.0, 2708.0, 1399.0, 787.0, 439.0, 269.0, 172.0, 96.0, 75.0, 42.0, 30.0, 28.0, 11.0, 11.0, 4.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.8984375, -14.4345703125, -13.970703125, -13.5068359375, -13.04296875, -12.5791015625, -12.115234375, -11.6513671875, -11.1875, -10.7236328125, -10.259765625, -9.7958984375, -9.33203125, -8.8681640625, -8.404296875, -7.9404296875, -7.4765625, -7.0126953125, -6.548828125, -6.0849609375, -5.62109375, -5.1572265625, -4.693359375, -4.2294921875, -3.765625, -3.3017578125, -2.837890625, -2.3740234375, -1.91015625, -1.4462890625, -0.982421875, -0.5185546875, -0.0546875, 0.4091796875, 0.873046875, 1.3369140625, 1.80078125, 2.2646484375, 2.728515625, 3.1923828125, 3.65625, 4.1201171875, 4.583984375, 5.0478515625, 5.51171875, 5.9755859375, 6.439453125, 6.9033203125, 7.3671875, 7.8310546875, 8.294921875, 8.7587890625, 9.22265625, 9.6865234375, 10.150390625, 10.6142578125, 11.078125, 11.5419921875, 12.005859375, 12.4697265625, 12.93359375, 13.3974609375, 13.861328125, 14.3251953125, 14.7890625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 9.0, 7.0, 14.0, 25.0, 26.0, 40.0, 33.0, 48.0, 50.0, 61.0, 72.0, 81.0, 80.0, 73.0, 63.0, 69.0, 52.0, 49.0, 35.0, 25.0, 24.0, 15.0, 17.0, 9.0, 6.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.421875, -10.1279296875, -9.833984375, -9.5400390625, -9.24609375, -8.9521484375, -8.658203125, -8.3642578125, -8.0703125, -7.7763671875, -7.482421875, -7.1884765625, -6.89453125, -6.6005859375, -6.306640625, -6.0126953125, -5.71875, -5.4248046875, -5.130859375, -4.8369140625, -4.54296875, -4.2490234375, -3.955078125, -3.6611328125, -3.3671875, -3.0732421875, -2.779296875, -2.4853515625, -2.19140625, -1.8974609375, -1.603515625, -1.3095703125, -1.015625, -0.7216796875, -0.427734375, -0.1337890625, 0.16015625, 0.4541015625, 0.748046875, 1.0419921875, 1.3359375, 1.6298828125, 1.923828125, 2.2177734375, 2.51171875, 2.8056640625, 3.099609375, 3.3935546875, 3.6875, 3.9814453125, 4.275390625, 4.5693359375, 4.86328125, 5.1572265625, 5.451171875, 5.7451171875, 6.0390625, 6.3330078125, 6.626953125, 6.9208984375, 7.21484375, 7.5087890625, 7.802734375, 8.0966796875, 8.390625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 2.0, 5.0, 12.0, 12.0, 22.0, 31.0, 41.0, 73.0, 120.0, 223.0, 374.0, 751.0, 1648.0, 4099.0, 12668.0, 56752.0, 379053.0, 488408.0, 79626.0, 15850.0, 5031.0, 1878.0, 862.0, 433.0, 226.0, 123.0, 80.0, 56.0, 34.0, 19.0, 16.0, 11.0, 3.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-21.8125, -21.2545166015625, -20.696533203125, -20.1385498046875, -19.58056640625, -19.0225830078125, -18.464599609375, -17.9066162109375, -17.3486328125, -16.7906494140625, -16.232666015625, -15.6746826171875, -15.11669921875, -14.5587158203125, -14.000732421875, -13.4427490234375, -12.884765625, -12.3267822265625, -11.768798828125, -11.2108154296875, -10.65283203125, -10.0948486328125, -9.536865234375, -8.9788818359375, -8.4208984375, -7.8629150390625, -7.304931640625, -6.7469482421875, -6.18896484375, -5.6309814453125, -5.072998046875, -4.5150146484375, -3.95703125, -3.3990478515625, -2.841064453125, -2.2830810546875, -1.72509765625, -1.1671142578125, -0.609130859375, -0.0511474609375, 0.5068359375, 1.0648193359375, 1.622802734375, 2.1807861328125, 2.73876953125, 3.2967529296875, 3.854736328125, 4.4127197265625, 4.970703125, 5.5286865234375, 6.086669921875, 6.6446533203125, 7.20263671875, 7.7606201171875, 8.318603515625, 8.8765869140625, 9.4345703125, 9.9925537109375, 10.550537109375, 11.1085205078125, 11.66650390625, 12.2244873046875, 12.782470703125, 13.3404541015625, 13.8984375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 5.0, 19.0, 37.0, 97.0, 160.0, 247.0, 193.0, 102.0, 51.0, 34.0, 13.0, 5.0, 4.0, 4.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019741058349609375, -0.001913607120513916, -0.0018531084060668945, -0.001792609691619873, -0.0017321109771728516, -0.00167161226272583, -0.0016111135482788086, -0.0015506148338317871, -0.0014901161193847656, -0.0014296174049377441, -0.0013691186904907227, -0.0013086199760437012, -0.0012481212615966797, -0.0011876225471496582, -0.0011271238327026367, -0.0010666251182556152, -0.0010061264038085938, -0.0009456276893615723, -0.0008851289749145508, -0.0008246302604675293, -0.0007641315460205078, -0.0007036328315734863, -0.0006431341171264648, -0.0005826354026794434, -0.0005221366882324219, -0.0004616379737854004, -0.0004011392593383789, -0.0003406405448913574, -0.00028014183044433594, -0.00021964311599731445, -0.00015914440155029297, -9.864568710327148e-05, -3.814697265625e-05, 2.2351741790771484e-05, 8.285045623779297e-05, 0.00014334917068481445, 0.00020384788513183594, 0.0002643465995788574, 0.0003248453140258789, 0.0003853440284729004, 0.0004458427429199219, 0.0005063414573669434, 0.0005668401718139648, 0.0006273388862609863, 0.0006878376007080078, 0.0007483363151550293, 0.0008088350296020508, 0.0008693337440490723, 0.0009298324584960938, 0.0009903311729431152, 0.0010508298873901367, 0.0011113286018371582, 0.0011718273162841797, 0.0012323260307312012, 0.0012928247451782227, 0.0013533234596252441, 0.0014138221740722656, 0.0014743208885192871, 0.0015348196029663086, 0.00159531831741333, 0.0016558170318603516, 0.001716315746307373, 0.0017768144607543945, 0.001837313175201416, 0.0018978118896484375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 4.0, 11.0, 12.0, 10.0, 15.0, 31.0, 44.0, 63.0, 75.0, 118.0, 190.0, 283.0, 475.0, 739.0, 1407.0, 2636.0, 5370.0, 12703.0, 37418.0, 134261.0, 410093.0, 311611.0, 86561.0, 25625.0, 9563.0, 4189.0, 2120.0, 1129.0, 660.0, 380.0, 225.0, 183.0, 117.0, 65.0, 42.0, 32.0, 23.0, 21.0, 14.0, 11.0, 9.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-12.921875, -12.5283203125, -12.134765625, -11.7412109375, -11.34765625, -10.9541015625, -10.560546875, -10.1669921875, -9.7734375, -9.3798828125, -8.986328125, -8.5927734375, -8.19921875, -7.8056640625, -7.412109375, -7.0185546875, -6.625, -6.2314453125, -5.837890625, -5.4443359375, -5.05078125, -4.6572265625, -4.263671875, -3.8701171875, -3.4765625, -3.0830078125, -2.689453125, -2.2958984375, -1.90234375, -1.5087890625, -1.115234375, -0.7216796875, -0.328125, 0.0654296875, 0.458984375, 0.8525390625, 1.24609375, 1.6396484375, 2.033203125, 2.4267578125, 2.8203125, 3.2138671875, 3.607421875, 4.0009765625, 4.39453125, 4.7880859375, 5.181640625, 5.5751953125, 5.96875, 6.3623046875, 6.755859375, 7.1494140625, 7.54296875, 7.9365234375, 8.330078125, 8.7236328125, 9.1171875, 9.5107421875, 9.904296875, 10.2978515625, 10.69140625, 11.0849609375, 11.478515625, 11.8720703125, 12.265625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 8.0, 7.0, 9.0, 18.0, 27.0, 37.0, 49.0, 59.0, 78.0, 97.0, 111.0, 117.0, 91.0, 82.0, 54.0, 31.0, 34.0, 24.0, 9.0, 12.0, 10.0, 13.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0, -8.7171630859375, -8.434326171875, -8.1514892578125, -7.86865234375, -7.5858154296875, -7.302978515625, -7.0201416015625, -6.7373046875, -6.4544677734375, -6.171630859375, -5.8887939453125, -5.60595703125, -5.3231201171875, -5.040283203125, -4.7574462890625, -4.474609375, -4.1917724609375, -3.908935546875, -3.6260986328125, -3.34326171875, -3.0604248046875, -2.777587890625, -2.4947509765625, -2.2119140625, -1.9290771484375, -1.646240234375, -1.3634033203125, -1.08056640625, -0.7977294921875, -0.514892578125, -0.2320556640625, 0.05078125, 0.3336181640625, 0.616455078125, 0.8992919921875, 1.18212890625, 1.4649658203125, 1.747802734375, 2.0306396484375, 2.3134765625, 2.5963134765625, 2.879150390625, 3.1619873046875, 3.44482421875, 3.7276611328125, 4.010498046875, 4.2933349609375, 4.576171875, 4.8590087890625, 5.141845703125, 5.4246826171875, 5.70751953125, 5.9903564453125, 6.273193359375, 6.5560302734375, 6.8388671875, 7.1217041015625, 7.404541015625, 7.6873779296875, 7.97021484375, 8.2530517578125, 8.535888671875, 8.8187255859375, 9.1015625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 10.0, 30.0, 74.0, 147.0, 194.0, 208.0, 174.0, 72.0, 36.0, 15.0, 12.0, 8.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.61133575439453, -82.18106842041016, -78.75079345703125, -75.32052612304688, -71.8902587890625, -68.45999145507812, -65.02972412109375, -61.599449157714844, -58.16918182373047, -54.738914489746094, -51.30864334106445, -47.87837219238281, -44.44810485839844, -41.01783752441406, -37.58756637573242, -34.15729522705078, -30.727027893066406, -27.2967586517334, -23.86648941040039, -20.436220169067383, -17.005950927734375, -13.575681686401367, -10.14541244506836, -6.715143203735352, -3.2848739624023438, 0.14539527893066406, 3.575664520263672, 7.00593376159668, 10.436203002929688, 13.866472244262695, 17.296741485595703, 20.72701072692871, 24.15728759765625, 27.587556838989258, 31.017826080322266, 34.448097229003906, 37.87836456298828, 41.308631896972656, 44.7389030456543, 48.16917419433594, 51.59944152832031, 55.02970886230469, 58.45998001098633, 61.89025115966797, 65.32051849365234, 68.75078582763672, 72.18106079101562, 75.611328125, 79.04159545898438, 82.47186279296875, 85.90213012695312, 89.33240509033203, 92.7626724243164, 96.19293975830078, 99.62321472167969, 103.05348205566406, 106.48374938964844, 109.91401672363281, 113.34428405761719, 116.7745590209961, 120.20482635498047, 123.63509368896484, 127.06536865234375, 130.49563598632812, 133.9259033203125]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 0.0, 7.0, 6.0, 5.0, 6.0, 8.0, 9.0, 18.0, 19.0, 20.0, 28.0, 34.0, 43.0, 47.0, 44.0, 54.0, 70.0, 56.0, 57.0, 59.0, 57.0, 44.0, 52.0, 43.0, 39.0, 33.0, 21.0, 30.0, 22.0, 12.0, 11.0, 8.0, 10.0, 12.0, 6.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-46.20018768310547, -44.69313430786133, -43.18608093261719, -41.67902374267578, -40.17197036743164, -38.6649169921875, -37.15786361694336, -35.65081024169922, -34.14375686645508, -32.63670349121094, -31.129648208618164, -29.622594833374023, -28.115541458129883, -26.60848617553711, -25.10143280029297, -23.594379425048828, -22.087324142456055, -20.580270767211914, -19.07321548461914, -17.566162109375, -16.05910873413086, -14.552054405212402, -13.045000076293945, -11.537946701049805, -10.030892372131348, -8.52383804321289, -7.01678466796875, -5.509730339050293, -4.002676486968994, -2.4956226348876953, -0.9885683059692383, 0.5184850692749023, 2.0255393981933594, 3.532593250274658, 5.039647102355957, 6.546701431274414, 8.053754806518555, 9.560809135437012, 11.067863464355469, 12.57491683959961, 14.081971168518066, 15.589025497436523, 17.096078872680664, 18.603134155273438, 20.110187530517578, 21.61724090576172, 23.12429428100586, 24.63134765625, 26.138402938842773, 27.645456314086914, 29.152511596679688, 30.659564971923828, 32.16661834716797, 33.67367172241211, 35.18072509765625, 36.687782287597656, 38.1948356628418, 39.70188903808594, 41.20894241333008, 42.71599578857422, 44.223052978515625, 45.730106353759766, 47.237159729003906, 48.74421310424805, 50.25126647949219]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 7.0, 6.0, 17.0, 21.0, 27.0, 40.0, 75.0, 99.0, 173.0, 302.0, 546.0, 1012.0, 2177.0, 5043.0, 12167.0, 35190.0, 130661.0, 885802.0, 2806235.0, 227628.0, 54281.0, 18162.0, 7349.0, 3368.0, 1721.0, 896.0, 486.0, 282.0, 171.0, 128.0, 74.0, 36.0, 38.0, 20.0, 8.0, 10.0, 8.0, 5.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.203125, -22.3798828125, -21.556640625, -20.7333984375, -19.91015625, -19.0869140625, -18.263671875, -17.4404296875, -16.6171875, -15.7939453125, -14.970703125, -14.1474609375, -13.32421875, -12.5009765625, -11.677734375, -10.8544921875, -10.03125, -9.2080078125, -8.384765625, -7.5615234375, -6.73828125, -5.9150390625, -5.091796875, -4.2685546875, -3.4453125, -2.6220703125, -1.798828125, -0.9755859375, -0.15234375, 0.6708984375, 1.494140625, 2.3173828125, 3.140625, 3.9638671875, 4.787109375, 5.6103515625, 6.43359375, 7.2568359375, 8.080078125, 8.9033203125, 9.7265625, 10.5498046875, 11.373046875, 12.1962890625, 13.01953125, 13.8427734375, 14.666015625, 15.4892578125, 16.3125, 17.1357421875, 17.958984375, 18.7822265625, 19.60546875, 20.4287109375, 21.251953125, 22.0751953125, 22.8984375, 23.7216796875, 24.544921875, 25.3681640625, 26.19140625, 27.0146484375, 27.837890625, 28.6611328125, 29.484375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 9.0, 5.0, 7.0, 8.0, 9.0, 14.0, 21.0, 20.0, 42.0, 37.0, 51.0, 51.0, 71.0, 69.0, 76.0, 89.0, 75.0, 57.0, 62.0, 40.0, 48.0, 33.0, 12.0, 18.0, 21.0, 15.0, 14.0, 9.0, 9.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.666015625, -1.61114501953125, -1.5562744140625, -1.50140380859375, -1.446533203125, -1.39166259765625, -1.3367919921875, -1.28192138671875, -1.22705078125, -1.17218017578125, -1.1173095703125, -1.06243896484375, -1.007568359375, -0.95269775390625, -0.8978271484375, -0.84295654296875, -0.7880859375, -0.73321533203125, -0.6783447265625, -0.62347412109375, -0.568603515625, -0.51373291015625, -0.4588623046875, -0.40399169921875, -0.34912109375, -0.29425048828125, -0.2393798828125, -0.18450927734375, -0.129638671875, -0.07476806640625, -0.0198974609375, 0.03497314453125, 0.08984375, 0.14471435546875, 0.1995849609375, 0.25445556640625, 0.309326171875, 0.36419677734375, 0.4190673828125, 0.47393798828125, 0.52880859375, 0.58367919921875, 0.6385498046875, 0.69342041015625, 0.748291015625, 0.80316162109375, 0.8580322265625, 0.91290283203125, 0.9677734375, 1.02264404296875, 1.0775146484375, 1.13238525390625, 1.187255859375, 1.24212646484375, 1.2969970703125, 1.35186767578125, 1.40673828125, 1.46160888671875, 1.5164794921875, 1.57135009765625, 1.626220703125, 1.68109130859375, 1.7359619140625, 1.79083251953125, 1.845703125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 9.0, 4.0, 10.0, 12.0, 20.0, 27.0, 61.0, 91.0, 174.0, 370.0, 941.0, 3478.0, 20841.0, 248409.0, 3512226.0, 373727.0, 27587.0, 4328.0, 1068.0, 406.0, 201.0, 116.0, 63.0, 45.0, 21.0, 13.0, 11.0, 11.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.65625, -45.1298828125, -43.603515625, -42.0771484375, -40.55078125, -39.0244140625, -37.498046875, -35.9716796875, -34.4453125, -32.9189453125, -31.392578125, -29.8662109375, -28.33984375, -26.8134765625, -25.287109375, -23.7607421875, -22.234375, -20.7080078125, -19.181640625, -17.6552734375, -16.12890625, -14.6025390625, -13.076171875, -11.5498046875, -10.0234375, -8.4970703125, -6.970703125, -5.4443359375, -3.91796875, -2.3916015625, -0.865234375, 0.6611328125, 2.1875, 3.7138671875, 5.240234375, 6.7666015625, 8.29296875, 9.8193359375, 11.345703125, 12.8720703125, 14.3984375, 15.9248046875, 17.451171875, 18.9775390625, 20.50390625, 22.0302734375, 23.556640625, 25.0830078125, 26.609375, 28.1357421875, 29.662109375, 31.1884765625, 32.71484375, 34.2412109375, 35.767578125, 37.2939453125, 38.8203125, 40.3466796875, 41.873046875, 43.3994140625, 44.92578125, 46.4521484375, 47.978515625, 49.5048828125, 51.03125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 13.0, 14.0, 12.0, 16.0, 28.0, 55.0, 65.0, 87.0, 122.0, 187.0, 304.0, 456.0, 865.0, 671.0, 397.0, 283.0, 159.0, 104.0, 75.0, 53.0, 27.0, 26.0, 16.0, 13.0, 6.0, 9.0, 6.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.943359375, -3.796661376953125, -3.64996337890625, -3.503265380859375, -3.3565673828125, -3.209869384765625, -3.06317138671875, -2.916473388671875, -2.769775390625, -2.623077392578125, -2.47637939453125, -2.329681396484375, -2.1829833984375, -2.036285400390625, -1.88958740234375, -1.742889404296875, -1.59619140625, -1.449493408203125, -1.30279541015625, -1.156097412109375, -1.0093994140625, -0.862701416015625, -0.71600341796875, -0.569305419921875, -0.422607421875, -0.275909423828125, -0.12921142578125, 0.017486572265625, 0.1641845703125, 0.310882568359375, 0.45758056640625, 0.604278564453125, 0.7509765625, 0.897674560546875, 1.04437255859375, 1.191070556640625, 1.3377685546875, 1.484466552734375, 1.63116455078125, 1.777862548828125, 1.924560546875, 2.071258544921875, 2.21795654296875, 2.364654541015625, 2.5113525390625, 2.658050537109375, 2.80474853515625, 2.951446533203125, 3.09814453125, 3.244842529296875, 3.39154052734375, 3.538238525390625, 3.6849365234375, 3.831634521484375, 3.97833251953125, 4.125030517578125, 4.271728515625, 4.418426513671875, 4.56512451171875, 4.711822509765625, 4.8585205078125, 5.005218505859375, 5.15191650390625, 5.298614501953125, 5.4453125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 4.0, 4.0, 22.0, 24.0, 73.0, 85.0, 127.0, 141.0, 166.0, 134.0, 82.0, 58.0, 33.0, 20.0, 7.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0], "bins": [-62.87931442260742, -61.62422180175781, -60.3691291809082, -59.114036560058594, -57.85894775390625, -56.60385513305664, -55.34876251220703, -54.09366989135742, -52.83857727050781, -51.5834846496582, -50.328392028808594, -49.073299407958984, -47.818206787109375, -46.56311798095703, -45.30802536010742, -44.05293273925781, -42.7978401184082, -41.542747497558594, -40.287654876708984, -39.032562255859375, -37.77747344970703, -36.52238082885742, -35.26728820800781, -34.0121955871582, -32.757102966308594, -31.502010345458984, -30.246917724609375, -28.9918270111084, -27.73673439025879, -26.48164176940918, -25.226551055908203, -23.971458435058594, -22.71636962890625, -21.46127700805664, -20.20618438720703, -18.951093673706055, -17.696001052856445, -16.440908432006836, -15.185816764831543, -13.93072509765625, -12.67563247680664, -11.420539855957031, -10.165448188781738, -8.910356521606445, -7.655263900756836, -6.400171756744385, -5.145079612731934, -3.8899879455566406, -2.6348953247070312, -1.37980318069458, -0.1247110366821289, 1.1303811073303223, 2.3854732513427734, 3.6405653953552246, 4.895657539367676, 6.150749206542969, 7.405841827392578, 8.660934448242188, 9.91602611541748, 11.171117782592773, 12.426210403442383, 13.681303024291992, 14.936394691467285, 16.191486358642578, 17.446578979492188]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 7.0, 5.0, 6.0, 10.0, 14.0, 11.0, 18.0, 24.0, 25.0, 26.0, 33.0, 49.0, 39.0, 49.0, 53.0, 51.0, 48.0, 46.0, 42.0, 47.0, 53.0, 42.0, 43.0, 44.0, 33.0, 31.0, 22.0, 27.0, 11.0, 25.0, 25.0, 6.0, 8.0, 11.0, 5.0, 6.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.885196685791016, -17.287769317626953, -16.69034194946289, -16.092914581298828, -15.495487213134766, -14.898059844970703, -14.300633430480957, -13.703206062316895, -13.105778694152832, -12.50835132598877, -11.910923957824707, -11.313496589660645, -10.716070175170898, -10.118642807006836, -9.521215438842773, -8.923788070678711, -8.326360702514648, -7.728933334350586, -7.131505966186523, -6.534079074859619, -5.936651706695557, -5.339224338531494, -4.74179744720459, -4.144370079040527, -3.546942710876465, -2.9495153427124023, -2.352088212966919, -1.754660964012146, -1.157233715057373, -0.5598063468933105, 0.03762078285217285, 0.6350479125976562, 1.2324771881103516, 1.8299044370651245, 2.4273316860198975, 3.024758815765381, 3.6221861839294434, 4.219613552093506, 4.81704044342041, 5.414467811584473, 6.011895179748535, 6.609322547912598, 7.20674991607666, 7.8041768074035645, 8.401603698730469, 8.999031066894531, 9.596458435058594, 10.193885803222656, 10.791313171386719, 11.388740539550781, 11.986167907714844, 12.583595275878906, 13.181022644042969, 13.778450012207031, 14.375876426696777, 14.97330379486084, 15.570731163024902, 16.16815757751465, 16.76558494567871, 17.363012313842773, 17.960439682006836, 18.5578670501709, 19.15529441833496, 19.752721786499023, 20.350149154663086]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 2.0, 5.0, 16.0, 11.0, 14.0, 19.0, 30.0, 42.0, 60.0, 116.0, 160.0, 287.0, 485.0, 945.0, 1808.0, 4038.0, 9445.0, 22800.0, 59854.0, 164536.0, 360135.0, 261821.0, 99042.0, 36726.0, 14628.0, 6085.0, 2577.0, 1305.0, 654.0, 345.0, 201.0, 120.0, 84.0, 55.0, 31.0, 17.0, 20.0, 11.0, 10.0, 6.0, 1.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.125, -17.571533203125, -17.01806640625, -16.464599609375, -15.9111328125, -15.357666015625, -14.80419921875, -14.250732421875, -13.697265625, -13.143798828125, -12.59033203125, -12.036865234375, -11.4833984375, -10.929931640625, -10.37646484375, -9.822998046875, -9.26953125, -8.716064453125, -8.16259765625, -7.609130859375, -7.0556640625, -6.502197265625, -5.94873046875, -5.395263671875, -4.841796875, -4.288330078125, -3.73486328125, -3.181396484375, -2.6279296875, -2.074462890625, -1.52099609375, -0.967529296875, -0.4140625, 0.139404296875, 0.69287109375, 1.246337890625, 1.7998046875, 2.353271484375, 2.90673828125, 3.460205078125, 4.013671875, 4.567138671875, 5.12060546875, 5.674072265625, 6.2275390625, 6.781005859375, 7.33447265625, 7.887939453125, 8.44140625, 8.994873046875, 9.54833984375, 10.101806640625, 10.6552734375, 11.208740234375, 11.76220703125, 12.315673828125, 12.869140625, 13.422607421875, 13.97607421875, 14.529541015625, 15.0830078125, 15.636474609375, 16.18994140625, 16.743408203125, 17.296875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 4.0, 7.0, 9.0, 7.0, 11.0, 16.0, 21.0, 35.0, 45.0, 36.0, 46.0, 57.0, 62.0, 52.0, 83.0, 66.0, 65.0, 63.0, 60.0, 36.0, 42.0, 25.0, 36.0, 32.0, 18.0, 20.0, 15.0, 8.0, 13.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4345703125, -1.3819580078125, -1.329345703125, -1.2767333984375, -1.22412109375, -1.1715087890625, -1.118896484375, -1.0662841796875, -1.013671875, -0.9610595703125, -0.908447265625, -0.8558349609375, -0.80322265625, -0.7506103515625, -0.697998046875, -0.6453857421875, -0.5927734375, -0.5401611328125, -0.487548828125, -0.4349365234375, -0.38232421875, -0.3297119140625, -0.277099609375, -0.2244873046875, -0.171875, -0.1192626953125, -0.066650390625, -0.0140380859375, 0.03857421875, 0.0911865234375, 0.143798828125, 0.1964111328125, 0.2490234375, 0.3016357421875, 0.354248046875, 0.4068603515625, 0.45947265625, 0.5120849609375, 0.564697265625, 0.6173095703125, 0.669921875, 0.7225341796875, 0.775146484375, 0.8277587890625, 0.88037109375, 0.9329833984375, 0.985595703125, 1.0382080078125, 1.0908203125, 1.1434326171875, 1.196044921875, 1.2486572265625, 1.30126953125, 1.3538818359375, 1.406494140625, 1.4591064453125, 1.51171875, 1.5643310546875, 1.616943359375, 1.6695556640625, 1.72216796875, 1.7747802734375, 1.827392578125, 1.8800048828125, 1.9326171875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 4.0, 9.0, 19.0, 27.0, 25.0, 63.0, 73.0, 117.0, 157.0, 262.0, 451.0, 884.0, 2022.0, 5251.0, 17182.0, 68227.0, 287011.0, 467310.0, 148265.0, 35222.0, 9779.0, 3286.0, 1320.0, 655.0, 345.0, 202.0, 139.0, 91.0, 49.0, 33.0, 25.0, 15.0, 10.0, 8.0, 8.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-29.96875, -29.16455078125, -28.3603515625, -27.55615234375, -26.751953125, -25.94775390625, -25.1435546875, -24.33935546875, -23.53515625, -22.73095703125, -21.9267578125, -21.12255859375, -20.318359375, -19.51416015625, -18.7099609375, -17.90576171875, -17.1015625, -16.29736328125, -15.4931640625, -14.68896484375, -13.884765625, -13.08056640625, -12.2763671875, -11.47216796875, -10.66796875, -9.86376953125, -9.0595703125, -8.25537109375, -7.451171875, -6.64697265625, -5.8427734375, -5.03857421875, -4.234375, -3.43017578125, -2.6259765625, -1.82177734375, -1.017578125, -0.21337890625, 0.5908203125, 1.39501953125, 2.19921875, 3.00341796875, 3.8076171875, 4.61181640625, 5.416015625, 6.22021484375, 7.0244140625, 7.82861328125, 8.6328125, 9.43701171875, 10.2412109375, 11.04541015625, 11.849609375, 12.65380859375, 13.4580078125, 14.26220703125, 15.06640625, 15.87060546875, 16.6748046875, 17.47900390625, 18.283203125, 19.08740234375, 19.8916015625, 20.69580078125, 21.5]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 5.0, 11.0, 8.0, 16.0, 16.0, 13.0, 22.0, 29.0, 31.0, 37.0, 34.0, 43.0, 52.0, 46.0, 49.0, 42.0, 54.0, 51.0, 53.0, 55.0, 41.0, 47.0, 44.0, 41.0, 30.0, 36.0, 21.0, 17.0, 12.0, 8.0, 9.0, 8.0, 5.0, 10.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.171875, -10.857666015625, -10.54345703125, -10.229248046875, -9.9150390625, -9.600830078125, -9.28662109375, -8.972412109375, -8.658203125, -8.343994140625, -8.02978515625, -7.715576171875, -7.4013671875, -7.087158203125, -6.77294921875, -6.458740234375, -6.14453125, -5.830322265625, -5.51611328125, -5.201904296875, -4.8876953125, -4.573486328125, -4.25927734375, -3.945068359375, -3.630859375, -3.316650390625, -3.00244140625, -2.688232421875, -2.3740234375, -2.059814453125, -1.74560546875, -1.431396484375, -1.1171875, -0.802978515625, -0.48876953125, -0.174560546875, 0.1396484375, 0.453857421875, 0.76806640625, 1.082275390625, 1.396484375, 1.710693359375, 2.02490234375, 2.339111328125, 2.6533203125, 2.967529296875, 3.28173828125, 3.595947265625, 3.91015625, 4.224365234375, 4.53857421875, 4.852783203125, 5.1669921875, 5.481201171875, 5.79541015625, 6.109619140625, 6.423828125, 6.738037109375, 7.05224609375, 7.366455078125, 7.6806640625, 7.994873046875, 8.30908203125, 8.623291015625, 8.9375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 8.0, 1.0, 3.0, 4.0, 5.0, 10.0, 7.0, 9.0, 13.0, 14.0, 12.0, 33.0, 41.0, 62.0, 130.0, 200.0, 335.0, 592.0, 1219.0, 2589.0, 6517.0, 19300.0, 69008.0, 262591.0, 452029.0, 167878.0, 44070.0, 13146.0, 4670.0, 1927.0, 984.0, 455.0, 269.0, 150.0, 94.0, 65.0, 24.0, 28.0, 12.0, 12.0, 11.0, 10.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-16.203125, -15.650634765625, -15.09814453125, -14.545654296875, -13.9931640625, -13.440673828125, -12.88818359375, -12.335693359375, -11.783203125, -11.230712890625, -10.67822265625, -10.125732421875, -9.5732421875, -9.020751953125, -8.46826171875, -7.915771484375, -7.36328125, -6.810791015625, -6.25830078125, -5.705810546875, -5.1533203125, -4.600830078125, -4.04833984375, -3.495849609375, -2.943359375, -2.390869140625, -1.83837890625, -1.285888671875, -0.7333984375, -0.180908203125, 0.37158203125, 0.924072265625, 1.4765625, 2.029052734375, 2.58154296875, 3.134033203125, 3.6865234375, 4.239013671875, 4.79150390625, 5.343994140625, 5.896484375, 6.448974609375, 7.00146484375, 7.553955078125, 8.1064453125, 8.658935546875, 9.21142578125, 9.763916015625, 10.31640625, 10.868896484375, 11.42138671875, 11.973876953125, 12.5263671875, 13.078857421875, 13.63134765625, 14.183837890625, 14.736328125, 15.288818359375, 15.84130859375, 16.393798828125, 16.9462890625, 17.498779296875, 18.05126953125, 18.603759765625, 19.15625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 6.0, 15.0, 11.0, 13.0, 18.0, 16.0, 11.0, 40.0, 44.0, 50.0, 77.0, 65.0, 72.0, 93.0, 77.0, 72.0, 60.0, 32.0, 47.0, 30.0, 25.0, 23.0, 16.0, 11.0, 13.0, 7.0, 7.0, 6.0, 4.0, 3.0, 3.0, 9.0, 4.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.001888275146484375, -0.0018323957920074463, -0.0017765164375305176, -0.0017206370830535889, -0.0016647577285766602, -0.0016088783740997314, -0.0015529990196228027, -0.001497119665145874, -0.0014412403106689453, -0.0013853609561920166, -0.0013294816017150879, -0.0012736022472381592, -0.0012177228927612305, -0.0011618435382843018, -0.001105964183807373, -0.0010500848293304443, -0.0009942054748535156, -0.0009383261203765869, -0.0008824467658996582, -0.0008265674114227295, -0.0007706880569458008, -0.0007148087024688721, -0.0006589293479919434, -0.0006030499935150146, -0.0005471706390380859, -0.0004912912845611572, -0.0004354119300842285, -0.0003795325756072998, -0.0003236532211303711, -0.0002677738666534424, -0.00021189451217651367, -0.00015601515769958496, -0.00010013580322265625, -4.425644874572754e-05, 1.1622905731201172e-05, 6.750226020812988e-05, 0.0001233816146850586, 0.0001792609691619873, 0.00023514032363891602, 0.0002910196781158447, 0.00034689903259277344, 0.00040277838706970215, 0.00045865774154663086, 0.0005145370960235596, 0.0005704164505004883, 0.000626295804977417, 0.0006821751594543457, 0.0007380545139312744, 0.0007939338684082031, 0.0008498132228851318, 0.0009056925773620605, 0.0009615719318389893, 0.001017451286315918, 0.0010733306407928467, 0.0011292099952697754, 0.001185089349746704, 0.0012409687042236328, 0.0012968480587005615, 0.0013527274131774902, 0.001408606767654419, 0.0014644861221313477, 0.0015203654766082764, 0.001576244831085205, 0.0016321241855621338, 0.0016880035400390625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 7.0, 6.0, 11.0, 20.0, 14.0, 27.0, 23.0, 53.0, 57.0, 95.0, 145.0, 196.0, 347.0, 542.0, 976.0, 1798.0, 3676.0, 8680.0, 22346.0, 67334.0, 235181.0, 450435.0, 173766.0, 51341.0, 17517.0, 6928.0, 3191.0, 1555.0, 803.0, 490.0, 330.0, 203.0, 147.0, 94.0, 68.0, 41.0, 30.0, 19.0, 19.0, 14.0, 7.0, 3.0, 8.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0], "bins": [-18.109375, -17.5975341796875, -17.085693359375, -16.5738525390625, -16.06201171875, -15.5501708984375, -15.038330078125, -14.5264892578125, -14.0146484375, -13.5028076171875, -12.990966796875, -12.4791259765625, -11.96728515625, -11.4554443359375, -10.943603515625, -10.4317626953125, -9.919921875, -9.4080810546875, -8.896240234375, -8.3843994140625, -7.87255859375, -7.3607177734375, -6.848876953125, -6.3370361328125, -5.8251953125, -5.3133544921875, -4.801513671875, -4.2896728515625, -3.77783203125, -3.2659912109375, -2.754150390625, -2.2423095703125, -1.73046875, -1.2186279296875, -0.706787109375, -0.1949462890625, 0.31689453125, 0.8287353515625, 1.340576171875, 1.8524169921875, 2.3642578125, 2.8760986328125, 3.387939453125, 3.8997802734375, 4.41162109375, 4.9234619140625, 5.435302734375, 5.9471435546875, 6.458984375, 6.9708251953125, 7.482666015625, 7.9945068359375, 8.50634765625, 9.0181884765625, 9.530029296875, 10.0418701171875, 10.5537109375, 11.0655517578125, 11.577392578125, 12.0892333984375, 12.60107421875, 13.1129150390625, 13.624755859375, 14.1365966796875, 14.6484375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 3.0, 4.0, 3.0, 7.0, 3.0, 6.0, 13.0, 11.0, 20.0, 22.0, 11.0, 16.0, 32.0, 39.0, 56.0, 55.0, 55.0, 83.0, 74.0, 69.0, 62.0, 73.0, 49.0, 53.0, 25.0, 21.0, 23.0, 23.0, 26.0, 25.0, 13.0, 4.0, 7.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-8.1875, -7.9222412109375, -7.656982421875, -7.3917236328125, -7.12646484375, -6.8612060546875, -6.595947265625, -6.3306884765625, -6.0654296875, -5.8001708984375, -5.534912109375, -5.2696533203125, -5.00439453125, -4.7391357421875, -4.473876953125, -4.2086181640625, -3.943359375, -3.6781005859375, -3.412841796875, -3.1475830078125, -2.88232421875, -2.6170654296875, -2.351806640625, -2.0865478515625, -1.8212890625, -1.5560302734375, -1.290771484375, -1.0255126953125, -0.76025390625, -0.4949951171875, -0.229736328125, 0.0355224609375, 0.30078125, 0.5660400390625, 0.831298828125, 1.0965576171875, 1.36181640625, 1.6270751953125, 1.892333984375, 2.1575927734375, 2.4228515625, 2.6881103515625, 2.953369140625, 3.2186279296875, 3.48388671875, 3.7491455078125, 4.014404296875, 4.2796630859375, 4.544921875, 4.8101806640625, 5.075439453125, 5.3406982421875, 5.60595703125, 5.8712158203125, 6.136474609375, 6.4017333984375, 6.6669921875, 6.9322509765625, 7.197509765625, 7.4627685546875, 7.72802734375, 7.9932861328125, 8.258544921875, 8.5238037109375, 8.7890625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 13.0, 27.0, 67.0, 181.0, 295.0, 223.0, 123.0, 41.0, 21.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-321.84857177734375, -312.315673828125, -302.7828063964844, -293.2499084472656, -283.7170104980469, -274.1841125488281, -264.6512451171875, -255.11834716796875, -245.58544921875, -236.0525665283203, -226.51966857910156, -216.98678588867188, -207.45388793945312, -197.92100524902344, -188.38812255859375, -178.855224609375, -169.3223419189453, -159.78945922851562, -150.25656127929688, -140.7236785888672, -131.19078063964844, -121.65789794921875, -112.12500762939453, -102.59211730957031, -93.0592269897461, -83.52633666992188, -73.99344635009766, -64.46055603027344, -54.927669525146484, -45.394779205322266, -35.86189270019531, -26.329002380371094, -16.796112060546875, -7.263222694396973, 2.2696666717529297, 11.802555084228516, 21.335445404052734, 30.868335723876953, 40.401222229003906, 49.934112548828125, 59.467002868652344, 68.99989318847656, 78.53278350830078, 88.065673828125, 97.59855651855469, 107.13145446777344, 116.66433715820312, 126.19722747802734, 135.73011779785156, 145.26300048828125, 154.7958984375, 164.3287811279297, 173.86167907714844, 183.39456176757812, 192.92745971679688, 202.46034240722656, 211.99322509765625, 221.52610778808594, 231.0590057373047, 240.59188842773438, 250.12478637695312, 259.6576843261719, 269.1905517578125, 278.72344970703125, 288.25634765625]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 10.0, 7.0, 13.0, 7.0, 16.0, 11.0, 15.0, 21.0, 22.0, 23.0, 30.0, 35.0, 39.0, 30.0, 49.0, 44.0, 45.0, 37.0, 42.0, 42.0, 46.0, 47.0, 36.0, 37.0, 41.0, 33.0, 31.0, 34.0, 22.0, 19.0, 18.0, 14.0, 9.0, 13.0, 10.0, 9.0, 7.0, 10.0, 5.0, 7.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-59.08879852294922, -57.03484344482422, -54.98088836669922, -52.92693328857422, -50.87297821044922, -48.81902313232422, -46.76506423950195, -44.71110916137695, -42.65715408325195, -40.60319900512695, -38.54924392700195, -36.49528884887695, -34.44132995605469, -32.38737487792969, -30.333419799804688, -28.279464721679688, -26.225509643554688, -24.171554565429688, -22.117599487304688, -20.063642501831055, -18.009687423706055, -15.955732345581055, -13.901776313781738, -11.847820281982422, -9.793865203857422, -7.739909648895264, -5.6859540939331055, -3.6319985389709473, -1.578042984008789, 0.47591209411621094, 2.5298681259155273, 4.583824157714844, 6.6377716064453125, 8.691726684570312, 10.745682716369629, 12.799638748168945, 14.853593826293945, 16.907548904418945, 18.961505889892578, 21.015460968017578, 23.069416046142578, 25.123371124267578, 27.177326202392578, 29.23128318786621, 31.28523826599121, 33.339195251464844, 35.393150329589844, 37.447105407714844, 39.501060485839844, 41.555015563964844, 43.608970642089844, 45.662925720214844, 47.716880798339844, 49.770835876464844, 51.82479476928711, 53.87874984741211, 55.93270492553711, 57.98666000366211, 60.04061508178711, 62.09457015991211, 64.14852905273438, 66.20248413085938, 68.25643920898438, 70.31039428710938, 72.36434936523438]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 7.0, 5.0, 11.0, 12.0, 10.0, 15.0, 26.0, 28.0, 52.0, 91.0, 96.0, 157.0, 255.0, 413.0, 765.0, 1309.0, 2457.0, 5030.0, 11114.0, 26994.0, 75214.0, 270423.0, 2748741.0, 811358.0, 153873.0, 49133.0, 18857.0, 8379.0, 4086.0, 2091.0, 1147.0, 671.0, 472.0, 311.0, 206.0, 138.0, 88.0, 71.0, 42.0, 33.0, 16.0, 17.0, 11.0, 12.0, 18.0, 6.0, 8.0, 4.0, 5.0, 5.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-21.609375, -20.88427734375, -20.1591796875, -19.43408203125, -18.708984375, -17.98388671875, -17.2587890625, -16.53369140625, -15.80859375, -15.08349609375, -14.3583984375, -13.63330078125, -12.908203125, -12.18310546875, -11.4580078125, -10.73291015625, -10.0078125, -9.28271484375, -8.5576171875, -7.83251953125, -7.107421875, -6.38232421875, -5.6572265625, -4.93212890625, -4.20703125, -3.48193359375, -2.7568359375, -2.03173828125, -1.306640625, -0.58154296875, 0.1435546875, 0.86865234375, 1.59375, 2.31884765625, 3.0439453125, 3.76904296875, 4.494140625, 5.21923828125, 5.9443359375, 6.66943359375, 7.39453125, 8.11962890625, 8.8447265625, 9.56982421875, 10.294921875, 11.02001953125, 11.7451171875, 12.47021484375, 13.1953125, 13.92041015625, 14.6455078125, 15.37060546875, 16.095703125, 16.82080078125, 17.5458984375, 18.27099609375, 18.99609375, 19.72119140625, 20.4462890625, 21.17138671875, 21.896484375, 22.62158203125, 23.3466796875, 24.07177734375, 24.796875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 4.0, 2.0, 6.0, 3.0, 10.0, 14.0, 9.0, 25.0, 23.0, 30.0, 33.0, 41.0, 47.0, 41.0, 41.0, 53.0, 58.0, 64.0, 48.0, 60.0, 40.0, 53.0, 53.0, 45.0, 33.0, 39.0, 22.0, 19.0, 15.0, 11.0, 16.0, 11.0, 4.0, 8.0, 8.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7177734375, -1.6566619873046875, -1.595550537109375, -1.5344390869140625, -1.47332763671875, -1.4122161865234375, -1.351104736328125, -1.2899932861328125, -1.2288818359375, -1.1677703857421875, -1.106658935546875, -1.0455474853515625, -0.98443603515625, -0.9233245849609375, -0.862213134765625, -0.8011016845703125, -0.739990234375, -0.6788787841796875, -0.617767333984375, -0.5566558837890625, -0.49554443359375, -0.4344329833984375, -0.373321533203125, -0.3122100830078125, -0.2510986328125, -0.1899871826171875, -0.128875732421875, -0.0677642822265625, -0.00665283203125, 0.0544586181640625, 0.115570068359375, 0.1766815185546875, 0.23779296875, 0.2989044189453125, 0.360015869140625, 0.4211273193359375, 0.48223876953125, 0.5433502197265625, 0.604461669921875, 0.6655731201171875, 0.7266845703125, 0.7877960205078125, 0.848907470703125, 0.9100189208984375, 0.97113037109375, 1.0322418212890625, 1.093353271484375, 1.1544647216796875, 1.215576171875, 1.2766876220703125, 1.337799072265625, 1.3989105224609375, 1.46002197265625, 1.5211334228515625, 1.582244873046875, 1.6433563232421875, 1.7044677734375, 1.7655792236328125, 1.826690673828125, 1.8878021240234375, 1.94891357421875, 2.0100250244140625, 2.071136474609375, 2.1322479248046875, 2.193359375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 6.0, 14.0, 16.0, 16.0, 22.0, 55.0, 76.0, 116.0, 172.0, 310.0, 496.0, 905.0, 1612.0, 3267.0, 6985.0, 17693.0, 52318.0, 201869.0, 1362243.0, 2202213.0, 247301.0, 61260.0, 19933.0, 7835.0, 3485.0, 1722.0, 952.0, 548.0, 310.0, 187.0, 121.0, 62.0, 48.0, 32.0, 19.0, 7.0, 15.0, 14.0, 7.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-29.578125, -28.68359375, -27.7890625, -26.89453125, -26.0, -25.10546875, -24.2109375, -23.31640625, -22.421875, -21.52734375, -20.6328125, -19.73828125, -18.84375, -17.94921875, -17.0546875, -16.16015625, -15.265625, -14.37109375, -13.4765625, -12.58203125, -11.6875, -10.79296875, -9.8984375, -9.00390625, -8.109375, -7.21484375, -6.3203125, -5.42578125, -4.53125, -3.63671875, -2.7421875, -1.84765625, -0.953125, -0.05859375, 0.8359375, 1.73046875, 2.625, 3.51953125, 4.4140625, 5.30859375, 6.203125, 7.09765625, 7.9921875, 8.88671875, 9.78125, 10.67578125, 11.5703125, 12.46484375, 13.359375, 14.25390625, 15.1484375, 16.04296875, 16.9375, 17.83203125, 18.7265625, 19.62109375, 20.515625, 21.41015625, 22.3046875, 23.19921875, 24.09375, 24.98828125, 25.8828125, 26.77734375, 27.671875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 10.0, 14.0, 15.0, 20.0, 37.0, 53.0, 72.0, 102.0, 114.0, 229.0, 323.0, 622.0, 1156.0, 429.0, 297.0, 171.0, 115.0, 80.0, 51.0, 49.0, 18.0, 18.0, 19.0, 7.0, 6.0, 5.0, 11.0, 10.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.44140625, -7.2305908203125, -7.019775390625, -6.8089599609375, -6.59814453125, -6.3873291015625, -6.176513671875, -5.9656982421875, -5.7548828125, -5.5440673828125, -5.333251953125, -5.1224365234375, -4.91162109375, -4.7008056640625, -4.489990234375, -4.2791748046875, -4.068359375, -3.8575439453125, -3.646728515625, -3.4359130859375, -3.22509765625, -3.0142822265625, -2.803466796875, -2.5926513671875, -2.3818359375, -2.1710205078125, -1.960205078125, -1.7493896484375, -1.53857421875, -1.3277587890625, -1.116943359375, -0.9061279296875, -0.6953125, -0.4844970703125, -0.273681640625, -0.0628662109375, 0.14794921875, 0.3587646484375, 0.569580078125, 0.7803955078125, 0.9912109375, 1.2020263671875, 1.412841796875, 1.6236572265625, 1.83447265625, 2.0452880859375, 2.256103515625, 2.4669189453125, 2.677734375, 2.8885498046875, 3.099365234375, 3.3101806640625, 3.52099609375, 3.7318115234375, 3.942626953125, 4.1534423828125, 4.3642578125, 4.5750732421875, 4.785888671875, 4.9967041015625, 5.20751953125, 5.4183349609375, 5.629150390625, 5.8399658203125, 6.05078125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 11.0, 18.0, 19.0, 86.0, 191.0, 267.0, 213.0, 120.0, 56.0, 15.0, 9.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-160.84622192382812, -157.54103088378906, -154.23583984375, -150.9306640625, -147.62547302246094, -144.32028198242188, -141.0150909423828, -137.70989990234375, -134.4047088623047, -131.09951782226562, -127.7943344116211, -124.48914337158203, -121.18395233154297, -117.87876892089844, -114.57357788085938, -111.26838684082031, -107.96321105957031, -104.65802001953125, -101.35283660888672, -98.04764556884766, -94.7424545288086, -91.43727111816406, -88.132080078125, -84.82688903808594, -81.52169799804688, -78.21650695800781, -74.91132354736328, -71.60613250732422, -68.30094146728516, -64.99575805664062, -61.69056701660156, -58.385379791259766, -55.08019256591797, -51.77500534057617, -48.46981430053711, -45.16462707519531, -41.859439849853516, -38.55425262451172, -35.249061584472656, -31.94387435913086, -28.63868522644043, -25.33349609375, -22.028308868408203, -18.723119735717773, -15.41793155670166, -12.112743377685547, -8.807554244995117, -5.50236701965332, -2.1971778869628906, 1.1080105304718018, 4.413198947906494, 7.718387603759766, 11.023575782775879, 14.328763961791992, 17.633953094482422, 20.93914031982422, 24.24432945251465, 27.549518585205078, 30.854705810546875, 34.15989685058594, 37.465084075927734, 40.77027130126953, 44.075462341308594, 47.380645751953125, 50.68583679199219]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 3.0, 8.0, 5.0, 11.0, 8.0, 7.0, 9.0, 7.0, 15.0, 20.0, 27.0, 18.0, 19.0, 28.0, 38.0, 22.0, 41.0, 41.0, 41.0, 33.0, 52.0, 46.0, 41.0, 45.0, 34.0, 38.0, 26.0, 36.0, 35.0, 39.0, 30.0, 24.0, 23.0, 18.0, 17.0, 16.0, 16.0, 12.0, 8.0, 7.0, 7.0, 4.0, 2.0, 6.0, 3.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-24.859554290771484, -24.095962524414062, -23.332368850708008, -22.568777084350586, -21.80518341064453, -21.04159164428711, -20.277999877929688, -19.514408111572266, -18.75081443786621, -17.98722267150879, -17.223628997802734, -16.460037231445312, -15.696444511413574, -14.932851791381836, -14.169260025024414, -13.405667304992676, -12.642074584960938, -11.8784818649292, -11.114889144897461, -10.351297378540039, -9.5877046585083, -8.824111938476562, -8.06052017211914, -7.296927452087402, -6.533334732055664, -5.769742012023926, -5.006149768829346, -4.242557525634766, -3.4789648056030273, -2.715372323989868, -1.951779842376709, -1.188187599182129, -0.4245948791503906, 0.33899760246276855, 1.1025900840759277, 1.866182565689087, 2.629775047302246, 3.3933675289154053, 4.1569600105285645, 4.9205522537231445, 5.684144973754883, 6.447737693786621, 7.211329936981201, 7.974922180175781, 8.73851490020752, 9.502107620239258, 10.26569938659668, 11.029292106628418, 11.792884826660156, 12.556477546691895, 13.320070266723633, 14.083662033081055, 14.847254753112793, 15.610847473144531, 16.374439239501953, 17.138031005859375, 17.90162467956543, 18.66521644592285, 19.428810119628906, 20.192401885986328, 20.95599365234375, 21.719587326049805, 22.483179092407227, 23.24677276611328, 24.010364532470703]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 5.0, 5.0, 12.0, 20.0, 23.0, 27.0, 38.0, 58.0, 106.0, 159.0, 206.0, 358.0, 662.0, 1174.0, 2118.0, 4373.0, 8855.0, 19203.0, 40406.0, 85325.0, 172143.0, 272525.0, 219916.0, 115239.0, 55266.0, 26025.0, 12226.0, 5782.0, 2828.0, 1419.0, 795.0, 428.0, 295.0, 175.0, 125.0, 58.0, 54.0, 32.0, 21.0, 25.0, 15.0, 8.0, 10.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-13.90625, -13.453369140625, -13.00048828125, -12.547607421875, -12.0947265625, -11.641845703125, -11.18896484375, -10.736083984375, -10.283203125, -9.830322265625, -9.37744140625, -8.924560546875, -8.4716796875, -8.018798828125, -7.56591796875, -7.113037109375, -6.66015625, -6.207275390625, -5.75439453125, -5.301513671875, -4.8486328125, -4.395751953125, -3.94287109375, -3.489990234375, -3.037109375, -2.584228515625, -2.13134765625, -1.678466796875, -1.2255859375, -0.772705078125, -0.31982421875, 0.133056640625, 0.5859375, 1.038818359375, 1.49169921875, 1.944580078125, 2.3974609375, 2.850341796875, 3.30322265625, 3.756103515625, 4.208984375, 4.661865234375, 5.11474609375, 5.567626953125, 6.0205078125, 6.473388671875, 6.92626953125, 7.379150390625, 7.83203125, 8.284912109375, 8.73779296875, 9.190673828125, 9.6435546875, 10.096435546875, 10.54931640625, 11.002197265625, 11.455078125, 11.907958984375, 12.36083984375, 12.813720703125, 13.2666015625, 13.719482421875, 14.17236328125, 14.625244140625, 15.078125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 6.0, 3.0, 4.0, 11.0, 9.0, 15.0, 16.0, 18.0, 20.0, 22.0, 23.0, 31.0, 25.0, 48.0, 60.0, 54.0, 42.0, 53.0, 49.0, 52.0, 41.0, 49.0, 51.0, 40.0, 41.0, 30.0, 28.0, 34.0, 21.0, 27.0, 12.0, 11.0, 14.0, 8.0, 11.0, 9.0, 4.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7841796875, -1.7180023193359375, -1.651824951171875, -1.5856475830078125, -1.51947021484375, -1.4532928466796875, -1.387115478515625, -1.3209381103515625, -1.2547607421875, -1.1885833740234375, -1.122406005859375, -1.0562286376953125, -0.99005126953125, -0.9238739013671875, -0.857696533203125, -0.7915191650390625, -0.725341796875, -0.6591644287109375, -0.592987060546875, -0.5268096923828125, -0.46063232421875, -0.3944549560546875, -0.328277587890625, -0.2621002197265625, -0.1959228515625, -0.1297454833984375, -0.063568115234375, 0.0026092529296875, 0.06878662109375, 0.1349639892578125, 0.201141357421875, 0.2673187255859375, 0.33349609375, 0.3996734619140625, 0.465850830078125, 0.5320281982421875, 0.59820556640625, 0.6643829345703125, 0.730560302734375, 0.7967376708984375, 0.8629150390625, 0.9290924072265625, 0.995269775390625, 1.0614471435546875, 1.12762451171875, 1.1938018798828125, 1.259979248046875, 1.3261566162109375, 1.392333984375, 1.4585113525390625, 1.524688720703125, 1.5908660888671875, 1.65704345703125, 1.7232208251953125, 1.789398193359375, 1.8555755615234375, 1.9217529296875, 1.9879302978515625, 2.054107666015625, 2.1202850341796875, 2.18646240234375, 2.2526397705078125, 2.318817138671875, 2.3849945068359375, 2.451171875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 3.0, 6.0, 4.0, 10.0, 16.0, 31.0, 37.0, 26.0, 55.0, 76.0, 117.0, 137.0, 186.0, 330.0, 447.0, 843.0, 1564.0, 3232.0, 7495.0, 19161.0, 54524.0, 160508.0, 411584.0, 253172.0, 85230.0, 29583.0, 10796.0, 4553.0, 2050.0, 1007.0, 604.0, 360.0, 252.0, 164.0, 101.0, 83.0, 50.0, 45.0, 29.0, 19.0, 18.0, 17.0, 10.0, 11.0, 4.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.1875, -22.406982421875, -21.62646484375, -20.845947265625, -20.0654296875, -19.284912109375, -18.50439453125, -17.723876953125, -16.943359375, -16.162841796875, -15.38232421875, -14.601806640625, -13.8212890625, -13.040771484375, -12.26025390625, -11.479736328125, -10.69921875, -9.918701171875, -9.13818359375, -8.357666015625, -7.5771484375, -6.796630859375, -6.01611328125, -5.235595703125, -4.455078125, -3.674560546875, -2.89404296875, -2.113525390625, -1.3330078125, -0.552490234375, 0.22802734375, 1.008544921875, 1.7890625, 2.569580078125, 3.35009765625, 4.130615234375, 4.9111328125, 5.691650390625, 6.47216796875, 7.252685546875, 8.033203125, 8.813720703125, 9.59423828125, 10.374755859375, 11.1552734375, 11.935791015625, 12.71630859375, 13.496826171875, 14.27734375, 15.057861328125, 15.83837890625, 16.618896484375, 17.3994140625, 18.179931640625, 18.96044921875, 19.740966796875, 20.521484375, 21.302001953125, 22.08251953125, 22.863037109375, 23.6435546875, 24.424072265625, 25.20458984375, 25.985107421875, 26.765625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 2.0, 8.0, 6.0, 6.0, 6.0, 11.0, 12.0, 13.0, 19.0, 24.0, 24.0, 29.0, 31.0, 26.0, 39.0, 35.0, 39.0, 36.0, 53.0, 56.0, 42.0, 56.0, 43.0, 36.0, 45.0, 32.0, 42.0, 29.0, 34.0, 33.0, 20.0, 27.0, 14.0, 12.0, 8.0, 14.0, 6.0, 6.0, 6.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.734375, -12.2916259765625, -11.848876953125, -11.4061279296875, -10.96337890625, -10.5206298828125, -10.077880859375, -9.6351318359375, -9.1923828125, -8.7496337890625, -8.306884765625, -7.8641357421875, -7.42138671875, -6.9786376953125, -6.535888671875, -6.0931396484375, -5.650390625, -5.2076416015625, -4.764892578125, -4.3221435546875, -3.87939453125, -3.4366455078125, -2.993896484375, -2.5511474609375, -2.1083984375, -1.6656494140625, -1.222900390625, -0.7801513671875, -0.33740234375, 0.1053466796875, 0.548095703125, 0.9908447265625, 1.43359375, 1.8763427734375, 2.319091796875, 2.7618408203125, 3.20458984375, 3.6473388671875, 4.090087890625, 4.5328369140625, 4.9755859375, 5.4183349609375, 5.861083984375, 6.3038330078125, 6.74658203125, 7.1893310546875, 7.632080078125, 8.0748291015625, 8.517578125, 8.9603271484375, 9.403076171875, 9.8458251953125, 10.28857421875, 10.7313232421875, 11.174072265625, 11.6168212890625, 12.0595703125, 12.5023193359375, 12.945068359375, 13.3878173828125, 13.83056640625, 14.2733154296875, 14.716064453125, 15.1588134765625, 15.6015625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 4.0, 8.0, 10.0, 22.0, 13.0, 16.0, 34.0, 55.0, 77.0, 143.0, 239.0, 455.0, 896.0, 2099.0, 4831.0, 12808.0, 39943.0, 152448.0, 532489.0, 220625.0, 53768.0, 16613.0, 6178.0, 2485.0, 1072.0, 534.0, 265.0, 141.0, 86.0, 70.0, 38.0, 23.0, 27.0, 15.0, 6.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.03125, -19.45263671875, -18.8740234375, -18.29541015625, -17.716796875, -17.13818359375, -16.5595703125, -15.98095703125, -15.40234375, -14.82373046875, -14.2451171875, -13.66650390625, -13.087890625, -12.50927734375, -11.9306640625, -11.35205078125, -10.7734375, -10.19482421875, -9.6162109375, -9.03759765625, -8.458984375, -7.88037109375, -7.3017578125, -6.72314453125, -6.14453125, -5.56591796875, -4.9873046875, -4.40869140625, -3.830078125, -3.25146484375, -2.6728515625, -2.09423828125, -1.515625, -0.93701171875, -0.3583984375, 0.22021484375, 0.798828125, 1.37744140625, 1.9560546875, 2.53466796875, 3.11328125, 3.69189453125, 4.2705078125, 4.84912109375, 5.427734375, 6.00634765625, 6.5849609375, 7.16357421875, 7.7421875, 8.32080078125, 8.8994140625, 9.47802734375, 10.056640625, 10.63525390625, 11.2138671875, 11.79248046875, 12.37109375, 12.94970703125, 13.5283203125, 14.10693359375, 14.685546875, 15.26416015625, 15.8427734375, 16.42138671875, 17.0]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 4.0, 5.0, 6.0, 19.0, 13.0, 23.0, 29.0, 21.0, 42.0, 39.0, 64.0, 96.0, 178.0, 140.0, 69.0, 53.0, 41.0, 26.0, 21.0, 19.0, 19.0, 7.0, 17.0, 7.0, 11.0, 7.0, 4.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0037059783935546875, -0.003614872694015503, -0.0035237669944763184, -0.003432661294937134, -0.0033415555953979492, -0.0032504498958587646, -0.00315934419631958, -0.0030682384967803955, -0.002977132797241211, -0.0028860270977020264, -0.002794921398162842, -0.0027038156986236572, -0.0026127099990844727, -0.002521604299545288, -0.0024304986000061035, -0.002339392900466919, -0.0022482872009277344, -0.00215718150138855, -0.0020660758018493652, -0.0019749701023101807, -0.001883864402770996, -0.0017927587032318115, -0.001701653003692627, -0.0016105473041534424, -0.0015194416046142578, -0.0014283359050750732, -0.0013372302055358887, -0.001246124505996704, -0.0011550188064575195, -0.001063913106918335, -0.0009728074073791504, -0.0008817017078399658, -0.0007905960083007812, -0.0006994903087615967, -0.0006083846092224121, -0.0005172789096832275, -0.00042617321014404297, -0.0003350675106048584, -0.00024396181106567383, -0.00015285611152648926, -6.175041198730469e-05, 2.9355287551879883e-05, 0.00012046098709106445, 0.00021156668663024902, 0.0003026723861694336, 0.00039377808570861816, 0.00048488378524780273, 0.0005759894847869873, 0.0006670951843261719, 0.0007582008838653564, 0.000849306583404541, 0.0009404122829437256, 0.0010315179824829102, 0.0011226236820220947, 0.0012137293815612793, 0.0013048350811004639, 0.0013959407806396484, 0.001487046480178833, 0.0015781521797180176, 0.0016692578792572021, 0.0017603635787963867, 0.0018514692783355713, 0.0019425749778747559, 0.0020336806774139404, 0.002124786376953125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 6.0, 12.0, 14.0, 17.0, 19.0, 35.0, 49.0, 69.0, 75.0, 123.0, 170.0, 274.0, 477.0, 805.0, 1469.0, 2925.0, 5893.0, 13675.0, 35363.0, 113014.0, 471695.0, 288496.0, 69825.0, 24111.0, 10000.0, 4588.0, 2233.0, 1185.0, 636.0, 399.0, 248.0, 187.0, 110.0, 91.0, 52.0, 51.0, 39.0, 32.0, 25.0, 15.0, 14.0, 10.0, 10.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-19.25, -18.6806640625, -18.111328125, -17.5419921875, -16.97265625, -16.4033203125, -15.833984375, -15.2646484375, -14.6953125, -14.1259765625, -13.556640625, -12.9873046875, -12.41796875, -11.8486328125, -11.279296875, -10.7099609375, -10.140625, -9.5712890625, -9.001953125, -8.4326171875, -7.86328125, -7.2939453125, -6.724609375, -6.1552734375, -5.5859375, -5.0166015625, -4.447265625, -3.8779296875, -3.30859375, -2.7392578125, -2.169921875, -1.6005859375, -1.03125, -0.4619140625, 0.107421875, 0.6767578125, 1.24609375, 1.8154296875, 2.384765625, 2.9541015625, 3.5234375, 4.0927734375, 4.662109375, 5.2314453125, 5.80078125, 6.3701171875, 6.939453125, 7.5087890625, 8.078125, 8.6474609375, 9.216796875, 9.7861328125, 10.35546875, 10.9248046875, 11.494140625, 12.0634765625, 12.6328125, 13.2021484375, 13.771484375, 14.3408203125, 14.91015625, 15.4794921875, 16.048828125, 16.6181640625, 17.1875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 10.0, 6.0, 6.0, 11.0, 12.0, 15.0, 17.0, 32.0, 25.0, 28.0, 40.0, 59.0, 77.0, 87.0, 113.0, 78.0, 74.0, 58.0, 57.0, 34.0, 18.0, 20.0, 17.0, 13.0, 11.0, 9.0, 11.0, 5.0, 7.0, 9.0, 3.0, 4.0, 4.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.96875, -9.6197509765625, -9.270751953125, -8.9217529296875, -8.57275390625, -8.2237548828125, -7.874755859375, -7.5257568359375, -7.1767578125, -6.8277587890625, -6.478759765625, -6.1297607421875, -5.78076171875, -5.4317626953125, -5.082763671875, -4.7337646484375, -4.384765625, -4.0357666015625, -3.686767578125, -3.3377685546875, -2.98876953125, -2.6397705078125, -2.290771484375, -1.9417724609375, -1.5927734375, -1.2437744140625, -0.894775390625, -0.5457763671875, -0.19677734375, 0.1522216796875, 0.501220703125, 0.8502197265625, 1.19921875, 1.5482177734375, 1.897216796875, 2.2462158203125, 2.59521484375, 2.9442138671875, 3.293212890625, 3.6422119140625, 3.9912109375, 4.3402099609375, 4.689208984375, 5.0382080078125, 5.38720703125, 5.7362060546875, 6.085205078125, 6.4342041015625, 6.783203125, 7.1322021484375, 7.481201171875, 7.8302001953125, 8.17919921875, 8.5281982421875, 8.877197265625, 9.2261962890625, 9.5751953125, 9.9241943359375, 10.273193359375, 10.6221923828125, 10.97119140625, 11.3201904296875, 11.669189453125, 12.0181884765625, 12.3671875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 12.0, 17.0, 33.0, 37.0, 45.0, 78.0, 97.0, 111.0, 133.0, 108.0, 87.0, 75.0, 58.0, 31.0, 26.0, 21.0, 6.0, 2.0, 9.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-136.860107421875, -131.72422790527344, -126.58834838867188, -121.45246887207031, -116.31658935546875, -111.18070983886719, -106.04483032226562, -100.90895080566406, -95.7730712890625, -90.63719177246094, -85.50131225585938, -80.36543273925781, -75.22955322265625, -70.09367370605469, -64.95779418945312, -59.82191467285156, -54.68603515625, -49.55015563964844, -44.414276123046875, -39.27839660644531, -34.14251708984375, -29.006637573242188, -23.870758056640625, -18.734878540039062, -13.5989990234375, -8.463119506835938, -3.327239990234375, 1.8086395263671875, 6.94451904296875, 12.080398559570312, 17.216278076171875, 22.352157592773438, 27.488037109375, 32.62391662597656, 37.759796142578125, 42.89567565917969, 48.03155517578125, 53.16743469238281, 58.303314208984375, 63.43919372558594, 68.5750732421875, 73.71095275878906, 78.84683227539062, 83.98271179199219, 89.11859130859375, 94.25447082519531, 99.39035034179688, 104.52622985839844, 109.662109375, 114.79798889160156, 119.93386840820312, 125.06974792480469, 130.20562744140625, 135.3415069580078, 140.47738647460938, 145.61326599121094, 150.7491455078125, 155.88502502441406, 161.02090454101562, 166.1567840576172, 171.29266357421875, 176.4285430908203, 181.56442260742188, 186.70030212402344, 191.836181640625]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 3.0, 5.0, 8.0, 5.0, 9.0, 7.0, 17.0, 14.0, 11.0, 19.0, 22.0, 16.0, 25.0, 22.0, 32.0, 34.0, 29.0, 31.0, 35.0, 37.0, 33.0, 43.0, 55.0, 43.0, 36.0, 42.0, 30.0, 33.0, 26.0, 41.0, 35.0, 41.0, 21.0, 20.0, 19.0, 19.0, 23.0, 15.0, 7.0, 8.0, 7.0, 7.0, 2.0, 9.0, 2.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-95.60684967041016, -92.68412017822266, -89.76139068603516, -86.83865356445312, -83.91592407226562, -80.99319458007812, -78.07046508789062, -75.14773559570312, -72.22500610351562, -69.30227661132812, -66.37954711914062, -63.45681381225586, -60.53408432006836, -57.611351013183594, -54.688621520996094, -51.765892028808594, -48.84315872192383, -45.92042922973633, -42.99769592285156, -40.07496643066406, -37.15223693847656, -34.22950744628906, -31.306774139404297, -28.384044647216797, -25.461313247680664, -22.53858184814453, -19.61585235595703, -16.6931209564209, -13.770390510559082, -10.847660064697266, -7.924928665161133, -5.002199172973633, -2.0794677734375, 0.8432629108428955, 3.765993595123291, 6.688724517822266, 9.611454963684082, 12.534185409545898, 15.456916809082031, 18.37964630126953, 21.302377700805664, 24.225109100341797, 27.147838592529297, 30.07056999206543, 32.99330139160156, 35.91603088378906, 38.83876037597656, 41.76148986816406, 44.68422317504883, 47.60695266723633, 50.529685974121094, 53.452415466308594, 56.375144958496094, 59.297874450683594, 62.22060775756836, 65.14334106445312, 68.06607055664062, 70.98880004882812, 73.91152954101562, 76.83425903320312, 79.75699615478516, 82.67972564697266, 85.60245513916016, 88.52518463134766, 91.44791412353516]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 7.0, 7.0, 12.0, 25.0, 22.0, 49.0, 97.0, 151.0, 263.0, 463.0, 850.0, 1923.0, 4241.0, 9888.0, 26133.0, 80999.0, 364395.0, 3272353.0, 318958.0, 73323.0, 23745.0, 8847.0, 3751.0, 1735.0, 911.0, 447.0, 284.0, 154.0, 89.0, 58.0, 35.0, 20.0, 17.0, 11.0, 6.0, 5.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.765625, -23.01025390625, -22.2548828125, -21.49951171875, -20.744140625, -19.98876953125, -19.2333984375, -18.47802734375, -17.72265625, -16.96728515625, -16.2119140625, -15.45654296875, -14.701171875, -13.94580078125, -13.1904296875, -12.43505859375, -11.6796875, -10.92431640625, -10.1689453125, -9.41357421875, -8.658203125, -7.90283203125, -7.1474609375, -6.39208984375, -5.63671875, -4.88134765625, -4.1259765625, -3.37060546875, -2.615234375, -1.85986328125, -1.1044921875, -0.34912109375, 0.40625, 1.16162109375, 1.9169921875, 2.67236328125, 3.427734375, 4.18310546875, 4.9384765625, 5.69384765625, 6.44921875, 7.20458984375, 7.9599609375, 8.71533203125, 9.470703125, 10.22607421875, 10.9814453125, 11.73681640625, 12.4921875, 13.24755859375, 14.0029296875, 14.75830078125, 15.513671875, 16.26904296875, 17.0244140625, 17.77978515625, 18.53515625, 19.29052734375, 20.0458984375, 20.80126953125, 21.556640625, 22.31201171875, 23.0673828125, 23.82275390625, 24.578125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 5.0, 6.0, 8.0, 5.0, 12.0, 15.0, 12.0, 12.0, 10.0, 23.0, 22.0, 37.0, 34.0, 33.0, 39.0, 31.0, 49.0, 46.0, 58.0, 54.0, 38.0, 47.0, 62.0, 47.0, 30.0, 42.0, 38.0, 33.0, 19.0, 32.0, 19.0, 20.0, 12.0, 11.0, 7.0, 9.0, 4.0, 7.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.798828125, -2.715789794921875, -2.63275146484375, -2.549713134765625, -2.4666748046875, -2.383636474609375, -2.30059814453125, -2.217559814453125, -2.134521484375, -2.051483154296875, -1.96844482421875, -1.885406494140625, -1.8023681640625, -1.719329833984375, -1.63629150390625, -1.553253173828125, -1.47021484375, -1.387176513671875, -1.30413818359375, -1.221099853515625, -1.1380615234375, -1.055023193359375, -0.97198486328125, -0.888946533203125, -0.805908203125, -0.722869873046875, -0.63983154296875, -0.556793212890625, -0.4737548828125, -0.390716552734375, -0.30767822265625, -0.224639892578125, -0.1416015625, -0.058563232421875, 0.02447509765625, 0.107513427734375, 0.1905517578125, 0.273590087890625, 0.35662841796875, 0.439666748046875, 0.522705078125, 0.605743408203125, 0.68878173828125, 0.771820068359375, 0.8548583984375, 0.937896728515625, 1.02093505859375, 1.103973388671875, 1.18701171875, 1.270050048828125, 1.35308837890625, 1.436126708984375, 1.5191650390625, 1.602203369140625, 1.68524169921875, 1.768280029296875, 1.851318359375, 1.934356689453125, 2.01739501953125, 2.100433349609375, 2.1834716796875, 2.266510009765625, 2.34954833984375, 2.432586669921875, 2.515625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 7.0, 5.0, 8.0, 16.0, 26.0, 33.0, 64.0, 120.0, 202.0, 345.0, 606.0, 1142.0, 2338.0, 5297.0, 13828.0, 44103.0, 183018.0, 2264404.0, 1454759.0, 161164.0, 40048.0, 12981.0, 5073.0, 2276.0, 1125.0, 517.0, 311.0, 178.0, 112.0, 66.0, 39.0, 26.0, 16.0, 12.0, 10.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.53125, -22.625, -21.71875, -20.8125, -19.90625, -19.0, -18.09375, -17.1875, -16.28125, -15.375, -14.46875, -13.5625, -12.65625, -11.75, -10.84375, -9.9375, -9.03125, -8.125, -7.21875, -6.3125, -5.40625, -4.5, -3.59375, -2.6875, -1.78125, -0.875, 0.03125, 0.9375, 1.84375, 2.75, 3.65625, 4.5625, 5.46875, 6.375, 7.28125, 8.1875, 9.09375, 10.0, 10.90625, 11.8125, 12.71875, 13.625, 14.53125, 15.4375, 16.34375, 17.25, 18.15625, 19.0625, 19.96875, 20.875, 21.78125, 22.6875, 23.59375, 24.5, 25.40625, 26.3125, 27.21875, 28.125, 29.03125, 29.9375, 30.84375, 31.75, 32.65625, 33.5625, 34.46875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 12.0, 9.0, 14.0, 16.0, 23.0, 24.0, 41.0, 48.0, 68.0, 97.0, 123.0, 224.0, 306.0, 715.0, 1247.0, 380.0, 205.0, 148.0, 84.0, 72.0, 44.0, 51.0, 24.0, 18.0, 20.0, 9.0, 7.0, 4.0, 7.0, 6.0, 5.0, 4.0, 3.0, 4.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.109375, -6.90130615234375, -6.6932373046875, -6.48516845703125, -6.277099609375, -6.06903076171875, -5.8609619140625, -5.65289306640625, -5.44482421875, -5.23675537109375, -5.0286865234375, -4.82061767578125, -4.612548828125, -4.40447998046875, -4.1964111328125, -3.98834228515625, -3.7802734375, -3.57220458984375, -3.3641357421875, -3.15606689453125, -2.947998046875, -2.73992919921875, -2.5318603515625, -2.32379150390625, -2.11572265625, -1.90765380859375, -1.6995849609375, -1.49151611328125, -1.283447265625, -1.07537841796875, -0.8673095703125, -0.65924072265625, -0.451171875, -0.24310302734375, -0.0350341796875, 0.17303466796875, 0.381103515625, 0.58917236328125, 0.7972412109375, 1.00531005859375, 1.21337890625, 1.42144775390625, 1.6295166015625, 1.83758544921875, 2.045654296875, 2.25372314453125, 2.4617919921875, 2.66986083984375, 2.8779296875, 3.08599853515625, 3.2940673828125, 3.50213623046875, 3.710205078125, 3.91827392578125, 4.1263427734375, 4.33441162109375, 4.54248046875, 4.75054931640625, 4.9586181640625, 5.16668701171875, 5.374755859375, 5.58282470703125, 5.7908935546875, 5.99896240234375, 6.20703125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 14.0, 21.0, 64.0, 74.0, 157.0, 177.0, 171.0, 135.0, 93.0, 51.0, 22.0, 13.0, 8.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-127.34422302246094, -124.75031280517578, -122.15640258789062, -119.5625, -116.96858978271484, -114.37467956542969, -111.78076934814453, -109.18685913085938, -106.59294891357422, -103.99903869628906, -101.4051284790039, -98.81121826171875, -96.21731567382812, -93.62340545654297, -91.02949523925781, -88.43558502197266, -85.8416748046875, -83.24776458740234, -80.65385437011719, -78.05995178222656, -75.4660415649414, -72.87213134765625, -70.2782211303711, -67.68431091308594, -65.09040832519531, -62.496498107910156, -59.902591705322266, -57.30868148803711, -54.71477127075195, -52.12086486816406, -49.526954650878906, -46.93304443359375, -44.339134216308594, -41.74522399902344, -39.15131759643555, -36.55740737915039, -33.963497161865234, -31.36958885192871, -28.775680541992188, -26.18177032470703, -23.587862014770508, -20.993953704833984, -18.400043487548828, -15.806135177612305, -13.212225914001465, -10.618316650390625, -8.024408340454102, -5.430498123168945, -2.836589813232422, -0.24268078804016113, 2.3512282371520996, 4.945137023925781, 7.539046287536621, 10.132955551147461, 12.726863861083984, 15.32077407836914, 17.914682388305664, 20.508590698242188, 23.102500915527344, 25.696409225463867, 28.29031753540039, 30.884227752685547, 33.47813415527344, 36.072044372558594, 38.66595458984375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 1.0, 9.0, 10.0, 9.0, 16.0, 19.0, 23.0, 22.0, 28.0, 34.0, 25.0, 29.0, 30.0, 38.0, 47.0, 47.0, 41.0, 43.0, 64.0, 39.0, 37.0, 42.0, 50.0, 31.0, 29.0, 34.0, 32.0, 32.0, 23.0, 16.0, 15.0, 18.0, 13.0, 11.0, 7.0, 16.0, 5.0, 3.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.120281219482422, -22.178024291992188, -21.235767364501953, -20.29351043701172, -19.35125160217285, -18.408994674682617, -17.466737747192383, -16.52448081970215, -15.582223892211914, -14.63996696472168, -13.697709083557129, -12.755452156066895, -11.81319522857666, -10.87093734741211, -9.928680419921875, -8.98642349243164, -8.04416561126709, -7.101908206939697, -6.159651279449463, -5.21739387512207, -4.275136947631836, -3.3328795433044434, -2.390622138977051, -1.4483652114868164, -0.5061078071594238, 0.4361494183540344, 1.3784066438674927, 2.3206639289855957, 3.262921094894409, 4.205178260803223, 5.147435665130615, 6.08969259262085, 7.031949996948242, 7.974207401275635, 8.916464805603027, 9.858721733093262, 10.800978660583496, 11.743236541748047, 12.685493469238281, 13.627750396728516, 14.57000732421875, 15.512264251708984, 16.45452117919922, 17.396778106689453, 18.33903694152832, 19.281293869018555, 20.22355079650879, 21.165807723999023, 22.10806655883789, 23.050323486328125, 23.99258041381836, 24.934837341308594, 25.87709617614746, 26.819353103637695, 27.76161003112793, 28.703866958618164, 29.6461238861084, 30.588380813598633, 31.530637741088867, 32.472896575927734, 33.41515350341797, 34.3574104309082, 35.29966735839844, 36.24192428588867, 37.184181213378906]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 6.0, 12.0, 18.0, 21.0, 43.0, 41.0, 86.0, 169.0, 248.0, 448.0, 877.0, 1735.0, 3563.0, 7146.0, 15399.0, 33799.0, 76562.0, 165531.0, 296265.0, 237140.0, 113610.0, 51549.0, 23330.0, 10753.0, 4995.0, 2476.0, 1222.0, 616.0, 337.0, 220.0, 131.0, 74.0, 40.0, 29.0, 13.0, 22.0, 13.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.5625, -17.084716796875, -16.60693359375, -16.129150390625, -15.6513671875, -15.173583984375, -14.69580078125, -14.218017578125, -13.740234375, -13.262451171875, -12.78466796875, -12.306884765625, -11.8291015625, -11.351318359375, -10.87353515625, -10.395751953125, -9.91796875, -9.440185546875, -8.96240234375, -8.484619140625, -8.0068359375, -7.529052734375, -7.05126953125, -6.573486328125, -6.095703125, -5.617919921875, -5.14013671875, -4.662353515625, -4.1845703125, -3.706787109375, -3.22900390625, -2.751220703125, -2.2734375, -1.795654296875, -1.31787109375, -0.840087890625, -0.3623046875, 0.115478515625, 0.59326171875, 1.071044921875, 1.548828125, 2.026611328125, 2.50439453125, 2.982177734375, 3.4599609375, 3.937744140625, 4.41552734375, 4.893310546875, 5.37109375, 5.848876953125, 6.32666015625, 6.804443359375, 7.2822265625, 7.760009765625, 8.23779296875, 8.715576171875, 9.193359375, 9.671142578125, 10.14892578125, 10.626708984375, 11.1044921875, 11.582275390625, 12.06005859375, 12.537841796875, 13.015625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 4.0, 5.0, 5.0, 6.0, 10.0, 7.0, 9.0, 10.0, 17.0, 12.0, 19.0, 20.0, 28.0, 36.0, 30.0, 27.0, 33.0, 40.0, 48.0, 48.0, 52.0, 59.0, 37.0, 47.0, 42.0, 50.0, 42.0, 36.0, 37.0, 26.0, 32.0, 24.0, 16.0, 20.0, 13.0, 13.0, 12.0, 5.0, 11.0, 6.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.962890625, -2.877197265625, -2.79150390625, -2.705810546875, -2.6201171875, -2.534423828125, -2.44873046875, -2.363037109375, -2.27734375, -2.191650390625, -2.10595703125, -2.020263671875, -1.9345703125, -1.848876953125, -1.76318359375, -1.677490234375, -1.591796875, -1.506103515625, -1.42041015625, -1.334716796875, -1.2490234375, -1.163330078125, -1.07763671875, -0.991943359375, -0.90625, -0.820556640625, -0.73486328125, -0.649169921875, -0.5634765625, -0.477783203125, -0.39208984375, -0.306396484375, -0.220703125, -0.135009765625, -0.04931640625, 0.036376953125, 0.1220703125, 0.207763671875, 0.29345703125, 0.379150390625, 0.46484375, 0.550537109375, 0.63623046875, 0.721923828125, 0.8076171875, 0.893310546875, 0.97900390625, 1.064697265625, 1.150390625, 1.236083984375, 1.32177734375, 1.407470703125, 1.4931640625, 1.578857421875, 1.66455078125, 1.750244140625, 1.8359375, 1.921630859375, 2.00732421875, 2.093017578125, 2.1787109375, 2.264404296875, 2.35009765625, 2.435791015625, 2.521484375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 4.0, 10.0, 10.0, 14.0, 20.0, 29.0, 42.0, 62.0, 94.0, 132.0, 217.0, 338.0, 555.0, 937.0, 1865.0, 3849.0, 8429.0, 21329.0, 57799.0, 156989.0, 356890.0, 271224.0, 103642.0, 37470.0, 14315.0, 6072.0, 2796.0, 1406.0, 788.0, 443.0, 249.0, 173.0, 95.0, 84.0, 50.0, 46.0, 19.0, 25.0, 9.0, 11.0, 11.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-20.640625, -20.02978515625, -19.4189453125, -18.80810546875, -18.197265625, -17.58642578125, -16.9755859375, -16.36474609375, -15.75390625, -15.14306640625, -14.5322265625, -13.92138671875, -13.310546875, -12.69970703125, -12.0888671875, -11.47802734375, -10.8671875, -10.25634765625, -9.6455078125, -9.03466796875, -8.423828125, -7.81298828125, -7.2021484375, -6.59130859375, -5.98046875, -5.36962890625, -4.7587890625, -4.14794921875, -3.537109375, -2.92626953125, -2.3154296875, -1.70458984375, -1.09375, -0.48291015625, 0.1279296875, 0.73876953125, 1.349609375, 1.96044921875, 2.5712890625, 3.18212890625, 3.79296875, 4.40380859375, 5.0146484375, 5.62548828125, 6.236328125, 6.84716796875, 7.4580078125, 8.06884765625, 8.6796875, 9.29052734375, 9.9013671875, 10.51220703125, 11.123046875, 11.73388671875, 12.3447265625, 12.95556640625, 13.56640625, 14.17724609375, 14.7880859375, 15.39892578125, 16.009765625, 16.62060546875, 17.2314453125, 17.84228515625, 18.453125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 2.0, 6.0, 5.0, 7.0, 8.0, 6.0, 10.0, 12.0, 13.0, 13.0, 20.0, 26.0, 22.0, 35.0, 24.0, 40.0, 41.0, 39.0, 55.0, 48.0, 44.0, 45.0, 46.0, 38.0, 56.0, 44.0, 48.0, 37.0, 33.0, 32.0, 29.0, 23.0, 20.0, 16.0, 10.0, 10.0, 7.0, 6.0, 6.0, 5.0, 2.0, 3.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-17.375, -16.8536376953125, -16.332275390625, -15.8109130859375, -15.28955078125, -14.7681884765625, -14.246826171875, -13.7254638671875, -13.2041015625, -12.6827392578125, -12.161376953125, -11.6400146484375, -11.11865234375, -10.5972900390625, -10.075927734375, -9.5545654296875, -9.033203125, -8.5118408203125, -7.990478515625, -7.4691162109375, -6.94775390625, -6.4263916015625, -5.905029296875, -5.3836669921875, -4.8623046875, -4.3409423828125, -3.819580078125, -3.2982177734375, -2.77685546875, -2.2554931640625, -1.734130859375, -1.2127685546875, -0.69140625, -0.1700439453125, 0.351318359375, 0.8726806640625, 1.39404296875, 1.9154052734375, 2.436767578125, 2.9581298828125, 3.4794921875, 4.0008544921875, 4.522216796875, 5.0435791015625, 5.56494140625, 6.0863037109375, 6.607666015625, 7.1290283203125, 7.650390625, 8.1717529296875, 8.693115234375, 9.2144775390625, 9.73583984375, 10.2572021484375, 10.778564453125, 11.2999267578125, 11.8212890625, 12.3426513671875, 12.864013671875, 13.3853759765625, 13.90673828125, 14.4281005859375, 14.949462890625, 15.4708251953125, 15.9921875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 6.0, 19.0, 32.0, 31.0, 65.0, 70.0, 109.0, 194.0, 340.0, 624.0, 1255.0, 2595.0, 6423.0, 16487.0, 50088.0, 171337.0, 433786.0, 253564.0, 72920.0, 23358.0, 8468.0, 3366.0, 1535.0, 787.0, 427.0, 254.0, 128.0, 90.0, 54.0, 42.0, 27.0, 18.0, 9.0, 13.0, 5.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6484375, -9.333740234375, -9.01904296875, -8.704345703125, -8.3896484375, -8.074951171875, -7.76025390625, -7.445556640625, -7.130859375, -6.816162109375, -6.50146484375, -6.186767578125, -5.8720703125, -5.557373046875, -5.24267578125, -4.927978515625, -4.61328125, -4.298583984375, -3.98388671875, -3.669189453125, -3.3544921875, -3.039794921875, -2.72509765625, -2.410400390625, -2.095703125, -1.781005859375, -1.46630859375, -1.151611328125, -0.8369140625, -0.522216796875, -0.20751953125, 0.107177734375, 0.421875, 0.736572265625, 1.05126953125, 1.365966796875, 1.6806640625, 1.995361328125, 2.31005859375, 2.624755859375, 2.939453125, 3.254150390625, 3.56884765625, 3.883544921875, 4.1982421875, 4.512939453125, 4.82763671875, 5.142333984375, 5.45703125, 5.771728515625, 6.08642578125, 6.401123046875, 6.7158203125, 7.030517578125, 7.34521484375, 7.659912109375, 7.974609375, 8.289306640625, 8.60400390625, 8.918701171875, 9.2333984375, 9.548095703125, 9.86279296875, 10.177490234375, 10.4921875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 5.0, 0.0, 3.0, 5.0, 5.0, 8.0, 6.0, 16.0, 15.0, 17.0, 23.0, 22.0, 35.0, 55.0, 47.0, 72.0, 105.0, 113.0, 106.0, 75.0, 57.0, 35.0, 37.0, 30.0, 28.0, 17.0, 11.0, 19.0, 11.0, 9.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0018749237060546875, -0.001817077398300171, -0.0017592310905456543, -0.0017013847827911377, -0.001643538475036621, -0.0015856921672821045, -0.0015278458595275879, -0.0014699995517730713, -0.0014121532440185547, -0.001354306936264038, -0.0012964606285095215, -0.0012386143207550049, -0.0011807680130004883, -0.0011229217052459717, -0.001065075397491455, -0.0010072290897369385, -0.0009493827819824219, -0.0008915364742279053, -0.0008336901664733887, -0.0007758438587188721, -0.0007179975509643555, -0.0006601512432098389, -0.0006023049354553223, -0.0005444586277008057, -0.00048661231994628906, -0.00042876601219177246, -0.00037091970443725586, -0.00031307339668273926, -0.00025522708892822266, -0.00019738078117370605, -0.00013953447341918945, -8.168816566467285e-05, -2.384185791015625e-05, 3.400444984436035e-05, 9.185075759887695e-05, 0.00014969706535339355, 0.00020754337310791016, 0.00026538968086242676, 0.00032323598861694336, 0.00038108229637145996, 0.00043892860412597656, 0.0004967749118804932, 0.0005546212196350098, 0.0006124675273895264, 0.000670313835144043, 0.0007281601428985596, 0.0007860064506530762, 0.0008438527584075928, 0.0009016990661621094, 0.000959545373916626, 0.0010173916816711426, 0.0010752379894256592, 0.0011330842971801758, 0.0011909306049346924, 0.001248776912689209, 0.0013066232204437256, 0.0013644695281982422, 0.0014223158359527588, 0.0014801621437072754, 0.001538008451461792, 0.0015958547592163086, 0.0016537010669708252, 0.0017115473747253418, 0.0017693936824798584, 0.001827239990234375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 7.0, 7.0, 9.0, 31.0, 30.0, 38.0, 48.0, 83.0, 105.0, 181.0, 292.0, 500.0, 834.0, 1727.0, 3463.0, 7993.0, 19435.0, 54214.0, 177292.0, 439013.0, 231809.0, 69406.0, 23779.0, 9611.0, 4200.0, 2007.0, 1010.0, 506.0, 305.0, 201.0, 122.0, 83.0, 56.0, 43.0, 35.0, 25.0, 9.0, 14.0, 9.0, 4.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.9296875, -8.6175537109375, -8.305419921875, -7.9932861328125, -7.68115234375, -7.3690185546875, -7.056884765625, -6.7447509765625, -6.4326171875, -6.1204833984375, -5.808349609375, -5.4962158203125, -5.18408203125, -4.8719482421875, -4.559814453125, -4.2476806640625, -3.935546875, -3.6234130859375, -3.311279296875, -2.9991455078125, -2.68701171875, -2.3748779296875, -2.062744140625, -1.7506103515625, -1.4384765625, -1.1263427734375, -0.814208984375, -0.5020751953125, -0.18994140625, 0.1221923828125, 0.434326171875, 0.7464599609375, 1.05859375, 1.3707275390625, 1.682861328125, 1.9949951171875, 2.30712890625, 2.6192626953125, 2.931396484375, 3.2435302734375, 3.5556640625, 3.8677978515625, 4.179931640625, 4.4920654296875, 4.80419921875, 5.1163330078125, 5.428466796875, 5.7406005859375, 6.052734375, 6.3648681640625, 6.677001953125, 6.9891357421875, 7.30126953125, 7.6134033203125, 7.925537109375, 8.2376708984375, 8.5498046875, 8.8619384765625, 9.174072265625, 9.4862060546875, 9.79833984375, 10.1104736328125, 10.422607421875, 10.7347412109375, 11.046875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 5.0, 5.0, 2.0, 6.0, 10.0, 9.0, 12.0, 9.0, 24.0, 24.0, 25.0, 29.0, 38.0, 51.0, 62.0, 75.0, 81.0, 89.0, 77.0, 59.0, 68.0, 57.0, 43.0, 31.0, 28.0, 17.0, 17.0, 8.0, 8.0, 6.0, 5.0, 7.0, 5.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.515625, -9.27423095703125, -9.0328369140625, -8.79144287109375, -8.550048828125, -8.30865478515625, -8.0672607421875, -7.82586669921875, -7.58447265625, -7.34307861328125, -7.1016845703125, -6.86029052734375, -6.618896484375, -6.37750244140625, -6.1361083984375, -5.89471435546875, -5.6533203125, -5.41192626953125, -5.1705322265625, -4.92913818359375, -4.687744140625, -4.44635009765625, -4.2049560546875, -3.96356201171875, -3.72216796875, -3.48077392578125, -3.2393798828125, -2.99798583984375, -2.756591796875, -2.51519775390625, -2.2738037109375, -2.03240966796875, -1.791015625, -1.54962158203125, -1.3082275390625, -1.06683349609375, -0.825439453125, -0.58404541015625, -0.3426513671875, -0.10125732421875, 0.14013671875, 0.38153076171875, 0.6229248046875, 0.86431884765625, 1.105712890625, 1.34710693359375, 1.5885009765625, 1.82989501953125, 2.0712890625, 2.31268310546875, 2.5540771484375, 2.79547119140625, 3.036865234375, 3.27825927734375, 3.5196533203125, 3.76104736328125, 4.00244140625, 4.24383544921875, 4.4852294921875, 4.72662353515625, 4.968017578125, 5.20941162109375, 5.4508056640625, 5.69219970703125, 5.93359375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 4.0, 13.0, 21.0, 30.0, 49.0, 63.0, 87.0, 113.0, 138.0, 127.0, 104.0, 81.0, 50.0, 43.0, 25.0, 19.0, 9.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.12112426757812, -109.714111328125, -105.30709838867188, -100.90008544921875, -96.49308013916016, -92.08606719970703, -87.6790542602539, -83.27204132080078, -78.86503601074219, -74.45802307128906, -70.05101013183594, -65.64399719238281, -61.23699188232422, -56.829978942871094, -52.42296600341797, -48.015953063964844, -43.60894012451172, -39.201927185058594, -34.794918060302734, -30.38790512084961, -25.980894088745117, -21.573883056640625, -17.1668701171875, -12.759859085083008, -8.352848052978516, -3.9458365440368652, 0.46117496490478516, 4.868186950683594, 9.275197982788086, 13.682209014892578, 18.089221954345703, 22.496232986450195, 26.903244018554688, 31.31025505065918, 35.71726608276367, 40.1242790222168, 44.531288146972656, 48.93830108642578, 53.345314025878906, 57.75232696533203, 62.15933609008789, 66.56634521484375, 70.97335815429688, 75.38037109375, 79.78738403320312, 84.19439697265625, 88.60140991210938, 93.00841522216797, 97.4154281616211, 101.82244110107422, 106.22945404052734, 110.63645935058594, 115.04347229003906, 119.45048522949219, 123.85749816894531, 128.26451110839844, 132.67152404785156, 137.0785369873047, 141.4855499267578, 145.89256286621094, 150.29957580566406, 154.70657348632812, 159.11358642578125, 163.52059936523438, 167.9276123046875]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 7.0, 5.0, 11.0, 17.0, 10.0, 15.0, 15.0, 17.0, 30.0, 33.0, 40.0, 38.0, 45.0, 54.0, 44.0, 41.0, 44.0, 60.0, 53.0, 51.0, 44.0, 51.0, 43.0, 43.0, 36.0, 27.0, 25.0, 13.0, 18.0, 13.0, 10.0, 10.0, 13.0, 10.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-116.56708526611328, -113.34964752197266, -110.1322021484375, -106.91476440429688, -103.69732666015625, -100.4798812866211, -97.26244354248047, -94.04499816894531, -90.82756042480469, -87.61012268066406, -84.3926773071289, -81.17523956298828, -77.95779418945312, -74.7403564453125, -71.52291870117188, -68.30548095703125, -65.0880355834961, -61.8705940246582, -58.65315246582031, -55.43571472167969, -52.2182731628418, -49.000831604003906, -45.78339385986328, -42.56595230102539, -39.3485107421875, -36.13106918334961, -32.91362762451172, -29.696189880371094, -26.478748321533203, -23.261306762695312, -20.043867111206055, -16.826427459716797, -13.608978271484375, -10.3915376663208, -7.174097061157227, -3.9566564559936523, -0.7392158508300781, 2.4782257080078125, 5.69566535949707, 8.913105010986328, 12.130546569824219, 15.347987174987793, 18.565427780151367, 21.782867431640625, 25.000308990478516, 28.217750549316406, 31.435190200805664, 34.65262985229492, 37.87007141113281, 41.0875129699707, 44.304954528808594, 47.52239227294922, 50.73983383178711, 53.957275390625, 57.174713134765625, 60.392154693603516, 63.609596252441406, 66.82703399658203, 70.04447937011719, 73.26191711425781, 76.47935485839844, 79.6968002319336, 82.91423797607422, 86.13168334960938, 89.34912109375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 8.0, 7.0, 8.0, 18.0, 21.0, 40.0, 58.0, 81.0, 138.0, 260.0, 427.0, 672.0, 1216.0, 2315.0, 4706.0, 10185.0, 24422.0, 70483.0, 314369.0, 3382206.0, 276153.0, 65190.0, 22602.0, 9239.0, 4501.0, 2078.0, 1182.0, 638.0, 390.0, 233.0, 152.0, 101.0, 60.0, 33.0, 29.0, 24.0, 15.0, 10.0, 4.0, 7.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.890625, -17.2392578125, -16.587890625, -15.9365234375, -15.28515625, -14.6337890625, -13.982421875, -13.3310546875, -12.6796875, -12.0283203125, -11.376953125, -10.7255859375, -10.07421875, -9.4228515625, -8.771484375, -8.1201171875, -7.46875, -6.8173828125, -6.166015625, -5.5146484375, -4.86328125, -4.2119140625, -3.560546875, -2.9091796875, -2.2578125, -1.6064453125, -0.955078125, -0.3037109375, 0.34765625, 0.9990234375, 1.650390625, 2.3017578125, 2.953125, 3.6044921875, 4.255859375, 4.9072265625, 5.55859375, 6.2099609375, 6.861328125, 7.5126953125, 8.1640625, 8.8154296875, 9.466796875, 10.1181640625, 10.76953125, 11.4208984375, 12.072265625, 12.7236328125, 13.375, 14.0263671875, 14.677734375, 15.3291015625, 15.98046875, 16.6318359375, 17.283203125, 17.9345703125, 18.5859375, 19.2373046875, 19.888671875, 20.5400390625, 21.19140625, 21.8427734375, 22.494140625, 23.1455078125, 23.796875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 6.0, 3.0, 11.0, 4.0, 12.0, 11.0, 9.0, 18.0, 20.0, 25.0, 27.0, 24.0, 27.0, 46.0, 29.0, 39.0, 43.0, 37.0, 60.0, 56.0, 51.0, 55.0, 38.0, 43.0, 40.0, 36.0, 33.0, 32.0, 25.0, 29.0, 21.0, 15.0, 6.0, 12.0, 15.0, 11.0, 7.0, 10.0, 6.0, 4.0, 1.0, 2.0, 0.0, 5.0, 1.0, 2.0, 2.0, 2.0], "bins": [-3.21484375, -3.1253662109375, -3.035888671875, -2.9464111328125, -2.85693359375, -2.7674560546875, -2.677978515625, -2.5885009765625, -2.4990234375, -2.4095458984375, -2.320068359375, -2.2305908203125, -2.14111328125, -2.0516357421875, -1.962158203125, -1.8726806640625, -1.783203125, -1.6937255859375, -1.604248046875, -1.5147705078125, -1.42529296875, -1.3358154296875, -1.246337890625, -1.1568603515625, -1.0673828125, -0.9779052734375, -0.888427734375, -0.7989501953125, -0.70947265625, -0.6199951171875, -0.530517578125, -0.4410400390625, -0.3515625, -0.2620849609375, -0.172607421875, -0.0831298828125, 0.00634765625, 0.0958251953125, 0.185302734375, 0.2747802734375, 0.3642578125, 0.4537353515625, 0.543212890625, 0.6326904296875, 0.72216796875, 0.8116455078125, 0.901123046875, 0.9906005859375, 1.080078125, 1.1695556640625, 1.259033203125, 1.3485107421875, 1.43798828125, 1.5274658203125, 1.616943359375, 1.7064208984375, 1.7958984375, 1.8853759765625, 1.974853515625, 2.0643310546875, 2.15380859375, 2.2432861328125, 2.332763671875, 2.4222412109375, 2.51171875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 13.0, 18.0, 26.0, 51.0, 78.0, 107.0, 172.0, 307.0, 528.0, 1022.0, 1752.0, 3497.0, 7677.0, 19279.0, 54618.0, 202193.0, 2701593.0, 991022.0, 142108.0, 41154.0, 14732.0, 6095.0, 2816.0, 1412.0, 832.0, 432.0, 293.0, 160.0, 99.0, 65.0, 40.0, 30.0, 18.0, 15.0, 7.0, 5.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.125, -22.399658203125, -21.67431640625, -20.948974609375, -20.2236328125, -19.498291015625, -18.77294921875, -18.047607421875, -17.322265625, -16.596923828125, -15.87158203125, -15.146240234375, -14.4208984375, -13.695556640625, -12.97021484375, -12.244873046875, -11.51953125, -10.794189453125, -10.06884765625, -9.343505859375, -8.6181640625, -7.892822265625, -7.16748046875, -6.442138671875, -5.716796875, -4.991455078125, -4.26611328125, -3.540771484375, -2.8154296875, -2.090087890625, -1.36474609375, -0.639404296875, 0.0859375, 0.811279296875, 1.53662109375, 2.261962890625, 2.9873046875, 3.712646484375, 4.43798828125, 5.163330078125, 5.888671875, 6.614013671875, 7.33935546875, 8.064697265625, 8.7900390625, 9.515380859375, 10.24072265625, 10.966064453125, 11.69140625, 12.416748046875, 13.14208984375, 13.867431640625, 14.5927734375, 15.318115234375, 16.04345703125, 16.768798828125, 17.494140625, 18.219482421875, 18.94482421875, 19.670166015625, 20.3955078125, 21.120849609375, 21.84619140625, 22.571533203125, 23.296875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 5.0, 5.0, 5.0, 7.0, 18.0, 28.0, 16.0, 30.0, 41.0, 59.0, 85.0, 114.0, 203.0, 379.0, 1385.0, 849.0, 293.0, 173.0, 111.0, 57.0, 56.0, 38.0, 32.0, 17.0, 16.0, 9.0, 9.0, 6.0, 4.0, 4.0, 4.0, 5.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.80859375, -6.5882568359375, -6.367919921875, -6.1475830078125, -5.92724609375, -5.7069091796875, -5.486572265625, -5.2662353515625, -5.0458984375, -4.8255615234375, -4.605224609375, -4.3848876953125, -4.16455078125, -3.9442138671875, -3.723876953125, -3.5035400390625, -3.283203125, -3.0628662109375, -2.842529296875, -2.6221923828125, -2.40185546875, -2.1815185546875, -1.961181640625, -1.7408447265625, -1.5205078125, -1.3001708984375, -1.079833984375, -0.8594970703125, -0.63916015625, -0.4188232421875, -0.198486328125, 0.0218505859375, 0.2421875, 0.4625244140625, 0.682861328125, 0.9031982421875, 1.12353515625, 1.3438720703125, 1.564208984375, 1.7845458984375, 2.0048828125, 2.2252197265625, 2.445556640625, 2.6658935546875, 2.88623046875, 3.1065673828125, 3.326904296875, 3.5472412109375, 3.767578125, 3.9879150390625, 4.208251953125, 4.4285888671875, 4.64892578125, 4.8692626953125, 5.089599609375, 5.3099365234375, 5.5302734375, 5.7506103515625, 5.970947265625, 6.1912841796875, 6.41162109375, 6.6319580078125, 6.852294921875, 7.0726318359375, 7.29296875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 11.0, 23.0, 41.0, 84.0, 179.0, 198.0, 209.0, 130.0, 59.0, 32.0, 24.0, 11.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.11735916137695, -38.554901123046875, -35.9924430847168, -33.42998504638672, -30.867528915405273, -28.305070877075195, -25.74261474609375, -23.180156707763672, -20.617698669433594, -18.055240631103516, -15.492783546447754, -12.930326461791992, -10.367868423461914, -7.805410385131836, -5.242953300476074, -2.6804962158203125, -0.11803817749023438, 2.4444193840026855, 5.0068769454956055, 7.569334506988525, 10.131792068481445, 12.694250106811523, 15.256707191467285, 17.819164276123047, 20.381622314453125, 22.944080352783203, 25.50653839111328, 28.068994522094727, 30.631452560424805, 33.19390869140625, 35.75636672973633, 38.318824768066406, 40.88128662109375, 43.44374465942383, 46.006202697753906, 48.568660736083984, 51.13111877441406, 53.693572998046875, 56.25603103637695, 58.81848907470703, 61.38094711303711, 63.94340515136719, 66.505859375, 69.06832122802734, 71.63077545166016, 74.1932373046875, 76.75569152832031, 79.31814575195312, 81.88060760498047, 84.44306182861328, 87.00552368164062, 89.56797790527344, 92.13043975830078, 94.6928939819336, 97.25535583496094, 99.81781005859375, 102.38026428222656, 104.94271850585938, 107.50518035888672, 110.06763458251953, 112.63009643554688, 115.19255065917969, 117.75501251220703, 120.31746673583984, 122.87992858886719]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 6.0, 5.0, 8.0, 6.0, 13.0, 7.0, 11.0, 11.0, 17.0, 20.0, 14.0, 20.0, 28.0, 33.0, 30.0, 36.0, 40.0, 36.0, 43.0, 46.0, 39.0, 34.0, 35.0, 37.0, 47.0, 38.0, 40.0, 28.0, 34.0, 23.0, 29.0, 32.0, 31.0, 26.0, 27.0, 10.0, 17.0, 9.0, 7.0, 8.0, 9.0, 4.0, 3.0, 3.0, 6.0, 2.0, 0.0, 2.0], "bins": [-27.335079193115234, -26.576263427734375, -25.81744956970215, -25.05863380432129, -24.299819946289062, -23.541004180908203, -22.782188415527344, -22.023374557495117, -21.26456069946289, -20.50574493408203, -19.746931076049805, -18.988115310668945, -18.22930145263672, -17.47048568725586, -16.711669921875, -15.952856063842773, -15.194040298461914, -14.435225486755371, -13.676410675048828, -12.917594909667969, -12.158781051635742, -11.399965286254883, -10.64115047454834, -9.882335662841797, -9.123520851135254, -8.364706039428711, -7.605891227722168, -6.847075939178467, -6.088261127471924, -5.329446315765381, -4.57063102722168, -3.8118162155151367, -3.0530033111572266, -2.2941884994506836, -1.5353734493255615, -0.7765583992004395, -0.017743587493896484, 0.7410712242126465, 1.4998865127563477, 2.2587013244628906, 3.0175161361694336, 3.7763309478759766, 4.5351457595825195, 5.293961048126221, 6.052775859832764, 6.811590671539307, 7.570405960083008, 8.32922077178955, 9.088035583496094, 9.846850395202637, 10.60566520690918, 11.364480972290039, 12.123294830322266, 12.882110595703125, 13.640925407409668, 14.399740219116211, 15.158555030822754, 15.917369842529297, 16.676185607910156, 17.434999465942383, 18.193815231323242, 18.95262908935547, 19.711444854736328, 20.470260620117188, 21.229074478149414]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 9.0, 26.0, 23.0, 48.0, 70.0, 111.0, 193.0, 288.0, 540.0, 981.0, 1735.0, 3196.0, 6317.0, 11818.0, 23517.0, 47105.0, 93881.0, 182018.0, 268114.0, 197726.0, 104813.0, 52145.0, 25933.0, 13123.0, 6745.0, 3639.0, 1920.0, 1065.0, 608.0, 342.0, 183.0, 102.0, 80.0, 52.0, 21.0, 16.0, 12.0, 15.0, 5.0, 7.0, 2.0, 1.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8203125, -12.4010009765625, -11.981689453125, -11.5623779296875, -11.14306640625, -10.7237548828125, -10.304443359375, -9.8851318359375, -9.4658203125, -9.0465087890625, -8.627197265625, -8.2078857421875, -7.78857421875, -7.3692626953125, -6.949951171875, -6.5306396484375, -6.111328125, -5.6920166015625, -5.272705078125, -4.8533935546875, -4.43408203125, -4.0147705078125, -3.595458984375, -3.1761474609375, -2.7568359375, -2.3375244140625, -1.918212890625, -1.4989013671875, -1.07958984375, -0.6602783203125, -0.240966796875, 0.1783447265625, 0.59765625, 1.0169677734375, 1.436279296875, 1.8555908203125, 2.27490234375, 2.6942138671875, 3.113525390625, 3.5328369140625, 3.9521484375, 4.3714599609375, 4.790771484375, 5.2100830078125, 5.62939453125, 6.0487060546875, 6.468017578125, 6.8873291015625, 7.306640625, 7.7259521484375, 8.145263671875, 8.5645751953125, 8.98388671875, 9.4031982421875, 9.822509765625, 10.2418212890625, 10.6611328125, 11.0804443359375, 11.499755859375, 11.9190673828125, 12.33837890625, 12.7576904296875, 13.177001953125, 13.5963134765625, 14.015625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 7.0, 2.0, 8.0, 10.0, 10.0, 12.0, 12.0, 15.0, 18.0, 23.0, 36.0, 35.0, 39.0, 30.0, 43.0, 57.0, 35.0, 40.0, 57.0, 53.0, 43.0, 38.0, 42.0, 53.0, 26.0, 38.0, 36.0, 33.0, 26.0, 21.0, 21.0, 17.0, 7.0, 22.0, 10.0, 8.0, 3.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.220703125, -3.124359130859375, -3.02801513671875, -2.931671142578125, -2.8353271484375, -2.738983154296875, -2.64263916015625, -2.546295166015625, -2.449951171875, -2.353607177734375, -2.25726318359375, -2.160919189453125, -2.0645751953125, -1.968231201171875, -1.87188720703125, -1.775543212890625, -1.67919921875, -1.582855224609375, -1.48651123046875, -1.390167236328125, -1.2938232421875, -1.197479248046875, -1.10113525390625, -1.004791259765625, -0.908447265625, -0.812103271484375, -0.71575927734375, -0.619415283203125, -0.5230712890625, -0.426727294921875, -0.33038330078125, -0.234039306640625, -0.1376953125, -0.041351318359375, 0.05499267578125, 0.151336669921875, 0.2476806640625, 0.344024658203125, 0.44036865234375, 0.536712646484375, 0.633056640625, 0.729400634765625, 0.82574462890625, 0.922088623046875, 1.0184326171875, 1.114776611328125, 1.21112060546875, 1.307464599609375, 1.40380859375, 1.500152587890625, 1.59649658203125, 1.692840576171875, 1.7891845703125, 1.885528564453125, 1.98187255859375, 2.078216552734375, 2.174560546875, 2.270904541015625, 2.36724853515625, 2.463592529296875, 2.5599365234375, 2.656280517578125, 2.75262451171875, 2.848968505859375, 2.9453125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 9.0, 8.0, 16.0, 17.0, 24.0, 41.0, 63.0, 92.0, 164.0, 265.0, 362.0, 769.0, 1561.0, 3824.0, 11697.0, 41443.0, 154354.0, 452539.0, 275190.0, 74851.0, 20159.0, 6301.0, 2366.0, 1070.0, 554.0, 300.0, 191.0, 106.0, 77.0, 50.0, 29.0, 14.0, 10.0, 18.0, 11.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.890625, -22.191162109375, -21.49169921875, -20.792236328125, -20.0927734375, -19.393310546875, -18.69384765625, -17.994384765625, -17.294921875, -16.595458984375, -15.89599609375, -15.196533203125, -14.4970703125, -13.797607421875, -13.09814453125, -12.398681640625, -11.69921875, -10.999755859375, -10.30029296875, -9.600830078125, -8.9013671875, -8.201904296875, -7.50244140625, -6.802978515625, -6.103515625, -5.404052734375, -4.70458984375, -4.005126953125, -3.3056640625, -2.606201171875, -1.90673828125, -1.207275390625, -0.5078125, 0.191650390625, 0.89111328125, 1.590576171875, 2.2900390625, 2.989501953125, 3.68896484375, 4.388427734375, 5.087890625, 5.787353515625, 6.48681640625, 7.186279296875, 7.8857421875, 8.585205078125, 9.28466796875, 9.984130859375, 10.68359375, 11.383056640625, 12.08251953125, 12.781982421875, 13.4814453125, 14.180908203125, 14.88037109375, 15.579833984375, 16.279296875, 16.978759765625, 17.67822265625, 18.377685546875, 19.0771484375, 19.776611328125, 20.47607421875, 21.175537109375, 21.875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 8.0, 1.0, 9.0, 8.0, 12.0, 8.0, 10.0, 19.0, 14.0, 26.0, 17.0, 30.0, 28.0, 42.0, 29.0, 38.0, 42.0, 34.0, 45.0, 46.0, 42.0, 38.0, 44.0, 35.0, 46.0, 49.0, 42.0, 33.0, 28.0, 27.0, 26.0, 18.0, 26.0, 19.0, 12.0, 7.0, 10.0, 7.0, 7.0, 7.0, 1.0, 8.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.109375, -14.67626953125, -14.2431640625, -13.81005859375, -13.376953125, -12.94384765625, -12.5107421875, -12.07763671875, -11.64453125, -11.21142578125, -10.7783203125, -10.34521484375, -9.912109375, -9.47900390625, -9.0458984375, -8.61279296875, -8.1796875, -7.74658203125, -7.3134765625, -6.88037109375, -6.447265625, -6.01416015625, -5.5810546875, -5.14794921875, -4.71484375, -4.28173828125, -3.8486328125, -3.41552734375, -2.982421875, -2.54931640625, -2.1162109375, -1.68310546875, -1.25, -0.81689453125, -0.3837890625, 0.04931640625, 0.482421875, 0.91552734375, 1.3486328125, 1.78173828125, 2.21484375, 2.64794921875, 3.0810546875, 3.51416015625, 3.947265625, 4.38037109375, 4.8134765625, 5.24658203125, 5.6796875, 6.11279296875, 6.5458984375, 6.97900390625, 7.412109375, 7.84521484375, 8.2783203125, 8.71142578125, 9.14453125, 9.57763671875, 10.0107421875, 10.44384765625, 10.876953125, 11.31005859375, 11.7431640625, 12.17626953125, 12.609375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 6.0, 7.0, 7.0, 12.0, 19.0, 24.0, 31.0, 52.0, 85.0, 150.0, 281.0, 461.0, 969.0, 2024.0, 4563.0, 12155.0, 37800.0, 152340.0, 484974.0, 261238.0, 61958.0, 17687.0, 6318.0, 2617.0, 1290.0, 625.0, 337.0, 193.0, 123.0, 81.0, 49.0, 27.0, 21.0, 11.0, 4.0, 5.0, 6.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.0625, -11.7147216796875, -11.366943359375, -11.0191650390625, -10.67138671875, -10.3236083984375, -9.975830078125, -9.6280517578125, -9.2802734375, -8.9324951171875, -8.584716796875, -8.2369384765625, -7.88916015625, -7.5413818359375, -7.193603515625, -6.8458251953125, -6.498046875, -6.1502685546875, -5.802490234375, -5.4547119140625, -5.10693359375, -4.7591552734375, -4.411376953125, -4.0635986328125, -3.7158203125, -3.3680419921875, -3.020263671875, -2.6724853515625, -2.32470703125, -1.9769287109375, -1.629150390625, -1.2813720703125, -0.93359375, -0.5858154296875, -0.238037109375, 0.1097412109375, 0.45751953125, 0.8052978515625, 1.153076171875, 1.5008544921875, 1.8486328125, 2.1964111328125, 2.544189453125, 2.8919677734375, 3.23974609375, 3.5875244140625, 3.935302734375, 4.2830810546875, 4.630859375, 4.9786376953125, 5.326416015625, 5.6741943359375, 6.02197265625, 6.3697509765625, 6.717529296875, 7.0653076171875, 7.4130859375, 7.7608642578125, 8.108642578125, 8.4564208984375, 8.80419921875, 9.1519775390625, 9.499755859375, 9.8475341796875, 10.1953125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 9.0, 8.0, 10.0, 9.0, 21.0, 35.0, 50.0, 61.0, 73.0, 141.0, 185.0, 117.0, 72.0, 53.0, 28.0, 36.0, 24.0, 16.0, 15.0, 7.0, 8.0, 3.0, 5.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002399444580078125, -0.0023117363452911377, -0.0022240281105041504, -0.002136319875717163, -0.0020486116409301758, -0.0019609034061431885, -0.0018731951713562012, -0.0017854869365692139, -0.0016977787017822266, -0.0016100704669952393, -0.001522362232208252, -0.0014346539974212646, -0.0013469457626342773, -0.00125923752784729, -0.0011715292930603027, -0.0010838210582733154, -0.0009961128234863281, -0.0009084045886993408, -0.0008206963539123535, -0.0007329881191253662, -0.0006452798843383789, -0.0005575716495513916, -0.0004698634147644043, -0.000382155179977417, -0.0002944469451904297, -0.00020673871040344238, -0.00011903047561645508, -3.1322240829467773e-05, 5.638599395751953e-05, 0.00014409422874450684, 0.00023180246353149414, 0.00031951069831848145, 0.00040721893310546875, 0.0004949271678924561, 0.0005826354026794434, 0.0006703436374664307, 0.000758051872253418, 0.0008457601070404053, 0.0009334683418273926, 0.0010211765766143799, 0.0011088848114013672, 0.0011965930461883545, 0.0012843012809753418, 0.001372009515762329, 0.0014597177505493164, 0.0015474259853363037, 0.001635134220123291, 0.0017228424549102783, 0.0018105506896972656, 0.001898258924484253, 0.0019859671592712402, 0.0020736753940582275, 0.002161383628845215, 0.002249091863632202, 0.0023368000984191895, 0.0024245083332061768, 0.002512216567993164, 0.0025999248027801514, 0.0026876330375671387, 0.002775341272354126, 0.0028630495071411133, 0.0029507577419281006, 0.003038465976715088, 0.003126174211502075, 0.0032138824462890625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 6.0, 5.0, 14.0, 12.0, 23.0, 42.0, 41.0, 63.0, 128.0, 189.0, 384.0, 673.0, 1405.0, 2841.0, 6964.0, 20270.0, 76767.0, 370725.0, 436077.0, 93816.0, 23759.0, 7916.0, 3218.0, 1507.0, 754.0, 351.0, 211.0, 134.0, 90.0, 52.0, 34.0, 27.0, 16.0, 15.0, 11.0, 2.0, 8.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.96875, -12.5765380859375, -12.184326171875, -11.7921142578125, -11.39990234375, -11.0076904296875, -10.615478515625, -10.2232666015625, -9.8310546875, -9.4388427734375, -9.046630859375, -8.6544189453125, -8.26220703125, -7.8699951171875, -7.477783203125, -7.0855712890625, -6.693359375, -6.3011474609375, -5.908935546875, -5.5167236328125, -5.12451171875, -4.7322998046875, -4.340087890625, -3.9478759765625, -3.5556640625, -3.1634521484375, -2.771240234375, -2.3790283203125, -1.98681640625, -1.5946044921875, -1.202392578125, -0.8101806640625, -0.41796875, -0.0257568359375, 0.366455078125, 0.7586669921875, 1.15087890625, 1.5430908203125, 1.935302734375, 2.3275146484375, 2.7197265625, 3.1119384765625, 3.504150390625, 3.8963623046875, 4.28857421875, 4.6807861328125, 5.072998046875, 5.4652099609375, 5.857421875, 6.2496337890625, 6.641845703125, 7.0340576171875, 7.42626953125, 7.8184814453125, 8.210693359375, 8.6029052734375, 8.9951171875, 9.3873291015625, 9.779541015625, 10.1717529296875, 10.56396484375, 10.9561767578125, 11.348388671875, 11.7406005859375, 12.1328125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 7.0, 4.0, 6.0, 6.0, 9.0, 13.0, 27.0, 25.0, 47.0, 38.0, 53.0, 66.0, 98.0, 111.0, 87.0, 78.0, 79.0, 55.0, 44.0, 40.0, 20.0, 21.0, 18.0, 4.0, 6.0, 12.0, 9.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-9.7734375, -9.5003662109375, -9.227294921875, -8.9542236328125, -8.68115234375, -8.4080810546875, -8.135009765625, -7.8619384765625, -7.5888671875, -7.3157958984375, -7.042724609375, -6.7696533203125, -6.49658203125, -6.2235107421875, -5.950439453125, -5.6773681640625, -5.404296875, -5.1312255859375, -4.858154296875, -4.5850830078125, -4.31201171875, -4.0389404296875, -3.765869140625, -3.4927978515625, -3.2197265625, -2.9466552734375, -2.673583984375, -2.4005126953125, -2.12744140625, -1.8543701171875, -1.581298828125, -1.3082275390625, -1.03515625, -0.7620849609375, -0.489013671875, -0.2159423828125, 0.05712890625, 0.3302001953125, 0.603271484375, 0.8763427734375, 1.1494140625, 1.4224853515625, 1.695556640625, 1.9686279296875, 2.24169921875, 2.5147705078125, 2.787841796875, 3.0609130859375, 3.333984375, 3.6070556640625, 3.880126953125, 4.1531982421875, 4.42626953125, 4.6993408203125, 4.972412109375, 5.2454833984375, 5.5185546875, 5.7916259765625, 6.064697265625, 6.3377685546875, 6.61083984375, 6.8839111328125, 7.156982421875, 7.4300537109375, 7.703125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 9.0, 31.0, 36.0, 52.0, 71.0, 101.0, 108.0, 125.0, 128.0, 102.0, 76.0, 58.0, 28.0, 19.0, 17.0, 13.0, 10.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.25979614257812, -118.14527893066406, -114.03075408935547, -109.91622924804688, -105.80171203613281, -101.68719482421875, -97.57266998291016, -93.45814514160156, -89.3436279296875, -85.22911071777344, -81.11458587646484, -77.00006103515625, -72.88554382324219, -68.77102661132812, -64.65650177001953, -60.5419807434082, -56.427459716796875, -52.31293869018555, -48.19841766357422, -44.08389663696289, -39.96937561035156, -35.854854583740234, -31.740333557128906, -27.625812530517578, -23.51129150390625, -19.396770477294922, -15.282249450683594, -11.167728424072266, -7.0532073974609375, -2.9386863708496094, 1.1758346557617188, 5.290355682373047, 9.404861450195312, 13.51938247680664, 17.63390350341797, 21.748424530029297, 25.862945556640625, 29.977466583251953, 34.09198760986328, 38.20650863647461, 42.32102966308594, 46.435550689697266, 50.550071716308594, 54.66459274291992, 58.77911376953125, 62.89363479614258, 67.0081558227539, 71.1226806640625, 75.23719787597656, 79.35171508789062, 83.46623992919922, 87.58076477050781, 91.69528198242188, 95.80979919433594, 99.92432403564453, 104.03884887695312, 108.15336608886719, 112.26788330078125, 116.38240814208984, 120.49693298339844, 124.6114501953125, 128.72596740722656, 132.84048461914062, 136.95501708984375, 141.0695343017578]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 6.0, 9.0, 15.0, 10.0, 17.0, 9.0, 19.0, 17.0, 22.0, 14.0, 28.0, 31.0, 35.0, 35.0, 42.0, 48.0, 48.0, 33.0, 39.0, 46.0, 41.0, 40.0, 36.0, 36.0, 32.0, 36.0, 41.0, 35.0, 35.0, 15.0, 18.0, 13.0, 21.0, 13.0, 14.0, 13.0, 8.0, 5.0, 6.0, 8.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-70.58682250976562, -68.28035736083984, -65.97389221191406, -63.66742706298828, -61.3609619140625, -59.05449676513672, -56.74803161621094, -54.441566467285156, -52.135101318359375, -49.828636169433594, -47.52217102050781, -45.21570587158203, -42.90924072265625, -40.60277557373047, -38.29631042480469, -35.989845275878906, -33.683380126953125, -31.376914978027344, -29.070449829101562, -26.76398468017578, -24.45751953125, -22.15105438232422, -19.844589233398438, -17.538124084472656, -15.231658935546875, -12.925193786621094, -10.618728637695312, -8.312263488769531, -6.00579833984375, -3.6993331909179688, -1.3928680419921875, 0.9135971069335938, 3.220062255859375, 5.526527404785156, 7.8329925537109375, 10.139457702636719, 12.4459228515625, 14.752388000488281, 17.058853149414062, 19.365318298339844, 21.671783447265625, 23.978248596191406, 26.284713745117188, 28.59117889404297, 30.89764404296875, 33.20410919189453, 35.51057434082031, 37.817039489746094, 40.123504638671875, 42.429969787597656, 44.73643493652344, 47.04290008544922, 49.349365234375, 51.65583038330078, 53.96229553222656, 56.268760681152344, 58.575225830078125, 60.881690979003906, 63.18815612792969, 65.49462127685547, 67.80108642578125, 70.10755157470703, 72.41401672363281, 74.7204818725586, 77.02694702148438]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 9.0, 10.0, 16.0, 26.0, 40.0, 94.0, 133.0, 242.0, 478.0, 947.0, 1924.0, 4829.0, 11601.0, 31725.0, 99929.0, 459119.0, 3116531.0, 342070.0, 81025.0, 26222.0, 9637.0, 4027.0, 1787.0, 869.0, 443.0, 208.0, 143.0, 78.0, 47.0, 28.0, 16.0, 21.0, 6.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.546875, -21.891845703125, -21.23681640625, -20.581787109375, -19.9267578125, -19.271728515625, -18.61669921875, -17.961669921875, -17.306640625, -16.651611328125, -15.99658203125, -15.341552734375, -14.6865234375, -14.031494140625, -13.37646484375, -12.721435546875, -12.06640625, -11.411376953125, -10.75634765625, -10.101318359375, -9.4462890625, -8.791259765625, -8.13623046875, -7.481201171875, -6.826171875, -6.171142578125, -5.51611328125, -4.861083984375, -4.2060546875, -3.551025390625, -2.89599609375, -2.240966796875, -1.5859375, -0.930908203125, -0.27587890625, 0.379150390625, 1.0341796875, 1.689208984375, 2.34423828125, 2.999267578125, 3.654296875, 4.309326171875, 4.96435546875, 5.619384765625, 6.2744140625, 6.929443359375, 7.58447265625, 8.239501953125, 8.89453125, 9.549560546875, 10.20458984375, 10.859619140625, 11.5146484375, 12.169677734375, 12.82470703125, 13.479736328125, 14.134765625, 14.789794921875, 15.44482421875, 16.099853515625, 16.7548828125, 17.409912109375, 18.06494140625, 18.719970703125, 19.375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 11.0, 5.0, 16.0, 12.0, 21.0, 14.0, 20.0, 18.0, 18.0, 20.0, 25.0, 37.0, 42.0, 37.0, 42.0, 43.0, 37.0, 35.0, 41.0, 43.0, 52.0, 42.0, 33.0, 42.0, 42.0, 30.0, 30.0, 30.0, 26.0, 17.0, 21.0, 12.0, 14.0, 12.0, 12.0, 8.0, 6.0, 4.0, 5.0, 8.0, 5.0, 6.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.87890625, -2.793609619140625, -2.70831298828125, -2.623016357421875, -2.5377197265625, -2.452423095703125, -2.36712646484375, -2.281829833984375, -2.196533203125, -2.111236572265625, -2.02593994140625, -1.940643310546875, -1.8553466796875, -1.770050048828125, -1.68475341796875, -1.599456787109375, -1.51416015625, -1.428863525390625, -1.34356689453125, -1.258270263671875, -1.1729736328125, -1.087677001953125, -1.00238037109375, -0.917083740234375, -0.831787109375, -0.746490478515625, -0.66119384765625, -0.575897216796875, -0.4906005859375, -0.405303955078125, -0.32000732421875, -0.234710693359375, -0.1494140625, -0.064117431640625, 0.02117919921875, 0.106475830078125, 0.1917724609375, 0.277069091796875, 0.36236572265625, 0.447662353515625, 0.532958984375, 0.618255615234375, 0.70355224609375, 0.788848876953125, 0.8741455078125, 0.959442138671875, 1.04473876953125, 1.130035400390625, 1.21533203125, 1.300628662109375, 1.38592529296875, 1.471221923828125, 1.5565185546875, 1.641815185546875, 1.72711181640625, 1.812408447265625, 1.897705078125, 1.983001708984375, 2.06829833984375, 2.153594970703125, 2.2388916015625, 2.324188232421875, 2.40948486328125, 2.494781494140625, 2.580078125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 13.0, 10.0, 13.0, 18.0, 29.0, 44.0, 53.0, 85.0, 127.0, 210.0, 340.0, 604.0, 1260.0, 2433.0, 5110.0, 11907.0, 28986.0, 81917.0, 280930.0, 2094758.0, 1335884.0, 233331.0, 70664.0, 25638.0, 10447.0, 4604.0, 2219.0, 1179.0, 598.0, 325.0, 193.0, 116.0, 77.0, 42.0, 36.0, 26.0, 12.0, 10.0, 13.0, 7.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.796875, -17.239501953125, -16.68212890625, -16.124755859375, -15.5673828125, -15.010009765625, -14.45263671875, -13.895263671875, -13.337890625, -12.780517578125, -12.22314453125, -11.665771484375, -11.1083984375, -10.551025390625, -9.99365234375, -9.436279296875, -8.87890625, -8.321533203125, -7.76416015625, -7.206787109375, -6.6494140625, -6.092041015625, -5.53466796875, -4.977294921875, -4.419921875, -3.862548828125, -3.30517578125, -2.747802734375, -2.1904296875, -1.633056640625, -1.07568359375, -0.518310546875, 0.0390625, 0.596435546875, 1.15380859375, 1.711181640625, 2.2685546875, 2.825927734375, 3.38330078125, 3.940673828125, 4.498046875, 5.055419921875, 5.61279296875, 6.170166015625, 6.7275390625, 7.284912109375, 7.84228515625, 8.399658203125, 8.95703125, 9.514404296875, 10.07177734375, 10.629150390625, 11.1865234375, 11.743896484375, 12.30126953125, 12.858642578125, 13.416015625, 13.973388671875, 14.53076171875, 15.088134765625, 15.6455078125, 16.202880859375, 16.76025390625, 17.317626953125, 17.875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 4.0, 6.0, 6.0, 7.0, 11.0, 25.0, 24.0, 28.0, 45.0, 42.0, 79.0, 92.0, 115.0, 179.0, 239.0, 412.0, 966.0, 612.0, 365.0, 223.0, 157.0, 105.0, 76.0, 51.0, 49.0, 31.0, 23.0, 22.0, 21.0, 13.0, 12.0, 10.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.078125, -6.8402099609375, -6.602294921875, -6.3643798828125, -6.12646484375, -5.8885498046875, -5.650634765625, -5.4127197265625, -5.1748046875, -4.9368896484375, -4.698974609375, -4.4610595703125, -4.22314453125, -3.9852294921875, -3.747314453125, -3.5093994140625, -3.271484375, -3.0335693359375, -2.795654296875, -2.5577392578125, -2.31982421875, -2.0819091796875, -1.843994140625, -1.6060791015625, -1.3681640625, -1.1302490234375, -0.892333984375, -0.6544189453125, -0.41650390625, -0.1785888671875, 0.059326171875, 0.2972412109375, 0.53515625, 0.7730712890625, 1.010986328125, 1.2489013671875, 1.48681640625, 1.7247314453125, 1.962646484375, 2.2005615234375, 2.4384765625, 2.6763916015625, 2.914306640625, 3.1522216796875, 3.39013671875, 3.6280517578125, 3.865966796875, 4.1038818359375, 4.341796875, 4.5797119140625, 4.817626953125, 5.0555419921875, 5.29345703125, 5.5313720703125, 5.769287109375, 6.0072021484375, 6.2451171875, 6.4830322265625, 6.720947265625, 6.9588623046875, 7.19677734375, 7.4346923828125, 7.672607421875, 7.9105224609375, 8.1484375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 10.0, 12.0, 34.0, 61.0, 77.0, 145.0, 174.0, 152.0, 131.0, 90.0, 44.0, 24.0, 23.0, 12.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.36531066894531, -54.29949951171875, -51.23368453979492, -48.167869567871094, -45.10205841064453, -42.03624725341797, -38.97043228149414, -35.90461730957031, -32.83880615234375, -29.772993087768555, -26.70718002319336, -23.641366958618164, -20.57555389404297, -17.509740829467773, -14.443927764892578, -11.378114700317383, -8.312301635742188, -5.246488571166992, -2.180675506591797, 0.8851375579833984, 3.9509506225585938, 7.016763687133789, 10.082576751708984, 13.14838981628418, 16.214202880859375, 19.28001594543457, 22.345829010009766, 25.41164207458496, 28.477455139160156, 31.54326820373535, 34.60908126831055, 37.674896240234375, 40.74070739746094, 43.8065185546875, 46.87233352661133, 49.938148498535156, 53.00395965576172, 56.06977081298828, 59.13558578491211, 62.20140075683594, 65.2672119140625, 68.33302307128906, 71.39883422851562, 74.46465301513672, 77.53046417236328, 80.59627532958984, 83.66209411621094, 86.7279052734375, 89.79371643066406, 92.85952758789062, 95.92533874511719, 98.99115753173828, 102.05696868896484, 105.1227798461914, 108.1885986328125, 111.25440979003906, 114.32022094726562, 117.38603210449219, 120.45184326171875, 123.51766204833984, 126.5834732055664, 129.6492919921875, 132.71510314941406, 135.78091430664062, 138.8467254638672]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 6.0, 8.0, 7.0, 11.0, 6.0, 13.0, 17.0, 13.0, 23.0, 16.0, 12.0, 34.0, 28.0, 32.0, 25.0, 36.0, 31.0, 28.0, 33.0, 38.0, 37.0, 39.0, 35.0, 39.0, 34.0, 39.0, 30.0, 29.0, 27.0, 38.0, 25.0, 23.0, 28.0, 26.0, 26.0, 13.0, 15.0, 12.0, 10.0, 13.0, 11.0, 9.0, 7.0, 5.0, 3.0, 9.0, 2.0, 6.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.857507705688477, -28.95193099975586, -28.046356201171875, -27.14078140258789, -26.235204696655273, -25.329627990722656, -24.424053192138672, -23.518478393554688, -22.61290168762207, -21.707324981689453, -20.80175018310547, -19.896175384521484, -18.990598678588867, -18.08502197265625, -17.179447174072266, -16.27387237548828, -15.368295669555664, -14.462719917297363, -13.557144165039062, -12.651568412780762, -11.745992660522461, -10.84041690826416, -9.93484115600586, -9.029265403747559, -8.123689651489258, -7.218113899230957, -6.312538146972656, -5.4069623947143555, -4.501386642456055, -3.595810890197754, -2.690235137939453, -1.7846593856811523, -0.8790817260742188, 0.02649402618408203, 0.9320697784423828, 1.8376455307006836, 2.7432212829589844, 3.648797035217285, 4.554372787475586, 5.459948539733887, 6.3655242919921875, 7.271100044250488, 8.176675796508789, 9.08225154876709, 9.98782730102539, 10.893403053283691, 11.798978805541992, 12.704554557800293, 13.610130310058594, 14.515706062316895, 15.421281814575195, 16.326858520507812, 17.232433319091797, 18.13800811767578, 19.0435848236084, 19.949161529541016, 20.854736328125, 21.760311126708984, 22.6658878326416, 23.57146453857422, 24.477039337158203, 25.382614135742188, 26.288190841674805, 27.193767547607422, 28.099342346191406]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 10.0, 7.0, 8.0, 21.0, 27.0, 28.0, 45.0, 104.0, 172.0, 316.0, 664.0, 1453.0, 3569.0, 9208.0, 23927.0, 65817.0, 188892.0, 438502.0, 203520.0, 70129.0, 25854.0, 9497.0, 3770.0, 1586.0, 671.0, 335.0, 177.0, 85.0, 52.0, 40.0, 23.0, 21.0, 9.0, 9.0, 3.0, 5.0, 5.0, 0.0, 1.0, 1.0, 3.0], "bins": [-29.46875, -28.74169921875, -28.0146484375, -27.28759765625, -26.560546875, -25.83349609375, -25.1064453125, -24.37939453125, -23.65234375, -22.92529296875, -22.1982421875, -21.47119140625, -20.744140625, -20.01708984375, -19.2900390625, -18.56298828125, -17.8359375, -17.10888671875, -16.3818359375, -15.65478515625, -14.927734375, -14.20068359375, -13.4736328125, -12.74658203125, -12.01953125, -11.29248046875, -10.5654296875, -9.83837890625, -9.111328125, -8.38427734375, -7.6572265625, -6.93017578125, -6.203125, -5.47607421875, -4.7490234375, -4.02197265625, -3.294921875, -2.56787109375, -1.8408203125, -1.11376953125, -0.38671875, 0.34033203125, 1.0673828125, 1.79443359375, 2.521484375, 3.24853515625, 3.9755859375, 4.70263671875, 5.4296875, 6.15673828125, 6.8837890625, 7.61083984375, 8.337890625, 9.06494140625, 9.7919921875, 10.51904296875, 11.24609375, 11.97314453125, 12.7001953125, 13.42724609375, 14.154296875, 14.88134765625, 15.6083984375, 16.33544921875, 17.0625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 9.0, 4.0, 11.0, 21.0, 16.0, 18.0, 27.0, 17.0, 19.0, 31.0, 27.0, 38.0, 46.0, 44.0, 50.0, 45.0, 37.0, 51.0, 49.0, 54.0, 55.0, 44.0, 34.0, 32.0, 30.0, 27.0, 29.0, 22.0, 21.0, 15.0, 17.0, 16.0, 8.0, 9.0, 7.0, 5.0, 5.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.115234375, -3.01849365234375, -2.9217529296875, -2.82501220703125, -2.728271484375, -2.63153076171875, -2.5347900390625, -2.43804931640625, -2.34130859375, -2.24456787109375, -2.1478271484375, -2.05108642578125, -1.954345703125, -1.85760498046875, -1.7608642578125, -1.66412353515625, -1.5673828125, -1.47064208984375, -1.3739013671875, -1.27716064453125, -1.180419921875, -1.08367919921875, -0.9869384765625, -0.89019775390625, -0.79345703125, -0.69671630859375, -0.5999755859375, -0.50323486328125, -0.406494140625, -0.30975341796875, -0.2130126953125, -0.11627197265625, -0.01953125, 0.07720947265625, 0.1739501953125, 0.27069091796875, 0.367431640625, 0.46417236328125, 0.5609130859375, 0.65765380859375, 0.75439453125, 0.85113525390625, 0.9478759765625, 1.04461669921875, 1.141357421875, 1.23809814453125, 1.3348388671875, 1.43157958984375, 1.5283203125, 1.62506103515625, 1.7218017578125, 1.81854248046875, 1.915283203125, 2.01202392578125, 2.1087646484375, 2.20550537109375, 2.30224609375, 2.39898681640625, 2.4957275390625, 2.59246826171875, 2.689208984375, 2.78594970703125, 2.8826904296875, 2.97943115234375, 3.076171875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 10.0, 10.0, 15.0, 20.0, 26.0, 37.0, 52.0, 85.0, 185.0, 255.0, 437.0, 844.0, 1746.0, 3624.0, 8766.0, 27102.0, 99183.0, 406881.0, 370137.0, 89404.0, 24399.0, 8390.0, 3325.0, 1682.0, 813.0, 431.0, 262.0, 146.0, 103.0, 63.0, 30.0, 27.0, 14.0, 13.0, 7.0, 10.0, 6.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.0, -20.27490234375, -19.5498046875, -18.82470703125, -18.099609375, -17.37451171875, -16.6494140625, -15.92431640625, -15.19921875, -14.47412109375, -13.7490234375, -13.02392578125, -12.298828125, -11.57373046875, -10.8486328125, -10.12353515625, -9.3984375, -8.67333984375, -7.9482421875, -7.22314453125, -6.498046875, -5.77294921875, -5.0478515625, -4.32275390625, -3.59765625, -2.87255859375, -2.1474609375, -1.42236328125, -0.697265625, 0.02783203125, 0.7529296875, 1.47802734375, 2.203125, 2.92822265625, 3.6533203125, 4.37841796875, 5.103515625, 5.82861328125, 6.5537109375, 7.27880859375, 8.00390625, 8.72900390625, 9.4541015625, 10.17919921875, 10.904296875, 11.62939453125, 12.3544921875, 13.07958984375, 13.8046875, 14.52978515625, 15.2548828125, 15.97998046875, 16.705078125, 17.43017578125, 18.1552734375, 18.88037109375, 19.60546875, 20.33056640625, 21.0556640625, 21.78076171875, 22.505859375, 23.23095703125, 23.9560546875, 24.68115234375, 25.40625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 1.0, 3.0, 8.0, 5.0, 11.0, 8.0, 12.0, 7.0, 17.0, 10.0, 24.0, 25.0, 27.0, 37.0, 44.0, 36.0, 42.0, 53.0, 53.0, 51.0, 54.0, 48.0, 44.0, 48.0, 38.0, 42.0, 44.0, 33.0, 23.0, 23.0, 27.0, 20.0, 11.0, 14.0, 18.0, 7.0, 7.0, 10.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.1875, -16.69091796875, -16.1943359375, -15.69775390625, -15.201171875, -14.70458984375, -14.2080078125, -13.71142578125, -13.21484375, -12.71826171875, -12.2216796875, -11.72509765625, -11.228515625, -10.73193359375, -10.2353515625, -9.73876953125, -9.2421875, -8.74560546875, -8.2490234375, -7.75244140625, -7.255859375, -6.75927734375, -6.2626953125, -5.76611328125, -5.26953125, -4.77294921875, -4.2763671875, -3.77978515625, -3.283203125, -2.78662109375, -2.2900390625, -1.79345703125, -1.296875, -0.80029296875, -0.3037109375, 0.19287109375, 0.689453125, 1.18603515625, 1.6826171875, 2.17919921875, 2.67578125, 3.17236328125, 3.6689453125, 4.16552734375, 4.662109375, 5.15869140625, 5.6552734375, 6.15185546875, 6.6484375, 7.14501953125, 7.6416015625, 8.13818359375, 8.634765625, 9.13134765625, 9.6279296875, 10.12451171875, 10.62109375, 11.11767578125, 11.6142578125, 12.11083984375, 12.607421875, 13.10400390625, 13.6005859375, 14.09716796875, 14.59375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 6.0, 3.0, 4.0, 6.0, 7.0, 12.0, 20.0, 26.0, 31.0, 65.0, 104.0, 207.0, 375.0, 800.0, 1700.0, 4040.0, 10715.0, 34493.0, 150490.0, 586109.0, 196210.0, 41933.0, 12602.0, 4753.0, 2001.0, 865.0, 462.0, 223.0, 107.0, 80.0, 42.0, 20.0, 17.0, 9.0, 5.0, 8.0, 5.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-18.796875, -18.282958984375, -17.76904296875, -17.255126953125, -16.7412109375, -16.227294921875, -15.71337890625, -15.199462890625, -14.685546875, -14.171630859375, -13.65771484375, -13.143798828125, -12.6298828125, -12.115966796875, -11.60205078125, -11.088134765625, -10.57421875, -10.060302734375, -9.54638671875, -9.032470703125, -8.5185546875, -8.004638671875, -7.49072265625, -6.976806640625, -6.462890625, -5.948974609375, -5.43505859375, -4.921142578125, -4.4072265625, -3.893310546875, -3.37939453125, -2.865478515625, -2.3515625, -1.837646484375, -1.32373046875, -0.809814453125, -0.2958984375, 0.218017578125, 0.73193359375, 1.245849609375, 1.759765625, 2.273681640625, 2.78759765625, 3.301513671875, 3.8154296875, 4.329345703125, 4.84326171875, 5.357177734375, 5.87109375, 6.385009765625, 6.89892578125, 7.412841796875, 7.9267578125, 8.440673828125, 8.95458984375, 9.468505859375, 9.982421875, 10.496337890625, 11.01025390625, 11.524169921875, 12.0380859375, 12.552001953125, 13.06591796875, 13.579833984375, 14.09375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 0.0, 6.0, 5.0, 9.0, 15.0, 23.0, 36.0, 60.0, 99.0, 224.0, 255.0, 99.0, 69.0, 23.0, 22.0, 20.0, 15.0, 8.0, 2.0, 2.0, 7.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006664276123046875, -0.006501883268356323, -0.0063394904136657715, -0.00617709755897522, -0.006014704704284668, -0.005852311849594116, -0.0056899189949035645, -0.005527526140213013, -0.005365133285522461, -0.005202740430831909, -0.005040347576141357, -0.004877954721450806, -0.004715561866760254, -0.004553169012069702, -0.00439077615737915, -0.004228383302688599, -0.004065990447998047, -0.003903597593307495, -0.0037412047386169434, -0.0035788118839263916, -0.00341641902923584, -0.003254026174545288, -0.0030916333198547363, -0.0029292404651641846, -0.002766847610473633, -0.002604454755783081, -0.0024420619010925293, -0.0022796690464019775, -0.0021172761917114258, -0.001954883337020874, -0.0017924904823303223, -0.0016300976276397705, -0.0014677047729492188, -0.001305311918258667, -0.0011429190635681152, -0.0009805262088775635, -0.0008181333541870117, -0.00065574049949646, -0.0004933476448059082, -0.00033095479011535645, -0.0001685619354248047, -6.16908073425293e-06, 0.00015622377395629883, 0.0003186166286468506, 0.00048100948333740234, 0.0006434023380279541, 0.0008057951927185059, 0.0009681880474090576, 0.0011305809020996094, 0.0012929737567901611, 0.0014553666114807129, 0.0016177594661712646, 0.0017801523208618164, 0.0019425451755523682, 0.00210493803024292, 0.0022673308849334717, 0.0024297237396240234, 0.002592116594314575, 0.002754509449005127, 0.0029169023036956787, 0.0030792951583862305, 0.0032416880130767822, 0.003404080867767334, 0.0035664737224578857, 0.0037288665771484375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 9.0, 13.0, 14.0, 22.0, 19.0, 30.0, 43.0, 72.0, 98.0, 174.0, 271.0, 485.0, 806.0, 1587.0, 3156.0, 6305.0, 14018.0, 34730.0, 105722.0, 406004.0, 335565.0, 85603.0, 29774.0, 12403.0, 5553.0, 2771.0, 1422.0, 711.0, 449.0, 219.0, 169.0, 81.0, 65.0, 49.0, 46.0, 26.0, 20.0, 8.0, 11.0, 6.0, 5.0, 4.0, 3.0, 1.0, 4.0, 3.0, 0.0, 4.0], "bins": [-13.0, -12.6380615234375, -12.276123046875, -11.9141845703125, -11.55224609375, -11.1903076171875, -10.828369140625, -10.4664306640625, -10.1044921875, -9.7425537109375, -9.380615234375, -9.0186767578125, -8.65673828125, -8.2947998046875, -7.932861328125, -7.5709228515625, -7.208984375, -6.8470458984375, -6.485107421875, -6.1231689453125, -5.76123046875, -5.3992919921875, -5.037353515625, -4.6754150390625, -4.3134765625, -3.9515380859375, -3.589599609375, -3.2276611328125, -2.86572265625, -2.5037841796875, -2.141845703125, -1.7799072265625, -1.41796875, -1.0560302734375, -0.694091796875, -0.3321533203125, 0.02978515625, 0.3917236328125, 0.753662109375, 1.1156005859375, 1.4775390625, 1.8394775390625, 2.201416015625, 2.5633544921875, 2.92529296875, 3.2872314453125, 3.649169921875, 4.0111083984375, 4.373046875, 4.7349853515625, 5.096923828125, 5.4588623046875, 5.82080078125, 6.1827392578125, 6.544677734375, 6.9066162109375, 7.2685546875, 7.6304931640625, 7.992431640625, 8.3543701171875, 8.71630859375, 9.0782470703125, 9.440185546875, 9.8021240234375, 10.1640625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 2.0, 4.0, 4.0, 5.0, 6.0, 3.0, 7.0, 10.0, 12.0, 16.0, 21.0, 22.0, 24.0, 25.0, 42.0, 42.0, 88.0, 95.0, 105.0, 82.0, 84.0, 72.0, 59.0, 25.0, 21.0, 23.0, 19.0, 11.0, 8.0, 6.0, 9.0, 10.0, 5.0, 5.0, 6.0, 4.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.85546875, -7.57196044921875, -7.2884521484375, -7.00494384765625, -6.721435546875, -6.43792724609375, -6.1544189453125, -5.87091064453125, -5.58740234375, -5.30389404296875, -5.0203857421875, -4.73687744140625, -4.453369140625, -4.16986083984375, -3.8863525390625, -3.60284423828125, -3.3193359375, -3.03582763671875, -2.7523193359375, -2.46881103515625, -2.185302734375, -1.90179443359375, -1.6182861328125, -1.33477783203125, -1.05126953125, -0.76776123046875, -0.4842529296875, -0.20074462890625, 0.082763671875, 0.36627197265625, 0.6497802734375, 0.93328857421875, 1.216796875, 1.50030517578125, 1.7838134765625, 2.06732177734375, 2.350830078125, 2.63433837890625, 2.9178466796875, 3.20135498046875, 3.48486328125, 3.76837158203125, 4.0518798828125, 4.33538818359375, 4.618896484375, 4.90240478515625, 5.1859130859375, 5.46942138671875, 5.7529296875, 6.03643798828125, 6.3199462890625, 6.60345458984375, 6.886962890625, 7.17047119140625, 7.4539794921875, 7.73748779296875, 8.02099609375, 8.30450439453125, 8.5880126953125, 8.87152099609375, 9.155029296875, 9.43853759765625, 9.7220458984375, 10.00555419921875, 10.2890625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 10.0, 9.0, 14.0, 27.0, 23.0, 30.0, 45.0, 60.0, 65.0, 82.0, 98.0, 96.0, 87.0, 75.0, 81.0, 53.0, 45.0, 28.0, 22.0, 18.0, 12.0, 8.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.95111083984375, -107.02330017089844, -103.09548950195312, -99.16767883300781, -95.2398681640625, -91.31205749511719, -87.3842544555664, -83.4564437866211, -79.52863311767578, -75.60082244873047, -71.67301177978516, -67.74520111083984, -63.8173942565918, -59.889583587646484, -55.96177673339844, -52.033966064453125, -48.10615539550781, -44.1783447265625, -40.25053405761719, -36.32272720336914, -32.39491653442383, -28.467105865478516, -24.539297103881836, -20.611488342285156, -16.683677673339844, -12.755867958068848, -8.828058242797852, -4.9002485275268555, -0.9724388122558594, 2.955371856689453, 6.883180618286133, 10.810989379882812, 14.738800048828125, 18.666610717773438, 22.594419479370117, 26.522228240966797, 30.45003890991211, 34.37784957885742, 38.30565643310547, 42.23346710205078, 46.161277770996094, 50.089088439941406, 54.01689910888672, 57.944705963134766, 61.87251663208008, 65.80032348632812, 69.72813415527344, 73.65594482421875, 77.58375549316406, 81.51156616210938, 85.43937683105469, 89.3671875, 93.29499816894531, 97.22280883789062, 101.1506118774414, 105.07842254638672, 109.00623321533203, 112.93404388427734, 116.86185455322266, 120.78966522216797, 124.71746826171875, 128.64527893066406, 132.57308959960938, 136.5009002685547, 140.4287109375]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 3.0, 7.0, 9.0, 8.0, 8.0, 6.0, 13.0, 13.0, 22.0, 13.0, 21.0, 23.0, 26.0, 24.0, 27.0, 28.0, 36.0, 48.0, 37.0, 37.0, 36.0, 38.0, 38.0, 33.0, 43.0, 32.0, 27.0, 35.0, 28.0, 18.0, 26.0, 39.0, 20.0, 17.0, 26.0, 15.0, 17.0, 20.0, 7.0, 16.0, 9.0, 6.0, 7.0, 9.0, 6.0, 7.0, 5.0, 2.0, 4.0, 6.0, 0.0, 1.0, 1.0, 2.0], "bins": [-78.81031799316406, -76.43183135986328, -74.0533447265625, -71.67485809326172, -69.29637145996094, -66.91789245605469, -64.5394058227539, -62.160919189453125, -59.782432556152344, -57.40394592285156, -55.02545928955078, -52.646976470947266, -50.268489837646484, -47.8900032043457, -45.51152038574219, -43.133033752441406, -40.754547119140625, -38.376060485839844, -35.99757385253906, -33.61909103393555, -31.240604400634766, -28.862117767333984, -26.483633041381836, -24.105148315429688, -21.726661682128906, -19.348175048828125, -16.969690322875977, -14.591204643249512, -12.212718963623047, -9.834233283996582, -7.455747604370117, -5.077262878417969, -2.6987838745117188, -0.3202981948852539, 2.058187484741211, 4.436673164367676, 6.815158843994141, 9.193644523620605, 11.57213020324707, 13.950614929199219, 16.3291015625, 18.70758819580078, 21.08607292175293, 23.464557647705078, 25.84304428100586, 28.22153091430664, 30.60001564025879, 32.97850036621094, 35.35698699951172, 37.7354736328125, 40.11396026611328, 42.4924430847168, 44.87092971801758, 47.24941635131836, 49.627899169921875, 52.006385803222656, 54.38487243652344, 56.76335906982422, 59.141845703125, 61.520328521728516, 63.8988151550293, 66.27729797363281, 68.6557846069336, 71.03427124023438, 73.41275787353516]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 7.0, 12.0, 21.0, 28.0, 49.0, 65.0, 136.0, 238.0, 432.0, 902.0, 2051.0, 4623.0, 11854.0, 34741.0, 125666.0, 1302435.0, 2506817.0, 143446.0, 38562.0, 13057.0, 5039.0, 2079.0, 955.0, 445.0, 257.0, 151.0, 83.0, 51.0, 33.0, 18.0, 14.0, 3.0, 6.0, 6.0, 2.0, 4.0, 2.0, 0.0, 3.0], "bins": [-30.0, -29.26904296875, -28.5380859375, -27.80712890625, -27.076171875, -26.34521484375, -25.6142578125, -24.88330078125, -24.15234375, -23.42138671875, -22.6904296875, -21.95947265625, -21.228515625, -20.49755859375, -19.7666015625, -19.03564453125, -18.3046875, -17.57373046875, -16.8427734375, -16.11181640625, -15.380859375, -14.64990234375, -13.9189453125, -13.18798828125, -12.45703125, -11.72607421875, -10.9951171875, -10.26416015625, -9.533203125, -8.80224609375, -8.0712890625, -7.34033203125, -6.609375, -5.87841796875, -5.1474609375, -4.41650390625, -3.685546875, -2.95458984375, -2.2236328125, -1.49267578125, -0.76171875, -0.03076171875, 0.7001953125, 1.43115234375, 2.162109375, 2.89306640625, 3.6240234375, 4.35498046875, 5.0859375, 5.81689453125, 6.5478515625, 7.27880859375, 8.009765625, 8.74072265625, 9.4716796875, 10.20263671875, 10.93359375, 11.66455078125, 12.3955078125, 13.12646484375, 13.857421875, 14.58837890625, 15.3193359375, 16.05029296875, 16.78125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 9.0, 9.0, 7.0, 12.0, 14.0, 15.0, 17.0, 17.0, 17.0, 22.0, 21.0, 17.0, 43.0, 37.0, 21.0, 41.0, 45.0, 45.0, 41.0, 41.0, 44.0, 43.0, 39.0, 41.0, 41.0, 44.0, 31.0, 31.0, 32.0, 27.0, 24.0, 10.0, 15.0, 23.0, 18.0, 7.0, 8.0, 10.0, 11.0, 6.0, 3.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2109375, -3.10711669921875, -3.0032958984375, -2.89947509765625, -2.795654296875, -2.69183349609375, -2.5880126953125, -2.48419189453125, -2.38037109375, -2.27655029296875, -2.1727294921875, -2.06890869140625, -1.965087890625, -1.86126708984375, -1.7574462890625, -1.65362548828125, -1.5498046875, -1.44598388671875, -1.3421630859375, -1.23834228515625, -1.134521484375, -1.03070068359375, -0.9268798828125, -0.82305908203125, -0.71923828125, -0.61541748046875, -0.5115966796875, -0.40777587890625, -0.303955078125, -0.20013427734375, -0.0963134765625, 0.00750732421875, 0.111328125, 0.21514892578125, 0.3189697265625, 0.42279052734375, 0.526611328125, 0.63043212890625, 0.7342529296875, 0.83807373046875, 0.94189453125, 1.04571533203125, 1.1495361328125, 1.25335693359375, 1.357177734375, 1.46099853515625, 1.5648193359375, 1.66864013671875, 1.7724609375, 1.87628173828125, 1.9801025390625, 2.08392333984375, 2.187744140625, 2.29156494140625, 2.3953857421875, 2.49920654296875, 2.60302734375, 2.70684814453125, 2.8106689453125, 2.91448974609375, 3.018310546875, 3.12213134765625, 3.2259521484375, 3.32977294921875, 3.43359375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 1.0, 7.0, 14.0, 15.0, 22.0, 31.0, 43.0, 68.0, 98.0, 149.0, 259.0, 427.0, 744.0, 1233.0, 2214.0, 4290.0, 8684.0, 19251.0, 48349.0, 149153.0, 809484.0, 2738231.0, 279888.0, 77355.0, 29097.0, 12361.0, 5882.0, 2997.0, 1623.0, 977.0, 491.0, 288.0, 208.0, 111.0, 95.0, 49.0, 32.0, 25.0, 15.0, 9.0, 9.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.875, -18.181640625, -17.48828125, -16.794921875, -16.1015625, -15.408203125, -14.71484375, -14.021484375, -13.328125, -12.634765625, -11.94140625, -11.248046875, -10.5546875, -9.861328125, -9.16796875, -8.474609375, -7.78125, -7.087890625, -6.39453125, -5.701171875, -5.0078125, -4.314453125, -3.62109375, -2.927734375, -2.234375, -1.541015625, -0.84765625, -0.154296875, 0.5390625, 1.232421875, 1.92578125, 2.619140625, 3.3125, 4.005859375, 4.69921875, 5.392578125, 6.0859375, 6.779296875, 7.47265625, 8.166015625, 8.859375, 9.552734375, 10.24609375, 10.939453125, 11.6328125, 12.326171875, 13.01953125, 13.712890625, 14.40625, 15.099609375, 15.79296875, 16.486328125, 17.1796875, 17.873046875, 18.56640625, 19.259765625, 19.953125, 20.646484375, 21.33984375, 22.033203125, 22.7265625, 23.419921875, 24.11328125, 24.806640625, 25.5]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 0.0, 2.0, 2.0, 6.0, 2.0, 7.0, 8.0, 9.0, 11.0, 9.0, 20.0, 20.0, 33.0, 41.0, 78.0, 105.0, 164.0, 254.0, 507.0, 1339.0, 618.0, 254.0, 175.0, 121.0, 71.0, 51.0, 37.0, 29.0, 25.0, 22.0, 11.0, 11.0, 10.0, 2.0, 7.0, 6.0, 4.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.1953125, -8.894775390625, -8.59423828125, -8.293701171875, -7.9931640625, -7.692626953125, -7.39208984375, -7.091552734375, -6.791015625, -6.490478515625, -6.18994140625, -5.889404296875, -5.5888671875, -5.288330078125, -4.98779296875, -4.687255859375, -4.38671875, -4.086181640625, -3.78564453125, -3.485107421875, -3.1845703125, -2.884033203125, -2.58349609375, -2.282958984375, -1.982421875, -1.681884765625, -1.38134765625, -1.080810546875, -0.7802734375, -0.479736328125, -0.17919921875, 0.121337890625, 0.421875, 0.722412109375, 1.02294921875, 1.323486328125, 1.6240234375, 1.924560546875, 2.22509765625, 2.525634765625, 2.826171875, 3.126708984375, 3.42724609375, 3.727783203125, 4.0283203125, 4.328857421875, 4.62939453125, 4.929931640625, 5.23046875, 5.531005859375, 5.83154296875, 6.132080078125, 6.4326171875, 6.733154296875, 7.03369140625, 7.334228515625, 7.634765625, 7.935302734375, 8.23583984375, 8.536376953125, 8.8369140625, 9.137451171875, 9.43798828125, 9.738525390625, 10.0390625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 7.0, 5.0, 18.0, 20.0, 25.0, 35.0, 53.0, 66.0, 90.0, 97.0, 102.0, 88.0, 93.0, 78.0, 60.0, 45.0, 33.0, 22.0, 19.0, 16.0, 7.0, 6.0, 3.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.43256378173828, -33.533267974853516, -31.63397216796875, -29.734676361083984, -27.83538055419922, -25.936084747314453, -24.03679084777832, -22.137495040893555, -20.23819923400879, -18.338903427124023, -16.439607620239258, -14.540312767028809, -12.641016960144043, -10.741721153259277, -8.842426300048828, -6.9431304931640625, -5.043834686279297, -3.1445391178131104, -1.2452435493469238, 0.6540517807006836, 2.553347587585449, 4.452643394470215, 6.351938247680664, 8.25123405456543, 10.150529861450195, 12.049825668334961, 13.949121475219727, 15.848416328430176, 17.747711181640625, 19.64700698852539, 21.546302795410156, 23.445598602294922, 25.344894409179688, 27.244190216064453, 29.14348602294922, 31.042781829833984, 32.94207763671875, 34.841373443603516, 36.74066925048828, 38.63996124267578, 40.53926086425781, 42.43855667114258, 44.337852478027344, 46.23714828491211, 48.136444091796875, 50.03573989868164, 51.935035705566406, 53.834327697753906, 55.73362350463867, 57.63291931152344, 59.5322151184082, 61.43151092529297, 63.330806732177734, 65.2301025390625, 67.12939453125, 69.02869415283203, 70.92798614501953, 72.82727813720703, 74.72657775878906, 76.62586975097656, 78.5251693725586, 80.4244613647461, 82.32376098632812, 84.22305297851562, 86.12235260009766]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 7.0, 5.0, 4.0, 11.0, 8.0, 12.0, 14.0, 12.0, 15.0, 26.0, 19.0, 28.0, 30.0, 32.0, 40.0, 38.0, 58.0, 57.0, 53.0, 45.0, 55.0, 49.0, 52.0, 55.0, 30.0, 31.0, 27.0, 33.0, 22.0, 24.0, 21.0, 15.0, 19.0, 10.0, 17.0, 9.0, 8.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.38115692138672, -42.113739013671875, -40.846317291259766, -39.578895568847656, -38.31147766113281, -37.04405975341797, -35.77663803100586, -34.50921630859375, -33.241798400878906, -31.97437858581543, -30.706958770751953, -29.439538955688477, -28.172119140625, -26.904699325561523, -25.637279510498047, -24.36985969543457, -23.102439880371094, -21.835020065307617, -20.56760025024414, -19.300180435180664, -18.032760620117188, -16.76534080505371, -15.497920989990234, -14.230501174926758, -12.963081359863281, -11.695661544799805, -10.428241729736328, -9.160821914672852, -7.893402099609375, -6.625982284545898, -5.358562469482422, -4.091142654418945, -2.8237228393554688, -1.5563030242919922, -0.2888832092285156, 0.9785366058349609, 2.2459564208984375, 3.513376235961914, 4.780796051025391, 6.048215866088867, 7.315635681152344, 8.58305549621582, 9.850475311279297, 11.117895126342773, 12.38531494140625, 13.652734756469727, 14.920154571533203, 16.18757438659668, 17.454994201660156, 18.722414016723633, 19.98983383178711, 21.257253646850586, 22.524673461914062, 23.79209327697754, 25.059513092041016, 26.326932907104492, 27.59435272216797, 28.861772537231445, 30.129192352294922, 31.3966121673584, 32.664031982421875, 33.93144989013672, 35.19887161254883, 36.46629333496094, 37.73371124267578]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 7.0, 2.0, 7.0, 10.0, 9.0, 24.0, 44.0, 59.0, 69.0, 192.0, 253.0, 525.0, 943.0, 1768.0, 3455.0, 6918.0, 13927.0, 27859.0, 56319.0, 110090.0, 219459.0, 286067.0, 158881.0, 80202.0, 40948.0, 20256.0, 9837.0, 4957.0, 2564.0, 1288.0, 691.0, 408.0, 206.0, 135.0, 68.0, 42.0, 32.0, 17.0, 9.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.265625, -19.74951171875, -19.2333984375, -18.71728515625, -18.201171875, -17.68505859375, -17.1689453125, -16.65283203125, -16.13671875, -15.62060546875, -15.1044921875, -14.58837890625, -14.072265625, -13.55615234375, -13.0400390625, -12.52392578125, -12.0078125, -11.49169921875, -10.9755859375, -10.45947265625, -9.943359375, -9.42724609375, -8.9111328125, -8.39501953125, -7.87890625, -7.36279296875, -6.8466796875, -6.33056640625, -5.814453125, -5.29833984375, -4.7822265625, -4.26611328125, -3.75, -3.23388671875, -2.7177734375, -2.20166015625, -1.685546875, -1.16943359375, -0.6533203125, -0.13720703125, 0.37890625, 0.89501953125, 1.4111328125, 1.92724609375, 2.443359375, 2.95947265625, 3.4755859375, 3.99169921875, 4.5078125, 5.02392578125, 5.5400390625, 6.05615234375, 6.572265625, 7.08837890625, 7.6044921875, 8.12060546875, 8.63671875, 9.15283203125, 9.6689453125, 10.18505859375, 10.701171875, 11.21728515625, 11.7333984375, 12.24951171875, 12.765625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 4.0, 10.0, 11.0, 12.0, 13.0, 10.0, 18.0, 14.0, 28.0, 24.0, 23.0, 31.0, 32.0, 36.0, 29.0, 31.0, 32.0, 49.0, 56.0, 41.0, 52.0, 49.0, 38.0, 43.0, 47.0, 44.0, 33.0, 29.0, 20.0, 23.0, 17.0, 13.0, 23.0, 8.0, 10.0, 7.0, 14.0, 11.0, 4.0, 4.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.927734375, -2.817718505859375, -2.70770263671875, -2.597686767578125, -2.4876708984375, -2.377655029296875, -2.26763916015625, -2.157623291015625, -2.047607421875, -1.937591552734375, -1.82757568359375, -1.717559814453125, -1.6075439453125, -1.497528076171875, -1.38751220703125, -1.277496337890625, -1.16748046875, -1.057464599609375, -0.94744873046875, -0.837432861328125, -0.7274169921875, -0.617401123046875, -0.50738525390625, -0.397369384765625, -0.287353515625, -0.177337646484375, -0.06732177734375, 0.042694091796875, 0.1527099609375, 0.262725830078125, 0.37274169921875, 0.482757568359375, 0.5927734375, 0.702789306640625, 0.81280517578125, 0.922821044921875, 1.0328369140625, 1.142852783203125, 1.25286865234375, 1.362884521484375, 1.472900390625, 1.582916259765625, 1.69293212890625, 1.802947998046875, 1.9129638671875, 2.022979736328125, 2.13299560546875, 2.243011474609375, 2.35302734375, 2.463043212890625, 2.57305908203125, 2.683074951171875, 2.7930908203125, 2.903106689453125, 3.01312255859375, 3.123138427734375, 3.233154296875, 3.343170166015625, 3.45318603515625, 3.563201904296875, 3.6732177734375, 3.783233642578125, 3.89324951171875, 4.003265380859375, 4.11328125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 6.0, 4.0, 10.0, 11.0, 13.0, 13.0, 25.0, 44.0, 38.0, 62.0, 73.0, 122.0, 158.0, 252.0, 340.0, 546.0, 973.0, 1995.0, 4598.0, 11510.0, 33709.0, 99698.0, 307232.0, 387146.0, 129684.0, 44190.0, 15013.0, 5690.0, 2367.0, 1125.0, 645.0, 386.0, 256.0, 172.0, 135.0, 93.0, 47.0, 49.0, 39.0, 17.0, 17.0, 21.0, 9.0, 10.0, 5.0, 3.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.65625, -18.015625, -17.375, -16.734375, -16.09375, -15.453125, -14.8125, -14.171875, -13.53125, -12.890625, -12.25, -11.609375, -10.96875, -10.328125, -9.6875, -9.046875, -8.40625, -7.765625, -7.125, -6.484375, -5.84375, -5.203125, -4.5625, -3.921875, -3.28125, -2.640625, -2.0, -1.359375, -0.71875, -0.078125, 0.5625, 1.203125, 1.84375, 2.484375, 3.125, 3.765625, 4.40625, 5.046875, 5.6875, 6.328125, 6.96875, 7.609375, 8.25, 8.890625, 9.53125, 10.171875, 10.8125, 11.453125, 12.09375, 12.734375, 13.375, 14.015625, 14.65625, 15.296875, 15.9375, 16.578125, 17.21875, 17.859375, 18.5, 19.140625, 19.78125, 20.421875, 21.0625, 21.703125, 22.34375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 4.0, 11.0, 10.0, 8.0, 14.0, 14.0, 19.0, 21.0, 34.0, 31.0, 22.0, 43.0, 47.0, 43.0, 49.0, 53.0, 58.0, 44.0, 52.0, 52.0, 58.0, 44.0, 36.0, 42.0, 38.0, 28.0, 25.0, 23.0, 16.0, 14.0, 10.0, 10.0, 5.0, 2.0, 4.0, 3.0, 3.0, 3.0, 4.0, 1.0, 3.0], "bins": [-23.765625, -23.1746826171875, -22.583740234375, -21.9927978515625, -21.40185546875, -20.8109130859375, -20.219970703125, -19.6290283203125, -19.0380859375, -18.4471435546875, -17.856201171875, -17.2652587890625, -16.67431640625, -16.0833740234375, -15.492431640625, -14.9014892578125, -14.310546875, -13.7196044921875, -13.128662109375, -12.5377197265625, -11.94677734375, -11.3558349609375, -10.764892578125, -10.1739501953125, -9.5830078125, -8.9920654296875, -8.401123046875, -7.8101806640625, -7.21923828125, -6.6282958984375, -6.037353515625, -5.4464111328125, -4.85546875, -4.2645263671875, -3.673583984375, -3.0826416015625, -2.49169921875, -1.9007568359375, -1.309814453125, -0.7188720703125, -0.1279296875, 0.4630126953125, 1.053955078125, 1.6448974609375, 2.23583984375, 2.8267822265625, 3.417724609375, 4.0086669921875, 4.599609375, 5.1905517578125, 5.781494140625, 6.3724365234375, 6.96337890625, 7.5543212890625, 8.145263671875, 8.7362060546875, 9.3271484375, 9.9180908203125, 10.509033203125, 11.0999755859375, 11.69091796875, 12.2818603515625, 12.872802734375, 13.4637451171875, 14.0546875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 1.0, 5.0, 4.0, 4.0, 15.0, 12.0, 36.0, 49.0, 77.0, 114.0, 229.0, 466.0, 1049.0, 2864.0, 8508.0, 30912.0, 136170.0, 623329.0, 188316.0, 39952.0, 10720.0, 3323.0, 1287.0, 497.0, 255.0, 133.0, 76.0, 47.0, 40.0, 18.0, 20.0, 5.0, 8.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.234375, -21.626708984375, -21.01904296875, -20.411376953125, -19.8037109375, -19.196044921875, -18.58837890625, -17.980712890625, -17.373046875, -16.765380859375, -16.15771484375, -15.550048828125, -14.9423828125, -14.334716796875, -13.72705078125, -13.119384765625, -12.51171875, -11.904052734375, -11.29638671875, -10.688720703125, -10.0810546875, -9.473388671875, -8.86572265625, -8.258056640625, -7.650390625, -7.042724609375, -6.43505859375, -5.827392578125, -5.2197265625, -4.612060546875, -4.00439453125, -3.396728515625, -2.7890625, -2.181396484375, -1.57373046875, -0.966064453125, -0.3583984375, 0.249267578125, 0.85693359375, 1.464599609375, 2.072265625, 2.679931640625, 3.28759765625, 3.895263671875, 4.5029296875, 5.110595703125, 5.71826171875, 6.325927734375, 6.93359375, 7.541259765625, 8.14892578125, 8.756591796875, 9.3642578125, 9.971923828125, 10.57958984375, 11.187255859375, 11.794921875, 12.402587890625, 13.01025390625, 13.617919921875, 14.2255859375, 14.833251953125, 15.44091796875, 16.048583984375, 16.65625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 3.0, 8.0, 14.0, 18.0, 26.0, 23.0, 39.0, 52.0, 106.0, 233.0, 219.0, 91.0, 50.0, 31.0, 24.0, 18.0, 9.0, 14.0, 5.0, 8.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0059356689453125, -0.0057656168937683105, -0.005595564842224121, -0.005425512790679932, -0.005255460739135742, -0.005085408687591553, -0.004915356636047363, -0.004745304584503174, -0.004575252532958984, -0.004405200481414795, -0.0042351484298706055, -0.004065096378326416, -0.0038950443267822266, -0.003724992275238037, -0.0035549402236938477, -0.003384888172149658, -0.0032148361206054688, -0.0030447840690612793, -0.00287473201751709, -0.0027046799659729004, -0.002534627914428711, -0.0023645758628845215, -0.002194523811340332, -0.0020244717597961426, -0.0018544197082519531, -0.0016843676567077637, -0.0015143156051635742, -0.0013442635536193848, -0.0011742115020751953, -0.0010041594505310059, -0.0008341073989868164, -0.000664055347442627, -0.0004940032958984375, -0.00032395124435424805, -0.0001538991928100586, 1.615285873413086e-05, 0.0001862049102783203, 0.00035625696182250977, 0.0005263090133666992, 0.0006963610649108887, 0.0008664131164550781, 0.0010364651679992676, 0.001206517219543457, 0.0013765692710876465, 0.001546621322631836, 0.0017166733741760254, 0.0018867254257202148, 0.0020567774772644043, 0.0022268295288085938, 0.002396881580352783, 0.0025669336318969727, 0.002736985683441162, 0.0029070377349853516, 0.003077089786529541, 0.0032471418380737305, 0.00341719388961792, 0.0035872459411621094, 0.003757297992706299, 0.003927350044250488, 0.004097402095794678, 0.004267454147338867, 0.004437506198883057, 0.004607558250427246, 0.0047776103019714355, 0.004947662353515625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 8.0, 6.0, 7.0, 8.0, 14.0, 30.0, 45.0, 50.0, 137.0, 203.0, 522.0, 1410.0, 5865.0, 34327.0, 452348.0, 507606.0, 37182.0, 6164.0, 1525.0, 527.0, 243.0, 126.0, 85.0, 34.0, 33.0, 16.0, 9.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.171875, -23.242919921875, -22.31396484375, -21.385009765625, -20.4560546875, -19.527099609375, -18.59814453125, -17.669189453125, -16.740234375, -15.811279296875, -14.88232421875, -13.953369140625, -13.0244140625, -12.095458984375, -11.16650390625, -10.237548828125, -9.30859375, -8.379638671875, -7.45068359375, -6.521728515625, -5.5927734375, -4.663818359375, -3.73486328125, -2.805908203125, -1.876953125, -0.947998046875, -0.01904296875, 0.909912109375, 1.8388671875, 2.767822265625, 3.69677734375, 4.625732421875, 5.5546875, 6.483642578125, 7.41259765625, 8.341552734375, 9.2705078125, 10.199462890625, 11.12841796875, 12.057373046875, 12.986328125, 13.915283203125, 14.84423828125, 15.773193359375, 16.7021484375, 17.631103515625, 18.56005859375, 19.489013671875, 20.41796875, 21.346923828125, 22.27587890625, 23.204833984375, 24.1337890625, 25.062744140625, 25.99169921875, 26.920654296875, 27.849609375, 28.778564453125, 29.70751953125, 30.636474609375, 31.5654296875, 32.494384765625, 33.42333984375, 34.352294921875, 35.28125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 2.0, 4.0, 6.0, 13.0, 10.0, 24.0, 21.0, 45.0, 70.0, 105.0, 154.0, 155.0, 132.0, 84.0, 57.0, 41.0, 21.0, 18.0, 16.0, 12.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.34375, -12.79443359375, -12.2451171875, -11.69580078125, -11.146484375, -10.59716796875, -10.0478515625, -9.49853515625, -8.94921875, -8.39990234375, -7.8505859375, -7.30126953125, -6.751953125, -6.20263671875, -5.6533203125, -5.10400390625, -4.5546875, -4.00537109375, -3.4560546875, -2.90673828125, -2.357421875, -1.80810546875, -1.2587890625, -0.70947265625, -0.16015625, 0.38916015625, 0.9384765625, 1.48779296875, 2.037109375, 2.58642578125, 3.1357421875, 3.68505859375, 4.234375, 4.78369140625, 5.3330078125, 5.88232421875, 6.431640625, 6.98095703125, 7.5302734375, 8.07958984375, 8.62890625, 9.17822265625, 9.7275390625, 10.27685546875, 10.826171875, 11.37548828125, 11.9248046875, 12.47412109375, 13.0234375, 13.57275390625, 14.1220703125, 14.67138671875, 15.220703125, 15.77001953125, 16.3193359375, 16.86865234375, 17.41796875, 17.96728515625, 18.5166015625, 19.06591796875, 19.615234375, 20.16455078125, 20.7138671875, 21.26318359375, 21.8125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 12.0, 34.0, 59.0, 118.0, 171.0, 194.0, 197.0, 108.0, 52.0, 30.0, 15.0, 7.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.4147491455078, -151.77200317382812, -143.1292724609375, -134.4865264892578, -125.84378051757812, -117.20103454589844, -108.55829620361328, -99.91555786132812, -91.27281188964844, -82.63006591796875, -73.9873275756836, -65.34458923339844, -56.70184326171875, -48.05910110473633, -39.416358947753906, -30.773616790771484, -22.130874633789062, -13.48813247680664, -4.845390319824219, 3.797351837158203, 12.440093994140625, 21.082836151123047, 29.72557830810547, 38.36832046508789, 47.01106262207031, 55.653804779052734, 64.29654693603516, 72.93928527832031, 81.58203125, 90.22477722167969, 98.86751556396484, 107.51025390625, 116.15301513671875, 124.79576110839844, 133.43850708007812, 142.08123779296875, 150.72398376464844, 159.36672973632812, 168.00946044921875, 176.65220642089844, 185.29495239257812, 193.9376983642578, 202.5804443359375, 211.22317504882812, 219.8659210205078, 228.5086669921875, 237.15139770507812, 245.7941436767578, 254.4368896484375, 263.0796203613281, 271.7223815917969, 280.3651123046875, 289.00787353515625, 297.6506042480469, 306.2933349609375, 314.93609619140625, 323.5788269042969, 332.2215576171875, 340.86431884765625, 349.5070495605469, 358.1497802734375, 366.79254150390625, 375.4352722167969, 384.0780334472656, 392.72076416015625]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 6.0, 1.0, 3.0, 4.0, 4.0, 11.0, 8.0, 10.0, 11.0, 20.0, 26.0, 12.0, 21.0, 25.0, 22.0, 26.0, 24.0, 32.0, 30.0, 46.0, 42.0, 45.0, 37.0, 41.0, 50.0, 39.0, 37.0, 42.0, 29.0, 35.0, 40.0, 36.0, 19.0, 15.0, 24.0, 22.0, 27.0, 13.0, 15.0, 9.0, 9.0, 7.0, 4.0, 5.0, 5.0, 3.0, 7.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-75.94683837890625, -73.39485168457031, -70.8428726196289, -68.29088592529297, -65.73890686035156, -63.186920166015625, -60.63493728637695, -58.08295440673828, -55.53097152709961, -52.97898864746094, -50.427005767822266, -47.875022888183594, -45.323036193847656, -42.77105712890625, -40.21907043457031, -37.66708755493164, -35.11510467529297, -32.5631217956543, -30.011138916015625, -27.45915412902832, -24.90717124938965, -22.355188369750977, -19.803203582763672, -17.251220703125, -14.699237823486328, -12.147254943847656, -9.595271110534668, -7.043287754058838, -4.491304397583008, -1.939321517944336, 0.6126623153686523, 3.1646461486816406, 5.7166290283203125, 8.268611907958984, 10.820595741271973, 13.372579574584961, 15.924562454223633, 18.476545333862305, 21.02853012084961, 23.58051300048828, 26.132495880126953, 28.684478759765625, 31.236461639404297, 33.78844451904297, 36.340431213378906, 38.89241027832031, 41.44439697265625, 43.99637985229492, 46.548362731933594, 49.100345611572266, 51.65232849121094, 54.20431137084961, 56.75629425048828, 59.30828094482422, 61.86026382446289, 64.41224670410156, 66.9642333984375, 69.51622009277344, 72.06819915771484, 74.62018585205078, 77.17216491699219, 79.72415161132812, 82.27613067626953, 84.82811737060547, 87.38009643554688]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 5.0, 7.0, 8.0, 15.0, 15.0, 22.0, 30.0, 61.0, 62.0, 137.0, 180.0, 314.0, 544.0, 795.0, 1361.0, 2363.0, 4038.0, 7314.0, 13725.0, 27591.0, 61578.0, 166338.0, 774907.0, 2655437.0, 300690.0, 95155.0, 40138.0, 19116.0, 9738.0, 5379.0, 2974.0, 1671.0, 977.0, 558.0, 383.0, 239.0, 132.0, 92.0, 69.0, 37.0, 39.0, 12.0, 15.0, 11.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.25, -15.745849609375, -15.24169921875, -14.737548828125, -14.2333984375, -13.729248046875, -13.22509765625, -12.720947265625, -12.216796875, -11.712646484375, -11.20849609375, -10.704345703125, -10.2001953125, -9.696044921875, -9.19189453125, -8.687744140625, -8.18359375, -7.679443359375, -7.17529296875, -6.671142578125, -6.1669921875, -5.662841796875, -5.15869140625, -4.654541015625, -4.150390625, -3.646240234375, -3.14208984375, -2.637939453125, -2.1337890625, -1.629638671875, -1.12548828125, -0.621337890625, -0.1171875, 0.386962890625, 0.89111328125, 1.395263671875, 1.8994140625, 2.403564453125, 2.90771484375, 3.411865234375, 3.916015625, 4.420166015625, 4.92431640625, 5.428466796875, 5.9326171875, 6.436767578125, 6.94091796875, 7.445068359375, 7.94921875, 8.453369140625, 8.95751953125, 9.461669921875, 9.9658203125, 10.469970703125, 10.97412109375, 11.478271484375, 11.982421875, 12.486572265625, 12.99072265625, 13.494873046875, 13.9990234375, 14.503173828125, 15.00732421875, 15.511474609375, 16.015625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 6.0, 10.0, 7.0, 13.0, 5.0, 17.0, 23.0, 19.0, 24.0, 39.0, 23.0, 32.0, 45.0, 49.0, 35.0, 49.0, 70.0, 58.0, 60.0, 48.0, 49.0, 54.0, 32.0, 49.0, 25.0, 33.0, 25.0, 23.0, 15.0, 20.0, 11.0, 7.0, 14.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.17578125, -4.04327392578125, -3.9107666015625, -3.77825927734375, -3.645751953125, -3.51324462890625, -3.3807373046875, -3.24822998046875, -3.11572265625, -2.98321533203125, -2.8507080078125, -2.71820068359375, -2.585693359375, -2.45318603515625, -2.3206787109375, -2.18817138671875, -2.0556640625, -1.92315673828125, -1.7906494140625, -1.65814208984375, -1.525634765625, -1.39312744140625, -1.2606201171875, -1.12811279296875, -0.99560546875, -0.86309814453125, -0.7305908203125, -0.59808349609375, -0.465576171875, -0.33306884765625, -0.2005615234375, -0.06805419921875, 0.064453125, 0.19696044921875, 0.3294677734375, 0.46197509765625, 0.594482421875, 0.72698974609375, 0.8594970703125, 0.99200439453125, 1.12451171875, 1.25701904296875, 1.3895263671875, 1.52203369140625, 1.654541015625, 1.78704833984375, 1.9195556640625, 2.05206298828125, 2.1845703125, 2.31707763671875, 2.4495849609375, 2.58209228515625, 2.714599609375, 2.84710693359375, 2.9796142578125, 3.11212158203125, 3.24462890625, 3.37713623046875, 3.5096435546875, 3.64215087890625, 3.774658203125, 3.90716552734375, 4.0396728515625, 4.17218017578125, 4.3046875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 9.0, 7.0, 15.0, 14.0, 22.0, 42.0, 64.0, 76.0, 137.0, 179.0, 266.0, 453.0, 705.0, 1132.0, 1880.0, 3210.0, 5650.0, 10135.0, 18837.0, 36896.0, 77884.0, 186566.0, 610545.0, 2349790.0, 560687.0, 176864.0, 74442.0, 35657.0, 18554.0, 9950.0, 5586.0, 3116.0, 1839.0, 1121.0, 643.0, 436.0, 293.0, 187.0, 128.0, 88.0, 59.0, 41.0, 28.0, 12.0, 11.0, 8.0, 4.0, 7.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-14.890625, -14.41748046875, -13.9443359375, -13.47119140625, -12.998046875, -12.52490234375, -12.0517578125, -11.57861328125, -11.10546875, -10.63232421875, -10.1591796875, -9.68603515625, -9.212890625, -8.73974609375, -8.2666015625, -7.79345703125, -7.3203125, -6.84716796875, -6.3740234375, -5.90087890625, -5.427734375, -4.95458984375, -4.4814453125, -4.00830078125, -3.53515625, -3.06201171875, -2.5888671875, -2.11572265625, -1.642578125, -1.16943359375, -0.6962890625, -0.22314453125, 0.25, 0.72314453125, 1.1962890625, 1.66943359375, 2.142578125, 2.61572265625, 3.0888671875, 3.56201171875, 4.03515625, 4.50830078125, 4.9814453125, 5.45458984375, 5.927734375, 6.40087890625, 6.8740234375, 7.34716796875, 7.8203125, 8.29345703125, 8.7666015625, 9.23974609375, 9.712890625, 10.18603515625, 10.6591796875, 11.13232421875, 11.60546875, 12.07861328125, 12.5517578125, 13.02490234375, 13.498046875, 13.97119140625, 14.4443359375, 14.91748046875, 15.390625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 7.0, 8.0, 8.0, 15.0, 20.0, 21.0, 31.0, 36.0, 37.0, 45.0, 65.0, 81.0, 146.0, 217.0, 333.0, 640.0, 935.0, 490.0, 273.0, 169.0, 109.0, 94.0, 64.0, 46.0, 56.0, 29.0, 29.0, 11.0, 11.0, 15.0, 9.0, 6.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.6796875, -8.3729248046875, -8.066162109375, -7.7593994140625, -7.45263671875, -7.1458740234375, -6.839111328125, -6.5323486328125, -6.2255859375, -5.9188232421875, -5.612060546875, -5.3052978515625, -4.99853515625, -4.6917724609375, -4.385009765625, -4.0782470703125, -3.771484375, -3.4647216796875, -3.157958984375, -2.8511962890625, -2.54443359375, -2.2376708984375, -1.930908203125, -1.6241455078125, -1.3173828125, -1.0106201171875, -0.703857421875, -0.3970947265625, -0.09033203125, 0.2164306640625, 0.523193359375, 0.8299560546875, 1.13671875, 1.4434814453125, 1.750244140625, 2.0570068359375, 2.36376953125, 2.6705322265625, 2.977294921875, 3.2840576171875, 3.5908203125, 3.8975830078125, 4.204345703125, 4.5111083984375, 4.81787109375, 5.1246337890625, 5.431396484375, 5.7381591796875, 6.044921875, 6.3516845703125, 6.658447265625, 6.9652099609375, 7.27197265625, 7.5787353515625, 7.885498046875, 8.1922607421875, 8.4990234375, 8.8057861328125, 9.112548828125, 9.4193115234375, 9.72607421875, 10.0328369140625, 10.339599609375, 10.6463623046875, 10.953125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 7.0, 9.0, 24.0, 55.0, 76.0, 143.0, 163.0, 162.0, 121.0, 103.0, 61.0, 45.0, 14.0, 11.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-138.03591918945312, -134.3201904296875, -130.60447692871094, -126.88874816894531, -123.17302703857422, -119.4572982788086, -115.7415771484375, -112.02584838867188, -108.31012725830078, -104.59440612792969, -100.87867736816406, -97.16295623779297, -93.44723510742188, -89.73150634765625, -86.01578521728516, -82.30006408691406, -78.58433532714844, -74.86861419677734, -71.15288543701172, -67.43716430664062, -63.721439361572266, -60.005714416503906, -56.28999328613281, -52.57426834106445, -48.858551025390625, -45.142826080322266, -41.42710494995117, -37.71138000488281, -33.99565505981445, -30.279932022094727, -26.564208984375, -22.84848403930664, -19.13275909423828, -15.417035102844238, -11.701311111450195, -7.985588073730469, -4.269864082336426, -0.5541400909423828, 3.1615829467773438, 6.877307891845703, 10.59303092956543, 14.308754920959473, 18.024478912353516, 21.740201950073242, 25.45592498779297, 29.171649932861328, 32.88737487792969, 36.60309600830078, 40.31882095336914, 44.0345458984375, 47.750267028808594, 51.46599197387695, 55.18171691894531, 58.897438049316406, 62.613162994384766, 66.32888793945312, 70.04460906982422, 73.76033020019531, 77.47605895996094, 81.19178009033203, 84.90750122070312, 88.62322998046875, 92.33895111083984, 96.05467224121094, 99.77040100097656]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 7.0, 10.0, 8.0, 8.0, 14.0, 12.0, 15.0, 12.0, 17.0, 15.0, 34.0, 36.0, 24.0, 32.0, 30.0, 52.0, 39.0, 44.0, 34.0, 53.0, 50.0, 39.0, 41.0, 45.0, 30.0, 35.0, 33.0, 36.0, 26.0, 34.0, 27.0, 18.0, 16.0, 10.0, 10.0, 8.0, 7.0, 9.0, 5.0, 4.0, 4.0, 4.0, 5.0, 1.0, 2.0, 3.0, 3.0, 1.0], "bins": [-47.174259185791016, -45.86351776123047, -44.55277633666992, -43.242034912109375, -41.93129348754883, -40.62055206298828, -39.309810638427734, -37.99906921386719, -36.688323974609375, -35.37758255004883, -34.06684112548828, -32.756099700927734, -31.445358276367188, -30.13461685180664, -28.82387351989746, -27.513132095336914, -26.202392578125, -24.891651153564453, -23.580909729003906, -22.27016830444336, -20.959426879882812, -19.648685455322266, -18.337942123413086, -17.02720069885254, -15.716459274291992, -14.405717849731445, -13.094976425170898, -11.784234046936035, -10.473492622375488, -9.162751197814941, -7.852009296417236, -6.541267395019531, -5.230522155761719, -3.9197804927825928, -2.609038829803467, -1.2982971668243408, 0.012444496154785156, 1.323185920715332, 2.633927822113037, 3.944669723510742, 5.255411148071289, 6.566152572631836, 7.876894474029541, 9.187636375427246, 10.498377799987793, 11.80911922454834, 13.119861602783203, 14.43060302734375, 15.741344451904297, 17.052085876464844, 18.36282730102539, 19.673568725585938, 20.984310150146484, 22.29505157470703, 23.60579490661621, 24.916536331176758, 26.227277755737305, 27.53801918029785, 28.8487606048584, 30.159502029418945, 31.470245361328125, 32.78098678588867, 34.09172821044922, 35.402469635009766, 36.71321105957031]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 8.0, 5.0, 13.0, 26.0, 43.0, 49.0, 83.0, 144.0, 244.0, 406.0, 801.0, 1569.0, 3042.0, 6282.0, 13748.0, 31227.0, 75862.0, 259002.0, 457703.0, 116755.0, 44897.0, 19344.0, 8702.0, 4129.0, 2067.0, 1060.0, 591.0, 296.0, 208.0, 85.0, 57.0, 35.0, 26.0, 14.0, 6.0, 9.0, 10.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.515625, -20.803466796875, -20.09130859375, -19.379150390625, -18.6669921875, -17.954833984375, -17.24267578125, -16.530517578125, -15.818359375, -15.106201171875, -14.39404296875, -13.681884765625, -12.9697265625, -12.257568359375, -11.54541015625, -10.833251953125, -10.12109375, -9.408935546875, -8.69677734375, -7.984619140625, -7.2724609375, -6.560302734375, -5.84814453125, -5.135986328125, -4.423828125, -3.711669921875, -2.99951171875, -2.287353515625, -1.5751953125, -0.863037109375, -0.15087890625, 0.561279296875, 1.2734375, 1.985595703125, 2.69775390625, 3.409912109375, 4.1220703125, 4.834228515625, 5.54638671875, 6.258544921875, 6.970703125, 7.682861328125, 8.39501953125, 9.107177734375, 9.8193359375, 10.531494140625, 11.24365234375, 11.955810546875, 12.66796875, 13.380126953125, 14.09228515625, 14.804443359375, 15.5166015625, 16.228759765625, 16.94091796875, 17.653076171875, 18.365234375, 19.077392578125, 19.78955078125, 20.501708984375, 21.2138671875, 21.926025390625, 22.63818359375, 23.350341796875, 24.0625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 2.0, 8.0, 14.0, 10.0, 11.0, 17.0, 24.0, 20.0, 30.0, 27.0, 27.0, 21.0, 41.0, 40.0, 58.0, 54.0, 68.0, 44.0, 50.0, 53.0, 56.0, 51.0, 37.0, 34.0, 32.0, 19.0, 30.0, 19.0, 20.0, 21.0, 21.0, 14.0, 7.0, 8.0, 3.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.9765625, -3.8427734375, -3.708984375, -3.5751953125, -3.44140625, -3.3076171875, -3.173828125, -3.0400390625, -2.90625, -2.7724609375, -2.638671875, -2.5048828125, -2.37109375, -2.2373046875, -2.103515625, -1.9697265625, -1.8359375, -1.7021484375, -1.568359375, -1.4345703125, -1.30078125, -1.1669921875, -1.033203125, -0.8994140625, -0.765625, -0.6318359375, -0.498046875, -0.3642578125, -0.23046875, -0.0966796875, 0.037109375, 0.1708984375, 0.3046875, 0.4384765625, 0.572265625, 0.7060546875, 0.83984375, 0.9736328125, 1.107421875, 1.2412109375, 1.375, 1.5087890625, 1.642578125, 1.7763671875, 1.91015625, 2.0439453125, 2.177734375, 2.3115234375, 2.4453125, 2.5791015625, 2.712890625, 2.8466796875, 2.98046875, 3.1142578125, 3.248046875, 3.3818359375, 3.515625, 3.6494140625, 3.783203125, 3.9169921875, 4.05078125, 4.1845703125, 4.318359375, 4.4521484375, 4.5859375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 6.0, 6.0, 11.0, 15.0, 25.0, 22.0, 43.0, 51.0, 74.0, 104.0, 147.0, 225.0, 403.0, 617.0, 1130.0, 2324.0, 5357.0, 15002.0, 54229.0, 283194.0, 555263.0, 92663.0, 23401.0, 7473.0, 3086.0, 1470.0, 831.0, 481.0, 261.0, 192.0, 141.0, 74.0, 65.0, 43.0, 41.0, 14.0, 19.0, 14.0, 9.0, 4.0, 4.0, 2.0, 4.0, 5.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0], "bins": [-28.21875, -27.393310546875, -26.56787109375, -25.742431640625, -24.9169921875, -24.091552734375, -23.26611328125, -22.440673828125, -21.615234375, -20.789794921875, -19.96435546875, -19.138916015625, -18.3134765625, -17.488037109375, -16.66259765625, -15.837158203125, -15.01171875, -14.186279296875, -13.36083984375, -12.535400390625, -11.7099609375, -10.884521484375, -10.05908203125, -9.233642578125, -8.408203125, -7.582763671875, -6.75732421875, -5.931884765625, -5.1064453125, -4.281005859375, -3.45556640625, -2.630126953125, -1.8046875, -0.979248046875, -0.15380859375, 0.671630859375, 1.4970703125, 2.322509765625, 3.14794921875, 3.973388671875, 4.798828125, 5.624267578125, 6.44970703125, 7.275146484375, 8.1005859375, 8.926025390625, 9.75146484375, 10.576904296875, 11.40234375, 12.227783203125, 13.05322265625, 13.878662109375, 14.7041015625, 15.529541015625, 16.35498046875, 17.180419921875, 18.005859375, 18.831298828125, 19.65673828125, 20.482177734375, 21.3076171875, 22.133056640625, 22.95849609375, 23.783935546875, 24.609375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 9.0, 7.0, 11.0, 10.0, 11.0, 13.0, 16.0, 23.0, 21.0, 27.0, 37.0, 50.0, 48.0, 46.0, 48.0, 64.0, 49.0, 53.0, 49.0, 43.0, 32.0, 54.0, 40.0, 37.0, 21.0, 35.0, 28.0, 25.0, 14.0, 17.0, 13.0, 10.0, 7.0, 11.0, 9.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-17.125, -16.51953125, -15.9140625, -15.30859375, -14.703125, -14.09765625, -13.4921875, -12.88671875, -12.28125, -11.67578125, -11.0703125, -10.46484375, -9.859375, -9.25390625, -8.6484375, -8.04296875, -7.4375, -6.83203125, -6.2265625, -5.62109375, -5.015625, -4.41015625, -3.8046875, -3.19921875, -2.59375, -1.98828125, -1.3828125, -0.77734375, -0.171875, 0.43359375, 1.0390625, 1.64453125, 2.25, 2.85546875, 3.4609375, 4.06640625, 4.671875, 5.27734375, 5.8828125, 6.48828125, 7.09375, 7.69921875, 8.3046875, 8.91015625, 9.515625, 10.12109375, 10.7265625, 11.33203125, 11.9375, 12.54296875, 13.1484375, 13.75390625, 14.359375, 14.96484375, 15.5703125, 16.17578125, 16.78125, 17.38671875, 17.9921875, 18.59765625, 19.203125, 19.80859375, 20.4140625, 21.01953125, 21.625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 9.0, 7.0, 7.0, 13.0, 15.0, 22.0, 46.0, 88.0, 134.0, 283.0, 611.0, 1678.0, 5287.0, 24602.0, 332029.0, 639034.0, 34611.0, 6619.0, 1994.0, 701.0, 347.0, 163.0, 103.0, 65.0, 27.0, 21.0, 13.0, 11.0, 6.0, 6.0, 1.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.4375, -32.427001953125, -31.41650390625, -30.406005859375, -29.3955078125, -28.385009765625, -27.37451171875, -26.364013671875, -25.353515625, -24.343017578125, -23.33251953125, -22.322021484375, -21.3115234375, -20.301025390625, -19.29052734375, -18.280029296875, -17.26953125, -16.259033203125, -15.24853515625, -14.238037109375, -13.2275390625, -12.217041015625, -11.20654296875, -10.196044921875, -9.185546875, -8.175048828125, -7.16455078125, -6.154052734375, -5.1435546875, -4.133056640625, -3.12255859375, -2.112060546875, -1.1015625, -0.091064453125, 0.91943359375, 1.929931640625, 2.9404296875, 3.950927734375, 4.96142578125, 5.971923828125, 6.982421875, 7.992919921875, 9.00341796875, 10.013916015625, 11.0244140625, 12.034912109375, 13.04541015625, 14.055908203125, 15.06640625, 16.076904296875, 17.08740234375, 18.097900390625, 19.1083984375, 20.118896484375, 21.12939453125, 22.139892578125, 23.150390625, 24.160888671875, 25.17138671875, 26.181884765625, 27.1923828125, 28.202880859375, 29.21337890625, 30.223876953125, 31.234375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 9.0, 4.0, 11.0, 8.0, 8.0, 17.0, 22.0, 38.0, 41.0, 70.0, 190.0, 246.0, 111.0, 62.0, 32.0, 32.0, 18.0, 16.0, 16.0, 8.0, 6.0, 7.0, 1.0, 5.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00412750244140625, -0.00398629903793335, -0.0038450956344604492, -0.003703892230987549, -0.0035626888275146484, -0.003421485424041748, -0.0032802820205688477, -0.0031390786170959473, -0.002997875213623047, -0.0028566718101501465, -0.002715468406677246, -0.0025742650032043457, -0.0024330615997314453, -0.002291858196258545, -0.0021506547927856445, -0.002009451389312744, -0.0018682479858398438, -0.0017270445823669434, -0.001585841178894043, -0.0014446377754211426, -0.0013034343719482422, -0.0011622309684753418, -0.0010210275650024414, -0.000879824161529541, -0.0007386207580566406, -0.0005974173545837402, -0.00045621395111083984, -0.00031501054763793945, -0.00017380714416503906, -3.260374069213867e-05, 0.00010859966278076172, 0.0002498030662536621, 0.0003910064697265625, 0.0005322098731994629, 0.0006734132766723633, 0.0008146166801452637, 0.0009558200836181641, 0.0010970234870910645, 0.0012382268905639648, 0.0013794302940368652, 0.0015206336975097656, 0.001661837100982666, 0.0018030405044555664, 0.0019442439079284668, 0.002085447311401367, 0.0022266507148742676, 0.002367854118347168, 0.0025090575218200684, 0.0026502609252929688, 0.002791464328765869, 0.0029326677322387695, 0.00307387113571167, 0.0032150745391845703, 0.0033562779426574707, 0.003497481346130371, 0.0036386847496032715, 0.003779888153076172, 0.003921091556549072, 0.004062294960021973, 0.004203498363494873, 0.0043447017669677734, 0.004485905170440674, 0.004627108573913574, 0.004768311977386475, 0.004909515380859375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 1.0, 3.0, 9.0, 4.0, 20.0, 20.0, 31.0, 42.0, 92.0, 116.0, 211.0, 370.0, 755.0, 1571.0, 4161.0, 12467.0, 53044.0, 626115.0, 298643.0, 35667.0, 9144.0, 3178.0, 1371.0, 693.0, 341.0, 191.0, 94.0, 67.0, 45.0, 25.0, 20.0, 10.0, 6.0, 6.0, 3.0, 12.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-23.46875, -22.7548828125, -22.041015625, -21.3271484375, -20.61328125, -19.8994140625, -19.185546875, -18.4716796875, -17.7578125, -17.0439453125, -16.330078125, -15.6162109375, -14.90234375, -14.1884765625, -13.474609375, -12.7607421875, -12.046875, -11.3330078125, -10.619140625, -9.9052734375, -9.19140625, -8.4775390625, -7.763671875, -7.0498046875, -6.3359375, -5.6220703125, -4.908203125, -4.1943359375, -3.48046875, -2.7666015625, -2.052734375, -1.3388671875, -0.625, 0.0888671875, 0.802734375, 1.5166015625, 2.23046875, 2.9443359375, 3.658203125, 4.3720703125, 5.0859375, 5.7998046875, 6.513671875, 7.2275390625, 7.94140625, 8.6552734375, 9.369140625, 10.0830078125, 10.796875, 11.5107421875, 12.224609375, 12.9384765625, 13.65234375, 14.3662109375, 15.080078125, 15.7939453125, 16.5078125, 17.2216796875, 17.935546875, 18.6494140625, 19.36328125, 20.0771484375, 20.791015625, 21.5048828125, 22.21875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 7.0, 11.0, 9.0, 9.0, 9.0, 25.0, 34.0, 45.0, 66.0, 139.0, 168.0, 180.0, 110.0, 50.0, 34.0, 24.0, 17.0, 15.0, 13.0, 11.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5859375, -13.0809326171875, -12.575927734375, -12.0709228515625, -11.56591796875, -11.0609130859375, -10.555908203125, -10.0509033203125, -9.5458984375, -9.0408935546875, -8.535888671875, -8.0308837890625, -7.52587890625, -7.0208740234375, -6.515869140625, -6.0108642578125, -5.505859375, -5.0008544921875, -4.495849609375, -3.9908447265625, -3.48583984375, -2.9808349609375, -2.475830078125, -1.9708251953125, -1.4658203125, -0.9608154296875, -0.455810546875, 0.0491943359375, 0.55419921875, 1.0592041015625, 1.564208984375, 2.0692138671875, 2.57421875, 3.0792236328125, 3.584228515625, 4.0892333984375, 4.59423828125, 5.0992431640625, 5.604248046875, 6.1092529296875, 6.6142578125, 7.1192626953125, 7.624267578125, 8.1292724609375, 8.63427734375, 9.1392822265625, 9.644287109375, 10.1492919921875, 10.654296875, 11.1593017578125, 11.664306640625, 12.1693115234375, 12.67431640625, 13.1793212890625, 13.684326171875, 14.1893310546875, 14.6943359375, 15.1993408203125, 15.704345703125, 16.2093505859375, 16.71435546875, 17.2193603515625, 17.724365234375, 18.2293701171875, 18.734375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 6.0, 12.0, 28.0, 58.0, 113.0, 164.0, 197.0, 154.0, 111.0, 80.0, 42.0, 14.0, 12.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-148.37586975097656, -139.50830078125, -130.64073181152344, -121.77316284179688, -112.90559387207031, -104.03802490234375, -95.17045593261719, -86.30288696289062, -77.43531799316406, -68.5677490234375, -59.70018005371094, -50.832611083984375, -41.96504211425781, -33.09747314453125, -24.229904174804688, -15.362335205078125, -6.4947662353515625, 2.372802734375, 11.240371704101562, 20.107940673828125, 28.975509643554688, 37.84307861328125, 46.71064758300781, 55.578216552734375, 64.44578552246094, 73.3133544921875, 82.18092346191406, 91.04849243164062, 99.91606140136719, 108.78363037109375, 117.65119934082031, 126.51876831054688, 135.3863525390625, 144.25392150878906, 153.12149047851562, 161.9890594482422, 170.85662841796875, 179.7241973876953, 188.59176635742188, 197.45933532714844, 206.326904296875, 215.19447326660156, 224.06204223632812, 232.9296112060547, 241.79718017578125, 250.6647491455078, 259.5323181152344, 268.39990234375, 277.2674560546875, 286.135009765625, 295.0025939941406, 303.87017822265625, 312.73773193359375, 321.60528564453125, 330.4728698730469, 339.3404541015625, 348.2080078125, 357.0755615234375, 365.9431457519531, 374.81072998046875, 383.67828369140625, 392.54583740234375, 401.4134216308594, 410.281005859375, 419.1485595703125]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 5.0, 3.0, 7.0, 10.0, 10.0, 10.0, 16.0, 10.0, 16.0, 23.0, 23.0, 15.0, 29.0, 29.0, 25.0, 40.0, 32.0, 45.0, 42.0, 40.0, 39.0, 41.0, 39.0, 47.0, 42.0, 44.0, 31.0, 32.0, 38.0, 25.0, 26.0, 22.0, 23.0, 23.0, 20.0, 10.0, 18.0, 14.0, 13.0, 5.0, 5.0, 5.0, 2.0, 3.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-80.12784576416016, -77.42349243164062, -74.7191390991211, -72.01478576660156, -69.3104248046875, -66.60607147216797, -63.90171813964844, -61.197364807128906, -58.493011474609375, -55.788658142089844, -53.08430480957031, -50.379947662353516, -47.675594329833984, -44.97124099731445, -42.266883850097656, -39.562530517578125, -36.858177185058594, -34.15382385253906, -31.4494686126709, -28.745113372802734, -26.040760040283203, -23.336406707763672, -20.632051467895508, -17.927696228027344, -15.223342895507812, -12.518988609313965, -9.814634323120117, -7.1102800369262695, -4.405925750732422, -1.7015714645385742, 1.0027828216552734, 3.7071380615234375, 6.4114837646484375, 9.115838050842285, 11.820192337036133, 14.52454662322998, 17.228900909423828, 19.93325424194336, 22.637609481811523, 25.341964721679688, 28.04631805419922, 30.75067138671875, 33.45502471923828, 36.15938186645508, 38.86373519897461, 41.56808853149414, 44.27244567871094, 46.97679901123047, 49.68115234375, 52.38550567626953, 55.08985900878906, 57.79421615600586, 60.49856948852539, 63.20292282104492, 65.90727996826172, 68.61163330078125, 71.31598663330078, 74.02033996582031, 76.72469329833984, 79.42904663085938, 82.13340759277344, 84.83776092529297, 87.5421142578125, 90.24646759033203, 92.95082092285156]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 9.0, 5.0, 6.0, 21.0, 14.0, 21.0, 28.0, 41.0, 54.0, 83.0, 129.0, 202.0, 322.0, 511.0, 743.0, 1128.0, 2067.0, 3553.0, 6227.0, 11617.0, 24266.0, 57685.0, 178455.0, 1937326.0, 1684657.0, 176242.0, 57371.0, 24472.0, 11876.0, 6275.0, 3510.0, 1991.0, 1267.0, 730.0, 429.0, 335.0, 199.0, 122.0, 85.0, 74.0, 44.0, 29.0, 16.0, 16.0, 17.0, 4.0, 3.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.953125, -18.341552734375, -17.72998046875, -17.118408203125, -16.5068359375, -15.895263671875, -15.28369140625, -14.672119140625, -14.060546875, -13.448974609375, -12.83740234375, -12.225830078125, -11.6142578125, -11.002685546875, -10.39111328125, -9.779541015625, -9.16796875, -8.556396484375, -7.94482421875, -7.333251953125, -6.7216796875, -6.110107421875, -5.49853515625, -4.886962890625, -4.275390625, -3.663818359375, -3.05224609375, -2.440673828125, -1.8291015625, -1.217529296875, -0.60595703125, 0.005615234375, 0.6171875, 1.228759765625, 1.84033203125, 2.451904296875, 3.0634765625, 3.675048828125, 4.28662109375, 4.898193359375, 5.509765625, 6.121337890625, 6.73291015625, 7.344482421875, 7.9560546875, 8.567626953125, 9.17919921875, 9.790771484375, 10.40234375, 11.013916015625, 11.62548828125, 12.237060546875, 12.8486328125, 13.460205078125, 14.07177734375, 14.683349609375, 15.294921875, 15.906494140625, 16.51806640625, 17.129638671875, 17.7412109375, 18.352783203125, 18.96435546875, 19.575927734375, 20.1875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 8.0, 5.0, 5.0, 2.0, 12.0, 9.0, 18.0, 18.0, 9.0, 13.0, 15.0, 24.0, 20.0, 27.0, 30.0, 40.0, 26.0, 44.0, 39.0, 48.0, 42.0, 56.0, 53.0, 51.0, 55.0, 26.0, 36.0, 39.0, 38.0, 20.0, 27.0, 34.0, 26.0, 18.0, 18.0, 9.0, 5.0, 10.0, 11.0, 5.0, 5.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.01953125, -3.88818359375, -3.7568359375, -3.62548828125, -3.494140625, -3.36279296875, -3.2314453125, -3.10009765625, -2.96875, -2.83740234375, -2.7060546875, -2.57470703125, -2.443359375, -2.31201171875, -2.1806640625, -2.04931640625, -1.91796875, -1.78662109375, -1.6552734375, -1.52392578125, -1.392578125, -1.26123046875, -1.1298828125, -0.99853515625, -0.8671875, -0.73583984375, -0.6044921875, -0.47314453125, -0.341796875, -0.21044921875, -0.0791015625, 0.05224609375, 0.18359375, 0.31494140625, 0.4462890625, 0.57763671875, 0.708984375, 0.84033203125, 0.9716796875, 1.10302734375, 1.234375, 1.36572265625, 1.4970703125, 1.62841796875, 1.759765625, 1.89111328125, 2.0224609375, 2.15380859375, 2.28515625, 2.41650390625, 2.5478515625, 2.67919921875, 2.810546875, 2.94189453125, 3.0732421875, 3.20458984375, 3.3359375, 3.46728515625, 3.5986328125, 3.72998046875, 3.861328125, 3.99267578125, 4.1240234375, 4.25537109375, 4.38671875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 7.0, 9.0, 14.0, 12.0, 24.0, 31.0, 30.0, 67.0, 83.0, 169.0, 209.0, 400.0, 631.0, 1255.0, 2219.0, 4323.0, 9354.0, 23052.0, 74618.0, 412284.0, 3193277.0, 363209.0, 68800.0, 21835.0, 9109.0, 4294.0, 2195.0, 1148.0, 619.0, 366.0, 241.0, 137.0, 102.0, 62.0, 31.0, 26.0, 12.0, 10.0, 4.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.03125, -27.111328125, -26.19140625, -25.271484375, -24.3515625, -23.431640625, -22.51171875, -21.591796875, -20.671875, -19.751953125, -18.83203125, -17.912109375, -16.9921875, -16.072265625, -15.15234375, -14.232421875, -13.3125, -12.392578125, -11.47265625, -10.552734375, -9.6328125, -8.712890625, -7.79296875, -6.873046875, -5.953125, -5.033203125, -4.11328125, -3.193359375, -2.2734375, -1.353515625, -0.43359375, 0.486328125, 1.40625, 2.326171875, 3.24609375, 4.166015625, 5.0859375, 6.005859375, 6.92578125, 7.845703125, 8.765625, 9.685546875, 10.60546875, 11.525390625, 12.4453125, 13.365234375, 14.28515625, 15.205078125, 16.125, 17.044921875, 17.96484375, 18.884765625, 19.8046875, 20.724609375, 21.64453125, 22.564453125, 23.484375, 24.404296875, 25.32421875, 26.244140625, 27.1640625, 28.083984375, 29.00390625, 29.923828125, 30.84375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 5.0, 5.0, 2.0, 4.0, 4.0, 10.0, 12.0, 20.0, 38.0, 40.0, 64.0, 138.0, 175.0, 383.0, 1023.0, 1182.0, 393.0, 210.0, 117.0, 82.0, 39.0, 27.0, 25.0, 20.0, 9.0, 13.0, 7.0, 10.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.484375, -16.0513916015625, -15.618408203125, -15.1854248046875, -14.75244140625, -14.3194580078125, -13.886474609375, -13.4534912109375, -13.0205078125, -12.5875244140625, -12.154541015625, -11.7215576171875, -11.28857421875, -10.8555908203125, -10.422607421875, -9.9896240234375, -9.556640625, -9.1236572265625, -8.690673828125, -8.2576904296875, -7.82470703125, -7.3917236328125, -6.958740234375, -6.5257568359375, -6.0927734375, -5.6597900390625, -5.226806640625, -4.7938232421875, -4.36083984375, -3.9278564453125, -3.494873046875, -3.0618896484375, -2.62890625, -2.1959228515625, -1.762939453125, -1.3299560546875, -0.89697265625, -0.4639892578125, -0.031005859375, 0.4019775390625, 0.8349609375, 1.2679443359375, 1.700927734375, 2.1339111328125, 2.56689453125, 2.9998779296875, 3.432861328125, 3.8658447265625, 4.298828125, 4.7318115234375, 5.164794921875, 5.5977783203125, 6.03076171875, 6.4637451171875, 6.896728515625, 7.3297119140625, 7.7626953125, 8.1956787109375, 8.628662109375, 9.0616455078125, 9.49462890625, 9.9276123046875, 10.360595703125, 10.7935791015625, 11.2265625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 9.0, 10.0, 16.0, 28.0, 46.0, 58.0, 84.0, 96.0, 103.0, 137.0, 102.0, 100.0, 71.0, 57.0, 31.0, 13.0, 14.0, 9.0, 9.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.20120239257812, -71.48805236816406, -68.77489471435547, -66.0617446899414, -63.34859085083008, -60.63543701171875, -57.92228698730469, -55.20913314819336, -52.49597930908203, -49.7828254699707, -47.06967544555664, -44.35652160644531, -41.643367767333984, -38.930213928222656, -36.217063903808594, -33.503910064697266, -30.790760040283203, -28.077608108520508, -25.36445426940918, -22.651302337646484, -19.938148498535156, -17.22499656677246, -14.511844635009766, -11.798690795898438, -9.085538864135742, -6.3723859786987305, -3.659233570098877, -0.9460811614990234, 1.7670717239379883, 4.480224609375, 7.193376541137695, 9.906530380249023, 12.619682312011719, 15.33283519744873, 18.045988082885742, 20.759140014648438, 23.472293853759766, 26.18544578552246, 28.898597717285156, 31.611751556396484, 34.32490539550781, 37.03805923461914, 39.7512092590332, 42.46436309814453, 45.17751693725586, 47.89067077636719, 50.60382080078125, 53.31697463989258, 56.03012466430664, 58.74327850341797, 61.45642852783203, 64.16958618164062, 66.88273620605469, 69.59588623046875, 72.30903625488281, 75.0221939086914, 77.73534393310547, 80.44849395751953, 83.16165161132812, 85.87480163574219, 88.58795166015625, 91.30110931396484, 94.0142593383789, 96.7274169921875, 99.44056701660156]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 4.0, 4.0, 6.0, 12.0, 10.0, 14.0, 6.0, 14.0, 14.0, 18.0, 22.0, 21.0, 28.0, 38.0, 45.0, 36.0, 40.0, 35.0, 41.0, 46.0, 44.0, 39.0, 42.0, 43.0, 44.0, 41.0, 39.0, 29.0, 29.0, 30.0, 27.0, 23.0, 18.0, 17.0, 13.0, 23.0, 11.0, 9.0, 6.0, 4.0, 5.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.97904586791992, -39.616050720214844, -38.25305938720703, -36.89006423950195, -35.527069091796875, -34.1640739440918, -32.80107879638672, -31.438087463378906, -30.075092315673828, -28.71209716796875, -27.349103927612305, -25.98611068725586, -24.62311553955078, -23.260120391845703, -21.897127151489258, -20.534133911132812, -19.171138763427734, -17.808143615722656, -16.44515037536621, -15.08215618133545, -13.719161987304688, -12.356167793273926, -10.993173599243164, -9.630179405212402, -8.26718521118164, -6.904191017150879, -5.541196823120117, -4.1782026290893555, -2.8152084350585938, -1.452214241027832, -0.08922004699707031, 1.2737741470336914, 2.636768341064453, 3.999762535095215, 5.362756729125977, 6.725750923156738, 8.0887451171875, 9.451739311218262, 10.814733505249023, 12.177727699279785, 13.540721893310547, 14.903716087341309, 16.26671028137207, 17.629703521728516, 18.992698669433594, 20.355693817138672, 21.718687057495117, 23.081680297851562, 24.44467544555664, 25.80767059326172, 27.170663833618164, 28.53365707397461, 29.896652221679688, 31.259647369384766, 32.622642517089844, 33.985633850097656, 35.348628997802734, 36.71162414550781, 38.074615478515625, 39.4376106262207, 40.80060577392578, 42.16360092163086, 43.52659606933594, 44.88958740234375, 46.25258255004883]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 9.0, 9.0, 13.0, 8.0, 20.0, 20.0, 19.0, 42.0, 54.0, 74.0, 123.0, 212.0, 337.0, 599.0, 1032.0, 1925.0, 3584.0, 6885.0, 13253.0, 26560.0, 56506.0, 177557.0, 480379.0, 170168.0, 55367.0, 25976.0, 13084.0, 6893.0, 3462.0, 1839.0, 1042.0, 587.0, 342.0, 197.0, 114.0, 80.0, 59.0, 34.0, 16.0, 16.0, 21.0, 12.0, 10.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.59375, -16.01123046875, -15.4287109375, -14.84619140625, -14.263671875, -13.68115234375, -13.0986328125, -12.51611328125, -11.93359375, -11.35107421875, -10.7685546875, -10.18603515625, -9.603515625, -9.02099609375, -8.4384765625, -7.85595703125, -7.2734375, -6.69091796875, -6.1083984375, -5.52587890625, -4.943359375, -4.36083984375, -3.7783203125, -3.19580078125, -2.61328125, -2.03076171875, -1.4482421875, -0.86572265625, -0.283203125, 0.29931640625, 0.8818359375, 1.46435546875, 2.046875, 2.62939453125, 3.2119140625, 3.79443359375, 4.376953125, 4.95947265625, 5.5419921875, 6.12451171875, 6.70703125, 7.28955078125, 7.8720703125, 8.45458984375, 9.037109375, 9.61962890625, 10.2021484375, 10.78466796875, 11.3671875, 11.94970703125, 12.5322265625, 13.11474609375, 13.697265625, 14.27978515625, 14.8623046875, 15.44482421875, 16.02734375, 16.60986328125, 17.1923828125, 17.77490234375, 18.357421875, 18.93994140625, 19.5224609375, 20.10498046875, 20.6875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 6.0, 6.0, 4.0, 2.0, 9.0, 11.0, 13.0, 15.0, 14.0, 20.0, 14.0, 25.0, 23.0, 33.0, 30.0, 29.0, 32.0, 32.0, 40.0, 52.0, 54.0, 46.0, 50.0, 35.0, 37.0, 38.0, 51.0, 46.0, 34.0, 23.0, 22.0, 22.0, 28.0, 19.0, 19.0, 13.0, 9.0, 15.0, 7.0, 6.0, 7.0, 3.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.078125, -3.93670654296875, -3.7952880859375, -3.65386962890625, -3.512451171875, -3.37103271484375, -3.2296142578125, -3.08819580078125, -2.94677734375, -2.80535888671875, -2.6639404296875, -2.52252197265625, -2.381103515625, -2.23968505859375, -2.0982666015625, -1.95684814453125, -1.8154296875, -1.67401123046875, -1.5325927734375, -1.39117431640625, -1.249755859375, -1.10833740234375, -0.9669189453125, -0.82550048828125, -0.68408203125, -0.54266357421875, -0.4012451171875, -0.25982666015625, -0.118408203125, 0.02301025390625, 0.1644287109375, 0.30584716796875, 0.447265625, 0.58868408203125, 0.7301025390625, 0.87152099609375, 1.012939453125, 1.15435791015625, 1.2957763671875, 1.43719482421875, 1.57861328125, 1.72003173828125, 1.8614501953125, 2.00286865234375, 2.144287109375, 2.28570556640625, 2.4271240234375, 2.56854248046875, 2.7099609375, 2.85137939453125, 2.9927978515625, 3.13421630859375, 3.275634765625, 3.41705322265625, 3.5584716796875, 3.69989013671875, 3.84130859375, 3.98272705078125, 4.1241455078125, 4.26556396484375, 4.406982421875, 4.54840087890625, 4.6898193359375, 4.83123779296875, 4.97265625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 6.0, 11.0, 13.0, 13.0, 20.0, 17.0, 39.0, 50.0, 79.0, 105.0, 203.0, 329.0, 636.0, 1203.0, 2786.0, 6435.0, 15942.0, 42174.0, 225011.0, 644881.0, 67569.0, 23958.0, 9442.0, 4076.0, 1675.0, 829.0, 430.0, 219.0, 128.0, 73.0, 63.0, 33.0, 19.0, 24.0, 11.0, 14.0, 14.0, 9.0, 5.0, 1.0, 0.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.6875, -26.7060546875, -25.724609375, -24.7431640625, -23.76171875, -22.7802734375, -21.798828125, -20.8173828125, -19.8359375, -18.8544921875, -17.873046875, -16.8916015625, -15.91015625, -14.9287109375, -13.947265625, -12.9658203125, -11.984375, -11.0029296875, -10.021484375, -9.0400390625, -8.05859375, -7.0771484375, -6.095703125, -5.1142578125, -4.1328125, -3.1513671875, -2.169921875, -1.1884765625, -0.20703125, 0.7744140625, 1.755859375, 2.7373046875, 3.71875, 4.7001953125, 5.681640625, 6.6630859375, 7.64453125, 8.6259765625, 9.607421875, 10.5888671875, 11.5703125, 12.5517578125, 13.533203125, 14.5146484375, 15.49609375, 16.4775390625, 17.458984375, 18.4404296875, 19.421875, 20.4033203125, 21.384765625, 22.3662109375, 23.34765625, 24.3291015625, 25.310546875, 26.2919921875, 27.2734375, 28.2548828125, 29.236328125, 30.2177734375, 31.19921875, 32.1806640625, 33.162109375, 34.1435546875, 35.125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 3.0, 7.0, 7.0, 7.0, 3.0, 7.0, 16.0, 14.0, 30.0, 37.0, 42.0, 46.0, 54.0, 65.0, 57.0, 67.0, 86.0, 67.0, 70.0, 59.0, 46.0, 47.0, 37.0, 26.0, 18.0, 23.0, 16.0, 10.0, 8.0, 4.0, 5.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.21875, -28.2177734375, -27.216796875, -26.2158203125, -25.21484375, -24.2138671875, -23.212890625, -22.2119140625, -21.2109375, -20.2099609375, -19.208984375, -18.2080078125, -17.20703125, -16.2060546875, -15.205078125, -14.2041015625, -13.203125, -12.2021484375, -11.201171875, -10.2001953125, -9.19921875, -8.1982421875, -7.197265625, -6.1962890625, -5.1953125, -4.1943359375, -3.193359375, -2.1923828125, -1.19140625, -0.1904296875, 0.810546875, 1.8115234375, 2.8125, 3.8134765625, 4.814453125, 5.8154296875, 6.81640625, 7.8173828125, 8.818359375, 9.8193359375, 10.8203125, 11.8212890625, 12.822265625, 13.8232421875, 14.82421875, 15.8251953125, 16.826171875, 17.8271484375, 18.828125, 19.8291015625, 20.830078125, 21.8310546875, 22.83203125, 23.8330078125, 24.833984375, 25.8349609375, 26.8359375, 27.8369140625, 28.837890625, 29.8388671875, 30.83984375, 31.8408203125, 32.841796875, 33.8427734375, 34.84375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 9.0, 25.0, 19.0, 32.0, 57.0, 95.0, 210.0, 316.0, 574.0, 1305.0, 2773.0, 6464.0, 16030.0, 41918.0, 186585.0, 677007.0, 71098.0, 26023.0, 10079.0, 4164.0, 1852.0, 881.0, 457.0, 236.0, 149.0, 60.0, 48.0, 36.0, 18.0, 17.0, 4.0, 7.0, 5.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.125, -13.54248046875, -12.9599609375, -12.37744140625, -11.794921875, -11.21240234375, -10.6298828125, -10.04736328125, -9.46484375, -8.88232421875, -8.2998046875, -7.71728515625, -7.134765625, -6.55224609375, -5.9697265625, -5.38720703125, -4.8046875, -4.22216796875, -3.6396484375, -3.05712890625, -2.474609375, -1.89208984375, -1.3095703125, -0.72705078125, -0.14453125, 0.43798828125, 1.0205078125, 1.60302734375, 2.185546875, 2.76806640625, 3.3505859375, 3.93310546875, 4.515625, 5.09814453125, 5.6806640625, 6.26318359375, 6.845703125, 7.42822265625, 8.0107421875, 8.59326171875, 9.17578125, 9.75830078125, 10.3408203125, 10.92333984375, 11.505859375, 12.08837890625, 12.6708984375, 13.25341796875, 13.8359375, 14.41845703125, 15.0009765625, 15.58349609375, 16.166015625, 16.74853515625, 17.3310546875, 17.91357421875, 18.49609375, 19.07861328125, 19.6611328125, 20.24365234375, 20.826171875, 21.40869140625, 21.9912109375, 22.57373046875, 23.15625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 2.0, 2.0, 6.0, 8.0, 8.0, 5.0, 14.0, 3.0, 9.0, 12.0, 26.0, 25.0, 46.0, 172.0, 323.0, 158.0, 58.0, 19.0, 17.0, 17.0, 8.0, 8.0, 6.0, 2.0, 10.0, 11.0, 2.0, 8.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00447845458984375, -0.0043315887451171875, -0.004184722900390625, -0.0040378570556640625, -0.0038909912109375, -0.0037441253662109375, -0.003597259521484375, -0.0034503936767578125, -0.00330352783203125, -0.0031566619873046875, -0.003009796142578125, -0.0028629302978515625, -0.002716064453125, -0.0025691986083984375, -0.002422332763671875, -0.0022754669189453125, -0.00212860107421875, -0.0019817352294921875, -0.001834869384765625, -0.0016880035400390625, -0.0015411376953125, -0.0013942718505859375, -0.001247406005859375, -0.0011005401611328125, -0.00095367431640625, -0.0008068084716796875, -0.000659942626953125, -0.0005130767822265625, -0.0003662109375, -0.0002193450927734375, -7.2479248046875e-05, 7.43865966796875e-05, 0.00022125244140625, 0.0003681182861328125, 0.000514984130859375, 0.0006618499755859375, 0.0008087158203125, 0.0009555816650390625, 0.001102447509765625, 0.0012493133544921875, 0.00139617919921875, 0.0015430450439453125, 0.001689910888671875, 0.0018367767333984375, 0.001983642578125, 0.0021305084228515625, 0.002277374267578125, 0.0024242401123046875, 0.00257110595703125, 0.0027179718017578125, 0.002864837646484375, 0.0030117034912109375, 0.0031585693359375, 0.0033054351806640625, 0.003452301025390625, 0.0035991668701171875, 0.00374603271484375, 0.0038928985595703125, 0.004039764404296875, 0.0041866302490234375, 0.00433349609375, 0.0044803619384765625, 0.004627227783203125, 0.0047740936279296875, 0.00492095947265625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 8.0, 6.0, 8.0, 14.0, 20.0, 27.0, 54.0, 85.0, 105.0, 196.0, 312.0, 526.0, 874.0, 1807.0, 4136.0, 10179.0, 26482.0, 73320.0, 656074.0, 202187.0, 43281.0, 16659.0, 6521.0, 2721.0, 1268.0, 648.0, 396.0, 211.0, 145.0, 91.0, 59.0, 35.0, 28.0, 20.0, 16.0, 8.0, 5.0, 9.0, 4.0, 3.0, 6.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0], "bins": [-18.703125, -18.1650390625, -17.626953125, -17.0888671875, -16.55078125, -16.0126953125, -15.474609375, -14.9365234375, -14.3984375, -13.8603515625, -13.322265625, -12.7841796875, -12.24609375, -11.7080078125, -11.169921875, -10.6318359375, -10.09375, -9.5556640625, -9.017578125, -8.4794921875, -7.94140625, -7.4033203125, -6.865234375, -6.3271484375, -5.7890625, -5.2509765625, -4.712890625, -4.1748046875, -3.63671875, -3.0986328125, -2.560546875, -2.0224609375, -1.484375, -0.9462890625, -0.408203125, 0.1298828125, 0.66796875, 1.2060546875, 1.744140625, 2.2822265625, 2.8203125, 3.3583984375, 3.896484375, 4.4345703125, 4.97265625, 5.5107421875, 6.048828125, 6.5869140625, 7.125, 7.6630859375, 8.201171875, 8.7392578125, 9.27734375, 9.8154296875, 10.353515625, 10.8916015625, 11.4296875, 11.9677734375, 12.505859375, 13.0439453125, 13.58203125, 14.1201171875, 14.658203125, 15.1962890625, 15.734375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 3.0, 4.0, 3.0, 7.0, 8.0, 7.0, 5.0, 16.0, 15.0, 9.0, 13.0, 23.0, 21.0, 32.0, 64.0, 108.0, 173.0, 151.0, 113.0, 59.0, 33.0, 21.0, 16.0, 14.0, 13.0, 7.0, 2.0, 7.0, 9.0, 4.0, 4.0, 4.0, 5.0, 3.0, 6.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.59375, -10.201416015625, -9.80908203125, -9.416748046875, -9.0244140625, -8.632080078125, -8.23974609375, -7.847412109375, -7.455078125, -7.062744140625, -6.67041015625, -6.278076171875, -5.8857421875, -5.493408203125, -5.10107421875, -4.708740234375, -4.31640625, -3.924072265625, -3.53173828125, -3.139404296875, -2.7470703125, -2.354736328125, -1.96240234375, -1.570068359375, -1.177734375, -0.785400390625, -0.39306640625, -0.000732421875, 0.3916015625, 0.783935546875, 1.17626953125, 1.568603515625, 1.9609375, 2.353271484375, 2.74560546875, 3.137939453125, 3.5302734375, 3.922607421875, 4.31494140625, 4.707275390625, 5.099609375, 5.491943359375, 5.88427734375, 6.276611328125, 6.6689453125, 7.061279296875, 7.45361328125, 7.845947265625, 8.23828125, 8.630615234375, 9.02294921875, 9.415283203125, 9.8076171875, 10.199951171875, 10.59228515625, 10.984619140625, 11.376953125, 11.769287109375, 12.16162109375, 12.553955078125, 12.9462890625, 13.338623046875, 13.73095703125, 14.123291015625, 14.515625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 16.0, 15.0, 23.0, 54.0, 45.0, 83.0, 114.0, 126.0, 134.0, 110.0, 79.0, 67.0, 46.0, 38.0, 21.0, 9.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-237.42584228515625, -230.86273193359375, -224.2996368408203, -217.73654174804688, -211.17343139648438, -204.61032104492188, -198.04722595214844, -191.484130859375, -184.9210205078125, -178.35791015625, -171.79481506347656, -165.23171997070312, -158.66860961914062, -152.10549926757812, -145.5424041748047, -138.97930908203125, -132.41619873046875, -125.85309600830078, -119.28999328613281, -112.72689056396484, -106.16378784179688, -99.6006851196289, -93.03758239746094, -86.47447967529297, -79.911376953125, -73.34827423095703, -66.78517150878906, -60.222068786621094, -53.658966064453125, -47.095863342285156, -40.53276062011719, -33.96965789794922, -27.40655517578125, -20.84345245361328, -14.280349731445312, -7.717247009277344, -1.154144287109375, 5.408958435058594, 11.972061157226562, 18.53516387939453, 25.0982666015625, 31.66136932373047, 38.22447204589844, 44.787574768066406, 51.350677490234375, 57.913780212402344, 64.47688293457031, 71.03998565673828, 77.60308837890625, 84.16619110107422, 90.72929382324219, 97.29239654541016, 103.85549926757812, 110.4186019897461, 116.98170471191406, 123.54480743408203, 130.10791015625, 136.6710205078125, 143.23411560058594, 149.79721069335938, 156.36032104492188, 162.92343139648438, 169.4865264892578, 176.04962158203125, 182.61273193359375]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 8.0, 4.0, 8.0, 17.0, 16.0, 18.0, 23.0, 22.0, 20.0, 33.0, 33.0, 27.0, 36.0, 44.0, 52.0, 47.0, 51.0, 40.0, 36.0, 46.0, 36.0, 44.0, 40.0, 38.0, 28.0, 36.0, 25.0, 38.0, 17.0, 13.0, 22.0, 20.0, 13.0, 9.0, 10.0, 4.0, 4.0, 7.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.8253173828125, -97.4686279296875, -94.1119384765625, -90.7552490234375, -87.3985595703125, -84.0418701171875, -80.6851806640625, -77.3284912109375, -73.9718017578125, -70.6151123046875, -67.2584228515625, -63.9017333984375, -60.5450439453125, -57.1883544921875, -53.8316650390625, -50.4749755859375, -47.118282318115234, -43.761592864990234, -40.404903411865234, -37.048213958740234, -33.691524505615234, -30.3348331451416, -26.9781436920166, -23.6214542388916, -20.2647647857666, -16.9080753326416, -13.551385879516602, -10.194695472717285, -6.838006019592285, -3.4813156127929688, -0.12462615966796875, 3.2320632934570312, 6.588752746582031, 9.945442199707031, 13.302131652832031, 16.65882110595703, 20.01551055908203, 23.372201919555664, 26.728891372680664, 30.085580825805664, 33.44226837158203, 36.79895782470703, 40.15564727783203, 43.51233673095703, 46.86902618408203, 50.22571563720703, 53.58240509033203, 56.93909454345703, 60.2957878112793, 63.6524772644043, 67.00917053222656, 70.36585998535156, 73.72254943847656, 77.07923889160156, 80.43592834472656, 83.79261779785156, 87.14930725097656, 90.50599670410156, 93.86268615722656, 97.21937561035156, 100.57606506347656, 103.93275451660156, 107.28944396972656, 110.64613342285156, 114.00282287597656]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 6.0, 3.0, 13.0, 22.0, 23.0, 39.0, 56.0, 93.0, 180.0, 313.0, 572.0, 1117.0, 2288.0, 4911.0, 10559.0, 25244.0, 68824.0, 288015.0, 3319646.0, 345903.0, 77073.0, 27521.0, 11509.0, 5141.0, 2485.0, 1242.0, 640.0, 319.0, 185.0, 109.0, 91.0, 35.0, 30.0, 26.0, 12.0, 12.0, 5.0, 2.0, 5.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.71875, -32.713623046875, -31.70849609375, -30.703369140625, -29.6982421875, -28.693115234375, -27.68798828125, -26.682861328125, -25.677734375, -24.672607421875, -23.66748046875, -22.662353515625, -21.6572265625, -20.652099609375, -19.64697265625, -18.641845703125, -17.63671875, -16.631591796875, -15.62646484375, -14.621337890625, -13.6162109375, -12.611083984375, -11.60595703125, -10.600830078125, -9.595703125, -8.590576171875, -7.58544921875, -6.580322265625, -5.5751953125, -4.570068359375, -3.56494140625, -2.559814453125, -1.5546875, -0.549560546875, 0.45556640625, 1.460693359375, 2.4658203125, 3.470947265625, 4.47607421875, 5.481201171875, 6.486328125, 7.491455078125, 8.49658203125, 9.501708984375, 10.5068359375, 11.511962890625, 12.51708984375, 13.522216796875, 14.52734375, 15.532470703125, 16.53759765625, 17.542724609375, 18.5478515625, 19.552978515625, 20.55810546875, 21.563232421875, 22.568359375, 23.573486328125, 24.57861328125, 25.583740234375, 26.5888671875, 27.593994140625, 28.59912109375, 29.604248046875, 30.609375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 5.0, 2.0, 4.0, 12.0, 13.0, 16.0, 19.0, 16.0, 19.0, 28.0, 31.0, 34.0, 30.0, 35.0, 41.0, 42.0, 45.0, 48.0, 53.0, 41.0, 58.0, 45.0, 49.0, 46.0, 46.0, 43.0, 28.0, 22.0, 23.0, 23.0, 14.0, 11.0, 15.0, 9.0, 6.0, 8.0, 4.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.84765625, -4.684814453125, -4.52197265625, -4.359130859375, -4.1962890625, -4.033447265625, -3.87060546875, -3.707763671875, -3.544921875, -3.382080078125, -3.21923828125, -3.056396484375, -2.8935546875, -2.730712890625, -2.56787109375, -2.405029296875, -2.2421875, -2.079345703125, -1.91650390625, -1.753662109375, -1.5908203125, -1.427978515625, -1.26513671875, -1.102294921875, -0.939453125, -0.776611328125, -0.61376953125, -0.450927734375, -0.2880859375, -0.125244140625, 0.03759765625, 0.200439453125, 0.36328125, 0.526123046875, 0.68896484375, 0.851806640625, 1.0146484375, 1.177490234375, 1.34033203125, 1.503173828125, 1.666015625, 1.828857421875, 1.99169921875, 2.154541015625, 2.3173828125, 2.480224609375, 2.64306640625, 2.805908203125, 2.96875, 3.131591796875, 3.29443359375, 3.457275390625, 3.6201171875, 3.782958984375, 3.94580078125, 4.108642578125, 4.271484375, 4.434326171875, 4.59716796875, 4.760009765625, 4.9228515625, 5.085693359375, 5.24853515625, 5.411376953125, 5.57421875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 5.0, 8.0, 8.0, 16.0, 22.0, 32.0, 41.0, 59.0, 105.0, 170.0, 253.0, 382.0, 557.0, 824.0, 1361.0, 2158.0, 3878.0, 7259.0, 15879.0, 39632.0, 123335.0, 734130.0, 2928231.0, 228575.0, 62120.0, 22691.0, 10169.0, 5129.0, 2859.0, 1621.0, 971.0, 595.0, 400.0, 262.0, 183.0, 104.0, 82.0, 77.0, 22.0, 20.0, 20.0, 9.0, 18.0, 7.0, 6.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-35.5, -34.39794921875, -33.2958984375, -32.19384765625, -31.091796875, -29.98974609375, -28.8876953125, -27.78564453125, -26.68359375, -25.58154296875, -24.4794921875, -23.37744140625, -22.275390625, -21.17333984375, -20.0712890625, -18.96923828125, -17.8671875, -16.76513671875, -15.6630859375, -14.56103515625, -13.458984375, -12.35693359375, -11.2548828125, -10.15283203125, -9.05078125, -7.94873046875, -6.8466796875, -5.74462890625, -4.642578125, -3.54052734375, -2.4384765625, -1.33642578125, -0.234375, 0.86767578125, 1.9697265625, 3.07177734375, 4.173828125, 5.27587890625, 6.3779296875, 7.47998046875, 8.58203125, 9.68408203125, 10.7861328125, 11.88818359375, 12.990234375, 14.09228515625, 15.1943359375, 16.29638671875, 17.3984375, 18.50048828125, 19.6025390625, 20.70458984375, 21.806640625, 22.90869140625, 24.0107421875, 25.11279296875, 26.21484375, 27.31689453125, 28.4189453125, 29.52099609375, 30.623046875, 31.72509765625, 32.8271484375, 33.92919921875, 35.03125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 6.0, 4.0, 4.0, 3.0, 4.0, 4.0, 11.0, 12.0, 21.0, 23.0, 36.0, 74.0, 85.0, 176.0, 324.0, 1054.0, 1366.0, 355.0, 183.0, 107.0, 61.0, 46.0, 33.0, 30.0, 14.0, 12.0, 8.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.046875, -17.4462890625, -16.845703125, -16.2451171875, -15.64453125, -15.0439453125, -14.443359375, -13.8427734375, -13.2421875, -12.6416015625, -12.041015625, -11.4404296875, -10.83984375, -10.2392578125, -9.638671875, -9.0380859375, -8.4375, -7.8369140625, -7.236328125, -6.6357421875, -6.03515625, -5.4345703125, -4.833984375, -4.2333984375, -3.6328125, -3.0322265625, -2.431640625, -1.8310546875, -1.23046875, -0.6298828125, -0.029296875, 0.5712890625, 1.171875, 1.7724609375, 2.373046875, 2.9736328125, 3.57421875, 4.1748046875, 4.775390625, 5.3759765625, 5.9765625, 6.5771484375, 7.177734375, 7.7783203125, 8.37890625, 8.9794921875, 9.580078125, 10.1806640625, 10.78125, 11.3818359375, 11.982421875, 12.5830078125, 13.18359375, 13.7841796875, 14.384765625, 14.9853515625, 15.5859375, 16.1865234375, 16.787109375, 17.3876953125, 17.98828125, 18.5888671875, 19.189453125, 19.7900390625, 20.390625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 3.0, 4.0, 2.0, 10.0, 10.0, 23.0, 37.0, 62.0, 77.0, 113.0, 113.0, 141.0, 131.0, 79.0, 73.0, 39.0, 40.0, 25.0, 6.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.73176574707031, -97.88178253173828, -94.03179931640625, -90.18182373046875, -86.33184051513672, -82.48185729980469, -78.63187408447266, -74.78189086914062, -70.9319076538086, -67.08192443847656, -63.2319450378418, -59.381961822509766, -55.531978607177734, -51.68199920654297, -47.83201599121094, -43.982032775878906, -40.13205337524414, -36.28207015991211, -32.432090759277344, -28.582107543945312, -24.73212432861328, -20.882143020629883, -17.032161712646484, -13.182178497314453, -9.332197189331055, -5.48221492767334, -1.6322331428527832, 2.2177486419677734, 6.067730903625488, 9.917713165283203, 13.767694473266602, 17.617677688598633, 21.46765899658203, 25.31764030456543, 29.16762351989746, 33.01760482788086, 36.86758804321289, 40.717567443847656, 44.56755065917969, 48.41753387451172, 52.26751708984375, 56.11750030517578, 59.96747970581055, 63.81746292114258, 67.66744232177734, 71.51742553710938, 75.3674087524414, 79.21739196777344, 83.06736755371094, 86.91735076904297, 90.767333984375, 94.6173095703125, 98.46729278564453, 102.31727600097656, 106.1672592163086, 110.01724243164062, 113.86722564697266, 117.71720886230469, 121.56719207763672, 125.41717529296875, 129.26715087890625, 133.1171417236328, 136.9671173095703, 140.81710815429688, 144.66708374023438]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 5.0, 6.0, 7.0, 6.0, 11.0, 18.0, 8.0, 14.0, 11.0, 21.0, 22.0, 19.0, 28.0, 33.0, 25.0, 33.0, 30.0, 30.0, 48.0, 31.0, 46.0, 50.0, 51.0, 43.0, 52.0, 41.0, 30.0, 32.0, 41.0, 16.0, 20.0, 27.0, 20.0, 13.0, 17.0, 18.0, 11.0, 12.0, 11.0, 6.0, 7.0, 5.0, 6.0, 7.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-58.35264587402344, -56.58753967285156, -54.82243347167969, -53.05732345581055, -51.29221725463867, -49.5271110534668, -47.762001037597656, -45.99689483642578, -44.231788635253906, -42.46668243408203, -40.701576232910156, -38.936466217041016, -37.17136001586914, -35.406253814697266, -33.641143798828125, -31.87603759765625, -30.110931396484375, -28.3458251953125, -26.580717086791992, -24.815608978271484, -23.05050277709961, -21.285396575927734, -19.520288467407227, -17.75518035888672, -15.990074157714844, -14.224967002868652, -12.459859848022461, -10.69475269317627, -8.929645538330078, -7.164538383483887, -5.399431228637695, -3.634324073791504, -1.8692207336425781, -0.10411357879638672, 1.6609935760498047, 3.426100730895996, 5.1912078857421875, 6.956315040588379, 8.72142219543457, 10.486529350280762, 12.251636505126953, 14.016743659973145, 15.781850814819336, 17.546958923339844, 19.31206512451172, 21.077171325683594, 22.8422794342041, 24.60738754272461, 26.372493743896484, 28.13759994506836, 29.902708053588867, 31.667816162109375, 33.43292236328125, 35.198028564453125, 36.963134765625, 38.72824478149414, 40.493350982666016, 42.25845718383789, 44.02356719970703, 45.788673400878906, 47.55377960205078, 49.318885803222656, 51.08399200439453, 52.84910202026367, 54.61420822143555]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 8.0, 6.0, 5.0, 4.0, 15.0, 24.0, 23.0, 46.0, 60.0, 80.0, 129.0, 205.0, 324.0, 585.0, 1062.0, 1936.0, 3647.0, 7060.0, 13862.0, 26994.0, 52017.0, 99729.0, 212283.0, 308912.0, 157234.0, 77844.0, 40711.0, 21054.0, 10743.0, 5379.0, 2877.0, 1579.0, 849.0, 471.0, 285.0, 159.0, 101.0, 79.0, 45.0, 36.0, 19.0, 14.0, 19.0, 12.0, 9.0, 7.0, 6.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-20.03125, -19.429931640625, -18.82861328125, -18.227294921875, -17.6259765625, -17.024658203125, -16.42333984375, -15.822021484375, -15.220703125, -14.619384765625, -14.01806640625, -13.416748046875, -12.8154296875, -12.214111328125, -11.61279296875, -11.011474609375, -10.41015625, -9.808837890625, -9.20751953125, -8.606201171875, -8.0048828125, -7.403564453125, -6.80224609375, -6.200927734375, -5.599609375, -4.998291015625, -4.39697265625, -3.795654296875, -3.1943359375, -2.593017578125, -1.99169921875, -1.390380859375, -0.7890625, -0.187744140625, 0.41357421875, 1.014892578125, 1.6162109375, 2.217529296875, 2.81884765625, 3.420166015625, 4.021484375, 4.622802734375, 5.22412109375, 5.825439453125, 6.4267578125, 7.028076171875, 7.62939453125, 8.230712890625, 8.83203125, 9.433349609375, 10.03466796875, 10.635986328125, 11.2373046875, 11.838623046875, 12.43994140625, 13.041259765625, 13.642578125, 14.243896484375, 14.84521484375, 15.446533203125, 16.0478515625, 16.649169921875, 17.25048828125, 17.851806640625, 18.453125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 0.0, 0.0, 3.0, 5.0, 4.0, 4.0, 7.0, 5.0, 11.0, 22.0, 11.0, 17.0, 28.0, 19.0, 29.0, 31.0, 24.0, 34.0, 35.0, 56.0, 49.0, 43.0, 59.0, 47.0, 43.0, 45.0, 61.0, 38.0, 41.0, 40.0, 32.0, 27.0, 23.0, 28.0, 19.0, 18.0, 14.0, 17.0, 6.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.62109375, -5.40606689453125, -5.1910400390625, -4.97601318359375, -4.760986328125, -4.54595947265625, -4.3309326171875, -4.11590576171875, -3.90087890625, -3.68585205078125, -3.4708251953125, -3.25579833984375, -3.040771484375, -2.82574462890625, -2.6107177734375, -2.39569091796875, -2.1806640625, -1.96563720703125, -1.7506103515625, -1.53558349609375, -1.320556640625, -1.10552978515625, -0.8905029296875, -0.67547607421875, -0.46044921875, -0.24542236328125, -0.0303955078125, 0.18463134765625, 0.399658203125, 0.61468505859375, 0.8297119140625, 1.04473876953125, 1.259765625, 1.47479248046875, 1.6898193359375, 1.90484619140625, 2.119873046875, 2.33489990234375, 2.5499267578125, 2.76495361328125, 2.97998046875, 3.19500732421875, 3.4100341796875, 3.62506103515625, 3.840087890625, 4.05511474609375, 4.2701416015625, 4.48516845703125, 4.7001953125, 4.91522216796875, 5.1302490234375, 5.34527587890625, 5.560302734375, 5.77532958984375, 5.9903564453125, 6.20538330078125, 6.42041015625, 6.63543701171875, 6.8504638671875, 7.06549072265625, 7.280517578125, 7.49554443359375, 7.7105712890625, 7.92559814453125, 8.140625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 4.0, 3.0, 10.0, 6.0, 14.0, 16.0, 29.0, 27.0, 32.0, 77.0, 85.0, 120.0, 181.0, 288.0, 499.0, 1016.0, 2216.0, 6702.0, 29668.0, 153558.0, 666412.0, 147907.0, 28644.0, 6472.0, 2170.0, 944.0, 529.0, 299.0, 221.0, 114.0, 97.0, 63.0, 40.0, 29.0, 18.0, 17.0, 11.0, 8.0, 7.0, 7.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-45.28125, -43.84326171875, -42.4052734375, -40.96728515625, -39.529296875, -38.09130859375, -36.6533203125, -35.21533203125, -33.77734375, -32.33935546875, -30.9013671875, -29.46337890625, -28.025390625, -26.58740234375, -25.1494140625, -23.71142578125, -22.2734375, -20.83544921875, -19.3974609375, -17.95947265625, -16.521484375, -15.08349609375, -13.6455078125, -12.20751953125, -10.76953125, -9.33154296875, -7.8935546875, -6.45556640625, -5.017578125, -3.57958984375, -2.1416015625, -0.70361328125, 0.734375, 2.17236328125, 3.6103515625, 5.04833984375, 6.486328125, 7.92431640625, 9.3623046875, 10.80029296875, 12.23828125, 13.67626953125, 15.1142578125, 16.55224609375, 17.990234375, 19.42822265625, 20.8662109375, 22.30419921875, 23.7421875, 25.18017578125, 26.6181640625, 28.05615234375, 29.494140625, 30.93212890625, 32.3701171875, 33.80810546875, 35.24609375, 36.68408203125, 38.1220703125, 39.56005859375, 40.998046875, 42.43603515625, 43.8740234375, 45.31201171875, 46.75]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 7.0, 4.0, 6.0, 9.0, 6.0, 13.0, 9.0, 8.0, 20.0, 20.0, 15.0, 24.0, 26.0, 25.0, 43.0, 41.0, 30.0, 44.0, 41.0, 49.0, 53.0, 54.0, 49.0, 42.0, 54.0, 41.0, 25.0, 47.0, 18.0, 26.0, 16.0, 20.0, 22.0, 17.0, 8.0, 15.0, 10.0, 10.0, 4.0, 3.0, 7.0, 3.0, 4.0, 6.0, 8.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-34.0625, -33.035888671875, -32.00927734375, -30.982666015625, -29.9560546875, -28.929443359375, -27.90283203125, -26.876220703125, -25.849609375, -24.822998046875, -23.79638671875, -22.769775390625, -21.7431640625, -20.716552734375, -19.68994140625, -18.663330078125, -17.63671875, -16.610107421875, -15.58349609375, -14.556884765625, -13.5302734375, -12.503662109375, -11.47705078125, -10.450439453125, -9.423828125, -8.397216796875, -7.37060546875, -6.343994140625, -5.3173828125, -4.290771484375, -3.26416015625, -2.237548828125, -1.2109375, -0.184326171875, 0.84228515625, 1.868896484375, 2.8955078125, 3.922119140625, 4.94873046875, 5.975341796875, 7.001953125, 8.028564453125, 9.05517578125, 10.081787109375, 11.1083984375, 12.135009765625, 13.16162109375, 14.188232421875, 15.21484375, 16.241455078125, 17.26806640625, 18.294677734375, 19.3212890625, 20.347900390625, 21.37451171875, 22.401123046875, 23.427734375, 24.454345703125, 25.48095703125, 26.507568359375, 27.5341796875, 28.560791015625, 29.58740234375, 30.614013671875, 31.640625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 1.0, 3.0, 3.0, 7.0, 5.0, 10.0, 8.0, 10.0, 20.0, 49.0, 76.0, 142.0, 287.0, 679.0, 1635.0, 4485.0, 15226.0, 70702.0, 416399.0, 441991.0, 73538.0, 15622.0, 4570.0, 1723.0, 687.0, 334.0, 149.0, 72.0, 42.0, 27.0, 15.0, 9.0, 8.0, 8.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.328125, -21.608154296875, -20.88818359375, -20.168212890625, -19.4482421875, -18.728271484375, -18.00830078125, -17.288330078125, -16.568359375, -15.848388671875, -15.12841796875, -14.408447265625, -13.6884765625, -12.968505859375, -12.24853515625, -11.528564453125, -10.80859375, -10.088623046875, -9.36865234375, -8.648681640625, -7.9287109375, -7.208740234375, -6.48876953125, -5.768798828125, -5.048828125, -4.328857421875, -3.60888671875, -2.888916015625, -2.1689453125, -1.448974609375, -0.72900390625, -0.009033203125, 0.7109375, 1.430908203125, 2.15087890625, 2.870849609375, 3.5908203125, 4.310791015625, 5.03076171875, 5.750732421875, 6.470703125, 7.190673828125, 7.91064453125, 8.630615234375, 9.3505859375, 10.070556640625, 10.79052734375, 11.510498046875, 12.23046875, 12.950439453125, 13.67041015625, 14.390380859375, 15.1103515625, 15.830322265625, 16.55029296875, 17.270263671875, 17.990234375, 18.710205078125, 19.43017578125, 20.150146484375, 20.8701171875, 21.590087890625, 22.31005859375, 23.030029296875, 23.75]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 7.0, 3.0, 10.0, 10.0, 16.0, 12.0, 11.0, 27.0, 31.0, 44.0, 45.0, 81.0, 160.0, 169.0, 86.0, 60.0, 41.0, 33.0, 31.0, 21.0, 28.0, 15.0, 5.0, 7.0, 10.0, 5.0, 6.0, 4.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.005039215087890625, -0.004900127649307251, -0.004761040210723877, -0.004621952772140503, -0.004482865333557129, -0.004343777894973755, -0.004204690456390381, -0.004065603017807007, -0.003926515579223633, -0.003787428140640259, -0.0036483407020568848, -0.0035092532634735107, -0.0033701658248901367, -0.0032310783863067627, -0.0030919909477233887, -0.0029529035091400146, -0.0028138160705566406, -0.0026747286319732666, -0.0025356411933898926, -0.0023965537548065186, -0.0022574663162231445, -0.0021183788776397705, -0.0019792914390563965, -0.0018402040004730225, -0.0017011165618896484, -0.0015620291233062744, -0.0014229416847229004, -0.0012838542461395264, -0.0011447668075561523, -0.0010056793689727783, -0.0008665919303894043, -0.0007275044918060303, -0.0005884170532226562, -0.0004493296146392822, -0.0003102421760559082, -0.00017115473747253418, -3.2067298889160156e-05, 0.00010702013969421387, 0.0002461075782775879, 0.0003851950168609619, 0.0005242824554443359, 0.00066336989402771, 0.000802457332611084, 0.000941544771194458, 0.001080632209777832, 0.001219719648361206, 0.00135880708694458, 0.001497894525527954, 0.0016369819641113281, 0.0017760694026947021, 0.0019151568412780762, 0.00205424427986145, 0.0021933317184448242, 0.0023324191570281982, 0.0024715065956115723, 0.0026105940341949463, 0.0027496814727783203, 0.0028887689113616943, 0.0030278563499450684, 0.0031669437885284424, 0.0033060312271118164, 0.0034451186656951904, 0.0035842061042785645, 0.0037232935428619385, 0.0038623809814453125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 8.0, 4.0, 7.0, 6.0, 7.0, 14.0, 25.0, 35.0, 70.0, 120.0, 187.0, 355.0, 670.0, 1642.0, 4303.0, 15361.0, 80878.0, 523244.0, 351322.0, 53262.0, 11127.0, 3259.0, 1322.0, 597.0, 293.0, 182.0, 78.0, 59.0, 32.0, 23.0, 15.0, 11.0, 11.0, 7.0, 1.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.28125, -24.462646484375, -23.64404296875, -22.825439453125, -22.0068359375, -21.188232421875, -20.36962890625, -19.551025390625, -18.732421875, -17.913818359375, -17.09521484375, -16.276611328125, -15.4580078125, -14.639404296875, -13.82080078125, -13.002197265625, -12.18359375, -11.364990234375, -10.54638671875, -9.727783203125, -8.9091796875, -8.090576171875, -7.27197265625, -6.453369140625, -5.634765625, -4.816162109375, -3.99755859375, -3.178955078125, -2.3603515625, -1.541748046875, -0.72314453125, 0.095458984375, 0.9140625, 1.732666015625, 2.55126953125, 3.369873046875, 4.1884765625, 5.007080078125, 5.82568359375, 6.644287109375, 7.462890625, 8.281494140625, 9.10009765625, 9.918701171875, 10.7373046875, 11.555908203125, 12.37451171875, 13.193115234375, 14.01171875, 14.830322265625, 15.64892578125, 16.467529296875, 17.2861328125, 18.104736328125, 18.92333984375, 19.741943359375, 20.560546875, 21.379150390625, 22.19775390625, 23.016357421875, 23.8349609375, 24.653564453125, 25.47216796875, 26.290771484375, 27.109375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 6.0, 6.0, 3.0, 6.0, 8.0, 12.0, 13.0, 15.0, 19.0, 30.0, 33.0, 29.0, 48.0, 64.0, 77.0, 89.0, 96.0, 95.0, 73.0, 49.0, 60.0, 26.0, 31.0, 29.0, 17.0, 20.0, 12.0, 10.0, 5.0, 5.0, 3.0, 3.0, 8.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.9375, -16.400146484375, -15.86279296875, -15.325439453125, -14.7880859375, -14.250732421875, -13.71337890625, -13.176025390625, -12.638671875, -12.101318359375, -11.56396484375, -11.026611328125, -10.4892578125, -9.951904296875, -9.41455078125, -8.877197265625, -8.33984375, -7.802490234375, -7.26513671875, -6.727783203125, -6.1904296875, -5.653076171875, -5.11572265625, -4.578369140625, -4.041015625, -3.503662109375, -2.96630859375, -2.428955078125, -1.8916015625, -1.354248046875, -0.81689453125, -0.279541015625, 0.2578125, 0.795166015625, 1.33251953125, 1.869873046875, 2.4072265625, 2.944580078125, 3.48193359375, 4.019287109375, 4.556640625, 5.093994140625, 5.63134765625, 6.168701171875, 6.7060546875, 7.243408203125, 7.78076171875, 8.318115234375, 8.85546875, 9.392822265625, 9.93017578125, 10.467529296875, 11.0048828125, 11.542236328125, 12.07958984375, 12.616943359375, 13.154296875, 13.691650390625, 14.22900390625, 14.766357421875, 15.3037109375, 15.841064453125, 16.37841796875, 16.915771484375, 17.453125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 8.0, 11.0, 16.0, 15.0, 25.0, 63.0, 101.0, 110.0, 130.0, 120.0, 113.0, 99.0, 82.0, 51.0, 22.0, 15.0, 9.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-358.5999755859375, -349.4037170410156, -340.2074890136719, -331.01123046875, -321.81500244140625, -312.6187438964844, -303.4224853515625, -294.22625732421875, -285.0299987792969, -275.833740234375, -266.63751220703125, -257.4412536621094, -248.24501037597656, -239.04876708984375, -229.85250854492188, -220.65626525878906, -211.46002197265625, -202.26377868652344, -193.06753540039062, -183.87127685546875, -174.67503356933594, -165.47879028320312, -156.28253173828125, -147.08628845214844, -137.89004516601562, -128.6938018798828, -119.49755096435547, -110.30130004882812, -101.10505676269531, -91.9088134765625, -82.71256256103516, -73.51631164550781, -64.32005310058594, -55.12380599975586, -45.92755889892578, -36.7313117980957, -27.535064697265625, -18.338817596435547, -9.142570495605469, 0.053680419921875, 9.249923706054688, 18.446170806884766, 27.642417907714844, 36.83866500854492, 46.034912109375, 55.23115921020508, 64.42740631103516, 73.6236572265625, 82.81990051269531, 92.01614379882812, 101.21239471435547, 110.40864562988281, 119.60488891601562, 128.80113220214844, 137.99737548828125, 147.19363403320312, 156.38987731933594, 165.58612060546875, 174.78237915039062, 183.97862243652344, 193.17486572265625, 202.37110900878906, 211.56735229492188, 220.76361083984375, 229.95985412597656]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 12.0, 10.0, 8.0, 8.0, 13.0, 10.0, 17.0, 12.0, 20.0, 14.0, 27.0, 34.0, 20.0, 39.0, 29.0, 45.0, 47.0, 40.0, 41.0, 51.0, 33.0, 43.0, 40.0, 47.0, 34.0, 45.0, 35.0, 31.0, 27.0, 26.0, 15.0, 21.0, 18.0, 16.0, 16.0, 12.0, 7.0, 5.0, 5.0, 5.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-156.96075439453125, -151.72427368164062, -146.48779296875, -141.25131225585938, -136.01483154296875, -130.77835083007812, -125.5418701171875, -120.30538940429688, -115.06890869140625, -109.83242797851562, -104.595947265625, -99.35946655273438, -94.12298583984375, -88.88650512695312, -83.6500244140625, -78.41354370117188, -73.17705535888672, -67.9405746459961, -62.70409393310547, -57.467613220214844, -52.23113250732422, -46.994651794433594, -41.7581672668457, -36.52168655395508, -31.285205841064453, -26.048725128173828, -20.812244415283203, -15.575761795043945, -10.33928108215332, -5.102800369262695, 0.1336822509765625, 5.3701629638671875, 10.606643676757812, 15.843124389648438, 21.079605102539062, 26.31608772277832, 31.552568435668945, 36.78904724121094, 42.02553176879883, 47.26201248168945, 52.49849319458008, 57.7349739074707, 62.97145462036133, 68.20793914794922, 73.44441986083984, 78.68090057373047, 83.9173812866211, 89.15386199951172, 94.39034271240234, 99.62682342529297, 104.8633041381836, 110.09978485107422, 115.33626556396484, 120.57274627685547, 125.80923461914062, 131.04571533203125, 136.28219604492188, 141.5186767578125, 146.75515747070312, 151.99163818359375, 157.22811889648438, 162.464599609375, 167.70108032226562, 172.93756103515625, 178.17404174804688]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 2.0, 4.0, 7.0, 7.0, 17.0, 24.0, 38.0, 43.0, 73.0, 110.0, 140.0, 244.0, 357.0, 576.0, 868.0, 1383.0, 2236.0, 3462.0, 5888.0, 10770.0, 20655.0, 42684.0, 103015.0, 332606.0, 2792714.0, 609992.0, 149825.0, 57973.0, 26559.0, 13499.0, 7284.0, 4271.0, 2574.0, 1583.0, 944.0, 660.0, 417.0, 264.0, 180.0, 117.0, 83.0, 47.0, 31.0, 20.0, 12.0, 10.0, 6.0, 1.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-23.046875, -22.341552734375, -21.63623046875, -20.930908203125, -20.2255859375, -19.520263671875, -18.81494140625, -18.109619140625, -17.404296875, -16.698974609375, -15.99365234375, -15.288330078125, -14.5830078125, -13.877685546875, -13.17236328125, -12.467041015625, -11.76171875, -11.056396484375, -10.35107421875, -9.645751953125, -8.9404296875, -8.235107421875, -7.52978515625, -6.824462890625, -6.119140625, -5.413818359375, -4.70849609375, -4.003173828125, -3.2978515625, -2.592529296875, -1.88720703125, -1.181884765625, -0.4765625, 0.228759765625, 0.93408203125, 1.639404296875, 2.3447265625, 3.050048828125, 3.75537109375, 4.460693359375, 5.166015625, 5.871337890625, 6.57666015625, 7.281982421875, 7.9873046875, 8.692626953125, 9.39794921875, 10.103271484375, 10.80859375, 11.513916015625, 12.21923828125, 12.924560546875, 13.6298828125, 14.335205078125, 15.04052734375, 15.745849609375, 16.451171875, 17.156494140625, 17.86181640625, 18.567138671875, 19.2724609375, 19.977783203125, 20.68310546875, 21.388427734375, 22.09375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 2.0, 9.0, 9.0, 10.0, 8.0, 8.0, 11.0, 18.0, 15.0, 12.0, 18.0, 31.0, 22.0, 26.0, 29.0, 43.0, 48.0, 37.0, 41.0, 41.0, 47.0, 47.0, 37.0, 42.0, 42.0, 39.0, 55.0, 38.0, 31.0, 28.0, 24.0, 17.0, 18.0, 17.0, 12.0, 11.0, 8.0, 15.0, 8.0, 8.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.18359375, -5.98406982421875, -5.7845458984375, -5.58502197265625, -5.385498046875, -5.18597412109375, -4.9864501953125, -4.78692626953125, -4.58740234375, -4.38787841796875, -4.1883544921875, -3.98883056640625, -3.789306640625, -3.58978271484375, -3.3902587890625, -3.19073486328125, -2.9912109375, -2.79168701171875, -2.5921630859375, -2.39263916015625, -2.193115234375, -1.99359130859375, -1.7940673828125, -1.59454345703125, -1.39501953125, -1.19549560546875, -0.9959716796875, -0.79644775390625, -0.596923828125, -0.39739990234375, -0.1978759765625, 0.00164794921875, 0.201171875, 0.40069580078125, 0.6002197265625, 0.79974365234375, 0.999267578125, 1.19879150390625, 1.3983154296875, 1.59783935546875, 1.79736328125, 1.99688720703125, 2.1964111328125, 2.39593505859375, 2.595458984375, 2.79498291015625, 2.9945068359375, 3.19403076171875, 3.3935546875, 3.59307861328125, 3.7926025390625, 3.99212646484375, 4.191650390625, 4.39117431640625, 4.5906982421875, 4.79022216796875, 4.98974609375, 5.18927001953125, 5.3887939453125, 5.58831787109375, 5.787841796875, 5.98736572265625, 6.1868896484375, 6.38641357421875, 6.5859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 4.0, 5.0, 8.0, 7.0, 14.0, 28.0, 22.0, 32.0, 52.0, 78.0, 118.0, 164.0, 303.0, 400.0, 677.0, 1279.0, 2683.0, 6104.0, 16319.0, 55536.0, 311242.0, 3352508.0, 356454.0, 60388.0, 17249.0, 6412.0, 2821.0, 1366.0, 731.0, 421.0, 304.0, 188.0, 123.0, 78.0, 66.0, 44.0, 17.0, 13.0, 8.0, 13.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.5625, -50.8408203125, -49.119140625, -47.3974609375, -45.67578125, -43.9541015625, -42.232421875, -40.5107421875, -38.7890625, -37.0673828125, -35.345703125, -33.6240234375, -31.90234375, -30.1806640625, -28.458984375, -26.7373046875, -25.015625, -23.2939453125, -21.572265625, -19.8505859375, -18.12890625, -16.4072265625, -14.685546875, -12.9638671875, -11.2421875, -9.5205078125, -7.798828125, -6.0771484375, -4.35546875, -2.6337890625, -0.912109375, 0.8095703125, 2.53125, 4.2529296875, 5.974609375, 7.6962890625, 9.41796875, 11.1396484375, 12.861328125, 14.5830078125, 16.3046875, 18.0263671875, 19.748046875, 21.4697265625, 23.19140625, 24.9130859375, 26.634765625, 28.3564453125, 30.078125, 31.7998046875, 33.521484375, 35.2431640625, 36.96484375, 38.6865234375, 40.408203125, 42.1298828125, 43.8515625, 45.5732421875, 47.294921875, 49.0166015625, 50.73828125, 52.4599609375, 54.181640625, 55.9033203125, 57.625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 8.0, 4.0, 17.0, 8.0, 16.0, 24.0, 24.0, 42.0, 54.0, 79.0, 155.0, 281.0, 636.0, 1503.0, 542.0, 265.0, 142.0, 83.0, 59.0, 31.0, 29.0, 22.0, 12.0, 10.0, 8.0, 7.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-30.171875, -29.366455078125, -28.56103515625, -27.755615234375, -26.9501953125, -26.144775390625, -25.33935546875, -24.533935546875, -23.728515625, -22.923095703125, -22.11767578125, -21.312255859375, -20.5068359375, -19.701416015625, -18.89599609375, -18.090576171875, -17.28515625, -16.479736328125, -15.67431640625, -14.868896484375, -14.0634765625, -13.258056640625, -12.45263671875, -11.647216796875, -10.841796875, -10.036376953125, -9.23095703125, -8.425537109375, -7.6201171875, -6.814697265625, -6.00927734375, -5.203857421875, -4.3984375, -3.593017578125, -2.78759765625, -1.982177734375, -1.1767578125, -0.371337890625, 0.43408203125, 1.239501953125, 2.044921875, 2.850341796875, 3.65576171875, 4.461181640625, 5.2666015625, 6.072021484375, 6.87744140625, 7.682861328125, 8.48828125, 9.293701171875, 10.09912109375, 10.904541015625, 11.7099609375, 12.515380859375, 13.32080078125, 14.126220703125, 14.931640625, 15.737060546875, 16.54248046875, 17.347900390625, 18.1533203125, 18.958740234375, 19.76416015625, 20.569580078125, 21.375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 9.0, 7.0, 13.0, 13.0, 33.0, 45.0, 75.0, 107.0, 94.0, 109.0, 117.0, 94.0, 87.0, 65.0, 47.0, 33.0, 26.0, 11.0, 7.0, 6.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-139.55540466308594, -134.26116943359375, -128.96693420410156, -123.6727066040039, -118.37847900390625, -113.08424377441406, -107.79000854492188, -102.49578094482422, -97.20155334472656, -91.90731811523438, -86.61309051513672, -81.31885528564453, -76.02462768554688, -70.73039245605469, -65.4361572265625, -60.141929626464844, -54.847694396972656, -49.553462982177734, -44.25923156738281, -38.964996337890625, -33.67076873779297, -28.376535415649414, -23.08230209350586, -17.788070678710938, -12.493839263916016, -7.1996073722839355, -1.9053754806518555, 3.388856887817383, 8.683088302612305, 13.977319717407227, 19.27155303955078, 24.565784454345703, 29.860015869140625, 35.15424728393555, 40.44847869873047, 45.742713928222656, 51.03694152832031, 56.3311767578125, 61.62540817260742, 66.91963958740234, 72.2138671875, 77.50810241699219, 82.80233001708984, 88.09656524658203, 93.39079284667969, 98.68502807617188, 103.97926330566406, 109.27349090576172, 114.5677261352539, 119.8619613647461, 125.15618896484375, 130.45042419433594, 135.74465942382812, 141.03887939453125, 146.33311462402344, 151.62734985351562, 156.9215850830078, 162.2158203125, 167.5100555419922, 172.8042755126953, 178.0985107421875, 183.3927459716797, 188.68698120117188, 193.981201171875, 199.2754364013672]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 6.0, 4.0, 9.0, 8.0, 13.0, 16.0, 11.0, 18.0, 20.0, 23.0, 37.0, 37.0, 41.0, 32.0, 29.0, 42.0, 45.0, 51.0, 40.0, 59.0, 52.0, 49.0, 44.0, 45.0, 25.0, 37.0, 26.0, 27.0, 22.0, 20.0, 16.0, 26.0, 18.0, 9.0, 10.0, 7.0, 7.0, 3.0, 6.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.6792221069336, -80.02071380615234, -77.3622055053711, -74.70369720458984, -72.0451889038086, -69.38668060302734, -66.7281723022461, -64.06967163085938, -61.41115951538086, -58.75265121459961, -56.09414291381836, -53.43563461303711, -50.777130126953125, -48.118621826171875, -45.460113525390625, -42.801605224609375, -40.143096923828125, -37.484588623046875, -34.826080322265625, -32.167572021484375, -29.509065628051758, -26.850557327270508, -24.19205093383789, -21.53354263305664, -18.87503433227539, -16.21652603149414, -13.558018684387207, -10.899511337280273, -8.241003036499023, -5.582494735717773, -2.92398738861084, -0.26548004150390625, 2.3930282592773438, 5.0515360832214355, 7.710043907165527, 10.368551254272461, 13.027059555053711, 15.685567855834961, 18.344074249267578, 21.002582550048828, 23.661090850830078, 26.319599151611328, 28.978107452392578, 31.636613845825195, 34.29512023925781, 36.95362854003906, 39.61213684082031, 42.27064514160156, 44.92915344238281, 47.58766174316406, 50.24617004394531, 52.90467834472656, 55.56318664550781, 58.22169494628906, 60.88019943237305, 63.5387077331543, 66.19721984863281, 68.85572814941406, 71.51423645019531, 74.17274475097656, 76.83125305175781, 79.48976135253906, 82.14826965332031, 84.80677795410156, 87.46527862548828]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 14.0, 17.0, 13.0, 39.0, 31.0, 72.0, 73.0, 134.0, 208.0, 263.0, 438.0, 763.0, 1208.0, 2179.0, 4013.0, 7395.0, 14004.0, 29473.0, 62589.0, 133566.0, 246375.0, 260315.0, 148172.0, 70217.0, 32852.0, 15825.0, 8033.0, 4352.0, 2284.0, 1345.0, 811.0, 529.0, 318.0, 200.0, 140.0, 90.0, 68.0, 38.0, 28.0, 20.0, 17.0, 2.0, 10.0, 3.0, 4.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.4375, -19.80029296875, -19.1630859375, -18.52587890625, -17.888671875, -17.25146484375, -16.6142578125, -15.97705078125, -15.33984375, -14.70263671875, -14.0654296875, -13.42822265625, -12.791015625, -12.15380859375, -11.5166015625, -10.87939453125, -10.2421875, -9.60498046875, -8.9677734375, -8.33056640625, -7.693359375, -7.05615234375, -6.4189453125, -5.78173828125, -5.14453125, -4.50732421875, -3.8701171875, -3.23291015625, -2.595703125, -1.95849609375, -1.3212890625, -0.68408203125, -0.046875, 0.59033203125, 1.2275390625, 1.86474609375, 2.501953125, 3.13916015625, 3.7763671875, 4.41357421875, 5.05078125, 5.68798828125, 6.3251953125, 6.96240234375, 7.599609375, 8.23681640625, 8.8740234375, 9.51123046875, 10.1484375, 10.78564453125, 11.4228515625, 12.06005859375, 12.697265625, 13.33447265625, 13.9716796875, 14.60888671875, 15.24609375, 15.88330078125, 16.5205078125, 17.15771484375, 17.794921875, 18.43212890625, 19.0693359375, 19.70654296875, 20.34375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 9.0, 6.0, 9.0, 3.0, 5.0, 11.0, 14.0, 14.0, 20.0, 31.0, 31.0, 32.0, 36.0, 42.0, 34.0, 39.0, 45.0, 37.0, 56.0, 49.0, 51.0, 38.0, 47.0, 45.0, 47.0, 39.0, 37.0, 36.0, 17.0, 22.0, 19.0, 20.0, 14.0, 14.0, 8.0, 8.0, 5.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-9.4609375, -9.1990966796875, -8.937255859375, -8.6754150390625, -8.41357421875, -8.1517333984375, -7.889892578125, -7.6280517578125, -7.3662109375, -7.1043701171875, -6.842529296875, -6.5806884765625, -6.31884765625, -6.0570068359375, -5.795166015625, -5.5333251953125, -5.271484375, -5.0096435546875, -4.747802734375, -4.4859619140625, -4.22412109375, -3.9622802734375, -3.700439453125, -3.4385986328125, -3.1767578125, -2.9149169921875, -2.653076171875, -2.3912353515625, -2.12939453125, -1.8675537109375, -1.605712890625, -1.3438720703125, -1.08203125, -0.8201904296875, -0.558349609375, -0.2965087890625, -0.03466796875, 0.2271728515625, 0.489013671875, 0.7508544921875, 1.0126953125, 1.2745361328125, 1.536376953125, 1.7982177734375, 2.06005859375, 2.3218994140625, 2.583740234375, 2.8455810546875, 3.107421875, 3.3692626953125, 3.631103515625, 3.8929443359375, 4.15478515625, 4.4166259765625, 4.678466796875, 4.9403076171875, 5.2021484375, 5.4639892578125, 5.725830078125, 5.9876708984375, 6.24951171875, 6.5113525390625, 6.773193359375, 7.0350341796875, 7.296875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 10.0, 14.0, 18.0, 22.0, 36.0, 46.0, 91.0, 118.0, 193.0, 295.0, 506.0, 965.0, 2415.0, 9078.0, 54429.0, 436372.0, 470176.0, 59100.0, 9756.0, 2530.0, 1023.0, 519.0, 274.0, 206.0, 114.0, 70.0, 52.0, 39.0, 32.0, 14.0, 8.0, 12.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.71875, -47.0400390625, -45.361328125, -43.6826171875, -42.00390625, -40.3251953125, -38.646484375, -36.9677734375, -35.2890625, -33.6103515625, -31.931640625, -30.2529296875, -28.57421875, -26.8955078125, -25.216796875, -23.5380859375, -21.859375, -20.1806640625, -18.501953125, -16.8232421875, -15.14453125, -13.4658203125, -11.787109375, -10.1083984375, -8.4296875, -6.7509765625, -5.072265625, -3.3935546875, -1.71484375, -0.0361328125, 1.642578125, 3.3212890625, 5.0, 6.6787109375, 8.357421875, 10.0361328125, 11.71484375, 13.3935546875, 15.072265625, 16.7509765625, 18.4296875, 20.1083984375, 21.787109375, 23.4658203125, 25.14453125, 26.8232421875, 28.501953125, 30.1806640625, 31.859375, 33.5380859375, 35.216796875, 36.8955078125, 38.57421875, 40.2529296875, 41.931640625, 43.6103515625, 45.2890625, 46.9677734375, 48.646484375, 50.3251953125, 52.00390625, 53.6826171875, 55.361328125, 57.0400390625, 58.71875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 2.0, 11.0, 7.0, 6.0, 24.0, 13.0, 17.0, 25.0, 21.0, 25.0, 26.0, 42.0, 36.0, 45.0, 37.0, 44.0, 44.0, 42.0, 49.0, 59.0, 38.0, 53.0, 36.0, 43.0, 33.0, 37.0, 27.0, 25.0, 23.0, 23.0, 22.0, 10.0, 12.0, 9.0, 9.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.21875, -38.80517578125, -37.3916015625, -35.97802734375, -34.564453125, -33.15087890625, -31.7373046875, -30.32373046875, -28.91015625, -27.49658203125, -26.0830078125, -24.66943359375, -23.255859375, -21.84228515625, -20.4287109375, -19.01513671875, -17.6015625, -16.18798828125, -14.7744140625, -13.36083984375, -11.947265625, -10.53369140625, -9.1201171875, -7.70654296875, -6.29296875, -4.87939453125, -3.4658203125, -2.05224609375, -0.638671875, 0.77490234375, 2.1884765625, 3.60205078125, 5.015625, 6.42919921875, 7.8427734375, 9.25634765625, 10.669921875, 12.08349609375, 13.4970703125, 14.91064453125, 16.32421875, 17.73779296875, 19.1513671875, 20.56494140625, 21.978515625, 23.39208984375, 24.8056640625, 26.21923828125, 27.6328125, 29.04638671875, 30.4599609375, 31.87353515625, 33.287109375, 34.70068359375, 36.1142578125, 37.52783203125, 38.94140625, 40.35498046875, 41.7685546875, 43.18212890625, 44.595703125, 46.00927734375, 47.4228515625, 48.83642578125, 50.25]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 14.0, 17.0, 20.0, 39.0, 73.0, 205.0, 1092.0, 17702.0, 893993.0, 131355.0, 3375.0, 448.0, 101.0, 49.0, 25.0, 16.0, 13.0, 9.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.25, -79.7373046875, -77.224609375, -74.7119140625, -72.19921875, -69.6865234375, -67.173828125, -64.6611328125, -62.1484375, -59.6357421875, -57.123046875, -54.6103515625, -52.09765625, -49.5849609375, -47.072265625, -44.5595703125, -42.046875, -39.5341796875, -37.021484375, -34.5087890625, -31.99609375, -29.4833984375, -26.970703125, -24.4580078125, -21.9453125, -19.4326171875, -16.919921875, -14.4072265625, -11.89453125, -9.3818359375, -6.869140625, -4.3564453125, -1.84375, 0.6689453125, 3.181640625, 5.6943359375, 8.20703125, 10.7197265625, 13.232421875, 15.7451171875, 18.2578125, 20.7705078125, 23.283203125, 25.7958984375, 28.30859375, 30.8212890625, 33.333984375, 35.8466796875, 38.359375, 40.8720703125, 43.384765625, 45.8974609375, 48.41015625, 50.9228515625, 53.435546875, 55.9482421875, 58.4609375, 60.9736328125, 63.486328125, 65.9990234375, 68.51171875, 71.0244140625, 73.537109375, 76.0498046875, 78.5625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 6.0, 9.0, 6.0, 13.0, 10.0, 13.0, 25.0, 27.0, 44.0, 40.0, 49.0, 56.0, 81.0, 91.0, 111.0, 86.0, 67.0, 43.0, 50.0, 44.0, 29.0, 25.0, 18.0, 8.0, 12.0, 8.0, 3.0, 7.0, 7.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004119873046875, -0.003968477249145508, -0.0038170814514160156, -0.0036656856536865234, -0.0035142898559570312, -0.003362894058227539, -0.003211498260498047, -0.0030601024627685547, -0.0029087066650390625, -0.0027573108673095703, -0.002605915069580078, -0.002454519271850586, -0.0023031234741210938, -0.0021517276763916016, -0.0020003318786621094, -0.0018489360809326172, -0.001697540283203125, -0.0015461444854736328, -0.0013947486877441406, -0.0012433528900146484, -0.0010919570922851562, -0.0009405612945556641, -0.0007891654968261719, -0.0006377696990966797, -0.0004863739013671875, -0.0003349781036376953, -0.00018358230590820312, -3.218650817871094e-05, 0.00011920928955078125, 0.00027060508728027344, 0.0004220008850097656, 0.0005733966827392578, 0.00072479248046875, 0.0008761882781982422, 0.0010275840759277344, 0.0011789798736572266, 0.0013303756713867188, 0.001481771469116211, 0.0016331672668457031, 0.0017845630645751953, 0.0019359588623046875, 0.0020873546600341797, 0.002238750457763672, 0.002390146255493164, 0.0025415420532226562, 0.0026929378509521484, 0.0028443336486816406, 0.002995729446411133, 0.003147125244140625, 0.003298521041870117, 0.0034499168395996094, 0.0036013126373291016, 0.0037527084350585938, 0.003904104232788086, 0.004055500030517578, 0.00420689582824707, 0.0043582916259765625, 0.004509687423706055, 0.004661083221435547, 0.004812479019165039, 0.004963874816894531, 0.0051152706146240234, 0.005266666412353516, 0.005418062210083008, 0.0055694580078125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 6.0, 5.0, 4.0, 11.0, 11.0, 22.0, 20.0, 40.0, 65.0, 130.0, 212.0, 513.0, 1267.0, 3715.0, 14455.0, 96760.0, 653102.0, 240841.0, 27933.0, 6134.0, 1947.0, 687.0, 331.0, 129.0, 84.0, 44.0, 22.0, 15.0, 14.0, 8.0, 11.0, 3.0, 4.0, 3.0, 5.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.609375, -29.504150390625, -28.39892578125, -27.293701171875, -26.1884765625, -25.083251953125, -23.97802734375, -22.872802734375, -21.767578125, -20.662353515625, -19.55712890625, -18.451904296875, -17.3466796875, -16.241455078125, -15.13623046875, -14.031005859375, -12.92578125, -11.820556640625, -10.71533203125, -9.610107421875, -8.5048828125, -7.399658203125, -6.29443359375, -5.189208984375, -4.083984375, -2.978759765625, -1.87353515625, -0.768310546875, 0.3369140625, 1.442138671875, 2.54736328125, 3.652587890625, 4.7578125, 5.863037109375, 6.96826171875, 8.073486328125, 9.1787109375, 10.283935546875, 11.38916015625, 12.494384765625, 13.599609375, 14.704833984375, 15.81005859375, 16.915283203125, 18.0205078125, 19.125732421875, 20.23095703125, 21.336181640625, 22.44140625, 23.546630859375, 24.65185546875, 25.757080078125, 26.8623046875, 27.967529296875, 29.07275390625, 30.177978515625, 31.283203125, 32.388427734375, 33.49365234375, 34.598876953125, 35.7041015625, 36.809326171875, 37.91455078125, 39.019775390625, 40.125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 11.0, 10.0, 20.0, 24.0, 63.0, 93.0, 116.0, 133.0, 136.0, 133.0, 95.0, 47.0, 51.0, 29.0, 12.0, 13.0, 7.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.390625, -28.346923828125, -27.30322265625, -26.259521484375, -25.2158203125, -24.172119140625, -23.12841796875, -22.084716796875, -21.041015625, -19.997314453125, -18.95361328125, -17.909912109375, -16.8662109375, -15.822509765625, -14.77880859375, -13.735107421875, -12.69140625, -11.647705078125, -10.60400390625, -9.560302734375, -8.5166015625, -7.472900390625, -6.42919921875, -5.385498046875, -4.341796875, -3.298095703125, -2.25439453125, -1.210693359375, -0.1669921875, 0.876708984375, 1.92041015625, 2.964111328125, 4.0078125, 5.051513671875, 6.09521484375, 7.138916015625, 8.1826171875, 9.226318359375, 10.27001953125, 11.313720703125, 12.357421875, 13.401123046875, 14.44482421875, 15.488525390625, 16.5322265625, 17.575927734375, 18.61962890625, 19.663330078125, 20.70703125, 21.750732421875, 22.79443359375, 23.838134765625, 24.8818359375, 25.925537109375, 26.96923828125, 28.012939453125, 29.056640625, 30.100341796875, 31.14404296875, 32.187744140625, 33.2314453125, 34.275146484375, 35.31884765625, 36.362548828125, 37.40625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 7.0, 29.0, 111.0, 353.0, 370.0, 119.0, 20.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-249.05770874023438, -214.02015686035156, -178.98260498046875, -143.94505310058594, -108.90750122070312, -73.86994934082031, -38.8323974609375, -3.7948455810546875, 31.242706298828125, 66.28025817871094, 101.31781005859375, 136.35536193847656, 171.39291381835938, 206.4304656982422, 241.468017578125, 276.50555419921875, 311.5431213378906, 346.5806884765625, 381.61822509765625, 416.65576171875, 451.6933288574219, 486.73089599609375, 521.7684326171875, 556.8059692382812, 591.843505859375, 626.8810424804688, 661.9185791015625, 696.9561767578125, 731.9937133789062, 767.03125, 802.06884765625, 837.1063842773438, 872.1439208984375, 907.1814575195312, 942.218994140625, 977.256591796875, 1012.2941284179688, 1047.3316650390625, 1082.3692626953125, 1117.40673828125, 1152.4443359375, 1187.48193359375, 1222.5194091796875, 1257.5570068359375, 1292.594482421875, 1327.632080078125, 1362.669677734375, 1397.7071533203125, 1432.7447509765625, 1467.7823486328125, 1502.81982421875, 1537.857421875, 1572.89501953125, 1607.9324951171875, 1642.9700927734375, 1678.007568359375, 1713.045166015625, 1748.082763671875, 1783.1202392578125, 1818.1578369140625, 1853.1953125, 1888.23291015625, 1923.2705078125, 1958.3079833984375, 1993.3455810546875]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 8.0, 6.0, 9.0, 9.0, 5.0, 14.0, 6.0, 12.0, 9.0, 26.0, 24.0, 30.0, 22.0, 27.0, 34.0, 36.0, 41.0, 37.0, 47.0, 43.0, 52.0, 49.0, 43.0, 41.0, 46.0, 44.0, 37.0, 36.0, 38.0, 30.0, 17.0, 21.0, 11.0, 14.0, 14.0, 17.0, 6.0, 14.0, 12.0, 3.0, 5.0, 2.0, 4.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-222.6886749267578, -215.6664581298828, -208.6442413330078, -201.6220245361328, -194.5998077392578, -187.5775909423828, -180.55535888671875, -173.53314208984375, -166.51092529296875, -159.48870849609375, -152.46649169921875, -145.44427490234375, -138.42205810546875, -131.39984130859375, -124.37761688232422, -117.35540008544922, -110.33319091796875, -103.31097412109375, -96.28875732421875, -89.26654052734375, -82.24432373046875, -75.22210693359375, -68.19988250732422, -61.17766571044922, -54.15544891357422, -47.13323211669922, -40.11101531982422, -33.08879470825195, -26.066577911376953, -19.044361114501953, -12.022140502929688, -4.9999237060546875, 2.022308349609375, 9.044526100158691, 16.066743850708008, 23.08896255493164, 30.11117935180664, 37.13339614868164, 44.155616760253906, 51.177833557128906, 58.200050354003906, 65.2222671508789, 72.2444839477539, 79.26670837402344, 86.28892517089844, 93.31114196777344, 100.33335876464844, 107.35557556152344, 114.37779235839844, 121.40000915527344, 128.42222595214844, 135.44444274902344, 142.46665954589844, 149.48887634277344, 156.5111083984375, 163.5333251953125, 170.5555419921875, 177.5777587890625, 184.5999755859375, 191.6221923828125, 198.6444091796875, 205.6666259765625, 212.6888427734375, 219.7110595703125, 226.7332763671875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 7.0, 8.0, 9.0, 13.0, 21.0, 22.0, 31.0, 38.0, 69.0, 89.0, 142.0, 153.0, 243.0, 403.0, 540.0, 948.0, 1575.0, 3070.0, 6191.0, 16092.0, 66717.0, 3891421.0, 163629.0, 25702.0, 8409.0, 3651.0, 1986.0, 1156.0, 608.0, 438.0, 266.0, 184.0, 131.0, 83.0, 69.0, 46.0, 28.0, 21.0, 13.0, 16.0, 15.0, 11.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-48.1875, -46.71337890625, -45.2392578125, -43.76513671875, -42.291015625, -40.81689453125, -39.3427734375, -37.86865234375, -36.39453125, -34.92041015625, -33.4462890625, -31.97216796875, -30.498046875, -29.02392578125, -27.5498046875, -26.07568359375, -24.6015625, -23.12744140625, -21.6533203125, -20.17919921875, -18.705078125, -17.23095703125, -15.7568359375, -14.28271484375, -12.80859375, -11.33447265625, -9.8603515625, -8.38623046875, -6.912109375, -5.43798828125, -3.9638671875, -2.48974609375, -1.015625, 0.45849609375, 1.9326171875, 3.40673828125, 4.880859375, 6.35498046875, 7.8291015625, 9.30322265625, 10.77734375, 12.25146484375, 13.7255859375, 15.19970703125, 16.673828125, 18.14794921875, 19.6220703125, 21.09619140625, 22.5703125, 24.04443359375, 25.5185546875, 26.99267578125, 28.466796875, 29.94091796875, 31.4150390625, 32.88916015625, 34.36328125, 35.83740234375, 37.3115234375, 38.78564453125, 40.259765625, 41.73388671875, 43.2080078125, 44.68212890625, 46.15625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 9.0, 2.0, 4.0, 16.0, 13.0, 17.0, 30.0, 26.0, 37.0, 31.0, 32.0, 44.0, 57.0, 53.0, 61.0, 53.0, 49.0, 57.0, 54.0, 56.0, 47.0, 38.0, 34.0, 35.0, 30.0, 29.0, 26.0, 8.0, 17.0, 8.0, 11.0, 4.0, 9.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4140625, -10.0701904296875, -9.726318359375, -9.3824462890625, -9.03857421875, -8.6947021484375, -8.350830078125, -8.0069580078125, -7.6630859375, -7.3192138671875, -6.975341796875, -6.6314697265625, -6.28759765625, -5.9437255859375, -5.599853515625, -5.2559814453125, -4.912109375, -4.5682373046875, -4.224365234375, -3.8804931640625, -3.53662109375, -3.1927490234375, -2.848876953125, -2.5050048828125, -2.1611328125, -1.8172607421875, -1.473388671875, -1.1295166015625, -0.78564453125, -0.4417724609375, -0.097900390625, 0.2459716796875, 0.58984375, 0.9337158203125, 1.277587890625, 1.6214599609375, 1.96533203125, 2.3092041015625, 2.653076171875, 2.9969482421875, 3.3408203125, 3.6846923828125, 4.028564453125, 4.3724365234375, 4.71630859375, 5.0601806640625, 5.404052734375, 5.7479248046875, 6.091796875, 6.4356689453125, 6.779541015625, 7.1234130859375, 7.46728515625, 7.8111572265625, 8.155029296875, 8.4989013671875, 8.8427734375, 9.1866455078125, 9.530517578125, 9.8743896484375, 10.21826171875, 10.5621337890625, 10.906005859375, 11.2498779296875, 11.59375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 6.0, 3.0, 4.0, 7.0, 6.0, 11.0, 18.0, 25.0, 41.0, 42.0, 70.0, 109.0, 149.0, 214.0, 335.0, 542.0, 896.0, 1565.0, 3238.0, 7489.0, 32374.0, 3946760.0, 174303.0, 15362.0, 5042.0, 2470.0, 1231.0, 696.0, 428.0, 281.0, 200.0, 104.0, 84.0, 53.0, 39.0, 27.0, 17.0, 21.0, 9.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-111.9375, -108.89453125, -105.8515625, -102.80859375, -99.765625, -96.72265625, -93.6796875, -90.63671875, -87.59375, -84.55078125, -81.5078125, -78.46484375, -75.421875, -72.37890625, -69.3359375, -66.29296875, -63.25, -60.20703125, -57.1640625, -54.12109375, -51.078125, -48.03515625, -44.9921875, -41.94921875, -38.90625, -35.86328125, -32.8203125, -29.77734375, -26.734375, -23.69140625, -20.6484375, -17.60546875, -14.5625, -11.51953125, -8.4765625, -5.43359375, -2.390625, 0.65234375, 3.6953125, 6.73828125, 9.78125, 12.82421875, 15.8671875, 18.91015625, 21.953125, 24.99609375, 28.0390625, 31.08203125, 34.125, 37.16796875, 40.2109375, 43.25390625, 46.296875, 49.33984375, 52.3828125, 55.42578125, 58.46875, 61.51171875, 64.5546875, 67.59765625, 70.640625, 73.68359375, 76.7265625, 79.76953125, 82.8125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 6.0, 11.0, 9.0, 15.0, 37.0, 85.0, 439.0, 3191.0, 152.0, 54.0, 32.0, 9.0, 7.0, 6.0, 8.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-24.28125, -23.6627197265625, -23.044189453125, -22.4256591796875, -21.80712890625, -21.1885986328125, -20.570068359375, -19.9515380859375, -19.3330078125, -18.7144775390625, -18.095947265625, -17.4774169921875, -16.85888671875, -16.2403564453125, -15.621826171875, -15.0032958984375, -14.384765625, -13.7662353515625, -13.147705078125, -12.5291748046875, -11.91064453125, -11.2921142578125, -10.673583984375, -10.0550537109375, -9.4365234375, -8.8179931640625, -8.199462890625, -7.5809326171875, -6.96240234375, -6.3438720703125, -5.725341796875, -5.1068115234375, -4.48828125, -3.8697509765625, -3.251220703125, -2.6326904296875, -2.01416015625, -1.3956298828125, -0.777099609375, -0.1585693359375, 0.4599609375, 1.0784912109375, 1.697021484375, 2.3155517578125, 2.93408203125, 3.5526123046875, 4.171142578125, 4.7896728515625, 5.408203125, 6.0267333984375, 6.645263671875, 7.2637939453125, 7.88232421875, 8.5008544921875, 9.119384765625, 9.7379150390625, 10.3564453125, 10.9749755859375, 11.593505859375, 12.2120361328125, 12.83056640625, 13.4490966796875, 14.067626953125, 14.6861572265625, 15.3046875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 7.0, 3.0, 3.0, 5.0, 7.0, 9.0, 14.0, 23.0, 34.0, 35.0, 46.0, 54.0, 71.0, 80.0, 77.0, 97.0, 90.0, 79.0, 72.0, 66.0, 30.0, 32.0, 21.0, 17.0, 7.0, 5.0, 11.0, 3.0, 7.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.845252990722656, -47.290611267089844, -45.73596954345703, -44.18132781982422, -42.626686096191406, -41.072044372558594, -39.51740264892578, -37.96276092529297, -36.408119201660156, -34.853477478027344, -33.29883575439453, -31.74419403076172, -30.189552307128906, -28.634910583496094, -27.08026885986328, -25.52562713623047, -23.970985412597656, -22.416343688964844, -20.86170196533203, -19.30706024169922, -17.752418518066406, -16.197776794433594, -14.643135070800781, -13.088493347167969, -11.533851623535156, -9.979209899902344, -8.424568176269531, -6.869926452636719, -5.315284729003906, -3.7606430053710938, -2.2060012817382812, -0.6513595581054688, 0.9032821655273438, 2.4579238891601562, 4.012565612792969, 5.567207336425781, 7.121849060058594, 8.676490783691406, 10.231132507324219, 11.785774230957031, 13.340415954589844, 14.895057678222656, 16.44969940185547, 18.00434112548828, 19.558982849121094, 21.113624572753906, 22.66826629638672, 24.22290802001953, 25.777549743652344, 27.332191467285156, 28.88683319091797, 30.44147491455078, 31.996116638183594, 33.550758361816406, 35.10540008544922, 36.66004180908203, 38.214683532714844, 39.769325256347656, 41.32396697998047, 42.87860870361328, 44.433250427246094, 45.987892150878906, 47.54253387451172, 49.09717559814453, 50.651817321777344]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 2.0, 9.0, 7.0, 17.0, 19.0, 15.0, 18.0, 23.0, 23.0, 34.0, 35.0, 33.0, 42.0, 37.0, 41.0, 46.0, 41.0, 36.0, 57.0, 40.0, 35.0, 44.0, 33.0, 32.0, 44.0, 28.0, 21.0, 34.0, 22.0, 24.0, 19.0, 14.0, 11.0, 7.0, 14.0, 7.0, 6.0, 4.0, 7.0, 1.0, 7.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.44331359863281, -32.43024826049805, -31.417186737060547, -30.404123306274414, -29.39105987548828, -28.377994537353516, -27.364931106567383, -26.35186767578125, -25.338804244995117, -24.325740814208984, -23.31267738342285, -22.29961395263672, -21.286548614501953, -20.273487091064453, -19.260421752929688, -18.247358322143555, -17.234294891357422, -16.22123146057129, -15.208168029785156, -14.195103645324707, -13.182040214538574, -12.168976783752441, -11.155912399291992, -10.14284896850586, -9.129785537719727, -8.116722106933594, -7.103658199310303, -6.090594291687012, -5.077530860900879, -4.064467430114746, -3.051403522491455, -2.038339614868164, -1.025278091430664, -0.012214422225952148, 1.0008492469787598, 2.0139129161834717, 3.0269765853881836, 4.040040016174316, 5.053103923797607, 6.066167831420898, 7.079231262207031, 8.092294692993164, 9.105358123779297, 10.118422508239746, 11.131485939025879, 12.144549369812012, 13.157613754272461, 14.170677185058594, 15.183740615844727, 16.19680404663086, 17.209867477416992, 18.222930908203125, 19.23599624633789, 20.24905776977539, 21.262123107910156, 22.27518653869629, 23.288249969482422, 24.301313400268555, 25.314376831054688, 26.32744026184082, 27.340503692626953, 28.35356903076172, 29.36663246154785, 30.379695892333984, 31.392759323120117]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 2.0, 4.0, 6.0, 10.0, 7.0, 10.0, 19.0, 17.0, 21.0, 54.0, 63.0, 111.0, 189.0, 384.0, 715.0, 1520.0, 3047.0, 7063.0, 16051.0, 38311.0, 90190.0, 198487.0, 299391.0, 216272.0, 101196.0, 42568.0, 18012.0, 7930.0, 3448.0, 1672.0, 807.0, 395.0, 217.0, 133.0, 82.0, 58.0, 30.0, 17.0, 10.0, 11.0, 14.0, 6.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.78125, -26.95361328125, -26.1259765625, -25.29833984375, -24.470703125, -23.64306640625, -22.8154296875, -21.98779296875, -21.16015625, -20.33251953125, -19.5048828125, -18.67724609375, -17.849609375, -17.02197265625, -16.1943359375, -15.36669921875, -14.5390625, -13.71142578125, -12.8837890625, -12.05615234375, -11.228515625, -10.40087890625, -9.5732421875, -8.74560546875, -7.91796875, -7.09033203125, -6.2626953125, -5.43505859375, -4.607421875, -3.77978515625, -2.9521484375, -2.12451171875, -1.296875, -0.46923828125, 0.3583984375, 1.18603515625, 2.013671875, 2.84130859375, 3.6689453125, 4.49658203125, 5.32421875, 6.15185546875, 6.9794921875, 7.80712890625, 8.634765625, 9.46240234375, 10.2900390625, 11.11767578125, 11.9453125, 12.77294921875, 13.6005859375, 14.42822265625, 15.255859375, 16.08349609375, 16.9111328125, 17.73876953125, 18.56640625, 19.39404296875, 20.2216796875, 21.04931640625, 21.876953125, 22.70458984375, 23.5322265625, 24.35986328125, 25.1875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 5.0, 10.0, 3.0, 6.0, 10.0, 18.0, 14.0, 8.0, 20.0, 28.0, 19.0, 29.0, 26.0, 39.0, 50.0, 40.0, 37.0, 50.0, 46.0, 46.0, 50.0, 38.0, 33.0, 44.0, 51.0, 40.0, 41.0, 30.0, 26.0, 26.0, 20.0, 25.0, 15.0, 11.0, 16.0, 7.0, 8.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.140625, -10.7989501953125, -10.457275390625, -10.1156005859375, -9.77392578125, -9.4322509765625, -9.090576171875, -8.7489013671875, -8.4072265625, -8.0655517578125, -7.723876953125, -7.3822021484375, -7.04052734375, -6.6988525390625, -6.357177734375, -6.0155029296875, -5.673828125, -5.3321533203125, -4.990478515625, -4.6488037109375, -4.30712890625, -3.9654541015625, -3.623779296875, -3.2821044921875, -2.9404296875, -2.5987548828125, -2.257080078125, -1.9154052734375, -1.57373046875, -1.2320556640625, -0.890380859375, -0.5487060546875, -0.20703125, 0.1346435546875, 0.476318359375, 0.8179931640625, 1.15966796875, 1.5013427734375, 1.843017578125, 2.1846923828125, 2.5263671875, 2.8680419921875, 3.209716796875, 3.5513916015625, 3.89306640625, 4.2347412109375, 4.576416015625, 4.9180908203125, 5.259765625, 5.6014404296875, 5.943115234375, 6.2847900390625, 6.62646484375, 6.9681396484375, 7.309814453125, 7.6514892578125, 7.9931640625, 8.3348388671875, 8.676513671875, 9.0181884765625, 9.35986328125, 9.7015380859375, 10.043212890625, 10.3848876953125, 10.7265625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 10.0, 11.0, 20.0, 18.0, 16.0, 36.0, 44.0, 47.0, 87.0, 117.0, 201.0, 309.0, 511.0, 898.0, 1882.0, 5285.0, 20928.0, 111081.0, 535714.0, 301739.0, 51881.0, 11157.0, 3371.0, 1320.0, 675.0, 391.0, 274.0, 158.0, 110.0, 70.0, 50.0, 32.0, 27.0, 25.0, 18.0, 12.0, 8.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.8125, -46.25927734375, -44.7060546875, -43.15283203125, -41.599609375, -40.04638671875, -38.4931640625, -36.93994140625, -35.38671875, -33.83349609375, -32.2802734375, -30.72705078125, -29.173828125, -27.62060546875, -26.0673828125, -24.51416015625, -22.9609375, -21.40771484375, -19.8544921875, -18.30126953125, -16.748046875, -15.19482421875, -13.6416015625, -12.08837890625, -10.53515625, -8.98193359375, -7.4287109375, -5.87548828125, -4.322265625, -2.76904296875, -1.2158203125, 0.33740234375, 1.890625, 3.44384765625, 4.9970703125, 6.55029296875, 8.103515625, 9.65673828125, 11.2099609375, 12.76318359375, 14.31640625, 15.86962890625, 17.4228515625, 18.97607421875, 20.529296875, 22.08251953125, 23.6357421875, 25.18896484375, 26.7421875, 28.29541015625, 29.8486328125, 31.40185546875, 32.955078125, 34.50830078125, 36.0615234375, 37.61474609375, 39.16796875, 40.72119140625, 42.2744140625, 43.82763671875, 45.380859375, 46.93408203125, 48.4873046875, 50.04052734375, 51.59375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 2.0, 4.0, 4.0, 5.0, 6.0, 9.0, 13.0, 8.0, 10.0, 11.0, 17.0, 20.0, 13.0, 25.0, 18.0, 21.0, 33.0, 35.0, 42.0, 47.0, 44.0, 44.0, 44.0, 29.0, 41.0, 44.0, 37.0, 46.0, 45.0, 28.0, 39.0, 26.0, 20.0, 19.0, 23.0, 24.0, 14.0, 17.0, 13.0, 12.0, 7.0, 12.0, 5.0, 9.0, 7.0, 2.0, 2.0, 3.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-53.125, -51.4990234375, -49.873046875, -48.2470703125, -46.62109375, -44.9951171875, -43.369140625, -41.7431640625, -40.1171875, -38.4912109375, -36.865234375, -35.2392578125, -33.61328125, -31.9873046875, -30.361328125, -28.7353515625, -27.109375, -25.4833984375, -23.857421875, -22.2314453125, -20.60546875, -18.9794921875, -17.353515625, -15.7275390625, -14.1015625, -12.4755859375, -10.849609375, -9.2236328125, -7.59765625, -5.9716796875, -4.345703125, -2.7197265625, -1.09375, 0.5322265625, 2.158203125, 3.7841796875, 5.41015625, 7.0361328125, 8.662109375, 10.2880859375, 11.9140625, 13.5400390625, 15.166015625, 16.7919921875, 18.41796875, 20.0439453125, 21.669921875, 23.2958984375, 24.921875, 26.5478515625, 28.173828125, 29.7998046875, 31.42578125, 33.0517578125, 34.677734375, 36.3037109375, 37.9296875, 39.5556640625, 41.181640625, 42.8076171875, 44.43359375, 46.0595703125, 47.685546875, 49.3115234375, 50.9375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 14.0, 8.0, 7.0, 11.0, 14.0, 21.0, 22.0, 46.0, 64.0, 94.0, 116.0, 167.0, 299.0, 507.0, 994.0, 2096.0, 5164.0, 17974.0, 87761.0, 493517.0, 357726.0, 60521.0, 13458.0, 4130.0, 1719.0, 854.0, 449.0, 253.0, 160.0, 118.0, 79.0, 50.0, 40.0, 30.0, 16.0, 16.0, 8.0, 7.0, 5.0, 7.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-31.765625, -30.855224609375, -29.94482421875, -29.034423828125, -28.1240234375, -27.213623046875, -26.30322265625, -25.392822265625, -24.482421875, -23.572021484375, -22.66162109375, -21.751220703125, -20.8408203125, -19.930419921875, -19.02001953125, -18.109619140625, -17.19921875, -16.288818359375, -15.37841796875, -14.468017578125, -13.5576171875, -12.647216796875, -11.73681640625, -10.826416015625, -9.916015625, -9.005615234375, -8.09521484375, -7.184814453125, -6.2744140625, -5.364013671875, -4.45361328125, -3.543212890625, -2.6328125, -1.722412109375, -0.81201171875, 0.098388671875, 1.0087890625, 1.919189453125, 2.82958984375, 3.739990234375, 4.650390625, 5.560791015625, 6.47119140625, 7.381591796875, 8.2919921875, 9.202392578125, 10.11279296875, 11.023193359375, 11.93359375, 12.843994140625, 13.75439453125, 14.664794921875, 15.5751953125, 16.485595703125, 17.39599609375, 18.306396484375, 19.216796875, 20.127197265625, 21.03759765625, 21.947998046875, 22.8583984375, 23.768798828125, 24.67919921875, 25.589599609375, 26.5]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 6.0, 17.0, 31.0, 50.0, 63.0, 100.0, 163.0, 158.0, 161.0, 104.0, 64.0, 33.0, 20.0, 16.0, 7.0, 3.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0038547515869140625, -0.003567427396774292, -0.0032801032066345215, -0.002992779016494751, -0.0027054548263549805, -0.00241813063621521, -0.0021308064460754395, -0.001843482255935669, -0.0015561580657958984, -0.001268833875656128, -0.0009815096855163574, -0.0006941854953765869, -0.0004068613052368164, -0.0001195371150970459, 0.0001677870750427246, 0.0004551112651824951, 0.0007424354553222656, 0.0010297596454620361, 0.0013170838356018066, 0.0016044080257415771, 0.0018917322158813477, 0.002179056406021118, 0.0024663805961608887, 0.002753704786300659, 0.0030410289764404297, 0.0033283531665802, 0.0036156773567199707, 0.003903001546859741, 0.004190325736999512, 0.004477649927139282, 0.004764974117279053, 0.005052298307418823, 0.005339622497558594, 0.005626946687698364, 0.005914270877838135, 0.006201595067977905, 0.006488919258117676, 0.006776243448257446, 0.007063567638397217, 0.007350891828536987, 0.007638216018676758, 0.007925540208816528, 0.008212864398956299, 0.00850018858909607, 0.00878751277923584, 0.00907483696937561, 0.00936216115951538, 0.009649485349655151, 0.009936809539794922, 0.010224133729934692, 0.010511457920074463, 0.010798782110214233, 0.011086106300354004, 0.011373430490493774, 0.011660754680633545, 0.011948078870773315, 0.012235403060913086, 0.012522727251052856, 0.012810051441192627, 0.013097375631332397, 0.013384699821472168, 0.013672024011611938, 0.013959348201751709, 0.01424667239189148, 0.01453399658203125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 8.0, 11.0, 23.0, 27.0, 56.0, 93.0, 158.0, 417.0, 1338.0, 5796.0, 54647.0, 755532.0, 213199.0, 13681.0, 2390.0, 682.0, 243.0, 125.0, 54.0, 25.0, 16.0, 12.0, 9.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.5, -36.876953125, -35.25390625, -33.630859375, -32.0078125, -30.384765625, -28.76171875, -27.138671875, -25.515625, -23.892578125, -22.26953125, -20.646484375, -19.0234375, -17.400390625, -15.77734375, -14.154296875, -12.53125, -10.908203125, -9.28515625, -7.662109375, -6.0390625, -4.416015625, -2.79296875, -1.169921875, 0.453125, 2.076171875, 3.69921875, 5.322265625, 6.9453125, 8.568359375, 10.19140625, 11.814453125, 13.4375, 15.060546875, 16.68359375, 18.306640625, 19.9296875, 21.552734375, 23.17578125, 24.798828125, 26.421875, 28.044921875, 29.66796875, 31.291015625, 32.9140625, 34.537109375, 36.16015625, 37.783203125, 39.40625, 41.029296875, 42.65234375, 44.275390625, 45.8984375, 47.521484375, 49.14453125, 50.767578125, 52.390625, 54.013671875, 55.63671875, 57.259765625, 58.8828125, 60.505859375, 62.12890625, 63.751953125, 65.375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 3.0, 2.0, 9.0, 17.0, 22.0, 23.0, 31.0, 47.0, 60.0, 75.0, 101.0, 107.0, 98.0, 87.0, 76.0, 72.0, 62.0, 23.0, 17.0, 21.0, 13.0, 5.0, 10.0, 3.0, 5.0, 4.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.515625, -22.552001953125, -21.58837890625, -20.624755859375, -19.6611328125, -18.697509765625, -17.73388671875, -16.770263671875, -15.806640625, -14.843017578125, -13.87939453125, -12.915771484375, -11.9521484375, -10.988525390625, -10.02490234375, -9.061279296875, -8.09765625, -7.134033203125, -6.17041015625, -5.206787109375, -4.2431640625, -3.279541015625, -2.31591796875, -1.352294921875, -0.388671875, 0.574951171875, 1.53857421875, 2.502197265625, 3.4658203125, 4.429443359375, 5.39306640625, 6.356689453125, 7.3203125, 8.283935546875, 9.24755859375, 10.211181640625, 11.1748046875, 12.138427734375, 13.10205078125, 14.065673828125, 15.029296875, 15.992919921875, 16.95654296875, 17.920166015625, 18.8837890625, 19.847412109375, 20.81103515625, 21.774658203125, 22.73828125, 23.701904296875, 24.66552734375, 25.629150390625, 26.5927734375, 27.556396484375, 28.52001953125, 29.483642578125, 30.447265625, 31.410888671875, 32.37451171875, 33.338134765625, 34.3017578125, 35.265380859375, 36.22900390625, 37.192626953125, 38.15625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 10.0, 23.0, 78.0, 147.0, 215.0, 246.0, 185.0, 64.0, 28.0, 13.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-492.8465576171875, -466.9833679199219, -441.12017822265625, -415.25701904296875, -389.3938293457031, -363.5306396484375, -337.6674499511719, -311.80426025390625, -285.94110107421875, -260.0779113769531, -234.21473693847656, -208.35154724121094, -182.48837280273438, -156.62518310546875, -130.76199340820312, -104.89881896972656, -79.03561401367188, -53.17243194580078, -27.309246063232422, -1.4460601806640625, 24.41712188720703, 50.280303955078125, 76.14349365234375, 102.00666809082031, 127.86985778808594, 153.73304748535156, 179.59622192382812, 205.45941162109375, 231.32260131835938, 257.185791015625, 283.0489501953125, 308.9121398925781, 334.77532958984375, 360.6385192871094, 386.501708984375, 412.3648681640625, 438.2280578613281, 464.09124755859375, 489.9544372558594, 515.817626953125, 541.6807861328125, 567.5439453125, 593.4071655273438, 619.2703247070312, 645.133544921875, 670.9967041015625, 696.85986328125, 722.7230834960938, 748.5863037109375, 774.449462890625, 800.3126831054688, 826.1758422851562, 852.0390625, 877.9022216796875, 903.765380859375, 929.6286010742188, 955.4917602539062, 981.3549194335938, 1007.2181396484375, 1033.081298828125, 1058.9444580078125, 1084.8076171875, 1110.6708984375, 1136.5340576171875, 1162.397216796875]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 2.0, 14.0, 9.0, 13.0, 10.0, 10.0, 20.0, 29.0, 23.0, 28.0, 34.0, 31.0, 34.0, 29.0, 45.0, 57.0, 44.0, 58.0, 42.0, 55.0, 55.0, 35.0, 39.0, 35.0, 35.0, 30.0, 31.0, 22.0, 19.0, 22.0, 11.0, 12.0, 16.0, 8.0, 1.0, 10.0, 10.0, 2.0, 5.0, 2.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-319.8168640136719, -310.1666259765625, -300.5163879394531, -290.8661193847656, -281.21588134765625, -271.5656433105469, -261.9154052734375, -252.26516723632812, -242.6149139404297, -232.9646759033203, -223.31442260742188, -213.6641845703125, -204.01394653320312, -194.3636932373047, -184.7134552001953, -175.06320190429688, -165.4129638671875, -155.76272583007812, -146.1124725341797, -136.4622344970703, -126.8119888305664, -117.1617431640625, -107.51150512695312, -97.86125946044922, -88.21101379394531, -78.5607681274414, -68.9105224609375, -59.260284423828125, -49.61003875732422, -39.95979309082031, -30.309551239013672, -20.65930938720703, -11.009033203125, -1.3587894439697266, 8.291454315185547, 17.94169807434082, 27.591941833496094, 37.2421875, 46.89242935180664, 56.54267120361328, 66.19291687011719, 75.8431625366211, 85.493408203125, 95.14364624023438, 104.79389190673828, 114.44413757324219, 124.09437561035156, 133.74462890625, 143.39486694335938, 153.04510498046875, 162.6953582763672, 172.34559631347656, 181.995849609375, 191.64608764648438, 201.29632568359375, 210.94656372070312, 220.59681701660156, 230.24705505371094, 239.89730834960938, 249.54754638671875, 259.1977844238281, 268.8480224609375, 278.498291015625, 288.1485290527344, 297.79876708984375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 9.0, 8.0, 12.0, 19.0, 31.0, 41.0, 61.0, 85.0, 182.0, 280.0, 457.0, 704.0, 1273.0, 2368.0, 5206.0, 12895.0, 44610.0, 3607607.0, 460871.0, 36902.0, 11067.0, 4517.0, 2115.0, 1086.0, 695.0, 394.0, 260.0, 176.0, 119.0, 84.0, 60.0, 30.0, 24.0, 15.0, 7.0, 10.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.375, -46.64306640625, -44.9111328125, -43.17919921875, -41.447265625, -39.71533203125, -37.9833984375, -36.25146484375, -34.51953125, -32.78759765625, -31.0556640625, -29.32373046875, -27.591796875, -25.85986328125, -24.1279296875, -22.39599609375, -20.6640625, -18.93212890625, -17.2001953125, -15.46826171875, -13.736328125, -12.00439453125, -10.2724609375, -8.54052734375, -6.80859375, -5.07666015625, -3.3447265625, -1.61279296875, 0.119140625, 1.85107421875, 3.5830078125, 5.31494140625, 7.046875, 8.77880859375, 10.5107421875, 12.24267578125, 13.974609375, 15.70654296875, 17.4384765625, 19.17041015625, 20.90234375, 22.63427734375, 24.3662109375, 26.09814453125, 27.830078125, 29.56201171875, 31.2939453125, 33.02587890625, 34.7578125, 36.48974609375, 38.2216796875, 39.95361328125, 41.685546875, 43.41748046875, 45.1494140625, 46.88134765625, 48.61328125, 50.34521484375, 52.0771484375, 53.80908203125, 55.541015625, 57.27294921875, 59.0048828125, 60.73681640625, 62.46875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 8.0, 14.0, 15.0, 21.0, 26.0, 18.0, 31.0, 33.0, 37.0, 52.0, 60.0, 52.0, 64.0, 64.0, 64.0, 81.0, 59.0, 46.0, 58.0, 48.0, 27.0, 30.0, 19.0, 14.0, 15.0, 19.0, 7.0, 4.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.84375, -17.3697509765625, -16.895751953125, -16.4217529296875, -15.94775390625, -15.4737548828125, -14.999755859375, -14.5257568359375, -14.0517578125, -13.5777587890625, -13.103759765625, -12.6297607421875, -12.15576171875, -11.6817626953125, -11.207763671875, -10.7337646484375, -10.259765625, -9.7857666015625, -9.311767578125, -8.8377685546875, -8.36376953125, -7.8897705078125, -7.415771484375, -6.9417724609375, -6.4677734375, -5.9937744140625, -5.519775390625, -5.0457763671875, -4.57177734375, -4.0977783203125, -3.623779296875, -3.1497802734375, -2.67578125, -2.2017822265625, -1.727783203125, -1.2537841796875, -0.77978515625, -0.3057861328125, 0.168212890625, 0.6422119140625, 1.1162109375, 1.5902099609375, 2.064208984375, 2.5382080078125, 3.01220703125, 3.4862060546875, 3.960205078125, 4.4342041015625, 4.908203125, 5.3822021484375, 5.856201171875, 6.3302001953125, 6.80419921875, 7.2781982421875, 7.752197265625, 8.2261962890625, 8.7001953125, 9.1741943359375, 9.648193359375, 10.1221923828125, 10.59619140625, 11.0701904296875, 11.544189453125, 12.0181884765625, 12.4921875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 5.0, 9.0, 15.0, 18.0, 24.0, 29.0, 40.0, 52.0, 95.0, 101.0, 155.0, 290.0, 474.0, 772.0, 1440.0, 2915.0, 6860.0, 20913.0, 119885.0, 3913240.0, 95960.0, 18594.0, 6291.0, 2668.0, 1391.0, 767.0, 406.0, 256.0, 186.0, 124.0, 96.0, 54.0, 37.0, 33.0, 18.0, 15.0, 18.0, 9.0, 9.0, 5.0, 4.0, 3.0, 6.0, 3.0], "bins": [-88.25, -86.01318359375, -83.7763671875, -81.53955078125, -79.302734375, -77.06591796875, -74.8291015625, -72.59228515625, -70.35546875, -68.11865234375, -65.8818359375, -63.64501953125, -61.408203125, -59.17138671875, -56.9345703125, -54.69775390625, -52.4609375, -50.22412109375, -47.9873046875, -45.75048828125, -43.513671875, -41.27685546875, -39.0400390625, -36.80322265625, -34.56640625, -32.32958984375, -30.0927734375, -27.85595703125, -25.619140625, -23.38232421875, -21.1455078125, -18.90869140625, -16.671875, -14.43505859375, -12.1982421875, -9.96142578125, -7.724609375, -5.48779296875, -3.2509765625, -1.01416015625, 1.22265625, 3.45947265625, 5.6962890625, 7.93310546875, 10.169921875, 12.40673828125, 14.6435546875, 16.88037109375, 19.1171875, 21.35400390625, 23.5908203125, 25.82763671875, 28.064453125, 30.30126953125, 32.5380859375, 34.77490234375, 37.01171875, 39.24853515625, 41.4853515625, 43.72216796875, 45.958984375, 48.19580078125, 50.4326171875, 52.66943359375, 54.90625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 3.0, 5.0, 6.0, 5.0, 9.0, 23.0, 26.0, 34.0, 77.0, 227.0, 3019.0, 406.0, 96.0, 60.0, 33.0, 10.0, 10.0, 4.0, 11.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.671875, -20.09228515625, -19.5126953125, -18.93310546875, -18.353515625, -17.77392578125, -17.1943359375, -16.61474609375, -16.03515625, -15.45556640625, -14.8759765625, -14.29638671875, -13.716796875, -13.13720703125, -12.5576171875, -11.97802734375, -11.3984375, -10.81884765625, -10.2392578125, -9.65966796875, -9.080078125, -8.50048828125, -7.9208984375, -7.34130859375, -6.76171875, -6.18212890625, -5.6025390625, -5.02294921875, -4.443359375, -3.86376953125, -3.2841796875, -2.70458984375, -2.125, -1.54541015625, -0.9658203125, -0.38623046875, 0.193359375, 0.77294921875, 1.3525390625, 1.93212890625, 2.51171875, 3.09130859375, 3.6708984375, 4.25048828125, 4.830078125, 5.40966796875, 5.9892578125, 6.56884765625, 7.1484375, 7.72802734375, 8.3076171875, 8.88720703125, 9.466796875, 10.04638671875, 10.6259765625, 11.20556640625, 11.78515625, 12.36474609375, 12.9443359375, 13.52392578125, 14.103515625, 14.68310546875, 15.2626953125, 15.84228515625, 16.421875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 3.0, 7.0, 14.0, 22.0, 44.0, 49.0, 81.0, 87.0, 121.0, 125.0, 128.0, 101.0, 80.0, 44.0, 30.0, 14.0, 16.0, 10.0, 3.0, 11.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.79011535644531, -91.06727600097656, -88.34444427490234, -85.62161254882812, -82.89877319335938, -80.17593383789062, -77.4531021118164, -74.73027038574219, -72.00743103027344, -69.28459167480469, -66.56175994873047, -63.838924407958984, -61.1160888671875, -58.393253326416016, -55.67041778564453, -52.94758224487305, -50.22474670410156, -47.50191116333008, -44.779075622558594, -42.05624008178711, -39.333404541015625, -36.61056900024414, -33.887733459472656, -31.164897918701172, -28.442062377929688, -25.719226837158203, -22.99639129638672, -20.273555755615234, -17.55072021484375, -14.827884674072266, -12.105049133300781, -9.382213592529297, -6.6593780517578125, -3.936542510986328, -1.2137069702148438, 1.5091285705566406, 4.231964111328125, 6.954799652099609, 9.677635192871094, 12.400470733642578, 15.123306274414062, 17.846141815185547, 20.56897735595703, 23.291812896728516, 26.0146484375, 28.737483978271484, 31.46031951904297, 34.18315505981445, 36.90599060058594, 39.62882614135742, 42.351661682128906, 45.07449722290039, 47.797332763671875, 50.52016830444336, 53.243003845214844, 55.96583938598633, 58.68867492675781, 61.4115104675293, 64.13434600830078, 66.857177734375, 69.58001708984375, 72.3028564453125, 75.02568817138672, 77.74851989746094, 80.47135925292969]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 10.0, 11.0, 14.0, 18.0, 13.0, 14.0, 18.0, 23.0, 24.0, 25.0, 21.0, 42.0, 32.0, 38.0, 40.0, 25.0, 57.0, 50.0, 36.0, 45.0, 44.0, 45.0, 46.0, 32.0, 32.0, 28.0, 31.0, 26.0, 14.0, 26.0, 21.0, 21.0, 12.0, 7.0, 12.0, 7.0, 8.0, 5.0, 4.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-39.73627853393555, -38.607452392578125, -37.47863006591797, -36.34980392456055, -35.220977783203125, -34.09215545654297, -32.96332931518555, -31.834505081176758, -30.70568084716797, -29.57685661315918, -28.44803237915039, -27.31920623779297, -26.19038200378418, -25.06155776977539, -23.93273162841797, -22.80390739440918, -21.67508316040039, -20.5462589263916, -19.417434692382812, -18.28860855102539, -17.1597843170166, -16.030960083007812, -14.902134895324707, -13.773309707641602, -12.644485473632812, -11.515661239624023, -10.386836051940918, -9.258010864257812, -8.129186630249023, -7.000361919403076, -5.871537208557129, -4.742712497711182, -3.6138916015625, -2.4850668907165527, -1.3562421798706055, -0.2274174690246582, 0.9014072418212891, 2.0302319526672363, 3.1590566635131836, 4.287881374359131, 5.416706085205078, 6.545530796051025, 7.674355506896973, 8.803180694580078, 9.932004928588867, 11.060829162597656, 12.189654350280762, 13.318479537963867, 14.447303771972656, 15.576128005981445, 16.704952239990234, 17.833778381347656, 18.962602615356445, 20.091426849365234, 21.220252990722656, 22.349077224731445, 23.477901458740234, 24.606725692749023, 25.735549926757812, 26.864376068115234, 27.993200302124023, 29.122024536132812, 30.250850677490234, 31.379674911499023, 32.50849914550781]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 6.0, 6.0, 14.0, 18.0, 27.0, 37.0, 65.0, 93.0, 154.0, 255.0, 475.0, 729.0, 1401.0, 2713.0, 5529.0, 11463.0, 26688.0, 65846.0, 167271.0, 327997.0, 255002.0, 106532.0, 41967.0, 17881.0, 7953.0, 3960.0, 1984.0, 998.0, 611.0, 340.0, 206.0, 121.0, 65.0, 51.0, 36.0, 13.0, 17.0, 8.0, 7.0, 7.0, 0.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-30.140625, -29.2734375, -28.40625, -27.5390625, -26.671875, -25.8046875, -24.9375, -24.0703125, -23.203125, -22.3359375, -21.46875, -20.6015625, -19.734375, -18.8671875, -18.0, -17.1328125, -16.265625, -15.3984375, -14.53125, -13.6640625, -12.796875, -11.9296875, -11.0625, -10.1953125, -9.328125, -8.4609375, -7.59375, -6.7265625, -5.859375, -4.9921875, -4.125, -3.2578125, -2.390625, -1.5234375, -0.65625, 0.2109375, 1.078125, 1.9453125, 2.8125, 3.6796875, 4.546875, 5.4140625, 6.28125, 7.1484375, 8.015625, 8.8828125, 9.75, 10.6171875, 11.484375, 12.3515625, 13.21875, 14.0859375, 14.953125, 15.8203125, 16.6875, 17.5546875, 18.421875, 19.2890625, 20.15625, 21.0234375, 21.890625, 22.7578125, 23.625, 24.4921875, 25.359375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 12.0, 8.0, 10.0, 14.0, 16.0, 28.0, 37.0, 39.0, 34.0, 26.0, 43.0, 68.0, 70.0, 59.0, 59.0, 49.0, 48.0, 62.0, 46.0, 53.0, 39.0, 33.0, 35.0, 24.0, 20.0, 9.0, 14.0, 6.0, 5.0, 10.0, 3.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-18.375, -17.8966064453125, -17.418212890625, -16.9398193359375, -16.46142578125, -15.9830322265625, -15.504638671875, -15.0262451171875, -14.5478515625, -14.0694580078125, -13.591064453125, -13.1126708984375, -12.63427734375, -12.1558837890625, -11.677490234375, -11.1990966796875, -10.720703125, -10.2423095703125, -9.763916015625, -9.2855224609375, -8.80712890625, -8.3287353515625, -7.850341796875, -7.3719482421875, -6.8935546875, -6.4151611328125, -5.936767578125, -5.4583740234375, -4.97998046875, -4.5015869140625, -4.023193359375, -3.5447998046875, -3.06640625, -2.5880126953125, -2.109619140625, -1.6312255859375, -1.15283203125, -0.6744384765625, -0.196044921875, 0.2823486328125, 0.7607421875, 1.2391357421875, 1.717529296875, 2.1959228515625, 2.67431640625, 3.1527099609375, 3.631103515625, 4.1094970703125, 4.587890625, 5.0662841796875, 5.544677734375, 6.0230712890625, 6.50146484375, 6.9798583984375, 7.458251953125, 7.9366455078125, 8.4150390625, 8.8934326171875, 9.371826171875, 9.8502197265625, 10.32861328125, 10.8070068359375, 11.285400390625, 11.7637939453125, 12.2421875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 10.0, 10.0, 16.0, 19.0, 38.0, 50.0, 84.0, 134.0, 275.0, 563.0, 1357.0, 5543.0, 83427.0, 888916.0, 60901.0, 4823.0, 1254.0, 510.0, 265.0, 142.0, 91.0, 43.0, 23.0, 19.0, 12.0, 7.0, 5.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-112.25, -108.9921875, -105.734375, -102.4765625, -99.21875, -95.9609375, -92.703125, -89.4453125, -86.1875, -82.9296875, -79.671875, -76.4140625, -73.15625, -69.8984375, -66.640625, -63.3828125, -60.125, -56.8671875, -53.609375, -50.3515625, -47.09375, -43.8359375, -40.578125, -37.3203125, -34.0625, -30.8046875, -27.546875, -24.2890625, -21.03125, -17.7734375, -14.515625, -11.2578125, -8.0, -4.7421875, -1.484375, 1.7734375, 5.03125, 8.2890625, 11.546875, 14.8046875, 18.0625, 21.3203125, 24.578125, 27.8359375, 31.09375, 34.3515625, 37.609375, 40.8671875, 44.125, 47.3828125, 50.640625, 53.8984375, 57.15625, 60.4140625, 63.671875, 66.9296875, 70.1875, 73.4453125, 76.703125, 79.9609375, 83.21875, 86.4765625, 89.734375, 92.9921875, 96.25]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 4.0, 2.0, 7.0, 5.0, 9.0, 14.0, 13.0, 22.0, 22.0, 15.0, 27.0, 25.0, 30.0, 30.0, 35.0, 36.0, 45.0, 31.0, 32.0, 38.0, 52.0, 50.0, 45.0, 59.0, 40.0, 33.0, 40.0, 31.0, 28.0, 28.0, 29.0, 18.0, 19.0, 22.0, 13.0, 10.0, 7.0, 5.0, 7.0, 4.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-57.90625, -56.07763671875, -54.2490234375, -52.42041015625, -50.591796875, -48.76318359375, -46.9345703125, -45.10595703125, -43.27734375, -41.44873046875, -39.6201171875, -37.79150390625, -35.962890625, -34.13427734375, -32.3056640625, -30.47705078125, -28.6484375, -26.81982421875, -24.9912109375, -23.16259765625, -21.333984375, -19.50537109375, -17.6767578125, -15.84814453125, -14.01953125, -12.19091796875, -10.3623046875, -8.53369140625, -6.705078125, -4.87646484375, -3.0478515625, -1.21923828125, 0.609375, 2.43798828125, 4.2666015625, 6.09521484375, 7.923828125, 9.75244140625, 11.5810546875, 13.40966796875, 15.23828125, 17.06689453125, 18.8955078125, 20.72412109375, 22.552734375, 24.38134765625, 26.2099609375, 28.03857421875, 29.8671875, 31.69580078125, 33.5244140625, 35.35302734375, 37.181640625, 39.01025390625, 40.8388671875, 42.66748046875, 44.49609375, 46.32470703125, 48.1533203125, 49.98193359375, 51.810546875, 53.63916015625, 55.4677734375, 57.29638671875, 59.125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 7.0, 11.0, 18.0, 28.0, 27.0, 47.0, 74.0, 103.0, 159.0, 264.0, 497.0, 916.0, 1983.0, 5616.0, 24123.0, 221481.0, 684567.0, 89024.0, 12948.0, 3530.0, 1365.0, 686.0, 376.0, 253.0, 127.0, 93.0, 72.0, 44.0, 30.0, 23.0, 17.0, 8.0, 8.0, 9.0, 5.0, 3.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.5625, -31.48828125, -30.4140625, -29.33984375, -28.265625, -27.19140625, -26.1171875, -25.04296875, -23.96875, -22.89453125, -21.8203125, -20.74609375, -19.671875, -18.59765625, -17.5234375, -16.44921875, -15.375, -14.30078125, -13.2265625, -12.15234375, -11.078125, -10.00390625, -8.9296875, -7.85546875, -6.78125, -5.70703125, -4.6328125, -3.55859375, -2.484375, -1.41015625, -0.3359375, 0.73828125, 1.8125, 2.88671875, 3.9609375, 5.03515625, 6.109375, 7.18359375, 8.2578125, 9.33203125, 10.40625, 11.48046875, 12.5546875, 13.62890625, 14.703125, 15.77734375, 16.8515625, 17.92578125, 19.0, 20.07421875, 21.1484375, 22.22265625, 23.296875, 24.37109375, 25.4453125, 26.51953125, 27.59375, 28.66796875, 29.7421875, 30.81640625, 31.890625, 32.96484375, 34.0390625, 35.11328125, 36.1875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 10.0, 7.0, 8.0, 12.0, 7.0, 15.0, 20.0, 31.0, 39.0, 66.0, 70.0, 84.0, 121.0, 104.0, 102.0, 74.0, 59.0, 55.0, 34.0, 22.0, 16.0, 13.0, 8.0, 6.0, 3.0, 10.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.006134033203125, -0.005959868431091309, -0.005785703659057617, -0.005611538887023926, -0.005437374114990234, -0.005263209342956543, -0.0050890445709228516, -0.00491487979888916, -0.004740715026855469, -0.004566550254821777, -0.004392385482788086, -0.0042182207107543945, -0.004044055938720703, -0.0038698911666870117, -0.0036957263946533203, -0.003521561622619629, -0.0033473968505859375, -0.003173232078552246, -0.0029990673065185547, -0.0028249025344848633, -0.002650737762451172, -0.0024765729904174805, -0.002302408218383789, -0.0021282434463500977, -0.0019540786743164062, -0.0017799139022827148, -0.0016057491302490234, -0.001431584358215332, -0.0012574195861816406, -0.0010832548141479492, -0.0009090900421142578, -0.0007349252700805664, -0.000560760498046875, -0.0003865957260131836, -0.0002124309539794922, -3.826618194580078e-05, 0.00013589859008789062, 0.00031006336212158203, 0.00048422813415527344, 0.0006583929061889648, 0.0008325576782226562, 0.0010067224502563477, 0.001180887222290039, 0.0013550519943237305, 0.0015292167663574219, 0.0017033815383911133, 0.0018775463104248047, 0.002051711082458496, 0.0022258758544921875, 0.002400040626525879, 0.0025742053985595703, 0.0027483701705932617, 0.002922534942626953, 0.0030966997146606445, 0.003270864486694336, 0.0034450292587280273, 0.0036191940307617188, 0.00379335880279541, 0.0039675235748291016, 0.004141688346862793, 0.004315853118896484, 0.004490017890930176, 0.004664182662963867, 0.004838347434997559, 0.00501251220703125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 9.0, 16.0, 18.0, 29.0, 73.0, 104.0, 207.0, 516.0, 1546.0, 7066.0, 109248.0, 879628.0, 43579.0, 4497.0, 1198.0, 379.0, 195.0, 95.0, 61.0, 33.0, 16.0, 15.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.125, -49.1865234375, -47.248046875, -45.3095703125, -43.37109375, -41.4326171875, -39.494140625, -37.5556640625, -35.6171875, -33.6787109375, -31.740234375, -29.8017578125, -27.86328125, -25.9248046875, -23.986328125, -22.0478515625, -20.109375, -18.1708984375, -16.232421875, -14.2939453125, -12.35546875, -10.4169921875, -8.478515625, -6.5400390625, -4.6015625, -2.6630859375, -0.724609375, 1.2138671875, 3.15234375, 5.0908203125, 7.029296875, 8.9677734375, 10.90625, 12.8447265625, 14.783203125, 16.7216796875, 18.66015625, 20.5986328125, 22.537109375, 24.4755859375, 26.4140625, 28.3525390625, 30.291015625, 32.2294921875, 34.16796875, 36.1064453125, 38.044921875, 39.9833984375, 41.921875, 43.8603515625, 45.798828125, 47.7373046875, 49.67578125, 51.6142578125, 53.552734375, 55.4912109375, 57.4296875, 59.3681640625, 61.306640625, 63.2451171875, 65.18359375, 67.1220703125, 69.060546875, 70.9990234375, 72.9375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 8.0, 15.0, 18.0, 26.0, 55.0, 62.0, 91.0, 107.0, 145.0, 130.0, 80.0, 89.0, 59.0, 38.0, 26.0, 13.0, 12.0, 5.0, 6.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-49.65625, -48.439208984375, -47.22216796875, -46.005126953125, -44.7880859375, -43.571044921875, -42.35400390625, -41.136962890625, -39.919921875, -38.702880859375, -37.48583984375, -36.268798828125, -35.0517578125, -33.834716796875, -32.61767578125, -31.400634765625, -30.18359375, -28.966552734375, -27.74951171875, -26.532470703125, -25.3154296875, -24.098388671875, -22.88134765625, -21.664306640625, -20.447265625, -19.230224609375, -18.01318359375, -16.796142578125, -15.5791015625, -14.362060546875, -13.14501953125, -11.927978515625, -10.7109375, -9.493896484375, -8.27685546875, -7.059814453125, -5.8427734375, -4.625732421875, -3.40869140625, -2.191650390625, -0.974609375, 0.242431640625, 1.45947265625, 2.676513671875, 3.8935546875, 5.110595703125, 6.32763671875, 7.544677734375, 8.76171875, 9.978759765625, 11.19580078125, 12.412841796875, 13.6298828125, 14.846923828125, 16.06396484375, 17.281005859375, 18.498046875, 19.715087890625, 20.93212890625, 22.149169921875, 23.3662109375, 24.583251953125, 25.80029296875, 27.017333984375, 28.234375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 9.0, 16.0, 41.0, 71.0, 84.0, 133.0, 151.0, 149.0, 139.0, 93.0, 58.0, 24.0, 18.0, 9.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-848.6618041992188, -831.5957641601562, -814.5296630859375, -797.463623046875, -780.3975830078125, -763.33154296875, -746.2654418945312, -729.1994018554688, -712.13330078125, -695.0672607421875, -678.0011596679688, -660.9351196289062, -643.8690795898438, -626.802978515625, -609.7369384765625, -592.6708984375, -575.6048583984375, -558.538818359375, -541.4727172851562, -524.4066772460938, -507.34063720703125, -490.2745666503906, -473.20849609375, -456.1424560546875, -439.0763854980469, -422.01031494140625, -404.94427490234375, -387.8782043457031, -370.8121337890625, -353.74609375, -336.6800231933594, -319.61395263671875, -302.54791259765625, -285.4818420410156, -268.4158020019531, -251.3497314453125, -234.28367614746094, -217.21762084960938, -200.15155029296875, -183.0854949951172, -166.01942443847656, -148.953369140625, -131.88729858398438, -114.82124328613281, -97.75518798828125, -80.68913269042969, -63.623069763183594, -46.5570068359375, -29.490951538085938, -12.42489242553711, 4.641166687011719, 21.707225799560547, 38.773284912109375, 55.83934020996094, 72.90540313720703, 89.97146606445312, 107.03752136230469, 124.10357666015625, 141.16964721679688, 158.23570251464844, 175.3017578125, 192.36781311035156, 209.43386840820312, 226.49993896484375, 243.5659942626953]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 8.0, 6.0, 3.0, 11.0, 9.0, 18.0, 22.0, 17.0, 29.0, 30.0, 33.0, 54.0, 56.0, 46.0, 54.0, 59.0, 64.0, 71.0, 55.0, 58.0, 50.0, 50.0, 43.0, 26.0, 21.0, 25.0, 15.0, 18.0, 19.0, 9.0, 6.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-317.2839050292969, -305.4145202636719, -293.54510498046875, -281.67572021484375, -269.80633544921875, -257.9369201660156, -246.06753540039062, -234.19813537597656, -222.3287353515625, -210.45933532714844, -198.58993530273438, -186.72055053710938, -174.8511505126953, -162.98175048828125, -151.11236572265625, -139.2429656982422, -127.37356567382812, -115.50416564941406, -103.63477325439453, -91.765380859375, -79.89598083496094, -68.02658081054688, -56.157188415527344, -44.28779602050781, -32.41839599609375, -20.548999786376953, -8.679603576660156, 3.1897926330566406, 15.059188842773438, 26.928585052490234, 38.79798126220703, 50.66737365722656, 62.5367431640625, 74.40614318847656, 86.2755355834961, 98.14492797851562, 110.01432800292969, 121.88372802734375, 133.75311279296875, 145.6225128173828, 157.49191284179688, 169.36131286621094, 181.230712890625, 193.10009765625, 204.96949768066406, 216.83889770507812, 228.70828247070312, 240.5776824951172, 252.44708251953125, 264.31646728515625, 276.1858825683594, 288.0552673339844, 299.9246826171875, 311.7940673828125, 323.6634521484375, 335.5328369140625, 347.4022521972656, 359.2716369628906, 371.14105224609375, 383.01043701171875, 394.87982177734375, 406.7492370605469, 418.6186218261719, 430.488037109375, 442.357421875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 8.0, 6.0, 12.0, 17.0, 15.0, 23.0, 34.0, 46.0, 64.0, 82.0, 138.0, 150.0, 282.0, 461.0, 725.0, 1305.0, 2704.0, 6540.0, 22066.0, 3702914.0, 424813.0, 20065.0, 6030.0, 2538.0, 1249.0, 739.0, 424.0, 235.0, 180.0, 109.0, 76.0, 50.0, 47.0, 33.0, 24.0, 16.0, 16.0, 9.0, 10.0, 5.0, 10.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-66.3125, -64.23828125, -62.1640625, -60.08984375, -58.015625, -55.94140625, -53.8671875, -51.79296875, -49.71875, -47.64453125, -45.5703125, -43.49609375, -41.421875, -39.34765625, -37.2734375, -35.19921875, -33.125, -31.05078125, -28.9765625, -26.90234375, -24.828125, -22.75390625, -20.6796875, -18.60546875, -16.53125, -14.45703125, -12.3828125, -10.30859375, -8.234375, -6.16015625, -4.0859375, -2.01171875, 0.0625, 2.13671875, 4.2109375, 6.28515625, 8.359375, 10.43359375, 12.5078125, 14.58203125, 16.65625, 18.73046875, 20.8046875, 22.87890625, 24.953125, 27.02734375, 29.1015625, 31.17578125, 33.25, 35.32421875, 37.3984375, 39.47265625, 41.546875, 43.62109375, 45.6953125, 47.76953125, 49.84375, 51.91796875, 53.9921875, 56.06640625, 58.140625, 60.21484375, 62.2890625, 64.36328125, 66.4375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 10.0, 9.0, 10.0, 12.0, 13.0, 25.0, 31.0, 32.0, 56.0, 40.0, 66.0, 62.0, 83.0, 52.0, 77.0, 66.0, 63.0, 53.0, 44.0, 44.0, 38.0, 33.0, 21.0, 14.0, 11.0, 11.0, 4.0, 9.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.734375, -20.13916015625, -19.5439453125, -18.94873046875, -18.353515625, -17.75830078125, -17.1630859375, -16.56787109375, -15.97265625, -15.37744140625, -14.7822265625, -14.18701171875, -13.591796875, -12.99658203125, -12.4013671875, -11.80615234375, -11.2109375, -10.61572265625, -10.0205078125, -9.42529296875, -8.830078125, -8.23486328125, -7.6396484375, -7.04443359375, -6.44921875, -5.85400390625, -5.2587890625, -4.66357421875, -4.068359375, -3.47314453125, -2.8779296875, -2.28271484375, -1.6875, -1.09228515625, -0.4970703125, 0.09814453125, 0.693359375, 1.28857421875, 1.8837890625, 2.47900390625, 3.07421875, 3.66943359375, 4.2646484375, 4.85986328125, 5.455078125, 6.05029296875, 6.6455078125, 7.24072265625, 7.8359375, 8.43115234375, 9.0263671875, 9.62158203125, 10.216796875, 10.81201171875, 11.4072265625, 12.00244140625, 12.59765625, 13.19287109375, 13.7880859375, 14.38330078125, 14.978515625, 15.57373046875, 16.1689453125, 16.76416015625, 17.359375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 9.0, 8.0, 9.0, 16.0, 17.0, 36.0, 28.0, 42.0, 84.0, 118.0, 168.0, 265.0, 396.0, 651.0, 1199.0, 2515.0, 6322.0, 26277.0, 4037331.0, 100132.0, 10851.0, 3691.0, 1736.0, 883.0, 498.0, 327.0, 208.0, 127.0, 112.0, 67.0, 53.0, 33.0, 31.0, 11.0, 8.0, 11.0, 4.0, 6.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-118.5, -115.359375, -112.21875, -109.078125, -105.9375, -102.796875, -99.65625, -96.515625, -93.375, -90.234375, -87.09375, -83.953125, -80.8125, -77.671875, -74.53125, -71.390625, -68.25, -65.109375, -61.96875, -58.828125, -55.6875, -52.546875, -49.40625, -46.265625, -43.125, -39.984375, -36.84375, -33.703125, -30.5625, -27.421875, -24.28125, -21.140625, -18.0, -14.859375, -11.71875, -8.578125, -5.4375, -2.296875, 0.84375, 3.984375, 7.125, 10.265625, 13.40625, 16.546875, 19.6875, 22.828125, 25.96875, 29.109375, 32.25, 35.390625, 38.53125, 41.671875, 44.8125, 47.953125, 51.09375, 54.234375, 57.375, 60.515625, 63.65625, 66.796875, 69.9375, 73.078125, 76.21875, 79.359375, 82.5]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 6.0, 8.0, 12.0, 29.0, 59.0, 191.0, 3456.0, 188.0, 55.0, 19.0, 15.0, 8.0, 4.0, 2.0, 2.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-25.75, -25.097412109375, -24.44482421875, -23.792236328125, -23.1396484375, -22.487060546875, -21.83447265625, -21.181884765625, -20.529296875, -19.876708984375, -19.22412109375, -18.571533203125, -17.9189453125, -17.266357421875, -16.61376953125, -15.961181640625, -15.30859375, -14.656005859375, -14.00341796875, -13.350830078125, -12.6982421875, -12.045654296875, -11.39306640625, -10.740478515625, -10.087890625, -9.435302734375, -8.78271484375, -8.130126953125, -7.4775390625, -6.824951171875, -6.17236328125, -5.519775390625, -4.8671875, -4.214599609375, -3.56201171875, -2.909423828125, -2.2568359375, -1.604248046875, -0.95166015625, -0.299072265625, 0.353515625, 1.006103515625, 1.65869140625, 2.311279296875, 2.9638671875, 3.616455078125, 4.26904296875, 4.921630859375, 5.57421875, 6.226806640625, 6.87939453125, 7.531982421875, 8.1845703125, 8.837158203125, 9.48974609375, 10.142333984375, 10.794921875, 11.447509765625, 12.10009765625, 12.752685546875, 13.4052734375, 14.057861328125, 14.71044921875, 15.363037109375, 16.015625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 8.0, 9.0, 11.0, 19.0, 25.0, 38.0, 74.0, 94.0, 147.0, 159.0, 115.0, 99.0, 71.0, 39.0, 29.0, 17.0, 14.0, 10.0, 8.0, 7.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.260986328125, -81.47915649414062, -78.69731903076172, -75.91548919677734, -73.13365173339844, -70.35182189941406, -67.56998443603516, -64.78815460205078, -62.006317138671875, -59.224483489990234, -56.442649841308594, -53.66081619262695, -50.87898254394531, -48.09714889526367, -45.31531524658203, -42.533485412597656, -39.751651763916016, -36.969818115234375, -34.187984466552734, -31.406150817871094, -28.624317169189453, -25.842483520507812, -23.060651779174805, -20.278818130493164, -17.496984481811523, -14.715150833129883, -11.933317184448242, -9.151484489440918, -6.369650840759277, -3.5878171920776367, -0.8059844970703125, 1.9758491516113281, 4.757682800292969, 7.539516448974609, 10.32135009765625, 13.103182792663574, 15.885016441345215, 18.666851043701172, 21.44868278503418, 24.23051643371582, 27.01235008239746, 29.7941837310791, 32.57601547241211, 35.35784912109375, 38.13968276977539, 40.92151641845703, 43.70335006713867, 46.48518371582031, 49.26701736450195, 52.048851013183594, 54.830684661865234, 57.612518310546875, 60.394351959228516, 63.176185607910156, 65.95801544189453, 68.73985290527344, 71.52168273925781, 74.30351257324219, 77.0853500366211, 79.86717987060547, 82.64901733398438, 85.43084716796875, 88.21268463134766, 90.99451446533203, 93.77635192871094]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 9.0, 3.0, 5.0, 6.0, 11.0, 9.0, 13.0, 10.0, 14.0, 20.0, 22.0, 24.0, 31.0, 26.0, 27.0, 39.0, 31.0, 40.0, 43.0, 44.0, 38.0, 46.0, 46.0, 31.0, 36.0, 39.0, 43.0, 33.0, 28.0, 34.0, 32.0, 30.0, 18.0, 17.0, 18.0, 20.0, 12.0, 15.0, 5.0, 7.0, 5.0, 2.0, 6.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-33.69208526611328, -32.61668014526367, -31.541275024414062, -30.46586799621582, -29.39046287536621, -28.3150577545166, -27.23965072631836, -26.16424560546875, -25.08884048461914, -24.01343536376953, -22.938030242919922, -21.86262321472168, -20.78721809387207, -19.71181297302246, -18.63640594482422, -17.56100082397461, -16.485595703125, -15.41019058227539, -14.334784507751465, -13.259378433227539, -12.18397331237793, -11.10856819152832, -10.033162117004395, -8.957756042480469, -7.882350921630859, -6.806945323944092, -5.731539726257324, -4.656134128570557, -3.580728530883789, -2.5053229331970215, -1.429917335510254, -0.35451173782348633, 0.7208976745605469, 1.7963032722473145, 2.871708869934082, 3.9471144676208496, 5.022520065307617, 6.097925662994385, 7.173331260681152, 8.248737335205078, 9.324142456054688, 10.399547576904297, 11.474953651428223, 12.550359725952148, 13.625764846801758, 14.701169967651367, 15.776576042175293, 16.85198211669922, 17.927387237548828, 19.002792358398438, 20.078197479248047, 21.15360450744629, 22.2290096282959, 23.304414749145508, 24.37982177734375, 25.45522689819336, 26.53063201904297, 27.606037139892578, 28.681442260742188, 29.75684928894043, 30.83225440979004, 31.90765953063965, 32.98306655883789, 34.0584716796875, 35.13387680053711]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 4.0, 8.0, 11.0, 13.0, 30.0, 36.0, 60.0, 81.0, 101.0, 157.0, 240.0, 323.0, 580.0, 1008.0, 1800.0, 3399.0, 6755.0, 13697.0, 28768.0, 61207.0, 136281.0, 292575.0, 271014.0, 122970.0, 55018.0, 26163.0, 12604.0, 6339.0, 3168.0, 1720.0, 942.0, 518.0, 333.0, 184.0, 138.0, 87.0, 67.0, 36.0, 34.0, 15.0, 15.0, 17.0, 11.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0], "bins": [-27.671875, -26.90185546875, -26.1318359375, -25.36181640625, -24.591796875, -23.82177734375, -23.0517578125, -22.28173828125, -21.51171875, -20.74169921875, -19.9716796875, -19.20166015625, -18.431640625, -17.66162109375, -16.8916015625, -16.12158203125, -15.3515625, -14.58154296875, -13.8115234375, -13.04150390625, -12.271484375, -11.50146484375, -10.7314453125, -9.96142578125, -9.19140625, -8.42138671875, -7.6513671875, -6.88134765625, -6.111328125, -5.34130859375, -4.5712890625, -3.80126953125, -3.03125, -2.26123046875, -1.4912109375, -0.72119140625, 0.048828125, 0.81884765625, 1.5888671875, 2.35888671875, 3.12890625, 3.89892578125, 4.6689453125, 5.43896484375, 6.208984375, 6.97900390625, 7.7490234375, 8.51904296875, 9.2890625, 10.05908203125, 10.8291015625, 11.59912109375, 12.369140625, 13.13916015625, 13.9091796875, 14.67919921875, 15.44921875, 16.21923828125, 16.9892578125, 17.75927734375, 18.529296875, 19.29931640625, 20.0693359375, 20.83935546875, 21.609375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 3.0, 6.0, 1.0, 8.0, 14.0, 6.0, 13.0, 23.0, 22.0, 37.0, 36.0, 45.0, 42.0, 46.0, 47.0, 58.0, 66.0, 72.0, 60.0, 62.0, 61.0, 42.0, 39.0, 33.0, 36.0, 26.0, 22.0, 13.0, 11.0, 7.0, 11.0, 9.0, 8.0, 5.0, 7.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.6875, -19.09423828125, -18.5009765625, -17.90771484375, -17.314453125, -16.72119140625, -16.1279296875, -15.53466796875, -14.94140625, -14.34814453125, -13.7548828125, -13.16162109375, -12.568359375, -11.97509765625, -11.3818359375, -10.78857421875, -10.1953125, -9.60205078125, -9.0087890625, -8.41552734375, -7.822265625, -7.22900390625, -6.6357421875, -6.04248046875, -5.44921875, -4.85595703125, -4.2626953125, -3.66943359375, -3.076171875, -2.48291015625, -1.8896484375, -1.29638671875, -0.703125, -0.10986328125, 0.4833984375, 1.07666015625, 1.669921875, 2.26318359375, 2.8564453125, 3.44970703125, 4.04296875, 4.63623046875, 5.2294921875, 5.82275390625, 6.416015625, 7.00927734375, 7.6025390625, 8.19580078125, 8.7890625, 9.38232421875, 9.9755859375, 10.56884765625, 11.162109375, 11.75537109375, 12.3486328125, 12.94189453125, 13.53515625, 14.12841796875, 14.7216796875, 15.31494140625, 15.908203125, 16.50146484375, 17.0947265625, 17.68798828125, 18.28125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 6.0, 3.0, 9.0, 11.0, 10.0, 15.0, 20.0, 34.0, 48.0, 69.0, 111.0, 172.0, 294.0, 590.0, 1359.0, 4128.0, 34629.0, 792113.0, 199465.0, 11292.0, 2273.0, 831.0, 413.0, 208.0, 129.0, 93.0, 63.0, 36.0, 33.0, 27.0, 19.0, 12.0, 7.0, 6.0, 4.0, 5.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.125, -79.4560546875, -76.787109375, -74.1181640625, -71.44921875, -68.7802734375, -66.111328125, -63.4423828125, -60.7734375, -58.1044921875, -55.435546875, -52.7666015625, -50.09765625, -47.4287109375, -44.759765625, -42.0908203125, -39.421875, -36.7529296875, -34.083984375, -31.4150390625, -28.74609375, -26.0771484375, -23.408203125, -20.7392578125, -18.0703125, -15.4013671875, -12.732421875, -10.0634765625, -7.39453125, -4.7255859375, -2.056640625, 0.6123046875, 3.28125, 5.9501953125, 8.619140625, 11.2880859375, 13.95703125, 16.6259765625, 19.294921875, 21.9638671875, 24.6328125, 27.3017578125, 29.970703125, 32.6396484375, 35.30859375, 37.9775390625, 40.646484375, 43.3154296875, 45.984375, 48.6533203125, 51.322265625, 53.9912109375, 56.66015625, 59.3291015625, 61.998046875, 64.6669921875, 67.3359375, 70.0048828125, 72.673828125, 75.3427734375, 78.01171875, 80.6806640625, 83.349609375, 86.0185546875, 88.6875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 4.0, 3.0, 5.0, 0.0, 7.0, 11.0, 11.0, 12.0, 18.0, 18.0, 16.0, 17.0, 24.0, 17.0, 22.0, 34.0, 34.0, 46.0, 34.0, 44.0, 30.0, 49.0, 28.0, 35.0, 47.0, 41.0, 44.0, 42.0, 35.0, 27.0, 32.0, 38.0, 27.0, 17.0, 28.0, 16.0, 11.0, 17.0, 9.0, 16.0, 5.0, 8.0, 8.0, 4.0, 3.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-59.96875, -58.10595703125, -56.2431640625, -54.38037109375, -52.517578125, -50.65478515625, -48.7919921875, -46.92919921875, -45.06640625, -43.20361328125, -41.3408203125, -39.47802734375, -37.615234375, -35.75244140625, -33.8896484375, -32.02685546875, -30.1640625, -28.30126953125, -26.4384765625, -24.57568359375, -22.712890625, -20.85009765625, -18.9873046875, -17.12451171875, -15.26171875, -13.39892578125, -11.5361328125, -9.67333984375, -7.810546875, -5.94775390625, -4.0849609375, -2.22216796875, -0.359375, 1.50341796875, 3.3662109375, 5.22900390625, 7.091796875, 8.95458984375, 10.8173828125, 12.68017578125, 14.54296875, 16.40576171875, 18.2685546875, 20.13134765625, 21.994140625, 23.85693359375, 25.7197265625, 27.58251953125, 29.4453125, 31.30810546875, 33.1708984375, 35.03369140625, 36.896484375, 38.75927734375, 40.6220703125, 42.48486328125, 44.34765625, 46.21044921875, 48.0732421875, 49.93603515625, 51.798828125, 53.66162109375, 55.5244140625, 57.38720703125, 59.25]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 2.0, 3.0, 3.0, 8.0, 15.0, 11.0, 33.0, 40.0, 97.0, 125.0, 251.0, 500.0, 1311.0, 3811.0, 16638.0, 150796.0, 776551.0, 82179.0, 11213.0, 2951.0, 1027.0, 453.0, 217.0, 126.0, 65.0, 40.0, 26.0, 18.0, 15.0, 9.0, 8.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-35.625, -34.52490234375, -33.4248046875, -32.32470703125, -31.224609375, -30.12451171875, -29.0244140625, -27.92431640625, -26.82421875, -25.72412109375, -24.6240234375, -23.52392578125, -22.423828125, -21.32373046875, -20.2236328125, -19.12353515625, -18.0234375, -16.92333984375, -15.8232421875, -14.72314453125, -13.623046875, -12.52294921875, -11.4228515625, -10.32275390625, -9.22265625, -8.12255859375, -7.0224609375, -5.92236328125, -4.822265625, -3.72216796875, -2.6220703125, -1.52197265625, -0.421875, 0.67822265625, 1.7783203125, 2.87841796875, 3.978515625, 5.07861328125, 6.1787109375, 7.27880859375, 8.37890625, 9.47900390625, 10.5791015625, 11.67919921875, 12.779296875, 13.87939453125, 14.9794921875, 16.07958984375, 17.1796875, 18.27978515625, 19.3798828125, 20.47998046875, 21.580078125, 22.68017578125, 23.7802734375, 24.88037109375, 25.98046875, 27.08056640625, 28.1806640625, 29.28076171875, 30.380859375, 31.48095703125, 32.5810546875, 33.68115234375, 34.78125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 2.0, 6.0, 4.0, 4.0, 7.0, 9.0, 5.0, 14.0, 13.0, 22.0, 23.0, 24.0, 47.0, 45.0, 70.0, 94.0, 113.0, 126.0, 90.0, 68.0, 41.0, 38.0, 34.0, 18.0, 19.0, 19.0, 18.0, 7.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00572967529296875, -0.005567014217376709, -0.005404353141784668, -0.005241692066192627, -0.005079030990600586, -0.004916369915008545, -0.004753708839416504, -0.004591047763824463, -0.004428386688232422, -0.004265725612640381, -0.00410306453704834, -0.003940403461456299, -0.003777742385864258, -0.003615081310272217, -0.0034524202346801758, -0.0032897591590881348, -0.0031270980834960938, -0.0029644370079040527, -0.0028017759323120117, -0.0026391148567199707, -0.0024764537811279297, -0.0023137927055358887, -0.0021511316299438477, -0.0019884705543518066, -0.0018258094787597656, -0.0016631484031677246, -0.0015004873275756836, -0.0013378262519836426, -0.0011751651763916016, -0.0010125041007995605, -0.0008498430252075195, -0.0006871819496154785, -0.0005245208740234375, -0.0003618597984313965, -0.00019919872283935547, -3.653764724731445e-05, 0.00012612342834472656, 0.0002887845039367676, 0.0004514455795288086, 0.0006141066551208496, 0.0007767677307128906, 0.0009394288063049316, 0.0011020898818969727, 0.0012647509574890137, 0.0014274120330810547, 0.0015900731086730957, 0.0017527341842651367, 0.0019153952598571777, 0.0020780563354492188, 0.0022407174110412598, 0.0024033784866333008, 0.002566039562225342, 0.002728700637817383, 0.002891361713409424, 0.003054022789001465, 0.003216683864593506, 0.003379344940185547, 0.003542006015777588, 0.003704667091369629, 0.00386732816696167, 0.004029989242553711, 0.004192650318145752, 0.004355311393737793, 0.004517972469329834, 0.004680633544921875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 10.0, 16.0, 20.0, 29.0, 89.0, 139.0, 313.0, 905.0, 3368.0, 27091.0, 730428.0, 270472.0, 12498.0, 2044.0, 612.0, 266.0, 119.0, 55.0, 30.0, 25.0, 10.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.9375, -54.234375, -52.53125, -50.828125, -49.125, -47.421875, -45.71875, -44.015625, -42.3125, -40.609375, -38.90625, -37.203125, -35.5, -33.796875, -32.09375, -30.390625, -28.6875, -26.984375, -25.28125, -23.578125, -21.875, -20.171875, -18.46875, -16.765625, -15.0625, -13.359375, -11.65625, -9.953125, -8.25, -6.546875, -4.84375, -3.140625, -1.4375, 0.265625, 1.96875, 3.671875, 5.375, 7.078125, 8.78125, 10.484375, 12.1875, 13.890625, 15.59375, 17.296875, 19.0, 20.703125, 22.40625, 24.109375, 25.8125, 27.515625, 29.21875, 30.921875, 32.625, 34.328125, 36.03125, 37.734375, 39.4375, 41.140625, 42.84375, 44.546875, 46.25, 47.953125, 49.65625, 51.359375, 53.0625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 1.0, 9.0, 6.0, 18.0, 22.0, 28.0, 34.0, 62.0, 80.0, 93.0, 104.0, 113.0, 91.0, 76.0, 70.0, 63.0, 31.0, 28.0, 15.0, 20.0, 10.0, 9.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.6875, -32.7646484375, -31.841796875, -30.9189453125, -29.99609375, -29.0732421875, -28.150390625, -27.2275390625, -26.3046875, -25.3818359375, -24.458984375, -23.5361328125, -22.61328125, -21.6904296875, -20.767578125, -19.8447265625, -18.921875, -17.9990234375, -17.076171875, -16.1533203125, -15.23046875, -14.3076171875, -13.384765625, -12.4619140625, -11.5390625, -10.6162109375, -9.693359375, -8.7705078125, -7.84765625, -6.9248046875, -6.001953125, -5.0791015625, -4.15625, -3.2333984375, -2.310546875, -1.3876953125, -0.46484375, 0.4580078125, 1.380859375, 2.3037109375, 3.2265625, 4.1494140625, 5.072265625, 5.9951171875, 6.91796875, 7.8408203125, 8.763671875, 9.6865234375, 10.609375, 11.5322265625, 12.455078125, 13.3779296875, 14.30078125, 15.2236328125, 16.146484375, 17.0693359375, 17.9921875, 18.9150390625, 19.837890625, 20.7607421875, 21.68359375, 22.6064453125, 23.529296875, 24.4521484375, 25.375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 7.0, 10.0, 10.0, 23.0, 35.0, 55.0, 89.0, 122.0, 144.0, 145.0, 121.0, 91.0, 62.0, 34.0, 20.0, 11.0, 11.0, 5.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-460.0072326660156, -446.1057434082031, -432.2042541503906, -418.302734375, -404.4012451171875, -390.499755859375, -376.5982666015625, -362.69677734375, -348.7952880859375, -334.893798828125, -320.9923095703125, -307.0908203125, -293.1893005371094, -279.2878112792969, -265.3863220214844, -251.48483276367188, -237.58331298828125, -223.68182373046875, -209.7803192138672, -195.8788299560547, -181.97732543945312, -168.07583618164062, -154.17434692382812, -140.27285766601562, -126.37135314941406, -112.46985626220703, -98.568359375, -84.6668701171875, -70.76537322998047, -56.86387634277344, -42.96238708496094, -29.060890197753906, -15.15936279296875, -1.2578678131103516, 12.643627166748047, 26.545120239257812, 40.446617126464844, 54.348114013671875, 68.24960327148438, 82.1511001586914, 96.05259704589844, 109.95409393310547, 123.8555908203125, 137.757080078125, 151.6585693359375, 165.56007385253906, 179.46156311035156, 193.36306762695312, 207.26455688476562, 221.16604614257812, 235.0675506591797, 248.9690399169922, 262.87054443359375, 276.77203369140625, 290.67352294921875, 304.57501220703125, 318.47650146484375, 332.37799072265625, 346.27947998046875, 360.18096923828125, 374.0824890136719, 387.9839782714844, 401.8854675292969, 415.7869567871094, 429.6884765625]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 8.0, 3.0, 6.0, 3.0, 11.0, 8.0, 9.0, 17.0, 19.0, 17.0, 16.0, 24.0, 28.0, 37.0, 37.0, 27.0, 51.0, 38.0, 56.0, 48.0, 55.0, 57.0, 52.0, 42.0, 43.0, 34.0, 35.0, 25.0, 31.0, 28.0, 22.0, 20.0, 22.0, 14.0, 13.0, 11.0, 7.0, 6.0, 9.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0], "bins": [-335.2519836425781, -326.1717224121094, -317.0914611816406, -308.01116943359375, -298.930908203125, -289.85064697265625, -280.7703857421875, -271.69012451171875, -262.6098327636719, -253.52957153320312, -244.4492950439453, -235.36903381347656, -226.28875732421875, -217.20849609375, -208.12823486328125, -199.04795837402344, -189.9676971435547, -180.88743591308594, -171.80715942382812, -162.72689819335938, -153.64662170410156, -144.5663604736328, -135.486083984375, -126.40582275390625, -117.32555389404297, -108.24528503417969, -99.1650161743164, -90.08474731445312, -81.00448608398438, -71.92420959472656, -62.84394836425781, -53.76367950439453, -44.68341064453125, -35.60314178466797, -26.52287483215332, -17.442607879638672, -8.36233901977539, 0.7179298400878906, 9.798194885253906, 18.878463745117188, 27.95873260498047, 37.03900146484375, 46.11927032470703, 55.19953536987305, 64.27980041503906, 73.36007690429688, 82.44033813476562, 91.5206069946289, 100.60087585449219, 109.68114471435547, 118.76141357421875, 127.8416748046875, 136.9219512939453, 146.00221252441406, 155.08248901367188, 164.16275024414062, 173.24301147460938, 182.32327270507812, 191.40354919433594, 200.4838104248047, 209.5640869140625, 218.64434814453125, 227.724609375, 236.8048858642578, 245.88516235351562]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 3.0, 5.0, 2.0, 7.0, 7.0, 17.0, 21.0, 25.0, 29.0, 54.0, 50.0, 102.0, 118.0, 163.0, 241.0, 325.0, 451.0, 741.0, 1167.0, 1862.0, 3254.0, 6596.0, 17793.0, 81467.0, 3854889.0, 179252.0, 26709.0, 8896.0, 4009.0, 2137.0, 1262.0, 834.0, 551.0, 375.0, 245.0, 164.0, 133.0, 79.0, 61.0, 50.0, 36.0, 36.0, 23.0, 9.0, 12.0, 11.0, 6.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.75, -46.2880859375, -44.826171875, -43.3642578125, -41.90234375, -40.4404296875, -38.978515625, -37.5166015625, -36.0546875, -34.5927734375, -33.130859375, -31.6689453125, -30.20703125, -28.7451171875, -27.283203125, -25.8212890625, -24.359375, -22.8974609375, -21.435546875, -19.9736328125, -18.51171875, -17.0498046875, -15.587890625, -14.1259765625, -12.6640625, -11.2021484375, -9.740234375, -8.2783203125, -6.81640625, -5.3544921875, -3.892578125, -2.4306640625, -0.96875, 0.4931640625, 1.955078125, 3.4169921875, 4.87890625, 6.3408203125, 7.802734375, 9.2646484375, 10.7265625, 12.1884765625, 13.650390625, 15.1123046875, 16.57421875, 18.0361328125, 19.498046875, 20.9599609375, 22.421875, 23.8837890625, 25.345703125, 26.8076171875, 28.26953125, 29.7314453125, 31.193359375, 32.6552734375, 34.1171875, 35.5791015625, 37.041015625, 38.5029296875, 39.96484375, 41.4267578125, 42.888671875, 44.3505859375, 45.8125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 10.0, 8.0, 7.0, 20.0, 21.0, 33.0, 33.0, 52.0, 51.0, 80.0, 68.0, 86.0, 81.0, 85.0, 88.0, 67.0, 49.0, 43.0, 25.0, 26.0, 23.0, 14.0, 10.0, 9.0, 9.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-33.40625, -32.6671142578125, -31.927978515625, -31.1888427734375, -30.44970703125, -29.7105712890625, -28.971435546875, -28.2322998046875, -27.4931640625, -26.7540283203125, -26.014892578125, -25.2757568359375, -24.53662109375, -23.7974853515625, -23.058349609375, -22.3192138671875, -21.580078125, -20.8409423828125, -20.101806640625, -19.3626708984375, -18.62353515625, -17.8843994140625, -17.145263671875, -16.4061279296875, -15.6669921875, -14.9278564453125, -14.188720703125, -13.4495849609375, -12.71044921875, -11.9713134765625, -11.232177734375, -10.4930419921875, -9.75390625, -9.0147705078125, -8.275634765625, -7.5364990234375, -6.79736328125, -6.0582275390625, -5.319091796875, -4.5799560546875, -3.8408203125, -3.1016845703125, -2.362548828125, -1.6234130859375, -0.88427734375, -0.1451416015625, 0.593994140625, 1.3331298828125, 2.072265625, 2.8114013671875, 3.550537109375, 4.2896728515625, 5.02880859375, 5.7679443359375, 6.507080078125, 7.2462158203125, 7.9853515625, 8.7244873046875, 9.463623046875, 10.2027587890625, 10.94189453125, 11.6810302734375, 12.420166015625, 13.1593017578125, 13.8984375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 8.0, 5.0, 18.0, 31.0, 33.0, 50.0, 85.0, 128.0, 229.0, 372.0, 687.0, 1297.0, 2683.0, 6398.0, 18460.0, 100581.0, 3928186.0, 104316.0, 18772.0, 6419.0, 2739.0, 1265.0, 616.0, 352.0, 222.0, 107.0, 91.0, 40.0, 33.0, 24.0, 17.0, 6.0, 8.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.1875, -59.041015625, -56.89453125, -54.748046875, -52.6015625, -50.455078125, -48.30859375, -46.162109375, -44.015625, -41.869140625, -39.72265625, -37.576171875, -35.4296875, -33.283203125, -31.13671875, -28.990234375, -26.84375, -24.697265625, -22.55078125, -20.404296875, -18.2578125, -16.111328125, -13.96484375, -11.818359375, -9.671875, -7.525390625, -5.37890625, -3.232421875, -1.0859375, 1.060546875, 3.20703125, 5.353515625, 7.5, 9.646484375, 11.79296875, 13.939453125, 16.0859375, 18.232421875, 20.37890625, 22.525390625, 24.671875, 26.818359375, 28.96484375, 31.111328125, 33.2578125, 35.404296875, 37.55078125, 39.697265625, 41.84375, 43.990234375, 46.13671875, 48.283203125, 50.4296875, 52.576171875, 54.72265625, 56.869140625, 59.015625, 61.162109375, 63.30859375, 65.455078125, 67.6015625, 69.748046875, 71.89453125, 74.041015625, 76.1875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 6.0, 8.0, 11.0, 16.0, 22.0, 48.0, 62.0, 182.0, 1970.0, 1340.0, 163.0, 92.0, 38.0, 28.0, 19.0, 13.0, 10.0, 7.0, 2.0, 7.0, 4.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.171875, -23.337890625, -22.50390625, -21.669921875, -20.8359375, -20.001953125, -19.16796875, -18.333984375, -17.5, -16.666015625, -15.83203125, -14.998046875, -14.1640625, -13.330078125, -12.49609375, -11.662109375, -10.828125, -9.994140625, -9.16015625, -8.326171875, -7.4921875, -6.658203125, -5.82421875, -4.990234375, -4.15625, -3.322265625, -2.48828125, -1.654296875, -0.8203125, 0.013671875, 0.84765625, 1.681640625, 2.515625, 3.349609375, 4.18359375, 5.017578125, 5.8515625, 6.685546875, 7.51953125, 8.353515625, 9.1875, 10.021484375, 10.85546875, 11.689453125, 12.5234375, 13.357421875, 14.19140625, 15.025390625, 15.859375, 16.693359375, 17.52734375, 18.361328125, 19.1953125, 20.029296875, 20.86328125, 21.697265625, 22.53125, 23.365234375, 24.19921875, 25.033203125, 25.8671875, 26.701171875, 27.53515625, 28.369140625, 29.203125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 14.0, 16.0, 50.0, 89.0, 158.0, 228.0, 195.0, 116.0, 64.0, 32.0, 23.0, 5.0, 8.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-266.13922119140625, -259.09765625, -252.0561065673828, -245.01454162597656, -237.9729766845703, -230.93142700195312, -223.88986206054688, -216.84829711914062, -209.80673217773438, -202.76516723632812, -195.72361755371094, -188.6820526123047, -181.64048767089844, -174.59893798828125, -167.557373046875, -160.51580810546875, -153.4742431640625, -146.43267822265625, -139.39112854003906, -132.3495635986328, -125.30799865722656, -118.26644134521484, -111.22488403320312, -104.18331909179688, -97.14176940917969, -90.10021209716797, -83.05864715576172, -76.01708984375, -68.97552490234375, -61.93396759033203, -54.89240646362305, -47.85084533691406, -40.80928039550781, -33.76771926879883, -26.726158142089844, -19.684598922729492, -12.643037796020508, -5.601478576660156, 1.4400825500488281, 8.481643676757812, 15.523204803466797, 22.56476593017578, 29.606327056884766, 36.64788818359375, 43.68944549560547, 50.73100662231445, 57.77256774902344, 64.81413269042969, 71.8556900024414, 78.89724731445312, 85.93881225585938, 92.9803695678711, 100.02193450927734, 107.06349182128906, 114.10505676269531, 121.14661407470703, 128.18817138671875, 135.229736328125, 142.2712860107422, 149.31285095214844, 156.3544158935547, 163.39596557617188, 170.43753051757812, 177.47909545898438, 184.52066040039062]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 13.0, 8.0, 11.0, 24.0, 16.0, 21.0, 33.0, 40.0, 47.0, 36.0, 49.0, 50.0, 52.0, 53.0, 41.0, 54.0, 57.0, 46.0, 54.0, 49.0, 42.0, 27.0, 37.0, 31.0, 25.0, 18.0, 12.0, 14.0, 19.0, 8.0, 7.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.72419738769531, -88.1270523071289, -85.5299072265625, -82.9327621459961, -80.33561706542969, -77.73847198486328, -75.14132690429688, -72.54417419433594, -69.94703674316406, -67.34989166259766, -64.75274658203125, -62.155601501464844, -59.55845642089844, -56.96131134033203, -54.36416244506836, -51.76701736450195, -49.16986846923828, -46.572723388671875, -43.97557830810547, -41.37843322753906, -38.781288146972656, -36.18414306640625, -33.58699417114258, -30.989849090576172, -28.392704010009766, -25.79555892944336, -23.198413848876953, -20.601266860961914, -18.004121780395508, -15.406976699829102, -12.809830665588379, -10.212684631347656, -7.61553955078125, -5.0183939933776855, -2.421248435974121, 0.17589712142944336, 2.773042678833008, 5.370187759399414, 7.967333793640137, 10.56447982788086, 13.161624908447266, 15.758769989013672, 18.355915069580078, 20.953062057495117, 23.550207138061523, 26.14735221862793, 28.74449920654297, 31.341644287109375, 33.93878936767578, 36.53593444824219, 39.133079528808594, 41.730224609375, 44.327369689941406, 46.92451477050781, 49.521663665771484, 52.11880874633789, 54.7159538269043, 57.3130989074707, 59.91024398803711, 62.507389068603516, 65.10453796386719, 67.7016830444336, 70.298828125, 72.8959732055664, 75.49311828613281]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 8.0, 6.0, 21.0, 27.0, 31.0, 68.0, 124.0, 232.0, 463.0, 998.0, 2292.0, 6239.0, 17531.0, 55045.0, 187918.0, 512813.0, 183346.0, 53758.0, 17265.0, 5963.0, 2360.0, 992.0, 512.0, 233.0, 139.0, 71.0, 41.0, 20.0, 21.0, 6.0, 4.0, 7.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.5, -55.96630859375, -54.4326171875, -52.89892578125, -51.365234375, -49.83154296875, -48.2978515625, -46.76416015625, -45.23046875, -43.69677734375, -42.1630859375, -40.62939453125, -39.095703125, -37.56201171875, -36.0283203125, -34.49462890625, -32.9609375, -31.42724609375, -29.8935546875, -28.35986328125, -26.826171875, -25.29248046875, -23.7587890625, -22.22509765625, -20.69140625, -19.15771484375, -17.6240234375, -16.09033203125, -14.556640625, -13.02294921875, -11.4892578125, -9.95556640625, -8.421875, -6.88818359375, -5.3544921875, -3.82080078125, -2.287109375, -0.75341796875, 0.7802734375, 2.31396484375, 3.84765625, 5.38134765625, 6.9150390625, 8.44873046875, 9.982421875, 11.51611328125, 13.0498046875, 14.58349609375, 16.1171875, 17.65087890625, 19.1845703125, 20.71826171875, 22.251953125, 23.78564453125, 25.3193359375, 26.85302734375, 28.38671875, 29.92041015625, 31.4541015625, 32.98779296875, 34.521484375, 36.05517578125, 37.5888671875, 39.12255859375, 40.65625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 7.0, 7.0, 23.0, 21.0, 27.0, 22.0, 50.0, 40.0, 45.0, 64.0, 64.0, 76.0, 67.0, 65.0, 79.0, 68.0, 64.0, 37.0, 37.0, 40.0, 20.0, 22.0, 16.0, 9.0, 11.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.34375, -26.6328125, -25.921875, -25.2109375, -24.5, -23.7890625, -23.078125, -22.3671875, -21.65625, -20.9453125, -20.234375, -19.5234375, -18.8125, -18.1015625, -17.390625, -16.6796875, -15.96875, -15.2578125, -14.546875, -13.8359375, -13.125, -12.4140625, -11.703125, -10.9921875, -10.28125, -9.5703125, -8.859375, -8.1484375, -7.4375, -6.7265625, -6.015625, -5.3046875, -4.59375, -3.8828125, -3.171875, -2.4609375, -1.75, -1.0390625, -0.328125, 0.3828125, 1.09375, 1.8046875, 2.515625, 3.2265625, 3.9375, 4.6484375, 5.359375, 6.0703125, 6.78125, 7.4921875, 8.203125, 8.9140625, 9.625, 10.3359375, 11.046875, 11.7578125, 12.46875, 13.1796875, 13.890625, 14.6015625, 15.3125, 16.0234375, 16.734375, 17.4453125, 18.15625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 4.0, 4.0, 17.0, 10.0, 17.0, 19.0, 29.0, 49.0, 59.0, 113.0, 188.0, 342.0, 715.0, 1951.0, 9993.0, 204758.0, 796625.0, 27897.0, 3461.0, 1150.0, 459.0, 268.0, 148.0, 101.0, 55.0, 41.0, 21.0, 14.0, 13.0, 11.0, 6.0, 10.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0], "bins": [-115.0625, -111.59765625, -108.1328125, -104.66796875, -101.203125, -97.73828125, -94.2734375, -90.80859375, -87.34375, -83.87890625, -80.4140625, -76.94921875, -73.484375, -70.01953125, -66.5546875, -63.08984375, -59.625, -56.16015625, -52.6953125, -49.23046875, -45.765625, -42.30078125, -38.8359375, -35.37109375, -31.90625, -28.44140625, -24.9765625, -21.51171875, -18.046875, -14.58203125, -11.1171875, -7.65234375, -4.1875, -0.72265625, 2.7421875, 6.20703125, 9.671875, 13.13671875, 16.6015625, 20.06640625, 23.53125, 26.99609375, 30.4609375, 33.92578125, 37.390625, 40.85546875, 44.3203125, 47.78515625, 51.25, 54.71484375, 58.1796875, 61.64453125, 65.109375, 68.57421875, 72.0390625, 75.50390625, 78.96875, 82.43359375, 85.8984375, 89.36328125, 92.828125, 96.29296875, 99.7578125, 103.22265625, 106.6875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 3.0, 2.0, 5.0, 7.0, 8.0, 7.0, 9.0, 12.0, 14.0, 16.0, 24.0, 36.0, 39.0, 29.0, 37.0, 42.0, 37.0, 55.0, 44.0, 68.0, 75.0, 61.0, 53.0, 52.0, 38.0, 41.0, 36.0, 40.0, 17.0, 15.0, 26.0, 12.0, 9.0, 11.0, 5.0, 8.0, 5.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.0, -72.552734375, -70.10546875, -67.658203125, -65.2109375, -62.763671875, -60.31640625, -57.869140625, -55.421875, -52.974609375, -50.52734375, -48.080078125, -45.6328125, -43.185546875, -40.73828125, -38.291015625, -35.84375, -33.396484375, -30.94921875, -28.501953125, -26.0546875, -23.607421875, -21.16015625, -18.712890625, -16.265625, -13.818359375, -11.37109375, -8.923828125, -6.4765625, -4.029296875, -1.58203125, 0.865234375, 3.3125, 5.759765625, 8.20703125, 10.654296875, 13.1015625, 15.548828125, 17.99609375, 20.443359375, 22.890625, 25.337890625, 27.78515625, 30.232421875, 32.6796875, 35.126953125, 37.57421875, 40.021484375, 42.46875, 44.916015625, 47.36328125, 49.810546875, 52.2578125, 54.705078125, 57.15234375, 59.599609375, 62.046875, 64.494140625, 66.94140625, 69.388671875, 71.8359375, 74.283203125, 76.73046875, 79.177734375, 81.625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 3.0, 9.0, 10.0, 10.0, 16.0, 21.0, 22.0, 41.0, 49.0, 51.0, 101.0, 138.0, 189.0, 330.0, 466.0, 776.0, 1335.0, 2568.0, 5555.0, 13424.0, 39175.0, 144033.0, 545938.0, 209936.0, 53042.0, 17287.0, 6768.0, 3098.0, 1625.0, 903.0, 553.0, 350.0, 237.0, 144.0, 96.0, 71.0, 51.0, 39.0, 26.0, 22.0, 7.0, 5.0, 5.0, 9.0, 5.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-16.40625, -15.9183349609375, -15.430419921875, -14.9425048828125, -14.45458984375, -13.9666748046875, -13.478759765625, -12.9908447265625, -12.5029296875, -12.0150146484375, -11.527099609375, -11.0391845703125, -10.55126953125, -10.0633544921875, -9.575439453125, -9.0875244140625, -8.599609375, -8.1116943359375, -7.623779296875, -7.1358642578125, -6.64794921875, -6.1600341796875, -5.672119140625, -5.1842041015625, -4.6962890625, -4.2083740234375, -3.720458984375, -3.2325439453125, -2.74462890625, -2.2567138671875, -1.768798828125, -1.2808837890625, -0.79296875, -0.3050537109375, 0.182861328125, 0.6707763671875, 1.15869140625, 1.6466064453125, 2.134521484375, 2.6224365234375, 3.1103515625, 3.5982666015625, 4.086181640625, 4.5740966796875, 5.06201171875, 5.5499267578125, 6.037841796875, 6.5257568359375, 7.013671875, 7.5015869140625, 7.989501953125, 8.4774169921875, 8.96533203125, 9.4532470703125, 9.941162109375, 10.4290771484375, 10.9169921875, 11.4049072265625, 11.892822265625, 12.3807373046875, 12.86865234375, 13.3565673828125, 13.844482421875, 14.3323974609375, 14.8203125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 4.0, 6.0, 10.0, 12.0, 17.0, 11.0, 22.0, 32.0, 35.0, 49.0, 53.0, 60.0, 108.0, 136.0, 115.0, 69.0, 43.0, 33.0, 31.0, 26.0, 25.0, 22.0, 18.0, 14.0, 8.0, 6.0, 4.0, 6.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004665374755859375, -0.0044901371002197266, -0.004314899444580078, -0.00413966178894043, -0.003964424133300781, -0.003789186477661133, -0.0036139488220214844, -0.003438711166381836, -0.0032634735107421875, -0.003088235855102539, -0.0029129981994628906, -0.002737760543823242, -0.0025625228881835938, -0.0023872852325439453, -0.002212047576904297, -0.0020368099212646484, -0.001861572265625, -0.0016863346099853516, -0.0015110969543457031, -0.0013358592987060547, -0.0011606216430664062, -0.0009853839874267578, -0.0008101463317871094, -0.0006349086761474609, -0.0004596710205078125, -0.00028443336486816406, -0.00010919570922851562, 6.604194641113281e-05, 0.00024127960205078125, 0.0004165172576904297, 0.0005917549133300781, 0.0007669925689697266, 0.000942230224609375, 0.0011174678802490234, 0.0012927055358886719, 0.0014679431915283203, 0.0016431808471679688, 0.0018184185028076172, 0.0019936561584472656, 0.002168893814086914, 0.0023441314697265625, 0.002519369125366211, 0.0026946067810058594, 0.002869844436645508, 0.0030450820922851562, 0.0032203197479248047, 0.003395557403564453, 0.0035707950592041016, 0.00374603271484375, 0.0039212703704833984, 0.004096508026123047, 0.004271745681762695, 0.004446983337402344, 0.004622220993041992, 0.004797458648681641, 0.004972696304321289, 0.0051479339599609375, 0.005323171615600586, 0.005498409271240234, 0.005673646926879883, 0.005848884582519531, 0.00602412223815918, 0.006199359893798828, 0.0063745975494384766, 0.006549835205078125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 6.0, 12.0, 12.0, 6.0, 22.0, 33.0, 34.0, 64.0, 153.0, 259.0, 584.0, 1623.0, 6686.0, 59173.0, 824423.0, 140199.0, 11378.0, 2432.0, 781.0, 313.0, 153.0, 75.0, 47.0, 30.0, 25.0, 7.0, 13.0, 6.0, 2.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.40625, -31.18994140625, -29.9736328125, -28.75732421875, -27.541015625, -26.32470703125, -25.1083984375, -23.89208984375, -22.67578125, -21.45947265625, -20.2431640625, -19.02685546875, -17.810546875, -16.59423828125, -15.3779296875, -14.16162109375, -12.9453125, -11.72900390625, -10.5126953125, -9.29638671875, -8.080078125, -6.86376953125, -5.6474609375, -4.43115234375, -3.21484375, -1.99853515625, -0.7822265625, 0.43408203125, 1.650390625, 2.86669921875, 4.0830078125, 5.29931640625, 6.515625, 7.73193359375, 8.9482421875, 10.16455078125, 11.380859375, 12.59716796875, 13.8134765625, 15.02978515625, 16.24609375, 17.46240234375, 18.6787109375, 19.89501953125, 21.111328125, 22.32763671875, 23.5439453125, 24.76025390625, 25.9765625, 27.19287109375, 28.4091796875, 29.62548828125, 30.841796875, 32.05810546875, 33.2744140625, 34.49072265625, 35.70703125, 36.92333984375, 38.1396484375, 39.35595703125, 40.572265625, 41.78857421875, 43.0048828125, 44.22119140625, 45.4375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 3.0, 6.0, 8.0, 10.0, 9.0, 17.0, 15.0, 14.0, 21.0, 22.0, 31.0, 56.0, 47.0, 65.0, 76.0, 78.0, 92.0, 87.0, 78.0, 51.0, 46.0, 38.0, 30.0, 21.0, 15.0, 16.0, 11.0, 6.0, 7.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.578125, -19.921142578125, -19.26416015625, -18.607177734375, -17.9501953125, -17.293212890625, -16.63623046875, -15.979248046875, -15.322265625, -14.665283203125, -14.00830078125, -13.351318359375, -12.6943359375, -12.037353515625, -11.38037109375, -10.723388671875, -10.06640625, -9.409423828125, -8.75244140625, -8.095458984375, -7.4384765625, -6.781494140625, -6.12451171875, -5.467529296875, -4.810546875, -4.153564453125, -3.49658203125, -2.839599609375, -2.1826171875, -1.525634765625, -0.86865234375, -0.211669921875, 0.4453125, 1.102294921875, 1.75927734375, 2.416259765625, 3.0732421875, 3.730224609375, 4.38720703125, 5.044189453125, 5.701171875, 6.358154296875, 7.01513671875, 7.672119140625, 8.3291015625, 8.986083984375, 9.64306640625, 10.300048828125, 10.95703125, 11.614013671875, 12.27099609375, 12.927978515625, 13.5849609375, 14.241943359375, 14.89892578125, 15.555908203125, 16.212890625, 16.869873046875, 17.52685546875, 18.183837890625, 18.8408203125, 19.497802734375, 20.15478515625, 20.811767578125, 21.46875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 14.0, 21.0, 53.0, 135.0, 205.0, 229.0, 150.0, 94.0, 56.0, 21.0, 10.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-654.52978515625, -634.3231811523438, -614.1166381835938, -593.9100341796875, -573.7034301757812, -553.496826171875, -533.290283203125, -513.0836791992188, -492.8771057128906, -472.6705322265625, -452.46392822265625, -432.2573547363281, -412.05078125, -391.84417724609375, -371.6376037597656, -351.4310302734375, -331.22442626953125, -311.0178527832031, -290.8112487792969, -270.60467529296875, -250.39808654785156, -230.19149780273438, -209.98492431640625, -189.77833557128906, -169.57174682617188, -149.3651580810547, -129.1585693359375, -108.95199584960938, -88.74540710449219, -68.538818359375, -48.332237243652344, -28.125656127929688, -7.91900634765625, 12.287578582763672, 32.494163513183594, 52.700748443603516, 72.90733337402344, 93.11392211914062, 113.32050323486328, 133.52708435058594, 153.73367309570312, 173.9402618408203, 194.1468505859375, 214.35342407226562, 234.5600128173828, 254.7666015625, 274.9731750488281, 295.17974853515625, 315.3863525390625, 335.5929260253906, 355.7995300292969, 376.006103515625, 396.21270751953125, 416.4192810058594, 436.6258544921875, 456.83245849609375, 477.0390319824219, 497.24560546875, 517.4522094726562, 537.6588134765625, 557.8653564453125, 578.0719604492188, 598.278564453125, 618.485107421875, 638.6917114257812]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 2.0, 4.0, 2.0, 6.0, 4.0, 3.0, 8.0, 10.0, 11.0, 14.0, 16.0, 14.0, 17.0, 18.0, 24.0, 34.0, 36.0, 23.0, 38.0, 47.0, 49.0, 52.0, 45.0, 37.0, 37.0, 45.0, 49.0, 35.0, 40.0, 42.0, 27.0, 31.0, 24.0, 26.0, 25.0, 21.0, 11.0, 12.0, 13.0, 15.0, 12.0, 3.0, 9.0, 1.0, 8.0, 6.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-234.61538696289062, -225.93736267089844, -217.25933837890625, -208.58131408691406, -199.90328979492188, -191.22525024414062, -182.54722595214844, -173.86920166015625, -165.19117736816406, -156.51315307617188, -147.8351287841797, -139.1571044921875, -130.47906494140625, -121.8010482788086, -113.12301635742188, -104.44499206542969, -95.7669677734375, -87.08894348144531, -78.41091918945312, -69.7328872680664, -61.05486297607422, -52.37683868408203, -43.69881057739258, -35.020782470703125, -26.342758178710938, -17.664731979370117, -8.986705780029297, -0.30867958068847656, 8.369346618652344, 17.04737091064453, 25.725399017333984, 34.40342712402344, 43.0814208984375, 51.75944519042969, 60.43747329711914, 69.1155014038086, 77.79352569580078, 86.47154998779297, 95.14958190917969, 103.82760620117188, 112.50563049316406, 121.18365478515625, 129.86167907714844, 138.53970336914062, 147.21774291992188, 155.895751953125, 164.57379150390625, 173.25181579589844, 181.92984008789062, 190.6078643798828, 199.285888671875, 207.9639129638672, 216.64193725585938, 225.31997680664062, 233.9980010986328, 242.676025390625, 251.3540496826172, 260.0320739746094, 268.7101135253906, 277.38812255859375, 286.066162109375, 294.7441711425781, 303.4222106933594, 312.1002197265625, 320.77825927734375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 10.0, 8.0, 16.0, 31.0, 25.0, 47.0, 57.0, 109.0, 118.0, 208.0, 289.0, 412.0, 680.0, 987.0, 1660.0, 2665.0, 4582.0, 8298.0, 15517.0, 34081.0, 91661.0, 395393.0, 2278083.0, 1068718.0, 185578.0, 55204.0, 23172.0, 11363.0, 6014.0, 3456.0, 1990.0, 1318.0, 795.0, 528.0, 373.0, 241.0, 184.0, 109.0, 106.0, 54.0, 34.0, 35.0, 17.0, 21.0, 10.0, 3.0, 6.0, 6.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-21.40625, -20.71044921875, -20.0146484375, -19.31884765625, -18.623046875, -17.92724609375, -17.2314453125, -16.53564453125, -15.83984375, -15.14404296875, -14.4482421875, -13.75244140625, -13.056640625, -12.36083984375, -11.6650390625, -10.96923828125, -10.2734375, -9.57763671875, -8.8818359375, -8.18603515625, -7.490234375, -6.79443359375, -6.0986328125, -5.40283203125, -4.70703125, -4.01123046875, -3.3154296875, -2.61962890625, -1.923828125, -1.22802734375, -0.5322265625, 0.16357421875, 0.859375, 1.55517578125, 2.2509765625, 2.94677734375, 3.642578125, 4.33837890625, 5.0341796875, 5.72998046875, 6.42578125, 7.12158203125, 7.8173828125, 8.51318359375, 9.208984375, 9.90478515625, 10.6005859375, 11.29638671875, 11.9921875, 12.68798828125, 13.3837890625, 14.07958984375, 14.775390625, 15.47119140625, 16.1669921875, 16.86279296875, 17.55859375, 18.25439453125, 18.9501953125, 19.64599609375, 20.341796875, 21.03759765625, 21.7333984375, 22.42919921875, 23.125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 6.0, 4.0, 5.0, 7.0, 5.0, 12.0, 12.0, 10.0, 17.0, 17.0, 21.0, 25.0, 22.0, 30.0, 24.0, 32.0, 42.0, 48.0, 36.0, 44.0, 45.0, 43.0, 46.0, 48.0, 48.0, 38.0, 38.0, 42.0, 39.0, 30.0, 27.0, 31.0, 17.0, 21.0, 16.0, 10.0, 10.0, 11.0, 7.0, 7.0, 7.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.03125, -12.5894775390625, -12.147705078125, -11.7059326171875, -11.26416015625, -10.8223876953125, -10.380615234375, -9.9388427734375, -9.4970703125, -9.0552978515625, -8.613525390625, -8.1717529296875, -7.72998046875, -7.2882080078125, -6.846435546875, -6.4046630859375, -5.962890625, -5.5211181640625, -5.079345703125, -4.6375732421875, -4.19580078125, -3.7540283203125, -3.312255859375, -2.8704833984375, -2.4287109375, -1.9869384765625, -1.545166015625, -1.1033935546875, -0.66162109375, -0.2198486328125, 0.221923828125, 0.6636962890625, 1.10546875, 1.5472412109375, 1.989013671875, 2.4307861328125, 2.87255859375, 3.3143310546875, 3.756103515625, 4.1978759765625, 4.6396484375, 5.0814208984375, 5.523193359375, 5.9649658203125, 6.40673828125, 6.8485107421875, 7.290283203125, 7.7320556640625, 8.173828125, 8.6156005859375, 9.057373046875, 9.4991455078125, 9.94091796875, 10.3826904296875, 10.824462890625, 11.2662353515625, 11.7080078125, 12.1497802734375, 12.591552734375, 13.0333251953125, 13.47509765625, 13.9168701171875, 14.358642578125, 14.8004150390625, 15.2421875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 7.0, 1.0, 5.0, 1.0, 1.0, 12.0, 12.0, 21.0, 18.0, 23.0, 42.0, 93.0, 102.0, 198.0, 347.0, 671.0, 1369.0, 3233.0, 9162.0, 36854.0, 280708.0, 3526244.0, 282902.0, 36683.0, 9309.0, 3283.0, 1378.0, 725.0, 352.0, 205.0, 113.0, 79.0, 48.0, 28.0, 20.0, 10.0, 5.0, 6.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-64.5, -62.73291015625, -60.9658203125, -59.19873046875, -57.431640625, -55.66455078125, -53.8974609375, -52.13037109375, -50.36328125, -48.59619140625, -46.8291015625, -45.06201171875, -43.294921875, -41.52783203125, -39.7607421875, -37.99365234375, -36.2265625, -34.45947265625, -32.6923828125, -30.92529296875, -29.158203125, -27.39111328125, -25.6240234375, -23.85693359375, -22.08984375, -20.32275390625, -18.5556640625, -16.78857421875, -15.021484375, -13.25439453125, -11.4873046875, -9.72021484375, -7.953125, -6.18603515625, -4.4189453125, -2.65185546875, -0.884765625, 0.88232421875, 2.6494140625, 4.41650390625, 6.18359375, 7.95068359375, 9.7177734375, 11.48486328125, 13.251953125, 15.01904296875, 16.7861328125, 18.55322265625, 20.3203125, 22.08740234375, 23.8544921875, 25.62158203125, 27.388671875, 29.15576171875, 30.9228515625, 32.68994140625, 34.45703125, 36.22412109375, 37.9912109375, 39.75830078125, 41.525390625, 43.29248046875, 45.0595703125, 46.82666015625, 48.59375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 9.0, 5.0, 6.0, 6.0, 11.0, 16.0, 18.0, 29.0, 50.0, 60.0, 104.0, 184.0, 340.0, 674.0, 1075.0, 670.0, 300.0, 191.0, 108.0, 58.0, 36.0, 28.0, 26.0, 10.0, 18.0, 9.0, 9.0, 2.0, 4.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-65.3125, -63.521484375, -61.73046875, -59.939453125, -58.1484375, -56.357421875, -54.56640625, -52.775390625, -50.984375, -49.193359375, -47.40234375, -45.611328125, -43.8203125, -42.029296875, -40.23828125, -38.447265625, -36.65625, -34.865234375, -33.07421875, -31.283203125, -29.4921875, -27.701171875, -25.91015625, -24.119140625, -22.328125, -20.537109375, -18.74609375, -16.955078125, -15.1640625, -13.373046875, -11.58203125, -9.791015625, -8.0, -6.208984375, -4.41796875, -2.626953125, -0.8359375, 0.955078125, 2.74609375, 4.537109375, 6.328125, 8.119140625, 9.91015625, 11.701171875, 13.4921875, 15.283203125, 17.07421875, 18.865234375, 20.65625, 22.447265625, 24.23828125, 26.029296875, 27.8203125, 29.611328125, 31.40234375, 33.193359375, 34.984375, 36.775390625, 38.56640625, 40.357421875, 42.1484375, 43.939453125, 45.73046875, 47.521484375, 49.3125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 2.0, 3.0, 15.0, 14.0, 26.0, 40.0, 61.0, 103.0, 188.0, 185.0, 152.0, 81.0, 56.0, 31.0, 14.0, 10.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-579.1993408203125, -563.2213745117188, -547.2434692382812, -531.2655029296875, -515.2875366210938, -499.30963134765625, -483.3316650390625, -467.3537292480469, -451.37579345703125, -435.3978576660156, -419.4198913574219, -403.44195556640625, -387.4640197753906, -371.486083984375, -355.50811767578125, -339.5301818847656, -323.5522155761719, -307.57427978515625, -291.5963134765625, -275.6183776855469, -259.64044189453125, -243.66249084472656, -227.68453979492188, -211.70660400390625, -195.72865295410156, -179.75070190429688, -163.77276611328125, -147.79481506347656, -131.81686401367188, -115.83892822265625, -99.86097717285156, -83.8830337524414, -67.90512084960938, -51.92717742919922, -35.9492301940918, -19.971282958984375, -3.9933395385742188, 11.984603881835938, 27.962554931640625, 43.94049835205078, 59.91844177246094, 75.8963851928711, 91.87432861328125, 107.85227966308594, 123.8302230834961, 139.80816650390625, 155.78611755371094, 171.76406860351562, 187.74200439453125, 203.71995544433594, 219.69789123535156, 235.67584228515625, 251.65377807617188, 267.6317138671875, 283.60968017578125, 299.5876159667969, 315.5655517578125, 331.5434875488281, 347.5214538574219, 363.4993896484375, 379.4773254394531, 395.45526123046875, 411.4332275390625, 427.4111633300781, 443.3891296386719]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 5.0, 2.0, 4.0, 7.0, 1.0, 4.0, 12.0, 13.0, 15.0, 20.0, 28.0, 31.0, 26.0, 30.0, 44.0, 30.0, 31.0, 40.0, 46.0, 47.0, 40.0, 40.0, 40.0, 38.0, 52.0, 46.0, 35.0, 31.0, 28.0, 35.0, 26.0, 32.0, 8.0, 19.0, 22.0, 17.0, 13.0, 11.0, 9.0, 6.0, 5.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-211.9520263671875, -205.6383056640625, -199.3245849609375, -193.01084899902344, -186.69712829589844, -180.38340759277344, -174.06967163085938, -167.75595092773438, -161.44223022460938, -155.12850952148438, -148.81478881835938, -142.5010528564453, -136.1873321533203, -129.8736114501953, -123.55988311767578, -117.24615478515625, -110.93243408203125, -104.61871337890625, -98.30498504638672, -91.99125671386719, -85.67753601074219, -79.36381530761719, -73.05008697509766, -66.73635864257812, -60.422637939453125, -54.10891342163086, -47.795188903808594, -41.48146438598633, -35.16773986816406, -28.854015350341797, -22.54029083251953, -16.226566314697266, -9.912857055664062, -3.599132537841797, 2.7145919799804688, 9.028316497802734, 15.342041015625, 21.655765533447266, 27.96949005126953, 34.2832145690918, 40.59693908691406, 46.91066360473633, 53.224388122558594, 59.53811264038086, 65.85183715820312, 72.16555786132812, 78.47928619384766, 84.79301452636719, 91.10673522949219, 97.42045593261719, 103.73418426513672, 110.04791259765625, 116.36163330078125, 122.67535400390625, 128.98907470703125, 135.3028106689453, 141.6165313720703, 147.9302520751953, 154.24398803710938, 160.55770874023438, 166.87142944335938, 173.18515014648438, 179.49887084960938, 185.81260681152344, 192.12632751464844]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 12.0, 13.0, 15.0, 27.0, 32.0, 63.0, 80.0, 121.0, 208.0, 330.0, 601.0, 939.0, 1661.0, 2968.0, 5658.0, 10758.0, 21929.0, 48527.0, 127882.0, 398265.0, 273544.0, 84540.0, 35445.0, 16606.0, 8252.0, 4356.0, 2342.0, 1312.0, 803.0, 482.0, 297.0, 155.0, 114.0, 75.0, 41.0, 29.0, 17.0, 15.0, 16.0, 5.0, 3.0, 7.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.28125, -31.2333984375, -30.185546875, -29.1376953125, -28.08984375, -27.0419921875, -25.994140625, -24.9462890625, -23.8984375, -22.8505859375, -21.802734375, -20.7548828125, -19.70703125, -18.6591796875, -17.611328125, -16.5634765625, -15.515625, -14.4677734375, -13.419921875, -12.3720703125, -11.32421875, -10.2763671875, -9.228515625, -8.1806640625, -7.1328125, -6.0849609375, -5.037109375, -3.9892578125, -2.94140625, -1.8935546875, -0.845703125, 0.2021484375, 1.25, 2.2978515625, 3.345703125, 4.3935546875, 5.44140625, 6.4892578125, 7.537109375, 8.5849609375, 9.6328125, 10.6806640625, 11.728515625, 12.7763671875, 13.82421875, 14.8720703125, 15.919921875, 16.9677734375, 18.015625, 19.0634765625, 20.111328125, 21.1591796875, 22.20703125, 23.2548828125, 24.302734375, 25.3505859375, 26.3984375, 27.4462890625, 28.494140625, 29.5419921875, 30.58984375, 31.6376953125, 32.685546875, 33.7333984375, 34.78125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 5.0, 1.0, 3.0, 0.0, 4.0, 6.0, 6.0, 8.0, 8.0, 8.0, 12.0, 17.0, 13.0, 24.0, 30.0, 26.0, 19.0, 29.0, 32.0, 36.0, 34.0, 46.0, 46.0, 42.0, 58.0, 45.0, 47.0, 56.0, 42.0, 54.0, 33.0, 27.0, 39.0, 23.0, 23.0, 23.0, 11.0, 13.0, 12.0, 11.0, 9.0, 11.0, 5.0, 4.0, 6.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.125, -15.6556396484375, -15.186279296875, -14.7169189453125, -14.24755859375, -13.7781982421875, -13.308837890625, -12.8394775390625, -12.3701171875, -11.9007568359375, -11.431396484375, -10.9620361328125, -10.49267578125, -10.0233154296875, -9.553955078125, -9.0845947265625, -8.615234375, -8.1458740234375, -7.676513671875, -7.2071533203125, -6.73779296875, -6.2684326171875, -5.799072265625, -5.3297119140625, -4.8603515625, -4.3909912109375, -3.921630859375, -3.4522705078125, -2.98291015625, -2.5135498046875, -2.044189453125, -1.5748291015625, -1.10546875, -0.6361083984375, -0.166748046875, 0.3026123046875, 0.77197265625, 1.2413330078125, 1.710693359375, 2.1800537109375, 2.6494140625, 3.1187744140625, 3.588134765625, 4.0574951171875, 4.52685546875, 4.9962158203125, 5.465576171875, 5.9349365234375, 6.404296875, 6.8736572265625, 7.343017578125, 7.8123779296875, 8.28173828125, 8.7510986328125, 9.220458984375, 9.6898193359375, 10.1591796875, 10.6285400390625, 11.097900390625, 11.5672607421875, 12.03662109375, 12.5059814453125, 12.975341796875, 13.4447021484375, 13.9140625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 0.0, 3.0, 7.0, 5.0, 13.0, 14.0, 12.0, 34.0, 40.0, 39.0, 78.0, 105.0, 191.0, 324.0, 684.0, 1624.0, 5370.0, 42067.0, 885242.0, 99777.0, 8802.0, 2187.0, 895.0, 404.0, 249.0, 128.0, 90.0, 50.0, 31.0, 28.0, 16.0, 16.0, 9.0, 8.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-123.375, -119.7080078125, -116.041015625, -112.3740234375, -108.70703125, -105.0400390625, -101.373046875, -97.7060546875, -94.0390625, -90.3720703125, -86.705078125, -83.0380859375, -79.37109375, -75.7041015625, -72.037109375, -68.3701171875, -64.703125, -61.0361328125, -57.369140625, -53.7021484375, -50.03515625, -46.3681640625, -42.701171875, -39.0341796875, -35.3671875, -31.7001953125, -28.033203125, -24.3662109375, -20.69921875, -17.0322265625, -13.365234375, -9.6982421875, -6.03125, -2.3642578125, 1.302734375, 4.9697265625, 8.63671875, 12.3037109375, 15.970703125, 19.6376953125, 23.3046875, 26.9716796875, 30.638671875, 34.3056640625, 37.97265625, 41.6396484375, 45.306640625, 48.9736328125, 52.640625, 56.3076171875, 59.974609375, 63.6416015625, 67.30859375, 70.9755859375, 74.642578125, 78.3095703125, 81.9765625, 85.6435546875, 89.310546875, 92.9775390625, 96.64453125, 100.3115234375, 103.978515625, 107.6455078125, 111.3125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 1.0, 4.0, 4.0, 3.0, 4.0, 3.0, 15.0, 14.0, 16.0, 22.0, 19.0, 21.0, 26.0, 34.0, 38.0, 40.0, 51.0, 49.0, 51.0, 46.0, 64.0, 44.0, 42.0, 49.0, 51.0, 51.0, 36.0, 40.0, 26.0, 32.0, 22.0, 22.0, 18.0, 8.0, 11.0, 8.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-96.3125, -93.689453125, -91.06640625, -88.443359375, -85.8203125, -83.197265625, -80.57421875, -77.951171875, -75.328125, -72.705078125, -70.08203125, -67.458984375, -64.8359375, -62.212890625, -59.58984375, -56.966796875, -54.34375, -51.720703125, -49.09765625, -46.474609375, -43.8515625, -41.228515625, -38.60546875, -35.982421875, -33.359375, -30.736328125, -28.11328125, -25.490234375, -22.8671875, -20.244140625, -17.62109375, -14.998046875, -12.375, -9.751953125, -7.12890625, -4.505859375, -1.8828125, 0.740234375, 3.36328125, 5.986328125, 8.609375, 11.232421875, 13.85546875, 16.478515625, 19.1015625, 21.724609375, 24.34765625, 26.970703125, 29.59375, 32.216796875, 34.83984375, 37.462890625, 40.0859375, 42.708984375, 45.33203125, 47.955078125, 50.578125, 53.201171875, 55.82421875, 58.447265625, 61.0703125, 63.693359375, 66.31640625, 68.939453125, 71.5625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 3.0, 4.0, 6.0, 0.0, 3.0, 4.0, 13.0, 17.0, 17.0, 34.0, 46.0, 69.0, 103.0, 177.0, 293.0, 556.0, 1119.0, 3016.0, 9479.0, 43598.0, 589325.0, 353679.0, 34112.0, 7946.0, 2677.0, 1051.0, 463.0, 278.0, 166.0, 104.0, 51.0, 40.0, 33.0, 21.0, 14.0, 8.0, 10.0, 6.0, 4.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.625, -30.568359375, -29.51171875, -28.455078125, -27.3984375, -26.341796875, -25.28515625, -24.228515625, -23.171875, -22.115234375, -21.05859375, -20.001953125, -18.9453125, -17.888671875, -16.83203125, -15.775390625, -14.71875, -13.662109375, -12.60546875, -11.548828125, -10.4921875, -9.435546875, -8.37890625, -7.322265625, -6.265625, -5.208984375, -4.15234375, -3.095703125, -2.0390625, -0.982421875, 0.07421875, 1.130859375, 2.1875, 3.244140625, 4.30078125, 5.357421875, 6.4140625, 7.470703125, 8.52734375, 9.583984375, 10.640625, 11.697265625, 12.75390625, 13.810546875, 14.8671875, 15.923828125, 16.98046875, 18.037109375, 19.09375, 20.150390625, 21.20703125, 22.263671875, 23.3203125, 24.376953125, 25.43359375, 26.490234375, 27.546875, 28.603515625, 29.66015625, 30.716796875, 31.7734375, 32.830078125, 33.88671875, 34.943359375, 36.0]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 8.0, 14.0, 18.0, 24.0, 43.0, 68.0, 168.0, 299.0, 159.0, 80.0, 36.0, 27.0, 10.0, 9.0, 12.0, 6.0, 7.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01123046875, -0.010807275772094727, -0.010384082794189453, -0.00996088981628418, -0.009537696838378906, -0.009114503860473633, -0.00869131088256836, -0.008268117904663086, -0.007844924926757812, -0.007421731948852539, -0.006998538970947266, -0.006575345993041992, -0.006152153015136719, -0.005728960037231445, -0.005305767059326172, -0.0048825740814208984, -0.004459381103515625, -0.0040361881256103516, -0.003612995147705078, -0.0031898021697998047, -0.0027666091918945312, -0.002343416213989258, -0.0019202232360839844, -0.001497030258178711, -0.0010738372802734375, -0.0006506443023681641, -0.00022745132446289062, 0.0001957416534423828, 0.0006189346313476562, 0.0010421276092529297, 0.0014653205871582031, 0.0018885135650634766, 0.00231170654296875, 0.0027348995208740234, 0.003158092498779297, 0.0035812854766845703, 0.004004478454589844, 0.004427671432495117, 0.004850864410400391, 0.005274057388305664, 0.0056972503662109375, 0.006120443344116211, 0.006543636322021484, 0.006966829299926758, 0.007390022277832031, 0.007813215255737305, 0.008236408233642578, 0.008659601211547852, 0.009082794189453125, 0.009505987167358398, 0.009929180145263672, 0.010352373123168945, 0.010775566101074219, 0.011198759078979492, 0.011621952056884766, 0.012045145034790039, 0.012468338012695312, 0.012891530990600586, 0.01331472396850586, 0.013737916946411133, 0.014161109924316406, 0.01458430290222168, 0.015007495880126953, 0.015430688858032227, 0.0158538818359375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 6.0, 8.0, 9.0, 9.0, 13.0, 31.0, 44.0, 46.0, 103.0, 160.0, 299.0, 644.0, 1619.0, 5760.0, 39874.0, 812286.0, 169935.0, 12775.0, 2930.0, 982.0, 455.0, 229.0, 117.0, 75.0, 53.0, 28.0, 12.0, 11.0, 12.0, 8.0, 6.0, 3.0, 5.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.9375, -48.5, -47.0625, -45.625, -44.1875, -42.75, -41.3125, -39.875, -38.4375, -37.0, -35.5625, -34.125, -32.6875, -31.25, -29.8125, -28.375, -26.9375, -25.5, -24.0625, -22.625, -21.1875, -19.75, -18.3125, -16.875, -15.4375, -14.0, -12.5625, -11.125, -9.6875, -8.25, -6.8125, -5.375, -3.9375, -2.5, -1.0625, 0.375, 1.8125, 3.25, 4.6875, 6.125, 7.5625, 9.0, 10.4375, 11.875, 13.3125, 14.75, 16.1875, 17.625, 19.0625, 20.5, 21.9375, 23.375, 24.8125, 26.25, 27.6875, 29.125, 30.5625, 32.0, 33.4375, 34.875, 36.3125, 37.75, 39.1875, 40.625, 42.0625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 8.0, 10.0, 8.0, 26.0, 21.0, 22.0, 49.0, 30.0, 43.0, 40.0, 67.0, 75.0, 87.0, 67.0, 74.0, 78.0, 50.0, 41.0, 43.0, 37.0, 17.0, 17.0, 20.0, 12.0, 7.0, 15.0, 4.0, 7.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.0, -24.262939453125, -23.52587890625, -22.788818359375, -22.0517578125, -21.314697265625, -20.57763671875, -19.840576171875, -19.103515625, -18.366455078125, -17.62939453125, -16.892333984375, -16.1552734375, -15.418212890625, -14.68115234375, -13.944091796875, -13.20703125, -12.469970703125, -11.73291015625, -10.995849609375, -10.2587890625, -9.521728515625, -8.78466796875, -8.047607421875, -7.310546875, -6.573486328125, -5.83642578125, -5.099365234375, -4.3623046875, -3.625244140625, -2.88818359375, -2.151123046875, -1.4140625, -0.677001953125, 0.06005859375, 0.797119140625, 1.5341796875, 2.271240234375, 3.00830078125, 3.745361328125, 4.482421875, 5.219482421875, 5.95654296875, 6.693603515625, 7.4306640625, 8.167724609375, 8.90478515625, 9.641845703125, 10.37890625, 11.115966796875, 11.85302734375, 12.590087890625, 13.3271484375, 14.064208984375, 14.80126953125, 15.538330078125, 16.275390625, 17.012451171875, 17.74951171875, 18.486572265625, 19.2236328125, 19.960693359375, 20.69775390625, 21.434814453125, 22.171875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 14.0, 49.0, 102.0, 228.0, 285.0, 168.0, 82.0, 24.0, 17.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-892.9130859375, -867.6424560546875, -842.3717651367188, -817.1011352539062, -791.8304443359375, -766.559814453125, -741.2891845703125, -716.0184936523438, -690.747802734375, -665.4771728515625, -640.2064819335938, -614.9358520507812, -589.6651611328125, -564.39453125, -539.1239013671875, -513.8532104492188, -488.58258056640625, -463.3119201660156, -438.041259765625, -412.7706298828125, -387.49993896484375, -362.22930908203125, -336.9586486816406, -311.68798828125, -286.4173278808594, -261.14666748046875, -235.87600708007812, -210.60536193847656, -185.33470153808594, -160.0640411376953, -134.79339599609375, -109.52273559570312, -84.25201416015625, -58.98135757446289, -33.71070098876953, -8.440048217773438, 16.830612182617188, 42.10127258300781, 67.37191772460938, 92.642578125, 117.91323852539062, 143.18389892578125, 168.45455932617188, 193.72520446777344, 218.99586486816406, 244.2665252685547, 269.53717041015625, 294.8078308105469, 320.0784912109375, 345.3491516113281, 370.61981201171875, 395.89044189453125, 421.1611328125, 446.4317626953125, 471.7024230957031, 496.97308349609375, 522.2437744140625, 547.514404296875, 572.7850952148438, 598.0557250976562, 623.326416015625, 648.5970458984375, 673.86767578125, 699.1383666992188, 724.4089965820312]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 10.0, 6.0, 7.0, 9.0, 8.0, 17.0, 21.0, 19.0, 23.0, 27.0, 36.0, 50.0, 50.0, 49.0, 55.0, 68.0, 64.0, 55.0, 65.0, 64.0, 46.0, 41.0, 31.0, 23.0, 35.0, 23.0, 25.0, 18.0, 12.0, 16.0, 11.0, 5.0, 5.0, 3.0, 0.0, 7.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-322.068603515625, -311.17230224609375, -300.2759704589844, -289.3796691894531, -278.4833679199219, -267.5870361328125, -256.69073486328125, -245.79443359375, -234.8981170654297, -224.00180053710938, -213.10549926757812, -202.2091827392578, -191.3128662109375, -180.41656494140625, -169.52024841308594, -158.62393188476562, -147.72763061523438, -136.83131408691406, -125.93501281738281, -115.0386962890625, -104.14238739013672, -93.24607849121094, -82.34976196289062, -71.45345306396484, -60.55714416503906, -49.66083526611328, -38.764522552490234, -27.868209838867188, -16.971900939941406, -6.075592041015625, 4.8207244873046875, 15.717033386230469, 26.613311767578125, 37.509620666503906, 48.40593338012695, 59.30224609375, 70.19855499267578, 81.09486389160156, 91.99118041992188, 102.88748931884766, 113.78379821777344, 124.68010711669922, 135.576416015625, 146.4727325439453, 157.36904907226562, 168.26535034179688, 179.1616668701172, 190.0579833984375, 200.95428466796875, 211.85060119628906, 222.7469024658203, 233.64321899414062, 244.53952026367188, 255.4358367919922, 266.3321533203125, 277.22845458984375, 288.124755859375, 299.02105712890625, 309.9173889160156, 320.8136901855469, 331.7099914550781, 342.6063232421875, 353.50262451171875, 364.39892578125, 375.2952575683594]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 1.0, 6.0, 5.0, 12.0, 12.0, 14.0, 17.0, 31.0, 45.0, 49.0, 88.0, 124.0, 280.0, 3327.0, 1225116.0, 2960126.0, 4253.0, 353.0, 117.0, 90.0, 57.0, 42.0, 30.0, 22.0, 17.0, 11.0, 19.0, 6.0, 0.0, 4.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-153.125, -148.19140625, -143.2578125, -138.32421875, -133.390625, -128.45703125, -123.5234375, -118.58984375, -113.65625, -108.72265625, -103.7890625, -98.85546875, -93.921875, -88.98828125, -84.0546875, -79.12109375, -74.1875, -69.25390625, -64.3203125, -59.38671875, -54.453125, -49.51953125, -44.5859375, -39.65234375, -34.71875, -29.78515625, -24.8515625, -19.91796875, -14.984375, -10.05078125, -5.1171875, -0.18359375, 4.75, 9.68359375, 14.6171875, 19.55078125, 24.484375, 29.41796875, 34.3515625, 39.28515625, 44.21875, 49.15234375, 54.0859375, 59.01953125, 63.953125, 68.88671875, 73.8203125, 78.75390625, 83.6875, 88.62109375, 93.5546875, 98.48828125, 103.421875, 108.35546875, 113.2890625, 118.22265625, 123.15625, 128.08984375, 133.0234375, 137.95703125, 142.890625, 147.82421875, 152.7578125, 157.69140625, 162.625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 4.0, 4.0, 10.0, 4.0, 9.0, 8.0, 13.0, 15.0, 32.0, 37.0, 27.0, 45.0, 53.0, 61.0, 71.0, 70.0, 63.0, 71.0, 70.0, 55.0, 50.0, 61.0, 45.0, 39.0, 23.0, 15.0, 17.0, 15.0, 6.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.7109375, -15.0499267578125, -14.388916015625, -13.7279052734375, -13.06689453125, -12.4058837890625, -11.744873046875, -11.0838623046875, -10.4228515625, -9.7618408203125, -9.100830078125, -8.4398193359375, -7.77880859375, -7.1177978515625, -6.456787109375, -5.7957763671875, -5.134765625, -4.4737548828125, -3.812744140625, -3.1517333984375, -2.49072265625, -1.8297119140625, -1.168701171875, -0.5076904296875, 0.1533203125, 0.8143310546875, 1.475341796875, 2.1363525390625, 2.79736328125, 3.4583740234375, 4.119384765625, 4.7803955078125, 5.44140625, 6.1024169921875, 6.763427734375, 7.4244384765625, 8.08544921875, 8.7464599609375, 9.407470703125, 10.0684814453125, 10.7294921875, 11.3905029296875, 12.051513671875, 12.7125244140625, 13.37353515625, 14.0345458984375, 14.695556640625, 15.3565673828125, 16.017578125, 16.6785888671875, 17.339599609375, 18.0006103515625, 18.66162109375, 19.3226318359375, 19.983642578125, 20.6446533203125, 21.3056640625, 21.9666748046875, 22.627685546875, 23.2886962890625, 23.94970703125, 24.6107177734375, 25.271728515625, 25.9327392578125, 26.59375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 9.0, 2.0, 13.0, 16.0, 19.0, 29.0, 51.0, 80.0, 139.0, 206.0, 332.0, 643.0, 1160.0, 2162.0, 4568.0, 10696.0, 28556.0, 101457.0, 828424.0, 2844014.0, 281927.0, 56051.0, 18701.0, 7664.0, 3484.0, 1720.0, 845.0, 512.0, 309.0, 170.0, 118.0, 62.0, 48.0, 30.0, 19.0, 11.0, 14.0, 7.0, 4.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-36.34375, -35.1025390625, -33.861328125, -32.6201171875, -31.37890625, -30.1376953125, -28.896484375, -27.6552734375, -26.4140625, -25.1728515625, -23.931640625, -22.6904296875, -21.44921875, -20.2080078125, -18.966796875, -17.7255859375, -16.484375, -15.2431640625, -14.001953125, -12.7607421875, -11.51953125, -10.2783203125, -9.037109375, -7.7958984375, -6.5546875, -5.3134765625, -4.072265625, -2.8310546875, -1.58984375, -0.3486328125, 0.892578125, 2.1337890625, 3.375, 4.6162109375, 5.857421875, 7.0986328125, 8.33984375, 9.5810546875, 10.822265625, 12.0634765625, 13.3046875, 14.5458984375, 15.787109375, 17.0283203125, 18.26953125, 19.5107421875, 20.751953125, 21.9931640625, 23.234375, 24.4755859375, 25.716796875, 26.9580078125, 28.19921875, 29.4404296875, 30.681640625, 31.9228515625, 33.1640625, 34.4052734375, 35.646484375, 36.8876953125, 38.12890625, 39.3701171875, 40.611328125, 41.8525390625, 43.09375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 4.0, 6.0, 7.0, 7.0, 12.0, 18.0, 20.0, 29.0, 49.0, 63.0, 87.0, 161.0, 253.0, 492.0, 811.0, 763.0, 517.0, 287.0, 162.0, 98.0, 58.0, 40.0, 29.0, 24.0, 25.0, 5.0, 12.0, 7.0, 5.0, 10.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.40625, -45.82275390625, -44.2392578125, -42.65576171875, -41.072265625, -39.48876953125, -37.9052734375, -36.32177734375, -34.73828125, -33.15478515625, -31.5712890625, -29.98779296875, -28.404296875, -26.82080078125, -25.2373046875, -23.65380859375, -22.0703125, -20.48681640625, -18.9033203125, -17.31982421875, -15.736328125, -14.15283203125, -12.5693359375, -10.98583984375, -9.40234375, -7.81884765625, -6.2353515625, -4.65185546875, -3.068359375, -1.48486328125, 0.0986328125, 1.68212890625, 3.265625, 4.84912109375, 6.4326171875, 8.01611328125, 9.599609375, 11.18310546875, 12.7666015625, 14.35009765625, 15.93359375, 17.51708984375, 19.1005859375, 20.68408203125, 22.267578125, 23.85107421875, 25.4345703125, 27.01806640625, 28.6015625, 30.18505859375, 31.7685546875, 33.35205078125, 34.935546875, 36.51904296875, 38.1025390625, 39.68603515625, 41.26953125, 42.85302734375, 44.4365234375, 46.02001953125, 47.603515625, 49.18701171875, 50.7705078125, 52.35400390625, 53.9375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 1.0, 6.0, 8.0, 10.0, 29.0, 71.0, 151.0, 246.0, 218.0, 142.0, 60.0, 26.0, 7.0, 7.0, 5.0, 10.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-771.695556640625, -752.2750244140625, -732.8544311523438, -713.433837890625, -694.0133056640625, -674.5927734375, -655.1721801757812, -635.7515869140625, -616.3310546875, -596.9105224609375, -577.4899291992188, -558.0693359375, -538.6488037109375, -519.228271484375, -499.80767822265625, -480.3871154785156, -460.966552734375, -441.5459899902344, -422.12542724609375, -402.7048645019531, -383.2843017578125, -363.8637390136719, -344.44317626953125, -325.0226135253906, -305.60205078125, -286.1814880371094, -266.76092529296875, -247.34036254882812, -227.9197998046875, -208.49923706054688, -189.07867431640625, -169.65811157226562, -150.23760986328125, -130.81704711914062, -111.396484375, -91.97592163085938, -72.55535888671875, -53.134796142578125, -33.7142333984375, -14.293670654296875, 5.12689208984375, 24.547454833984375, 43.968017578125, 63.388580322265625, 82.80914306640625, 102.22970581054688, 121.6502685546875, 141.07083129882812, 160.49139404296875, 179.91195678710938, 199.33251953125, 218.75308227539062, 238.17364501953125, 257.5942077636719, 277.0147705078125, 296.4353332519531, 315.85589599609375, 335.2764587402344, 354.697021484375, 374.1175842285156, 393.53814697265625, 412.9587097167969, 432.3792724609375, 451.7998352050781, 471.22039794921875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 1.0, 5.0, 7.0, 8.0, 13.0, 15.0, 17.0, 16.0, 29.0, 18.0, 30.0, 27.0, 29.0, 40.0, 44.0, 46.0, 44.0, 45.0, 42.0, 44.0, 60.0, 47.0, 43.0, 39.0, 36.0, 40.0, 39.0, 34.0, 22.0, 26.0, 19.0, 14.0, 14.0, 9.0, 8.0, 13.0, 4.0, 8.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-292.1580810546875, -284.7128601074219, -277.26763916015625, -269.8224182128906, -262.377197265625, -254.93199157714844, -247.4867706298828, -240.04156494140625, -232.59634399414062, -225.151123046875, -217.70590209960938, -210.2606964111328, -202.8154754638672, -195.37025451660156, -187.92503356933594, -180.47982788085938, -173.03460693359375, -165.58938598632812, -158.1441650390625, -150.69895935058594, -143.2537384033203, -135.8085174560547, -128.36329650878906, -120.91808319091797, -113.47285461425781, -106.02763366699219, -98.5824203491211, -91.13719940185547, -83.69198608398438, -76.24676513671875, -68.80154418945312, -61.35633087158203, -53.91111755371094, -46.46590042114258, -39.02068328857422, -31.575464248657227, -24.130247116088867, -16.685028076171875, -9.239810943603516, -1.7945938110351562, 5.650623321533203, 13.095840454101562, 20.541057586669922, 27.986276626586914, 35.431495666503906, 42.876712799072266, 50.321929931640625, 57.767147064208984, 65.21236419677734, 72.65758514404297, 80.10279846191406, 87.54801940917969, 94.99323272705078, 102.4384536743164, 109.8836669921875, 117.32888793945312, 124.77410888671875, 132.21932983398438, 139.66455078125, 147.10975646972656, 154.5549774169922, 162.0001983642578, 169.44541931152344, 176.890625, 184.33584594726562]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 15.0, 13.0, 21.0, 22.0, 71.0, 84.0, 157.0, 281.0, 481.0, 799.0, 1492.0, 2839.0, 5808.0, 12567.0, 30434.0, 88977.0, 388337.0, 375212.0, 86561.0, 30069.0, 12436.0, 5687.0, 2718.0, 1528.0, 818.0, 477.0, 254.0, 144.0, 89.0, 71.0, 30.0, 22.0, 17.0, 10.0, 9.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.28125, -35.94921875, -34.6171875, -33.28515625, -31.953125, -30.62109375, -29.2890625, -27.95703125, -26.625, -25.29296875, -23.9609375, -22.62890625, -21.296875, -19.96484375, -18.6328125, -17.30078125, -15.96875, -14.63671875, -13.3046875, -11.97265625, -10.640625, -9.30859375, -7.9765625, -6.64453125, -5.3125, -3.98046875, -2.6484375, -1.31640625, 0.015625, 1.34765625, 2.6796875, 4.01171875, 5.34375, 6.67578125, 8.0078125, 9.33984375, 10.671875, 12.00390625, 13.3359375, 14.66796875, 16.0, 17.33203125, 18.6640625, 19.99609375, 21.328125, 22.66015625, 23.9921875, 25.32421875, 26.65625, 27.98828125, 29.3203125, 30.65234375, 31.984375, 33.31640625, 34.6484375, 35.98046875, 37.3125, 38.64453125, 39.9765625, 41.30859375, 42.640625, 43.97265625, 45.3046875, 46.63671875, 47.96875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 8.0, 5.0, 4.0, 4.0, 15.0, 7.0, 12.0, 14.0, 12.0, 16.0, 20.0, 27.0, 26.0, 32.0, 37.0, 33.0, 42.0, 29.0, 51.0, 55.0, 47.0, 42.0, 47.0, 47.0, 42.0, 37.0, 41.0, 36.0, 29.0, 28.0, 19.0, 24.0, 19.0, 17.0, 10.0, 16.0, 12.0, 5.0, 9.0, 5.0, 5.0, 3.0, 2.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-17.28125, -16.773193359375, -16.26513671875, -15.757080078125, -15.2490234375, -14.740966796875, -14.23291015625, -13.724853515625, -13.216796875, -12.708740234375, -12.20068359375, -11.692626953125, -11.1845703125, -10.676513671875, -10.16845703125, -9.660400390625, -9.15234375, -8.644287109375, -8.13623046875, -7.628173828125, -7.1201171875, -6.612060546875, -6.10400390625, -5.595947265625, -5.087890625, -4.579833984375, -4.07177734375, -3.563720703125, -3.0556640625, -2.547607421875, -2.03955078125, -1.531494140625, -1.0234375, -0.515380859375, -0.00732421875, 0.500732421875, 1.0087890625, 1.516845703125, 2.02490234375, 2.532958984375, 3.041015625, 3.549072265625, 4.05712890625, 4.565185546875, 5.0732421875, 5.581298828125, 6.08935546875, 6.597412109375, 7.10546875, 7.613525390625, 8.12158203125, 8.629638671875, 9.1376953125, 9.645751953125, 10.15380859375, 10.661865234375, 11.169921875, 11.677978515625, 12.18603515625, 12.694091796875, 13.2021484375, 13.710205078125, 14.21826171875, 14.726318359375, 15.234375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 3.0, 4.0, 8.0, 13.0, 17.0, 19.0, 36.0, 55.0, 86.0, 161.0, 282.0, 567.0, 1296.0, 3565.0, 15903.0, 197851.0, 784681.0, 34439.0, 5978.0, 1943.0, 776.0, 380.0, 166.0, 116.0, 77.0, 44.0, 25.0, 18.0, 13.0, 8.0, 6.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.5, -100.79296875, -97.0859375, -93.37890625, -89.671875, -85.96484375, -82.2578125, -78.55078125, -74.84375, -71.13671875, -67.4296875, -63.72265625, -60.015625, -56.30859375, -52.6015625, -48.89453125, -45.1875, -41.48046875, -37.7734375, -34.06640625, -30.359375, -26.65234375, -22.9453125, -19.23828125, -15.53125, -11.82421875, -8.1171875, -4.41015625, -0.703125, 3.00390625, 6.7109375, 10.41796875, 14.125, 17.83203125, 21.5390625, 25.24609375, 28.953125, 32.66015625, 36.3671875, 40.07421875, 43.78125, 47.48828125, 51.1953125, 54.90234375, 58.609375, 62.31640625, 66.0234375, 69.73046875, 73.4375, 77.14453125, 80.8515625, 84.55859375, 88.265625, 91.97265625, 95.6796875, 99.38671875, 103.09375, 106.80078125, 110.5078125, 114.21484375, 117.921875, 121.62890625, 125.3359375, 129.04296875, 132.75]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 6.0, 3.0, 5.0, 10.0, 14.0, 14.0, 17.0, 32.0, 24.0, 35.0, 39.0, 45.0, 48.0, 64.0, 57.0, 55.0, 65.0, 67.0, 59.0, 49.0, 53.0, 41.0, 39.0, 29.0, 35.0, 18.0, 25.0, 11.0, 10.0, 4.0, 5.0, 3.0, 0.0, 7.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-116.4375, -113.2392578125, -110.041015625, -106.8427734375, -103.64453125, -100.4462890625, -97.248046875, -94.0498046875, -90.8515625, -87.6533203125, -84.455078125, -81.2568359375, -78.05859375, -74.8603515625, -71.662109375, -68.4638671875, -65.265625, -62.0673828125, -58.869140625, -55.6708984375, -52.47265625, -49.2744140625, -46.076171875, -42.8779296875, -39.6796875, -36.4814453125, -33.283203125, -30.0849609375, -26.88671875, -23.6884765625, -20.490234375, -17.2919921875, -14.09375, -10.8955078125, -7.697265625, -4.4990234375, -1.30078125, 1.8974609375, 5.095703125, 8.2939453125, 11.4921875, 14.6904296875, 17.888671875, 21.0869140625, 24.28515625, 27.4833984375, 30.681640625, 33.8798828125, 37.078125, 40.2763671875, 43.474609375, 46.6728515625, 49.87109375, 53.0693359375, 56.267578125, 59.4658203125, 62.6640625, 65.8623046875, 69.060546875, 72.2587890625, 75.45703125, 78.6552734375, 81.853515625, 85.0517578125, 88.25]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 3.0, 7.0, 4.0, 9.0, 17.0, 16.0, 25.0, 31.0, 87.0, 170.0, 362.0, 1176.0, 4504.0, 32422.0, 773799.0, 218079.0, 13957.0, 2570.0, 741.0, 277.0, 133.0, 79.0, 33.0, 18.0, 11.0, 6.0, 6.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.96875, -51.13037109375, -49.2919921875, -47.45361328125, -45.615234375, -43.77685546875, -41.9384765625, -40.10009765625, -38.26171875, -36.42333984375, -34.5849609375, -32.74658203125, -30.908203125, -29.06982421875, -27.2314453125, -25.39306640625, -23.5546875, -21.71630859375, -19.8779296875, -18.03955078125, -16.201171875, -14.36279296875, -12.5244140625, -10.68603515625, -8.84765625, -7.00927734375, -5.1708984375, -3.33251953125, -1.494140625, 0.34423828125, 2.1826171875, 4.02099609375, 5.859375, 7.69775390625, 9.5361328125, 11.37451171875, 13.212890625, 15.05126953125, 16.8896484375, 18.72802734375, 20.56640625, 22.40478515625, 24.2431640625, 26.08154296875, 27.919921875, 29.75830078125, 31.5966796875, 33.43505859375, 35.2734375, 37.11181640625, 38.9501953125, 40.78857421875, 42.626953125, 44.46533203125, 46.3037109375, 48.14208984375, 49.98046875, 51.81884765625, 53.6572265625, 55.49560546875, 57.333984375, 59.17236328125, 61.0107421875, 62.84912109375, 64.6875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 3.0, 2.0, 5.0, 2.0, 10.0, 13.0, 13.0, 22.0, 29.0, 48.0, 71.0, 151.0, 190.0, 170.0, 90.0, 51.0, 48.0, 31.0, 15.0, 11.0, 6.0, 7.0, 7.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01163482666015625, -0.011334061622619629, -0.011033296585083008, -0.010732531547546387, -0.010431766510009766, -0.010131001472473145, -0.009830236434936523, -0.009529471397399902, -0.009228706359863281, -0.00892794132232666, -0.008627176284790039, -0.008326411247253418, -0.008025646209716797, -0.007724881172180176, -0.007424116134643555, -0.007123351097106934, -0.0068225860595703125, -0.006521821022033691, -0.00622105598449707, -0.005920290946960449, -0.005619525909423828, -0.005318760871887207, -0.005017995834350586, -0.004717230796813965, -0.004416465759277344, -0.004115700721740723, -0.0038149356842041016, -0.0035141706466674805, -0.0032134056091308594, -0.0029126405715942383, -0.002611875534057617, -0.002311110496520996, -0.002010345458984375, -0.001709580421447754, -0.0014088153839111328, -0.0011080503463745117, -0.0008072853088378906, -0.0005065202713012695, -0.00020575523376464844, 9.500980377197266e-05, 0.00039577484130859375, 0.0006965398788452148, 0.000997304916381836, 0.001298069953918457, 0.0015988349914550781, 0.0018996000289916992, 0.0022003650665283203, 0.0025011301040649414, 0.0028018951416015625, 0.0031026601791381836, 0.0034034252166748047, 0.0037041902542114258, 0.004004955291748047, 0.004305720329284668, 0.004606485366821289, 0.00490725040435791, 0.005208015441894531, 0.005508780479431152, 0.0058095455169677734, 0.0061103105545043945, 0.006411075592041016, 0.006711840629577637, 0.007012605667114258, 0.007313370704650879, 0.0076141357421875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 5.0, 11.0, 26.0, 18.0, 33.0, 76.0, 111.0, 197.0, 443.0, 1131.0, 3418.0, 16240.0, 221641.0, 757917.0, 38268.0, 6009.0, 1660.0, 695.0, 266.0, 157.0, 87.0, 52.0, 30.0, 25.0, 15.0, 9.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-55.40625, -53.7861328125, -52.166015625, -50.5458984375, -48.92578125, -47.3056640625, -45.685546875, -44.0654296875, -42.4453125, -40.8251953125, -39.205078125, -37.5849609375, -35.96484375, -34.3447265625, -32.724609375, -31.1044921875, -29.484375, -27.8642578125, -26.244140625, -24.6240234375, -23.00390625, -21.3837890625, -19.763671875, -18.1435546875, -16.5234375, -14.9033203125, -13.283203125, -11.6630859375, -10.04296875, -8.4228515625, -6.802734375, -5.1826171875, -3.5625, -1.9423828125, -0.322265625, 1.2978515625, 2.91796875, 4.5380859375, 6.158203125, 7.7783203125, 9.3984375, 11.0185546875, 12.638671875, 14.2587890625, 15.87890625, 17.4990234375, 19.119140625, 20.7392578125, 22.359375, 23.9794921875, 25.599609375, 27.2197265625, 28.83984375, 30.4599609375, 32.080078125, 33.7001953125, 35.3203125, 36.9404296875, 38.560546875, 40.1806640625, 41.80078125, 43.4208984375, 45.041015625, 46.6611328125, 48.28125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 1.0, 5.0, 9.0, 7.0, 8.0, 12.0, 19.0, 29.0, 22.0, 36.0, 40.0, 62.0, 49.0, 92.0, 100.0, 97.0, 77.0, 69.0, 67.0, 38.0, 29.0, 28.0, 20.0, 22.0, 12.0, 16.0, 7.0, 6.0, 2.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.109375, -23.212158203125, -22.31494140625, -21.417724609375, -20.5205078125, -19.623291015625, -18.72607421875, -17.828857421875, -16.931640625, -16.034423828125, -15.13720703125, -14.239990234375, -13.3427734375, -12.445556640625, -11.54833984375, -10.651123046875, -9.75390625, -8.856689453125, -7.95947265625, -7.062255859375, -6.1650390625, -5.267822265625, -4.37060546875, -3.473388671875, -2.576171875, -1.678955078125, -0.78173828125, 0.115478515625, 1.0126953125, 1.909912109375, 2.80712890625, 3.704345703125, 4.6015625, 5.498779296875, 6.39599609375, 7.293212890625, 8.1904296875, 9.087646484375, 9.98486328125, 10.882080078125, 11.779296875, 12.676513671875, 13.57373046875, 14.470947265625, 15.3681640625, 16.265380859375, 17.16259765625, 18.059814453125, 18.95703125, 19.854248046875, 20.75146484375, 21.648681640625, 22.5458984375, 23.443115234375, 24.34033203125, 25.237548828125, 26.134765625, 27.031982421875, 27.92919921875, 28.826416015625, 29.7236328125, 30.620849609375, 31.51806640625, 32.415283203125, 33.3125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 9.0, 4.0, 10.0, 25.0, 37.0, 78.0, 103.0, 133.0, 192.0, 136.0, 116.0, 62.0, 37.0, 19.0, 9.0, 7.0, 7.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-581.22021484375, -565.3141479492188, -549.4081420898438, -533.5020751953125, -517.5960083007812, -501.6899719238281, -485.783935546875, -469.87786865234375, -453.9718322753906, -438.0657958984375, -422.15972900390625, -406.2536926269531, -390.34765625, -374.44158935546875, -358.5355529785156, -342.6295166015625, -326.72344970703125, -310.8174133300781, -294.9113464355469, -279.00531005859375, -263.0992431640625, -247.19320678710938, -231.28717041015625, -215.38111877441406, -199.47506713867188, -183.5690155029297, -167.6629638671875, -151.75692749023438, -135.8508758544922, -119.94482421875, -104.03878021240234, -88.13273620605469, -72.22665405273438, -56.32060623168945, -40.41455841064453, -24.50851058959961, -8.602462768554688, 7.3035888671875, 23.209632873535156, 39.11567687988281, 55.021728515625, 70.92778015136719, 86.83382415771484, 102.7398681640625, 118.64591979980469, 134.55197143554688, 150.4580078125, 166.3640594482422, 182.27011108398438, 198.17616271972656, 214.08221435546875, 229.98825073242188, 245.89430236816406, 261.80035400390625, 277.7063903808594, 293.6124267578125, 309.51849365234375, 325.4245300292969, 341.3305969238281, 357.23663330078125, 373.1427001953125, 389.0487365722656, 404.95477294921875, 420.86083984375, 436.7668762207031]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 8.0, 5.0, 12.0, 19.0, 32.0, 23.0, 38.0, 41.0, 63.0, 58.0, 81.0, 97.0, 111.0, 86.0, 75.0, 57.0, 55.0, 36.0, 33.0, 26.0, 16.0, 12.0, 9.0, 5.0, 2.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-348.8760986328125, -330.5126037597656, -312.14910888671875, -293.78558349609375, -275.4220886230469, -257.05859375, -238.69508361816406, -220.33157348632812, -201.96807861328125, -183.60458374023438, -165.24107360839844, -146.8775634765625, -128.51406860351562, -110.15056610107422, -91.78706359863281, -73.42355346679688, -55.06005859375, -36.696556091308594, -18.333053588867188, 0.03044891357421875, 18.393951416015625, 36.75745391845703, 55.12095642089844, 73.48446655273438, 91.84796142578125, 110.21146392822266, 128.57496643066406, 146.9384765625, 165.30197143554688, 183.66546630859375, 202.0289764404297, 220.39248657226562, 238.7559814453125, 257.1194763183594, 275.48297119140625, 293.84649658203125, 312.2099914550781, 330.573486328125, 348.93701171875, 367.3005065917969, 385.66400146484375, 404.0274963378906, 422.3909912109375, 440.7545166015625, 459.1180114746094, 477.48150634765625, 495.84503173828125, 514.20849609375, 532.572021484375, 550.935546875, 569.2990112304688, 587.6625366210938, 606.0260009765625, 624.3895263671875, 642.7530517578125, 661.1165771484375, 679.4800415039062, 697.8435668945312, 716.20703125, 734.570556640625, 752.93408203125, 771.2975463867188, 789.6610717773438, 808.0245361328125, 826.3880615234375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 9.0, 11.0, 15.0, 22.0, 39.0, 42.0, 79.0, 114.0, 142.0, 218.0, 346.0, 586.0, 1021.0, 1730.0, 3235.0, 6401.0, 13707.0, 35138.0, 119550.0, 690551.0, 2489723.0, 658181.0, 115674.0, 33125.0, 12710.0, 5489.0, 2751.0, 1391.0, 840.0, 476.0, 319.0, 192.0, 123.0, 99.0, 70.0, 37.0, 28.0, 27.0, 16.0, 11.0, 7.0, 12.0, 4.0, 5.0, 2.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.609375, -24.710205078125, -23.81103515625, -22.911865234375, -22.0126953125, -21.113525390625, -20.21435546875, -19.315185546875, -18.416015625, -17.516845703125, -16.61767578125, -15.718505859375, -14.8193359375, -13.920166015625, -13.02099609375, -12.121826171875, -11.22265625, -10.323486328125, -9.42431640625, -8.525146484375, -7.6259765625, -6.726806640625, -5.82763671875, -4.928466796875, -4.029296875, -3.130126953125, -2.23095703125, -1.331787109375, -0.4326171875, 0.466552734375, 1.36572265625, 2.264892578125, 3.1640625, 4.063232421875, 4.96240234375, 5.861572265625, 6.7607421875, 7.659912109375, 8.55908203125, 9.458251953125, 10.357421875, 11.256591796875, 12.15576171875, 13.054931640625, 13.9541015625, 14.853271484375, 15.75244140625, 16.651611328125, 17.55078125, 18.449951171875, 19.34912109375, 20.248291015625, 21.1474609375, 22.046630859375, 22.94580078125, 23.844970703125, 24.744140625, 25.643310546875, 26.54248046875, 27.441650390625, 28.3408203125, 29.239990234375, 30.13916015625, 31.038330078125, 31.9375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 6.0, 16.0, 29.0, 66.0, 63.0, 108.0, 146.0, 166.0, 147.0, 102.0, 70.0, 55.0, 12.0, 8.0, 10.0, 0.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.5625, -24.9462890625, -23.330078125, -21.7138671875, -20.09765625, -18.4814453125, -16.865234375, -15.2490234375, -13.6328125, -12.0166015625, -10.400390625, -8.7841796875, -7.16796875, -5.5517578125, -3.935546875, -2.3193359375, -0.703125, 0.9130859375, 2.529296875, 4.1455078125, 5.76171875, 7.3779296875, 8.994140625, 10.6103515625, 12.2265625, 13.8427734375, 15.458984375, 17.0751953125, 18.69140625, 20.3076171875, 21.923828125, 23.5400390625, 25.15625, 26.7724609375, 28.388671875, 30.0048828125, 31.62109375, 33.2373046875, 34.853515625, 36.4697265625, 38.0859375, 39.7021484375, 41.318359375, 42.9345703125, 44.55078125, 46.1669921875, 47.783203125, 49.3994140625, 51.015625, 52.6318359375, 54.248046875, 55.8642578125, 57.48046875, 59.0966796875, 60.712890625, 62.3291015625, 63.9453125, 65.5615234375, 67.177734375, 68.7939453125, 70.41015625, 72.0263671875, 73.642578125, 75.2587890625, 76.875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 4.0, 10.0, 9.0, 16.0, 17.0, 40.0, 79.0, 93.0, 148.0, 276.0, 485.0, 986.0, 2127.0, 5675.0, 19282.0, 104835.0, 2070930.0, 1870441.0, 92691.0, 17025.0, 4920.0, 1994.0, 959.0, 513.0, 291.0, 169.0, 96.0, 51.0, 32.0, 35.0, 14.0, 10.0, 7.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-70.8125, -68.5986328125, -66.384765625, -64.1708984375, -61.95703125, -59.7431640625, -57.529296875, -55.3154296875, -53.1015625, -50.8876953125, -48.673828125, -46.4599609375, -44.24609375, -42.0322265625, -39.818359375, -37.6044921875, -35.390625, -33.1767578125, -30.962890625, -28.7490234375, -26.53515625, -24.3212890625, -22.107421875, -19.8935546875, -17.6796875, -15.4658203125, -13.251953125, -11.0380859375, -8.82421875, -6.6103515625, -4.396484375, -2.1826171875, 0.03125, 2.2451171875, 4.458984375, 6.6728515625, 8.88671875, 11.1005859375, 13.314453125, 15.5283203125, 17.7421875, 19.9560546875, 22.169921875, 24.3837890625, 26.59765625, 28.8115234375, 31.025390625, 33.2392578125, 35.453125, 37.6669921875, 39.880859375, 42.0947265625, 44.30859375, 46.5224609375, 48.736328125, 50.9501953125, 53.1640625, 55.3779296875, 57.591796875, 59.8056640625, 62.01953125, 64.2333984375, 66.447265625, 68.6611328125, 70.875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 2.0, 7.0, 4.0, 12.0, 20.0, 22.0, 38.0, 41.0, 51.0, 101.0, 166.0, 245.0, 466.0, 810.0, 886.0, 507.0, 282.0, 141.0, 84.0, 46.0, 38.0, 35.0, 20.0, 12.0, 11.0, 4.0, 5.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-81.9375, -79.3828125, -76.828125, -74.2734375, -71.71875, -69.1640625, -66.609375, -64.0546875, -61.5, -58.9453125, -56.390625, -53.8359375, -51.28125, -48.7265625, -46.171875, -43.6171875, -41.0625, -38.5078125, -35.953125, -33.3984375, -30.84375, -28.2890625, -25.734375, -23.1796875, -20.625, -18.0703125, -15.515625, -12.9609375, -10.40625, -7.8515625, -5.296875, -2.7421875, -0.1875, 2.3671875, 4.921875, 7.4765625, 10.03125, 12.5859375, 15.140625, 17.6953125, 20.25, 22.8046875, 25.359375, 27.9140625, 30.46875, 33.0234375, 35.578125, 38.1328125, 40.6875, 43.2421875, 45.796875, 48.3515625, 50.90625, 53.4609375, 56.015625, 58.5703125, 61.125, 63.6796875, 66.234375, 68.7890625, 71.34375, 73.8984375, 76.453125, 79.0078125, 81.5625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 1.0, 6.0, 16.0, 20.0, 62.0, 252.0, 443.0, 152.0, 34.0, 6.0, 9.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2344.88427734375, -2297.390869140625, -2249.8974609375, -2202.40380859375, -2154.910400390625, -2107.4169921875, -2059.923583984375, -2012.4300537109375, -1964.9365234375, -1917.443115234375, -1869.9495849609375, -1822.4561767578125, -1774.962646484375, -1727.46923828125, -1679.9757080078125, -1632.4822998046875, -1584.98876953125, -1537.495361328125, -1490.0018310546875, -1442.5084228515625, -1395.014892578125, -1347.521484375, -1300.0279541015625, -1252.5345458984375, -1205.0411376953125, -1157.5477294921875, -1110.05419921875, -1062.560791015625, -1015.0672607421875, -967.5737915039062, -920.080322265625, -872.5869140625, -825.0933837890625, -777.5999145507812, -730.1064453125, -682.6129760742188, -635.1195068359375, -587.6260375976562, -540.132568359375, -492.6391296386719, -445.1456604003906, -397.6521911621094, -350.1587219238281, -302.665283203125, -255.1717987060547, -207.67832946777344, -160.18487548828125, -112.69140625, -65.19793701171875, -17.704471588134766, 29.78899383544922, 77.28245544433594, 124.77592468261719, 172.26939392089844, 219.76284790039062, 267.2563171386719, 314.7497863769531, 362.2432556152344, 409.7367248535156, 457.23016357421875, 504.7236328125, 552.2171020507812, 599.7105712890625, 647.2040405273438, 694.697509765625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 7.0, 16.0, 10.0, 16.0, 29.0, 35.0, 40.0, 37.0, 68.0, 59.0, 77.0, 62.0, 78.0, 74.0, 83.0, 71.0, 58.0, 44.0, 30.0, 30.0, 23.0, 17.0, 15.0, 9.0, 6.0, 1.0, 7.0, 1.0, 2.0, 4.0], "bins": [-768.7218627929688, -752.0758056640625, -735.4297485351562, -718.78369140625, -702.1376342773438, -685.4915771484375, -668.8455810546875, -652.1995239257812, -635.553466796875, -618.9074096679688, -602.2613525390625, -585.6152954101562, -568.96923828125, -552.3232421875, -535.6771240234375, -519.0311279296875, -502.3850402832031, -485.7389831542969, -469.0929260253906, -452.4468994140625, -435.80084228515625, -419.15478515625, -402.50872802734375, -385.8626708984375, -369.21661376953125, -352.570556640625, -335.92449951171875, -319.2784423828125, -302.6324157714844, -285.9863586425781, -269.3403015136719, -252.69424438476562, -236.04818725585938, -219.40213012695312, -202.75608825683594, -186.1100311279297, -169.4639892578125, -152.81793212890625, -136.171875, -119.52582550048828, -102.87977600097656, -86.23372650146484, -69.58767700195312, -52.941619873046875, -36.295570373535156, -19.649520874023438, -3.0034637451171875, 13.642585754394531, 30.28863525390625, 46.93468475341797, 63.58073806762695, 80.22679138183594, 96.87284088134766, 113.51889038085938, 130.16494750976562, 146.81100463867188, 163.45704650878906, 180.1031036376953, 196.7491455078125, 213.39520263671875, 230.041259765625, 246.6873016357422, 263.3333740234375, 279.9794006347656, 296.6254577636719]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 9.0, 9.0, 18.0, 22.0, 46.0, 53.0, 75.0, 143.0, 210.0, 329.0, 432.0, 739.0, 1226.0, 1988.0, 3662.0, 6950.0, 13505.0, 27525.0, 61770.0, 157621.0, 397399.0, 223034.0, 80725.0, 35195.0, 16877.0, 8395.0, 4346.0, 2450.0, 1413.0, 843.0, 518.0, 335.0, 216.0, 147.0, 95.0, 77.0, 42.0, 31.0, 18.0, 17.0, 15.0, 12.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.78125, -36.548828125, -35.31640625, -34.083984375, -32.8515625, -31.619140625, -30.38671875, -29.154296875, -27.921875, -26.689453125, -25.45703125, -24.224609375, -22.9921875, -21.759765625, -20.52734375, -19.294921875, -18.0625, -16.830078125, -15.59765625, -14.365234375, -13.1328125, -11.900390625, -10.66796875, -9.435546875, -8.203125, -6.970703125, -5.73828125, -4.505859375, -3.2734375, -2.041015625, -0.80859375, 0.423828125, 1.65625, 2.888671875, 4.12109375, 5.353515625, 6.5859375, 7.818359375, 9.05078125, 10.283203125, 11.515625, 12.748046875, 13.98046875, 15.212890625, 16.4453125, 17.677734375, 18.91015625, 20.142578125, 21.375, 22.607421875, 23.83984375, 25.072265625, 26.3046875, 27.537109375, 28.76953125, 30.001953125, 31.234375, 32.466796875, 33.69921875, 34.931640625, 36.1640625, 37.396484375, 38.62890625, 39.861328125, 41.09375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 8.0, 10.0, 7.0, 11.0, 10.0, 13.0, 11.0, 16.0, 21.0, 21.0, 19.0, 32.0, 30.0, 32.0, 38.0, 30.0, 36.0, 40.0, 54.0, 50.0, 53.0, 57.0, 39.0, 46.0, 49.0, 38.0, 37.0, 38.0, 22.0, 21.0, 21.0, 21.0, 11.0, 12.0, 12.0, 5.0, 10.0, 5.0, 7.0, 1.0, 3.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.0, -19.40771484375, -18.8154296875, -18.22314453125, -17.630859375, -17.03857421875, -16.4462890625, -15.85400390625, -15.26171875, -14.66943359375, -14.0771484375, -13.48486328125, -12.892578125, -12.30029296875, -11.7080078125, -11.11572265625, -10.5234375, -9.93115234375, -9.3388671875, -8.74658203125, -8.154296875, -7.56201171875, -6.9697265625, -6.37744140625, -5.78515625, -5.19287109375, -4.6005859375, -4.00830078125, -3.416015625, -2.82373046875, -2.2314453125, -1.63916015625, -1.046875, -0.45458984375, 0.1376953125, 0.72998046875, 1.322265625, 1.91455078125, 2.5068359375, 3.09912109375, 3.69140625, 4.28369140625, 4.8759765625, 5.46826171875, 6.060546875, 6.65283203125, 7.2451171875, 7.83740234375, 8.4296875, 9.02197265625, 9.6142578125, 10.20654296875, 10.798828125, 11.39111328125, 11.9833984375, 12.57568359375, 13.16796875, 13.76025390625, 14.3525390625, 14.94482421875, 15.537109375, 16.12939453125, 16.7216796875, 17.31396484375, 17.90625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 7.0, 7.0, 17.0, 16.0, 26.0, 49.0, 99.0, 156.0, 289.0, 586.0, 1335.0, 4069.0, 21888.0, 820438.0, 184063.0, 10758.0, 2699.0, 1031.0, 430.0, 234.0, 135.0, 83.0, 42.0, 26.0, 29.0, 10.0, 20.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-223.875, -217.95703125, -212.0390625, -206.12109375, -200.203125, -194.28515625, -188.3671875, -182.44921875, -176.53125, -170.61328125, -164.6953125, -158.77734375, -152.859375, -146.94140625, -141.0234375, -135.10546875, -129.1875, -123.26953125, -117.3515625, -111.43359375, -105.515625, -99.59765625, -93.6796875, -87.76171875, -81.84375, -75.92578125, -70.0078125, -64.08984375, -58.171875, -52.25390625, -46.3359375, -40.41796875, -34.5, -28.58203125, -22.6640625, -16.74609375, -10.828125, -4.91015625, 1.0078125, 6.92578125, 12.84375, 18.76171875, 24.6796875, 30.59765625, 36.515625, 42.43359375, 48.3515625, 54.26953125, 60.1875, 66.10546875, 72.0234375, 77.94140625, 83.859375, 89.77734375, 95.6953125, 101.61328125, 107.53125, 113.44921875, 119.3671875, 125.28515625, 131.203125, 137.12109375, 143.0390625, 148.95703125, 154.875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 14.0, 12.0, 14.0, 34.0, 28.0, 30.0, 61.0, 66.0, 67.0, 82.0, 103.0, 88.0, 63.0, 92.0, 68.0, 49.0, 29.0, 22.0, 23.0, 11.0, 13.0, 13.0, 3.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.125, -111.7109375, -106.296875, -100.8828125, -95.46875, -90.0546875, -84.640625, -79.2265625, -73.8125, -68.3984375, -62.984375, -57.5703125, -52.15625, -46.7421875, -41.328125, -35.9140625, -30.5, -25.0859375, -19.671875, -14.2578125, -8.84375, -3.4296875, 1.984375, 7.3984375, 12.8125, 18.2265625, 23.640625, 29.0546875, 34.46875, 39.8828125, 45.296875, 50.7109375, 56.125, 61.5390625, 66.953125, 72.3671875, 77.78125, 83.1953125, 88.609375, 94.0234375, 99.4375, 104.8515625, 110.265625, 115.6796875, 121.09375, 126.5078125, 131.921875, 137.3359375, 142.75, 148.1640625, 153.578125, 158.9921875, 164.40625, 169.8203125, 175.234375, 180.6484375, 186.0625, 191.4765625, 196.890625, 202.3046875, 207.71875, 213.1328125, 218.546875, 223.9609375, 229.375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 5.0, 2.0, 9.0, 5.0, 12.0, 20.0, 22.0, 32.0, 34.0, 56.0, 109.0, 171.0, 298.0, 533.0, 1172.0, 2727.0, 7496.0, 28580.0, 156078.0, 707177.0, 111413.0, 21843.0, 6297.0, 2265.0, 1006.0, 506.0, 279.0, 144.0, 77.0, 52.0, 37.0, 25.0, 19.0, 12.0, 8.0, 6.0, 9.0, 7.0, 3.0, 7.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-28.984375, -27.998779296875, -27.01318359375, -26.027587890625, -25.0419921875, -24.056396484375, -23.07080078125, -22.085205078125, -21.099609375, -20.114013671875, -19.12841796875, -18.142822265625, -17.1572265625, -16.171630859375, -15.18603515625, -14.200439453125, -13.21484375, -12.229248046875, -11.24365234375, -10.258056640625, -9.2724609375, -8.286865234375, -7.30126953125, -6.315673828125, -5.330078125, -4.344482421875, -3.35888671875, -2.373291015625, -1.3876953125, -0.402099609375, 0.58349609375, 1.569091796875, 2.5546875, 3.540283203125, 4.52587890625, 5.511474609375, 6.4970703125, 7.482666015625, 8.46826171875, 9.453857421875, 10.439453125, 11.425048828125, 12.41064453125, 13.396240234375, 14.3818359375, 15.367431640625, 16.35302734375, 17.338623046875, 18.32421875, 19.309814453125, 20.29541015625, 21.281005859375, 22.2666015625, 23.252197265625, 24.23779296875, 25.223388671875, 26.208984375, 27.194580078125, 28.18017578125, 29.165771484375, 30.1513671875, 31.136962890625, 32.12255859375, 33.108154296875, 34.09375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 8.0, 7.0, 6.0, 15.0, 18.0, 19.0, 23.0, 28.0, 42.0, 40.0, 74.0, 87.0, 142.0, 129.0, 87.0, 57.0, 52.0, 33.0, 23.0, 30.0, 21.0, 17.0, 8.0, 12.0, 6.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0076446533203125, -0.007371306419372559, -0.007097959518432617, -0.006824612617492676, -0.006551265716552734, -0.006277918815612793, -0.0060045719146728516, -0.00573122501373291, -0.005457878112792969, -0.005184531211853027, -0.004911184310913086, -0.0046378374099731445, -0.004364490509033203, -0.004091143608093262, -0.0038177967071533203, -0.003544449806213379, -0.0032711029052734375, -0.002997756004333496, -0.0027244091033935547, -0.0024510622024536133, -0.002177715301513672, -0.0019043684005737305, -0.001631021499633789, -0.0013576745986938477, -0.0010843276977539062, -0.0008109807968139648, -0.0005376338958740234, -0.00026428699493408203, 9.059906005859375e-06, 0.0002824068069458008, 0.0005557537078857422, 0.0008291006088256836, 0.001102447509765625, 0.0013757944107055664, 0.0016491413116455078, 0.0019224882125854492, 0.0021958351135253906, 0.002469182014465332, 0.0027425289154052734, 0.003015875816345215, 0.0032892227172851562, 0.0035625696182250977, 0.003835916519165039, 0.0041092634201049805, 0.004382610321044922, 0.004655957221984863, 0.004929304122924805, 0.005202651023864746, 0.0054759979248046875, 0.005749344825744629, 0.00602269172668457, 0.006296038627624512, 0.006569385528564453, 0.0068427324295043945, 0.007116079330444336, 0.007389426231384277, 0.007662773132324219, 0.00793612003326416, 0.008209466934204102, 0.008482813835144043, 0.008756160736083984, 0.009029507637023926, 0.009302854537963867, 0.009576201438903809, 0.00984954833984375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 1.0, 4.0, 5.0, 11.0, 16.0, 28.0, 32.0, 43.0, 72.0, 98.0, 172.0, 334.0, 592.0, 1101.0, 2331.0, 5661.0, 23373.0, 192252.0, 731386.0, 71842.0, 11890.0, 3731.0, 1656.0, 790.0, 457.0, 257.0, 148.0, 105.0, 62.0, 31.0, 26.0, 22.0, 6.0, 7.0, 7.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-39.5, -38.440673828125, -37.38134765625, -36.322021484375, -35.2626953125, -34.203369140625, -33.14404296875, -32.084716796875, -31.025390625, -29.966064453125, -28.90673828125, -27.847412109375, -26.7880859375, -25.728759765625, -24.66943359375, -23.610107421875, -22.55078125, -21.491455078125, -20.43212890625, -19.372802734375, -18.3134765625, -17.254150390625, -16.19482421875, -15.135498046875, -14.076171875, -13.016845703125, -11.95751953125, -10.898193359375, -9.8388671875, -8.779541015625, -7.72021484375, -6.660888671875, -5.6015625, -4.542236328125, -3.48291015625, -2.423583984375, -1.3642578125, -0.304931640625, 0.75439453125, 1.813720703125, 2.873046875, 3.932373046875, 4.99169921875, 6.051025390625, 7.1103515625, 8.169677734375, 9.22900390625, 10.288330078125, 11.34765625, 12.406982421875, 13.46630859375, 14.525634765625, 15.5849609375, 16.644287109375, 17.70361328125, 18.762939453125, 19.822265625, 20.881591796875, 21.94091796875, 23.000244140625, 24.0595703125, 25.118896484375, 26.17822265625, 27.237548828125, 28.296875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 9.0, 7.0, 8.0, 17.0, 18.0, 15.0, 26.0, 30.0, 32.0, 30.0, 42.0, 46.0, 60.0, 66.0, 65.0, 82.0, 62.0, 65.0, 67.0, 38.0, 38.0, 26.0, 31.0, 20.0, 23.0, 22.0, 10.0, 5.0, 9.0, 3.0, 3.0, 5.0, 2.0, 6.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.859375, -21.054931640625, -20.25048828125, -19.446044921875, -18.6416015625, -17.837158203125, -17.03271484375, -16.228271484375, -15.423828125, -14.619384765625, -13.81494140625, -13.010498046875, -12.2060546875, -11.401611328125, -10.59716796875, -9.792724609375, -8.98828125, -8.183837890625, -7.37939453125, -6.574951171875, -5.7705078125, -4.966064453125, -4.16162109375, -3.357177734375, -2.552734375, -1.748291015625, -0.94384765625, -0.139404296875, 0.6650390625, 1.469482421875, 2.27392578125, 3.078369140625, 3.8828125, 4.687255859375, 5.49169921875, 6.296142578125, 7.1005859375, 7.905029296875, 8.70947265625, 9.513916015625, 10.318359375, 11.122802734375, 11.92724609375, 12.731689453125, 13.5361328125, 14.340576171875, 15.14501953125, 15.949462890625, 16.75390625, 17.558349609375, 18.36279296875, 19.167236328125, 19.9716796875, 20.776123046875, 21.58056640625, 22.385009765625, 23.189453125, 23.993896484375, 24.79833984375, 25.602783203125, 26.4072265625, 27.211669921875, 28.01611328125, 28.820556640625, 29.625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 4.0, 8.0, 19.0, 22.0, 46.0, 91.0, 154.0, 277.0, 192.0, 89.0, 46.0, 26.0, 11.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1310.2720947265625, -1283.4244384765625, -1256.57666015625, -1229.72900390625, -1202.88134765625, -1176.03369140625, -1149.1859130859375, -1122.3382568359375, -1095.4906005859375, -1068.6429443359375, -1041.795166015625, -1014.947509765625, -988.099853515625, -961.2521362304688, -934.4044799804688, -907.5567626953125, -880.7091064453125, -853.8613891601562, -827.0137329101562, -800.166015625, -773.318359375, -746.4706420898438, -719.6229858398438, -692.7752685546875, -665.9275512695312, -639.079833984375, -612.232177734375, -585.3844604492188, -558.5368041992188, -531.6890869140625, -504.8414306640625, -477.99371337890625, -451.14605712890625, -424.2983703613281, -397.45068359375, -370.6029968261719, -343.75531005859375, -316.9075927734375, -290.0599365234375, -263.21221923828125, -236.3645477294922, -209.51686096191406, -182.66917419433594, -155.82147216796875, -128.97378540039062, -102.1260986328125, -75.27841186523438, -48.43072509765625, -21.583038330078125, 5.264650344848633, 32.11233901977539, 58.96002960205078, 85.8077163696289, 112.65541076660156, 139.5030975341797, 166.3507843017578, 193.19847106933594, 220.04615783691406, 246.8938446044922, 273.7415466308594, 300.5892333984375, 327.4369201660156, 354.28460693359375, 381.1322937011719, 407.97998046875]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 4.0, 12.0, 6.0, 6.0, 10.0, 8.0, 11.0, 9.0, 18.0, 19.0, 23.0, 23.0, 27.0, 27.0, 45.0, 41.0, 38.0, 63.0, 69.0, 71.0, 59.0, 51.0, 52.0, 39.0, 36.0, 22.0, 28.0, 21.0, 10.0, 23.0, 17.0, 15.0, 14.0, 12.0, 13.0, 12.0, 11.0, 11.0, 3.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-369.5523681640625, -358.8501281738281, -348.14788818359375, -337.4456481933594, -326.743408203125, -316.0411682128906, -305.33892822265625, -294.6366882324219, -283.9344482421875, -273.2322082519531, -262.52996826171875, -251.82772827148438, -241.12548828125, -230.42324829101562, -219.72100830078125, -209.01876831054688, -198.31651306152344, -187.61427307128906, -176.9120330810547, -166.2097930908203, -155.50755310058594, -144.80531311035156, -134.10305786132812, -123.40082550048828, -112.6985855102539, -101.99634552001953, -91.29410552978516, -80.59185791015625, -69.88961791992188, -59.187381744384766, -48.485137939453125, -37.78289794921875, -27.080657958984375, -16.37841796875, -5.676176071166992, 5.026065826416016, 15.72830581665039, 26.430545806884766, 37.132789611816406, 47.83502960205078, 58.537269592285156, 69.23950958251953, 79.9417495727539, 90.64399719238281, 101.34623718261719, 112.04847717285156, 122.75071716308594, 133.4529571533203, 144.1551971435547, 154.85743713378906, 165.55967712402344, 176.2619171142578, 186.9641571044922, 197.66639709472656, 208.36865234375, 219.07089233398438, 229.77313232421875, 240.47537231445312, 251.1776123046875, 261.8798522949219, 272.58209228515625, 283.2843322753906, 293.986572265625, 304.6888122558594, 315.39105224609375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 6.0, 13.0, 21.0, 27.0, 32.0, 48.0, 88.0, 142.0, 229.0, 439.0, 718.0, 1244.0, 2454.0, 4925.0, 10668.0, 25374.0, 74736.0, 320955.0, 1724673.0, 1609009.0, 297837.0, 73443.0, 25463.0, 10979.0, 5045.0, 2519.0, 1326.0, 761.0, 432.0, 248.0, 137.0, 107.0, 75.0, 37.0, 26.0, 17.0, 13.0, 6.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.21875, -23.383056640625, -22.54736328125, -21.711669921875, -20.8759765625, -20.040283203125, -19.20458984375, -18.368896484375, -17.533203125, -16.697509765625, -15.86181640625, -15.026123046875, -14.1904296875, -13.354736328125, -12.51904296875, -11.683349609375, -10.84765625, -10.011962890625, -9.17626953125, -8.340576171875, -7.5048828125, -6.669189453125, -5.83349609375, -4.997802734375, -4.162109375, -3.326416015625, -2.49072265625, -1.655029296875, -0.8193359375, 0.016357421875, 0.85205078125, 1.687744140625, 2.5234375, 3.359130859375, 4.19482421875, 5.030517578125, 5.8662109375, 6.701904296875, 7.53759765625, 8.373291015625, 9.208984375, 10.044677734375, 10.88037109375, 11.716064453125, 12.5517578125, 13.387451171875, 14.22314453125, 15.058837890625, 15.89453125, 16.730224609375, 17.56591796875, 18.401611328125, 19.2373046875, 20.072998046875, 20.90869140625, 21.744384765625, 22.580078125, 23.415771484375, 24.25146484375, 25.087158203125, 25.9228515625, 26.758544921875, 27.59423828125, 28.429931640625, 29.265625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 12.0, 7.0, 6.0, 10.0, 14.0, 19.0, 29.0, 26.0, 30.0, 42.0, 40.0, 52.0, 52.0, 61.0, 54.0, 70.0, 43.0, 52.0, 56.0, 62.0, 41.0, 35.0, 36.0, 26.0, 35.0, 15.0, 17.0, 21.0, 11.0, 3.0, 6.0, 5.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-29.15625, -28.43408203125, -27.7119140625, -26.98974609375, -26.267578125, -25.54541015625, -24.8232421875, -24.10107421875, -23.37890625, -22.65673828125, -21.9345703125, -21.21240234375, -20.490234375, -19.76806640625, -19.0458984375, -18.32373046875, -17.6015625, -16.87939453125, -16.1572265625, -15.43505859375, -14.712890625, -13.99072265625, -13.2685546875, -12.54638671875, -11.82421875, -11.10205078125, -10.3798828125, -9.65771484375, -8.935546875, -8.21337890625, -7.4912109375, -6.76904296875, -6.046875, -5.32470703125, -4.6025390625, -3.88037109375, -3.158203125, -2.43603515625, -1.7138671875, -0.99169921875, -0.26953125, 0.45263671875, 1.1748046875, 1.89697265625, 2.619140625, 3.34130859375, 4.0634765625, 4.78564453125, 5.5078125, 6.22998046875, 6.9521484375, 7.67431640625, 8.396484375, 9.11865234375, 9.8408203125, 10.56298828125, 11.28515625, 12.00732421875, 12.7294921875, 13.45166015625, 14.173828125, 14.89599609375, 15.6181640625, 16.34033203125, 17.0625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 3.0, 5.0, 5.0, 10.0, 15.0, 22.0, 28.0, 44.0, 55.0, 73.0, 144.0, 195.0, 393.0, 643.0, 1219.0, 2602.0, 6076.0, 18402.0, 77119.0, 687221.0, 3048363.0, 281304.0, 48537.0, 13102.0, 4454.0, 1977.0, 938.0, 508.0, 309.0, 165.0, 118.0, 83.0, 39.0, 32.0, 18.0, 13.0, 14.0, 7.0, 9.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-58.15625, -56.23876953125, -54.3212890625, -52.40380859375, -50.486328125, -48.56884765625, -46.6513671875, -44.73388671875, -42.81640625, -40.89892578125, -38.9814453125, -37.06396484375, -35.146484375, -33.22900390625, -31.3115234375, -29.39404296875, -27.4765625, -25.55908203125, -23.6416015625, -21.72412109375, -19.806640625, -17.88916015625, -15.9716796875, -14.05419921875, -12.13671875, -10.21923828125, -8.3017578125, -6.38427734375, -4.466796875, -2.54931640625, -0.6318359375, 1.28564453125, 3.203125, 5.12060546875, 7.0380859375, 8.95556640625, 10.873046875, 12.79052734375, 14.7080078125, 16.62548828125, 18.54296875, 20.46044921875, 22.3779296875, 24.29541015625, 26.212890625, 28.13037109375, 30.0478515625, 31.96533203125, 33.8828125, 35.80029296875, 37.7177734375, 39.63525390625, 41.552734375, 43.47021484375, 45.3876953125, 47.30517578125, 49.22265625, 51.14013671875, 53.0576171875, 54.97509765625, 56.892578125, 58.81005859375, 60.7275390625, 62.64501953125, 64.5625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 8.0, 6.0, 11.0, 20.0, 27.0, 49.0, 54.0, 101.0, 190.0, 366.0, 704.0, 897.0, 693.0, 383.0, 186.0, 116.0, 87.0, 54.0, 42.0, 21.0, 14.0, 14.0, 6.0, 10.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.375, -88.48046875, -85.5859375, -82.69140625, -79.796875, -76.90234375, -74.0078125, -71.11328125, -68.21875, -65.32421875, -62.4296875, -59.53515625, -56.640625, -53.74609375, -50.8515625, -47.95703125, -45.0625, -42.16796875, -39.2734375, -36.37890625, -33.484375, -30.58984375, -27.6953125, -24.80078125, -21.90625, -19.01171875, -16.1171875, -13.22265625, -10.328125, -7.43359375, -4.5390625, -1.64453125, 1.25, 4.14453125, 7.0390625, 9.93359375, 12.828125, 15.72265625, 18.6171875, 21.51171875, 24.40625, 27.30078125, 30.1953125, 33.08984375, 35.984375, 38.87890625, 41.7734375, 44.66796875, 47.5625, 50.45703125, 53.3515625, 56.24609375, 59.140625, 62.03515625, 64.9296875, 67.82421875, 70.71875, 73.61328125, 76.5078125, 79.40234375, 82.296875, 85.19140625, 88.0859375, 90.98046875, 93.875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 6.0, 18.0, 82.0, 389.0, 379.0, 95.0, 16.0, 5.0, 5.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2836.4833984375, -2778.592529296875, -2720.701904296875, -2662.81103515625, -2604.920166015625, -2547.029541015625, -2489.138671875, -2431.247802734375, -2373.357177734375, -2315.46630859375, -2257.57568359375, -2199.684814453125, -2141.7939453125, -2083.9033203125, -2026.012451171875, -1968.1217041015625, -1910.2308349609375, -1852.340087890625, -1794.44921875, -1736.5584716796875, -1678.667724609375, -1620.77685546875, -1562.8861083984375, -1504.995361328125, -1447.1044921875, -1389.2137451171875, -1331.3228759765625, -1273.43212890625, -1215.5413818359375, -1157.650634765625, -1099.759765625, -1041.8690185546875, -983.9781494140625, -926.0873413085938, -868.1965942382812, -810.3057861328125, -752.4150390625, -694.5242309570312, -636.6334228515625, -578.74267578125, -520.8518676757812, -462.9610900878906, -405.0703125, -347.17950439453125, -289.2887268066406, -231.39794921875, -173.50714111328125, -115.61636352539062, -57.7255859375, 0.16519927978515625, 58.05598449707031, 115.94677734375, 173.83755493164062, 231.72833251953125, 289.619140625, 347.5099182128906, 405.40069580078125, 463.2914733886719, 521.1822509765625, 579.0730590820312, 636.9638671875, 694.8546142578125, 752.7454223632812, 810.63623046875, 868.5269775390625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 11.0, 9.0, 17.0, 17.0, 17.0, 29.0, 35.0, 24.0, 43.0, 38.0, 45.0, 51.0, 49.0, 56.0, 61.0, 61.0, 65.0, 52.0, 51.0, 40.0, 32.0, 41.0, 28.0, 21.0, 23.0, 15.0, 15.0, 11.0, 8.0, 10.0, 2.0, 8.0, 5.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-501.9755859375, -489.1772155761719, -476.3788757324219, -463.58050537109375, -450.78216552734375, -437.9837951660156, -425.1854248046875, -412.3870849609375, -399.5887451171875, -386.7903747558594, -373.9920349121094, -361.19366455078125, -348.39532470703125, -335.5969543457031, -322.798583984375, -310.000244140625, -297.2018737792969, -284.40350341796875, -271.60516357421875, -258.8067932128906, -246.00845336914062, -233.2100830078125, -220.41172790527344, -207.61337280273438, -194.8150177001953, -182.01666259765625, -169.2183074951172, -156.41995239257812, -143.62158203125, -130.8232421875, -118.02487182617188, -105.22651672363281, -92.42816162109375, -79.62980651855469, -66.83145141601562, -54.03308868408203, -41.23473358154297, -28.436378479003906, -15.638015747070312, -2.83966064453125, 9.958694458007812, 22.757051467895508, 35.5554084777832, 48.35376739501953, 61.152122497558594, 73.95047760009766, 86.74884033203125, 99.54719543457031, 112.34555053710938, 125.14390563964844, 137.9422607421875, 150.74063110351562, 163.53897094726562, 176.33734130859375, 189.1356964111328, 201.93405151367188, 214.73240661621094, 227.53076171875, 240.32911682128906, 253.12747192382812, 265.92584228515625, 278.72418212890625, 291.5225524902344, 304.3209228515625, 317.1192626953125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 7.0, 4.0, 10.0, 10.0, 16.0, 26.0, 31.0, 56.0, 67.0, 87.0, 141.0, 201.0, 310.0, 452.0, 708.0, 1110.0, 1916.0, 3214.0, 5941.0, 11975.0, 26634.0, 71570.0, 245060.0, 436232.0, 153206.0, 49025.0, 19795.0, 9087.0, 4660.0, 2642.0, 1579.0, 980.0, 590.0, 405.0, 276.0, 156.0, 122.0, 82.0, 52.0, 33.0, 34.0, 23.0, 17.0, 8.0, 6.0, 4.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.375, -36.05517578125, -34.7353515625, -33.41552734375, -32.095703125, -30.77587890625, -29.4560546875, -28.13623046875, -26.81640625, -25.49658203125, -24.1767578125, -22.85693359375, -21.537109375, -20.21728515625, -18.8974609375, -17.57763671875, -16.2578125, -14.93798828125, -13.6181640625, -12.29833984375, -10.978515625, -9.65869140625, -8.3388671875, -7.01904296875, -5.69921875, -4.37939453125, -3.0595703125, -1.73974609375, -0.419921875, 0.89990234375, 2.2197265625, 3.53955078125, 4.859375, 6.17919921875, 7.4990234375, 8.81884765625, 10.138671875, 11.45849609375, 12.7783203125, 14.09814453125, 15.41796875, 16.73779296875, 18.0576171875, 19.37744140625, 20.697265625, 22.01708984375, 23.3369140625, 24.65673828125, 25.9765625, 27.29638671875, 28.6162109375, 29.93603515625, 31.255859375, 32.57568359375, 33.8955078125, 35.21533203125, 36.53515625, 37.85498046875, 39.1748046875, 40.49462890625, 41.814453125, 43.13427734375, 44.4541015625, 45.77392578125, 47.09375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 7.0, 3.0, 3.0, 8.0, 6.0, 13.0, 6.0, 7.0, 9.0, 11.0, 17.0, 17.0, 15.0, 26.0, 26.0, 32.0, 31.0, 33.0, 39.0, 49.0, 29.0, 41.0, 30.0, 39.0, 49.0, 43.0, 39.0, 36.0, 42.0, 33.0, 30.0, 21.0, 28.0, 31.0, 32.0, 20.0, 20.0, 22.0, 14.0, 11.0, 2.0, 7.0, 5.0, 5.0, 3.0, 4.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.15625, -18.5546875, -17.953125, -17.3515625, -16.75, -16.1484375, -15.546875, -14.9453125, -14.34375, -13.7421875, -13.140625, -12.5390625, -11.9375, -11.3359375, -10.734375, -10.1328125, -9.53125, -8.9296875, -8.328125, -7.7265625, -7.125, -6.5234375, -5.921875, -5.3203125, -4.71875, -4.1171875, -3.515625, -2.9140625, -2.3125, -1.7109375, -1.109375, -0.5078125, 0.09375, 0.6953125, 1.296875, 1.8984375, 2.5, 3.1015625, 3.703125, 4.3046875, 4.90625, 5.5078125, 6.109375, 6.7109375, 7.3125, 7.9140625, 8.515625, 9.1171875, 9.71875, 10.3203125, 10.921875, 11.5234375, 12.125, 12.7265625, 13.328125, 13.9296875, 14.53125, 15.1328125, 15.734375, 16.3359375, 16.9375, 17.5390625, 18.140625, 18.7421875, 19.34375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 9.0, 10.0, 14.0, 21.0, 36.0, 37.0, 50.0, 77.0, 151.0, 228.0, 423.0, 791.0, 1729.0, 4856.0, 21963.0, 345966.0, 635447.0, 27134.0, 5635.0, 1913.0, 906.0, 471.0, 248.0, 143.0, 89.0, 66.0, 38.0, 28.0, 22.0, 9.0, 6.0, 12.0, 9.0, 4.0, 1.0, 2.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.1875, -104.3310546875, -100.474609375, -96.6181640625, -92.76171875, -88.9052734375, -85.048828125, -81.1923828125, -77.3359375, -73.4794921875, -69.623046875, -65.7666015625, -61.91015625, -58.0537109375, -54.197265625, -50.3408203125, -46.484375, -42.6279296875, -38.771484375, -34.9150390625, -31.05859375, -27.2021484375, -23.345703125, -19.4892578125, -15.6328125, -11.7763671875, -7.919921875, -4.0634765625, -0.20703125, 3.6494140625, 7.505859375, 11.3623046875, 15.21875, 19.0751953125, 22.931640625, 26.7880859375, 30.64453125, 34.5009765625, 38.357421875, 42.2138671875, 46.0703125, 49.9267578125, 53.783203125, 57.6396484375, 61.49609375, 65.3525390625, 69.208984375, 73.0654296875, 76.921875, 80.7783203125, 84.634765625, 88.4912109375, 92.34765625, 96.2041015625, 100.060546875, 103.9169921875, 107.7734375, 111.6298828125, 115.486328125, 119.3427734375, 123.19921875, 127.0556640625, 130.912109375, 134.7685546875, 138.625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 8.0, 4.0, 5.0, 14.0, 12.0, 19.0, 18.0, 24.0, 34.0, 43.0, 67.0, 64.0, 73.0, 86.0, 78.0, 83.0, 59.0, 48.0, 52.0, 52.0, 54.0, 37.0, 28.0, 18.0, 7.0, 8.0, 6.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.9375, -102.3447265625, -97.751953125, -93.1591796875, -88.56640625, -83.9736328125, -79.380859375, -74.7880859375, -70.1953125, -65.6025390625, -61.009765625, -56.4169921875, -51.82421875, -47.2314453125, -42.638671875, -38.0458984375, -33.453125, -28.8603515625, -24.267578125, -19.6748046875, -15.08203125, -10.4892578125, -5.896484375, -1.3037109375, 3.2890625, 7.8818359375, 12.474609375, 17.0673828125, 21.66015625, 26.2529296875, 30.845703125, 35.4384765625, 40.03125, 44.6240234375, 49.216796875, 53.8095703125, 58.40234375, 62.9951171875, 67.587890625, 72.1806640625, 76.7734375, 81.3662109375, 85.958984375, 90.5517578125, 95.14453125, 99.7373046875, 104.330078125, 108.9228515625, 113.515625, 118.1083984375, 122.701171875, 127.2939453125, 131.88671875, 136.4794921875, 141.072265625, 145.6650390625, 150.2578125, 154.8505859375, 159.443359375, 164.0361328125, 168.62890625, 173.2216796875, 177.814453125, 182.4072265625, 187.0]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 11.0, 11.0, 21.0, 30.0, 68.0, 130.0, 226.0, 549.0, 1550.0, 5965.0, 33554.0, 408036.0, 553649.0, 35670.0, 6294.0, 1689.0, 577.0, 261.0, 114.0, 64.0, 41.0, 14.0, 11.0, 7.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-42.1875, -40.90966796875, -39.6318359375, -38.35400390625, -37.076171875, -35.79833984375, -34.5205078125, -33.24267578125, -31.96484375, -30.68701171875, -29.4091796875, -28.13134765625, -26.853515625, -25.57568359375, -24.2978515625, -23.02001953125, -21.7421875, -20.46435546875, -19.1865234375, -17.90869140625, -16.630859375, -15.35302734375, -14.0751953125, -12.79736328125, -11.51953125, -10.24169921875, -8.9638671875, -7.68603515625, -6.408203125, -5.13037109375, -3.8525390625, -2.57470703125, -1.296875, -0.01904296875, 1.2587890625, 2.53662109375, 3.814453125, 5.09228515625, 6.3701171875, 7.64794921875, 8.92578125, 10.20361328125, 11.4814453125, 12.75927734375, 14.037109375, 15.31494140625, 16.5927734375, 17.87060546875, 19.1484375, 20.42626953125, 21.7041015625, 22.98193359375, 24.259765625, 25.53759765625, 26.8154296875, 28.09326171875, 29.37109375, 30.64892578125, 31.9267578125, 33.20458984375, 34.482421875, 35.76025390625, 37.0380859375, 38.31591796875, 39.59375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 6.0, 7.0, 7.0, 11.0, 10.0, 18.0, 25.0, 30.0, 43.0, 66.0, 106.0, 116.0, 119.0, 114.0, 79.0, 59.0, 42.0, 28.0, 26.0, 19.0, 18.0, 6.0, 10.0, 8.0, 4.0, 7.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0094451904296875, -0.009199023246765137, -0.008952856063842773, -0.00870668888092041, -0.008460521697998047, -0.008214354515075684, -0.00796818733215332, -0.007722020149230957, -0.007475852966308594, -0.0072296857833862305, -0.006983518600463867, -0.006737351417541504, -0.006491184234619141, -0.006245017051696777, -0.005998849868774414, -0.005752682685852051, -0.0055065155029296875, -0.005260348320007324, -0.005014181137084961, -0.004768013954162598, -0.004521846771240234, -0.004275679588317871, -0.004029512405395508, -0.0037833452224731445, -0.0035371780395507812, -0.003291010856628418, -0.0030448436737060547, -0.0027986764907836914, -0.002552509307861328, -0.002306342124938965, -0.0020601749420166016, -0.0018140077590942383, -0.001567840576171875, -0.0013216733932495117, -0.0010755062103271484, -0.0008293390274047852, -0.0005831718444824219, -0.0003370046615600586, -9.083747863769531e-05, 0.00015532970428466797, 0.00040149688720703125, 0.0006476640701293945, 0.0008938312530517578, 0.001139998435974121, 0.0013861656188964844, 0.0016323328018188477, 0.001878499984741211, 0.0021246671676635742, 0.0023708343505859375, 0.0026170015335083008, 0.002863168716430664, 0.0031093358993530273, 0.0033555030822753906, 0.003601670265197754, 0.003847837448120117, 0.0040940046310424805, 0.004340171813964844, 0.004586338996887207, 0.00483250617980957, 0.005078673362731934, 0.005324840545654297, 0.00557100772857666, 0.0058171749114990234, 0.006063342094421387, 0.00630950927734375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 11.0, 20.0, 25.0, 25.0, 52.0, 74.0, 127.0, 205.0, 348.0, 628.0, 1259.0, 2901.0, 8573.0, 37038.0, 286034.0, 628667.0, 63145.0, 12186.0, 3839.0, 1553.0, 759.0, 421.0, 245.0, 137.0, 99.0, 54.0, 43.0, 20.0, 25.0, 6.0, 9.0, 8.0, 1.0, 7.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.328125, -29.4130859375, -28.498046875, -27.5830078125, -26.66796875, -25.7529296875, -24.837890625, -23.9228515625, -23.0078125, -22.0927734375, -21.177734375, -20.2626953125, -19.34765625, -18.4326171875, -17.517578125, -16.6025390625, -15.6875, -14.7724609375, -13.857421875, -12.9423828125, -12.02734375, -11.1123046875, -10.197265625, -9.2822265625, -8.3671875, -7.4521484375, -6.537109375, -5.6220703125, -4.70703125, -3.7919921875, -2.876953125, -1.9619140625, -1.046875, -0.1318359375, 0.783203125, 1.6982421875, 2.61328125, 3.5283203125, 4.443359375, 5.3583984375, 6.2734375, 7.1884765625, 8.103515625, 9.0185546875, 9.93359375, 10.8486328125, 11.763671875, 12.6787109375, 13.59375, 14.5087890625, 15.423828125, 16.3388671875, 17.25390625, 18.1689453125, 19.083984375, 19.9990234375, 20.9140625, 21.8291015625, 22.744140625, 23.6591796875, 24.57421875, 25.4892578125, 26.404296875, 27.3193359375, 28.234375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 2.0, 4.0, 1.0, 4.0, 5.0, 13.0, 7.0, 9.0, 11.0, 20.0, 20.0, 28.0, 35.0, 44.0, 51.0, 51.0, 87.0, 70.0, 103.0, 83.0, 66.0, 62.0, 41.0, 38.0, 43.0, 17.0, 15.0, 12.0, 12.0, 8.0, 8.0, 8.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-22.703125, -21.979736328125, -21.25634765625, -20.532958984375, -19.8095703125, -19.086181640625, -18.36279296875, -17.639404296875, -16.916015625, -16.192626953125, -15.46923828125, -14.745849609375, -14.0224609375, -13.299072265625, -12.57568359375, -11.852294921875, -11.12890625, -10.405517578125, -9.68212890625, -8.958740234375, -8.2353515625, -7.511962890625, -6.78857421875, -6.065185546875, -5.341796875, -4.618408203125, -3.89501953125, -3.171630859375, -2.4482421875, -1.724853515625, -1.00146484375, -0.278076171875, 0.4453125, 1.168701171875, 1.89208984375, 2.615478515625, 3.3388671875, 4.062255859375, 4.78564453125, 5.509033203125, 6.232421875, 6.955810546875, 7.67919921875, 8.402587890625, 9.1259765625, 9.849365234375, 10.57275390625, 11.296142578125, 12.01953125, 12.742919921875, 13.46630859375, 14.189697265625, 14.9130859375, 15.636474609375, 16.35986328125, 17.083251953125, 17.806640625, 18.530029296875, 19.25341796875, 19.976806640625, 20.7001953125, 21.423583984375, 22.14697265625, 22.870361328125, 23.59375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 13.0, 7.0, 18.0, 27.0, 61.0, 97.0, 211.0, 250.0, 143.0, 74.0, 46.0, 14.0, 8.0, 9.0, 5.0, 7.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-489.26275634765625, -468.1206359863281, -446.978515625, -425.83642578125, -404.6943054199219, -383.55218505859375, -362.41009521484375, -341.2679748535156, -320.1258544921875, -298.9837341308594, -277.84161376953125, -256.69952392578125, -235.55740356445312, -214.415283203125, -193.27317810058594, -172.13107299804688, -150.98895263671875, -129.84683227539062, -108.70472717285156, -87.56261444091797, -66.42050170898438, -45.27838897705078, -24.136276245117188, -2.994171142578125, 18.14794921875, 39.290061950683594, 60.43217468261719, 81.57428741455078, 102.71640014648438, 123.85851287841797, 145.00062561035156, 166.14273071289062, 187.2847900390625, 208.42691040039062, 229.5690155029297, 250.71112060546875, 271.8532409667969, 292.995361328125, 314.137451171875, 335.2795715332031, 356.42169189453125, 377.5638122558594, 398.7059326171875, 419.8480224609375, 440.9901428222656, 462.13226318359375, 483.27435302734375, 504.4164733886719, 525.55859375, 546.70068359375, 567.8428344726562, 588.9849243164062, 610.1270751953125, 631.2691650390625, 652.4112548828125, 673.5533447265625, 694.6954956054688, 715.8375854492188, 736.979736328125, 758.121826171875, 779.263916015625, 800.4060668945312, 821.5481567382812, 842.6903076171875, 863.8323974609375]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 4.0, 15.0, 9.0, 11.0, 15.0, 19.0, 21.0, 30.0, 32.0, 32.0, 32.0, 45.0, 38.0, 61.0, 73.0, 87.0, 70.0, 63.0, 45.0, 49.0, 47.0, 31.0, 22.0, 27.0, 23.0, 18.0, 17.0, 13.0, 8.0, 8.0, 5.0, 8.0, 5.0, 2.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-465.87408447265625, -452.03192138671875, -438.1897277832031, -424.3475646972656, -410.50537109375, -396.6632080078125, -382.821044921875, -368.9788513183594, -355.13665771484375, -341.29449462890625, -327.4523010253906, -313.6101379394531, -299.7679443359375, -285.92578125, -272.0836181640625, -258.2414245605469, -244.39926147460938, -230.5570831298828, -216.71490478515625, -202.87274169921875, -189.03054809570312, -175.18838500976562, -161.34620666503906, -147.5040283203125, -133.66184997558594, -119.81967163085938, -105.97749328613281, -92.13532257080078, -78.29314422607422, -64.45096588134766, -50.608795166015625, -36.76661682128906, -22.9244384765625, -9.08226203918457, 4.759914398193359, 18.602088928222656, 32.44426727294922, 46.28644561767578, 60.12861633300781, 73.97079467773438, 87.81297302246094, 101.6551513671875, 115.49732971191406, 129.33950805664062, 143.18167114257812, 157.02386474609375, 170.86602783203125, 184.7082061767578, 198.55038452148438, 212.39256286621094, 226.2347412109375, 240.076904296875, 253.91909790039062, 267.7612609863281, 281.60345458984375, 295.44561767578125, 309.28778076171875, 323.12994384765625, 336.9721374511719, 350.8143005371094, 364.656494140625, 378.4986572265625, 392.3408203125, 406.1830139160156, 420.02520751953125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 8.0, 6.0, 1.0, 8.0, 7.0, 11.0, 33.0, 38.0, 62.0, 78.0, 153.0, 263.0, 410.0, 748.0, 1541.0, 3086.0, 7211.0, 19071.0, 67473.0, 382478.0, 2269677.0, 1215356.0, 166475.0, 37190.0, 12688.0, 5197.0, 2392.0, 1170.0, 622.0, 354.0, 182.0, 118.0, 57.0, 56.0, 21.0, 21.0, 10.0, 6.0, 5.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.875, -32.901123046875, -31.92724609375, -30.953369140625, -29.9794921875, -29.005615234375, -28.03173828125, -27.057861328125, -26.083984375, -25.110107421875, -24.13623046875, -23.162353515625, -22.1884765625, -21.214599609375, -20.24072265625, -19.266845703125, -18.29296875, -17.319091796875, -16.34521484375, -15.371337890625, -14.3974609375, -13.423583984375, -12.44970703125, -11.475830078125, -10.501953125, -9.528076171875, -8.55419921875, -7.580322265625, -6.6064453125, -5.632568359375, -4.65869140625, -3.684814453125, -2.7109375, -1.737060546875, -0.76318359375, 0.210693359375, 1.1845703125, 2.158447265625, 3.13232421875, 4.106201171875, 5.080078125, 6.053955078125, 7.02783203125, 8.001708984375, 8.9755859375, 9.949462890625, 10.92333984375, 11.897216796875, 12.87109375, 13.844970703125, 14.81884765625, 15.792724609375, 16.7666015625, 17.740478515625, 18.71435546875, 19.688232421875, 20.662109375, 21.635986328125, 22.60986328125, 23.583740234375, 24.5576171875, 25.531494140625, 26.50537109375, 27.479248046875, 28.453125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 2.0, 6.0, 8.0, 8.0, 17.0, 15.0, 15.0, 16.0, 23.0, 26.0, 28.0, 29.0, 44.0, 37.0, 46.0, 41.0, 40.0, 36.0, 51.0, 56.0, 56.0, 37.0, 61.0, 32.0, 36.0, 32.0, 20.0, 30.0, 25.0, 21.0, 21.0, 16.0, 12.0, 7.0, 8.0, 5.0, 4.0, 6.0, 5.0, 5.0, 5.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0], "bins": [-22.359375, -21.698486328125, -21.03759765625, -20.376708984375, -19.7158203125, -19.054931640625, -18.39404296875, -17.733154296875, -17.072265625, -16.411376953125, -15.75048828125, -15.089599609375, -14.4287109375, -13.767822265625, -13.10693359375, -12.446044921875, -11.78515625, -11.124267578125, -10.46337890625, -9.802490234375, -9.1416015625, -8.480712890625, -7.81982421875, -7.158935546875, -6.498046875, -5.837158203125, -5.17626953125, -4.515380859375, -3.8544921875, -3.193603515625, -2.53271484375, -1.871826171875, -1.2109375, -0.550048828125, 0.11083984375, 0.771728515625, 1.4326171875, 2.093505859375, 2.75439453125, 3.415283203125, 4.076171875, 4.737060546875, 5.39794921875, 6.058837890625, 6.7197265625, 7.380615234375, 8.04150390625, 8.702392578125, 9.36328125, 10.024169921875, 10.68505859375, 11.345947265625, 12.0068359375, 12.667724609375, 13.32861328125, 13.989501953125, 14.650390625, 15.311279296875, 15.97216796875, 16.633056640625, 17.2939453125, 17.954833984375, 18.61572265625, 19.276611328125, 19.9375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 5.0, 6.0, 9.0, 8.0, 20.0, 26.0, 47.0, 99.0, 138.0, 317.0, 705.0, 2130.0, 7611.0, 36765.0, 449183.0, 3505023.0, 164824.0, 20529.0, 4548.0, 1320.0, 507.0, 200.0, 107.0, 53.0, 28.0, 21.0, 14.0, 9.0, 10.0, 6.0, 6.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-95.375, -92.8212890625, -90.267578125, -87.7138671875, -85.16015625, -82.6064453125, -80.052734375, -77.4990234375, -74.9453125, -72.3916015625, -69.837890625, -67.2841796875, -64.73046875, -62.1767578125, -59.623046875, -57.0693359375, -54.515625, -51.9619140625, -49.408203125, -46.8544921875, -44.30078125, -41.7470703125, -39.193359375, -36.6396484375, -34.0859375, -31.5322265625, -28.978515625, -26.4248046875, -23.87109375, -21.3173828125, -18.763671875, -16.2099609375, -13.65625, -11.1025390625, -8.548828125, -5.9951171875, -3.44140625, -0.8876953125, 1.666015625, 4.2197265625, 6.7734375, 9.3271484375, 11.880859375, 14.4345703125, 16.98828125, 19.5419921875, 22.095703125, 24.6494140625, 27.203125, 29.7568359375, 32.310546875, 34.8642578125, 37.41796875, 39.9716796875, 42.525390625, 45.0791015625, 47.6328125, 50.1865234375, 52.740234375, 55.2939453125, 57.84765625, 60.4013671875, 62.955078125, 65.5087890625, 68.0625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 2.0, 1.0, 5.0, 14.0, 13.0, 10.0, 24.0, 24.0, 32.0, 52.0, 99.0, 125.0, 289.0, 537.0, 840.0, 884.0, 496.0, 260.0, 145.0, 72.0, 56.0, 31.0, 21.0, 13.0, 16.0, 8.0, 4.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-111.875, -109.271484375, -106.66796875, -104.064453125, -101.4609375, -98.857421875, -96.25390625, -93.650390625, -91.046875, -88.443359375, -85.83984375, -83.236328125, -80.6328125, -78.029296875, -75.42578125, -72.822265625, -70.21875, -67.615234375, -65.01171875, -62.408203125, -59.8046875, -57.201171875, -54.59765625, -51.994140625, -49.390625, -46.787109375, -44.18359375, -41.580078125, -38.9765625, -36.373046875, -33.76953125, -31.166015625, -28.5625, -25.958984375, -23.35546875, -20.751953125, -18.1484375, -15.544921875, -12.94140625, -10.337890625, -7.734375, -5.130859375, -2.52734375, 0.076171875, 2.6796875, 5.283203125, 7.88671875, 10.490234375, 13.09375, 15.697265625, 18.30078125, 20.904296875, 23.5078125, 26.111328125, 28.71484375, 31.318359375, 33.921875, 36.525390625, 39.12890625, 41.732421875, 44.3359375, 46.939453125, 49.54296875, 52.146484375, 54.75]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 8.0, 12.0, 23.0, 86.0, 343.0, 393.0, 104.0, 23.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2430.1484375, -2381.74462890625, -2333.3408203125, -2284.93701171875, -2236.533203125, -2188.12939453125, -2139.7255859375, -2091.32177734375, -2042.9180908203125, -1994.5142822265625, -1946.1104736328125, -1897.7066650390625, -1849.3028564453125, -1800.899169921875, -1752.495361328125, -1704.091552734375, -1655.687744140625, -1607.283935546875, -1558.880126953125, -1510.476318359375, -1462.072509765625, -1413.668701171875, -1365.264892578125, -1316.8612060546875, -1268.457275390625, -1220.053466796875, -1171.649658203125, -1123.245849609375, -1074.842041015625, -1026.438232421875, -978.0344848632812, -929.6307373046875, -881.2269287109375, -832.8231201171875, -784.4193115234375, -736.0155029296875, -687.6117553710938, -639.2079467773438, -590.8041381835938, -542.400390625, -493.9965515136719, -445.5927429199219, -397.18896484375, -348.78515625, -300.38134765625, -251.97756958007812, -203.57376098632812, -155.16998291015625, -106.76617431640625, -58.36237716674805, -9.958580017089844, 38.445220947265625, 86.84901428222656, 135.2528076171875, 183.6566162109375, 232.06039428710938, 280.4642028808594, 328.8680114746094, 377.27178955078125, 425.67559814453125, 474.07940673828125, 522.483154296875, 570.886962890625, 619.290771484375, 667.694580078125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 3.0, 6.0, 5.0, 10.0, 6.0, 9.0, 21.0, 14.0, 16.0, 30.0, 24.0, 31.0, 28.0, 29.0, 42.0, 42.0, 42.0, 46.0, 46.0, 56.0, 47.0, 62.0, 53.0, 44.0, 38.0, 31.0, 31.0, 31.0, 25.0, 31.0, 22.0, 13.0, 22.0, 11.0, 6.0, 8.0, 7.0, 1.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-352.5919494628906, -342.6274719238281, -332.6629638671875, -322.698486328125, -312.7340087890625, -302.76953125, -292.8050231933594, -282.8405456542969, -272.87603759765625, -262.91156005859375, -252.9470672607422, -242.98257446289062, -233.01809692382812, -223.05360412597656, -213.089111328125, -203.1246337890625, -193.16015625, -183.19566345214844, -173.23118591308594, -163.26669311523438, -153.30221557617188, -143.3377227783203, -133.37322998046875, -123.40874481201172, -113.44425964355469, -103.47977447509766, -93.51528930664062, -83.55079650878906, -73.58631134033203, -63.621826171875, -53.6573371887207, -43.692848205566406, -33.728363037109375, -23.76387596130371, -13.799388885498047, -3.834901809692383, 6.129585266113281, 16.094070434570312, 26.05855941772461, 36.023048400878906, 45.98753356933594, 55.95201873779297, 65.91650390625, 75.88099670410156, 85.8454818725586, 95.80996704101562, 105.77445983886719, 115.73894500732422, 125.70343017578125, 135.6679229736328, 145.6324005126953, 155.59689331054688, 165.56137084960938, 175.52586364746094, 185.4903564453125, 195.454833984375, 205.41932678222656, 215.38381958007812, 225.34829711914062, 235.3127899169922, 245.27728271484375, 255.24176025390625, 265.20623779296875, 275.1707458496094, 285.1352233886719]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 7.0, 5.0, 9.0, 19.0, 25.0, 44.0, 44.0, 64.0, 106.0, 179.0, 261.0, 436.0, 663.0, 1199.0, 2115.0, 4131.0, 10233.0, 36115.0, 182647.0, 538887.0, 209722.0, 40714.0, 11100.0, 4425.0, 2256.0, 1196.0, 733.0, 424.0, 275.0, 153.0, 116.0, 75.0, 53.0, 44.0, 26.0, 22.0, 11.0, 12.0, 2.0, 1.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-47.03125, -45.5859375, -44.140625, -42.6953125, -41.25, -39.8046875, -38.359375, -36.9140625, -35.46875, -34.0234375, -32.578125, -31.1328125, -29.6875, -28.2421875, -26.796875, -25.3515625, -23.90625, -22.4609375, -21.015625, -19.5703125, -18.125, -16.6796875, -15.234375, -13.7890625, -12.34375, -10.8984375, -9.453125, -8.0078125, -6.5625, -5.1171875, -3.671875, -2.2265625, -0.78125, 0.6640625, 2.109375, 3.5546875, 5.0, 6.4453125, 7.890625, 9.3359375, 10.78125, 12.2265625, 13.671875, 15.1171875, 16.5625, 18.0078125, 19.453125, 20.8984375, 22.34375, 23.7890625, 25.234375, 26.6796875, 28.125, 29.5703125, 31.015625, 32.4609375, 33.90625, 35.3515625, 36.796875, 38.2421875, 39.6875, 41.1328125, 42.578125, 44.0234375, 45.46875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 7.0, 4.0, 1.0, 5.0, 9.0, 16.0, 9.0, 14.0, 17.0, 15.0, 21.0, 29.0, 29.0, 27.0, 28.0, 40.0, 48.0, 50.0, 38.0, 50.0, 41.0, 62.0, 46.0, 39.0, 41.0, 33.0, 37.0, 32.0, 33.0, 25.0, 31.0, 25.0, 21.0, 21.0, 19.0, 12.0, 9.0, 3.0, 8.0, 4.0, 2.0, 3.0, 3.0, 0.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.234375, -21.521484375, -20.80859375, -20.095703125, -19.3828125, -18.669921875, -17.95703125, -17.244140625, -16.53125, -15.818359375, -15.10546875, -14.392578125, -13.6796875, -12.966796875, -12.25390625, -11.541015625, -10.828125, -10.115234375, -9.40234375, -8.689453125, -7.9765625, -7.263671875, -6.55078125, -5.837890625, -5.125, -4.412109375, -3.69921875, -2.986328125, -2.2734375, -1.560546875, -0.84765625, -0.134765625, 0.578125, 1.291015625, 2.00390625, 2.716796875, 3.4296875, 4.142578125, 4.85546875, 5.568359375, 6.28125, 6.994140625, 7.70703125, 8.419921875, 9.1328125, 9.845703125, 10.55859375, 11.271484375, 11.984375, 12.697265625, 13.41015625, 14.123046875, 14.8359375, 15.548828125, 16.26171875, 16.974609375, 17.6875, 18.400390625, 19.11328125, 19.826171875, 20.5390625, 21.251953125, 21.96484375, 22.677734375, 23.390625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 3.0, 3.0, 8.0, 10.0, 4.0, 14.0, 18.0, 17.0, 22.0, 25.0, 48.0, 76.0, 118.0, 165.0, 326.0, 596.0, 1221.0, 3247.0, 13120.0, 145716.0, 813531.0, 57733.0, 7971.0, 2363.0, 1000.0, 520.0, 245.0, 160.0, 79.0, 52.0, 45.0, 26.0, 20.0, 12.0, 9.0, 13.0, 7.0, 6.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-88.625, -85.884765625, -83.14453125, -80.404296875, -77.6640625, -74.923828125, -72.18359375, -69.443359375, -66.703125, -63.962890625, -61.22265625, -58.482421875, -55.7421875, -53.001953125, -50.26171875, -47.521484375, -44.78125, -42.041015625, -39.30078125, -36.560546875, -33.8203125, -31.080078125, -28.33984375, -25.599609375, -22.859375, -20.119140625, -17.37890625, -14.638671875, -11.8984375, -9.158203125, -6.41796875, -3.677734375, -0.9375, 1.802734375, 4.54296875, 7.283203125, 10.0234375, 12.763671875, 15.50390625, 18.244140625, 20.984375, 23.724609375, 26.46484375, 29.205078125, 31.9453125, 34.685546875, 37.42578125, 40.166015625, 42.90625, 45.646484375, 48.38671875, 51.126953125, 53.8671875, 56.607421875, 59.34765625, 62.087890625, 64.828125, 67.568359375, 70.30859375, 73.048828125, 75.7890625, 78.529296875, 81.26953125, 84.009765625, 86.75]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 8.0, 4.0, 10.0, 10.0, 11.0, 13.0, 13.0, 24.0, 23.0, 33.0, 47.0, 54.0, 50.0, 55.0, 73.0, 63.0, 62.0, 90.0, 63.0, 51.0, 50.0, 48.0, 35.0, 28.0, 25.0, 19.0, 12.0, 7.0, 5.0, 2.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.875, -116.9765625, -113.078125, -109.1796875, -105.28125, -101.3828125, -97.484375, -93.5859375, -89.6875, -85.7890625, -81.890625, -77.9921875, -74.09375, -70.1953125, -66.296875, -62.3984375, -58.5, -54.6015625, -50.703125, -46.8046875, -42.90625, -39.0078125, -35.109375, -31.2109375, -27.3125, -23.4140625, -19.515625, -15.6171875, -11.71875, -7.8203125, -3.921875, -0.0234375, 3.875, 7.7734375, 11.671875, 15.5703125, 19.46875, 23.3671875, 27.265625, 31.1640625, 35.0625, 38.9609375, 42.859375, 46.7578125, 50.65625, 54.5546875, 58.453125, 62.3515625, 66.25, 70.1484375, 74.046875, 77.9453125, 81.84375, 85.7421875, 89.640625, 93.5390625, 97.4375, 101.3359375, 105.234375, 109.1328125, 113.03125, 116.9296875, 120.828125, 124.7265625, 128.625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 0.0, 9.0, 9.0, 8.0, 21.0, 26.0, 22.0, 51.0, 68.0, 89.0, 142.0, 285.0, 533.0, 1013.0, 2228.0, 5205.0, 15386.0, 63336.0, 503064.0, 371288.0, 61267.0, 15080.0, 5113.0, 2095.0, 1029.0, 477.0, 252.0, 145.0, 91.0, 67.0, 41.0, 25.0, 33.0, 11.0, 11.0, 8.0, 9.0, 6.0, 1.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.109375, -23.305419921875, -22.50146484375, -21.697509765625, -20.8935546875, -20.089599609375, -19.28564453125, -18.481689453125, -17.677734375, -16.873779296875, -16.06982421875, -15.265869140625, -14.4619140625, -13.657958984375, -12.85400390625, -12.050048828125, -11.24609375, -10.442138671875, -9.63818359375, -8.834228515625, -8.0302734375, -7.226318359375, -6.42236328125, -5.618408203125, -4.814453125, -4.010498046875, -3.20654296875, -2.402587890625, -1.5986328125, -0.794677734375, 0.00927734375, 0.813232421875, 1.6171875, 2.421142578125, 3.22509765625, 4.029052734375, 4.8330078125, 5.636962890625, 6.44091796875, 7.244873046875, 8.048828125, 8.852783203125, 9.65673828125, 10.460693359375, 11.2646484375, 12.068603515625, 12.87255859375, 13.676513671875, 14.48046875, 15.284423828125, 16.08837890625, 16.892333984375, 17.6962890625, 18.500244140625, 19.30419921875, 20.108154296875, 20.912109375, 21.716064453125, 22.52001953125, 23.323974609375, 24.1279296875, 24.931884765625, 25.73583984375, 26.539794921875, 27.34375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 5.0, 4.0, 9.0, 8.0, 19.0, 24.0, 43.0, 64.0, 79.0, 96.0, 131.0, 91.0, 120.0, 97.0, 58.0, 39.0, 31.0, 30.0, 8.0, 6.0, 6.0, 6.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0085296630859375, -0.00829392671585083, -0.00805819034576416, -0.00782245397567749, -0.00758671760559082, -0.00735098123550415, -0.0071152448654174805, -0.0068795084953308105, -0.006643772125244141, -0.006408035755157471, -0.006172299385070801, -0.005936563014984131, -0.005700826644897461, -0.005465090274810791, -0.005229353904724121, -0.004993617534637451, -0.004757881164550781, -0.004522144794464111, -0.004286408424377441, -0.0040506720542907715, -0.0038149356842041016, -0.0035791993141174316, -0.0033434629440307617, -0.003107726573944092, -0.002871990203857422, -0.002636253833770752, -0.002400517463684082, -0.002164781093597412, -0.0019290447235107422, -0.0016933083534240723, -0.0014575719833374023, -0.0012218356132507324, -0.0009860992431640625, -0.0007503628730773926, -0.0005146265029907227, -0.00027889013290405273, -4.315376281738281e-05, 0.0001925826072692871, 0.00042831897735595703, 0.000664055347442627, 0.0008997917175292969, 0.0011355280876159668, 0.0013712644577026367, 0.0016070008277893066, 0.0018427371978759766, 0.0020784735679626465, 0.0023142099380493164, 0.0025499463081359863, 0.0027856826782226562, 0.003021419048309326, 0.003257155418395996, 0.003492891788482666, 0.003728628158569336, 0.003964364528656006, 0.004200100898742676, 0.004435837268829346, 0.004671573638916016, 0.0049073100090026855, 0.0051430463790893555, 0.005378782749176025, 0.005614519119262695, 0.005850255489349365, 0.006085991859436035, 0.006321728229522705, 0.006557464599609375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 13.0, 19.0, 30.0, 62.0, 101.0, 219.0, 570.0, 1749.0, 7511.0, 69053.0, 825966.0, 128366.0, 11275.0, 2328.0, 737.0, 295.0, 122.0, 65.0, 23.0, 26.0, 14.0, 6.0, 3.0, 0.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.296875, -26.853759765625, -25.41064453125, -23.967529296875, -22.5244140625, -21.081298828125, -19.63818359375, -18.195068359375, -16.751953125, -15.308837890625, -13.86572265625, -12.422607421875, -10.9794921875, -9.536376953125, -8.09326171875, -6.650146484375, -5.20703125, -3.763916015625, -2.32080078125, -0.877685546875, 0.5654296875, 2.008544921875, 3.45166015625, 4.894775390625, 6.337890625, 7.781005859375, 9.22412109375, 10.667236328125, 12.1103515625, 13.553466796875, 14.99658203125, 16.439697265625, 17.8828125, 19.325927734375, 20.76904296875, 22.212158203125, 23.6552734375, 25.098388671875, 26.54150390625, 27.984619140625, 29.427734375, 30.870849609375, 32.31396484375, 33.757080078125, 35.2001953125, 36.643310546875, 38.08642578125, 39.529541015625, 40.97265625, 42.415771484375, 43.85888671875, 45.302001953125, 46.7451171875, 48.188232421875, 49.63134765625, 51.074462890625, 52.517578125, 53.960693359375, 55.40380859375, 56.846923828125, 58.2900390625, 59.733154296875, 61.17626953125, 62.619384765625, 64.0625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 7.0, 6.0, 7.0, 11.0, 10.0, 11.0, 15.0, 26.0, 34.0, 48.0, 61.0, 82.0, 67.0, 84.0, 87.0, 99.0, 88.0, 58.0, 61.0, 34.0, 35.0, 25.0, 15.0, 7.0, 7.0, 6.0, 6.0, 1.0, 4.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-33.375, -32.521728515625, -31.66845703125, -30.815185546875, -29.9619140625, -29.108642578125, -28.25537109375, -27.402099609375, -26.548828125, -25.695556640625, -24.84228515625, -23.989013671875, -23.1357421875, -22.282470703125, -21.42919921875, -20.575927734375, -19.72265625, -18.869384765625, -18.01611328125, -17.162841796875, -16.3095703125, -15.456298828125, -14.60302734375, -13.749755859375, -12.896484375, -12.043212890625, -11.18994140625, -10.336669921875, -9.4833984375, -8.630126953125, -7.77685546875, -6.923583984375, -6.0703125, -5.217041015625, -4.36376953125, -3.510498046875, -2.6572265625, -1.803955078125, -0.95068359375, -0.097412109375, 0.755859375, 1.609130859375, 2.46240234375, 3.315673828125, 4.1689453125, 5.022216796875, 5.87548828125, 6.728759765625, 7.58203125, 8.435302734375, 9.28857421875, 10.141845703125, 10.9951171875, 11.848388671875, 12.70166015625, 13.554931640625, 14.408203125, 15.261474609375, 16.11474609375, 16.968017578125, 17.8212890625, 18.674560546875, 19.52783203125, 20.381103515625, 21.234375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 5.0, 16.0, 23.0, 45.0, 49.0, 93.0, 162.0, 227.0, 131.0, 87.0, 61.0, 35.0, 18.0, 10.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-369.34765625, -355.2655029296875, -341.183349609375, -327.1011962890625, -313.0190734863281, -298.9369201660156, -284.8547668457031, -270.7726135253906, -256.69049072265625, -242.60833740234375, -228.5261993408203, -214.4440460205078, -200.36190795898438, -186.27975463867188, -172.19760131835938, -158.11544799804688, -144.03329467773438, -129.95114135742188, -115.86900329589844, -101.78684997558594, -87.70470428466797, -73.62255859375, -59.5404052734375, -45.45825958251953, -31.376113891601562, -17.29396629333496, -3.2118186950683594, 10.870330810546875, 24.952476501464844, 39.03462219238281, 53.11677551269531, 67.19892120361328, 81.28106689453125, 95.36321258544922, 109.44535827636719, 123.52751159667969, 137.60964965820312, 151.69180297851562, 165.77395629882812, 179.85610961914062, 193.93824768066406, 208.02040100097656, 222.1025390625, 236.1846923828125, 250.266845703125, 264.3489990234375, 278.43115234375, 292.5132751464844, 306.5954284667969, 320.6775817871094, 334.7597351074219, 348.84185791015625, 362.92401123046875, 377.00616455078125, 391.08831787109375, 405.17047119140625, 419.25262451171875, 433.33477783203125, 447.41693115234375, 461.49908447265625, 475.5812072753906, 489.6633605957031, 503.7455139160156, 517.82763671875, 531.9097900390625]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 6.0, 1.0, 2.0, 0.0, 5.0, 3.0, 4.0, 4.0, 6.0, 3.0, 8.0, 13.0, 13.0, 11.0, 20.0, 18.0, 19.0, 19.0, 26.0, 27.0, 35.0, 29.0, 41.0, 41.0, 57.0, 81.0, 79.0, 73.0, 47.0, 40.0, 37.0, 34.0, 32.0, 17.0, 32.0, 24.0, 16.0, 18.0, 15.0, 10.0, 8.0, 10.0, 3.0, 8.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0], "bins": [-368.02923583984375, -356.7095031738281, -345.3897705078125, -334.0700378417969, -322.75030517578125, -311.4305725097656, -300.11083984375, -288.79107666015625, -277.47137451171875, -266.1516418457031, -254.8319091796875, -243.51217651367188, -232.19244384765625, -220.87271118164062, -209.55296325683594, -198.2332305908203, -186.91348266601562, -175.59375, -164.27401733398438, -152.95428466796875, -141.63455200195312, -130.3148193359375, -118.99507141113281, -107.67533874511719, -96.35560607910156, -85.03587341308594, -73.71614074707031, -62.396400451660156, -51.07666778564453, -39.756935119628906, -28.43719482421875, -17.117462158203125, -5.7977294921875, 5.522005081176758, 16.841739654541016, 28.161476135253906, 39.48120880126953, 50.800941467285156, 62.12068176269531, 73.44041442871094, 84.76014709472656, 96.07987976074219, 107.39961242675781, 118.71935272216797, 130.03909301757812, 141.35882568359375, 152.67855834960938, 163.998291015625, 175.31802368164062, 186.63775634765625, 197.95748901367188, 209.2772216796875, 220.59695434570312, 231.91668701171875, 243.23643493652344, 254.55616760253906, 265.87591552734375, 277.1956481933594, 288.515380859375, 299.8351135253906, 311.15484619140625, 322.4745788574219, 333.7943115234375, 345.11407470703125, 356.43377685546875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 3.0, 3.0, 7.0, 7.0, 11.0, 13.0, 28.0, 38.0, 33.0, 74.0, 106.0, 182.0, 292.0, 449.0, 745.0, 1306.0, 2417.0, 4594.0, 9979.0, 25450.0, 84306.0, 365370.0, 1644226.0, 1580511.0, 348183.0, 80905.0, 24706.0, 10115.0, 4604.0, 2357.0, 1253.0, 748.0, 467.0, 263.0, 166.0, 132.0, 72.0, 57.0, 29.0, 19.0, 17.0, 9.0, 7.0, 10.0, 7.0, 2.0, 3.0, 2.0], "bins": [-29.359375, -28.606201171875, -27.85302734375, -27.099853515625, -26.3466796875, -25.593505859375, -24.84033203125, -24.087158203125, -23.333984375, -22.580810546875, -21.82763671875, -21.074462890625, -20.3212890625, -19.568115234375, -18.81494140625, -18.061767578125, -17.30859375, -16.555419921875, -15.80224609375, -15.049072265625, -14.2958984375, -13.542724609375, -12.78955078125, -12.036376953125, -11.283203125, -10.530029296875, -9.77685546875, -9.023681640625, -8.2705078125, -7.517333984375, -6.76416015625, -6.010986328125, -5.2578125, -4.504638671875, -3.75146484375, -2.998291015625, -2.2451171875, -1.491943359375, -0.73876953125, 0.014404296875, 0.767578125, 1.520751953125, 2.27392578125, 3.027099609375, 3.7802734375, 4.533447265625, 5.28662109375, 6.039794921875, 6.79296875, 7.546142578125, 8.29931640625, 9.052490234375, 9.8056640625, 10.558837890625, 11.31201171875, 12.065185546875, 12.818359375, 13.571533203125, 14.32470703125, 15.077880859375, 15.8310546875, 16.584228515625, 17.33740234375, 18.090576171875, 18.84375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 0.0, 3.0, 2.0, 3.0, 5.0, 9.0, 8.0, 13.0, 9.0, 17.0, 22.0, 19.0, 29.0, 21.0, 25.0, 33.0, 40.0, 35.0, 34.0, 44.0, 48.0, 45.0, 50.0, 52.0, 37.0, 49.0, 51.0, 37.0, 39.0, 36.0, 41.0, 21.0, 18.0, 24.0, 22.0, 9.0, 10.0, 11.0, 7.0, 7.0, 4.0, 1.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.25, -23.501953125, -22.75390625, -22.005859375, -21.2578125, -20.509765625, -19.76171875, -19.013671875, -18.265625, -17.517578125, -16.76953125, -16.021484375, -15.2734375, -14.525390625, -13.77734375, -13.029296875, -12.28125, -11.533203125, -10.78515625, -10.037109375, -9.2890625, -8.541015625, -7.79296875, -7.044921875, -6.296875, -5.548828125, -4.80078125, -4.052734375, -3.3046875, -2.556640625, -1.80859375, -1.060546875, -0.3125, 0.435546875, 1.18359375, 1.931640625, 2.6796875, 3.427734375, 4.17578125, 4.923828125, 5.671875, 6.419921875, 7.16796875, 7.916015625, 8.6640625, 9.412109375, 10.16015625, 10.908203125, 11.65625, 12.404296875, 13.15234375, 13.900390625, 14.6484375, 15.396484375, 16.14453125, 16.892578125, 17.640625, 18.388671875, 19.13671875, 19.884765625, 20.6328125, 21.380859375, 22.12890625, 22.876953125, 23.625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 8.0, 8.0, 5.0, 17.0, 30.0, 53.0, 79.0, 152.0, 312.0, 844.0, 2506.0, 10212.0, 64766.0, 2154953.0, 1885800.0, 60863.0, 9752.0, 2407.0, 781.0, 356.0, 132.0, 90.0, 42.0, 28.0, 29.0, 14.0, 6.0, 3.0, 3.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-63.875, -61.5078125, -59.140625, -56.7734375, -54.40625, -52.0390625, -49.671875, -47.3046875, -44.9375, -42.5703125, -40.203125, -37.8359375, -35.46875, -33.1015625, -30.734375, -28.3671875, -26.0, -23.6328125, -21.265625, -18.8984375, -16.53125, -14.1640625, -11.796875, -9.4296875, -7.0625, -4.6953125, -2.328125, 0.0390625, 2.40625, 4.7734375, 7.140625, 9.5078125, 11.875, 14.2421875, 16.609375, 18.9765625, 21.34375, 23.7109375, 26.078125, 28.4453125, 30.8125, 33.1796875, 35.546875, 37.9140625, 40.28125, 42.6484375, 45.015625, 47.3828125, 49.75, 52.1171875, 54.484375, 56.8515625, 59.21875, 61.5859375, 63.953125, 66.3203125, 68.6875, 71.0546875, 73.421875, 75.7890625, 78.15625, 80.5234375, 82.890625, 85.2578125, 87.625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 4.0, 12.0, 6.0, 8.0, 12.0, 25.0, 26.0, 23.0, 41.0, 59.0, 113.0, 148.0, 219.0, 334.0, 491.0, 638.0, 606.0, 393.0, 295.0, 171.0, 141.0, 64.0, 54.0, 39.0, 35.0, 22.0, 17.0, 13.0, 7.0, 8.0, 8.0, 10.0, 5.0, 7.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-52.78125, -51.21728515625, -49.6533203125, -48.08935546875, -46.525390625, -44.96142578125, -43.3974609375, -41.83349609375, -40.26953125, -38.70556640625, -37.1416015625, -35.57763671875, -34.013671875, -32.44970703125, -30.8857421875, -29.32177734375, -27.7578125, -26.19384765625, -24.6298828125, -23.06591796875, -21.501953125, -19.93798828125, -18.3740234375, -16.81005859375, -15.24609375, -13.68212890625, -12.1181640625, -10.55419921875, -8.990234375, -7.42626953125, -5.8623046875, -4.29833984375, -2.734375, -1.17041015625, 0.3935546875, 1.95751953125, 3.521484375, 5.08544921875, 6.6494140625, 8.21337890625, 9.77734375, 11.34130859375, 12.9052734375, 14.46923828125, 16.033203125, 17.59716796875, 19.1611328125, 20.72509765625, 22.2890625, 23.85302734375, 25.4169921875, 26.98095703125, 28.544921875, 30.10888671875, 31.6728515625, 33.23681640625, 34.80078125, 36.36474609375, 37.9287109375, 39.49267578125, 41.056640625, 42.62060546875, 44.1845703125, 45.74853515625, 47.3125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 14.0, 18.0, 37.0, 94.0, 174.0, 239.0, 212.0, 111.0, 50.0, 22.0, 6.0, 9.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-671.1571044921875, -649.3225708007812, -627.4880981445312, -605.653564453125, -583.819091796875, -561.9845581054688, -540.1500244140625, -518.3155517578125, -496.4810485839844, -474.64654541015625, -452.8120422363281, -430.9775390625, -409.14300537109375, -387.30853271484375, -365.4739990234375, -343.6394958496094, -321.80499267578125, -299.9704895019531, -278.135986328125, -256.30145263671875, -234.4669647216797, -212.63246154785156, -190.79794311523438, -168.96343994140625, -147.12893676757812, -125.29443359375, -103.45992279052734, -81.62541198730469, -59.79090881347656, -37.95640563964844, -16.12188720703125, 5.712615966796875, 27.54718017578125, 49.38168716430664, 71.21619415283203, 93.05070495605469, 114.88520812988281, 136.71971130371094, 158.55422973632812, 180.38873291015625, 202.22323608398438, 224.0577392578125, 245.89224243164062, 267.72674560546875, 289.561279296875, 311.395751953125, 333.23028564453125, 355.0647888183594, 376.8992919921875, 398.7337951660156, 420.56829833984375, 442.40283203125, 464.2373046875, 486.07183837890625, 507.9063415527344, 529.7408447265625, 551.5753173828125, 573.4098510742188, 595.2443237304688, 617.078857421875, 638.913330078125, 660.7478637695312, 682.5823974609375, 704.4168701171875, 726.2514038085938]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 6.0, 7.0, 5.0, 7.0, 21.0, 12.0, 11.0, 16.0, 23.0, 30.0, 44.0, 28.0, 51.0, 52.0, 64.0, 53.0, 67.0, 62.0, 66.0, 58.0, 55.0, 52.0, 38.0, 28.0, 33.0, 33.0, 22.0, 16.0, 13.0, 9.0, 9.0, 2.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-360.1078796386719, -349.8678283691406, -339.62774658203125, -329.3876953125, -319.1476135253906, -308.9075622558594, -298.66748046875, -288.42742919921875, -278.1873779296875, -267.94732666015625, -257.7072448730469, -247.46717834472656, -237.22711181640625, -226.987060546875, -216.7469940185547, -206.50692749023438, -196.266845703125, -186.0267791748047, -175.78671264648438, -165.54664611816406, -155.30657958984375, -145.0665283203125, -134.8264617919922, -124.58639526367188, -114.34632873535156, -104.10626220703125, -93.86619567871094, -83.62613677978516, -73.38607025146484, -63.14600372314453, -52.905941009521484, -42.66587829589844, -32.42584228515625, -22.18577766418457, -11.94571304321289, -1.705648422241211, 8.534416198730469, 18.77448272705078, 29.014545440673828, 39.254608154296875, 49.49467468261719, 59.7347412109375, 69.97480773925781, 80.2148666381836, 90.4549331665039, 100.69499969482422, 110.93505859375, 121.17512512207031, 131.41519165039062, 141.65525817871094, 151.89532470703125, 162.13539123535156, 172.37545776367188, 182.61550903320312, 192.85557556152344, 203.09564208984375, 213.33570861816406, 223.57577514648438, 233.8158416748047, 244.055908203125, 254.29595947265625, 264.5360412597656, 274.7760925292969, 285.01617431640625, 295.2562255859375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 8.0, 6.0, 15.0, 17.0, 31.0, 57.0, 78.0, 123.0, 220.0, 349.0, 568.0, 1223.0, 2834.0, 7896.0, 29514.0, 180777.0, 636847.0, 150245.0, 25513.0, 7062.0, 2525.0, 1164.0, 584.0, 349.0, 219.0, 102.0, 80.0, 54.0, 34.0, 17.0, 19.0, 11.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-54.40625, -52.8271484375, -51.248046875, -49.6689453125, -48.08984375, -46.5107421875, -44.931640625, -43.3525390625, -41.7734375, -40.1943359375, -38.615234375, -37.0361328125, -35.45703125, -33.8779296875, -32.298828125, -30.7197265625, -29.140625, -27.5615234375, -25.982421875, -24.4033203125, -22.82421875, -21.2451171875, -19.666015625, -18.0869140625, -16.5078125, -14.9287109375, -13.349609375, -11.7705078125, -10.19140625, -8.6123046875, -7.033203125, -5.4541015625, -3.875, -2.2958984375, -0.716796875, 0.8623046875, 2.44140625, 4.0205078125, 5.599609375, 7.1787109375, 8.7578125, 10.3369140625, 11.916015625, 13.4951171875, 15.07421875, 16.6533203125, 18.232421875, 19.8115234375, 21.390625, 22.9697265625, 24.548828125, 26.1279296875, 27.70703125, 29.2861328125, 30.865234375, 32.4443359375, 34.0234375, 35.6025390625, 37.181640625, 38.7607421875, 40.33984375, 41.9189453125, 43.498046875, 45.0771484375, 46.65625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 3.0, 6.0, 4.0, 3.0, 4.0, 8.0, 5.0, 8.0, 9.0, 16.0, 13.0, 21.0, 33.0, 21.0, 34.0, 32.0, 47.0, 43.0, 47.0, 62.0, 54.0, 51.0, 55.0, 60.0, 51.0, 46.0, 41.0, 36.0, 30.0, 36.0, 23.0, 21.0, 16.0, 24.0, 11.0, 8.0, 8.0, 7.0, 7.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.8125, -20.92578125, -20.0390625, -19.15234375, -18.265625, -17.37890625, -16.4921875, -15.60546875, -14.71875, -13.83203125, -12.9453125, -12.05859375, -11.171875, -10.28515625, -9.3984375, -8.51171875, -7.625, -6.73828125, -5.8515625, -4.96484375, -4.078125, -3.19140625, -2.3046875, -1.41796875, -0.53125, 0.35546875, 1.2421875, 2.12890625, 3.015625, 3.90234375, 4.7890625, 5.67578125, 6.5625, 7.44921875, 8.3359375, 9.22265625, 10.109375, 10.99609375, 11.8828125, 12.76953125, 13.65625, 14.54296875, 15.4296875, 16.31640625, 17.203125, 18.08984375, 18.9765625, 19.86328125, 20.75, 21.63671875, 22.5234375, 23.41015625, 24.296875, 25.18359375, 26.0703125, 26.95703125, 27.84375, 28.73046875, 29.6171875, 30.50390625, 31.390625, 32.27734375, 33.1640625, 34.05078125, 34.9375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 7.0, 5.0, 8.0, 8.0, 7.0, 11.0, 13.0, 19.0, 24.0, 46.0, 61.0, 83.0, 134.0, 168.0, 320.0, 572.0, 1061.0, 2399.0, 6687.0, 29889.0, 288568.0, 657914.0, 45963.0, 8775.0, 2873.0, 1263.0, 627.0, 309.0, 232.0, 148.0, 91.0, 75.0, 45.0, 48.0, 27.0, 17.0, 10.0, 16.0, 7.0, 4.0, 2.0, 2.0, 6.0, 4.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.15625, -55.19287109375, -53.2294921875, -51.26611328125, -49.302734375, -47.33935546875, -45.3759765625, -43.41259765625, -41.44921875, -39.48583984375, -37.5224609375, -35.55908203125, -33.595703125, -31.63232421875, -29.6689453125, -27.70556640625, -25.7421875, -23.77880859375, -21.8154296875, -19.85205078125, -17.888671875, -15.92529296875, -13.9619140625, -11.99853515625, -10.03515625, -8.07177734375, -6.1083984375, -4.14501953125, -2.181640625, -0.21826171875, 1.7451171875, 3.70849609375, 5.671875, 7.63525390625, 9.5986328125, 11.56201171875, 13.525390625, 15.48876953125, 17.4521484375, 19.41552734375, 21.37890625, 23.34228515625, 25.3056640625, 27.26904296875, 29.232421875, 31.19580078125, 33.1591796875, 35.12255859375, 37.0859375, 39.04931640625, 41.0126953125, 42.97607421875, 44.939453125, 46.90283203125, 48.8662109375, 50.82958984375, 52.79296875, 54.75634765625, 56.7197265625, 58.68310546875, 60.646484375, 62.60986328125, 64.5732421875, 66.53662109375, 68.5]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 2.0, 7.0, 8.0, 10.0, 13.0, 14.0, 14.0, 26.0, 21.0, 24.0, 28.0, 49.0, 49.0, 45.0, 55.0, 54.0, 75.0, 62.0, 43.0, 51.0, 66.0, 47.0, 41.0, 33.0, 24.0, 21.0, 24.0, 15.0, 13.0, 8.0, 7.0, 11.0, 8.0, 10.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-88.0625, -84.6826171875, -81.302734375, -77.9228515625, -74.54296875, -71.1630859375, -67.783203125, -64.4033203125, -61.0234375, -57.6435546875, -54.263671875, -50.8837890625, -47.50390625, -44.1240234375, -40.744140625, -37.3642578125, -33.984375, -30.6044921875, -27.224609375, -23.8447265625, -20.46484375, -17.0849609375, -13.705078125, -10.3251953125, -6.9453125, -3.5654296875, -0.185546875, 3.1943359375, 6.57421875, 9.9541015625, 13.333984375, 16.7138671875, 20.09375, 23.4736328125, 26.853515625, 30.2333984375, 33.61328125, 36.9931640625, 40.373046875, 43.7529296875, 47.1328125, 50.5126953125, 53.892578125, 57.2724609375, 60.65234375, 64.0322265625, 67.412109375, 70.7919921875, 74.171875, 77.5517578125, 80.931640625, 84.3115234375, 87.69140625, 91.0712890625, 94.451171875, 97.8310546875, 101.2109375, 104.5908203125, 107.970703125, 111.3505859375, 114.73046875, 118.1103515625, 121.490234375, 124.8701171875, 128.25]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 13.0, 11.0, 13.0, 23.0, 35.0, 48.0, 86.0, 123.0, 231.0, 366.0, 615.0, 1133.0, 2409.0, 5205.0, 13236.0, 39480.0, 157701.0, 666415.0, 111812.0, 30015.0, 10869.0, 4329.0, 2050.0, 1009.0, 527.0, 297.0, 170.0, 104.0, 81.0, 45.0, 22.0, 24.0, 18.0, 11.0, 8.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.5625, -18.006591796875, -17.45068359375, -16.894775390625, -16.3388671875, -15.782958984375, -15.22705078125, -14.671142578125, -14.115234375, -13.559326171875, -13.00341796875, -12.447509765625, -11.8916015625, -11.335693359375, -10.77978515625, -10.223876953125, -9.66796875, -9.112060546875, -8.55615234375, -8.000244140625, -7.4443359375, -6.888427734375, -6.33251953125, -5.776611328125, -5.220703125, -4.664794921875, -4.10888671875, -3.552978515625, -2.9970703125, -2.441162109375, -1.88525390625, -1.329345703125, -0.7734375, -0.217529296875, 0.33837890625, 0.894287109375, 1.4501953125, 2.006103515625, 2.56201171875, 3.117919921875, 3.673828125, 4.229736328125, 4.78564453125, 5.341552734375, 5.8974609375, 6.453369140625, 7.00927734375, 7.565185546875, 8.12109375, 8.677001953125, 9.23291015625, 9.788818359375, 10.3447265625, 10.900634765625, 11.45654296875, 12.012451171875, 12.568359375, 13.124267578125, 13.68017578125, 14.236083984375, 14.7919921875, 15.347900390625, 15.90380859375, 16.459716796875, 17.015625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 8.0, 8.0, 17.0, 14.0, 38.0, 64.0, 82.0, 119.0, 151.0, 143.0, 93.0, 76.0, 56.0, 25.0, 34.0, 11.0, 15.0, 4.0, 12.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0059814453125, -0.005759119987487793, -0.005536794662475586, -0.005314469337463379, -0.005092144012451172, -0.004869818687438965, -0.004647493362426758, -0.004425168037414551, -0.004202842712402344, -0.003980517387390137, -0.0037581920623779297, -0.0035358667373657227, -0.0033135414123535156, -0.0030912160873413086, -0.0028688907623291016, -0.0026465654373168945, -0.0024242401123046875, -0.0022019147872924805, -0.0019795894622802734, -0.0017572641372680664, -0.0015349388122558594, -0.0013126134872436523, -0.0010902881622314453, -0.0008679628372192383, -0.0006456375122070312, -0.0004233121871948242, -0.0002009868621826172, 2.1338462829589844e-05, 0.00024366378784179688, 0.0004659891128540039, 0.0006883144378662109, 0.000910639762878418, 0.001132965087890625, 0.001355290412902832, 0.001577615737915039, 0.001799941062927246, 0.002022266387939453, 0.00224459171295166, 0.002466917037963867, 0.0026892423629760742, 0.0029115676879882812, 0.0031338930130004883, 0.0033562183380126953, 0.0035785436630249023, 0.0038008689880371094, 0.004023194313049316, 0.0042455196380615234, 0.0044678449630737305, 0.0046901702880859375, 0.0049124956130981445, 0.0051348209381103516, 0.005357146263122559, 0.005579471588134766, 0.005801796913146973, 0.00602412223815918, 0.006246447563171387, 0.006468772888183594, 0.006691098213195801, 0.006913423538208008, 0.007135748863220215, 0.007358074188232422, 0.007580399513244629, 0.007802724838256836, 0.008025050163269043, 0.00824737548828125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 8.0, 12.0, 16.0, 32.0, 24.0, 61.0, 89.0, 150.0, 254.0, 517.0, 1130.0, 2813.0, 8730.0, 38753.0, 283431.0, 640454.0, 54417.0, 11465.0, 3521.0, 1359.0, 561.0, 282.0, 179.0, 94.0, 57.0, 40.0, 28.0, 23.0, 13.0, 8.0, 10.0, 9.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.796875, -23.99951171875, -23.2021484375, -22.40478515625, -21.607421875, -20.81005859375, -20.0126953125, -19.21533203125, -18.41796875, -17.62060546875, -16.8232421875, -16.02587890625, -15.228515625, -14.43115234375, -13.6337890625, -12.83642578125, -12.0390625, -11.24169921875, -10.4443359375, -9.64697265625, -8.849609375, -8.05224609375, -7.2548828125, -6.45751953125, -5.66015625, -4.86279296875, -4.0654296875, -3.26806640625, -2.470703125, -1.67333984375, -0.8759765625, -0.07861328125, 0.71875, 1.51611328125, 2.3134765625, 3.11083984375, 3.908203125, 4.70556640625, 5.5029296875, 6.30029296875, 7.09765625, 7.89501953125, 8.6923828125, 9.48974609375, 10.287109375, 11.08447265625, 11.8818359375, 12.67919921875, 13.4765625, 14.27392578125, 15.0712890625, 15.86865234375, 16.666015625, 17.46337890625, 18.2607421875, 19.05810546875, 19.85546875, 20.65283203125, 21.4501953125, 22.24755859375, 23.044921875, 23.84228515625, 24.6396484375, 25.43701171875, 26.234375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 1.0, 4.0, 6.0, 6.0, 13.0, 15.0, 18.0, 43.0, 53.0, 66.0, 103.0, 120.0, 131.0, 135.0, 88.0, 63.0, 53.0, 32.0, 24.0, 6.0, 8.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.125, -19.22607421875, -18.3271484375, -17.42822265625, -16.529296875, -15.63037109375, -14.7314453125, -13.83251953125, -12.93359375, -12.03466796875, -11.1357421875, -10.23681640625, -9.337890625, -8.43896484375, -7.5400390625, -6.64111328125, -5.7421875, -4.84326171875, -3.9443359375, -3.04541015625, -2.146484375, -1.24755859375, -0.3486328125, 0.55029296875, 1.44921875, 2.34814453125, 3.2470703125, 4.14599609375, 5.044921875, 5.94384765625, 6.8427734375, 7.74169921875, 8.640625, 9.53955078125, 10.4384765625, 11.33740234375, 12.236328125, 13.13525390625, 14.0341796875, 14.93310546875, 15.83203125, 16.73095703125, 17.6298828125, 18.52880859375, 19.427734375, 20.32666015625, 21.2255859375, 22.12451171875, 23.0234375, 23.92236328125, 24.8212890625, 25.72021484375, 26.619140625, 27.51806640625, 28.4169921875, 29.31591796875, 30.21484375, 31.11376953125, 32.0126953125, 32.91162109375, 33.810546875, 34.70947265625, 35.6083984375, 36.50732421875, 37.40625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 5.0, 5.0, 17.0, 30.0, 71.0, 115.0, 392.0, 193.0, 97.0, 42.0, 16.0, 11.0, 3.0, 5.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-757.6083984375, -736.9835205078125, -716.3585815429688, -695.7337036132812, -675.1087646484375, -654.48388671875, -633.8590087890625, -613.234130859375, -592.6091918945312, -571.9843139648438, -551.359375, -530.7344970703125, -510.1095886230469, -489.48468017578125, -468.85980224609375, -448.2348937988281, -427.6099853515625, -406.9850769042969, -386.36016845703125, -365.73529052734375, -345.1103820800781, -324.4854736328125, -303.860595703125, -283.2356872558594, -262.61077880859375, -241.98587036132812, -221.36097717285156, -200.736083984375, -180.11117553710938, -159.48626708984375, -138.8613739013672, -118.23648071289062, -97.61163330078125, -76.98673248291016, -56.36183166503906, -35.73693084716797, -15.112030029296875, 5.512870788574219, 26.137771606445312, 46.762664794921875, 67.3875732421875, 88.0124740600586, 108.63737487792969, 129.26226806640625, 149.88717651367188, 170.5120849609375, 191.13697814941406, 211.76187133789062, 232.38677978515625, 253.01168823242188, 273.6365966796875, 294.261474609375, 314.8863830566406, 335.51129150390625, 356.13616943359375, 376.7610778808594, 397.385986328125, 418.0108947753906, 438.63580322265625, 459.26068115234375, 479.8855895996094, 500.510498046875, 521.1353759765625, 541.76025390625, 562.3851928710938]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 3.0, 7.0, 3.0, 5.0, 7.0, 10.0, 12.0, 9.0, 13.0, 16.0, 12.0, 18.0, 16.0, 30.0, 30.0, 32.0, 28.0, 35.0, 55.0, 65.0, 95.0, 100.0, 61.0, 33.0, 30.0, 31.0, 32.0, 31.0, 26.0, 20.0, 21.0, 22.0, 13.0, 9.0, 7.0, 11.0, 6.0, 9.0, 6.0, 9.0, 7.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-369.95526123046875, -358.2567138671875, -346.5581359863281, -334.8595886230469, -323.1610107421875, -311.46246337890625, -299.763916015625, -288.06536865234375, -276.3667907714844, -264.6682434082031, -252.96966552734375, -241.2711181640625, -229.5725555419922, -217.87399291992188, -206.17544555664062, -194.4768829345703, -182.7783203125, -171.0797576904297, -159.38119506835938, -147.68264770507812, -135.9840850830078, -124.2855224609375, -112.58696746826172, -100.88841247558594, -89.18984985351562, -77.49128723144531, -65.79273223876953, -54.094173431396484, -42.39561462402344, -30.69705581665039, -18.998497009277344, -7.2999420166015625, 4.39862060546875, 16.097179412841797, 27.795738220214844, 39.49429702758789, 51.19285583496094, 62.891414642333984, 74.58997344970703, 86.28852844238281, 97.98709106445312, 109.68565368652344, 121.38420867919922, 133.082763671875, 144.7813262939453, 156.47988891601562, 168.17843627929688, 179.8769989013672, 191.5755615234375, 203.2741241455078, 214.97268676757812, 226.67123413085938, 238.3697967529297, 250.068359375, 261.76690673828125, 273.4654541015625, 285.1640319824219, 296.8625793457031, 308.5611572265625, 320.25970458984375, 331.958251953125, 343.6568298339844, 355.3553771972656, 367.053955078125, 378.75250244140625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 2.0, 11.0, 8.0, 15.0, 20.0, 22.0, 54.0, 70.0, 86.0, 107.0, 197.0, 300.0, 408.0, 744.0, 1280.0, 2338.0, 4668.0, 10641.0, 27352.0, 84758.0, 327629.0, 1313770.0, 1754206.0, 486563.0, 118230.0, 35122.0, 13036.0, 5713.0, 2792.0, 1574.0, 959.0, 519.0, 366.0, 225.0, 164.0, 95.0, 75.0, 42.0, 29.0, 28.0, 19.0, 9.0, 10.0, 7.0, 6.0, 5.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-24.375, -23.639404296875, -22.90380859375, -22.168212890625, -21.4326171875, -20.697021484375, -19.96142578125, -19.225830078125, -18.490234375, -17.754638671875, -17.01904296875, -16.283447265625, -15.5478515625, -14.812255859375, -14.07666015625, -13.341064453125, -12.60546875, -11.869873046875, -11.13427734375, -10.398681640625, -9.6630859375, -8.927490234375, -8.19189453125, -7.456298828125, -6.720703125, -5.985107421875, -5.24951171875, -4.513916015625, -3.7783203125, -3.042724609375, -2.30712890625, -1.571533203125, -0.8359375, -0.100341796875, 0.63525390625, 1.370849609375, 2.1064453125, 2.842041015625, 3.57763671875, 4.313232421875, 5.048828125, 5.784423828125, 6.52001953125, 7.255615234375, 7.9912109375, 8.726806640625, 9.46240234375, 10.197998046875, 10.93359375, 11.669189453125, 12.40478515625, 13.140380859375, 13.8759765625, 14.611572265625, 15.34716796875, 16.082763671875, 16.818359375, 17.553955078125, 18.28955078125, 19.025146484375, 19.7607421875, 20.496337890625, 21.23193359375, 21.967529296875, 22.703125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 2.0, 5.0, 6.0, 10.0, 8.0, 12.0, 13.0, 15.0, 24.0, 32.0, 25.0, 34.0, 39.0, 49.0, 39.0, 57.0, 39.0, 38.0, 51.0, 43.0, 49.0, 44.0, 52.0, 54.0, 36.0, 31.0, 18.0, 29.0, 28.0, 28.0, 15.0, 15.0, 24.0, 4.0, 4.0, 8.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-24.875, -24.06884765625, -23.2626953125, -22.45654296875, -21.650390625, -20.84423828125, -20.0380859375, -19.23193359375, -18.42578125, -17.61962890625, -16.8134765625, -16.00732421875, -15.201171875, -14.39501953125, -13.5888671875, -12.78271484375, -11.9765625, -11.17041015625, -10.3642578125, -9.55810546875, -8.751953125, -7.94580078125, -7.1396484375, -6.33349609375, -5.52734375, -4.72119140625, -3.9150390625, -3.10888671875, -2.302734375, -1.49658203125, -0.6904296875, 0.11572265625, 0.921875, 1.72802734375, 2.5341796875, 3.34033203125, 4.146484375, 4.95263671875, 5.7587890625, 6.56494140625, 7.37109375, 8.17724609375, 8.9833984375, 9.78955078125, 10.595703125, 11.40185546875, 12.2080078125, 13.01416015625, 13.8203125, 14.62646484375, 15.4326171875, 16.23876953125, 17.044921875, 17.85107421875, 18.6572265625, 19.46337890625, 20.26953125, 21.07568359375, 21.8818359375, 22.68798828125, 23.494140625, 24.30029296875, 25.1064453125, 25.91259765625, 26.71875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 6.0, 16.0, 13.0, 23.0, 27.0, 33.0, 63.0, 114.0, 225.0, 528.0, 1635.0, 5941.0, 35908.0, 817598.0, 3223632.0, 93236.0, 11065.0, 2675.0, 858.0, 308.0, 155.0, 73.0, 45.0, 32.0, 14.0, 14.0, 8.0, 8.0, 9.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-79.8125, -77.478515625, -75.14453125, -72.810546875, -70.4765625, -68.142578125, -65.80859375, -63.474609375, -61.140625, -58.806640625, -56.47265625, -54.138671875, -51.8046875, -49.470703125, -47.13671875, -44.802734375, -42.46875, -40.134765625, -37.80078125, -35.466796875, -33.1328125, -30.798828125, -28.46484375, -26.130859375, -23.796875, -21.462890625, -19.12890625, -16.794921875, -14.4609375, -12.126953125, -9.79296875, -7.458984375, -5.125, -2.791015625, -0.45703125, 1.876953125, 4.2109375, 6.544921875, 8.87890625, 11.212890625, 13.546875, 15.880859375, 18.21484375, 20.548828125, 22.8828125, 25.216796875, 27.55078125, 29.884765625, 32.21875, 34.552734375, 36.88671875, 39.220703125, 41.5546875, 43.888671875, 46.22265625, 48.556640625, 50.890625, 53.224609375, 55.55859375, 57.892578125, 60.2265625, 62.560546875, 64.89453125, 67.228515625, 69.5625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 8.0, 7.0, 18.0, 20.0, 32.0, 32.0, 50.0, 64.0, 128.0, 181.0, 262.0, 450.0, 596.0, 663.0, 546.0, 350.0, 201.0, 143.0, 91.0, 74.0, 46.0, 26.0, 26.0, 8.0, 5.0, 5.0, 10.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-62.0, -60.287109375, -58.57421875, -56.861328125, -55.1484375, -53.435546875, -51.72265625, -50.009765625, -48.296875, -46.583984375, -44.87109375, -43.158203125, -41.4453125, -39.732421875, -38.01953125, -36.306640625, -34.59375, -32.880859375, -31.16796875, -29.455078125, -27.7421875, -26.029296875, -24.31640625, -22.603515625, -20.890625, -19.177734375, -17.46484375, -15.751953125, -14.0390625, -12.326171875, -10.61328125, -8.900390625, -7.1875, -5.474609375, -3.76171875, -2.048828125, -0.3359375, 1.376953125, 3.08984375, 4.802734375, 6.515625, 8.228515625, 9.94140625, 11.654296875, 13.3671875, 15.080078125, 16.79296875, 18.505859375, 20.21875, 21.931640625, 23.64453125, 25.357421875, 27.0703125, 28.783203125, 30.49609375, 32.208984375, 33.921875, 35.634765625, 37.34765625, 39.060546875, 40.7734375, 42.486328125, 44.19921875, 45.912109375, 47.625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 6.0, 9.0, 11.0, 28.0, 45.0, 145.0, 279.0, 240.0, 146.0, 61.0, 14.0, 17.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-567.9182739257812, -543.019775390625, -518.1212768554688, -493.2228088378906, -468.3243103027344, -443.4258117675781, -418.52734375, -393.62884521484375, -368.7303466796875, -343.83184814453125, -318.933349609375, -294.0348815917969, -269.1363830566406, -244.23788452148438, -219.3394012451172, -194.44091796875, -169.54241943359375, -144.6439208984375, -119.74543762207031, -94.8469467163086, -69.94845581054688, -45.049964904785156, -20.151473999023438, 4.74700927734375, 29.6455078125, 54.54399871826172, 79.44248962402344, 104.34098052978516, 129.23947143554688, 154.13796997070312, 179.0364532470703, 203.9349365234375, 228.83349609375, 253.73199462890625, 278.6304931640625, 303.5289611816406, 328.4274597167969, 353.3259582519531, 378.22442626953125, 403.1229248046875, 428.02142333984375, 452.919921875, 477.81842041015625, 502.7168884277344, 527.6153564453125, 552.5138549804688, 577.412353515625, 602.3108520507812, 627.2093505859375, 652.1078491210938, 677.00634765625, 701.9048461914062, 726.8033447265625, 751.7017822265625, 776.6002807617188, 801.498779296875, 826.3972778320312, 851.2957763671875, 876.1942749023438, 901.0927734375, 925.9912109375, 950.8897094726562, 975.7882080078125, 1000.6867065429688, 1025.585205078125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 6.0, 10.0, 8.0, 13.0, 11.0, 14.0, 14.0, 23.0, 28.0, 29.0, 39.0, 41.0, 49.0, 65.0, 40.0, 72.0, 63.0, 79.0, 47.0, 46.0, 55.0, 53.0, 35.0, 26.0, 20.0, 21.0, 20.0, 20.0, 12.0, 13.0, 6.0, 6.0, 5.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-333.4386901855469, -324.39263916015625, -315.34661865234375, -306.3005676269531, -297.2545471191406, -288.20849609375, -279.1624755859375, -270.1164245605469, -261.07037353515625, -252.0243377685547, -242.97830200195312, -233.93226623535156, -224.88623046875, -215.84017944335938, -206.7941436767578, -197.74810791015625, -188.70208740234375, -179.6560516357422, -170.61001586914062, -161.56398010253906, -152.5179443359375, -143.47189331054688, -134.4258575439453, -125.37982177734375, -116.33378601074219, -107.28775024414062, -98.24171447753906, -89.19567108154297, -80.1496353149414, -71.10359954833984, -62.057559967041016, -53.01152038574219, -43.96551513671875, -34.91947937011719, -25.87343978881836, -16.827402114868164, -7.781364440917969, 1.2646713256835938, 10.310710906982422, 19.35675048828125, 28.402786254882812, 37.448822021484375, 46.4948616027832, 55.54090118408203, 64.5869369506836, 73.63297271728516, 82.67901611328125, 91.72505187988281, 100.77108764648438, 109.81712341308594, 118.8631591796875, 127.9092025756836, 136.95523071289062, 146.00128173828125, 155.0473175048828, 164.09335327148438, 173.13938903808594, 182.1854248046875, 191.23146057128906, 200.27749633789062, 209.32354736328125, 218.36956787109375, 227.41561889648438, 236.46165466308594, 245.5076904296875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 9.0, 6.0, 17.0, 13.0, 19.0, 46.0, 45.0, 89.0, 96.0, 146.0, 234.0, 352.0, 554.0, 951.0, 1643.0, 2985.0, 5808.0, 12425.0, 28890.0, 76342.0, 235419.0, 415647.0, 167766.0, 56291.0, 21992.0, 9875.0, 4682.0, 2526.0, 1376.0, 831.0, 537.0, 334.0, 211.0, 112.0, 89.0, 56.0, 44.0, 28.0, 20.0, 8.0, 7.0, 14.0, 8.0, 2.0, 5.0, 1.0, 2.0, 3.0, 3.0, 3.0], "bins": [-34.59375, -33.615234375, -32.63671875, -31.658203125, -30.6796875, -29.701171875, -28.72265625, -27.744140625, -26.765625, -25.787109375, -24.80859375, -23.830078125, -22.8515625, -21.873046875, -20.89453125, -19.916015625, -18.9375, -17.958984375, -16.98046875, -16.001953125, -15.0234375, -14.044921875, -13.06640625, -12.087890625, -11.109375, -10.130859375, -9.15234375, -8.173828125, -7.1953125, -6.216796875, -5.23828125, -4.259765625, -3.28125, -2.302734375, -1.32421875, -0.345703125, 0.6328125, 1.611328125, 2.58984375, 3.568359375, 4.546875, 5.525390625, 6.50390625, 7.482421875, 8.4609375, 9.439453125, 10.41796875, 11.396484375, 12.375, 13.353515625, 14.33203125, 15.310546875, 16.2890625, 17.267578125, 18.24609375, 19.224609375, 20.203125, 21.181640625, 22.16015625, 23.138671875, 24.1171875, 25.095703125, 26.07421875, 27.052734375, 28.03125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 3.0, 7.0, 13.0, 8.0, 11.0, 9.0, 15.0, 15.0, 27.0, 33.0, 31.0, 30.0, 31.0, 31.0, 30.0, 42.0, 51.0, 53.0, 46.0, 65.0, 38.0, 53.0, 41.0, 38.0, 40.0, 27.0, 34.0, 29.0, 25.0, 23.0, 19.0, 18.0, 11.0, 12.0, 5.0, 5.0, 10.0, 7.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-25.609375, -24.807373046875, -24.00537109375, -23.203369140625, -22.4013671875, -21.599365234375, -20.79736328125, -19.995361328125, -19.193359375, -18.391357421875, -17.58935546875, -16.787353515625, -15.9853515625, -15.183349609375, -14.38134765625, -13.579345703125, -12.77734375, -11.975341796875, -11.17333984375, -10.371337890625, -9.5693359375, -8.767333984375, -7.96533203125, -7.163330078125, -6.361328125, -5.559326171875, -4.75732421875, -3.955322265625, -3.1533203125, -2.351318359375, -1.54931640625, -0.747314453125, 0.0546875, 0.856689453125, 1.65869140625, 2.460693359375, 3.2626953125, 4.064697265625, 4.86669921875, 5.668701171875, 6.470703125, 7.272705078125, 8.07470703125, 8.876708984375, 9.6787109375, 10.480712890625, 11.28271484375, 12.084716796875, 12.88671875, 13.688720703125, 14.49072265625, 15.292724609375, 16.0947265625, 16.896728515625, 17.69873046875, 18.500732421875, 19.302734375, 20.104736328125, 20.90673828125, 21.708740234375, 22.5107421875, 23.312744140625, 24.11474609375, 24.916748046875, 25.71875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 8.0, 8.0, 11.0, 11.0, 8.0, 15.0, 21.0, 33.0, 55.0, 65.0, 99.0, 150.0, 247.0, 380.0, 638.0, 1185.0, 2620.0, 7874.0, 32622.0, 244733.0, 685406.0, 54002.0, 11361.0, 3568.0, 1433.0, 757.0, 441.0, 268.0, 154.0, 108.0, 69.0, 56.0, 41.0, 21.0, 29.0, 19.0, 12.0, 8.0, 11.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-68.8125, -66.90869140625, -65.0048828125, -63.10107421875, -61.197265625, -59.29345703125, -57.3896484375, -55.48583984375, -53.58203125, -51.67822265625, -49.7744140625, -47.87060546875, -45.966796875, -44.06298828125, -42.1591796875, -40.25537109375, -38.3515625, -36.44775390625, -34.5439453125, -32.64013671875, -30.736328125, -28.83251953125, -26.9287109375, -25.02490234375, -23.12109375, -21.21728515625, -19.3134765625, -17.40966796875, -15.505859375, -13.60205078125, -11.6982421875, -9.79443359375, -7.890625, -5.98681640625, -4.0830078125, -2.17919921875, -0.275390625, 1.62841796875, 3.5322265625, 5.43603515625, 7.33984375, 9.24365234375, 11.1474609375, 13.05126953125, 14.955078125, 16.85888671875, 18.7626953125, 20.66650390625, 22.5703125, 24.47412109375, 26.3779296875, 28.28173828125, 30.185546875, 32.08935546875, 33.9931640625, 35.89697265625, 37.80078125, 39.70458984375, 41.6083984375, 43.51220703125, 45.416015625, 47.31982421875, 49.2236328125, 51.12744140625, 53.03125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 4.0, 9.0, 10.0, 11.0, 8.0, 10.0, 15.0, 20.0, 23.0, 28.0, 31.0, 32.0, 47.0, 66.0, 62.0, 59.0, 51.0, 70.0, 62.0, 54.0, 43.0, 39.0, 52.0, 35.0, 37.0, 23.0, 22.0, 27.0, 11.0, 6.0, 6.0, 5.0, 2.0, 4.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.9375, -119.314453125, -115.69140625, -112.068359375, -108.4453125, -104.822265625, -101.19921875, -97.576171875, -93.953125, -90.330078125, -86.70703125, -83.083984375, -79.4609375, -75.837890625, -72.21484375, -68.591796875, -64.96875, -61.345703125, -57.72265625, -54.099609375, -50.4765625, -46.853515625, -43.23046875, -39.607421875, -35.984375, -32.361328125, -28.73828125, -25.115234375, -21.4921875, -17.869140625, -14.24609375, -10.623046875, -7.0, -3.376953125, 0.24609375, 3.869140625, 7.4921875, 11.115234375, 14.73828125, 18.361328125, 21.984375, 25.607421875, 29.23046875, 32.853515625, 36.4765625, 40.099609375, 43.72265625, 47.345703125, 50.96875, 54.591796875, 58.21484375, 61.837890625, 65.4609375, 69.083984375, 72.70703125, 76.330078125, 79.953125, 83.576171875, 87.19921875, 90.822265625, 94.4453125, 98.068359375, 101.69140625, 105.314453125, 108.9375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 2.0, 6.0, 4.0, 5.0, 13.0, 18.0, 20.0, 17.0, 29.0, 58.0, 77.0, 117.0, 159.0, 253.0, 459.0, 810.0, 1485.0, 3573.0, 8813.0, 25907.0, 98260.0, 663532.0, 180406.0, 41784.0, 13063.0, 5013.0, 2167.0, 996.0, 593.0, 339.0, 196.0, 128.0, 63.0, 63.0, 43.0, 28.0, 20.0, 13.0, 6.0, 5.0, 6.0, 5.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6796875, -10.2471923828125, -9.814697265625, -9.3822021484375, -8.94970703125, -8.5172119140625, -8.084716796875, -7.6522216796875, -7.2197265625, -6.7872314453125, -6.354736328125, -5.9222412109375, -5.48974609375, -5.0572509765625, -4.624755859375, -4.1922607421875, -3.759765625, -3.3272705078125, -2.894775390625, -2.4622802734375, -2.02978515625, -1.5972900390625, -1.164794921875, -0.7322998046875, -0.2998046875, 0.1326904296875, 0.565185546875, 0.9976806640625, 1.43017578125, 1.8626708984375, 2.295166015625, 2.7276611328125, 3.16015625, 3.5926513671875, 4.025146484375, 4.4576416015625, 4.89013671875, 5.3226318359375, 5.755126953125, 6.1876220703125, 6.6201171875, 7.0526123046875, 7.485107421875, 7.9176025390625, 8.35009765625, 8.7825927734375, 9.215087890625, 9.6475830078125, 10.080078125, 10.5125732421875, 10.945068359375, 11.3775634765625, 11.81005859375, 12.2425537109375, 12.675048828125, 13.1075439453125, 13.5400390625, 13.9725341796875, 14.405029296875, 14.8375244140625, 15.27001953125, 15.7025146484375, 16.135009765625, 16.5675048828125, 17.0]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 8.0, 6.0, 15.0, 21.0, 17.0, 39.0, 56.0, 87.0, 104.0, 116.0, 136.0, 98.0, 77.0, 57.0, 39.0, 23.0, 26.0, 14.0, 13.0, 6.0, 6.0, 4.0, 4.0, 5.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004940032958984375, -0.004775106906890869, -0.004610180854797363, -0.004445254802703857, -0.0042803287506103516, -0.004115402698516846, -0.00395047664642334, -0.003785550594329834, -0.003620624542236328, -0.0034556984901428223, -0.0032907724380493164, -0.0031258463859558105, -0.0029609203338623047, -0.002795994281768799, -0.002631068229675293, -0.002466142177581787, -0.0023012161254882812, -0.0021362900733947754, -0.0019713640213012695, -0.0018064379692077637, -0.0016415119171142578, -0.001476585865020752, -0.001311659812927246, -0.0011467337608337402, -0.0009818077087402344, -0.0008168816566467285, -0.0006519556045532227, -0.0004870295524597168, -0.00032210350036621094, -0.00015717744827270508, 7.748603820800781e-06, 0.00017267465591430664, 0.0003376007080078125, 0.0005025267601013184, 0.0006674528121948242, 0.0008323788642883301, 0.000997304916381836, 0.0011622309684753418, 0.0013271570205688477, 0.0014920830726623535, 0.0016570091247558594, 0.0018219351768493652, 0.001986861228942871, 0.002151787281036377, 0.002316713333129883, 0.0024816393852233887, 0.0026465654373168945, 0.0028114914894104004, 0.0029764175415039062, 0.003141343593597412, 0.003306269645690918, 0.003471195697784424, 0.0036361217498779297, 0.0038010478019714355, 0.003965973854064941, 0.004130899906158447, 0.004295825958251953, 0.004460752010345459, 0.004625678062438965, 0.004790604114532471, 0.0049555301666259766, 0.005120456218719482, 0.005285382270812988, 0.005450308322906494, 0.005615234375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 17.0, 17.0, 27.0, 48.0, 68.0, 147.0, 263.0, 524.0, 1263.0, 3460.0, 14173.0, 88847.0, 781318.0, 132574.0, 18674.0, 4418.0, 1443.0, 590.0, 307.0, 176.0, 76.0, 44.0, 25.0, 15.0, 14.0, 7.0, 8.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.90625, -25.1982421875, -24.490234375, -23.7822265625, -23.07421875, -22.3662109375, -21.658203125, -20.9501953125, -20.2421875, -19.5341796875, -18.826171875, -18.1181640625, -17.41015625, -16.7021484375, -15.994140625, -15.2861328125, -14.578125, -13.8701171875, -13.162109375, -12.4541015625, -11.74609375, -11.0380859375, -10.330078125, -9.6220703125, -8.9140625, -8.2060546875, -7.498046875, -6.7900390625, -6.08203125, -5.3740234375, -4.666015625, -3.9580078125, -3.25, -2.5419921875, -1.833984375, -1.1259765625, -0.41796875, 0.2900390625, 0.998046875, 1.7060546875, 2.4140625, 3.1220703125, 3.830078125, 4.5380859375, 5.24609375, 5.9541015625, 6.662109375, 7.3701171875, 8.078125, 8.7861328125, 9.494140625, 10.2021484375, 10.91015625, 11.6181640625, 12.326171875, 13.0341796875, 13.7421875, 14.4501953125, 15.158203125, 15.8662109375, 16.57421875, 17.2822265625, 17.990234375, 18.6982421875, 19.40625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 8.0, 7.0, 7.0, 9.0, 8.0, 6.0, 6.0, 17.0, 13.0, 26.0, 25.0, 38.0, 44.0, 57.0, 70.0, 71.0, 67.0, 68.0, 60.0, 65.0, 63.0, 59.0, 35.0, 31.0, 30.0, 21.0, 13.0, 19.0, 5.0, 9.0, 5.0, 7.0, 4.0, 2.0, 7.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0], "bins": [-15.5, -15.02783203125, -14.5556640625, -14.08349609375, -13.611328125, -13.13916015625, -12.6669921875, -12.19482421875, -11.72265625, -11.25048828125, -10.7783203125, -10.30615234375, -9.833984375, -9.36181640625, -8.8896484375, -8.41748046875, -7.9453125, -7.47314453125, -7.0009765625, -6.52880859375, -6.056640625, -5.58447265625, -5.1123046875, -4.64013671875, -4.16796875, -3.69580078125, -3.2236328125, -2.75146484375, -2.279296875, -1.80712890625, -1.3349609375, -0.86279296875, -0.390625, 0.08154296875, 0.5537109375, 1.02587890625, 1.498046875, 1.97021484375, 2.4423828125, 2.91455078125, 3.38671875, 3.85888671875, 4.3310546875, 4.80322265625, 5.275390625, 5.74755859375, 6.2197265625, 6.69189453125, 7.1640625, 7.63623046875, 8.1083984375, 8.58056640625, 9.052734375, 9.52490234375, 9.9970703125, 10.46923828125, 10.94140625, 11.41357421875, 11.8857421875, 12.35791015625, 12.830078125, 13.30224609375, 13.7744140625, 14.24658203125, 14.71875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 14.0, 38.0, 83.0, 171.0, 403.0, 142.0, 72.0, 38.0, 18.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-531.448974609375, -510.46685791015625, -489.4847412109375, -468.50262451171875, -447.5205078125, -426.53839111328125, -405.5562744140625, -384.57415771484375, -363.592041015625, -342.60992431640625, -321.6278076171875, -300.64569091796875, -279.66357421875, -258.68145751953125, -237.69935607910156, -216.7172393798828, -195.73513793945312, -174.75302124023438, -153.77090454101562, -132.78878784179688, -111.80667877197266, -90.8245620727539, -69.84245300292969, -48.86033630371094, -27.878219604492188, -6.89610481262207, 14.086009979248047, 35.06812286376953, 56.05023956298828, 77.03235626220703, 98.01446533203125, 118.99658203125, 139.97869873046875, 160.9608154296875, 181.94293212890625, 202.925048828125, 223.90716552734375, 244.8892822265625, 265.87139892578125, 286.853515625, 307.83563232421875, 328.8177490234375, 349.79986572265625, 370.781982421875, 391.76409912109375, 412.7462158203125, 433.72833251953125, 454.71044921875, 475.6925354003906, 496.6746520996094, 517.65673828125, 538.6388549804688, 559.6209716796875, 580.6030883789062, 601.585205078125, 622.5673217773438, 643.5494384765625, 664.5315551757812, 685.513671875, 706.4957885742188, 727.4779052734375, 748.4600219726562, 769.442138671875, 790.4242553710938, 811.4063720703125]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 6.0, 1.0, 1.0, 2.0, 3.0, 5.0, 9.0, 9.0, 6.0, 14.0, 17.0, 23.0, 22.0, 16.0, 21.0, 31.0, 30.0, 31.0, 39.0, 75.0, 114.0, 126.0, 80.0, 37.0, 29.0, 26.0, 32.0, 32.0, 22.0, 28.0, 11.0, 16.0, 17.0, 18.0, 12.0, 5.0, 7.0, 6.0, 4.0, 5.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-333.53582763671875, -322.13092041015625, -310.7260437011719, -299.3211364746094, -287.9162292480469, -276.5113525390625, -265.1064453125, -253.7015380859375, -242.29664611816406, -230.89175415039062, -219.48684692382812, -208.0819549560547, -196.67706298828125, -185.27215576171875, -173.8672637939453, -162.46237182617188, -151.05746459960938, -139.65257263183594, -128.24766540527344, -116.8427734375, -105.43787384033203, -94.03297424316406, -82.62808227539062, -71.22318267822266, -59.81828308105469, -48.41338348388672, -37.008487701416016, -25.603591918945312, -14.198692321777344, -2.793792724609375, 8.611099243164062, 20.01599884033203, 31.420928955078125, 42.825828552246094, 54.2307243347168, 65.6356201171875, 77.04051971435547, 88.44541931152344, 99.85031127929688, 111.25521087646484, 122.66011047363281, 134.06500244140625, 145.46990966796875, 156.8748016357422, 168.27969360351562, 179.68460083007812, 191.08949279785156, 202.494384765625, 213.8992919921875, 225.30418395996094, 236.70909118652344, 248.11398315429688, 259.5188903808594, 270.92376708984375, 282.32867431640625, 293.73358154296875, 305.13848876953125, 316.54339599609375, 327.9482727050781, 339.3531799316406, 350.7580871582031, 362.1629638671875, 373.56787109375, 384.9727783203125, 396.3776550292969]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 9.0, 3.0, 6.0, 6.0, 12.0, 13.0, 15.0, 21.0, 43.0, 42.0, 71.0, 109.0, 132.0, 211.0, 324.0, 542.0, 901.0, 1557.0, 2799.0, 5423.0, 11198.0, 25480.0, 67754.0, 213729.0, 723713.0, 1698196.0, 992253.0, 298934.0, 89550.0, 32065.0, 14008.0, 6681.0, 3480.0, 1932.0, 1133.0, 681.0, 441.0, 265.0, 201.0, 101.0, 86.0, 64.0, 34.0, 24.0, 17.0, 11.0, 6.0, 7.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.875, -31.8359375, -30.796875, -29.7578125, -28.71875, -27.6796875, -26.640625, -25.6015625, -24.5625, -23.5234375, -22.484375, -21.4453125, -20.40625, -19.3671875, -18.328125, -17.2890625, -16.25, -15.2109375, -14.171875, -13.1328125, -12.09375, -11.0546875, -10.015625, -8.9765625, -7.9375, -6.8984375, -5.859375, -4.8203125, -3.78125, -2.7421875, -1.703125, -0.6640625, 0.375, 1.4140625, 2.453125, 3.4921875, 4.53125, 5.5703125, 6.609375, 7.6484375, 8.6875, 9.7265625, 10.765625, 11.8046875, 12.84375, 13.8828125, 14.921875, 15.9609375, 17.0, 18.0390625, 19.078125, 20.1171875, 21.15625, 22.1953125, 23.234375, 24.2734375, 25.3125, 26.3515625, 27.390625, 28.4296875, 29.46875, 30.5078125, 31.546875, 32.5859375, 33.625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 6.0, 11.0, 17.0, 15.0, 17.0, 19.0, 20.0, 18.0, 19.0, 41.0, 34.0, 43.0, 36.0, 33.0, 48.0, 43.0, 58.0, 35.0, 48.0, 52.0, 43.0, 35.0, 43.0, 29.0, 36.0, 25.0, 25.0, 35.0, 14.0, 14.0, 16.0, 13.0, 11.0, 9.0, 5.0, 7.0, 3.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-22.21875, -21.488037109375, -20.75732421875, -20.026611328125, -19.2958984375, -18.565185546875, -17.83447265625, -17.103759765625, -16.373046875, -15.642333984375, -14.91162109375, -14.180908203125, -13.4501953125, -12.719482421875, -11.98876953125, -11.258056640625, -10.52734375, -9.796630859375, -9.06591796875, -8.335205078125, -7.6044921875, -6.873779296875, -6.14306640625, -5.412353515625, -4.681640625, -3.950927734375, -3.22021484375, -2.489501953125, -1.7587890625, -1.028076171875, -0.29736328125, 0.433349609375, 1.1640625, 1.894775390625, 2.62548828125, 3.356201171875, 4.0869140625, 4.817626953125, 5.54833984375, 6.279052734375, 7.009765625, 7.740478515625, 8.47119140625, 9.201904296875, 9.9326171875, 10.663330078125, 11.39404296875, 12.124755859375, 12.85546875, 13.586181640625, 14.31689453125, 15.047607421875, 15.7783203125, 16.509033203125, 17.23974609375, 17.970458984375, 18.701171875, 19.431884765625, 20.16259765625, 20.893310546875, 21.6240234375, 22.354736328125, 23.08544921875, 23.816162109375, 24.546875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 9.0, 7.0, 10.0, 8.0, 14.0, 35.0, 24.0, 72.0, 75.0, 147.0, 273.0, 555.0, 1291.0, 4425.0, 44818.0, 3850953.0, 278055.0, 9910.0, 2044.0, 710.0, 371.0, 196.0, 110.0, 52.0, 40.0, 25.0, 22.0, 14.0, 10.0, 3.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-166.875, -161.44140625, -156.0078125, -150.57421875, -145.140625, -139.70703125, -134.2734375, -128.83984375, -123.40625, -117.97265625, -112.5390625, -107.10546875, -101.671875, -96.23828125, -90.8046875, -85.37109375, -79.9375, -74.50390625, -69.0703125, -63.63671875, -58.203125, -52.76953125, -47.3359375, -41.90234375, -36.46875, -31.03515625, -25.6015625, -20.16796875, -14.734375, -9.30078125, -3.8671875, 1.56640625, 7.0, 12.43359375, 17.8671875, 23.30078125, 28.734375, 34.16796875, 39.6015625, 45.03515625, 50.46875, 55.90234375, 61.3359375, 66.76953125, 72.203125, 77.63671875, 83.0703125, 88.50390625, 93.9375, 99.37109375, 104.8046875, 110.23828125, 115.671875, 121.10546875, 126.5390625, 131.97265625, 137.40625, 142.83984375, 148.2734375, 153.70703125, 159.140625, 164.57421875, 170.0078125, 175.44140625, 180.875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 12.0, 11.0, 9.0, 10.0, 17.0, 26.0, 29.0, 41.0, 56.0, 76.0, 83.0, 127.0, 175.0, 217.0, 273.0, 394.0, 450.0, 491.0, 355.0, 320.0, 187.0, 173.0, 132.0, 108.0, 66.0, 58.0, 26.0, 36.0, 30.0, 23.0, 12.0, 11.0, 8.0, 7.0, 6.0, 3.0, 3.0, 3.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-75.625, -73.4677734375, -71.310546875, -69.1533203125, -66.99609375, -64.8388671875, -62.681640625, -60.5244140625, -58.3671875, -56.2099609375, -54.052734375, -51.8955078125, -49.73828125, -47.5810546875, -45.423828125, -43.2666015625, -41.109375, -38.9521484375, -36.794921875, -34.6376953125, -32.48046875, -30.3232421875, -28.166015625, -26.0087890625, -23.8515625, -21.6943359375, -19.537109375, -17.3798828125, -15.22265625, -13.0654296875, -10.908203125, -8.7509765625, -6.59375, -4.4365234375, -2.279296875, -0.1220703125, 2.03515625, 4.1923828125, 6.349609375, 8.5068359375, 10.6640625, 12.8212890625, 14.978515625, 17.1357421875, 19.29296875, 21.4501953125, 23.607421875, 25.7646484375, 27.921875, 30.0791015625, 32.236328125, 34.3935546875, 36.55078125, 38.7080078125, 40.865234375, 43.0224609375, 45.1796875, 47.3369140625, 49.494140625, 51.6513671875, 53.80859375, 55.9658203125, 58.123046875, 60.2802734375, 62.4375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 5.0, 13.0, 18.0, 25.0, 58.0, 73.0, 114.0, 154.0, 155.0, 126.0, 98.0, 54.0, 41.0, 14.0, 13.0, 12.0, 6.0, 3.0, 2.0, 1.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-676.854736328125, -648.73486328125, -620.614990234375, -592.4951782226562, -564.3753051757812, -536.2554321289062, -508.13555908203125, -480.0157165527344, -451.8958740234375, -423.7760009765625, -395.6561584472656, -367.5362854003906, -339.41644287109375, -311.29656982421875, -283.17669677734375, -255.05685424804688, -226.93698120117188, -198.81712341308594, -170.697265625, -142.577392578125, -114.4575424194336, -86.33767700195312, -58.21781921386719, -30.09796142578125, -1.9781036376953125, 26.141756057739258, 54.26161575317383, 82.38147735595703, 110.50133514404297, 138.62120056152344, 166.74105834960938, 194.8609161376953, 222.98077392578125, 251.1006317138672, 279.2204895019531, 307.3403625488281, 335.460205078125, 363.580078125, 391.699951171875, 419.8197937011719, 447.93963623046875, 476.05950927734375, 504.1793518066406, 532.2991943359375, 560.4190673828125, 588.5389404296875, 616.6588134765625, 644.7786865234375, 672.8985595703125, 701.0184326171875, 729.1383056640625, 757.2581176757812, 785.3779907226562, 813.4978637695312, 841.6177368164062, 869.737548828125, 897.857421875, 925.977294921875, 954.09716796875, 982.2169799804688, 1010.3368530273438, 1038.456787109375, 1066.5765380859375, 1094.6964111328125, 1122.8162841796875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 1.0, 0.0, 6.0, 3.0, 3.0, 8.0, 5.0, 14.0, 16.0, 14.0, 22.0, 23.0, 30.0, 31.0, 28.0, 29.0, 43.0, 49.0, 55.0, 45.0, 44.0, 53.0, 56.0, 63.0, 42.0, 34.0, 35.0, 35.0, 28.0, 28.0, 26.0, 12.0, 25.0, 14.0, 26.0, 6.0, 6.0, 9.0, 6.0, 8.0, 9.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-422.91131591796875, -408.9854431152344, -395.0595703125, -381.13372802734375, -367.2078552246094, -353.281982421875, -339.3561096191406, -325.43023681640625, -311.50439453125, -297.5785217285156, -283.65264892578125, -269.726806640625, -255.80093383789062, -241.87506103515625, -227.94918823242188, -214.0233154296875, -200.09744262695312, -186.17156982421875, -172.24571228027344, -158.31983947753906, -144.39398193359375, -130.46810913085938, -116.542236328125, -102.61637115478516, -88.69050598144531, -74.76464080810547, -60.83877182006836, -46.91290283203125, -32.987037658691406, -19.061172485351562, -5.1352996826171875, 8.790565490722656, 22.7164306640625, 36.642295837402344, 50.56816482543945, 64.49403381347656, 78.4198989868164, 92.34576416015625, 106.27163696289062, 120.19750213623047, 134.1233673095703, 148.0492401123047, 161.97509765625, 175.90097045898438, 189.82684326171875, 203.75270080566406, 217.67857360839844, 231.60443115234375, 245.53030395507812, 259.4561767578125, 273.3820495605469, 287.30792236328125, 301.2337646484375, 315.1596374511719, 329.08551025390625, 343.0113830566406, 356.937255859375, 370.8631286621094, 384.78900146484375, 398.71484375, 412.6407165527344, 426.56658935546875, 440.4924621582031, 454.4183349609375, 468.34417724609375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 9.0, 5.0, 9.0, 20.0, 32.0, 38.0, 47.0, 85.0, 132.0, 197.0, 318.0, 511.0, 797.0, 1446.0, 2760.0, 5751.0, 12864.0, 33309.0, 103946.0, 403788.0, 340734.0, 89456.0, 29500.0, 11497.0, 5245.0, 2577.0, 1340.0, 793.0, 514.0, 304.0, 203.0, 101.0, 82.0, 48.0, 23.0, 30.0, 17.0, 10.0, 7.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.46875, -35.2900390625, -34.111328125, -32.9326171875, -31.75390625, -30.5751953125, -29.396484375, -28.2177734375, -27.0390625, -25.8603515625, -24.681640625, -23.5029296875, -22.32421875, -21.1455078125, -19.966796875, -18.7880859375, -17.609375, -16.4306640625, -15.251953125, -14.0732421875, -12.89453125, -11.7158203125, -10.537109375, -9.3583984375, -8.1796875, -7.0009765625, -5.822265625, -4.6435546875, -3.46484375, -2.2861328125, -1.107421875, 0.0712890625, 1.25, 2.4287109375, 3.607421875, 4.7861328125, 5.96484375, 7.1435546875, 8.322265625, 9.5009765625, 10.6796875, 11.8583984375, 13.037109375, 14.2158203125, 15.39453125, 16.5732421875, 17.751953125, 18.9306640625, 20.109375, 21.2880859375, 22.466796875, 23.6455078125, 24.82421875, 26.0029296875, 27.181640625, 28.3603515625, 29.5390625, 30.7177734375, 31.896484375, 33.0751953125, 34.25390625, 35.4326171875, 36.611328125, 37.7900390625, 38.96875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 4.0, 3.0, 3.0, 5.0, 9.0, 8.0, 9.0, 20.0, 22.0, 33.0, 34.0, 42.0, 58.0, 59.0, 65.0, 78.0, 80.0, 93.0, 63.0, 54.0, 34.0, 48.0, 41.0, 26.0, 30.0, 23.0, 10.0, 13.0, 8.0, 13.0, 3.0, 3.0, 8.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.75, -52.09765625, -50.4453125, -48.79296875, -47.140625, -45.48828125, -43.8359375, -42.18359375, -40.53125, -38.87890625, -37.2265625, -35.57421875, -33.921875, -32.26953125, -30.6171875, -28.96484375, -27.3125, -25.66015625, -24.0078125, -22.35546875, -20.703125, -19.05078125, -17.3984375, -15.74609375, -14.09375, -12.44140625, -10.7890625, -9.13671875, -7.484375, -5.83203125, -4.1796875, -2.52734375, -0.875, 0.77734375, 2.4296875, 4.08203125, 5.734375, 7.38671875, 9.0390625, 10.69140625, 12.34375, 13.99609375, 15.6484375, 17.30078125, 18.953125, 20.60546875, 22.2578125, 23.91015625, 25.5625, 27.21484375, 28.8671875, 30.51953125, 32.171875, 33.82421875, 35.4765625, 37.12890625, 38.78125, 40.43359375, 42.0859375, 43.73828125, 45.390625, 47.04296875, 48.6953125, 50.34765625, 52.0]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 8.0, 8.0, 10.0, 13.0, 16.0, 14.0, 27.0, 39.0, 60.0, 87.0, 136.0, 231.0, 413.0, 791.0, 1671.0, 4271.0, 16690.0, 115035.0, 821510.0, 68568.0, 12372.0, 3538.0, 1420.0, 634.0, 371.0, 212.0, 125.0, 81.0, 44.0, 35.0, 32.0, 23.0, 16.0, 11.0, 10.0, 7.0, 5.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-55.0625, -53.41357421875, -51.7646484375, -50.11572265625, -48.466796875, -46.81787109375, -45.1689453125, -43.52001953125, -41.87109375, -40.22216796875, -38.5732421875, -36.92431640625, -35.275390625, -33.62646484375, -31.9775390625, -30.32861328125, -28.6796875, -27.03076171875, -25.3818359375, -23.73291015625, -22.083984375, -20.43505859375, -18.7861328125, -17.13720703125, -15.48828125, -13.83935546875, -12.1904296875, -10.54150390625, -8.892578125, -7.24365234375, -5.5947265625, -3.94580078125, -2.296875, -0.64794921875, 1.0009765625, 2.64990234375, 4.298828125, 5.94775390625, 7.5966796875, 9.24560546875, 10.89453125, 12.54345703125, 14.1923828125, 15.84130859375, 17.490234375, 19.13916015625, 20.7880859375, 22.43701171875, 24.0859375, 25.73486328125, 27.3837890625, 29.03271484375, 30.681640625, 32.33056640625, 33.9794921875, 35.62841796875, 37.27734375, 38.92626953125, 40.5751953125, 42.22412109375, 43.873046875, 45.52197265625, 47.1708984375, 48.81982421875, 50.46875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 7.0, 5.0, 9.0, 10.0, 13.0, 9.0, 12.0, 19.0, 20.0, 29.0, 26.0, 39.0, 63.0, 61.0, 79.0, 80.0, 75.0, 68.0, 66.0, 50.0, 50.0, 34.0, 34.0, 21.0, 17.0, 15.0, 21.0, 13.0, 11.0, 9.0, 17.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.875, -123.970703125, -119.06640625, -114.162109375, -109.2578125, -104.353515625, -99.44921875, -94.544921875, -89.640625, -84.736328125, -79.83203125, -74.927734375, -70.0234375, -65.119140625, -60.21484375, -55.310546875, -50.40625, -45.501953125, -40.59765625, -35.693359375, -30.7890625, -25.884765625, -20.98046875, -16.076171875, -11.171875, -6.267578125, -1.36328125, 3.541015625, 8.4453125, 13.349609375, 18.25390625, 23.158203125, 28.0625, 32.966796875, 37.87109375, 42.775390625, 47.6796875, 52.583984375, 57.48828125, 62.392578125, 67.296875, 72.201171875, 77.10546875, 82.009765625, 86.9140625, 91.818359375, 96.72265625, 101.626953125, 106.53125, 111.435546875, 116.33984375, 121.244140625, 126.1484375, 131.052734375, 135.95703125, 140.861328125, 145.765625, 150.669921875, 155.57421875, 160.478515625, 165.3828125, 170.287109375, 175.19140625, 180.095703125, 185.0]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 7.0, 12.0, 10.0, 13.0, 23.0, 22.0, 28.0, 51.0, 63.0, 112.0, 185.0, 282.0, 544.0, 1158.0, 2551.0, 7019.0, 23580.0, 132927.0, 805627.0, 53278.0, 13157.0, 4313.0, 1769.0, 782.0, 387.0, 228.0, 143.0, 92.0, 54.0, 39.0, 18.0, 16.0, 15.0, 8.0, 10.0, 10.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.3671875, -10.03564453125, -9.7041015625, -9.37255859375, -9.041015625, -8.70947265625, -8.3779296875, -8.04638671875, -7.71484375, -7.38330078125, -7.0517578125, -6.72021484375, -6.388671875, -6.05712890625, -5.7255859375, -5.39404296875, -5.0625, -4.73095703125, -4.3994140625, -4.06787109375, -3.736328125, -3.40478515625, -3.0732421875, -2.74169921875, -2.41015625, -2.07861328125, -1.7470703125, -1.41552734375, -1.083984375, -0.75244140625, -0.4208984375, -0.08935546875, 0.2421875, 0.57373046875, 0.9052734375, 1.23681640625, 1.568359375, 1.89990234375, 2.2314453125, 2.56298828125, 2.89453125, 3.22607421875, 3.5576171875, 3.88916015625, 4.220703125, 4.55224609375, 4.8837890625, 5.21533203125, 5.546875, 5.87841796875, 6.2099609375, 6.54150390625, 6.873046875, 7.20458984375, 7.5361328125, 7.86767578125, 8.19921875, 8.53076171875, 8.8623046875, 9.19384765625, 9.525390625, 9.85693359375, 10.1884765625, 10.52001953125, 10.8515625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 4.0, 8.0, 8.0, 9.0, 9.0, 12.0, 6.0, 14.0, 14.0, 29.0, 25.0, 34.0, 44.0, 64.0, 86.0, 87.0, 100.0, 86.0, 72.0, 65.0, 35.0, 32.0, 24.0, 16.0, 22.0, 11.0, 14.0, 9.0, 8.0, 2.0, 7.0, 3.0, 6.0, 5.0, 1.0, 4.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00231170654296875, -0.0022357702255249023, -0.0021598339080810547, -0.002083897590637207, -0.0020079612731933594, -0.0019320249557495117, -0.001856088638305664, -0.0017801523208618164, -0.0017042160034179688, -0.001628279685974121, -0.0015523433685302734, -0.0014764070510864258, -0.0014004707336425781, -0.0013245344161987305, -0.0012485980987548828, -0.0011726617813110352, -0.0010967254638671875, -0.0010207891464233398, -0.0009448528289794922, -0.0008689165115356445, -0.0007929801940917969, -0.0007170438766479492, -0.0006411075592041016, -0.0005651712417602539, -0.0004892349243164062, -0.0004132986068725586, -0.00033736228942871094, -0.0002614259719848633, -0.00018548965454101562, -0.00010955333709716797, -3.361701965332031e-05, 4.2319297790527344e-05, 0.000118255615234375, 0.00019419193267822266, 0.0002701282501220703, 0.00034606456756591797, 0.0004220008850097656, 0.0004979372024536133, 0.0005738735198974609, 0.0006498098373413086, 0.0007257461547851562, 0.0008016824722290039, 0.0008776187896728516, 0.0009535551071166992, 0.0010294914245605469, 0.0011054277420043945, 0.0011813640594482422, 0.0012573003768920898, 0.0013332366943359375, 0.0014091730117797852, 0.0014851093292236328, 0.0015610456466674805, 0.0016369819641113281, 0.0017129182815551758, 0.0017888545989990234, 0.001864790916442871, 0.0019407272338867188, 0.0020166635513305664, 0.002092599868774414, 0.0021685361862182617, 0.0022444725036621094, 0.002320408821105957, 0.0023963451385498047, 0.0024722814559936523, 0.0025482177734375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 13.0, 14.0, 25.0, 39.0, 83.0, 168.0, 396.0, 1049.0, 3295.0, 13561.0, 94612.0, 873580.0, 49261.0, 8744.0, 2315.0, 758.0, 289.0, 152.0, 85.0, 33.0, 19.0, 19.0, 8.0, 10.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.359375, -17.7919921875, -17.224609375, -16.6572265625, -16.08984375, -15.5224609375, -14.955078125, -14.3876953125, -13.8203125, -13.2529296875, -12.685546875, -12.1181640625, -11.55078125, -10.9833984375, -10.416015625, -9.8486328125, -9.28125, -8.7138671875, -8.146484375, -7.5791015625, -7.01171875, -6.4443359375, -5.876953125, -5.3095703125, -4.7421875, -4.1748046875, -3.607421875, -3.0400390625, -2.47265625, -1.9052734375, -1.337890625, -0.7705078125, -0.203125, 0.3642578125, 0.931640625, 1.4990234375, 2.06640625, 2.6337890625, 3.201171875, 3.7685546875, 4.3359375, 4.9033203125, 5.470703125, 6.0380859375, 6.60546875, 7.1728515625, 7.740234375, 8.3076171875, 8.875, 9.4423828125, 10.009765625, 10.5771484375, 11.14453125, 11.7119140625, 12.279296875, 12.8466796875, 13.4140625, 13.9814453125, 14.548828125, 15.1162109375, 15.68359375, 16.2509765625, 16.818359375, 17.3857421875, 17.953125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 3.0, 7.0, 4.0, 2.0, 8.0, 7.0, 7.0, 11.0, 14.0, 11.0, 14.0, 18.0, 41.0, 39.0, 80.0, 72.0, 106.0, 108.0, 96.0, 88.0, 64.0, 38.0, 38.0, 30.0, 22.0, 17.0, 8.0, 6.0, 12.0, 7.0, 8.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.7734375, -12.324951171875, -11.87646484375, -11.427978515625, -10.9794921875, -10.531005859375, -10.08251953125, -9.634033203125, -9.185546875, -8.737060546875, -8.28857421875, -7.840087890625, -7.3916015625, -6.943115234375, -6.49462890625, -6.046142578125, -5.59765625, -5.149169921875, -4.70068359375, -4.252197265625, -3.8037109375, -3.355224609375, -2.90673828125, -2.458251953125, -2.009765625, -1.561279296875, -1.11279296875, -0.664306640625, -0.2158203125, 0.232666015625, 0.68115234375, 1.129638671875, 1.578125, 2.026611328125, 2.47509765625, 2.923583984375, 3.3720703125, 3.820556640625, 4.26904296875, 4.717529296875, 5.166015625, 5.614501953125, 6.06298828125, 6.511474609375, 6.9599609375, 7.408447265625, 7.85693359375, 8.305419921875, 8.75390625, 9.202392578125, 9.65087890625, 10.099365234375, 10.5478515625, 10.996337890625, 11.44482421875, 11.893310546875, 12.341796875, 12.790283203125, 13.23876953125, 13.687255859375, 14.1357421875, 14.584228515625, 15.03271484375, 15.481201171875, 15.9296875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 7.0, 7.0, 13.0, 25.0, 47.0, 91.0, 353.0, 227.0, 68.0, 50.0, 40.0, 21.0, 23.0, 10.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-204.28170776367188, -190.4730682373047, -176.66441345214844, -162.85577392578125, -149.047119140625, -135.2384796142578, -121.42984008789062, -107.6211929321289, -93.81254577636719, -80.00389862060547, -66.19525146484375, -52.38661193847656, -38.577964782714844, -24.769317626953125, -10.960678100585938, 2.8479690551757812, 16.6566162109375, 30.465261459350586, 44.27390670776367, 58.082550048828125, 71.89119720458984, 85.69984436035156, 99.50848388671875, 113.31713104248047, 127.12577819824219, 140.93441772460938, 154.74307250976562, 168.5517120361328, 182.3603515625, 196.16900634765625, 209.97764587402344, 223.78628540039062, 237.59490966796875, 251.40354919433594, 265.2121887207031, 279.0208435058594, 292.8294982910156, 306.63812255859375, 320.44677734375, 334.25543212890625, 348.0640869140625, 361.87274169921875, 375.6813659667969, 389.4900207519531, 403.2986755371094, 417.1072998046875, 430.91595458984375, 444.724609375, 458.5332336425781, 472.3418884277344, 486.1505126953125, 499.95916748046875, 513.767822265625, 527.5764770507812, 541.3851318359375, 555.1937255859375, 569.0023803710938, 582.81103515625, 596.6196899414062, 610.4283447265625, 624.2369384765625, 638.0455932617188, 651.854248046875, 665.6629028320312, 679.4715576171875]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 3.0, 5.0, 3.0, 5.0, 6.0, 7.0, 12.0, 7.0, 20.0, 18.0, 24.0, 19.0, 21.0, 20.0, 37.0, 57.0, 154.0, 142.0, 136.0, 79.0, 33.0, 25.0, 25.0, 16.0, 21.0, 14.0, 16.0, 12.0, 17.0, 9.0, 3.0, 7.0, 9.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-413.6853942871094, -400.5760498046875, -387.4667053222656, -374.35736083984375, -361.24798583984375, -348.1386413574219, -335.029296875, -321.9199523925781, -308.81060791015625, -295.7012634277344, -282.5919189453125, -269.4825439453125, -256.3731994628906, -243.26385498046875, -230.15451049804688, -217.045166015625, -203.935791015625, -190.82644653320312, -177.7170867919922, -164.6077423095703, -151.49838256835938, -138.3890380859375, -125.27969360351562, -112.17034149169922, -99.06098937988281, -85.9516372680664, -72.84228515625, -59.732940673828125, -46.62358856201172, -33.51423645019531, -20.404891967773438, -7.295539855957031, 5.81378173828125, 18.923131942749023, 32.0324821472168, 45.14183044433594, 58.251182556152344, 71.36053466796875, 84.46987915039062, 97.57923126220703, 110.68858337402344, 123.79793548583984, 136.90728759765625, 150.01663208007812, 163.1259765625, 176.23533630371094, 189.3446807861328, 202.45404052734375, 215.56338500976562, 228.6727294921875, 241.78208923339844, 254.8914337158203, 268.00079345703125, 281.1101379394531, 294.219482421875, 307.3288269042969, 320.43817138671875, 333.5475158691406, 346.6568603515625, 359.7662353515625, 372.8755798339844, 385.98492431640625, 399.0942687988281, 412.20361328125, 425.31298828125]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 13.0, 13.0, 13.0, 25.0, 21.0, 30.0, 47.0, 47.0, 50.0, 89.0, 257.0, 113.0, 57.0, 44.0, 41.0, 28.0, 21.0, 16.0, 24.0, 15.0, 8.0, 6.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.03125, -40.25732421875, -38.4833984375, -36.70947265625, -34.935546875, -33.16162109375, -31.3876953125, -29.61376953125, -27.83984375, -26.06591796875, -24.2919921875, -22.51806640625, -20.744140625, -18.97021484375, -17.1962890625, -15.42236328125, -13.6484375, -11.87451171875, -10.1005859375, -8.32666015625, -6.552734375, -4.77880859375, -3.0048828125, -1.23095703125, 0.54296875, 2.31689453125, 4.0908203125, 5.86474609375, 7.638671875, 9.41259765625, 11.1865234375, 12.96044921875, 14.734375, 16.50830078125, 18.2822265625, 20.05615234375, 21.830078125, 23.60400390625, 25.3779296875, 27.15185546875, 28.92578125, 30.69970703125, 32.4736328125, 34.24755859375, 36.021484375, 37.79541015625, 39.5693359375, 41.34326171875, 43.1171875, 44.89111328125, 46.6650390625, 48.43896484375, 50.212890625, 51.98681640625, 53.7607421875, 55.53466796875, 57.30859375, 59.08251953125, 60.8564453125, 62.63037109375, 64.404296875, 66.17822265625, 67.9521484375, 69.72607421875, 71.5]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 6.0, 6.0, 3.0, 4.0, 5.0, 4.0, 5.0, 5.0, 6.0, 13.0, 13.0, 21.0, 41.0, 68.0, 77.0, 143.0, 295.0, 552.0, 1470.0, 3972.0, 14510.0, 8246618.0, 107654.0, 8369.0, 2630.0, 1018.0, 444.0, 214.0, 135.0, 72.0, 47.0, 35.0, 18.0, 22.0, 9.0, 10.0, 14.0, 16.0, 8.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0], "bins": [-173.3074951171875, -167.49594116210938, -161.6844024658203, -155.8728485107422, -150.06130981445312, -144.249755859375, -138.43820190429688, -132.62664794921875, -126.81510925292969, -121.0035629272461, -115.1920166015625, -109.38046264648438, -103.56891632080078, -97.75736999511719, -91.94581604003906, -86.13426971435547, -80.32272338867188, -74.51117706298828, -68.69963073730469, -62.88807678222656, -57.07653045654297, -51.264984130859375, -45.453433990478516, -39.641883850097656, -33.83033752441406, -28.018789291381836, -22.20724105834961, -16.395692825317383, -10.584144592285156, -4.77259635925293, 1.0389518737792969, 6.850502014160156, 12.662063598632812, 18.47361183166504, 24.285160064697266, 30.096708297729492, 35.90825653076172, 41.71980285644531, 47.53135299682617, 53.34290313720703, 59.154449462890625, 64.96599578857422, 70.77754211425781, 76.58909606933594, 82.40064239501953, 88.21218872070312, 94.02374267578125, 99.83528900146484, 105.64683532714844, 111.45838165283203, 117.26992797851562, 123.08148193359375, 128.89303588867188, 134.70457458496094, 140.51612854003906, 146.32766723632812, 152.13922119140625, 157.95077514648438, 163.76231384277344, 169.57386779785156, 175.38540649414062, 181.19696044921875, 187.00851440429688, 192.820068359375, 198.63160705566406]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 7.0, 1.0, 1.0, 3.0, 6.0, 7.0, 0.0, 5.0, 4.0, 6.0, 7.0, 2.0, 0.0, 5.0, 4.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-320.3318786621094, -310.34954833984375, -300.3671875, -290.3848571777344, -280.40252685546875, -270.4201965332031, -260.4378662109375, -250.45550537109375, -240.47317504882812, -230.4908447265625, -220.5084991455078, -210.52615356445312, -200.5438232421875, -190.56149291992188, -180.5791473388672, -170.5968017578125, -160.61447143554688, -150.63214111328125, -140.64979553222656, -130.66744995117188, -120.68511962890625, -110.7027816772461, -100.72044372558594, -90.73810577392578, -80.75576782226562, -70.77342987060547, -60.79109191894531, -50.808753967285156, -40.826416015625, -30.844078063964844, -20.861740112304688, -10.879402160644531, -0.8970947265625, 9.085243225097656, 19.067581176757812, 29.04991912841797, 39.032257080078125, 49.01459503173828, 58.99693298339844, 68.9792709350586, 78.96160888671875, 88.9439468383789, 98.92628479003906, 108.90862274169922, 118.89096069335938, 128.873291015625, 138.8556365966797, 148.83798217773438, 158.8203125, 168.80264282226562, 178.7849884033203, 188.767333984375, 198.74966430664062, 208.73199462890625, 218.71434020996094, 228.69668579101562, 238.67901611328125, 248.66134643554688, 258.6436767578125, 268.62603759765625, 278.6083679199219, 288.5906982421875, 298.57305908203125, 308.5553894042969, 318.5377197265625]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 8.0, 9.0, 7.0, 4.0, 18.0, 23.0, 30.0, 35.0, 43.0, 59.0, 66.0, 65.0, 59.0, 48.0, 89.0, 80.0, 72.0, 64.0, 52.0, 46.0, 32.0, 27.0, 18.0, 11.0, 12.0, 8.0, 6.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.375, -46.8662109375, -45.357421875, -43.8486328125, -42.33984375, -40.8310546875, -39.322265625, -37.8134765625, -36.3046875, -34.7958984375, -33.287109375, -31.7783203125, -30.26953125, -28.7607421875, -27.251953125, -25.7431640625, -24.234375, -22.7255859375, -21.216796875, -19.7080078125, -18.19921875, -16.6904296875, -15.181640625, -13.6728515625, -12.1640625, -10.6552734375, -9.146484375, -7.6376953125, -6.12890625, -4.6201171875, -3.111328125, -1.6025390625, -0.09375, 1.4150390625, 2.923828125, 4.4326171875, 5.94140625, 7.4501953125, 8.958984375, 10.4677734375, 11.9765625, 13.4853515625, 14.994140625, 16.5029296875, 18.01171875, 19.5205078125, 21.029296875, 22.5380859375, 24.046875, 25.5556640625, 27.064453125, 28.5732421875, 30.08203125, 31.5908203125, 33.099609375, 34.6083984375, 36.1171875, 37.6259765625, 39.134765625, 40.6435546875, 42.15234375, 43.6611328125, 45.169921875, 46.6787109375, 48.1875]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 3.0, 10.0, 15.0, 17.0, 44.0, 54.0, 66.0, 173.0, 342.0, 964.0, 2944.0, 11643.0, 54689.0, 244808.0, 165094.0, 32766.0, 7368.0, 1992.0, 710.0, 275.0, 122.0, 66.0, 33.0, 26.0, 28.0, 4.0, 4.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-351.25, -341.16796875, -331.0859375, -321.00390625, -310.921875, -300.83984375, -290.7578125, -280.67578125, -270.59375, -260.51171875, -250.4296875, -240.34765625, -230.265625, -220.18359375, -210.1015625, -200.01953125, -189.9375, -179.85546875, -169.7734375, -159.69140625, -149.609375, -139.52734375, -129.4453125, -119.36328125, -109.28125, -99.19921875, -89.1171875, -79.03515625, -68.953125, -58.87109375, -48.7890625, -38.70703125, -28.625, -18.54296875, -8.4609375, 1.62109375, 11.703125, 21.78515625, 31.8671875, 41.94921875, 52.03125, 62.11328125, 72.1953125, 82.27734375, 92.359375, 102.44140625, 112.5234375, 122.60546875, 132.6875, 142.76953125, 152.8515625, 162.93359375, 173.015625, 183.09765625, 193.1796875, 203.26171875, 213.34375, 223.42578125, 233.5078125, 243.58984375, 253.671875, 263.75390625, 273.8359375, 283.91796875, 294.0]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 6.0, 8.0, 9.0, 16.0, 8.0, 18.0, 14.0, 16.0, 37.0, 25.0, 36.0, 34.0, 48.0, 50.0, 39.0, 53.0, 68.0, 49.0, 54.0, 60.0, 40.0, 44.0, 44.0, 39.0, 36.0, 28.0, 18.0, 21.0, 16.0, 13.0, 9.0, 7.0, 5.0, 6.0, 3.0, 7.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.59375, -27.64453125, -26.6953125, -25.74609375, -24.796875, -23.84765625, -22.8984375, -21.94921875, -21.0, -20.05078125, -19.1015625, -18.15234375, -17.203125, -16.25390625, -15.3046875, -14.35546875, -13.40625, -12.45703125, -11.5078125, -10.55859375, -9.609375, -8.66015625, -7.7109375, -6.76171875, -5.8125, -4.86328125, -3.9140625, -2.96484375, -2.015625, -1.06640625, -0.1171875, 0.83203125, 1.78125, 2.73046875, 3.6796875, 4.62890625, 5.578125, 6.52734375, 7.4765625, 8.42578125, 9.375, 10.32421875, 11.2734375, 12.22265625, 13.171875, 14.12109375, 15.0703125, 16.01953125, 16.96875, 17.91796875, 18.8671875, 19.81640625, 20.765625, 21.71484375, 22.6640625, 23.61328125, 24.5625, 25.51171875, 26.4609375, 27.41015625, 28.359375, 29.30859375, 30.2578125, 31.20703125, 32.15625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 5.0, 7.0, 11.0, 12.0, 15.0, 27.0, 69.0, 92.0, 117.0, 63.0, 18.0, 12.0, 7.0, 6.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-358.60430908203125, -348.249267578125, -337.89422607421875, -327.5391845703125, -317.18414306640625, -306.8290710449219, -296.4740295410156, -286.1189880371094, -275.7639465332031, -265.4089050292969, -255.05386352539062, -244.6988067626953, -234.34376525878906, -223.9887237548828, -213.6336669921875, -203.27862548828125, -192.923583984375, -182.56854248046875, -172.2135009765625, -161.8584442138672, -151.50340270996094, -141.1483612060547, -130.79330444335938, -120.43826293945312, -110.08322143554688, -99.72817993164062, -89.37313079833984, -79.01808166503906, -68.66304016113281, -58.3079948425293, -47.95294952392578, -37.597900390625, -27.24285888671875, -16.887813568115234, -6.532768249511719, 3.822277069091797, 14.177322387695312, 24.532367706298828, 34.887413024902344, 45.242462158203125, 55.597503662109375, 65.95254516601562, 76.3075942993164, 86.66264343261719, 97.01768493652344, 107.37272644042969, 117.72777557373047, 128.08282470703125, 138.4378662109375, 148.79290771484375, 159.14794921875, 169.5030059814453, 179.85804748535156, 190.2130889892578, 200.56814575195312, 210.92318725585938, 221.27822875976562, 231.63327026367188, 241.98831176757812, 252.34336853027344, 262.69842529296875, 273.053466796875, 283.40850830078125, 293.7635498046875, 304.11859130859375]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 4.0, 9.0, 5.0, 6.0, 11.0, 17.0, 30.0, 45.0, 81.0, 87.0, 69.0, 40.0, 23.0, 7.0, 5.0, 6.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-271.1093444824219, -264.0339660644531, -256.9585876464844, -249.8832244873047, -242.80784606933594, -235.7324676513672, -228.6571044921875, -221.58172607421875, -214.50634765625, -207.43096923828125, -200.3555908203125, -193.2802276611328, -186.20484924316406, -179.1294708251953, -172.05410766601562, -164.97872924804688, -157.90335083007812, -150.82797241210938, -143.75259399414062, -136.67723083496094, -129.6018524169922, -122.52647399902344, -115.45110321044922, -108.375732421875, -101.30035400390625, -94.2249755859375, -87.14960479736328, -80.07423400878906, -72.99885559082031, -65.92347717285156, -58.848106384277344, -51.77273178100586, -44.69734191894531, -37.62196731567383, -30.546592712402344, -23.47121810913086, -16.395843505859375, -9.32046890258789, -2.2450942993164062, 4.830280303955078, 11.905654907226562, 18.981029510498047, 26.05640411376953, 33.131778717041016, 40.2071533203125, 47.282527923583984, 54.35790252685547, 61.43327713012695, 68.50865173339844, 75.58403015136719, 82.6594009399414, 89.73477172851562, 96.81015014648438, 103.88552856445312, 110.96089935302734, 118.03627014160156, 125.11164855957031, 132.18702697753906, 139.26239013671875, 146.3377685546875, 153.41314697265625, 160.488525390625, 167.56390380859375, 174.63926696777344, 181.7146453857422]}, "eval/loss": 0.6976933479309082, "eval/wer": 0.12308607695358985, "eval/runtime": 636.3851, "eval/samples_per_second": 4.152, "eval/steps_per_second": 0.52} \ No newline at end of file