diff --git "a/wandb/run-20220303_074415-2c9ds5of/files/wandb-summary.json" "b/wandb/run-20220303_074415-2c9ds5of/files/wandb-summary.json" --- "a/wandb/run-20220303_074415-2c9ds5of/files/wandb-summary.json" +++ "b/wandb/run-20220303_074415-2c9ds5of/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.843, "train/learning_rate": 4.354136429608128e-06, "train/epoch": 1.0, "train/global_step": 1189, "_runtime": 6750, "_timestamp": 1646300206, "_step": 1191, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 217.0, 781.0, 18.0], "bins": [-1056.006591796875, -1039.0478515625, -1022.089111328125, -1005.13037109375, -988.1715698242188, -971.2128295898438, -954.2540893554688, -937.2953491210938, -920.3366088867188, -903.3778686523438, -886.4191284179688, -869.4603271484375, -852.5015869140625, -835.5428466796875, -818.5841064453125, -801.6253662109375, -784.6666259765625, -767.7078857421875, -750.7491455078125, -733.7904052734375, -716.8316040039062, -699.8728637695312, -682.9141235351562, -665.9553833007812, -648.99658203125, -632.037841796875, -615.0791015625, -598.120361328125, -581.1615600585938, -564.2028198242188, -547.2440795898438, -530.2853393554688, -513.32666015625, -496.367919921875, -479.4091491699219, -462.4504089355469, -445.4916687011719, -428.53289794921875, -411.57415771484375, -394.61541748046875, -377.6566467285156, -360.6979064941406, -343.7391357421875, -326.7803955078125, -309.8216552734375, -292.8629150390625, -275.9041442871094, -258.9454040527344, -241.98663330078125, -225.0278778076172, -208.0691375732422, -191.11038208007812, -174.15164184570312, -157.19288635253906, -140.234130859375, -123.27538299560547, -106.31664276123047, -89.35789489746094, -72.39913940429688, -55.440391540527344, -38.48164367675781, -21.52289581298828, -4.564140319824219, 12.394607543945312, 29.353355407714844]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 7.0, 9.0, 8.0, 10.0, 13.0, 13.0, 16.0, 18.0, 24.0, 20.0, 22.0, 34.0, 28.0, 28.0, 38.0, 38.0, 39.0, 42.0, 42.0, 36.0, 43.0, 41.0, 29.0, 45.0, 38.0, 34.0, 36.0, 33.0, 21.0, 30.0, 20.0, 23.0, 22.0, 14.0, 13.0, 13.0, 13.0, 11.0, 5.0, 3.0, 2.0, 3.0, 2.0, 5.0, 1.0, 4.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-114.42926025390625, -110.70561981201172, -106.98198699951172, -103.25834655761719, -99.53471374511719, -95.81107330322266, -92.08743286132812, -88.36380004882812, -84.6401596069336, -80.91651916503906, -77.19288635253906, -73.46924591064453, -69.74560546875, -66.02197265625, -62.29833221435547, -58.5746955871582, -54.85105895996094, -51.12742233276367, -47.403785705566406, -43.680145263671875, -39.95650863647461, -36.232872009277344, -32.50923156738281, -28.785594940185547, -25.06195831298828, -21.338321685791016, -17.614683151245117, -13.891045570373535, -10.167407989501953, -6.4437713623046875, -2.720132827758789, 1.0035057067871094, 4.727142333984375, 8.450779914855957, 12.174417495727539, 15.898055076599121, 19.621692657470703, 23.34532928466797, 27.068967819213867, 30.792606353759766, 34.51624298095703, 38.2398796081543, 41.96351623535156, 45.687156677246094, 49.41079330444336, 53.134429931640625, 56.858070373535156, 60.58170700073242, 64.30534362792969, 68.02898406982422, 71.75261688232422, 75.47625732421875, 79.19989013671875, 82.92353057861328, 86.64717102050781, 90.37080383300781, 94.09444427490234, 97.81808471679688, 101.54171752929688, 105.2653579711914, 108.98899841308594, 112.71263122558594, 116.43627166748047, 120.159912109375, 123.883544921875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 7.0, 15.0, 17.0, 24.0, 28.0, 30.0, 42.0, 38.0, 64.0, 59.0, 65.0, 83.0, 72.0, 57.0, 71.0, 69.0, 62.0, 47.0, 36.0, 33.0, 19.0, 27.0, 12.0, 7.0, 6.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.900390625, -3.80816650390625, -3.7159423828125, -3.62371826171875, -3.531494140625, -3.43927001953125, -3.3470458984375, -3.25482177734375, -3.16259765625, -3.07037353515625, -2.9781494140625, -2.88592529296875, -2.793701171875, -2.70147705078125, -2.6092529296875, -2.51702880859375, -2.4248046875, -2.33258056640625, -2.2403564453125, -2.14813232421875, -2.055908203125, -1.96368408203125, -1.8714599609375, -1.77923583984375, -1.68701171875, -1.59478759765625, -1.5025634765625, -1.41033935546875, -1.318115234375, -1.22589111328125, -1.1336669921875, -1.04144287109375, -0.94921875, -0.85699462890625, -0.7647705078125, -0.67254638671875, -0.580322265625, -0.48809814453125, -0.3958740234375, -0.30364990234375, -0.21142578125, -0.11920166015625, -0.0269775390625, 0.06524658203125, 0.157470703125, 0.24969482421875, 0.3419189453125, 0.43414306640625, 0.5263671875, 0.61859130859375, 0.7108154296875, 0.80303955078125, 0.895263671875, 0.98748779296875, 1.0797119140625, 1.17193603515625, 1.26416015625, 1.35638427734375, 1.4486083984375, 1.54083251953125, 1.633056640625, 1.72528076171875, 1.8175048828125, 1.90972900390625, 2.001953125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 7.0, 15.0, 12.0, 22.0, 28.0, 49.0, 86.0, 120.0, 207.0, 382.0, 700.0, 1239.0, 2570.0, 7192.0, 74633.0, 4046930.0, 48887.0, 6218.0, 2302.0, 1196.0, 614.0, 331.0, 205.0, 116.0, 80.0, 50.0, 25.0, 26.0, 15.0, 8.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0], "bins": [-33.5, -32.710693359375, -31.92138671875, -31.132080078125, -30.3427734375, -29.553466796875, -28.76416015625, -27.974853515625, -27.185546875, -26.396240234375, -25.60693359375, -24.817626953125, -24.0283203125, -23.239013671875, -22.44970703125, -21.660400390625, -20.87109375, -20.081787109375, -19.29248046875, -18.503173828125, -17.7138671875, -16.924560546875, -16.13525390625, -15.345947265625, -14.556640625, -13.767333984375, -12.97802734375, -12.188720703125, -11.3994140625, -10.610107421875, -9.82080078125, -9.031494140625, -8.2421875, -7.452880859375, -6.66357421875, -5.874267578125, -5.0849609375, -4.295654296875, -3.50634765625, -2.717041015625, -1.927734375, -1.138427734375, -0.34912109375, 0.440185546875, 1.2294921875, 2.018798828125, 2.80810546875, 3.597412109375, 4.38671875, 5.176025390625, 5.96533203125, 6.754638671875, 7.5439453125, 8.333251953125, 9.12255859375, 9.911865234375, 10.701171875, 11.490478515625, 12.27978515625, 13.069091796875, 13.8583984375, 14.647705078125, 15.43701171875, 16.226318359375, 17.015625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 7.0, 21.0, 33.0, 33.0, 84.0, 166.0, 389.0, 1046.0, 1220.0, 553.0, 259.0, 132.0, 59.0, 35.0, 21.0, 11.0, 9.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.0625, -23.517333984375, -22.97216796875, -22.427001953125, -21.8818359375, -21.336669921875, -20.79150390625, -20.246337890625, -19.701171875, -19.156005859375, -18.61083984375, -18.065673828125, -17.5205078125, -16.975341796875, -16.43017578125, -15.885009765625, -15.33984375, -14.794677734375, -14.24951171875, -13.704345703125, -13.1591796875, -12.614013671875, -12.06884765625, -11.523681640625, -10.978515625, -10.433349609375, -9.88818359375, -9.343017578125, -8.7978515625, -8.252685546875, -7.70751953125, -7.162353515625, -6.6171875, -6.072021484375, -5.52685546875, -4.981689453125, -4.4365234375, -3.891357421875, -3.34619140625, -2.801025390625, -2.255859375, -1.710693359375, -1.16552734375, -0.620361328125, -0.0751953125, 0.469970703125, 1.01513671875, 1.560302734375, 2.10546875, 2.650634765625, 3.19580078125, 3.740966796875, 4.2861328125, 4.831298828125, 5.37646484375, 5.921630859375, 6.466796875, 7.011962890625, 7.55712890625, 8.102294921875, 8.6474609375, 9.192626953125, 9.73779296875, 10.282958984375, 10.828125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 0.0, 2.0, 12.0, 22.0, 46.0, 98.0, 231.0, 652.0, 3396.0, 3978798.0, 208211.0, 2032.0, 479.0, 169.0, 70.0, 35.0, 13.0, 5.0, 3.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.65625, -46.84423828125, -45.0322265625, -43.22021484375, -41.408203125, -39.59619140625, -37.7841796875, -35.97216796875, -34.16015625, -32.34814453125, -30.5361328125, -28.72412109375, -26.912109375, -25.10009765625, -23.2880859375, -21.47607421875, -19.6640625, -17.85205078125, -16.0400390625, -14.22802734375, -12.416015625, -10.60400390625, -8.7919921875, -6.97998046875, -5.16796875, -3.35595703125, -1.5439453125, 0.26806640625, 2.080078125, 3.89208984375, 5.7041015625, 7.51611328125, 9.328125, 11.14013671875, 12.9521484375, 14.76416015625, 16.576171875, 18.38818359375, 20.2001953125, 22.01220703125, 23.82421875, 25.63623046875, 27.4482421875, 29.26025390625, 31.072265625, 32.88427734375, 34.6962890625, 36.50830078125, 38.3203125, 40.13232421875, 41.9443359375, 43.75634765625, 45.568359375, 47.38037109375, 49.1923828125, 51.00439453125, 52.81640625, 54.62841796875, 56.4404296875, 58.25244140625, 60.064453125, 61.87646484375, 63.6884765625, 65.50048828125, 67.3125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 49.0, 264.0, 437.0, 201.0, 46.0, 6.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-123.02286529541016, -120.75912475585938, -118.4953842163086, -116.23163604736328, -113.9678955078125, -111.70415496826172, -109.44041442871094, -107.17667388916016, -104.91293334960938, -102.6491928100586, -100.38545227050781, -98.1217041015625, -95.85796356201172, -93.59422302246094, -91.33048248291016, -89.06674194335938, -86.80299377441406, -84.53925323486328, -82.2755126953125, -80.01176452636719, -77.7480239868164, -75.48428344726562, -73.22054290771484, -70.95680236816406, -68.69305419921875, -66.42931365966797, -64.16557312011719, -61.90182876586914, -59.638084411621094, -57.37434387207031, -55.11060333251953, -52.84686279296875, -50.58312225341797, -48.31938171386719, -46.05563735961914, -43.79189682006836, -41.52815246582031, -39.26441192626953, -37.00067138671875, -34.73693084716797, -32.47318649291992, -30.209444046020508, -27.945701599121094, -25.681961059570312, -23.4182186126709, -21.154476165771484, -18.890735626220703, -16.62699317932129, -14.363250732421875, -12.099508285522461, -9.835766792297363, -7.572024822235107, -5.308282852172852, -3.0445404052734375, -0.7807989120483398, 1.4829425811767578, 3.746685028076172, 6.010426998138428, 8.274168968200684, 10.537910461425781, 12.801652908325195, 15.06539535522461, 17.32913589477539, 19.592878341674805, 21.85662078857422]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 6.0, 6.0, 9.0, 3.0, 6.0, 12.0, 11.0, 16.0, 22.0, 21.0, 25.0, 23.0, 34.0, 35.0, 43.0, 26.0, 35.0, 35.0, 38.0, 45.0, 43.0, 37.0, 59.0, 43.0, 36.0, 51.0, 36.0, 24.0, 33.0, 27.0, 22.0, 28.0, 24.0, 16.0, 14.0, 14.0, 7.0, 8.0, 7.0, 9.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-34.01847839355469, -33.0948600769043, -32.171241760253906, -31.24762535095215, -30.32400894165039, -29.400390625, -28.47677230834961, -27.55315589904785, -26.629539489746094, -25.705921173095703, -24.782304763793945, -23.858686447143555, -22.935070037841797, -22.011451721191406, -21.087833404541016, -20.164216995239258, -19.240598678588867, -18.316980361938477, -17.39336395263672, -16.469745635986328, -15.54612922668457, -14.62251091003418, -13.698893547058105, -12.775276184082031, -11.851658821105957, -10.928041458129883, -10.004424095153809, -9.080806732177734, -8.157188415527344, -7.233571529388428, -6.309953689575195, -5.386336326599121, -4.462718963623047, -3.5391016006469727, -2.6154839992523193, -1.691866397857666, -0.7682490348815918, 0.15536832809448242, 1.0789861679077148, 2.002603530883789, 2.9262208938598633, 3.8498382568359375, 4.773455619812012, 5.697073459625244, 6.620690822601318, 7.544308185577393, 8.467926025390625, 9.3915433883667, 10.315160751342773, 11.238778114318848, 12.162395477294922, 13.086013793945312, 14.00963020324707, 14.933248519897461, 15.856865882873535, 16.78048324584961, 17.7041015625, 18.62771987915039, 19.55133628845215, 20.47495460510254, 21.398571014404297, 22.322189331054688, 23.245807647705078, 24.169424057006836, 25.093040466308594]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 10.0, 6.0, 15.0, 21.0, 27.0, 21.0, 28.0, 36.0, 40.0, 55.0, 63.0, 54.0, 75.0, 86.0, 60.0, 52.0, 61.0, 65.0, 71.0, 28.0, 29.0, 30.0, 27.0, 13.0, 12.0, 4.0, 6.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.791015625, -3.70184326171875, -3.6126708984375, -3.52349853515625, -3.434326171875, -3.34515380859375, -3.2559814453125, -3.16680908203125, -3.07763671875, -2.98846435546875, -2.8992919921875, -2.81011962890625, -2.720947265625, -2.63177490234375, -2.5426025390625, -2.45343017578125, -2.3642578125, -2.27508544921875, -2.1859130859375, -2.09674072265625, -2.007568359375, -1.91839599609375, -1.8292236328125, -1.74005126953125, -1.65087890625, -1.56170654296875, -1.4725341796875, -1.38336181640625, -1.294189453125, -1.20501708984375, -1.1158447265625, -1.02667236328125, -0.9375, -0.84832763671875, -0.7591552734375, -0.66998291015625, -0.580810546875, -0.49163818359375, -0.4024658203125, -0.31329345703125, -0.22412109375, -0.13494873046875, -0.0457763671875, 0.04339599609375, 0.132568359375, 0.22174072265625, 0.3109130859375, 0.40008544921875, 0.4892578125, 0.57843017578125, 0.6676025390625, 0.75677490234375, 0.845947265625, 0.93511962890625, 1.0242919921875, 1.11346435546875, 1.20263671875, 1.29180908203125, 1.3809814453125, 1.47015380859375, 1.559326171875, 1.64849853515625, 1.7376708984375, 1.82684326171875, 1.916015625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 7.0, 5.0, 7.0, 6.0, 6.0, 7.0, 5.0, 13.0, 17.0, 17.0, 16.0, 39.0, 78.0, 116.0, 212.0, 420.0, 748.0, 1611.0, 3090.0, 6104.0, 12240.0, 27212.0, 64617.0, 171225.0, 427432.0, 200779.0, 73960.0, 30795.0, 14087.0, 6834.0, 3285.0, 1639.0, 866.0, 470.0, 223.0, 140.0, 65.0, 48.0, 27.0, 18.0, 15.0, 17.0, 7.0, 10.0, 4.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.0265960693359375, -0.02575373649597168, -0.02491140365600586, -0.02406907081604004, -0.02322673797607422, -0.0223844051361084, -0.021542072296142578, -0.020699739456176758, -0.019857406616210938, -0.019015073776245117, -0.018172740936279297, -0.017330408096313477, -0.016488075256347656, -0.015645742416381836, -0.014803409576416016, -0.013961076736450195, -0.013118743896484375, -0.012276411056518555, -0.011434078216552734, -0.010591745376586914, -0.009749412536621094, -0.008907079696655273, -0.008064746856689453, -0.007222414016723633, -0.0063800811767578125, -0.005537748336791992, -0.004695415496826172, -0.0038530826568603516, -0.0030107498168945312, -0.002168416976928711, -0.0013260841369628906, -0.0004837512969970703, 0.00035858154296875, 0.0012009143829345703, 0.0020432472229003906, 0.002885580062866211, 0.0037279129028320312, 0.0045702457427978516, 0.005412578582763672, 0.006254911422729492, 0.0070972442626953125, 0.007939577102661133, 0.008781909942626953, 0.009624242782592773, 0.010466575622558594, 0.011308908462524414, 0.012151241302490234, 0.012993574142456055, 0.013835906982421875, 0.014678239822387695, 0.015520572662353516, 0.016362905502319336, 0.017205238342285156, 0.018047571182250977, 0.018889904022216797, 0.019732236862182617, 0.020574569702148438, 0.021416902542114258, 0.022259235382080078, 0.0231015682220459, 0.02394390106201172, 0.02478623390197754, 0.02562856674194336, 0.02647089958190918, 0.027313232421875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 5.0, 4.0, 2.0, 1.0, 15.0, 13.0, 8.0, 11.0, 9.0, 16.0, 18.0, 20.0, 20.0, 30.0, 31.0, 42.0, 36.0, 36.0, 25.0, 41.0, 33.0, 40.0, 1067.0, 54.0, 44.0, 33.0, 30.0, 41.0, 35.0, 28.0, 27.0, 29.0, 29.0, 23.0, 14.0, 20.0, 16.0, 14.0, 12.0, 16.0, 4.0, 8.0, 8.0, 2.0, 10.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.36328125, -1.318939208984375, -1.27459716796875, -1.230255126953125, -1.1859130859375, -1.141571044921875, -1.09722900390625, -1.052886962890625, -1.008544921875, -0.964202880859375, -0.91986083984375, -0.875518798828125, -0.8311767578125, -0.786834716796875, -0.74249267578125, -0.698150634765625, -0.65380859375, -0.609466552734375, -0.56512451171875, -0.520782470703125, -0.4764404296875, -0.432098388671875, -0.38775634765625, -0.343414306640625, -0.299072265625, -0.254730224609375, -0.21038818359375, -0.166046142578125, -0.1217041015625, -0.077362060546875, -0.03302001953125, 0.011322021484375, 0.0556640625, 0.100006103515625, 0.14434814453125, 0.188690185546875, 0.2330322265625, 0.277374267578125, 0.32171630859375, 0.366058349609375, 0.410400390625, 0.454742431640625, 0.49908447265625, 0.543426513671875, 0.5877685546875, 0.632110595703125, 0.67645263671875, 0.720794677734375, 0.76513671875, 0.809478759765625, 0.85382080078125, 0.898162841796875, 0.9425048828125, 0.986846923828125, 1.03118896484375, 1.075531005859375, 1.119873046875, 1.164215087890625, 1.20855712890625, 1.252899169921875, 1.2972412109375, 1.341583251953125, 1.38592529296875, 1.430267333984375, 1.474609375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 7.0, 23.0, 35.0, 41.0, 54.0, 83.0, 139.0, 217.0, 378.0, 511.0, 747.0, 1248.0, 1904.0, 2893.0, 4715.0, 7578.0, 12278.0, 20482.0, 33846.0, 57472.0, 100595.0, 180120.0, 1291669.0, 160061.0, 90063.0, 51384.0, 30446.0, 18190.0, 11123.0, 6870.0, 4364.0, 2676.0, 1766.0, 1074.0, 724.0, 450.0, 331.0, 185.0, 136.0, 98.0, 52.0, 35.0, 32.0, 20.0, 10.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.00634002685546875, -0.006150186061859131, -0.005960345268249512, -0.005770504474639893, -0.0055806636810302734, -0.005390822887420654, -0.005200982093811035, -0.005011141300201416, -0.004821300506591797, -0.004631459712982178, -0.004441618919372559, -0.0042517781257629395, -0.00406193733215332, -0.003872096538543701, -0.003682255744934082, -0.003492414951324463, -0.0033025741577148438, -0.0031127333641052246, -0.0029228925704956055, -0.0027330517768859863, -0.002543210983276367, -0.002353370189666748, -0.002163529396057129, -0.0019736886024475098, -0.0017838478088378906, -0.0015940070152282715, -0.0014041662216186523, -0.0012143254280090332, -0.001024484634399414, -0.0008346438407897949, -0.0006448030471801758, -0.00045496225357055664, -0.0002651214599609375, -7.528066635131836e-05, 0.00011456012725830078, 0.0003044009208679199, 0.0004942417144775391, 0.0006840825080871582, 0.0008739233016967773, 0.0010637640953063965, 0.0012536048889160156, 0.0014434456825256348, 0.001633286476135254, 0.001823127269744873, 0.002012968063354492, 0.0022028088569641113, 0.0023926496505737305, 0.0025824904441833496, 0.0027723312377929688, 0.002962172031402588, 0.003152012825012207, 0.003341853618621826, 0.0035316944122314453, 0.0037215352058410645, 0.003911375999450684, 0.004101216793060303, 0.004291057586669922, 0.004480898380279541, 0.00467073917388916, 0.004860579967498779, 0.0050504207611083984, 0.005240261554718018, 0.005430102348327637, 0.005619943141937256, 0.005809783935546875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 0.0, 0.0, 5.0, 0.0, 0.0, 11.0, 0.0, 13.0, 0.0, 0.0, 18.0, 0.0, 0.0, 19.0, 0.0, 40.0, 0.0, 0.0, 44.0, 0.0, 0.0, 74.0, 0.0, 145.0, 0.0, 0.0, 286.0, 0.0, 0.0, 132.0, 0.0, 62.0, 0.0, 0.0, 46.0, 0.0, 0.0, 42.0, 0.0, 20.0, 0.0, 0.0, 20.0, 0.0, 0.0, 16.0, 0.0, 5.0, 0.0, 0.0, 10.0, 0.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.556510925292969e-07, -6.332993507385254e-07, -6.109476089477539e-07, -5.885958671569824e-07, -5.662441253662109e-07, -5.438923835754395e-07, -5.21540641784668e-07, -4.991888999938965e-07, -4.76837158203125e-07, -4.544854164123535e-07, -4.3213367462158203e-07, -4.0978193283081055e-07, -3.8743019104003906e-07, -3.650784492492676e-07, -3.427267074584961e-07, -3.203749656677246e-07, -2.980232238769531e-07, -2.7567148208618164e-07, -2.5331974029541016e-07, -2.3096799850463867e-07, -2.086162567138672e-07, -1.862645149230957e-07, -1.6391277313232422e-07, -1.4156103134155273e-07, -1.1920928955078125e-07, -9.685754776000977e-08, -7.450580596923828e-08, -5.21540641784668e-08, -2.9802322387695312e-08, -7.450580596923828e-09, 1.4901161193847656e-08, 3.725290298461914e-08, 5.960464477539063e-08, 8.195638656616211e-08, 1.043081283569336e-07, 1.2665987014770508e-07, 1.4901161193847656e-07, 1.7136335372924805e-07, 1.9371509552001953e-07, 2.1606683731079102e-07, 2.384185791015625e-07, 2.60770320892334e-07, 2.8312206268310547e-07, 3.0547380447387695e-07, 3.2782554626464844e-07, 3.501772880554199e-07, 3.725290298461914e-07, 3.948807716369629e-07, 4.172325134277344e-07, 4.3958425521850586e-07, 4.6193599700927734e-07, 4.842877388000488e-07, 5.066394805908203e-07, 5.289912223815918e-07, 5.513429641723633e-07, 5.736947059631348e-07, 5.960464477539062e-07, 6.183981895446777e-07, 6.407499313354492e-07, 6.631016731262207e-07, 6.854534149169922e-07, 7.078051567077637e-07, 7.301568984985352e-07, 7.525086402893066e-07, 7.748603820800781e-07]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 7.0, 3.0, 1.0, 0.0, 4.0, 3.0, 10.0, 10.0, 7.0, 15.0, 11.0, 15.0, 18.0, 18.0, 38.0, 42.0, 55.0, 53.0, 38.0, 107.0, 108.0, 178.0, 238.0, 611.0, 903227.0, 142241.0, 526.0, 243.0, 175.0, 89.0, 92.0, 68.0, 54.0, 53.0, 31.0, 44.0, 21.0, 23.0, 15.0, 6.0, 19.0, 8.0, 5.0, 9.0, 5.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.7881393432617188e-05, -1.7354264855384827e-05, -1.6827136278152466e-05, -1.6300007700920105e-05, -1.5772879123687744e-05, -1.5245750546455383e-05, -1.4718621969223022e-05, -1.4191493391990662e-05, -1.36643648147583e-05, -1.313723623752594e-05, -1.2610107660293579e-05, -1.2082979083061218e-05, -1.1555850505828857e-05, -1.1028721928596497e-05, -1.0501593351364136e-05, -9.974464774131775e-06, -9.447336196899414e-06, -8.920207619667053e-06, -8.393079042434692e-06, -7.865950465202332e-06, -7.338821887969971e-06, -6.81169331073761e-06, -6.284564733505249e-06, -5.757436156272888e-06, -5.230307579040527e-06, -4.7031790018081665e-06, -4.176050424575806e-06, -3.648921847343445e-06, -3.121793270111084e-06, -2.594664692878723e-06, -2.0675361156463623e-06, -1.5404075384140015e-06, -1.0132789611816406e-06, -4.861503839492798e-07, 4.0978193283081055e-08, 5.681067705154419e-07, 1.0952353477478027e-06, 1.6223639249801636e-06, 2.1494925022125244e-06, 2.6766210794448853e-06, 3.203749656677246e-06, 3.730878233909607e-06, 4.258006811141968e-06, 4.785135388374329e-06, 5.3122639656066895e-06, 5.83939254283905e-06, 6.366521120071411e-06, 6.893649697303772e-06, 7.420778274536133e-06, 7.947906851768494e-06, 8.475035429000854e-06, 9.002164006233215e-06, 9.529292583465576e-06, 1.0056421160697937e-05, 1.0583549737930298e-05, 1.1110678315162659e-05, 1.163780689239502e-05, 1.216493546962738e-05, 1.2692064046859741e-05, 1.3219192624092102e-05, 1.3746321201324463e-05, 1.4273449778556824e-05, 1.4800578355789185e-05, 1.5327706933021545e-05, 1.5854835510253906e-05]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 17.0, 143.0, 601.0, 215.0, 32.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.332940749118279e-07, -8.995003213385644e-07, -8.65706510921882e-07, -8.319127573486185e-07, -7.981190037753549e-07, -7.643251933586725e-07, -7.30531439785409e-07, -6.967376293687266e-07, -6.629438757954631e-07, -6.291501222221996e-07, -5.953563118055172e-07, -5.615625582322537e-07, -5.277687478155713e-07, -4.939749942423077e-07, -4.601812406690442e-07, -4.2638745867407124e-07, -3.925936766790983e-07, -3.587998946841253e-07, -3.2500611268915236e-07, -2.9121235911588883e-07, -2.5741857712091587e-07, -2.236247951259429e-07, -1.8983102734182467e-07, -1.5603725955770642e-07, -1.2224347756273346e-07, -8.844970267318786e-08, -5.4655927783642255e-08, -2.0862152894096653e-08, 1.293162199544895e-08, 4.672540399042191e-08, 8.051917177454015e-08, 1.143129395586584e-07, 1.481066647102125e-07, 1.8190044670518546e-07, 2.156942144893037e-07, 2.4948798227342195e-07, 2.832817642683949e-07, 3.1707554626336787e-07, 3.508692998366314e-07, 3.8466308183160436e-07, 4.184568638265773e-07, 4.522506458215503e-07, 4.860444278165232e-07, 5.198381813897868e-07, 5.536319349630503e-07, 5.874257453797327e-07, 6.212194989529962e-07, 6.550133093696786e-07, 6.888070629429421e-07, 7.226008165162057e-07, 7.563946269328881e-07, 7.901883805061516e-07, 8.23982190922834e-07, 8.577759444960975e-07, 8.91569698069361e-07, 9.253634516426246e-07, 9.59157205215888e-07, 9.929509587891516e-07, 1.0267447123624152e-06, 1.0605385796225164e-06, 1.09433233319578e-06, 1.1281260867690435e-06, 1.161919840342307e-06, 1.1957135939155705e-06, 1.2295074611756718e-06]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 0.0, 28.0, 0.0, 0.0, 0.0, 0.0, 56.0, 0.0, 0.0, 0.0, 106.0, 0.0, 0.0, 0.0, 156.0, 0.0, 0.0, 0.0, 242.0, 0.0, 0.0, 0.0, 0.0, 184.0, 0.0, 0.0, 0.0, 112.0, 0.0, 0.0, 0.0, 62.0, 0.0, 0.0, 0.0, 29.0, 0.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.172325134277344e-07, -4.032626748085022e-07, -3.8929283618927e-07, -3.7532299757003784e-07, -3.6135315895080566e-07, -3.473833203315735e-07, -3.334134817123413e-07, -3.1944364309310913e-07, -3.0547380447387695e-07, -2.915039658546448e-07, -2.775341272354126e-07, -2.635642886161804e-07, -2.4959444999694824e-07, -2.3562461137771606e-07, -2.2165477275848389e-07, -2.076849341392517e-07, -1.9371509552001953e-07, -1.7974525690078735e-07, -1.6577541828155518e-07, -1.51805579662323e-07, -1.3783574104309082e-07, -1.2386590242385864e-07, -1.0989606380462646e-07, -9.592622518539429e-08, -8.195638656616211e-08, -6.798654794692993e-08, -5.4016709327697754e-08, -4.0046870708465576e-08, -2.60770320892334e-08, -1.210719347000122e-08, 1.862645149230957e-09, 1.5832483768463135e-08, 2.9802322387695312e-08, 4.377216100692749e-08, 5.774199962615967e-08, 7.171183824539185e-08, 8.568167686462402e-08, 9.96515154838562e-08, 1.1362135410308838e-07, 1.2759119272232056e-07, 1.4156103134155273e-07, 1.555308699607849e-07, 1.695007085800171e-07, 1.8347054719924927e-07, 1.9744038581848145e-07, 2.1141022443771362e-07, 2.253800630569458e-07, 2.39349901676178e-07, 2.5331974029541016e-07, 2.6728957891464233e-07, 2.812594175338745e-07, 2.952292561531067e-07, 3.0919909477233887e-07, 3.2316893339157104e-07, 3.371387720108032e-07, 3.511086106300354e-07, 3.650784492492676e-07, 3.7904828786849976e-07, 3.9301812648773193e-07, 4.069879651069641e-07, 4.209578037261963e-07, 4.3492764234542847e-07, 4.4889748096466064e-07, 4.628673195838928e-07, 4.76837158203125e-07]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 10.0, 6.0, 15.0, 21.0, 27.0, 21.0, 28.0, 36.0, 40.0, 55.0, 63.0, 54.0, 75.0, 86.0, 60.0, 52.0, 61.0, 65.0, 71.0, 28.0, 29.0, 30.0, 27.0, 13.0, 12.0, 4.0, 6.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.791015625, -3.70184326171875, -3.6126708984375, -3.52349853515625, -3.434326171875, -3.34515380859375, -3.2559814453125, -3.16680908203125, -3.07763671875, -2.98846435546875, -2.8992919921875, -2.81011962890625, -2.720947265625, -2.63177490234375, -2.5426025390625, -2.45343017578125, -2.3642578125, -2.27508544921875, -2.1859130859375, -2.09674072265625, -2.007568359375, -1.91839599609375, -1.8292236328125, -1.74005126953125, -1.65087890625, -1.56170654296875, -1.4725341796875, -1.38336181640625, -1.294189453125, -1.20501708984375, -1.1158447265625, -1.02667236328125, -0.9375, -0.84832763671875, -0.7591552734375, -0.66998291015625, -0.580810546875, -0.49163818359375, -0.4024658203125, -0.31329345703125, -0.22412109375, -0.13494873046875, -0.0457763671875, 0.04339599609375, 0.132568359375, 0.22174072265625, 0.3109130859375, 0.40008544921875, 0.4892578125, 0.57843017578125, 0.6676025390625, 0.75677490234375, 0.845947265625, 0.93511962890625, 1.0242919921875, 1.11346435546875, 1.20263671875, 1.29180908203125, 1.3809814453125, 1.47015380859375, 1.559326171875, 1.64849853515625, 1.7376708984375, 1.82684326171875, 1.916015625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 10.0, 17.0, 41.0, 76.0, 140.0, 243.0, 395.0, 659.0, 1025.0, 1766.0, 3819.0, 10559.0, 83112.0, 890555.0, 41001.0, 8067.0, 3192.0, 1591.0, 899.0, 571.0, 342.0, 200.0, 131.0, 63.0, 29.0, 12.0, 14.0, 6.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-22.40625, -21.735107421875, -21.06396484375, -20.392822265625, -19.7216796875, -19.050537109375, -18.37939453125, -17.708251953125, -17.037109375, -16.365966796875, -15.69482421875, -15.023681640625, -14.3525390625, -13.681396484375, -13.01025390625, -12.339111328125, -11.66796875, -10.996826171875, -10.32568359375, -9.654541015625, -8.9833984375, -8.312255859375, -7.64111328125, -6.969970703125, -6.298828125, -5.627685546875, -4.95654296875, -4.285400390625, -3.6142578125, -2.943115234375, -2.27197265625, -1.600830078125, -0.9296875, -0.258544921875, 0.41259765625, 1.083740234375, 1.7548828125, 2.426025390625, 3.09716796875, 3.768310546875, 4.439453125, 5.110595703125, 5.78173828125, 6.452880859375, 7.1240234375, 7.795166015625, 8.46630859375, 9.137451171875, 9.80859375, 10.479736328125, 11.15087890625, 11.822021484375, 12.4931640625, 13.164306640625, 13.83544921875, 14.506591796875, 15.177734375, 15.848876953125, 16.52001953125, 17.191162109375, 17.8623046875, 18.533447265625, 19.20458984375, 19.875732421875, 20.546875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 11.0, 6.0, 12.0, 10.0, 17.0, 17.0, 17.0, 21.0, 30.0, 27.0, 36.0, 43.0, 45.0, 31.0, 49.0, 64.0, 93.0, 164.0, 1496.0, 258.0, 105.0, 72.0, 49.0, 53.0, 51.0, 48.0, 24.0, 28.0, 32.0, 16.0, 21.0, 14.0, 18.0, 14.0, 13.0, 5.0, 3.0, 5.0, 12.0, 5.0, 6.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.0078125, -4.83306884765625, -4.6583251953125, -4.48358154296875, -4.308837890625, -4.13409423828125, -3.9593505859375, -3.78460693359375, -3.60986328125, -3.43511962890625, -3.2603759765625, -3.08563232421875, -2.910888671875, -2.73614501953125, -2.5614013671875, -2.38665771484375, -2.2119140625, -2.03717041015625, -1.8624267578125, -1.68768310546875, -1.512939453125, -1.33819580078125, -1.1634521484375, -0.98870849609375, -0.81396484375, -0.63922119140625, -0.4644775390625, -0.28973388671875, -0.114990234375, 0.05975341796875, 0.2344970703125, 0.40924072265625, 0.583984375, 0.75872802734375, 0.9334716796875, 1.10821533203125, 1.282958984375, 1.45770263671875, 1.6324462890625, 1.80718994140625, 1.98193359375, 2.15667724609375, 2.3314208984375, 2.50616455078125, 2.680908203125, 2.85565185546875, 3.0303955078125, 3.20513916015625, 3.3798828125, 3.55462646484375, 3.7293701171875, 3.90411376953125, 4.078857421875, 4.25360107421875, 4.4283447265625, 4.60308837890625, 4.77783203125, 4.95257568359375, 5.1273193359375, 5.30206298828125, 5.476806640625, 5.65155029296875, 5.8262939453125, 6.00103759765625, 6.17578125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 7.0, 10.0, 4.0, 2.0, 6.0, 13.0, 12.0, 22.0, 20.0, 20.0, 20.0, 37.0, 39.0, 63.0, 95.0, 131.0, 242.0, 650.0, 3617.0, 254763.0, 2874626.0, 9446.0, 994.0, 332.0, 164.0, 75.0, 62.0, 41.0, 33.0, 32.0, 25.0, 17.0, 20.0, 16.0, 8.0, 11.0, 3.0, 10.0, 4.0, 6.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-25.59375, -24.885986328125, -24.17822265625, -23.470458984375, -22.7626953125, -22.054931640625, -21.34716796875, -20.639404296875, -19.931640625, -19.223876953125, -18.51611328125, -17.808349609375, -17.1005859375, -16.392822265625, -15.68505859375, -14.977294921875, -14.26953125, -13.561767578125, -12.85400390625, -12.146240234375, -11.4384765625, -10.730712890625, -10.02294921875, -9.315185546875, -8.607421875, -7.899658203125, -7.19189453125, -6.484130859375, -5.7763671875, -5.068603515625, -4.36083984375, -3.653076171875, -2.9453125, -2.237548828125, -1.52978515625, -0.822021484375, -0.1142578125, 0.593505859375, 1.30126953125, 2.009033203125, 2.716796875, 3.424560546875, 4.13232421875, 4.840087890625, 5.5478515625, 6.255615234375, 6.96337890625, 7.671142578125, 8.37890625, 9.086669921875, 9.79443359375, 10.502197265625, 11.2099609375, 11.917724609375, 12.62548828125, 13.333251953125, 14.041015625, 14.748779296875, 15.45654296875, 16.164306640625, 16.8720703125, 17.579833984375, 18.28759765625, 18.995361328125, 19.703125]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 29.0, 921.0, 66.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-289.0257873535156, -283.7305908203125, -278.43536376953125, -273.1401672363281, -267.8449401855469, -262.54974365234375, -257.2545166015625, -251.9593048095703, -246.66409301757812, -241.36888122558594, -236.07366943359375, -230.77845764160156, -225.48324584960938, -220.1880340576172, -214.892822265625, -209.5976104736328, -204.30239868164062, -199.00718688964844, -193.71197509765625, -188.41676330566406, -183.12155151367188, -177.8263397216797, -172.5311279296875, -167.2359161376953, -161.9407196044922, -156.6455078125, -151.3502960205078, -146.05508422851562, -140.75987243652344, -135.46466064453125, -130.16944885253906, -124.87423706054688, -119.57903289794922, -114.28382110595703, -108.98860931396484, -103.69339752197266, -98.39818572998047, -93.10297393798828, -87.80776977539062, -82.51255798339844, -77.21734619140625, -71.92213439941406, -66.62692260742188, -61.33171081542969, -56.0364990234375, -50.74128723144531, -45.44607925415039, -40.1508674621582, -34.85565185546875, -29.560440063476562, -24.265228271484375, -18.97001838684082, -13.674806594848633, -8.379594802856445, -3.0843849182128906, 2.210826873779297, 7.506038665771484, 12.801250457763672, 18.09646224975586, 23.391672134399414, 28.6868839263916, 33.982093811035156, 39.277305603027344, 44.57251739501953, 49.86772918701172]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 3.0, 5.0, 10.0, 13.0, 25.0, 19.0, 18.0, 28.0, 30.0, 34.0, 24.0, 38.0, 40.0, 48.0, 32.0, 47.0, 59.0, 42.0, 45.0, 47.0, 50.0, 39.0, 35.0, 42.0, 43.0, 35.0, 27.0, 25.0, 17.0, 21.0, 12.0, 9.0, 7.0, 5.0, 3.0, 4.0, 4.0, 11.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.69549560546875, -19.965490341186523, -19.23548698425293, -18.505481719970703, -17.77547836303711, -17.045473098754883, -16.315467834472656, -15.585463523864746, -14.855459213256836, -14.125454902648926, -13.395450592041016, -12.665445327758789, -11.935441017150879, -11.205436706542969, -10.475431442260742, -9.745427131652832, -9.015422821044922, -8.285418510437012, -7.555413722991943, -6.825408935546875, -6.095404624938965, -5.365400314331055, -4.635395526885986, -3.905390739440918, -3.175386428833008, -2.4453818798065186, -1.7153773307800293, -0.98537278175354, -0.2553682327270508, 0.4746363162994385, 1.2046408653259277, 1.934645652770996, 2.6646499633789062, 3.3946545124053955, 4.124659061431885, 4.854663848876953, 5.584668159484863, 6.314672470092773, 7.044677257537842, 7.77468204498291, 8.50468635559082, 9.23469066619873, 9.96469497680664, 10.694700241088867, 11.424704551696777, 12.154708862304688, 12.884714126586914, 13.614718437194824, 14.344722747802734, 15.074727058410645, 15.804731369018555, 16.53473663330078, 17.264739990234375, 17.9947452545166, 18.724750518798828, 19.454753875732422, 20.18475914001465, 20.914764404296875, 21.64476776123047, 22.374773025512695, 23.104778289794922, 23.834781646728516, 24.564786911010742, 25.29479217529297, 26.024795532226562]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 8.0, 6.0, 11.0, 15.0, 29.0, 19.0, 22.0, 31.0, 29.0, 53.0, 67.0, 46.0, 67.0, 79.0, 65.0, 59.0, 61.0, 60.0, 74.0, 49.0, 35.0, 28.0, 28.0, 18.0, 19.0, 7.0, 6.0, 5.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.775390625, -3.685943603515625, -3.59649658203125, -3.507049560546875, -3.4176025390625, -3.328155517578125, -3.23870849609375, -3.149261474609375, -3.059814453125, -2.970367431640625, -2.88092041015625, -2.791473388671875, -2.7020263671875, -2.612579345703125, -2.52313232421875, -2.433685302734375, -2.34423828125, -2.254791259765625, -2.16534423828125, -2.075897216796875, -1.9864501953125, -1.897003173828125, -1.80755615234375, -1.718109130859375, -1.628662109375, -1.539215087890625, -1.44976806640625, -1.360321044921875, -1.2708740234375, -1.181427001953125, -1.09197998046875, -1.002532958984375, -0.9130859375, -0.823638916015625, -0.73419189453125, -0.644744873046875, -0.5552978515625, -0.465850830078125, -0.37640380859375, -0.286956787109375, -0.197509765625, -0.108062744140625, -0.01861572265625, 0.070831298828125, 0.1602783203125, 0.249725341796875, 0.33917236328125, 0.428619384765625, 0.51806640625, 0.607513427734375, 0.69696044921875, 0.786407470703125, 0.8758544921875, 0.965301513671875, 1.05474853515625, 1.144195556640625, 1.233642578125, 1.323089599609375, 1.41253662109375, 1.501983642578125, 1.5914306640625, 1.680877685546875, 1.77032470703125, 1.859771728515625, 1.94921875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 4.0, 13.0, 18.0, 32.0, 36.0, 79.0, 132.0, 168.0, 370.0, 640.0, 1587.0, 10153.0, 3024651.0, 1146519.0, 7178.0, 1338.0, 575.0, 307.0, 194.0, 106.0, 68.0, 30.0, 34.0, 13.0, 13.0, 7.0, 5.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-37.90625, -37.04345703125, -36.1806640625, -35.31787109375, -34.455078125, -33.59228515625, -32.7294921875, -31.86669921875, -31.00390625, -30.14111328125, -29.2783203125, -28.41552734375, -27.552734375, -26.68994140625, -25.8271484375, -24.96435546875, -24.1015625, -23.23876953125, -22.3759765625, -21.51318359375, -20.650390625, -19.78759765625, -18.9248046875, -18.06201171875, -17.19921875, -16.33642578125, -15.4736328125, -14.61083984375, -13.748046875, -12.88525390625, -12.0224609375, -11.15966796875, -10.296875, -9.43408203125, -8.5712890625, -7.70849609375, -6.845703125, -5.98291015625, -5.1201171875, -4.25732421875, -3.39453125, -2.53173828125, -1.6689453125, -0.80615234375, 0.056640625, 0.91943359375, 1.7822265625, 2.64501953125, 3.5078125, 4.37060546875, 5.2333984375, 6.09619140625, 6.958984375, 7.82177734375, 8.6845703125, 9.54736328125, 10.41015625, 11.27294921875, 12.1357421875, 12.99853515625, 13.861328125, 14.72412109375, 15.5869140625, 16.44970703125, 17.3125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 9.0, 3.0, 7.0, 15.0, 27.0, 49.0, 109.0, 194.0, 379.0, 587.0, 979.0, 762.0, 417.0, 248.0, 148.0, 69.0, 26.0, 20.0, 11.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4140625, -10.0234375, -9.6328125, -9.2421875, -8.8515625, -8.4609375, -8.0703125, -7.6796875, -7.2890625, -6.8984375, -6.5078125, -6.1171875, -5.7265625, -5.3359375, -4.9453125, -4.5546875, -4.1640625, -3.7734375, -3.3828125, -2.9921875, -2.6015625, -2.2109375, -1.8203125, -1.4296875, -1.0390625, -0.6484375, -0.2578125, 0.1328125, 0.5234375, 0.9140625, 1.3046875, 1.6953125, 2.0859375, 2.4765625, 2.8671875, 3.2578125, 3.6484375, 4.0390625, 4.4296875, 4.8203125, 5.2109375, 5.6015625, 5.9921875, 6.3828125, 6.7734375, 7.1640625, 7.5546875, 7.9453125, 8.3359375, 8.7265625, 9.1171875, 9.5078125, 9.8984375, 10.2890625, 10.6796875, 11.0703125, 11.4609375, 11.8515625, 12.2421875, 12.6328125, 13.0234375, 13.4140625, 13.8046875, 14.1953125, 14.5859375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 3.0, 15.0, 24.0, 34.0, 82.0, 142.0, 285.0, 759.0, 2619.0, 22624.0, 1816579.0, 2320396.0, 26527.0, 2745.0, 840.0, 336.0, 126.0, 69.0, 41.0, 16.0, 15.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.28125, -18.40576171875, -17.5302734375, -16.65478515625, -15.779296875, -14.90380859375, -14.0283203125, -13.15283203125, -12.27734375, -11.40185546875, -10.5263671875, -9.65087890625, -8.775390625, -7.89990234375, -7.0244140625, -6.14892578125, -5.2734375, -4.39794921875, -3.5224609375, -2.64697265625, -1.771484375, -0.89599609375, -0.0205078125, 0.85498046875, 1.73046875, 2.60595703125, 3.4814453125, 4.35693359375, 5.232421875, 6.10791015625, 6.9833984375, 7.85888671875, 8.734375, 9.60986328125, 10.4853515625, 11.36083984375, 12.236328125, 13.11181640625, 13.9873046875, 14.86279296875, 15.73828125, 16.61376953125, 17.4892578125, 18.36474609375, 19.240234375, 20.11572265625, 20.9912109375, 21.86669921875, 22.7421875, 23.61767578125, 24.4931640625, 25.36865234375, 26.244140625, 27.11962890625, 27.9951171875, 28.87060546875, 29.74609375, 30.62158203125, 31.4970703125, 32.37255859375, 33.248046875, 34.12353515625, 34.9990234375, 35.87451171875, 36.75]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 110.0, 393.0, 411.0, 92.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.30104064941406, -32.240684509277344, -28.18033218383789, -24.119977951049805, -20.05962371826172, -15.999269485473633, -11.938915252685547, -7.878561019897461, -3.818206787109375, 0.24214744567871094, 4.302501678466797, 8.362855911254883, 12.423210144042969, 16.483564376831055, 20.54391860961914, 24.604272842407227, 28.664627075195312, 32.72498321533203, 36.785335540771484, 40.84568786621094, 44.906044006347656, 48.966400146484375, 53.02675247192383, 57.08710479736328, 61.1474609375, 65.20781707763672, 69.26817321777344, 73.32852172851562, 77.38887786865234, 81.44923400878906, 85.50958251953125, 89.56993865966797, 93.63031005859375, 97.69066619873047, 101.75102233886719, 105.81137084960938, 109.8717269897461, 113.93208312988281, 117.992431640625, 122.05278778076172, 126.11314392089844, 130.17349243164062, 134.23385620117188, 138.29420471191406, 142.35455322265625, 146.4149169921875, 150.4752655029297, 154.53562927246094, 158.59597778320312, 162.6563262939453, 166.71669006347656, 170.77703857421875, 174.83740234375, 178.8977508544922, 182.95809936523438, 187.01846313476562, 191.0788116455078, 195.13916015625, 199.19952392578125, 203.25987243652344, 207.32022094726562, 211.38058471679688, 215.44093322753906, 219.5012969970703, 223.5616455078125]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 7.0, 7.0, 8.0, 7.0, 13.0, 22.0, 18.0, 20.0, 18.0, 32.0, 33.0, 29.0, 36.0, 40.0, 31.0, 36.0, 38.0, 38.0, 46.0, 43.0, 38.0, 38.0, 45.0, 29.0, 35.0, 44.0, 28.0, 30.0, 25.0, 22.0, 26.0, 17.0, 14.0, 10.0, 15.0, 9.0, 13.0, 7.0, 9.0, 2.0, 4.0, 8.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-25.921432495117188, -25.211803436279297, -24.502172470092773, -23.79254150390625, -23.08291244506836, -22.37328338623047, -21.663652420043945, -20.954021453857422, -20.24439239501953, -19.53476333618164, -18.825132369995117, -18.115501403808594, -17.405872344970703, -16.696243286132812, -15.986612319946289, -15.276982307434082, -14.567352294921875, -13.857722282409668, -13.148092269897461, -12.438462257385254, -11.728832244873047, -11.01920223236084, -10.309572219848633, -9.599942207336426, -8.890312194824219, -8.180682182312012, -7.471052169799805, -6.761422157287598, -6.051792144775391, -5.342162132263184, -4.632532119750977, -3.9229021072387695, -3.2132720947265625, -2.5036420822143555, -1.7940120697021484, -1.0843820571899414, -0.3747520446777344, 0.33487796783447266, 1.0445079803466797, 1.7541379928588867, 2.4637680053710938, 3.173398017883301, 3.883028030395508, 4.592658042907715, 5.302288055419922, 6.011918067932129, 6.721548080444336, 7.431178092956543, 8.14080810546875, 8.850438117980957, 9.560068130493164, 10.269698143005371, 10.979328155517578, 11.688958168029785, 12.398588180541992, 13.1082181930542, 13.817848205566406, 14.527478218078613, 15.23710823059082, 15.946738243103027, 16.656368255615234, 17.365997314453125, 18.07562828063965, 18.785259246826172, 19.494888305664062]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 4.0, 5.0, 12.0, 10.0, 18.0, 19.0, 25.0, 22.0, 33.0, 37.0, 56.0, 45.0, 72.0, 53.0, 71.0, 64.0, 56.0, 62.0, 48.0, 62.0, 56.0, 40.0, 33.0, 30.0, 20.0, 16.0, 8.0, 8.0, 5.0, 6.0, 2.0, 4.0, 5.0, 0.0, 0.0, 2.0], "bins": [-3.736328125, -3.6497955322265625, -3.563262939453125, -3.4767303466796875, -3.39019775390625, -3.3036651611328125, -3.217132568359375, -3.1305999755859375, -3.0440673828125, -2.9575347900390625, -2.871002197265625, -2.7844696044921875, -2.69793701171875, -2.6114044189453125, -2.524871826171875, -2.4383392333984375, -2.351806640625, -2.2652740478515625, -2.178741455078125, -2.0922088623046875, -2.00567626953125, -1.9191436767578125, -1.832611083984375, -1.7460784912109375, -1.6595458984375, -1.5730133056640625, -1.486480712890625, -1.3999481201171875, -1.31341552734375, -1.2268829345703125, -1.140350341796875, -1.0538177490234375, -0.96728515625, -0.8807525634765625, -0.794219970703125, -0.7076873779296875, -0.62115478515625, -0.5346221923828125, -0.448089599609375, -0.3615570068359375, -0.2750244140625, -0.1884918212890625, -0.101959228515625, -0.0154266357421875, 0.07110595703125, 0.1576385498046875, 0.244171142578125, 0.3307037353515625, 0.417236328125, 0.5037689208984375, 0.590301513671875, 0.6768341064453125, 0.76336669921875, 0.8498992919921875, 0.936431884765625, 1.0229644775390625, 1.1094970703125, 1.1960296630859375, 1.282562255859375, 1.3690948486328125, 1.45562744140625, 1.5421600341796875, 1.628692626953125, 1.7152252197265625, 1.8017578125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 7.0, 3.0, 11.0, 11.0, 12.0, 11.0, 20.0, 35.0, 37.0, 55.0, 102.0, 213.0, 429.0, 777.0, 1460.0, 2843.0, 5659.0, 11488.0, 23987.0, 52751.0, 127213.0, 360338.0, 277276.0, 101336.0, 43218.0, 19756.0, 9440.0, 4781.0, 2517.0, 1275.0, 698.0, 344.0, 174.0, 95.0, 49.0, 24.0, 25.0, 15.0, 9.0, 10.0, 15.0, 7.0, 3.0, 6.0, 7.0, 4.0, 5.0, 1.0, 4.0, 2.0, 0.0, 2.0], "bins": [-0.027557373046875, -0.02674388885498047, -0.025930404663085938, -0.025116920471191406, -0.024303436279296875, -0.023489952087402344, -0.022676467895507812, -0.02186298370361328, -0.02104949951171875, -0.02023601531982422, -0.019422531127929688, -0.018609046936035156, -0.017795562744140625, -0.016982078552246094, -0.016168594360351562, -0.015355110168457031, -0.0145416259765625, -0.013728141784667969, -0.012914657592773438, -0.012101173400878906, -0.011287689208984375, -0.010474205017089844, -0.009660720825195312, -0.008847236633300781, -0.00803375244140625, -0.007220268249511719, -0.0064067840576171875, -0.005593299865722656, -0.004779815673828125, -0.003966331481933594, -0.0031528472900390625, -0.0023393630981445312, -0.00152587890625, -0.0007123947143554688, 0.0001010894775390625, 0.0009145736694335938, 0.001728057861328125, 0.0025415420532226562, 0.0033550262451171875, 0.004168510437011719, 0.00498199462890625, 0.005795478820800781, 0.0066089630126953125, 0.007422447204589844, 0.008235931396484375, 0.009049415588378906, 0.009862899780273438, 0.010676383972167969, 0.0114898681640625, 0.012303352355957031, 0.013116836547851562, 0.013930320739746094, 0.014743804931640625, 0.015557289123535156, 0.016370773315429688, 0.01718425750732422, 0.01799774169921875, 0.01881122589111328, 0.019624710083007812, 0.020438194274902344, 0.021251678466796875, 0.022065162658691406, 0.022878646850585938, 0.02369213104248047, 0.024505615234375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 6.0, 4.0, 7.0, 13.0, 7.0, 13.0, 14.0, 21.0, 18.0, 21.0, 24.0, 28.0, 25.0, 24.0, 34.0, 40.0, 29.0, 41.0, 41.0, 46.0, 1085.0, 44.0, 53.0, 37.0, 41.0, 41.0, 29.0, 35.0, 30.0, 40.0, 29.0, 23.0, 19.0, 11.0, 13.0, 11.0, 7.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7021484375, -1.6480865478515625, -1.594024658203125, -1.5399627685546875, -1.48590087890625, -1.4318389892578125, -1.377777099609375, -1.3237152099609375, -1.2696533203125, -1.2155914306640625, -1.161529541015625, -1.1074676513671875, -1.05340576171875, -0.9993438720703125, -0.945281982421875, -0.8912200927734375, -0.837158203125, -0.7830963134765625, -0.729034423828125, -0.6749725341796875, -0.62091064453125, -0.5668487548828125, -0.512786865234375, -0.4587249755859375, -0.4046630859375, -0.3506011962890625, -0.296539306640625, -0.2424774169921875, -0.18841552734375, -0.1343536376953125, -0.080291748046875, -0.0262298583984375, 0.02783203125, 0.0818939208984375, 0.135955810546875, 0.1900177001953125, 0.24407958984375, 0.2981414794921875, 0.352203369140625, 0.4062652587890625, 0.4603271484375, 0.5143890380859375, 0.568450927734375, 0.6225128173828125, 0.67657470703125, 0.7306365966796875, 0.784698486328125, 0.8387603759765625, 0.892822265625, 0.9468841552734375, 1.000946044921875, 1.0550079345703125, 1.10906982421875, 1.1631317138671875, 1.217193603515625, 1.2712554931640625, 1.3253173828125, 1.3793792724609375, 1.433441162109375, 1.4875030517578125, 1.54156494140625, 1.5956268310546875, 1.649688720703125, 1.7037506103515625, 1.7578125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 6.0, 15.0, 21.0, 36.0, 38.0, 56.0, 71.0, 102.0, 160.0, 284.0, 415.0, 536.0, 876.0, 1339.0, 1934.0, 3010.0, 4578.0, 7278.0, 11484.0, 17901.0, 28492.0, 46532.0, 76664.0, 130806.0, 1264656.0, 199455.0, 116468.0, 69290.0, 42481.0, 25956.0, 16593.0, 10429.0, 6649.0, 4250.0, 2825.0, 1848.0, 1115.0, 846.0, 538.0, 351.0, 235.0, 162.0, 109.0, 89.0, 48.0, 33.0, 28.0, 17.0, 12.0, 8.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.0061798095703125, -0.0059860944747924805, -0.005792379379272461, -0.005598664283752441, -0.005404949188232422, -0.005211234092712402, -0.005017518997192383, -0.004823803901672363, -0.004630088806152344, -0.004436373710632324, -0.004242658615112305, -0.004048943519592285, -0.0038552284240722656, -0.003661513328552246, -0.0034677982330322266, -0.003274083137512207, -0.0030803680419921875, -0.002886652946472168, -0.0026929378509521484, -0.002499222755432129, -0.0023055076599121094, -0.00211179256439209, -0.0019180774688720703, -0.0017243623733520508, -0.0015306472778320312, -0.0013369321823120117, -0.0011432170867919922, -0.0009495019912719727, -0.0007557868957519531, -0.0005620718002319336, -0.00036835670471191406, -0.00017464160919189453, 1.9073486328125e-05, 0.00021278858184814453, 0.00040650367736816406, 0.0006002187728881836, 0.0007939338684082031, 0.0009876489639282227, 0.0011813640594482422, 0.0013750791549682617, 0.0015687942504882812, 0.0017625093460083008, 0.0019562244415283203, 0.00214993953704834, 0.0023436546325683594, 0.002537369728088379, 0.0027310848236083984, 0.002924799919128418, 0.0031185150146484375, 0.003312230110168457, 0.0035059452056884766, 0.003699660301208496, 0.0038933753967285156, 0.004087090492248535, 0.004280805587768555, 0.004474520683288574, 0.004668235778808594, 0.004861950874328613, 0.005055665969848633, 0.005249381065368652, 0.005443096160888672, 0.005636811256408691, 0.005830526351928711, 0.0060242414474487305, 0.00621795654296875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 6.0, 0.0, 0.0, 10.0, 0.0, 0.0, 14.0, 0.0, 0.0, 31.0, 0.0, 0.0, 39.0, 0.0, 0.0, 60.0, 0.0, 145.0, 0.0, 0.0, 388.0, 0.0, 0.0, 156.0, 0.0, 0.0, 81.0, 0.0, 0.0, 38.0, 0.0, 0.0, 27.0, 0.0, 0.0, 11.0, 0.0, 0.0, 9.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.748603820800781e-07, -7.543712854385376e-07, -7.338821887969971e-07, -7.133930921554565e-07, -6.92903995513916e-07, -6.724148988723755e-07, -6.51925802230835e-07, -6.314367055892944e-07, -6.109476089477539e-07, -5.904585123062134e-07, -5.699694156646729e-07, -5.494803190231323e-07, -5.289912223815918e-07, -5.085021257400513e-07, -4.880130290985107e-07, -4.675239324569702e-07, -4.470348358154297e-07, -4.2654573917388916e-07, -4.0605664253234863e-07, -3.855675458908081e-07, -3.650784492492676e-07, -3.4458935260772705e-07, -3.241002559661865e-07, -3.03611159324646e-07, -2.8312206268310547e-07, -2.6263296604156494e-07, -2.421438694000244e-07, -2.2165477275848389e-07, -2.0116567611694336e-07, -1.8067657947540283e-07, -1.601874828338623e-07, -1.3969838619232178e-07, -1.1920928955078125e-07, -9.872019290924072e-08, -7.82310962677002e-08, -5.774199962615967e-08, -3.725290298461914e-08, -1.6763806343078613e-08, 3.725290298461914e-09, 2.421438694000244e-08, 4.470348358154297e-08, 6.51925802230835e-08, 8.568167686462402e-08, 1.0617077350616455e-07, 1.2665987014770508e-07, 1.471489667892456e-07, 1.6763806343078613e-07, 1.8812716007232666e-07, 2.086162567138672e-07, 2.2910535335540771e-07, 2.4959444999694824e-07, 2.7008354663848877e-07, 2.905726432800293e-07, 3.110617399215698e-07, 3.3155083656311035e-07, 3.520399332046509e-07, 3.725290298461914e-07, 3.9301812648773193e-07, 4.1350722312927246e-07, 4.33996319770813e-07, 4.544854164123535e-07, 4.7497451305389404e-07, 4.954636096954346e-07, 5.159527063369751e-07, 5.364418029785156e-07]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 10.0, 20.0, 14.0, 22.0, 11.0, 26.0, 33.0, 25.0, 35.0, 74.0, 40.0, 129.0, 96.0, 119.0, 479.0, 3769.0, 977561.0, 64696.0, 552.0, 275.0, 71.0, 135.0, 53.0, 48.0, 71.0, 37.0, 34.0, 18.0, 22.0, 21.0, 13.0, 12.0, 8.0, 3.0, 6.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.233816146850586e-05, -1.194886863231659e-05, -1.155957579612732e-05, -1.117028295993805e-05, -1.078099012374878e-05, -1.039169728755951e-05, -1.000240445137024e-05, -9.61311161518097e-06, -9.2238187789917e-06, -8.83452594280243e-06, -8.44523310661316e-06, -8.05594027042389e-06, -7.666647434234619e-06, -7.277354598045349e-06, -6.888061761856079e-06, -6.498768925666809e-06, -6.109476089477539e-06, -5.720183253288269e-06, -5.330890417098999e-06, -4.941597580909729e-06, -4.552304744720459e-06, -4.163011908531189e-06, -3.773719072341919e-06, -3.384426236152649e-06, -2.995133399963379e-06, -2.605840563774109e-06, -2.216547727584839e-06, -1.8272548913955688e-06, -1.4379620552062988e-06, -1.0486692190170288e-06, -6.593763828277588e-07, -2.7008354663848877e-07, 1.1920928955078125e-07, 5.085021257400513e-07, 8.977949619293213e-07, 1.2870877981185913e-06, 1.6763806343078613e-06, 2.0656734704971313e-06, 2.4549663066864014e-06, 2.8442591428756714e-06, 3.2335519790649414e-06, 3.6228448152542114e-06, 4.0121376514434814e-06, 4.4014304876327515e-06, 4.7907233238220215e-06, 5.1800161600112915e-06, 5.5693089962005615e-06, 5.9586018323898315e-06, 6.3478946685791016e-06, 6.737187504768372e-06, 7.126480340957642e-06, 7.515773177146912e-06, 7.905066013336182e-06, 8.294358849525452e-06, 8.683651685714722e-06, 9.072944521903992e-06, 9.462237358093262e-06, 9.851530194282532e-06, 1.0240823030471802e-05, 1.0630115866661072e-05, 1.1019408702850342e-05, 1.1408701539039612e-05, 1.1797994375228882e-05, 1.2187287211418152e-05, 1.2576580047607422e-05]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 51.0, 289.0, 594.0, 73.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0107694379257737e-06, -9.478548577135371e-07, -8.849402775013004e-07, -8.220257541324827e-07, -7.591111739202461e-07, -6.961965937080095e-07, -6.332820703391917e-07, -5.703674901269551e-07, -5.074529099147185e-07, -4.4453832970248186e-07, -3.816237779119547e-07, -3.187092261214275e-07, -2.557946459091909e-07, -1.9288006569695426e-07, -1.2996551390642708e-07, -6.705096211589989e-08, -4.136381903663278e-09, 5.877818409771862e-08, 1.2169275009910052e-07, 1.8460731610048242e-07, 2.475218821018643e-07, 3.1043646231410094e-07, 3.733510141046281e-07, 4.362655658951553e-07, 4.991801461073919e-07, 5.620947263196285e-07, 6.250093065318651e-07, 6.879238299006829e-07, 7.508384101129195e-07, 8.137529903251561e-07, 8.766675136939739e-07, 9.395820939062105e-07, 1.0024969014921226e-06, 1.0654114248609403e-06, 1.1283260619165958e-06, 1.1912405852854135e-06, 1.254155222341069e-06, 1.3170697457098868e-06, 1.3799842690787045e-06, 1.4428987924475223e-06, 1.5058134295031778e-06, 1.5687279528719955e-06, 1.631642589927651e-06, 1.6945571132964687e-06, 1.7574716366652865e-06, 1.820386273720942e-06, 1.8833007970897597e-06, 1.946215434145415e-06, 2.009129957514233e-06, 2.0720444808830507e-06, 2.1349590042518685e-06, 2.1978737549943617e-06, 2.2607882783631794e-06, 2.323702801731997e-06, 2.386617325100815e-06, 2.4495318484696327e-06, 2.5124463718384504e-06, 2.575360895207268e-06, 2.638275418576086e-06, 2.701190169318579e-06, 2.764104692687397e-06, 2.8270192160562146e-06, 2.8899337394250324e-06, 2.95284826279385e-06, 3.0157630135363434e-06]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 12.0, 0.0, 0.0, 0.0, 0.0, 22.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.0, 0.0, 0.0, 0.0, 0.0, 179.0, 0.0, 0.0, 0.0, 0.0, 376.0, 0.0, 0.0, 0.0, 0.0, 0.0, 220.0, 0.0, 0.0, 0.0, 0.0, 79.0, 0.0, 0.0, 0.0, 0.0, 34.0, 0.0, 0.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.980232238769531e-07, -2.868473529815674e-07, -2.7567148208618164e-07, -2.644956111907959e-07, -2.5331974029541016e-07, -2.421438694000244e-07, -2.3096799850463867e-07, -2.1979212760925293e-07, -2.086162567138672e-07, -1.9744038581848145e-07, -1.862645149230957e-07, -1.7508864402770996e-07, -1.6391277313232422e-07, -1.5273690223693848e-07, -1.4156103134155273e-07, -1.30385160446167e-07, -1.1920928955078125e-07, -1.0803341865539551e-07, -9.685754776000977e-08, -8.568167686462402e-08, -7.450580596923828e-08, -6.332993507385254e-08, -5.21540641784668e-08, -4.0978193283081055e-08, -2.9802322387695312e-08, -1.862645149230957e-08, -7.450580596923828e-09, 3.725290298461914e-09, 1.4901161193847656e-08, 2.60770320892334e-08, 3.725290298461914e-08, 4.842877388000488e-08, 5.960464477539063e-08, 7.078051567077637e-08, 8.195638656616211e-08, 9.313225746154785e-08, 1.043081283569336e-07, 1.1548399925231934e-07, 1.2665987014770508e-07, 1.3783574104309082e-07, 1.4901161193847656e-07, 1.601874828338623e-07, 1.7136335372924805e-07, 1.825392246246338e-07, 1.9371509552001953e-07, 2.0489096641540527e-07, 2.1606683731079102e-07, 2.2724270820617676e-07, 2.384185791015625e-07, 2.4959444999694824e-07, 2.60770320892334e-07, 2.7194619178771973e-07, 2.8312206268310547e-07, 2.942979335784912e-07, 3.0547380447387695e-07, 3.166496753692627e-07, 3.2782554626464844e-07, 3.390014171600342e-07, 3.501772880554199e-07, 3.6135315895080566e-07, 3.725290298461914e-07, 3.8370490074157715e-07, 3.948807716369629e-07, 4.0605664253234863e-07, 4.172325134277344e-07]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 4.0, 5.0, 12.0, 10.0, 18.0, 19.0, 25.0, 22.0, 33.0, 37.0, 56.0, 45.0, 72.0, 53.0, 71.0, 64.0, 56.0, 62.0, 48.0, 62.0, 56.0, 40.0, 33.0, 30.0, 20.0, 16.0, 8.0, 8.0, 5.0, 6.0, 2.0, 4.0, 5.0, 0.0, 0.0, 2.0], "bins": [-3.736328125, -3.6497955322265625, -3.563262939453125, -3.4767303466796875, -3.39019775390625, -3.3036651611328125, -3.217132568359375, -3.1305999755859375, -3.0440673828125, -2.9575347900390625, -2.871002197265625, -2.7844696044921875, -2.69793701171875, -2.6114044189453125, -2.524871826171875, -2.4383392333984375, -2.351806640625, -2.2652740478515625, -2.178741455078125, -2.0922088623046875, -2.00567626953125, -1.9191436767578125, -1.832611083984375, -1.7460784912109375, -1.6595458984375, -1.5730133056640625, -1.486480712890625, -1.3999481201171875, -1.31341552734375, -1.2268829345703125, -1.140350341796875, -1.0538177490234375, -0.96728515625, -0.8807525634765625, -0.794219970703125, -0.7076873779296875, -0.62115478515625, -0.5346221923828125, -0.448089599609375, -0.3615570068359375, -0.2750244140625, -0.1884918212890625, -0.101959228515625, -0.0154266357421875, 0.07110595703125, 0.1576385498046875, 0.244171142578125, 0.3307037353515625, 0.417236328125, 0.5037689208984375, 0.590301513671875, 0.6768341064453125, 0.76336669921875, 0.8498992919921875, 0.936431884765625, 1.0229644775390625, 1.1094970703125, 1.1960296630859375, 1.282562255859375, 1.3690948486328125, 1.45562744140625, 1.5421600341796875, 1.628692626953125, 1.7152252197265625, 1.8017578125]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 8.0, 12.0, 26.0, 36.0, 53.0, 91.0, 136.0, 271.0, 490.0, 945.0, 1790.0, 3532.0, 7688.0, 18684.0, 54566.0, 240565.0, 559026.0, 106590.0, 31270.0, 12226.0, 5224.0, 2560.0, 1254.0, 646.0, 383.0, 186.0, 125.0, 70.0, 50.0, 22.0, 14.0, 8.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.236328125, -3.14453125, -3.052734375, -2.9609375, -2.869140625, -2.77734375, -2.685546875, -2.59375, -2.501953125, -2.41015625, -2.318359375, -2.2265625, -2.134765625, -2.04296875, -1.951171875, -1.859375, -1.767578125, -1.67578125, -1.583984375, -1.4921875, -1.400390625, -1.30859375, -1.216796875, -1.125, -1.033203125, -0.94140625, -0.849609375, -0.7578125, -0.666015625, -0.57421875, -0.482421875, -0.390625, -0.298828125, -0.20703125, -0.115234375, -0.0234375, 0.068359375, 0.16015625, 0.251953125, 0.34375, 0.435546875, 0.52734375, 0.619140625, 0.7109375, 0.802734375, 0.89453125, 0.986328125, 1.078125, 1.169921875, 1.26171875, 1.353515625, 1.4453125, 1.537109375, 1.62890625, 1.720703125, 1.8125, 1.904296875, 1.99609375, 2.087890625, 2.1796875, 2.271484375, 2.36328125, 2.455078125, 2.546875, 2.638671875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 10.0, 7.0, 7.0, 6.0, 12.0, 10.0, 9.0, 12.0, 16.0, 21.0, 17.0, 19.0, 23.0, 23.0, 31.0, 27.0, 39.0, 31.0, 53.0, 49.0, 84.0, 222.0, 1664.0, 156.0, 71.0, 54.0, 43.0, 31.0, 40.0, 35.0, 29.0, 23.0, 25.0, 26.0, 18.0, 20.0, 14.0, 13.0, 12.0, 8.0, 8.0, 7.0, 8.0, 4.0, 3.0, 4.0, 2.0, 2.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-5.81640625, -5.63092041015625, -5.4454345703125, -5.25994873046875, -5.074462890625, -4.88897705078125, -4.7034912109375, -4.51800537109375, -4.33251953125, -4.14703369140625, -3.9615478515625, -3.77606201171875, -3.590576171875, -3.40509033203125, -3.2196044921875, -3.03411865234375, -2.8486328125, -2.66314697265625, -2.4776611328125, -2.29217529296875, -2.106689453125, -1.92120361328125, -1.7357177734375, -1.55023193359375, -1.36474609375, -1.17926025390625, -0.9937744140625, -0.80828857421875, -0.622802734375, -0.43731689453125, -0.2518310546875, -0.06634521484375, 0.119140625, 0.30462646484375, 0.4901123046875, 0.67559814453125, 0.861083984375, 1.04656982421875, 1.2320556640625, 1.41754150390625, 1.60302734375, 1.78851318359375, 1.9739990234375, 2.15948486328125, 2.344970703125, 2.53045654296875, 2.7159423828125, 2.90142822265625, 3.0869140625, 3.27239990234375, 3.4578857421875, 3.64337158203125, 3.828857421875, 4.01434326171875, 4.1998291015625, 4.38531494140625, 4.57080078125, 4.75628662109375, 4.9417724609375, 5.12725830078125, 5.312744140625, 5.49822998046875, 5.6837158203125, 5.86920166015625, 6.0546875]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 5.0, 1.0, 2.0, 1.0, 7.0, 1.0, 7.0, 8.0, 7.0, 3.0, 9.0, 18.0, 13.0, 20.0, 18.0, 28.0, 31.0, 26.0, 50.0, 45.0, 80.0, 111.0, 206.0, 344.0, 858.0, 5916.0, 533397.0, 2592067.0, 10384.0, 1002.0, 379.0, 194.0, 124.0, 67.0, 53.0, 40.0, 26.0, 31.0, 17.0, 17.0, 22.0, 18.0, 12.0, 10.0, 9.0, 7.0, 2.0, 5.0, 13.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.796875, -11.4173583984375, -11.037841796875, -10.6583251953125, -10.27880859375, -9.8992919921875, -9.519775390625, -9.1402587890625, -8.7607421875, -8.3812255859375, -8.001708984375, -7.6221923828125, -7.24267578125, -6.8631591796875, -6.483642578125, -6.1041259765625, -5.724609375, -5.3450927734375, -4.965576171875, -4.5860595703125, -4.20654296875, -3.8270263671875, -3.447509765625, -3.0679931640625, -2.6884765625, -2.3089599609375, -1.929443359375, -1.5499267578125, -1.17041015625, -0.7908935546875, -0.411376953125, -0.0318603515625, 0.34765625, 0.7271728515625, 1.106689453125, 1.4862060546875, 1.86572265625, 2.2452392578125, 2.624755859375, 3.0042724609375, 3.3837890625, 3.7633056640625, 4.142822265625, 4.5223388671875, 4.90185546875, 5.2813720703125, 5.660888671875, 6.0404052734375, 6.419921875, 6.7994384765625, 7.178955078125, 7.5584716796875, 7.93798828125, 8.3175048828125, 8.697021484375, 9.0765380859375, 9.4560546875, 9.8355712890625, 10.215087890625, 10.5946044921875, 10.97412109375, 11.3536376953125, 11.733154296875, 12.1126708984375, 12.4921875]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 8.0, 1011.0], "bins": [-361.3667907714844, -355.6764831542969, -349.9861755371094, -344.29583740234375, -338.60552978515625, -332.91522216796875, -327.22491455078125, -321.53460693359375, -315.84429931640625, -310.15399169921875, -304.46368408203125, -298.77337646484375, -293.0830383300781, -287.3927307128906, -281.7024230957031, -276.0121154785156, -270.32177734375, -264.6314697265625, -258.941162109375, -253.25083923339844, -247.56053161621094, -241.87020874023438, -236.17990112304688, -230.48959350585938, -224.79928588867188, -219.10897827148438, -213.4186553955078, -207.7283477783203, -202.0380401611328, -196.34771728515625, -190.65740966796875, -184.96710205078125, -179.27679443359375, -173.58648681640625, -167.8961639404297, -162.2058563232422, -156.5155487060547, -150.82522583007812, -145.13491821289062, -139.44461059570312, -133.75428771972656, -128.06398010253906, -122.37366485595703, -116.683349609375, -110.9930419921875, -105.30272674560547, -99.61241149902344, -93.92210388183594, -88.2317886352539, -82.54147338867188, -76.85116577148438, -71.16085052490234, -65.47053527832031, -59.78022766113281, -54.08991241455078, -48.399600982666016, -42.70928955078125, -37.018978118896484, -31.328664779663086, -25.638351440429688, -19.948040008544922, -14.257728576660156, -8.567413330078125, -2.8771018981933594, 2.813208818435669]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 5.0, 3.0, 7.0, 12.0, 9.0, 9.0, 10.0, 10.0, 14.0, 20.0, 34.0, 24.0, 16.0, 29.0, 28.0, 28.0, 47.0, 39.0, 41.0, 24.0, 33.0, 42.0, 39.0, 49.0, 51.0, 28.0, 32.0, 40.0, 35.0, 26.0, 28.0, 24.0, 11.0, 24.0, 17.0, 21.0, 24.0, 14.0, 4.0, 14.0, 5.0, 3.0, 6.0, 4.0, 4.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-22.755081176757812, -22.09783363342285, -21.44058609008789, -20.783340454101562, -20.1260929107666, -19.46884536743164, -18.81159782409668, -18.15435028076172, -17.497102737426758, -16.839855194091797, -16.182607650756836, -15.525361061096191, -14.86811351776123, -14.210866928100586, -13.553619384765625, -12.896371841430664, -12.23912525177002, -11.581877708435059, -10.924631118774414, -10.267383575439453, -9.610136032104492, -8.952888488769531, -8.295641899108887, -7.638394355773926, -6.981147289276123, -6.32390022277832, -5.666652679443359, -5.009405612945557, -4.352158546447754, -3.694911003112793, -3.0376639366149902, -2.3804163932800293, -1.7231693267822266, -1.0659220218658447, -0.40867483615875244, 0.24857234954833984, 0.9058196544647217, 1.5630669593811035, 2.2203140258789062, 2.877561569213867, 3.53480863571167, 4.192055702209473, 4.849303245544434, 5.506550312042236, 6.163797378540039, 6.821044921875, 7.478291988372803, 8.135540008544922, 8.792786598205566, 9.450034141540527, 10.107280731201172, 10.764528274536133, 11.421775817871094, 12.079023361206055, 12.7362699508667, 13.39351749420166, 14.050764083862305, 14.708011627197266, 15.36525821685791, 16.022506713867188, 16.679752349853516, 17.336999893188477, 17.994247436523438, 18.6514949798584, 19.30874252319336]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 1.0, 5.0, 3.0, 3.0, 15.0, 10.0, 23.0, 14.0, 29.0, 20.0, 31.0, 40.0, 48.0, 52.0, 59.0, 66.0, 67.0, 65.0, 54.0, 57.0, 47.0, 71.0, 45.0, 42.0, 43.0, 26.0, 19.0, 16.0, 8.0, 10.0, 6.0, 4.0, 4.0, 5.0, 2.0, 3.0, 0.0, 2.0], "bins": [-3.74609375, -3.6594696044921875, -3.572845458984375, -3.4862213134765625, -3.39959716796875, -3.3129730224609375, -3.226348876953125, -3.1397247314453125, -3.0531005859375, -2.9664764404296875, -2.879852294921875, -2.7932281494140625, -2.70660400390625, -2.6199798583984375, -2.533355712890625, -2.4467315673828125, -2.360107421875, -2.2734832763671875, -2.186859130859375, -2.1002349853515625, -2.01361083984375, -1.9269866943359375, -1.840362548828125, -1.7537384033203125, -1.6671142578125, -1.5804901123046875, -1.493865966796875, -1.4072418212890625, -1.32061767578125, -1.2339935302734375, -1.147369384765625, -1.0607452392578125, -0.97412109375, -0.8874969482421875, -0.800872802734375, -0.7142486572265625, -0.62762451171875, -0.5410003662109375, -0.454376220703125, -0.3677520751953125, -0.2811279296875, -0.1945037841796875, -0.107879638671875, -0.0212554931640625, 0.06536865234375, 0.1519927978515625, 0.238616943359375, 0.3252410888671875, 0.411865234375, 0.4984893798828125, 0.585113525390625, 0.6717376708984375, 0.75836181640625, 0.8449859619140625, 0.931610107421875, 1.0182342529296875, 1.1048583984375, 1.1914825439453125, 1.278106689453125, 1.3647308349609375, 1.45135498046875, 1.5379791259765625, 1.624603271484375, 1.7112274169921875, 1.7978515625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 2.0, 7.0, 9.0, 25.0, 21.0, 36.0, 42.0, 56.0, 85.0, 157.0, 319.0, 796.0, 3442.0, 66607.0, 3872211.0, 241569.0, 6868.0, 1168.0, 366.0, 175.0, 114.0, 61.0, 37.0, 32.0, 32.0, 19.0, 5.0, 6.0, 3.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-28.34375, -27.6943359375, -27.044921875, -26.3955078125, -25.74609375, -25.0966796875, -24.447265625, -23.7978515625, -23.1484375, -22.4990234375, -21.849609375, -21.2001953125, -20.55078125, -19.9013671875, -19.251953125, -18.6025390625, -17.953125, -17.3037109375, -16.654296875, -16.0048828125, -15.35546875, -14.7060546875, -14.056640625, -13.4072265625, -12.7578125, -12.1083984375, -11.458984375, -10.8095703125, -10.16015625, -9.5107421875, -8.861328125, -8.2119140625, -7.5625, -6.9130859375, -6.263671875, -5.6142578125, -4.96484375, -4.3154296875, -3.666015625, -3.0166015625, -2.3671875, -1.7177734375, -1.068359375, -0.4189453125, 0.23046875, 0.8798828125, 1.529296875, 2.1787109375, 2.828125, 3.4775390625, 4.126953125, 4.7763671875, 5.42578125, 6.0751953125, 6.724609375, 7.3740234375, 8.0234375, 8.6728515625, 9.322265625, 9.9716796875, 10.62109375, 11.2705078125, 11.919921875, 12.5693359375, 13.21875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 9.0, 18.0, 25.0, 44.0, 103.0, 178.0, 271.0, 462.0, 730.0, 822.0, 573.0, 391.0, 204.0, 98.0, 57.0, 30.0, 27.0, 14.0, 8.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.28125, -9.9029541015625, -9.524658203125, -9.1463623046875, -8.76806640625, -8.3897705078125, -8.011474609375, -7.6331787109375, -7.2548828125, -6.8765869140625, -6.498291015625, -6.1199951171875, -5.74169921875, -5.3634033203125, -4.985107421875, -4.6068115234375, -4.228515625, -3.8502197265625, -3.471923828125, -3.0936279296875, -2.71533203125, -2.3370361328125, -1.958740234375, -1.5804443359375, -1.2021484375, -0.8238525390625, -0.445556640625, -0.0672607421875, 0.31103515625, 0.6893310546875, 1.067626953125, 1.4459228515625, 1.82421875, 2.2025146484375, 2.580810546875, 2.9591064453125, 3.33740234375, 3.7156982421875, 4.093994140625, 4.4722900390625, 4.8505859375, 5.2288818359375, 5.607177734375, 5.9854736328125, 6.36376953125, 6.7420654296875, 7.120361328125, 7.4986572265625, 7.876953125, 8.2552490234375, 8.633544921875, 9.0118408203125, 9.39013671875, 9.7684326171875, 10.146728515625, 10.5250244140625, 10.9033203125, 11.2816162109375, 11.659912109375, 12.0382080078125, 12.41650390625, 12.7947998046875, 13.173095703125, 13.5513916015625, 13.9296875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 15.0, 8.0, 9.0, 23.0, 20.0, 32.0, 58.0, 66.0, 86.0, 143.0, 224.0, 370.0, 721.0, 1581.0, 5462.0, 43604.0, 891865.0, 3080171.0, 152690.0, 12379.0, 2499.0, 956.0, 469.0, 261.0, 163.0, 120.0, 83.0, 56.0, 43.0, 25.0, 28.0, 19.0, 14.0, 7.0, 1.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.953125, -20.322509765625, -19.69189453125, -19.061279296875, -18.4306640625, -17.800048828125, -17.16943359375, -16.538818359375, -15.908203125, -15.277587890625, -14.64697265625, -14.016357421875, -13.3857421875, -12.755126953125, -12.12451171875, -11.493896484375, -10.86328125, -10.232666015625, -9.60205078125, -8.971435546875, -8.3408203125, -7.710205078125, -7.07958984375, -6.448974609375, -5.818359375, -5.187744140625, -4.55712890625, -3.926513671875, -3.2958984375, -2.665283203125, -2.03466796875, -1.404052734375, -0.7734375, -0.142822265625, 0.48779296875, 1.118408203125, 1.7490234375, 2.379638671875, 3.01025390625, 3.640869140625, 4.271484375, 4.902099609375, 5.53271484375, 6.163330078125, 6.7939453125, 7.424560546875, 8.05517578125, 8.685791015625, 9.31640625, 9.947021484375, 10.57763671875, 11.208251953125, 11.8388671875, 12.469482421875, 13.10009765625, 13.730712890625, 14.361328125, 14.991943359375, 15.62255859375, 16.253173828125, 16.8837890625, 17.514404296875, 18.14501953125, 18.775634765625, 19.40625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 23.0, 72.0, 180.0, 280.0, 259.0, 139.0, 45.0, 9.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.13874053955078, -64.05313110351562, -60.9675178527832, -57.88190460205078, -54.796295166015625, -51.7106819152832, -48.62506866455078, -45.539459228515625, -42.4538459777832, -39.36823272705078, -36.282623291015625, -33.1970100402832, -30.111398696899414, -27.025787353515625, -23.940174102783203, -20.854562759399414, -17.768951416015625, -14.683340072631836, -11.59772777557373, -8.512115478515625, -5.426504135131836, -2.340892791748047, 0.744720458984375, 3.830331802368164, 6.915943145751953, 10.001554489135742, 13.087166786193848, 16.172779083251953, 19.258390426635742, 22.34400177001953, 25.429615020751953, 28.515226364135742, 31.600845336914062, 34.686458587646484, 37.77206802368164, 40.85768127441406, 43.94329071044922, 47.02890396118164, 50.11451721191406, 53.20012664794922, 56.28573989868164, 59.37135314941406, 62.45696258544922, 65.54257202148438, 68.62818908691406, 71.71379852294922, 74.79940795898438, 77.88502502441406, 80.97063446044922, 84.05624389648438, 87.14186096191406, 90.22747039794922, 93.31307983398438, 96.39869689941406, 99.48430633544922, 102.56991577148438, 105.65553283691406, 108.74114227294922, 111.8267593383789, 114.91236877441406, 117.99797821044922, 121.08358764648438, 124.16920471191406, 127.25481414794922, 130.34042358398438]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 6.0, 7.0, 11.0, 13.0, 14.0, 9.0, 8.0, 7.0, 19.0, 22.0, 22.0, 27.0, 19.0, 30.0, 27.0, 25.0, 34.0, 31.0, 32.0, 30.0, 44.0, 44.0, 41.0, 38.0, 35.0, 39.0, 35.0, 23.0, 33.0, 29.0, 31.0, 33.0, 10.0, 32.0, 15.0, 18.0, 14.0, 18.0, 14.0, 14.0, 7.0, 7.0, 8.0, 5.0, 4.0, 7.0, 3.0, 1.0, 3.0, 0.0, 3.0], "bins": [-23.70941162109375, -23.038780212402344, -22.36815071105957, -21.697519302368164, -21.026887893676758, -20.356258392333984, -19.685626983642578, -19.014995574951172, -18.344364166259766, -17.67373275756836, -17.003103256225586, -16.33247184753418, -15.661840438842773, -14.991209983825684, -14.320579528808594, -13.649948120117188, -12.979318618774414, -12.308688163757324, -11.638056755065918, -10.967426300048828, -10.296794891357422, -9.626164436340332, -8.955533981323242, -8.284902572631836, -7.614272117614746, -6.943641185760498, -6.27301025390625, -5.60237979888916, -4.931748867034912, -4.261117935180664, -3.590487480163574, -2.919856548309326, -2.249225616455078, -1.5785948038101196, -0.9079639911651611, -0.2373332977294922, 0.43329763412475586, 1.103928565979004, 1.7745590209960938, 2.445189952850342, 3.11582088470459, 3.786451816558838, 4.457082748413086, 5.127713203430176, 5.798344135284424, 6.468975067138672, 7.139605522155762, 7.81023645401001, 8.480867385864258, 9.151497840881348, 9.822129249572754, 10.492759704589844, 11.16339111328125, 11.83402156829834, 12.50465202331543, 13.175283432006836, 13.845913887023926, 14.516544342041016, 15.187175750732422, 15.857806205749512, 16.5284366607666, 17.199068069458008, 17.86969757080078, 18.540328979492188, 19.210960388183594]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 10.0, 6.0, 15.0, 13.0, 14.0, 35.0, 20.0, 24.0, 38.0, 47.0, 51.0, 50.0, 61.0, 71.0, 61.0, 62.0, 57.0, 57.0, 43.0, 46.0, 45.0, 39.0, 30.0, 30.0, 17.0, 19.0, 12.0, 8.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 4.0], "bins": [-3.72265625, -3.6373138427734375, -3.551971435546875, -3.4666290283203125, -3.38128662109375, -3.2959442138671875, -3.210601806640625, -3.1252593994140625, -3.0399169921875, -2.9545745849609375, -2.869232177734375, -2.7838897705078125, -2.69854736328125, -2.6132049560546875, -2.527862548828125, -2.4425201416015625, -2.357177734375, -2.2718353271484375, -2.186492919921875, -2.1011505126953125, -2.01580810546875, -1.9304656982421875, -1.845123291015625, -1.7597808837890625, -1.6744384765625, -1.5890960693359375, -1.503753662109375, -1.4184112548828125, -1.33306884765625, -1.2477264404296875, -1.162384033203125, -1.0770416259765625, -0.99169921875, -0.9063568115234375, -0.821014404296875, -0.7356719970703125, -0.65032958984375, -0.5649871826171875, -0.479644775390625, -0.3943023681640625, -0.3089599609375, -0.2236175537109375, -0.138275146484375, -0.0529327392578125, 0.03240966796875, 0.1177520751953125, 0.203094482421875, 0.2884368896484375, 0.373779296875, 0.4591217041015625, 0.544464111328125, 0.6298065185546875, 0.71514892578125, 0.8004913330078125, 0.885833740234375, 0.9711761474609375, 1.0565185546875, 1.1418609619140625, 1.227203369140625, 1.3125457763671875, 1.39788818359375, 1.4832305908203125, 1.568572998046875, 1.6539154052734375, 1.7392578125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 8.0, 6.0, 3.0, 7.0, 5.0, 16.0, 24.0, 32.0, 35.0, 79.0, 169.0, 228.0, 505.0, 989.0, 1951.0, 4191.0, 8994.0, 20010.0, 46774.0, 120663.0, 392351.0, 290792.0, 92919.0, 37680.0, 15978.0, 7243.0, 3423.0, 1696.0, 798.0, 445.0, 240.0, 114.0, 61.0, 40.0, 21.0, 13.0, 10.0, 16.0, 9.0, 2.0, 7.0, 3.0, 3.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.033721923828125, -0.03278183937072754, -0.03184175491333008, -0.030901670455932617, -0.029961585998535156, -0.029021501541137695, -0.028081417083740234, -0.027141332626342773, -0.026201248168945312, -0.02526116371154785, -0.02432107925415039, -0.02338099479675293, -0.02244091033935547, -0.021500825881958008, -0.020560741424560547, -0.019620656967163086, -0.018680572509765625, -0.017740488052368164, -0.016800403594970703, -0.015860319137573242, -0.014920234680175781, -0.01398015022277832, -0.01304006576538086, -0.012099981307983398, -0.011159896850585938, -0.010219812393188477, -0.009279727935791016, -0.008339643478393555, -0.007399559020996094, -0.006459474563598633, -0.005519390106201172, -0.004579305648803711, -0.00363922119140625, -0.002699136734008789, -0.0017590522766113281, -0.0008189678192138672, 0.00012111663818359375, 0.0010612010955810547, 0.0020012855529785156, 0.0029413700103759766, 0.0038814544677734375, 0.0048215389251708984, 0.005761623382568359, 0.00670170783996582, 0.007641792297363281, 0.008581876754760742, 0.009521961212158203, 0.010462045669555664, 0.011402130126953125, 0.012342214584350586, 0.013282299041748047, 0.014222383499145508, 0.015162467956542969, 0.01610255241394043, 0.01704263687133789, 0.01798272132873535, 0.018922805786132812, 0.019862890243530273, 0.020802974700927734, 0.021743059158325195, 0.022683143615722656, 0.023623228073120117, 0.024563312530517578, 0.02550339698791504, 0.0264434814453125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 5.0, 8.0, 4.0, 5.0, 11.0, 13.0, 11.0, 21.0, 22.0, 19.0, 26.0, 26.0, 24.0, 35.0, 24.0, 34.0, 43.0, 42.0, 49.0, 43.0, 1079.0, 28.0, 41.0, 44.0, 43.0, 41.0, 41.0, 33.0, 33.0, 27.0, 26.0, 17.0, 18.0, 20.0, 19.0, 14.0, 10.0, 9.0, 3.0, 6.0, 2.0, 2.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.41015625, -1.3609466552734375, -1.311737060546875, -1.2625274658203125, -1.21331787109375, -1.1641082763671875, -1.114898681640625, -1.0656890869140625, -1.0164794921875, -0.9672698974609375, -0.918060302734375, -0.8688507080078125, -0.81964111328125, -0.7704315185546875, -0.721221923828125, -0.6720123291015625, -0.622802734375, -0.5735931396484375, -0.524383544921875, -0.4751739501953125, -0.42596435546875, -0.3767547607421875, -0.327545166015625, -0.2783355712890625, -0.2291259765625, -0.1799163818359375, -0.130706787109375, -0.0814971923828125, -0.03228759765625, 0.0169219970703125, 0.066131591796875, 0.1153411865234375, 0.16455078125, 0.2137603759765625, 0.262969970703125, 0.3121795654296875, 0.36138916015625, 0.4105987548828125, 0.459808349609375, 0.5090179443359375, 0.5582275390625, 0.6074371337890625, 0.656646728515625, 0.7058563232421875, 0.75506591796875, 0.8042755126953125, 0.853485107421875, 0.9026947021484375, 0.951904296875, 1.0011138916015625, 1.050323486328125, 1.0995330810546875, 1.14874267578125, 1.1979522705078125, 1.247161865234375, 1.2963714599609375, 1.3455810546875, 1.3947906494140625, 1.444000244140625, 1.4932098388671875, 1.54241943359375, 1.5916290283203125, 1.640838623046875, 1.6900482177734375, 1.7392578125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 5.0, 6.0, 3.0, 11.0, 11.0, 25.0, 19.0, 50.0, 71.0, 100.0, 150.0, 167.0, 283.0, 396.0, 563.0, 888.0, 1261.0, 1882.0, 2821.0, 4419.0, 6614.0, 10492.0, 16334.0, 25679.0, 40772.0, 65585.0, 109625.0, 183174.0, 1263852.0, 139629.0, 82857.0, 50899.0, 31712.0, 19751.0, 12736.0, 8236.0, 5514.0, 3464.0, 2306.0, 1571.0, 1037.0, 685.0, 439.0, 343.0, 244.0, 149.0, 91.0, 68.0, 44.0, 33.0, 34.0, 13.0, 6.0, 2.0, 9.0, 8.0, 2.0, 0.0, 4.0, 3.0], "bins": [-0.005870819091796875, -0.005688667297363281, -0.0055065155029296875, -0.005324363708496094, -0.0051422119140625, -0.004960060119628906, -0.0047779083251953125, -0.004595756530761719, -0.004413604736328125, -0.004231452941894531, -0.0040493011474609375, -0.0038671493530273438, -0.00368499755859375, -0.0035028457641601562, -0.0033206939697265625, -0.0031385421752929688, -0.002956390380859375, -0.0027742385864257812, -0.0025920867919921875, -0.0024099349975585938, -0.002227783203125, -0.0020456314086914062, -0.0018634796142578125, -0.0016813278198242188, -0.001499176025390625, -0.0013170242309570312, -0.0011348724365234375, -0.0009527206420898438, -0.00077056884765625, -0.0005884170532226562, -0.0004062652587890625, -0.00022411346435546875, -4.1961669921875e-05, 0.00014019012451171875, 0.0003223419189453125, 0.0005044937133789062, 0.0006866455078125, 0.0008687973022460938, 0.0010509490966796875, 0.0012331008911132812, 0.001415252685546875, 0.0015974044799804688, 0.0017795562744140625, 0.0019617080688476562, 0.00214385986328125, 0.0023260116577148438, 0.0025081634521484375, 0.0026903152465820312, 0.002872467041015625, 0.0030546188354492188, 0.0032367706298828125, 0.0034189224243164062, 0.00360107421875, 0.0037832260131835938, 0.0039653778076171875, 0.004147529602050781, 0.004329681396484375, 0.004511833190917969, 0.0046939849853515625, 0.004876136779785156, 0.00505828857421875, 0.005240440368652344, 0.0054225921630859375, 0.005604743957519531, 0.005786895751953125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 28.0, 0.0, 0.0, 0.0, 71.0, 0.0, 0.0, 0.0, 147.0, 0.0, 0.0, 475.0, 0.0, 0.0, 0.0, 131.0, 0.0, 0.0, 93.0, 0.0, 0.0, 0.0, 42.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539062e-07, -5.792826414108276e-07, -5.62518835067749e-07, -5.457550287246704e-07, -5.289912223815918e-07, -5.122274160385132e-07, -4.954636096954346e-07, -4.78699803352356e-07, -4.6193599700927734e-07, -4.4517219066619873e-07, -4.284083843231201e-07, -4.116445779800415e-07, -3.948807716369629e-07, -3.781169652938843e-07, -3.6135315895080566e-07, -3.4458935260772705e-07, -3.2782554626464844e-07, -3.110617399215698e-07, -2.942979335784912e-07, -2.775341272354126e-07, -2.60770320892334e-07, -2.4400651454925537e-07, -2.2724270820617676e-07, -2.1047890186309814e-07, -1.9371509552001953e-07, -1.7695128917694092e-07, -1.601874828338623e-07, -1.434236764907837e-07, -1.2665987014770508e-07, -1.0989606380462646e-07, -9.313225746154785e-08, -7.636845111846924e-08, -5.960464477539063e-08, -4.284083843231201e-08, -2.60770320892334e-08, -9.313225746154785e-09, 7.450580596923828e-09, 2.421438694000244e-08, 4.0978193283081055e-08, 5.774199962615967e-08, 7.450580596923828e-08, 9.12696123123169e-08, 1.0803341865539551e-07, 1.2479722499847412e-07, 1.4156103134155273e-07, 1.5832483768463135e-07, 1.7508864402770996e-07, 1.9185245037078857e-07, 2.086162567138672e-07, 2.253800630569458e-07, 2.421438694000244e-07, 2.5890767574310303e-07, 2.7567148208618164e-07, 2.9243528842926025e-07, 3.0919909477233887e-07, 3.259629011154175e-07, 3.427267074584961e-07, 3.594905138015747e-07, 3.762543201446533e-07, 3.9301812648773193e-07, 4.0978193283081055e-07, 4.2654573917388916e-07, 4.4330954551696777e-07, 4.600733518600464e-07, 4.76837158203125e-07]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 7.0, 8.0, 9.0, 19.0, 22.0, 15.0, 43.0, 50.0, 13.0, 70.0, 154.0, 58.0, 114.0, 400.0, 1162.0, 68787.0, 950934.0, 25219.0, 529.0, 405.0, 69.0, 52.0, 177.0, 51.0, 25.0, 43.0, 28.0, 12.0, 24.0, 21.0, 6.0, 6.0, 4.0, 4.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.808208465576172e-06, -7.533468306064606e-06, -7.2587281465530396e-06, -6.983987987041473e-06, -6.709247827529907e-06, -6.434507668018341e-06, -6.159767508506775e-06, -5.885027348995209e-06, -5.610287189483643e-06, -5.335547029972076e-06, -5.06080687046051e-06, -4.786066710948944e-06, -4.511326551437378e-06, -4.236586391925812e-06, -3.961846232414246e-06, -3.6871060729026794e-06, -3.4123659133911133e-06, -3.137625753879547e-06, -2.862885594367981e-06, -2.588145434856415e-06, -2.3134052753448486e-06, -2.0386651158332825e-06, -1.7639249563217163e-06, -1.4891847968101501e-06, -1.214444637298584e-06, -9.397044777870178e-07, -6.649643182754517e-07, -3.902241587638855e-07, -1.1548399925231934e-07, 1.5925616025924683e-07, 4.33996319770813e-07, 7.087364792823792e-07, 9.834766387939453e-07, 1.2582167983055115e-06, 1.5329569578170776e-06, 1.8076971173286438e-06, 2.08243727684021e-06, 2.357177436351776e-06, 2.6319175958633423e-06, 2.9066577553749084e-06, 3.1813979148864746e-06, 3.4561380743980408e-06, 3.730878233909607e-06, 4.005618393421173e-06, 4.280358552932739e-06, 4.555098712444305e-06, 4.829838871955872e-06, 5.104579031467438e-06, 5.379319190979004e-06, 5.65405935049057e-06, 5.928799510002136e-06, 6.203539669513702e-06, 6.4782798290252686e-06, 6.753019988536835e-06, 7.027760148048401e-06, 7.302500307559967e-06, 7.577240467071533e-06, 7.8519806265831e-06, 8.126720786094666e-06, 8.401460945606232e-06, 8.676201105117798e-06, 8.950941264629364e-06, 9.22568142414093e-06, 9.500421583652496e-06, 9.775161743164062e-06]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 9.0, 13.0, 19.0, 32.0, 39.0, 60.0, 65.0, 469.0, 95.0, 81.0, 36.0, 39.0, 25.0, 16.0, 6.0, 6.0, 3.0, 2.0, 2.0], "bins": [-8.073860158219759e-07, -7.921365181573492e-07, -7.768870204927225e-07, -7.616375228280958e-07, -7.463880251634691e-07, -7.311385274988424e-07, -7.158890298342158e-07, -7.006394753261702e-07, -6.853899776615435e-07, -6.701404799969168e-07, -6.548909823322902e-07, -6.396414846676635e-07, -6.243919870030368e-07, -6.091424893384101e-07, -5.938929916737834e-07, -5.786434940091567e-07, -5.6339399634453e-07, -5.481444986799033e-07, -5.328950010152766e-07, -5.1764550335065e-07, -5.023960056860233e-07, -4.871465080213966e-07, -4.7189698193506047e-07, -4.566474842704338e-07, -4.413979866058071e-07, -4.261484889411804e-07, -4.108989912765537e-07, -3.9564949361192703e-07, -3.803999675255909e-07, -3.651504698609642e-07, -3.4990097219633753e-07, -3.3465147453171085e-07, -3.19402033710503e-07, -3.0415253604587633e-07, -2.8890303838124964e-07, -2.7365354071662296e-07, -2.5840404305199627e-07, -2.431545453873696e-07, -2.2790501930103346e-07, -2.1265552163640677e-07, -1.974060239717801e-07, -1.821565263071534e-07, -1.669070286425267e-07, -1.516575167670453e-07, -1.3640801910241862e-07, -1.2115852143779193e-07, -1.0590901666773789e-07, -9.065951189768384e-08, -7.541001423305715e-08, -6.016051656843047e-08, -4.491101179837642e-08, -2.9661510581036055e-08, -1.4412009363695688e-08, 8.374883009309997e-10, 1.6086993070985045e-08, 3.133649784103909e-08, 4.658599550566578e-08, 6.183549317029247e-08, 7.708499794034651e-08, 9.233450271040056e-08, 1.0758400037502724e-07, 1.2283349803965393e-07, 1.3808300991513534e-07, 1.5333250757976202e-07, 1.685820052443887e-07]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 192.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 485.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 199.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.980232238769531e-07, -2.896413207054138e-07, -2.812594175338745e-07, -2.728775143623352e-07, -2.644956111907959e-07, -2.561137080192566e-07, -2.477318048477173e-07, -2.39349901676178e-07, -2.3096799850463867e-07, -2.2258609533309937e-07, -2.1420419216156006e-07, -2.0582228899002075e-07, -1.9744038581848145e-07, -1.8905848264694214e-07, -1.8067657947540283e-07, -1.7229467630386353e-07, -1.6391277313232422e-07, -1.555308699607849e-07, -1.471489667892456e-07, -1.387670636177063e-07, -1.30385160446167e-07, -1.2200325727462769e-07, -1.1362135410308838e-07, -1.0523945093154907e-07, -9.685754776000977e-08, -8.847564458847046e-08, -8.009374141693115e-08, -7.171183824539185e-08, -6.332993507385254e-08, -5.494803190231323e-08, -4.6566128730773926e-08, -3.818422555923462e-08, -2.9802322387695312e-08, -2.1420419216156006e-08, -1.30385160446167e-08, -4.6566128730773926e-09, 3.725290298461914e-09, 1.210719347000122e-08, 2.0489096641540527e-08, 2.8870999813079834e-08, 3.725290298461914e-08, 4.563480615615845e-08, 5.4016709327697754e-08, 6.239861249923706e-08, 7.078051567077637e-08, 7.916241884231567e-08, 8.754432201385498e-08, 9.592622518539429e-08, 1.043081283569336e-07, 1.126900315284729e-07, 1.210719347000122e-07, 1.2945383787155151e-07, 1.3783574104309082e-07, 1.4621764421463013e-07, 1.5459954738616943e-07, 1.6298145055770874e-07, 1.7136335372924805e-07, 1.7974525690078735e-07, 1.8812716007232666e-07, 1.9650906324386597e-07, 2.0489096641540527e-07, 2.1327286958694458e-07, 2.2165477275848389e-07, 2.300366759300232e-07, 2.384185791015625e-07]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 10.0, 6.0, 15.0, 13.0, 14.0, 35.0, 20.0, 24.0, 38.0, 47.0, 51.0, 50.0, 61.0, 71.0, 61.0, 62.0, 57.0, 57.0, 43.0, 46.0, 45.0, 39.0, 30.0, 30.0, 17.0, 19.0, 12.0, 8.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 4.0], "bins": [-3.72265625, -3.6373138427734375, -3.551971435546875, -3.4666290283203125, -3.38128662109375, -3.2959442138671875, -3.210601806640625, -3.1252593994140625, -3.0399169921875, -2.9545745849609375, -2.869232177734375, -2.7838897705078125, -2.69854736328125, -2.6132049560546875, -2.527862548828125, -2.4425201416015625, -2.357177734375, -2.2718353271484375, -2.186492919921875, -2.1011505126953125, -2.01580810546875, -1.9304656982421875, -1.845123291015625, -1.7597808837890625, -1.6744384765625, -1.5890960693359375, -1.503753662109375, -1.4184112548828125, -1.33306884765625, -1.2477264404296875, -1.162384033203125, -1.0770416259765625, -0.99169921875, -0.9063568115234375, -0.821014404296875, -0.7356719970703125, -0.65032958984375, -0.5649871826171875, -0.479644775390625, -0.3943023681640625, -0.3089599609375, -0.2236175537109375, -0.138275146484375, -0.0529327392578125, 0.03240966796875, 0.1177520751953125, 0.203094482421875, 0.2884368896484375, 0.373779296875, 0.4591217041015625, 0.544464111328125, 0.6298065185546875, 0.71514892578125, 0.8004913330078125, 0.885833740234375, 0.9711761474609375, 1.0565185546875, 1.1418609619140625, 1.227203369140625, 1.3125457763671875, 1.39788818359375, 1.4832305908203125, 1.568572998046875, 1.6539154052734375, 1.7392578125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 6.0, 9.0, 3.0, 8.0, 13.0, 19.0, 27.0, 32.0, 43.0, 67.0, 104.0, 169.0, 286.0, 388.0, 704.0, 1135.0, 1861.0, 3099.0, 5562.0, 10882.0, 24094.0, 65284.0, 409928.0, 411091.0, 65019.0, 24087.0, 10945.0, 5669.0, 3118.0, 1888.0, 1060.0, 706.0, 468.0, 260.0, 184.0, 110.0, 70.0, 54.0, 38.0, 21.0, 15.0, 10.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.771484375, -2.689971923828125, -2.60845947265625, -2.526947021484375, -2.4454345703125, -2.363922119140625, -2.28240966796875, -2.200897216796875, -2.119384765625, -2.037872314453125, -1.95635986328125, -1.874847412109375, -1.7933349609375, -1.711822509765625, -1.63031005859375, -1.548797607421875, -1.46728515625, -1.385772705078125, -1.30426025390625, -1.222747802734375, -1.1412353515625, -1.059722900390625, -0.97821044921875, -0.896697998046875, -0.815185546875, -0.733673095703125, -0.65216064453125, -0.570648193359375, -0.4891357421875, -0.407623291015625, -0.32611083984375, -0.244598388671875, -0.1630859375, -0.081573486328125, -6.103515625e-05, 0.081451416015625, 0.1629638671875, 0.244476318359375, 0.32598876953125, 0.407501220703125, 0.489013671875, 0.570526123046875, 0.65203857421875, 0.733551025390625, 0.8150634765625, 0.896575927734375, 0.97808837890625, 1.059600830078125, 1.14111328125, 1.222625732421875, 1.30413818359375, 1.385650634765625, 1.4671630859375, 1.548675537109375, 1.63018798828125, 1.711700439453125, 1.793212890625, 1.874725341796875, 1.95623779296875, 2.037750244140625, 2.1192626953125, 2.200775146484375, 2.28228759765625, 2.363800048828125, 2.4453125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 6.0, 10.0, 1.0, 8.0, 7.0, 7.0, 7.0, 16.0, 11.0, 12.0, 12.0, 21.0, 37.0, 27.0, 31.0, 32.0, 46.0, 36.0, 48.0, 54.0, 64.0, 139.0, 1802.0, 135.0, 52.0, 46.0, 54.0, 50.0, 42.0, 35.0, 24.0, 28.0, 24.0, 14.0, 22.0, 17.0, 12.0, 15.0, 10.0, 14.0, 8.0, 10.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-7.69140625, -7.474609375, -7.2578125, -7.041015625, -6.82421875, -6.607421875, -6.390625, -6.173828125, -5.95703125, -5.740234375, -5.5234375, -5.306640625, -5.08984375, -4.873046875, -4.65625, -4.439453125, -4.22265625, -4.005859375, -3.7890625, -3.572265625, -3.35546875, -3.138671875, -2.921875, -2.705078125, -2.48828125, -2.271484375, -2.0546875, -1.837890625, -1.62109375, -1.404296875, -1.1875, -0.970703125, -0.75390625, -0.537109375, -0.3203125, -0.103515625, 0.11328125, 0.330078125, 0.546875, 0.763671875, 0.98046875, 1.197265625, 1.4140625, 1.630859375, 1.84765625, 2.064453125, 2.28125, 2.498046875, 2.71484375, 2.931640625, 3.1484375, 3.365234375, 3.58203125, 3.798828125, 4.015625, 4.232421875, 4.44921875, 4.666015625, 4.8828125, 5.099609375, 5.31640625, 5.533203125, 5.75, 5.966796875, 6.18359375]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 4.0, 4.0, 9.0, 6.0, 12.0, 15.0, 9.0, 12.0, 16.0, 22.0, 18.0, 22.0, 33.0, 41.0, 58.0, 101.0, 142.0, 288.0, 787.0, 3938.0, 66115.0, 3019429.0, 49836.0, 3294.0, 717.0, 275.0, 121.0, 93.0, 58.0, 44.0, 49.0, 25.0, 20.0, 15.0, 13.0, 10.0, 10.0, 11.0, 4.0, 6.0, 11.0, 5.0, 8.0, 3.0, 0.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.21875, -10.8245849609375, -10.430419921875, -10.0362548828125, -9.64208984375, -9.2479248046875, -8.853759765625, -8.4595947265625, -8.0654296875, -7.6712646484375, -7.277099609375, -6.8829345703125, -6.48876953125, -6.0946044921875, -5.700439453125, -5.3062744140625, -4.912109375, -4.5179443359375, -4.123779296875, -3.7296142578125, -3.33544921875, -2.9412841796875, -2.547119140625, -2.1529541015625, -1.7587890625, -1.3646240234375, -0.970458984375, -0.5762939453125, -0.18212890625, 0.2120361328125, 0.606201171875, 1.0003662109375, 1.39453125, 1.7886962890625, 2.182861328125, 2.5770263671875, 2.97119140625, 3.3653564453125, 3.759521484375, 4.1536865234375, 4.5478515625, 4.9420166015625, 5.336181640625, 5.7303466796875, 6.12451171875, 6.5186767578125, 6.912841796875, 7.3070068359375, 7.701171875, 8.0953369140625, 8.489501953125, 8.8836669921875, 9.27783203125, 9.6719970703125, 10.066162109375, 10.4603271484375, 10.8544921875, 11.2486572265625, 11.642822265625, 12.0369873046875, 12.43115234375, 12.8253173828125, 13.219482421875, 13.6136474609375, 14.0078125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 23.0, 340.0, 580.0, 70.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-90.37042999267578, -88.49588775634766, -86.62135314941406, -84.74681091308594, -82.87227630615234, -80.99773406982422, -79.12319946289062, -77.2486572265625, -75.37411499023438, -73.49957275390625, -71.62503814697266, -69.75049591064453, -67.87596130371094, -66.00141906738281, -64.12688446044922, -62.252342224121094, -60.3778076171875, -58.50326919555664, -56.62873077392578, -54.75419235229492, -52.87965393066406, -51.00511169433594, -49.13057327270508, -47.25603485107422, -45.38149642944336, -43.5069580078125, -41.63241958618164, -39.75788116455078, -37.883338928222656, -36.00880432128906, -34.13426208496094, -32.25972366333008, -30.38518714904785, -28.510648727416992, -26.6361083984375, -24.76156997680664, -22.88703155517578, -21.012493133544922, -19.137954711914062, -17.26341438293457, -15.388875961303711, -13.514337539672852, -11.639798164367676, -9.7652587890625, -7.890720367431641, -6.016181945800781, -4.1416425704956055, -2.2671031951904297, -0.3925647735595703, 1.4819741249084473, 3.356513023376465, 5.231051921844482, 7.1055908203125, 8.98012924194336, 10.854668617248535, 12.729207992553711, 14.60374641418457, 16.47828483581543, 18.352825164794922, 20.22736358642578, 22.10190200805664, 23.9764404296875, 25.85097885131836, 27.72551918029785, 29.60005760192871]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 3.0, 5.0, 2.0, 9.0, 8.0, 10.0, 9.0, 9.0, 9.0, 16.0, 17.0, 17.0, 27.0, 32.0, 27.0, 45.0, 35.0, 30.0, 48.0, 40.0, 45.0, 39.0, 48.0, 40.0, 41.0, 47.0, 39.0, 38.0, 40.0, 24.0, 30.0, 13.0, 30.0, 24.0, 22.0, 15.0, 17.0, 7.0, 10.0, 7.0, 7.0, 3.0, 4.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.774188995361328, -23.012977600097656, -22.251768112182617, -21.490556716918945, -20.729345321655273, -19.968135833740234, -19.206924438476562, -18.44571304321289, -17.68450355529785, -16.92329216003418, -16.16208267211914, -15.400871276855469, -14.639660835266113, -13.878450393676758, -13.117238998413086, -12.35602855682373, -11.594817161560059, -10.833606719970703, -10.072395324707031, -9.311184883117676, -8.54997444152832, -7.788763523101807, -7.027552604675293, -6.2663421630859375, -5.505131244659424, -4.74392032623291, -3.9827098846435547, -3.221498966217041, -2.4602882862091064, -1.6990776062011719, -0.9378666877746582, -0.17665624618530273, 0.5845546722412109, 1.3457653522491455, 2.10697603225708, 2.8681869506835938, 3.6293976306915283, 4.390608310699463, 5.151819229125977, 5.913029670715332, 6.674240589141846, 7.435451507568359, 8.196661949157715, 8.95787239074707, 9.719083786010742, 10.480294227600098, 11.241504669189453, 12.002716064453125, 12.76392650604248, 13.525136947631836, 14.286348342895508, 15.047558784484863, 15.808769226074219, 16.56998062133789, 17.331192016601562, 18.0924015045166, 18.853612899780273, 19.614824295043945, 20.376033782958984, 21.137245178222656, 21.898456573486328, 22.659666061401367, 23.42087745666504, 24.182086944580078, 24.94329833984375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 6.0, 5.0, 2.0, 5.0, 9.0, 17.0, 7.0, 14.0, 19.0, 30.0, 23.0, 33.0, 41.0, 39.0, 48.0, 65.0, 60.0, 66.0, 64.0, 59.0, 59.0, 45.0, 53.0, 32.0, 51.0, 38.0, 33.0, 23.0, 18.0, 17.0, 10.0, 8.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 4.0], "bins": [-3.705078125, -3.6194915771484375, -3.533905029296875, -3.4483184814453125, -3.36273193359375, -3.2771453857421875, -3.191558837890625, -3.1059722900390625, -3.0203857421875, -2.9347991943359375, -2.849212646484375, -2.7636260986328125, -2.67803955078125, -2.5924530029296875, -2.506866455078125, -2.4212799072265625, -2.335693359375, -2.2501068115234375, -2.164520263671875, -2.0789337158203125, -1.99334716796875, -1.9077606201171875, -1.822174072265625, -1.7365875244140625, -1.6510009765625, -1.5654144287109375, -1.479827880859375, -1.3942413330078125, -1.30865478515625, -1.2230682373046875, -1.137481689453125, -1.0518951416015625, -0.96630859375, -0.8807220458984375, -0.795135498046875, -0.7095489501953125, -0.62396240234375, -0.5383758544921875, -0.452789306640625, -0.3672027587890625, -0.2816162109375, -0.1960296630859375, -0.110443115234375, -0.0248565673828125, 0.06072998046875, 0.1463165283203125, 0.231903076171875, 0.3174896240234375, 0.403076171875, 0.4886627197265625, 0.574249267578125, 0.6598358154296875, 0.74542236328125, 0.8310089111328125, 0.916595458984375, 1.0021820068359375, 1.0877685546875, 1.1733551025390625, 1.258941650390625, 1.3445281982421875, 1.43011474609375, 1.5157012939453125, 1.601287841796875, 1.6868743896484375, 1.7724609375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 7.0, 9.0, 14.0, 13.0, 22.0, 20.0, 36.0, 49.0, 62.0, 98.0, 174.0, 328.0, 995.0, 4125.0, 38003.0, 1332077.0, 2745402.0, 65162.0, 5682.0, 1172.0, 318.0, 165.0, 93.0, 78.0, 52.0, 41.0, 23.0, 26.0, 11.0, 5.0, 6.0, 7.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.140625, -18.6632080078125, -18.185791015625, -17.7083740234375, -17.23095703125, -16.7535400390625, -16.276123046875, -15.7987060546875, -15.3212890625, -14.8438720703125, -14.366455078125, -13.8890380859375, -13.41162109375, -12.9342041015625, -12.456787109375, -11.9793701171875, -11.501953125, -11.0245361328125, -10.547119140625, -10.0697021484375, -9.59228515625, -9.1148681640625, -8.637451171875, -8.1600341796875, -7.6826171875, -7.2052001953125, -6.727783203125, -6.2503662109375, -5.77294921875, -5.2955322265625, -4.818115234375, -4.3406982421875, -3.86328125, -3.3858642578125, -2.908447265625, -2.4310302734375, -1.95361328125, -1.4761962890625, -0.998779296875, -0.5213623046875, -0.0439453125, 0.4334716796875, 0.910888671875, 1.3883056640625, 1.86572265625, 2.3431396484375, 2.820556640625, 3.2979736328125, 3.775390625, 4.2528076171875, 4.730224609375, 5.2076416015625, 5.68505859375, 6.1624755859375, 6.639892578125, 7.1173095703125, 7.5947265625, 8.0721435546875, 8.549560546875, 9.0269775390625, 9.50439453125, 9.9818115234375, 10.459228515625, 10.9366455078125, 11.4140625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 9.0, 4.0, 11.0, 6.0, 23.0, 47.0, 72.0, 140.0, 241.0, 526.0, 855.0, 882.0, 554.0, 309.0, 186.0, 100.0, 61.0, 17.0, 14.0, 12.0, 5.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.765625, -19.35467529296875, -18.9437255859375, -18.53277587890625, -18.121826171875, -17.71087646484375, -17.2999267578125, -16.88897705078125, -16.47802734375, -16.06707763671875, -15.6561279296875, -15.24517822265625, -14.834228515625, -14.42327880859375, -14.0123291015625, -13.60137939453125, -13.1904296875, -12.77947998046875, -12.3685302734375, -11.95758056640625, -11.546630859375, -11.13568115234375, -10.7247314453125, -10.31378173828125, -9.90283203125, -9.49188232421875, -9.0809326171875, -8.66998291015625, -8.259033203125, -7.84808349609375, -7.4371337890625, -7.02618408203125, -6.615234375, -6.20428466796875, -5.7933349609375, -5.38238525390625, -4.971435546875, -4.56048583984375, -4.1495361328125, -3.73858642578125, -3.32763671875, -2.91668701171875, -2.5057373046875, -2.09478759765625, -1.683837890625, -1.27288818359375, -0.8619384765625, -0.45098876953125, -0.0400390625, 0.37091064453125, 0.7818603515625, 1.19281005859375, 1.603759765625, 2.01470947265625, 2.4256591796875, 2.83660888671875, 3.24755859375, 3.65850830078125, 4.0694580078125, 4.48040771484375, 4.891357421875, 5.30230712890625, 5.7132568359375, 6.12420654296875, 6.53515625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 5.0, 7.0, 9.0, 11.0, 24.0, 32.0, 32.0, 61.0, 101.0, 202.0, 462.0, 1493.0, 9233.0, 535381.0, 3603709.0, 39293.0, 2881.0, 727.0, 258.0, 125.0, 80.0, 38.0, 31.0, 30.0, 22.0, 8.0, 9.0, 6.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.0625, -25.9453125, -24.828125, -23.7109375, -22.59375, -21.4765625, -20.359375, -19.2421875, -18.125, -17.0078125, -15.890625, -14.7734375, -13.65625, -12.5390625, -11.421875, -10.3046875, -9.1875, -8.0703125, -6.953125, -5.8359375, -4.71875, -3.6015625, -2.484375, -1.3671875, -0.25, 0.8671875, 1.984375, 3.1015625, 4.21875, 5.3359375, 6.453125, 7.5703125, 8.6875, 9.8046875, 10.921875, 12.0390625, 13.15625, 14.2734375, 15.390625, 16.5078125, 17.625, 18.7421875, 19.859375, 20.9765625, 22.09375, 23.2109375, 24.328125, 25.4453125, 26.5625, 27.6796875, 28.796875, 29.9140625, 31.03125, 32.1484375, 33.265625, 34.3828125, 35.5, 36.6171875, 37.734375, 38.8515625, 39.96875, 41.0859375, 42.203125, 43.3203125, 44.4375]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 19.0, 26.0, 38.0, 106.0, 142.0, 177.0, 166.0, 154.0, 84.0, 49.0, 26.0, 12.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.0624008178711, -79.03031158447266, -76.99822235107422, -74.96613311767578, -72.93403625488281, -70.90194702148438, -68.86985778808594, -66.8377685546875, -64.80567932128906, -62.773590087890625, -60.74150085449219, -58.709407806396484, -56.67731857299805, -54.64522933959961, -52.613136291503906, -50.58104705810547, -48.54895782470703, -46.516868591308594, -44.484779357910156, -42.45268630981445, -40.420597076416016, -38.38850784301758, -36.356414794921875, -34.32432556152344, -32.292236328125, -30.260147094726562, -28.228055953979492, -26.195964813232422, -24.163875579833984, -22.131786346435547, -20.099695205688477, -18.067604064941406, -16.0355224609375, -14.003432273864746, -11.971342086791992, -9.939251899719238, -7.907161712646484, -5.8750715255737305, -3.8429813385009766, -1.8108911514282227, 0.22119903564453125, 2.253289222717285, 4.285379409790039, 6.317469596862793, 8.349559783935547, 10.3816499710083, 12.413740158081055, 14.445830345153809, 16.477920532226562, 18.510009765625, 20.54210090637207, 22.57419204711914, 24.606281280517578, 26.638370513916016, 28.670461654663086, 30.702552795410156, 32.734642028808594, 34.76673126220703, 36.79882049560547, 38.83091354370117, 40.86300277709961, 42.89509201049805, 44.92718505859375, 46.95927429199219, 48.991363525390625]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 8.0, 4.0, 7.0, 10.0, 10.0, 9.0, 14.0, 17.0, 14.0, 10.0, 22.0, 23.0, 32.0, 30.0, 36.0, 25.0, 39.0, 37.0, 44.0, 50.0, 37.0, 40.0, 41.0, 34.0, 48.0, 42.0, 35.0, 50.0, 39.0, 29.0, 33.0, 26.0, 27.0, 14.0, 17.0, 13.0, 7.0, 10.0, 8.0, 1.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.678138732910156, -29.807748794555664, -28.937358856201172, -28.06696891784668, -27.196578979492188, -26.326189041137695, -25.455799102783203, -24.58540916442871, -23.71501922607422, -22.844629287719727, -21.974239349365234, -21.103849411010742, -20.23345947265625, -19.363069534301758, -18.492679595947266, -17.622289657592773, -16.75189971923828, -15.881509780883789, -15.011119842529297, -14.140729904174805, -13.270339965820312, -12.39995002746582, -11.529560089111328, -10.659170150756836, -9.788780212402344, -8.918390274047852, -8.04800033569336, -7.177610397338867, -6.307220458984375, -5.436830520629883, -4.566440582275391, -3.6960506439208984, -2.8256607055664062, -1.955270767211914, -1.0848808288574219, -0.2144908905029297, 0.6558990478515625, 1.5262889862060547, 2.396678924560547, 3.267068862915039, 4.137458801269531, 5.007848739624023, 5.878238677978516, 6.748628616333008, 7.6190185546875, 8.489408493041992, 9.359798431396484, 10.230188369750977, 11.100578308105469, 11.970968246459961, 12.841358184814453, 13.711748123168945, 14.582138061523438, 15.45252799987793, 16.322917938232422, 17.193307876586914, 18.063697814941406, 18.9340877532959, 19.80447769165039, 20.674867630004883, 21.545257568359375, 22.415647506713867, 23.28603744506836, 24.15642738342285, 25.026817321777344]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 6.0, 8.0, 11.0, 10.0, 16.0, 20.0, 23.0, 26.0, 33.0, 44.0, 47.0, 46.0, 58.0, 71.0, 55.0, 51.0, 65.0, 60.0, 57.0, 48.0, 31.0, 38.0, 47.0, 27.0, 25.0, 16.0, 19.0, 11.0, 13.0, 7.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0], "bins": [-3.88671875, -3.7968902587890625, -3.707061767578125, -3.6172332763671875, -3.52740478515625, -3.4375762939453125, -3.347747802734375, -3.2579193115234375, -3.1680908203125, -3.0782623291015625, -2.988433837890625, -2.8986053466796875, -2.80877685546875, -2.7189483642578125, -2.629119873046875, -2.5392913818359375, -2.449462890625, -2.3596343994140625, -2.269805908203125, -2.1799774169921875, -2.09014892578125, -2.0003204345703125, -1.910491943359375, -1.8206634521484375, -1.7308349609375, -1.6410064697265625, -1.551177978515625, -1.4613494873046875, -1.37152099609375, -1.2816925048828125, -1.191864013671875, -1.1020355224609375, -1.01220703125, -0.9223785400390625, -0.832550048828125, -0.7427215576171875, -0.65289306640625, -0.5630645751953125, -0.473236083984375, -0.3834075927734375, -0.2935791015625, -0.2037506103515625, -0.113922119140625, -0.0240936279296875, 0.06573486328125, 0.1555633544921875, 0.245391845703125, 0.3352203369140625, 0.425048828125, 0.5148773193359375, 0.604705810546875, 0.6945343017578125, 0.78436279296875, 0.8741912841796875, 0.964019775390625, 1.0538482666015625, 1.1436767578125, 1.2335052490234375, 1.323333740234375, 1.4131622314453125, 1.50299072265625, 1.5928192138671875, 1.682647705078125, 1.7724761962890625, 1.8623046875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 6.0, 9.0, 9.0, 10.0, 14.0, 19.0, 25.0, 33.0, 47.0, 88.0, 181.0, 369.0, 658.0, 1363.0, 2600.0, 4925.0, 9910.0, 19973.0, 42412.0, 97128.0, 287204.0, 364620.0, 119567.0, 50098.0, 23707.0, 11596.0, 5846.0, 2936.0, 1504.0, 785.0, 376.0, 223.0, 118.0, 58.0, 30.0, 25.0, 17.0, 16.0, 14.0, 5.0, 8.0, 3.0, 4.0, 4.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.025360107421875, -0.02448892593383789, -0.02361774444580078, -0.022746562957763672, -0.021875381469726562, -0.021004199981689453, -0.020133018493652344, -0.019261837005615234, -0.018390655517578125, -0.017519474029541016, -0.016648292541503906, -0.015777111053466797, -0.014905929565429688, -0.014034748077392578, -0.013163566589355469, -0.01229238510131836, -0.01142120361328125, -0.01055002212524414, -0.009678840637207031, -0.008807659149169922, -0.007936477661132812, -0.007065296173095703, -0.006194114685058594, -0.005322933197021484, -0.004451751708984375, -0.0035805702209472656, -0.0027093887329101562, -0.0018382072448730469, -0.0009670257568359375, -9.584426879882812e-05, 0.0007753372192382812, 0.0016465187072753906, 0.0025177001953125, 0.0033888816833496094, 0.004260063171386719, 0.005131244659423828, 0.0060024261474609375, 0.006873607635498047, 0.007744789123535156, 0.008615970611572266, 0.009487152099609375, 0.010358333587646484, 0.011229515075683594, 0.012100696563720703, 0.012971878051757812, 0.013843059539794922, 0.014714241027832031, 0.01558542251586914, 0.01645660400390625, 0.01732778549194336, 0.01819896697998047, 0.019070148468017578, 0.019941329956054688, 0.020812511444091797, 0.021683692932128906, 0.022554874420166016, 0.023426055908203125, 0.024297237396240234, 0.025168418884277344, 0.026039600372314453, 0.026910781860351562, 0.027781963348388672, 0.02865314483642578, 0.02952432632446289, 0.0303955078125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 7.0, 6.0, 10.0, 16.0, 10.0, 8.0, 9.0, 14.0, 17.0, 23.0, 26.0, 27.0, 43.0, 29.0, 34.0, 29.0, 32.0, 32.0, 28.0, 46.0, 1064.0, 49.0, 42.0, 39.0, 44.0, 27.0, 31.0, 35.0, 25.0, 29.0, 20.0, 16.0, 22.0, 11.0, 19.0, 14.0, 11.0, 11.0, 8.0, 7.0, 8.0, 7.0, 6.0, 4.0, 9.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-1.525390625, -1.4770965576171875, -1.428802490234375, -1.3805084228515625, -1.33221435546875, -1.2839202880859375, -1.235626220703125, -1.1873321533203125, -1.1390380859375, -1.0907440185546875, -1.042449951171875, -0.9941558837890625, -0.94586181640625, -0.8975677490234375, -0.849273681640625, -0.8009796142578125, -0.752685546875, -0.7043914794921875, -0.656097412109375, -0.6078033447265625, -0.55950927734375, -0.5112152099609375, -0.462921142578125, -0.4146270751953125, -0.3663330078125, -0.3180389404296875, -0.269744873046875, -0.2214508056640625, -0.17315673828125, -0.1248626708984375, -0.076568603515625, -0.0282745361328125, 0.02001953125, 0.0683135986328125, 0.116607666015625, 0.1649017333984375, 0.21319580078125, 0.2614898681640625, 0.309783935546875, 0.3580780029296875, 0.4063720703125, 0.4546661376953125, 0.502960205078125, 0.5512542724609375, 0.59954833984375, 0.6478424072265625, 0.696136474609375, 0.7444305419921875, 0.792724609375, 0.8410186767578125, 0.889312744140625, 0.9376068115234375, 0.98590087890625, 1.0341949462890625, 1.082489013671875, 1.1307830810546875, 1.1790771484375, 1.2273712158203125, 1.275665283203125, 1.3239593505859375, 1.37225341796875, 1.4205474853515625, 1.468841552734375, 1.5171356201171875, 1.5654296875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 9.0, 10.0, 15.0, 27.0, 34.0, 54.0, 81.0, 112.0, 177.0, 225.0, 342.0, 505.0, 724.0, 1007.0, 1594.0, 2203.0, 3244.0, 4990.0, 7429.0, 11256.0, 17022.0, 26036.0, 40485.0, 65056.0, 107252.0, 188773.0, 1269231.0, 132715.0, 78225.0, 48427.0, 30579.0, 19656.0, 13230.0, 8478.0, 5817.0, 3790.0, 2612.0, 1780.0, 1254.0, 847.0, 584.0, 385.0, 263.0, 189.0, 135.0, 95.0, 59.0, 46.0, 34.0, 15.0, 20.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00628662109375, -0.006085038185119629, -0.005883455276489258, -0.005681872367858887, -0.005480289459228516, -0.0052787065505981445, -0.0050771236419677734, -0.004875540733337402, -0.004673957824707031, -0.00447237491607666, -0.004270792007446289, -0.004069209098815918, -0.003867626190185547, -0.0036660432815551758, -0.0034644603729248047, -0.0032628774642944336, -0.0030612945556640625, -0.0028597116470336914, -0.0026581287384033203, -0.0024565458297729492, -0.002254962921142578, -0.002053380012512207, -0.001851797103881836, -0.0016502141952514648, -0.0014486312866210938, -0.0012470483779907227, -0.0010454654693603516, -0.0008438825607299805, -0.0006422996520996094, -0.0004407167434692383, -0.0002391338348388672, -3.7550926208496094e-05, 0.000164031982421875, 0.0003656148910522461, 0.0005671977996826172, 0.0007687807083129883, 0.0009703636169433594, 0.0011719465255737305, 0.0013735294342041016, 0.0015751123428344727, 0.0017766952514648438, 0.001978278160095215, 0.002179861068725586, 0.002381443977355957, 0.002583026885986328, 0.0027846097946166992, 0.0029861927032470703, 0.0031877756118774414, 0.0033893585205078125, 0.0035909414291381836, 0.0037925243377685547, 0.003994107246398926, 0.004195690155029297, 0.004397273063659668, 0.004598855972290039, 0.00480043888092041, 0.005002021789550781, 0.005203604698181152, 0.0054051876068115234, 0.0056067705154418945, 0.005808353424072266, 0.006009936332702637, 0.006211519241333008, 0.006413102149963379, 0.00661468505859375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 0.0, 29.0, 0.0, 0.0, 0.0, 43.0, 0.0, 0.0, 67.0, 0.0, 0.0, 0.0, 121.0, 0.0, 0.0, 0.0, 467.0, 0.0, 0.0, 0.0, 113.0, 0.0, 0.0, 77.0, 0.0, 0.0, 0.0, 37.0, 0.0, 0.0, 0.0, 23.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.172325134277344e-07, -4.0140002965927124e-07, -3.855675458908081e-07, -3.6973506212234497e-07, -3.5390257835388184e-07, -3.380700945854187e-07, -3.2223761081695557e-07, -3.0640512704849243e-07, -2.905726432800293e-07, -2.7474015951156616e-07, -2.5890767574310303e-07, -2.430751919746399e-07, -2.2724270820617676e-07, -2.1141022443771362e-07, -1.955777406692505e-07, -1.7974525690078735e-07, -1.6391277313232422e-07, -1.4808028936386108e-07, -1.3224780559539795e-07, -1.1641532182693481e-07, -1.0058283805847168e-07, -8.475035429000854e-08, -6.891787052154541e-08, -5.3085386753082275e-08, -3.725290298461914e-08, -2.1420419216156006e-08, -5.587935447692871e-09, 1.0244548320770264e-08, 2.60770320892334e-08, 4.190951585769653e-08, 5.774199962615967e-08, 7.35744833946228e-08, 8.940696716308594e-08, 1.0523945093154907e-07, 1.210719347000122e-07, 1.3690441846847534e-07, 1.5273690223693848e-07, 1.685693860054016e-07, 1.8440186977386475e-07, 2.0023435354232788e-07, 2.1606683731079102e-07, 2.3189932107925415e-07, 2.477318048477173e-07, 2.635642886161804e-07, 2.7939677238464355e-07, 2.952292561531067e-07, 3.110617399215698e-07, 3.2689422369003296e-07, 3.427267074584961e-07, 3.5855919122695923e-07, 3.7439167499542236e-07, 3.902241587638855e-07, 4.0605664253234863e-07, 4.2188912630081177e-07, 4.377216100692749e-07, 4.5355409383773804e-07, 4.6938657760620117e-07, 4.852190613746643e-07, 5.010515451431274e-07, 5.168840289115906e-07, 5.327165126800537e-07, 5.485489964485168e-07, 5.6438148021698e-07, 5.802139639854431e-07, 5.960464477539062e-07]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 5.0, 6.0, 3.0, 6.0, 3.0, 5.0, 12.0, 11.0, 16.0, 31.0, 19.0, 34.0, 41.0, 52.0, 67.0, 54.0, 104.0, 112.0, 113.0, 380.0, 1443.0, 40924.0, 909332.0, 89574.0, 5011.0, 448.0, 152.0, 124.0, 98.0, 76.0, 50.0, 51.0, 38.0, 29.0, 27.0, 28.0, 19.0, 18.0, 10.0, 8.0, 7.0, 7.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-8.285045623779297e-06, -8.023343980312347e-06, -7.761642336845398e-06, -7.4999406933784485e-06, -7.238239049911499e-06, -6.9765374064445496e-06, -6.7148357629776e-06, -6.453134119510651e-06, -6.191432476043701e-06, -5.929730832576752e-06, -5.668029189109802e-06, -5.406327545642853e-06, -5.144625902175903e-06, -4.882924258708954e-06, -4.621222615242004e-06, -4.359520971775055e-06, -4.0978193283081055e-06, -3.836117684841156e-06, -3.5744160413742065e-06, -3.312714397907257e-06, -3.0510127544403076e-06, -2.789311110973358e-06, -2.5276094675064087e-06, -2.2659078240394592e-06, -2.0042061805725098e-06, -1.7425045371055603e-06, -1.4808028936386108e-06, -1.2191012501716614e-06, -9.57399606704712e-07, -6.956979632377625e-07, -4.33996319770813e-07, -1.7229467630386353e-07, 8.940696716308594e-08, 3.511086106300354e-07, 6.128102540969849e-07, 8.745118975639343e-07, 1.1362135410308838e-06, 1.3979151844978333e-06, 1.6596168279647827e-06, 1.921318471431732e-06, 2.1830201148986816e-06, 2.444721758365631e-06, 2.7064234018325806e-06, 2.96812504529953e-06, 3.2298266887664795e-06, 3.491528332233429e-06, 3.7532299757003784e-06, 4.014931619167328e-06, 4.276633262634277e-06, 4.538334906101227e-06, 4.800036549568176e-06, 5.061738193035126e-06, 5.323439836502075e-06, 5.585141479969025e-06, 5.846843123435974e-06, 6.108544766902924e-06, 6.370246410369873e-06, 6.6319480538368225e-06, 6.893649697303772e-06, 7.1553513407707214e-06, 7.417052984237671e-06, 7.67875462770462e-06, 7.94045627117157e-06, 8.20215791463852e-06, 8.463859558105469e-06]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 9.0, 12.0, 17.0, 33.0, 42.0, 67.0, 77.0, 431.0, 69.0, 70.0, 52.0, 47.0, 29.0, 19.0, 11.0, 8.0, 7.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.444868970196694e-07, -7.28646341485728e-07, -7.128058427952055e-07, -6.969652872612642e-07, -6.811247317273228e-07, -6.652842330368003e-07, -6.494436775028589e-07, -6.336031219689175e-07, -6.17762623278395e-07, -6.019220677444537e-07, -5.860815690539312e-07, -5.702410135199898e-07, -5.544004579860484e-07, -5.385599592955259e-07, -5.227194037615845e-07, -5.068788482276432e-07, -4.910383495371207e-07, -4.7519782242488873e-07, -4.5935726689094736e-07, -4.435167397787154e-07, -4.276762126664835e-07, -4.1183568555425154e-07, -3.9599513002031017e-07, -3.8015460290807823e-07, -3.6431401895242743e-07, -3.484734918401955e-07, -3.326329363062541e-07, -3.167924091940222e-07, -3.0095188208179025e-07, -2.851113549695583e-07, -2.6927079943561694e-07, -2.53430272323385e-07, -2.375897736328625e-07, -2.2174923230977583e-07, -2.059087051975439e-07, -1.9006816387445724e-07, -1.742276367622253e-07, -1.5838709543913865e-07, -1.42546554116052e-07, -1.2670602700382005e-07, -1.108654856807334e-07, -9.50249514630741e-08, -7.91844172454148e-08, -6.334387592232815e-08, -4.7503341704668856e-08, -3.166280748700956e-08, -1.5822266163922905e-08, 1.8268053736392176e-11, 1.585880227139569e-08, 3.1699336489054986e-08, 4.753987425942796e-08, 6.338041202980094e-08, 7.922094624746023e-08, 9.506148046511953e-08, 1.1090202178820618e-07, 1.2674254890043812e-07, 1.4258309022352478e-07, 1.5842363154661143e-07, 1.7426415865884337e-07, 1.9010469998193003e-07, 2.0594524130501668e-07, 2.2178576841724862e-07, 2.3762630974033527e-07, 2.5346685106342193e-07, 2.6930737817565387e-07]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.0, 0.0, 0.0, 0.0, 0.0, 0.0, 186.0, 0.0, 0.0, 0.0, 0.0, 0.0, 445.0, 0.0, 0.0, 0.0, 0.0, 182.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.0, 0.0, 0.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.980232238769531e-07, -2.8777867555618286e-07, -2.775341272354126e-07, -2.6728957891464233e-07, -2.5704503059387207e-07, -2.468004822731018e-07, -2.3655593395233154e-07, -2.2631138563156128e-07, -2.1606683731079102e-07, -2.0582228899002075e-07, -1.955777406692505e-07, -1.8533319234848022e-07, -1.7508864402770996e-07, -1.648440957069397e-07, -1.5459954738616943e-07, -1.4435499906539917e-07, -1.341104507446289e-07, -1.2386590242385864e-07, -1.1362135410308838e-07, -1.0337680578231812e-07, -9.313225746154785e-08, -8.288770914077759e-08, -7.264316082000732e-08, -6.239861249923706e-08, -5.21540641784668e-08, -4.190951585769653e-08, -3.166496753692627e-08, -2.1420419216156006e-08, -1.1175870895385742e-08, -9.313225746154785e-10, 9.313225746154785e-09, 1.955777406692505e-08, 2.9802322387695312e-08, 4.0046870708465576e-08, 5.029141902923584e-08, 6.05359673500061e-08, 7.078051567077637e-08, 8.102506399154663e-08, 9.12696123123169e-08, 1.0151416063308716e-07, 1.1175870895385742e-07, 1.2200325727462769e-07, 1.3224780559539795e-07, 1.424923539161682e-07, 1.5273690223693848e-07, 1.6298145055770874e-07, 1.73225998878479e-07, 1.8347054719924927e-07, 1.9371509552001953e-07, 2.039596438407898e-07, 2.1420419216156006e-07, 2.2444874048233032e-07, 2.3469328880310059e-07, 2.4493783712387085e-07, 2.551823854446411e-07, 2.654269337654114e-07, 2.7567148208618164e-07, 2.859160304069519e-07, 2.9616057872772217e-07, 3.0640512704849243e-07, 3.166496753692627e-07, 3.2689422369003296e-07, 3.371387720108032e-07, 3.473833203315735e-07, 3.5762786865234375e-07]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 6.0, 8.0, 11.0, 10.0, 16.0, 20.0, 23.0, 26.0, 33.0, 44.0, 47.0, 46.0, 58.0, 71.0, 55.0, 51.0, 65.0, 60.0, 57.0, 48.0, 31.0, 38.0, 47.0, 27.0, 25.0, 16.0, 19.0, 11.0, 13.0, 7.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0], "bins": [-3.88671875, -3.7968902587890625, -3.707061767578125, -3.6172332763671875, -3.52740478515625, -3.4375762939453125, -3.347747802734375, -3.2579193115234375, -3.1680908203125, -3.0782623291015625, -2.988433837890625, -2.8986053466796875, -2.80877685546875, -2.7189483642578125, -2.629119873046875, -2.5392913818359375, -2.449462890625, -2.3596343994140625, -2.269805908203125, -2.1799774169921875, -2.09014892578125, -2.0003204345703125, -1.910491943359375, -1.8206634521484375, -1.7308349609375, -1.6410064697265625, -1.551177978515625, -1.4613494873046875, -1.37152099609375, -1.2816925048828125, -1.191864013671875, -1.1020355224609375, -1.01220703125, -0.9223785400390625, -0.832550048828125, -0.7427215576171875, -0.65289306640625, -0.5630645751953125, -0.473236083984375, -0.3834075927734375, -0.2935791015625, -0.2037506103515625, -0.113922119140625, -0.0240936279296875, 0.06573486328125, 0.1555633544921875, 0.245391845703125, 0.3352203369140625, 0.425048828125, 0.5148773193359375, 0.604705810546875, 0.6945343017578125, 0.78436279296875, 0.8741912841796875, 0.964019775390625, 1.0538482666015625, 1.1436767578125, 1.2335052490234375, 1.323333740234375, 1.4131622314453125, 1.50299072265625, 1.5928192138671875, 1.682647705078125, 1.7724761962890625, 1.8623046875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 9.0, 10.0, 29.0, 41.0, 66.0, 120.0, 255.0, 519.0, 1037.0, 2414.0, 7280.0, 32304.0, 239788.0, 682370.0, 63637.0, 12407.0, 3524.0, 1393.0, 662.0, 316.0, 163.0, 98.0, 46.0, 25.0, 18.0, 7.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-6.80078125, -6.617919921875, -6.43505859375, -6.252197265625, -6.0693359375, -5.886474609375, -5.70361328125, -5.520751953125, -5.337890625, -5.155029296875, -4.97216796875, -4.789306640625, -4.6064453125, -4.423583984375, -4.24072265625, -4.057861328125, -3.875, -3.692138671875, -3.50927734375, -3.326416015625, -3.1435546875, -2.960693359375, -2.77783203125, -2.594970703125, -2.412109375, -2.229248046875, -2.04638671875, -1.863525390625, -1.6806640625, -1.497802734375, -1.31494140625, -1.132080078125, -0.94921875, -0.766357421875, -0.58349609375, -0.400634765625, -0.2177734375, -0.034912109375, 0.14794921875, 0.330810546875, 0.513671875, 0.696533203125, 0.87939453125, 1.062255859375, 1.2451171875, 1.427978515625, 1.61083984375, 1.793701171875, 1.9765625, 2.159423828125, 2.34228515625, 2.525146484375, 2.7080078125, 2.890869140625, 3.07373046875, 3.256591796875, 3.439453125, 3.622314453125, 3.80517578125, 3.988037109375, 4.1708984375, 4.353759765625, 4.53662109375, 4.719482421875, 4.90234375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 17.0, 6.0, 22.0, 21.0, 27.0, 33.0, 34.0, 41.0, 44.0, 58.0, 72.0, 152.0, 1768.0, 267.0, 89.0, 56.0, 58.0, 49.0, 46.0, 35.0, 28.0, 14.0, 25.0, 13.0, 19.0, 8.0, 10.0, 10.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.390625, -9.0740966796875, -8.757568359375, -8.4410400390625, -8.12451171875, -7.8079833984375, -7.491455078125, -7.1749267578125, -6.8583984375, -6.5418701171875, -6.225341796875, -5.9088134765625, -5.59228515625, -5.2757568359375, -4.959228515625, -4.6427001953125, -4.326171875, -4.0096435546875, -3.693115234375, -3.3765869140625, -3.06005859375, -2.7435302734375, -2.427001953125, -2.1104736328125, -1.7939453125, -1.4774169921875, -1.160888671875, -0.8443603515625, -0.52783203125, -0.2113037109375, 0.105224609375, 0.4217529296875, 0.73828125, 1.0548095703125, 1.371337890625, 1.6878662109375, 2.00439453125, 2.3209228515625, 2.637451171875, 2.9539794921875, 3.2705078125, 3.5870361328125, 3.903564453125, 4.2200927734375, 4.53662109375, 4.8531494140625, 5.169677734375, 5.4862060546875, 5.802734375, 6.1192626953125, 6.435791015625, 6.7523193359375, 7.06884765625, 7.3853759765625, 7.701904296875, 8.0184326171875, 8.3349609375, 8.6514892578125, 8.968017578125, 9.2845458984375, 9.60107421875, 9.9176025390625, 10.234130859375, 10.5506591796875, 10.8671875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 14.0, 11.0, 16.0, 18.0, 14.0, 26.0, 27.0, 44.0, 55.0, 80.0, 146.0, 288.0, 604.0, 2319.0, 17220.0, 2034344.0, 1072040.0, 15015.0, 2166.0, 606.0, 233.0, 125.0, 83.0, 43.0, 38.0, 28.0, 27.0, 18.0, 12.0, 12.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.921875, -11.560302734375, -11.19873046875, -10.837158203125, -10.4755859375, -10.114013671875, -9.75244140625, -9.390869140625, -9.029296875, -8.667724609375, -8.30615234375, -7.944580078125, -7.5830078125, -7.221435546875, -6.85986328125, -6.498291015625, -6.13671875, -5.775146484375, -5.41357421875, -5.052001953125, -4.6904296875, -4.328857421875, -3.96728515625, -3.605712890625, -3.244140625, -2.882568359375, -2.52099609375, -2.159423828125, -1.7978515625, -1.436279296875, -1.07470703125, -0.713134765625, -0.3515625, 0.010009765625, 0.37158203125, 0.733154296875, 1.0947265625, 1.456298828125, 1.81787109375, 2.179443359375, 2.541015625, 2.902587890625, 3.26416015625, 3.625732421875, 3.9873046875, 4.348876953125, 4.71044921875, 5.072021484375, 5.43359375, 5.795166015625, 6.15673828125, 6.518310546875, 6.8798828125, 7.241455078125, 7.60302734375, 7.964599609375, 8.326171875, 8.687744140625, 9.04931640625, 9.410888671875, 9.7724609375, 10.134033203125, 10.49560546875, 10.857177734375, 11.21875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 109.0, 554.0, 322.0, 27.0, 2.0, 2.0], "bins": [-134.84300231933594, -132.58731079101562, -130.33163452148438, -128.07594299316406, -125.82025146484375, -123.56456756591797, -121.30887603759766, -119.05319213867188, -116.79750061035156, -114.54181671142578, -112.28612518310547, -110.03044128417969, -107.77474975585938, -105.5190658569336, -103.26337432861328, -101.0076904296875, -98.75199890136719, -96.4963150024414, -94.2406234741211, -91.98493957519531, -89.729248046875, -87.47356414794922, -85.2178726196289, -82.96218872070312, -80.70650482177734, -78.45082092285156, -76.19512939453125, -73.93944549560547, -71.68375396728516, -69.42807006835938, -67.17237854003906, -64.91669464111328, -62.661006927490234, -60.40531921386719, -58.14963150024414, -55.893943786621094, -53.63825607299805, -51.382568359375, -49.12688446044922, -46.871192932128906, -44.615509033203125, -42.35982131958008, -40.10413360595703, -37.848445892333984, -35.59275817871094, -33.33707046508789, -31.081384658813477, -28.82569694519043, -26.57000732421875, -24.314319610595703, -22.058631896972656, -19.80294418334961, -17.547256469726562, -15.291569709777832, -13.035882949829102, -10.780195236206055, -8.524507522583008, -6.268819808959961, -4.013132572174072, -1.7574453353881836, 0.4982423782348633, 2.75393009185791, 5.009616851806641, 7.2653045654296875, 9.520992279052734]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 4.0, 5.0, 6.0, 6.0, 8.0, 9.0, 13.0, 11.0, 16.0, 10.0, 23.0, 26.0, 23.0, 24.0, 27.0, 30.0, 40.0, 32.0, 33.0, 36.0, 34.0, 38.0, 43.0, 50.0, 39.0, 59.0, 36.0, 28.0, 34.0, 26.0, 23.0, 22.0, 29.0, 25.0, 25.0, 13.0, 20.0, 16.0, 16.0, 6.0, 7.0, 9.0, 5.0, 3.0, 5.0, 2.0, 2.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.819372177124023, -23.039987564086914, -22.260604858398438, -21.481220245361328, -20.70183753967285, -19.922452926635742, -19.143070220947266, -18.363685607910156, -17.584300994873047, -16.804916381835938, -16.02553367614746, -15.246149063110352, -14.466766357421875, -13.687381744384766, -12.907998085021973, -12.12861442565918, -11.349231719970703, -10.56984806060791, -9.790464401245117, -9.011079788208008, -8.231697082519531, -7.45231294631958, -6.672928810119629, -5.893545150756836, -5.114161491394043, -4.33477783203125, -3.555393934249878, -2.776010036468506, -1.996626377105713, -1.21724271774292, -0.43785858154296875, 0.3415250778198242, 1.12091064453125, 1.9002944231033325, 2.679678201675415, 3.459062099456787, 4.23844575881958, 5.017829418182373, 5.797213554382324, 6.576597213745117, 7.35598087310791, 8.135364532470703, 8.914748191833496, 9.694131851196289, 10.473516464233398, 11.252899169921875, 12.032283782958984, 12.811667442321777, 13.59105110168457, 14.370434761047363, 15.149818420410156, 15.929203033447266, 16.708585739135742, 17.48797035217285, 18.267353057861328, 19.046737670898438, 19.826122283935547, 20.605506896972656, 21.384889602661133, 22.164274215698242, 22.94365692138672, 23.723041534423828, 24.502426147460938, 25.281808853149414, 26.06119155883789]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 10.0, 8.0, 10.0, 10.0, 15.0, 17.0, 23.0, 21.0, 37.0, 41.0, 50.0, 47.0, 59.0, 52.0, 65.0, 51.0, 66.0, 64.0, 51.0, 52.0, 38.0, 32.0, 45.0, 32.0, 25.0, 17.0, 16.0, 17.0, 11.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0], "bins": [-3.92578125, -3.8353424072265625, -3.744903564453125, -3.6544647216796875, -3.56402587890625, -3.4735870361328125, -3.383148193359375, -3.2927093505859375, -3.2022705078125, -3.1118316650390625, -3.021392822265625, -2.9309539794921875, -2.84051513671875, -2.7500762939453125, -2.659637451171875, -2.5691986083984375, -2.478759765625, -2.3883209228515625, -2.297882080078125, -2.2074432373046875, -2.11700439453125, -2.0265655517578125, -1.936126708984375, -1.8456878662109375, -1.7552490234375, -1.6648101806640625, -1.574371337890625, -1.4839324951171875, -1.39349365234375, -1.3030548095703125, -1.212615966796875, -1.1221771240234375, -1.03173828125, -0.9412994384765625, -0.850860595703125, -0.7604217529296875, -0.66998291015625, -0.5795440673828125, -0.489105224609375, -0.3986663818359375, -0.3082275390625, -0.2177886962890625, -0.127349853515625, -0.0369110107421875, 0.05352783203125, 0.1439666748046875, 0.234405517578125, 0.3248443603515625, 0.415283203125, 0.5057220458984375, 0.596160888671875, 0.6865997314453125, 0.77703857421875, 0.8674774169921875, 0.957916259765625, 1.0483551025390625, 1.1387939453125, 1.2292327880859375, 1.319671630859375, 1.4101104736328125, 1.50054931640625, 1.5909881591796875, 1.681427001953125, 1.7718658447265625, 1.8623046875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 6.0, 18.0, 10.0, 18.0, 30.0, 34.0, 55.0, 84.0, 184.0, 349.0, 860.0, 2489.0, 8812.0, 40269.0, 260567.0, 2598905.0, 1134948.0, 117659.0, 21160.0, 5183.0, 1468.0, 584.0, 257.0, 115.0, 83.0, 28.0, 39.0, 17.0, 14.0, 9.0, 5.0, 10.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-10.984375, -10.71514892578125, -10.4459228515625, -10.17669677734375, -9.907470703125, -9.63824462890625, -9.3690185546875, -9.09979248046875, -8.83056640625, -8.56134033203125, -8.2921142578125, -8.02288818359375, -7.753662109375, -7.48443603515625, -7.2152099609375, -6.94598388671875, -6.6767578125, -6.40753173828125, -6.1383056640625, -5.86907958984375, -5.599853515625, -5.33062744140625, -5.0614013671875, -4.79217529296875, -4.52294921875, -4.25372314453125, -3.9844970703125, -3.71527099609375, -3.446044921875, -3.17681884765625, -2.9075927734375, -2.63836669921875, -2.369140625, -2.09991455078125, -1.8306884765625, -1.56146240234375, -1.292236328125, -1.02301025390625, -0.7537841796875, -0.48455810546875, -0.21533203125, 0.05389404296875, 0.3231201171875, 0.59234619140625, 0.861572265625, 1.13079833984375, 1.4000244140625, 1.66925048828125, 1.9384765625, 2.20770263671875, 2.4769287109375, 2.74615478515625, 3.015380859375, 3.28460693359375, 3.5538330078125, 3.82305908203125, 4.09228515625, 4.36151123046875, 4.6307373046875, 4.89996337890625, 5.169189453125, 5.43841552734375, 5.7076416015625, 5.97686767578125, 6.24609375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 0.0, 1.0, 9.0, 19.0, 14.0, 27.0, 55.0, 56.0, 97.0, 154.0, 237.0, 347.0, 447.0, 582.0, 600.0, 461.0, 305.0, 207.0, 145.0, 105.0, 75.0, 40.0, 35.0, 21.0, 12.0, 11.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1484375, -10.869140625, -10.58984375, -10.310546875, -10.03125, -9.751953125, -9.47265625, -9.193359375, -8.9140625, -8.634765625, -8.35546875, -8.076171875, -7.796875, -7.517578125, -7.23828125, -6.958984375, -6.6796875, -6.400390625, -6.12109375, -5.841796875, -5.5625, -5.283203125, -5.00390625, -4.724609375, -4.4453125, -4.166015625, -3.88671875, -3.607421875, -3.328125, -3.048828125, -2.76953125, -2.490234375, -2.2109375, -1.931640625, -1.65234375, -1.373046875, -1.09375, -0.814453125, -0.53515625, -0.255859375, 0.0234375, 0.302734375, 0.58203125, 0.861328125, 1.140625, 1.419921875, 1.69921875, 1.978515625, 2.2578125, 2.537109375, 2.81640625, 3.095703125, 3.375, 3.654296875, 3.93359375, 4.212890625, 4.4921875, 4.771484375, 5.05078125, 5.330078125, 5.609375, 5.888671875, 6.16796875, 6.447265625, 6.7265625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 5.0, 0.0, 8.0, 10.0, 13.0, 16.0, 18.0, 28.0, 51.0, 96.0, 145.0, 215.0, 380.0, 729.0, 1393.0, 3482.0, 11489.0, 57761.0, 432752.0, 2752728.0, 809583.0, 97679.0, 17216.0, 4823.0, 1781.0, 822.0, 443.0, 242.0, 131.0, 91.0, 52.0, 36.0, 22.0, 13.0, 13.0, 9.0, 8.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.75, -9.3193359375, -8.888671875, -8.4580078125, -8.02734375, -7.5966796875, -7.166015625, -6.7353515625, -6.3046875, -5.8740234375, -5.443359375, -5.0126953125, -4.58203125, -4.1513671875, -3.720703125, -3.2900390625, -2.859375, -2.4287109375, -1.998046875, -1.5673828125, -1.13671875, -0.7060546875, -0.275390625, 0.1552734375, 0.5859375, 1.0166015625, 1.447265625, 1.8779296875, 2.30859375, 2.7392578125, 3.169921875, 3.6005859375, 4.03125, 4.4619140625, 4.892578125, 5.3232421875, 5.75390625, 6.1845703125, 6.615234375, 7.0458984375, 7.4765625, 7.9072265625, 8.337890625, 8.7685546875, 9.19921875, 9.6298828125, 10.060546875, 10.4912109375, 10.921875, 11.3525390625, 11.783203125, 12.2138671875, 12.64453125, 13.0751953125, 13.505859375, 13.9365234375, 14.3671875, 14.7978515625, 15.228515625, 15.6591796875, 16.08984375, 16.5205078125, 16.951171875, 17.3818359375, 17.8125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 14.0, 17.0, 36.0, 54.0, 75.0, 114.0, 124.0, 140.0, 120.0, 111.0, 75.0, 61.0, 33.0, 15.0, 13.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-35.715938568115234, -34.05451583862305, -32.393089294433594, -30.731666564941406, -29.070240020751953, -27.408817291259766, -25.747392654418945, -24.085968017578125, -22.424543380737305, -20.763118743896484, -19.101694107055664, -17.440269470214844, -15.77884578704834, -14.11742115020752, -12.455997467041016, -10.794572830200195, -9.133148193359375, -7.471723556518555, -5.810299396514893, -4.1488752365112305, -2.48745059967041, -0.8260259628295898, 0.8353977203369141, 2.4968223571777344, 4.158246994018555, 5.819671630859375, 7.481095790863037, 9.1425199508667, 10.80394458770752, 12.46536922454834, 14.126792907714844, 15.788217544555664, 17.44963836669922, 19.11106300354004, 20.77248764038086, 22.433910369873047, 24.0953369140625, 25.756759643554688, 27.418184280395508, 29.079608917236328, 30.74103355407715, 32.40245819091797, 34.063880920410156, 35.72530746459961, 37.3867301940918, 39.04815673828125, 40.70957946777344, 42.371002197265625, 44.03242874145508, 45.693851470947266, 47.35527801513672, 49.016700744628906, 50.67812728881836, 52.33955001831055, 54.0009765625, 55.66239929199219, 57.323822021484375, 58.98524475097656, 60.646671295166016, 62.3080940246582, 63.969520568847656, 65.63094329833984, 67.29236602783203, 68.95379638671875, 70.61521911621094]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 9.0, 5.0, 8.0, 10.0, 12.0, 11.0, 15.0, 18.0, 17.0, 19.0, 23.0, 19.0, 30.0, 33.0, 34.0, 36.0, 44.0, 34.0, 40.0, 40.0, 35.0, 43.0, 44.0, 59.0, 31.0, 40.0, 29.0, 31.0, 28.0, 28.0, 21.0, 25.0, 22.0, 19.0, 20.0, 14.0, 12.0, 14.0, 7.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-24.386524200439453, -23.668357849121094, -22.950193405151367, -22.232027053833008, -21.51386070251465, -20.795696258544922, -20.077529907226562, -19.359363555908203, -18.641199111938477, -17.923032760620117, -17.20486831665039, -16.48670196533203, -15.768536567687988, -15.050371170043945, -14.332204818725586, -13.614039421081543, -12.895873069763184, -12.17770767211914, -11.459541320800781, -10.741375923156738, -10.023210525512695, -9.305044174194336, -8.586878776550293, -7.86871337890625, -7.150547504425049, -6.432381629943848, -5.714216232299805, -4.9960503578186035, -4.277884483337402, -3.5597190856933594, -2.841553211212158, -2.1233878135681152, -1.405221939086914, -0.6870562434196472, 0.03110945224761963, 0.7492752075195312, 1.4674408435821533, 2.1856064796447754, 2.9037723541259766, 3.6219377517700195, 4.340103626251221, 5.058269500732422, 5.776434898376465, 6.494600772857666, 7.212766647338867, 7.93093204498291, 8.649097442626953, 9.367263793945312, 10.085429191589355, 10.803594589233398, 11.521760940551758, 12.2399263381958, 12.958091735839844, 13.676258087158203, 14.394423484802246, 15.112588882446289, 15.830755233764648, 16.548921585083008, 17.267086029052734, 17.985252380371094, 18.703418731689453, 19.42158317565918, 20.13974952697754, 20.857913970947266, 21.576080322265625]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 7.0, 6.0, 8.0, 8.0, 6.0, 13.0, 18.0, 20.0, 16.0, 24.0, 33.0, 38.0, 40.0, 53.0, 43.0, 53.0, 55.0, 62.0, 54.0, 46.0, 45.0, 47.0, 36.0, 44.0, 44.0, 36.0, 23.0, 28.0, 28.0, 16.0, 12.0, 13.0, 13.0, 2.0, 7.0, 6.0, 3.0, 1.0, 1.0, 2.0], "bins": [-3.560546875, -3.4758453369140625, -3.391143798828125, -3.3064422607421875, -3.22174072265625, -3.1370391845703125, -3.052337646484375, -2.9676361083984375, -2.8829345703125, -2.7982330322265625, -2.713531494140625, -2.6288299560546875, -2.54412841796875, -2.4594268798828125, -2.374725341796875, -2.2900238037109375, -2.205322265625, -2.1206207275390625, -2.035919189453125, -1.9512176513671875, -1.86651611328125, -1.7818145751953125, -1.697113037109375, -1.6124114990234375, -1.5277099609375, -1.4430084228515625, -1.358306884765625, -1.2736053466796875, -1.18890380859375, -1.1042022705078125, -1.019500732421875, -0.9347991943359375, -0.85009765625, -0.7653961181640625, -0.680694580078125, -0.5959930419921875, -0.51129150390625, -0.4265899658203125, -0.341888427734375, -0.2571868896484375, -0.1724853515625, -0.0877838134765625, -0.003082275390625, 0.0816192626953125, 0.16632080078125, 0.2510223388671875, 0.335723876953125, 0.4204254150390625, 0.505126953125, 0.5898284912109375, 0.674530029296875, 0.7592315673828125, 0.84393310546875, 0.9286346435546875, 1.013336181640625, 1.0980377197265625, 1.1827392578125, 1.2674407958984375, 1.352142333984375, 1.4368438720703125, 1.52154541015625, 1.6062469482421875, 1.690948486328125, 1.7756500244140625, 1.8603515625]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 4.0, 7.0, 18.0, 18.0, 42.0, 42.0, 66.0, 148.0, 197.0, 375.0, 695.0, 1200.0, 2033.0, 3673.0, 6664.0, 12229.0, 23275.0, 46202.0, 100237.0, 252107.0, 339586.0, 136093.0, 60524.0, 29384.0, 15252.0, 8037.0, 4461.0, 2533.0, 1430.0, 835.0, 464.0, 284.0, 168.0, 88.0, 65.0, 34.0, 24.0, 14.0, 13.0, 5.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0264739990234375, -0.02567601203918457, -0.02487802505493164, -0.02408003807067871, -0.02328205108642578, -0.02248406410217285, -0.021686077117919922, -0.020888090133666992, -0.020090103149414062, -0.019292116165161133, -0.018494129180908203, -0.017696142196655273, -0.016898155212402344, -0.016100168228149414, -0.015302181243896484, -0.014504194259643555, -0.013706207275390625, -0.012908220291137695, -0.012110233306884766, -0.011312246322631836, -0.010514259338378906, -0.009716272354125977, -0.008918285369873047, -0.008120298385620117, -0.0073223114013671875, -0.006524324417114258, -0.005726337432861328, -0.0049283504486083984, -0.004130363464355469, -0.003332376480102539, -0.0025343894958496094, -0.0017364025115966797, -0.00093841552734375, -0.0001404285430908203, 0.0006575584411621094, 0.001455545425415039, 0.0022535324096679688, 0.0030515193939208984, 0.003849506378173828, 0.004647493362426758, 0.0054454803466796875, 0.006243467330932617, 0.007041454315185547, 0.007839441299438477, 0.008637428283691406, 0.009435415267944336, 0.010233402252197266, 0.011031389236450195, 0.011829376220703125, 0.012627363204956055, 0.013425350189208984, 0.014223337173461914, 0.015021324157714844, 0.015819311141967773, 0.016617298126220703, 0.017415285110473633, 0.018213272094726562, 0.019011259078979492, 0.019809246063232422, 0.02060723304748535, 0.02140522003173828, 0.02220320701599121, 0.02300119400024414, 0.02379918098449707, 0.02459716796875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 2.0, 5.0, 7.0, 9.0, 8.0, 10.0, 11.0, 19.0, 20.0, 16.0, 30.0, 21.0, 38.0, 29.0, 22.0, 27.0, 39.0, 41.0, 31.0, 51.0, 54.0, 1072.0, 36.0, 42.0, 44.0, 30.0, 42.0, 26.0, 34.0, 17.0, 23.0, 32.0, 18.0, 21.0, 23.0, 19.0, 9.0, 10.0, 12.0, 6.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.673828125, -1.62078857421875, -1.5677490234375, -1.51470947265625, -1.461669921875, -1.40863037109375, -1.3555908203125, -1.30255126953125, -1.24951171875, -1.19647216796875, -1.1434326171875, -1.09039306640625, -1.037353515625, -0.98431396484375, -0.9312744140625, -0.87823486328125, -0.8251953125, -0.77215576171875, -0.7191162109375, -0.66607666015625, -0.613037109375, -0.55999755859375, -0.5069580078125, -0.45391845703125, -0.40087890625, -0.34783935546875, -0.2947998046875, -0.24176025390625, -0.188720703125, -0.13568115234375, -0.0826416015625, -0.02960205078125, 0.0234375, 0.07647705078125, 0.1295166015625, 0.18255615234375, 0.235595703125, 0.28863525390625, 0.3416748046875, 0.39471435546875, 0.44775390625, 0.50079345703125, 0.5538330078125, 0.60687255859375, 0.659912109375, 0.71295166015625, 0.7659912109375, 0.81903076171875, 0.8720703125, 0.92510986328125, 0.9781494140625, 1.03118896484375, 1.084228515625, 1.13726806640625, 1.1903076171875, 1.24334716796875, 1.29638671875, 1.34942626953125, 1.4024658203125, 1.45550537109375, 1.508544921875, 1.56158447265625, 1.6146240234375, 1.66766357421875, 1.720703125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 5.0, 5.0, 5.0, 6.0, 3.0, 19.0, 24.0, 40.0, 65.0, 88.0, 99.0, 174.0, 230.0, 341.0, 516.0, 730.0, 1134.0, 1712.0, 2593.0, 3898.0, 5938.0, 8976.0, 14274.0, 21864.0, 34276.0, 53709.0, 85772.0, 143603.0, 1264873.0, 172471.0, 102471.0, 63815.0, 40097.0, 25912.0, 16534.0, 10467.0, 6966.0, 4455.0, 2943.0, 1984.0, 1362.0, 816.0, 585.0, 396.0, 306.0, 178.0, 123.0, 86.0, 81.0, 46.0, 24.0, 15.0, 9.0, 6.0, 8.0, 6.0, 4.0, 4.0, 2.0, 1.0], "bins": [-0.0065155029296875, -0.006316125392913818, -0.006116747856140137, -0.005917370319366455, -0.0057179927825927734, -0.005518615245819092, -0.00531923770904541, -0.0051198601722717285, -0.004920482635498047, -0.004721105098724365, -0.004521727561950684, -0.004322350025177002, -0.00412297248840332, -0.003923594951629639, -0.003724217414855957, -0.0035248398780822754, -0.0033254623413085938, -0.003126084804534912, -0.0029267072677612305, -0.002727329730987549, -0.002527952194213867, -0.0023285746574401855, -0.002129197120666504, -0.0019298195838928223, -0.0017304420471191406, -0.001531064510345459, -0.0013316869735717773, -0.0011323094367980957, -0.0009329319000244141, -0.0007335543632507324, -0.0005341768264770508, -0.00033479928970336914, -0.0001354217529296875, 6.395578384399414e-05, 0.0002633333206176758, 0.0004627108573913574, 0.0006620883941650391, 0.0008614659309387207, 0.0010608434677124023, 0.001260221004486084, 0.0014595985412597656, 0.0016589760780334473, 0.001858353614807129, 0.0020577311515808105, 0.002257108688354492, 0.002456486225128174, 0.0026558637619018555, 0.002855241298675537, 0.0030546188354492188, 0.0032539963722229004, 0.003453373908996582, 0.0036527514457702637, 0.0038521289825439453, 0.004051506519317627, 0.004250884056091309, 0.00445026159286499, 0.004649639129638672, 0.0048490166664123535, 0.005048394203186035, 0.005247771739959717, 0.0054471492767333984, 0.00564652681350708, 0.005845904350280762, 0.006045281887054443, 0.006244659423828125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 8.0, 0.0, 0.0, 11.0, 0.0, 0.0, 0.0, 15.0, 0.0, 0.0, 15.0, 0.0, 0.0, 30.0, 0.0, 0.0, 67.0, 0.0, 0.0, 123.0, 0.0, 0.0, 0.0, 456.0, 0.0, 0.0, 159.0, 0.0, 0.0, 53.0, 0.0, 0.0, 34.0, 0.0, 0.0, 17.0, 0.0, 0.0, 0.0, 17.0, 0.0, 0.0, 8.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539062e-07, -5.774199962615967e-07, -5.587935447692871e-07, -5.401670932769775e-07, -5.21540641784668e-07, -5.029141902923584e-07, -4.842877388000488e-07, -4.6566128730773926e-07, -4.470348358154297e-07, -4.284083843231201e-07, -4.0978193283081055e-07, -3.91155481338501e-07, -3.725290298461914e-07, -3.5390257835388184e-07, -3.3527612686157227e-07, -3.166496753692627e-07, -2.980232238769531e-07, -2.7939677238464355e-07, -2.60770320892334e-07, -2.421438694000244e-07, -2.2351741790771484e-07, -2.0489096641540527e-07, -1.862645149230957e-07, -1.6763806343078613e-07, -1.4901161193847656e-07, -1.30385160446167e-07, -1.1175870895385742e-07, -9.313225746154785e-08, -7.450580596923828e-08, -5.587935447692871e-08, -3.725290298461914e-08, -1.862645149230957e-08, 0.0, 1.862645149230957e-08, 3.725290298461914e-08, 5.587935447692871e-08, 7.450580596923828e-08, 9.313225746154785e-08, 1.1175870895385742e-07, 1.30385160446167e-07, 1.4901161193847656e-07, 1.6763806343078613e-07, 1.862645149230957e-07, 2.0489096641540527e-07, 2.2351741790771484e-07, 2.421438694000244e-07, 2.60770320892334e-07, 2.7939677238464355e-07, 2.980232238769531e-07, 3.166496753692627e-07, 3.3527612686157227e-07, 3.5390257835388184e-07, 3.725290298461914e-07, 3.91155481338501e-07, 4.0978193283081055e-07, 4.284083843231201e-07, 4.470348358154297e-07, 4.6566128730773926e-07, 4.842877388000488e-07, 5.029141902923584e-07, 5.21540641784668e-07, 5.401670932769775e-07, 5.587935447692871e-07, 5.774199962615967e-07, 5.960464477539062e-07]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 9.0, 5.0, 12.0, 10.0, 7.0, 18.0, 10.0, 14.0, 14.0, 23.0, 32.0, 33.0, 36.0, 35.0, 82.0, 74.0, 132.0, 211.0, 684.0, 3215.0, 94573.0, 925283.0, 20795.0, 2193.0, 395.0, 144.0, 90.0, 104.0, 57.0, 42.0, 35.0, 32.0, 22.0, 26.0, 15.0, 13.0, 16.0, 9.0, 14.0, 7.0, 8.0, 6.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.119510650634766e-06, -8.837319910526276e-06, -8.555129170417786e-06, -8.272938430309296e-06, -7.990747690200806e-06, -7.708556950092316e-06, -7.426366209983826e-06, -7.144175469875336e-06, -6.861984729766846e-06, -6.579793989658356e-06, -6.297603249549866e-06, -6.015412509441376e-06, -5.733221769332886e-06, -5.451031029224396e-06, -5.168840289115906e-06, -4.886649549007416e-06, -4.604458808898926e-06, -4.322268068790436e-06, -4.040077328681946e-06, -3.757886588573456e-06, -3.475695848464966e-06, -3.193505108356476e-06, -2.911314368247986e-06, -2.629123628139496e-06, -2.346932888031006e-06, -2.064742147922516e-06, -1.7825514078140259e-06, -1.5003606677055359e-06, -1.218169927597046e-06, -9.359791874885559e-07, -6.537884473800659e-07, -3.7159770727157593e-07, -8.940696716308594e-08, 1.9278377294540405e-07, 4.7497451305389404e-07, 7.57165253162384e-07, 1.039355993270874e-06, 1.321546733379364e-06, 1.603737473487854e-06, 1.885928213596344e-06, 2.168118953704834e-06, 2.450309693813324e-06, 2.732500433921814e-06, 3.014691174030304e-06, 3.296881914138794e-06, 3.579072654247284e-06, 3.861263394355774e-06, 4.143454134464264e-06, 4.425644874572754e-06, 4.707835614681244e-06, 4.990026354789734e-06, 5.272217094898224e-06, 5.554407835006714e-06, 5.836598575115204e-06, 6.118789315223694e-06, 6.400980055332184e-06, 6.683170795440674e-06, 6.965361535549164e-06, 7.247552275657654e-06, 7.529743015766144e-06, 7.811933755874634e-06, 8.094124495983124e-06, 8.376315236091614e-06, 8.658505976200104e-06, 8.940696716308594e-06]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 15.0, 33.0, 60.0, 118.0, 434.0, 136.0, 95.0, 52.0, 33.0, 14.0, 9.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.125636799770291e-06, -1.0994504009431694e-06, -1.0732640021160478e-06, -1.0470774896020885e-06, -1.0208910907749669e-06, -9.947046919478453e-07, -9.685182931207237e-07, -9.423318374501832e-07, -9.161453817796428e-07, -8.899589829525212e-07, -8.637725272819807e-07, -8.375861284548591e-07, -8.113996727843187e-07, -7.852132739571971e-07, -7.590268751300755e-07, -7.32840419459535e-07, -7.066540206324134e-07, -6.804676218052919e-07, -6.542811661347514e-07, -6.280947673076298e-07, -6.019083116370894e-07, -5.757219128099678e-07, -5.495354571394273e-07, -5.233490583123057e-07, -4.971626594851841e-07, -4.709762322363531e-07, -4.447898049875221e-07, -4.186034061604005e-07, -3.9241695048986003e-07, -3.6623055166273843e-07, -3.400441244139074e-07, -3.138576971650764e-07, -2.8767124149453593e-07, -2.614848142457049e-07, -2.352983869968739e-07, -2.0911197395889758e-07, -1.8292554671006656e-07, -1.5673911946123553e-07, -1.3055270642325922e-07, -1.043662791744282e-07, -7.817985192559718e-08, -5.199342822947983e-08, -2.5807004533362488e-08, 3.794156100411783e-10, 2.6565842858872202e-08, 5.2752270107703225e-08, 7.893868314567953e-08, 1.0512511039451056e-07, 1.3131153764334158e-07, 1.574979648921726e-07, 1.8368439214100363e-07, 2.0987080517897994e-07, 2.3605723242781096e-07, 2.6224364546578727e-07, 2.884300727146183e-07, 3.146164999634493e-07, 3.4080292721228034e-07, 3.6698935446111136e-07, 3.931757817099424e-07, 4.193622089587734e-07, 4.45548607785895e-07, 4.7173506345643546e-07, 4.97921462283557e-07, 5.241079179540975e-07, 5.502943167812191e-07]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 17.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 204.0, 0.0, 0.0, 0.0, 0.0, 0.0, 420.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 228.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.384185791015625e-07, -2.2910535335540771e-07, -2.1979212760925293e-07, -2.1047890186309814e-07, -2.0116567611694336e-07, -1.9185245037078857e-07, -1.825392246246338e-07, -1.73225998878479e-07, -1.6391277313232422e-07, -1.5459954738616943e-07, -1.4528632164001465e-07, -1.3597309589385986e-07, -1.2665987014770508e-07, -1.1734664440155029e-07, -1.0803341865539551e-07, -9.872019290924072e-08, -8.940696716308594e-08, -8.009374141693115e-08, -7.078051567077637e-08, -6.146728992462158e-08, -5.21540641784668e-08, -4.284083843231201e-08, -3.3527612686157227e-08, -2.421438694000244e-08, -1.4901161193847656e-08, -5.587935447692871e-09, 3.725290298461914e-09, 1.30385160446167e-08, 2.2351741790771484e-08, 3.166496753692627e-08, 4.0978193283081055e-08, 5.029141902923584e-08, 5.960464477539063e-08, 6.891787052154541e-08, 7.82310962677002e-08, 8.754432201385498e-08, 9.685754776000977e-08, 1.0617077350616455e-07, 1.1548399925231934e-07, 1.2479722499847412e-07, 1.341104507446289e-07, 1.434236764907837e-07, 1.5273690223693848e-07, 1.6205012798309326e-07, 1.7136335372924805e-07, 1.8067657947540283e-07, 1.8998980522155762e-07, 1.993030309677124e-07, 2.086162567138672e-07, 2.1792948246002197e-07, 2.2724270820617676e-07, 2.3655593395233154e-07, 2.4586915969848633e-07, 2.551823854446411e-07, 2.644956111907959e-07, 2.738088369369507e-07, 2.8312206268310547e-07, 2.9243528842926025e-07, 3.0174851417541504e-07, 3.110617399215698e-07, 3.203749656677246e-07, 3.296881914138794e-07, 3.390014171600342e-07, 3.4831464290618896e-07, 3.5762786865234375e-07]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 7.0, 6.0, 8.0, 8.0, 6.0, 13.0, 18.0, 20.0, 16.0, 24.0, 33.0, 38.0, 40.0, 53.0, 43.0, 53.0, 55.0, 62.0, 54.0, 46.0, 45.0, 47.0, 36.0, 44.0, 44.0, 36.0, 23.0, 28.0, 28.0, 16.0, 12.0, 13.0, 13.0, 2.0, 7.0, 6.0, 3.0, 1.0, 1.0, 2.0], "bins": [-3.560546875, -3.4758453369140625, -3.391143798828125, -3.3064422607421875, -3.22174072265625, -3.1370391845703125, -3.052337646484375, -2.9676361083984375, -2.8829345703125, -2.7982330322265625, -2.713531494140625, -2.6288299560546875, -2.54412841796875, -2.4594268798828125, -2.374725341796875, -2.2900238037109375, -2.205322265625, -2.1206207275390625, -2.035919189453125, -1.9512176513671875, -1.86651611328125, -1.7818145751953125, -1.697113037109375, -1.6124114990234375, -1.5277099609375, -1.4430084228515625, -1.358306884765625, -1.2736053466796875, -1.18890380859375, -1.1042022705078125, -1.019500732421875, -0.9347991943359375, -0.85009765625, -0.7653961181640625, -0.680694580078125, -0.5959930419921875, -0.51129150390625, -0.4265899658203125, -0.341888427734375, -0.2571868896484375, -0.1724853515625, -0.0877838134765625, -0.003082275390625, 0.0816192626953125, 0.16632080078125, 0.2510223388671875, 0.335723876953125, 0.4204254150390625, 0.505126953125, 0.5898284912109375, 0.674530029296875, 0.7592315673828125, 0.84393310546875, 0.9286346435546875, 1.013336181640625, 1.0980377197265625, 1.1827392578125, 1.2674407958984375, 1.352142333984375, 1.4368438720703125, 1.52154541015625, 1.6062469482421875, 1.690948486328125, 1.7756500244140625, 1.8603515625]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 7.0, 9.0, 18.0, 22.0, 28.0, 55.0, 74.0, 116.0, 189.0, 317.0, 498.0, 822.0, 1418.0, 2444.0, 4112.0, 7767.0, 14554.0, 29042.0, 64633.0, 229951.0, 494509.0, 110647.0, 42539.0, 20672.0, 10611.0, 5642.0, 3144.0, 1902.0, 1047.0, 635.0, 420.0, 238.0, 172.0, 107.0, 60.0, 45.0, 27.0, 21.0, 13.0, 9.0, 2.0, 4.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0], "bins": [-3.91015625, -3.80230712890625, -3.6944580078125, -3.58660888671875, -3.478759765625, -3.37091064453125, -3.2630615234375, -3.15521240234375, -3.04736328125, -2.93951416015625, -2.8316650390625, -2.72381591796875, -2.615966796875, -2.50811767578125, -2.4002685546875, -2.29241943359375, -2.1845703125, -2.07672119140625, -1.9688720703125, -1.86102294921875, -1.753173828125, -1.64532470703125, -1.5374755859375, -1.42962646484375, -1.32177734375, -1.21392822265625, -1.1060791015625, -0.99822998046875, -0.890380859375, -0.78253173828125, -0.6746826171875, -0.56683349609375, -0.458984375, -0.35113525390625, -0.2432861328125, -0.13543701171875, -0.027587890625, 0.08026123046875, 0.1881103515625, 0.29595947265625, 0.40380859375, 0.51165771484375, 0.6195068359375, 0.72735595703125, 0.835205078125, 0.94305419921875, 1.0509033203125, 1.15875244140625, 1.2666015625, 1.37445068359375, 1.4822998046875, 1.59014892578125, 1.697998046875, 1.80584716796875, 1.9136962890625, 2.02154541015625, 2.12939453125, 2.23724365234375, 2.3450927734375, 2.45294189453125, 2.560791015625, 2.66864013671875, 2.7764892578125, 2.88433837890625, 2.9921875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 7.0, 2.0, 7.0, 10.0, 6.0, 10.0, 12.0, 16.0, 22.0, 21.0, 33.0, 35.0, 35.0, 12.0, 43.0, 40.0, 40.0, 55.0, 103.0, 181.0, 1501.0, 283.0, 113.0, 54.0, 48.0, 40.0, 47.0, 44.0, 24.0, 36.0, 21.0, 23.0, 19.0, 16.0, 18.0, 13.0, 11.0, 8.0, 9.0, 7.0, 6.0, 4.0, 5.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-7.88671875, -7.64593505859375, -7.4051513671875, -7.16436767578125, -6.923583984375, -6.68280029296875, -6.4420166015625, -6.20123291015625, -5.96044921875, -5.71966552734375, -5.4788818359375, -5.23809814453125, -4.997314453125, -4.75653076171875, -4.5157470703125, -4.27496337890625, -4.0341796875, -3.79339599609375, -3.5526123046875, -3.31182861328125, -3.071044921875, -2.83026123046875, -2.5894775390625, -2.34869384765625, -2.10791015625, -1.86712646484375, -1.6263427734375, -1.38555908203125, -1.144775390625, -0.90399169921875, -0.6632080078125, -0.42242431640625, -0.181640625, 0.05914306640625, 0.2999267578125, 0.54071044921875, 0.781494140625, 1.02227783203125, 1.2630615234375, 1.50384521484375, 1.74462890625, 1.98541259765625, 2.2261962890625, 2.46697998046875, 2.707763671875, 2.94854736328125, 3.1893310546875, 3.43011474609375, 3.6708984375, 3.91168212890625, 4.1524658203125, 4.39324951171875, 4.634033203125, 4.87481689453125, 5.1156005859375, 5.35638427734375, 5.59716796875, 5.83795166015625, 6.0787353515625, 6.31951904296875, 6.560302734375, 6.80108642578125, 7.0418701171875, 7.28265380859375, 7.5234375]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 4.0, 3.0, 3.0, 9.0, 7.0, 7.0, 7.0, 13.0, 12.0, 7.0, 25.0, 19.0, 34.0, 37.0, 40.0, 67.0, 85.0, 147.0, 214.0, 480.0, 1525.0, 7339.0, 56584.0, 2559039.0, 489275.0, 24924.0, 3886.0, 959.0, 338.0, 155.0, 128.0, 71.0, 46.0, 48.0, 39.0, 27.0, 18.0, 21.0, 15.0, 12.0, 7.0, 7.0, 4.0, 7.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.1484375, -10.8087158203125, -10.468994140625, -10.1292724609375, -9.78955078125, -9.4498291015625, -9.110107421875, -8.7703857421875, -8.4306640625, -8.0909423828125, -7.751220703125, -7.4114990234375, -7.07177734375, -6.7320556640625, -6.392333984375, -6.0526123046875, -5.712890625, -5.3731689453125, -5.033447265625, -4.6937255859375, -4.35400390625, -4.0142822265625, -3.674560546875, -3.3348388671875, -2.9951171875, -2.6553955078125, -2.315673828125, -1.9759521484375, -1.63623046875, -1.2965087890625, -0.956787109375, -0.6170654296875, -0.27734375, 0.0623779296875, 0.402099609375, 0.7418212890625, 1.08154296875, 1.4212646484375, 1.760986328125, 2.1007080078125, 2.4404296875, 2.7801513671875, 3.119873046875, 3.4595947265625, 3.79931640625, 4.1390380859375, 4.478759765625, 4.8184814453125, 5.158203125, 5.4979248046875, 5.837646484375, 6.1773681640625, 6.51708984375, 6.8568115234375, 7.196533203125, 7.5362548828125, 7.8759765625, 8.2156982421875, 8.555419921875, 8.8951416015625, 9.23486328125, 9.5745849609375, 9.914306640625, 10.2540283203125, 10.59375]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 42.0, 259.0, 474.0, 211.0, 23.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-109.1397933959961, -107.01485443115234, -104.8899154663086, -102.76497650146484, -100.6400375366211, -98.51509094238281, -96.39015197753906, -94.26521301269531, -92.14027404785156, -90.01533508300781, -87.89039611816406, -85.76545715332031, -83.64051818847656, -81.51557922363281, -79.39064025878906, -77.26569366455078, -75.14076232910156, -73.01582336425781, -70.89088439941406, -68.76594543457031, -66.64100646972656, -64.51606750488281, -62.3911247253418, -60.26618576049805, -58.14124298095703, -56.01630401611328, -53.89136505126953, -51.76642608642578, -49.641483306884766, -47.516544342041016, -45.391605377197266, -43.266666412353516, -41.141727447509766, -39.016788482666016, -36.891849517822266, -34.76690673828125, -32.6419677734375, -30.51702880859375, -28.39208984375, -26.26715087890625, -24.142210006713867, -22.017271041870117, -19.892330169677734, -17.767391204833984, -15.642451286315918, -13.517511367797852, -11.392572402954102, -9.267632484436035, -7.142692565917969, -5.017752647399902, -2.892813205718994, -0.7678737640380859, 1.3570661544799805, 3.482006072998047, 5.606945037841797, 7.731884956359863, 9.85682487487793, 11.981764793395996, 14.106704711914062, 16.231643676757812, 18.356582641601562, 20.481523513793945, 22.606462478637695, 24.731403350830078, 26.856342315673828]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 10.0, 5.0, 9.0, 10.0, 9.0, 17.0, 12.0, 12.0, 32.0, 20.0, 27.0, 31.0, 29.0, 35.0, 42.0, 40.0, 29.0, 43.0, 53.0, 42.0, 39.0, 44.0, 40.0, 39.0, 37.0, 34.0, 31.0, 32.0, 31.0, 28.0, 22.0, 18.0, 22.0, 12.0, 13.0, 9.0, 5.0, 11.0, 5.0, 6.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.180843353271484, -27.292997360229492, -26.405149459838867, -25.517303466796875, -24.62945556640625, -23.741609573364258, -22.853761672973633, -21.96591567993164, -21.078067779541016, -20.190221786499023, -19.3023738861084, -18.414527893066406, -17.52667999267578, -16.63883399963379, -15.750986099243164, -14.863140106201172, -13.975293159484863, -13.087446212768555, -12.199599266052246, -11.311752319335938, -10.423905372619629, -9.53605842590332, -8.648212432861328, -7.760365009307861, -6.872518062591553, -5.984671115875244, -5.0968241691589355, -4.208977699279785, -3.3211305141448975, -2.433283805847168, -1.5454368591308594, -0.6575899124145508, 0.2302570343017578, 1.1181039810180664, 2.005950927734375, 2.8937976360321045, 3.781644582748413, 4.669491291046143, 5.557338237762451, 6.44518518447876, 7.333032131195068, 8.220878601074219, 9.108725547790527, 9.996572494506836, 10.884419441223145, 11.772266387939453, 12.660113334655762, 13.54796028137207, 14.435807228088379, 15.323654174804688, 16.21150016784668, 17.099348068237305, 17.987194061279297, 18.875041961669922, 19.762887954711914, 20.65073585510254, 21.53858184814453, 22.426427841186523, 23.31427574157715, 24.20212173461914, 25.089969635009766, 25.977815628051758, 26.865663528442383, 27.753509521484375, 28.641357421875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 6.0, 8.0, 9.0, 6.0, 8.0, 14.0, 21.0, 13.0, 25.0, 23.0, 32.0, 31.0, 43.0, 44.0, 58.0, 42.0, 52.0, 63.0, 55.0, 54.0, 49.0, 31.0, 40.0, 46.0, 37.0, 37.0, 32.0, 25.0, 28.0, 17.0, 8.0, 17.0, 6.0, 8.0, 8.0, 6.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.49609375, -3.410919189453125, -3.32574462890625, -3.240570068359375, -3.1553955078125, -3.070220947265625, -2.98504638671875, -2.899871826171875, -2.814697265625, -2.729522705078125, -2.64434814453125, -2.559173583984375, -2.4739990234375, -2.388824462890625, -2.30364990234375, -2.218475341796875, -2.13330078125, -2.048126220703125, -1.96295166015625, -1.877777099609375, -1.7926025390625, -1.707427978515625, -1.62225341796875, -1.537078857421875, -1.451904296875, -1.366729736328125, -1.28155517578125, -1.196380615234375, -1.1112060546875, -1.026031494140625, -0.94085693359375, -0.855682373046875, -0.7705078125, -0.685333251953125, -0.60015869140625, -0.514984130859375, -0.4298095703125, -0.344635009765625, -0.25946044921875, -0.174285888671875, -0.089111328125, -0.003936767578125, 0.08123779296875, 0.166412353515625, 0.2515869140625, 0.336761474609375, 0.42193603515625, 0.507110595703125, 0.59228515625, 0.677459716796875, 0.76263427734375, 0.847808837890625, 0.9329833984375, 1.018157958984375, 1.10333251953125, 1.188507080078125, 1.273681640625, 1.358856201171875, 1.44403076171875, 1.529205322265625, 1.6143798828125, 1.699554443359375, 1.78472900390625, 1.869903564453125, 1.955078125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 9.0, 4.0, 7.0, 6.0, 13.0, 14.0, 20.0, 25.0, 31.0, 53.0, 82.0, 153.0, 281.0, 641.0, 1794.0, 5829.0, 23584.0, 130019.0, 1330826.0, 2416278.0, 234868.0, 37435.0, 8399.0, 2366.0, 765.0, 322.0, 176.0, 91.0, 48.0, 39.0, 33.0, 20.0, 19.0, 10.0, 9.0, 10.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.828125, -10.54425048828125, -10.2603759765625, -9.97650146484375, -9.692626953125, -9.40875244140625, -9.1248779296875, -8.84100341796875, -8.55712890625, -8.27325439453125, -7.9893798828125, -7.70550537109375, -7.421630859375, -7.13775634765625, -6.8538818359375, -6.57000732421875, -6.2861328125, -6.00225830078125, -5.7183837890625, -5.43450927734375, -5.150634765625, -4.86676025390625, -4.5828857421875, -4.29901123046875, -4.01513671875, -3.73126220703125, -3.4473876953125, -3.16351318359375, -2.879638671875, -2.59576416015625, -2.3118896484375, -2.02801513671875, -1.744140625, -1.46026611328125, -1.1763916015625, -0.89251708984375, -0.608642578125, -0.32476806640625, -0.0408935546875, 0.24298095703125, 0.52685546875, 0.81072998046875, 1.0946044921875, 1.37847900390625, 1.662353515625, 1.94622802734375, 2.2301025390625, 2.51397705078125, 2.7978515625, 3.08172607421875, 3.3656005859375, 3.64947509765625, 3.933349609375, 4.21722412109375, 4.5010986328125, 4.78497314453125, 5.06884765625, 5.35272216796875, 5.6365966796875, 5.92047119140625, 6.204345703125, 6.48822021484375, 6.7720947265625, 7.05596923828125, 7.33984375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 12.0, 16.0, 28.0, 44.0, 48.0, 62.0, 108.0, 163.0, 233.0, 392.0, 567.0, 672.0, 528.0, 401.0, 272.0, 195.0, 114.0, 83.0, 57.0, 26.0, 18.0, 10.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5234375, -10.2269287109375, -9.930419921875, -9.6339111328125, -9.33740234375, -9.0408935546875, -8.744384765625, -8.4478759765625, -8.1513671875, -7.8548583984375, -7.558349609375, -7.2618408203125, -6.96533203125, -6.6688232421875, -6.372314453125, -6.0758056640625, -5.779296875, -5.4827880859375, -5.186279296875, -4.8897705078125, -4.59326171875, -4.2967529296875, -4.000244140625, -3.7037353515625, -3.4072265625, -3.1107177734375, -2.814208984375, -2.5177001953125, -2.22119140625, -1.9246826171875, -1.628173828125, -1.3316650390625, -1.03515625, -0.7386474609375, -0.442138671875, -0.1456298828125, 0.15087890625, 0.4473876953125, 0.743896484375, 1.0404052734375, 1.3369140625, 1.6334228515625, 1.929931640625, 2.2264404296875, 2.52294921875, 2.8194580078125, 3.115966796875, 3.4124755859375, 3.708984375, 4.0054931640625, 4.302001953125, 4.5985107421875, 4.89501953125, 5.1915283203125, 5.488037109375, 5.7845458984375, 6.0810546875, 6.3775634765625, 6.674072265625, 6.9705810546875, 7.26708984375, 7.5635986328125, 7.860107421875, 8.1566162109375, 8.453125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 11.0, 14.0, 16.0, 29.0, 49.0, 97.0, 122.0, 274.0, 636.0, 1405.0, 4200.0, 17776.0, 128007.0, 1645270.0, 2195144.0, 171556.0, 21964.0, 4905.0, 1488.0, 625.0, 307.0, 167.0, 83.0, 56.0, 26.0, 22.0, 11.0, 5.0, 6.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.8515625, -13.3397216796875, -12.827880859375, -12.3160400390625, -11.80419921875, -11.2923583984375, -10.780517578125, -10.2686767578125, -9.7568359375, -9.2449951171875, -8.733154296875, -8.2213134765625, -7.70947265625, -7.1976318359375, -6.685791015625, -6.1739501953125, -5.662109375, -5.1502685546875, -4.638427734375, -4.1265869140625, -3.61474609375, -3.1029052734375, -2.591064453125, -2.0792236328125, -1.5673828125, -1.0555419921875, -0.543701171875, -0.0318603515625, 0.47998046875, 0.9918212890625, 1.503662109375, 2.0155029296875, 2.52734375, 3.0391845703125, 3.551025390625, 4.0628662109375, 4.57470703125, 5.0865478515625, 5.598388671875, 6.1102294921875, 6.6220703125, 7.1339111328125, 7.645751953125, 8.1575927734375, 8.66943359375, 9.1812744140625, 9.693115234375, 10.2049560546875, 10.716796875, 11.2286376953125, 11.740478515625, 12.2523193359375, 12.76416015625, 13.2760009765625, 13.787841796875, 14.2996826171875, 14.8115234375, 15.3233642578125, 15.835205078125, 16.3470458984375, 16.85888671875, 17.3707275390625, 17.882568359375, 18.3944091796875, 18.90625]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 11.0, 18.0, 39.0, 75.0, 127.0, 140.0, 179.0, 157.0, 125.0, 71.0, 40.0, 17.0, 5.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.4660873413086, -87.30715942382812, -85.14822387695312, -82.98929595947266, -80.83036041259766, -78.67143249511719, -76.51249694824219, -74.35356903076172, -72.19463348388672, -70.03570556640625, -67.87677001953125, -65.71784210205078, -63.55890655517578, -61.39997482299805, -59.24104309082031, -57.082115173339844, -54.92318344116211, -52.764251708984375, -50.60531997680664, -48.446388244628906, -46.28745651245117, -44.12852478027344, -41.96959686279297, -39.81066131591797, -37.6517333984375, -35.492801666259766, -33.33386993408203, -31.174938201904297, -29.016006469726562, -26.857074737548828, -24.698144912719727, -22.539213180541992, -20.38028335571289, -18.221351623535156, -16.062419891357422, -13.903489112854004, -11.74455738067627, -9.585625648498535, -7.426694869995117, -5.267763137817383, -3.1088314056396484, -0.9498999118804932, 1.209031581878662, 3.3679628372192383, 5.526894569396973, 7.685826301574707, 9.844757080078125, 12.00368881225586, 14.162620544433594, 16.321552276611328, 18.480484008789062, 20.639415740966797, 22.79834747314453, 24.957279205322266, 27.116209030151367, 29.2751407623291, 31.434072494506836, 33.59300231933594, 35.75193405151367, 37.910865783691406, 40.06979751586914, 42.228729248046875, 44.38766098022461, 46.546592712402344, 48.70552444458008]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 6.0, 5.0, 2.0, 11.0, 9.0, 11.0, 17.0, 11.0, 6.0, 19.0, 19.0, 24.0, 26.0, 19.0, 43.0, 36.0, 32.0, 42.0, 29.0, 40.0, 41.0, 32.0, 43.0, 39.0, 41.0, 30.0, 42.0, 34.0, 36.0, 31.0, 33.0, 27.0, 23.0, 27.0, 17.0, 22.0, 7.0, 18.0, 7.0, 8.0, 11.0, 7.0, 7.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.8173828125, -23.04169464111328, -22.266006469726562, -21.490318298339844, -20.714630126953125, -19.938941955566406, -19.163253784179688, -18.38756561279297, -17.61187744140625, -16.83618927001953, -16.060501098632812, -15.284812927246094, -14.509124755859375, -13.733436584472656, -12.957748413085938, -12.182060241699219, -11.406371116638184, -10.630682945251465, -9.854994773864746, -9.079306602478027, -8.303618431091309, -7.52793025970459, -6.752241611480713, -5.976553440093994, -5.200865268707275, -4.425177097320557, -3.649488925933838, -2.87380051612854, -2.0981123447418213, -1.3224241733551025, -0.5467357635498047, 0.22895240783691406, 1.0046405792236328, 1.7803287506103516, 2.5560169219970703, 3.331705331802368, 4.107393264770508, 4.883081436157227, 5.6587700843811035, 6.434458255767822, 7.210146427154541, 7.98583459854126, 8.761523246765137, 9.537211418151855, 10.312899589538574, 11.088587760925293, 11.864275932312012, 12.63996410369873, 13.41565227508545, 14.191340446472168, 14.967028617858887, 15.742716789245605, 16.51840591430664, 17.29409408569336, 18.069782257080078, 18.845470428466797, 19.621158599853516, 20.396846771240234, 21.172534942626953, 21.948223114013672, 22.72391128540039, 23.49959945678711, 24.275287628173828, 25.050975799560547, 25.826663970947266]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 11.0, 5.0, 7.0, 8.0, 18.0, 6.0, 20.0, 23.0, 25.0, 27.0, 34.0, 34.0, 37.0, 46.0, 45.0, 43.0, 43.0, 41.0, 47.0, 52.0, 56.0, 36.0, 45.0, 32.0, 35.0, 39.0, 30.0, 36.0, 24.0, 22.0, 16.0, 7.0, 11.0, 10.0, 8.0, 5.0, 4.0, 2.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.84765625, -2.7667236328125, -2.685791015625, -2.6048583984375, -2.52392578125, -2.4429931640625, -2.362060546875, -2.2811279296875, -2.2001953125, -2.1192626953125, -2.038330078125, -1.9573974609375, -1.87646484375, -1.7955322265625, -1.714599609375, -1.6336669921875, -1.552734375, -1.4718017578125, -1.390869140625, -1.3099365234375, -1.22900390625, -1.1480712890625, -1.067138671875, -0.9862060546875, -0.9052734375, -0.8243408203125, -0.743408203125, -0.6624755859375, -0.58154296875, -0.5006103515625, -0.419677734375, -0.3387451171875, -0.2578125, -0.1768798828125, -0.095947265625, -0.0150146484375, 0.06591796875, 0.1468505859375, 0.227783203125, 0.3087158203125, 0.3896484375, 0.4705810546875, 0.551513671875, 0.6324462890625, 0.71337890625, 0.7943115234375, 0.875244140625, 0.9561767578125, 1.037109375, 1.1180419921875, 1.198974609375, 1.2799072265625, 1.36083984375, 1.4417724609375, 1.522705078125, 1.6036376953125, 1.6845703125, 1.7655029296875, 1.846435546875, 1.9273681640625, 2.00830078125, 2.0892333984375, 2.170166015625, 2.2510986328125, 2.33203125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 11.0, 13.0, 15.0, 34.0, 41.0, 100.0, 91.0, 158.0, 271.0, 393.0, 633.0, 909.0, 1501.0, 2274.0, 3601.0, 5668.0, 9213.0, 14961.0, 24773.0, 41512.0, 72850.0, 140577.0, 300815.0, 200347.0, 94747.0, 52862.0, 31032.0, 18674.0, 11412.0, 6914.0, 4422.0, 2702.0, 1787.0, 1166.0, 721.0, 456.0, 339.0, 181.0, 132.0, 80.0, 56.0, 40.0, 25.0, 17.0, 6.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.02142333984375, -0.020747900009155273, -0.020072460174560547, -0.01939702033996582, -0.018721580505371094, -0.018046140670776367, -0.01737070083618164, -0.016695261001586914, -0.016019821166992188, -0.015344381332397461, -0.014668941497802734, -0.013993501663208008, -0.013318061828613281, -0.012642621994018555, -0.011967182159423828, -0.011291742324829102, -0.010616302490234375, -0.009940862655639648, -0.009265422821044922, -0.008589982986450195, -0.007914543151855469, -0.007239103317260742, -0.006563663482666016, -0.005888223648071289, -0.0052127838134765625, -0.004537343978881836, -0.0038619041442871094, -0.003186464309692383, -0.0025110244750976562, -0.0018355846405029297, -0.0011601448059082031, -0.00048470497131347656, 0.00019073486328125, 0.0008661746978759766, 0.0015416145324707031, 0.0022170543670654297, 0.0028924942016601562, 0.003567934036254883, 0.004243373870849609, 0.004918813705444336, 0.0055942535400390625, 0.006269693374633789, 0.006945133209228516, 0.007620573043823242, 0.008296012878417969, 0.008971452713012695, 0.009646892547607422, 0.010322332382202148, 0.010997772216796875, 0.011673212051391602, 0.012348651885986328, 0.013024091720581055, 0.013699531555175781, 0.014374971389770508, 0.015050411224365234, 0.01572585105895996, 0.016401290893554688, 0.017076730728149414, 0.01775217056274414, 0.018427610397338867, 0.019103050231933594, 0.01977849006652832, 0.020453929901123047, 0.021129369735717773, 0.0218048095703125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 7.0, 6.0, 7.0, 12.0, 8.0, 15.0, 17.0, 23.0, 20.0, 35.0, 27.0, 48.0, 27.0, 40.0, 36.0, 46.0, 48.0, 44.0, 1070.0, 53.0, 47.0, 49.0, 57.0, 45.0, 34.0, 32.0, 32.0, 28.0, 21.0, 20.0, 24.0, 12.0, 7.0, 10.0, 6.0, 4.0, 8.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.400390625, -2.334197998046875, -2.26800537109375, -2.201812744140625, -2.1356201171875, -2.069427490234375, -2.00323486328125, -1.937042236328125, -1.870849609375, -1.804656982421875, -1.73846435546875, -1.672271728515625, -1.6060791015625, -1.539886474609375, -1.47369384765625, -1.407501220703125, -1.34130859375, -1.275115966796875, -1.20892333984375, -1.142730712890625, -1.0765380859375, -1.010345458984375, -0.94415283203125, -0.877960205078125, -0.811767578125, -0.745574951171875, -0.67938232421875, -0.613189697265625, -0.5469970703125, -0.480804443359375, -0.41461181640625, -0.348419189453125, -0.2822265625, -0.216033935546875, -0.14984130859375, -0.083648681640625, -0.0174560546875, 0.048736572265625, 0.11492919921875, 0.181121826171875, 0.247314453125, 0.313507080078125, 0.37969970703125, 0.445892333984375, 0.5120849609375, 0.578277587890625, 0.64447021484375, 0.710662841796875, 0.77685546875, 0.843048095703125, 0.90924072265625, 0.975433349609375, 1.0416259765625, 1.107818603515625, 1.17401123046875, 1.240203857421875, 1.306396484375, 1.372589111328125, 1.43878173828125, 1.504974365234375, 1.5711669921875, 1.637359619140625, 1.70355224609375, 1.769744873046875, 1.8359375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 2.0, 6.0, 9.0, 11.0, 9.0, 23.0, 44.0, 66.0, 91.0, 90.0, 181.0, 266.0, 436.0, 632.0, 999.0, 1614.0, 2596.0, 4368.0, 7090.0, 12139.0, 20638.0, 35946.0, 62580.0, 114231.0, 214788.0, 1299303.0, 139965.0, 75396.0, 42456.0, 24804.0, 14559.0, 8506.0, 5015.0, 3135.0, 1872.0, 1167.0, 748.0, 453.0, 307.0, 184.0, 116.0, 84.0, 65.0, 40.0, 31.0, 16.0, 13.0, 15.0, 9.0, 8.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00832366943359375, -0.008064866065979004, -0.007806062698364258, -0.007547259330749512, -0.007288455963134766, -0.0070296525955200195, -0.0067708492279052734, -0.006512045860290527, -0.006253242492675781, -0.005994439125061035, -0.005735635757446289, -0.005476832389831543, -0.005218029022216797, -0.004959225654602051, -0.004700422286987305, -0.004441618919372559, -0.0041828155517578125, -0.003924012184143066, -0.0036652088165283203, -0.0034064054489135742, -0.003147602081298828, -0.002888798713684082, -0.002629995346069336, -0.00237119197845459, -0.0021123886108398438, -0.0018535852432250977, -0.0015947818756103516, -0.0013359785079956055, -0.0010771751403808594, -0.0008183717727661133, -0.0005595684051513672, -0.0003007650375366211, -4.1961669921875e-05, 0.0002168416976928711, 0.0004756450653076172, 0.0007344484329223633, 0.0009932518005371094, 0.0012520551681518555, 0.0015108585357666016, 0.0017696619033813477, 0.0020284652709960938, 0.00228726863861084, 0.002546072006225586, 0.002804875373840332, 0.003063678741455078, 0.0033224821090698242, 0.0035812854766845703, 0.0038400888442993164, 0.0040988922119140625, 0.004357695579528809, 0.004616498947143555, 0.004875302314758301, 0.005134105682373047, 0.005392909049987793, 0.005651712417602539, 0.005910515785217285, 0.006169319152832031, 0.006428122520446777, 0.0066869258880615234, 0.0069457292556762695, 0.007204532623291016, 0.007463335990905762, 0.007722139358520508, 0.007980942726135254, 0.00823974609375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 8.0, 0.0, 8.0, 0.0, 0.0, 15.0, 0.0, 0.0, 28.0, 0.0, 0.0, 33.0, 0.0, 0.0, 69.0, 0.0, 152.0, 0.0, 0.0, 385.0, 0.0, 0.0, 136.0, 0.0, 0.0, 74.0, 0.0, 30.0, 0.0, 0.0, 27.0, 0.0, 0.0, 23.0, 0.0, 0.0, 11.0, 0.0, 0.0, 8.0, 0.0, 5.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.556510925292969e-07, -6.342306733131409e-07, -6.128102540969849e-07, -5.913898348808289e-07, -5.699694156646729e-07, -5.485489964485168e-07, -5.271285772323608e-07, -5.057081580162048e-07, -4.842877388000488e-07, -4.628673195838928e-07, -4.414469003677368e-07, -4.200264811515808e-07, -3.986060619354248e-07, -3.771856427192688e-07, -3.557652235031128e-07, -3.343448042869568e-07, -3.129243850708008e-07, -2.915039658546448e-07, -2.7008354663848877e-07, -2.4866312742233276e-07, -2.2724270820617676e-07, -2.0582228899002075e-07, -1.8440186977386475e-07, -1.6298145055770874e-07, -1.4156103134155273e-07, -1.2014061212539673e-07, -9.872019290924072e-08, -7.729977369308472e-08, -5.587935447692871e-08, -3.4458935260772705e-08, -1.30385160446167e-08, 8.381903171539307e-09, 2.9802322387695312e-08, 5.122274160385132e-08, 7.264316082000732e-08, 9.406358003616333e-08, 1.1548399925231934e-07, 1.3690441846847534e-07, 1.5832483768463135e-07, 1.7974525690078735e-07, 2.0116567611694336e-07, 2.2258609533309937e-07, 2.4400651454925537e-07, 2.654269337654114e-07, 2.868473529815674e-07, 3.082677721977234e-07, 3.296881914138794e-07, 3.511086106300354e-07, 3.725290298461914e-07, 3.939494490623474e-07, 4.153698682785034e-07, 4.367902874946594e-07, 4.5821070671081543e-07, 4.796311259269714e-07, 5.010515451431274e-07, 5.224719643592834e-07, 5.438923835754395e-07, 5.653128027915955e-07, 5.867332220077515e-07, 6.081536412239075e-07, 6.295740604400635e-07, 6.509944796562195e-07, 6.724148988723755e-07, 6.938353180885315e-07, 7.152557373046875e-07]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 1.0, 3.0, 3.0, 4.0, 4.0, 11.0, 18.0, 12.0, 19.0, 23.0, 17.0, 34.0, 39.0, 52.0, 44.0, 65.0, 113.0, 153.0, 243.0, 507.0, 2732.0, 33459.0, 880640.0, 121909.0, 6479.0, 952.0, 295.0, 126.0, 129.0, 67.0, 64.0, 61.0, 37.0, 42.0, 37.0, 25.0, 23.0, 25.0, 20.0, 15.0, 10.0, 8.0, 7.0, 6.0, 4.0, 7.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-9.894371032714844e-06, -9.601004421710968e-06, -9.307637810707092e-06, -9.014271199703217e-06, -8.72090458869934e-06, -8.427537977695465e-06, -8.13417136669159e-06, -7.840804755687714e-06, -7.547438144683838e-06, -7.254071533679962e-06, -6.9607049226760864e-06, -6.667338311672211e-06, -6.373971700668335e-06, -6.080605089664459e-06, -5.7872384786605835e-06, -5.493871867656708e-06, -5.200505256652832e-06, -4.907138645648956e-06, -4.6137720346450806e-06, -4.320405423641205e-06, -4.027038812637329e-06, -3.7336722016334534e-06, -3.4403055906295776e-06, -3.146938979625702e-06, -2.853572368621826e-06, -2.5602057576179504e-06, -2.2668391466140747e-06, -1.973472535610199e-06, -1.6801059246063232e-06, -1.3867393136024475e-06, -1.0933727025985718e-06, -8.00006091594696e-07, -5.066394805908203e-07, -2.1327286958694458e-07, 8.009374141693115e-08, 3.734603524208069e-07, 6.668269634246826e-07, 9.601935744285583e-07, 1.253560185432434e-06, 1.5469267964363098e-06, 1.8402934074401855e-06, 2.1336600184440613e-06, 2.427026629447937e-06, 2.7203932404518127e-06, 3.0137598514556885e-06, 3.307126462459564e-06, 3.60049307346344e-06, 3.893859684467316e-06, 4.187226295471191e-06, 4.480592906475067e-06, 4.773959517478943e-06, 5.067326128482819e-06, 5.360692739486694e-06, 5.65405935049057e-06, 5.947425961494446e-06, 6.2407925724983215e-06, 6.534159183502197e-06, 6.827525794506073e-06, 7.120892405509949e-06, 7.4142590165138245e-06, 7.7076256275177e-06, 8.000992238521576e-06, 8.294358849525452e-06, 8.587725460529327e-06, 8.881092071533203e-06]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 10.0, 11.0, 18.0, 50.0, 122.0, 380.0, 207.0, 125.0, 57.0, 21.0, 9.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2618720575119369e-06, -1.2197108389955247e-06, -1.1775496204791125e-06, -1.1353884019627003e-06, -1.0932271834462881e-06, -1.051065964929876e-06, -1.0089047464134637e-06, -9.667435278970515e-07, -9.245823093806393e-07, -8.824210908642272e-07, -8.40259872347815e-07, -7.980986538314028e-07, -7.559374353149906e-07, -7.137762167985784e-07, -6.716149982821662e-07, -6.29453779765754e-07, -5.872925612493418e-07, -5.451313427329296e-07, -5.029701242165174e-07, -4.6080890570010524e-07, -4.1864768718369305e-07, -3.7648646866728086e-07, -3.3432525015086867e-07, -2.921640316344565e-07, -2.500028131180443e-07, -2.078415946016321e-07, -1.656803760852199e-07, -1.2351915756880771e-07, -8.135793905239552e-08, -3.919672053598333e-08, 2.9644979804288596e-09, 4.512571649684105e-08, 8.728704870009096e-08, 1.2944826721650315e-07, 1.7160948573291535e-07, 2.1377070424932754e-07, 2.5593192276573973e-07, 2.980931412821519e-07, 3.402543597985641e-07, 3.824155783149763e-07, 4.245767968313885e-07, 4.667380153478007e-07, 5.088992338642129e-07, 5.510604523806251e-07, 5.932216708970373e-07, 6.353828894134494e-07, 6.775441079298616e-07, 7.197053264462738e-07, 7.61866544962686e-07, 8.040277634790982e-07, 8.461889819955104e-07, 8.883502005119226e-07, 9.305114190283348e-07, 9.72672637544747e-07, 1.0148338560611592e-06, 1.0569950745775714e-06, 1.0991562930939835e-06, 1.1413175116103957e-06, 1.183478730126808e-06, 1.2256399486432201e-06, 1.2678011671596323e-06, 1.3099623856760445e-06, 1.3521236041924567e-06, 1.3942848227088689e-06, 1.436446041225281e-06]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 15.0, 0.0, 0.0, 0.0, 0.0, 24.0, 0.0, 0.0, 0.0, 0.0, 37.0, 0.0, 0.0, 0.0, 0.0, 95.0, 0.0, 0.0, 0.0, 0.0, 188.0, 0.0, 0.0, 0.0, 0.0, 326.0, 0.0, 0.0, 0.0, 0.0, 192.0, 0.0, 0.0, 0.0, 0.0, 73.0, 0.0, 0.0, 0.0, 0.0, 37.0, 0.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 0.0, 4.0], "bins": [-4.172325134277344e-07, -4.0512531995773315e-07, -3.9301812648773193e-07, -3.809109330177307e-07, -3.688037395477295e-07, -3.5669654607772827e-07, -3.4458935260772705e-07, -3.3248215913772583e-07, -3.203749656677246e-07, -3.082677721977234e-07, -2.9616057872772217e-07, -2.8405338525772095e-07, -2.7194619178771973e-07, -2.598389983177185e-07, -2.477318048477173e-07, -2.3562461137771606e-07, -2.2351741790771484e-07, -2.1141022443771362e-07, -1.993030309677124e-07, -1.8719583749771118e-07, -1.7508864402770996e-07, -1.6298145055770874e-07, -1.5087425708770752e-07, -1.387670636177063e-07, -1.2665987014770508e-07, -1.1455267667770386e-07, -1.0244548320770264e-07, -9.033828973770142e-08, -7.82310962677002e-08, -6.612390279769897e-08, -5.4016709327697754e-08, -4.190951585769653e-08, -2.9802322387695312e-08, -1.7695128917694092e-08, -5.587935447692871e-09, 6.51925802230835e-09, 1.862645149230957e-08, 3.073364496231079e-08, 4.284083843231201e-08, 5.494803190231323e-08, 6.705522537231445e-08, 7.916241884231567e-08, 9.12696123123169e-08, 1.0337680578231812e-07, 1.1548399925231934e-07, 1.2759119272232056e-07, 1.3969838619232178e-07, 1.51805579662323e-07, 1.6391277313232422e-07, 1.7601996660232544e-07, 1.8812716007232666e-07, 2.0023435354232788e-07, 2.123415470123291e-07, 2.2444874048233032e-07, 2.3655593395233154e-07, 2.4866312742233276e-07, 2.60770320892334e-07, 2.728775143623352e-07, 2.849847078323364e-07, 2.9709190130233765e-07, 3.0919909477233887e-07, 3.213062882423401e-07, 3.334134817123413e-07, 3.4552067518234253e-07, 3.5762786865234375e-07]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 11.0, 5.0, 7.0, 8.0, 18.0, 6.0, 20.0, 23.0, 25.0, 27.0, 34.0, 34.0, 37.0, 46.0, 45.0, 43.0, 43.0, 41.0, 47.0, 52.0, 56.0, 36.0, 45.0, 32.0, 35.0, 39.0, 30.0, 36.0, 24.0, 22.0, 16.0, 7.0, 11.0, 10.0, 8.0, 5.0, 4.0, 2.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.84765625, -2.7667236328125, -2.685791015625, -2.6048583984375, -2.52392578125, -2.4429931640625, -2.362060546875, -2.2811279296875, -2.2001953125, -2.1192626953125, -2.038330078125, -1.9573974609375, -1.87646484375, -1.7955322265625, -1.714599609375, -1.6336669921875, -1.552734375, -1.4718017578125, -1.390869140625, -1.3099365234375, -1.22900390625, -1.1480712890625, -1.067138671875, -0.9862060546875, -0.9052734375, -0.8243408203125, -0.743408203125, -0.6624755859375, -0.58154296875, -0.5006103515625, -0.419677734375, -0.3387451171875, -0.2578125, -0.1768798828125, -0.095947265625, -0.0150146484375, 0.06591796875, 0.1468505859375, 0.227783203125, 0.3087158203125, 0.3896484375, 0.4705810546875, 0.551513671875, 0.6324462890625, 0.71337890625, 0.7943115234375, 0.875244140625, 0.9561767578125, 1.037109375, 1.1180419921875, 1.198974609375, 1.2799072265625, 1.36083984375, 1.4417724609375, 1.522705078125, 1.6036376953125, 1.6845703125, 1.7655029296875, 1.846435546875, 1.9273681640625, 2.00830078125, 2.0892333984375, 2.170166015625, 2.2510986328125, 2.33203125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 10.0, 11.0, 18.0, 31.0, 51.0, 62.0, 102.0, 160.0, 292.0, 484.0, 734.0, 1269.0, 2147.0, 3665.0, 6353.0, 11465.0, 20822.0, 40555.0, 90762.0, 510798.0, 226677.0, 63416.0, 30760.0, 16273.0, 9109.0, 5139.0, 2959.0, 1746.0, 1062.0, 620.0, 379.0, 240.0, 140.0, 94.0, 48.0, 41.0, 24.0, 16.0, 9.0, 4.0, 0.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1171875, -3.00506591796875, -2.8929443359375, -2.78082275390625, -2.668701171875, -2.55657958984375, -2.4444580078125, -2.33233642578125, -2.22021484375, -2.10809326171875, -1.9959716796875, -1.88385009765625, -1.771728515625, -1.65960693359375, -1.5474853515625, -1.43536376953125, -1.3232421875, -1.21112060546875, -1.0989990234375, -0.98687744140625, -0.874755859375, -0.76263427734375, -0.6505126953125, -0.53839111328125, -0.42626953125, -0.31414794921875, -0.2020263671875, -0.08990478515625, 0.022216796875, 0.13433837890625, 0.2464599609375, 0.35858154296875, 0.470703125, 0.58282470703125, 0.6949462890625, 0.80706787109375, 0.919189453125, 1.03131103515625, 1.1434326171875, 1.25555419921875, 1.36767578125, 1.47979736328125, 1.5919189453125, 1.70404052734375, 1.816162109375, 1.92828369140625, 2.0404052734375, 2.15252685546875, 2.2646484375, 2.37677001953125, 2.4888916015625, 2.60101318359375, 2.713134765625, 2.82525634765625, 2.9373779296875, 3.04949951171875, 3.16162109375, 3.27374267578125, 3.3858642578125, 3.49798583984375, 3.610107421875, 3.72222900390625, 3.8343505859375, 3.94647216796875, 4.05859375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 7.0, 3.0, 10.0, 10.0, 15.0, 13.0, 16.0, 19.0, 22.0, 22.0, 25.0, 28.0, 34.0, 28.0, 32.0, 41.0, 41.0, 47.0, 88.0, 126.0, 371.0, 1371.0, 146.0, 78.0, 72.0, 61.0, 37.0, 37.0, 32.0, 28.0, 26.0, 28.0, 14.0, 27.0, 14.0, 16.0, 14.0, 10.0, 8.0, 8.0, 4.0, 2.0, 6.0, 3.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-7.546875, -7.3111572265625, -7.075439453125, -6.8397216796875, -6.60400390625, -6.3682861328125, -6.132568359375, -5.8968505859375, -5.6611328125, -5.4254150390625, -5.189697265625, -4.9539794921875, -4.71826171875, -4.4825439453125, -4.246826171875, -4.0111083984375, -3.775390625, -3.5396728515625, -3.303955078125, -3.0682373046875, -2.83251953125, -2.5968017578125, -2.361083984375, -2.1253662109375, -1.8896484375, -1.6539306640625, -1.418212890625, -1.1824951171875, -0.94677734375, -0.7110595703125, -0.475341796875, -0.2396240234375, -0.00390625, 0.2318115234375, 0.467529296875, 0.7032470703125, 0.93896484375, 1.1746826171875, 1.410400390625, 1.6461181640625, 1.8818359375, 2.1175537109375, 2.353271484375, 2.5889892578125, 2.82470703125, 3.0604248046875, 3.296142578125, 3.5318603515625, 3.767578125, 4.0032958984375, 4.239013671875, 4.4747314453125, 4.71044921875, 4.9461669921875, 5.181884765625, 5.4176025390625, 5.6533203125, 5.8890380859375, 6.124755859375, 6.3604736328125, 6.59619140625, 6.8319091796875, 7.067626953125, 7.3033447265625, 7.5390625]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 6.0, 2.0, 3.0, 7.0, 7.0, 11.0, 8.0, 12.0, 18.0, 22.0, 29.0, 34.0, 44.0, 65.0, 79.0, 98.0, 148.0, 255.0, 531.0, 1636.0, 8006.0, 64218.0, 2248069.0, 772585.0, 41619.0, 5724.0, 1218.0, 444.0, 223.0, 149.0, 96.0, 74.0, 63.0, 39.0, 35.0, 27.0, 21.0, 13.0, 12.0, 13.0, 12.0, 9.0, 4.0, 7.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.046875, -11.6807861328125, -11.314697265625, -10.9486083984375, -10.58251953125, -10.2164306640625, -9.850341796875, -9.4842529296875, -9.1181640625, -8.7520751953125, -8.385986328125, -8.0198974609375, -7.65380859375, -7.2877197265625, -6.921630859375, -6.5555419921875, -6.189453125, -5.8233642578125, -5.457275390625, -5.0911865234375, -4.72509765625, -4.3590087890625, -3.992919921875, -3.6268310546875, -3.2607421875, -2.8946533203125, -2.528564453125, -2.1624755859375, -1.79638671875, -1.4302978515625, -1.064208984375, -0.6981201171875, -0.33203125, 0.0340576171875, 0.400146484375, 0.7662353515625, 1.13232421875, 1.4984130859375, 1.864501953125, 2.2305908203125, 2.5966796875, 2.9627685546875, 3.328857421875, 3.6949462890625, 4.06103515625, 4.4271240234375, 4.793212890625, 5.1593017578125, 5.525390625, 5.8914794921875, 6.257568359375, 6.6236572265625, 6.98974609375, 7.3558349609375, 7.721923828125, 8.0880126953125, 8.4541015625, 8.8201904296875, 9.186279296875, 9.5523681640625, 9.91845703125, 10.2845458984375, 10.650634765625, 11.0167236328125, 11.3828125]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 25.0, 115.0, 371.0, 353.0, 129.0, 20.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.97040367126465, -25.831098556518555, -23.691791534423828, -21.552486419677734, -19.41318130493164, -17.273876190185547, -15.134570121765137, -12.995264053344727, -10.855958938598633, -8.716653823852539, -6.577347755432129, -4.438042163848877, -2.298736572265625, -0.15943145751953125, 1.979874610900879, 4.119180679321289, 6.258485794067383, 8.397790908813477, 10.537096977233887, 12.676403045654297, 14.81570816040039, 16.955013275146484, 19.094318389892578, 21.233625411987305, 23.3729305267334, 25.512235641479492, 27.65154266357422, 29.790847778320312, 31.930152893066406, 34.0694580078125, 36.208763122558594, 38.34806823730469, 40.48738098144531, 42.626686096191406, 44.7659912109375, 46.905296325683594, 49.04460144042969, 51.18390655517578, 53.32321548461914, 55.462520599365234, 57.60182571411133, 59.74113082885742, 61.880435943603516, 64.01974487304688, 66.15904998779297, 68.29835510253906, 70.43766021728516, 72.57696533203125, 74.71627044677734, 76.85557556152344, 78.99488067626953, 81.13418579101562, 83.27349090576172, 85.41279602050781, 87.5521011352539, 89.69140625, 91.83071899414062, 93.97002410888672, 96.10932922363281, 98.2486343383789, 100.387939453125, 102.5272445678711, 104.66654968261719, 106.80586242675781, 108.94515991210938]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 5.0, 3.0, 10.0, 8.0, 10.0, 17.0, 19.0, 16.0, 25.0, 23.0, 31.0, 31.0, 23.0, 32.0, 41.0, 38.0, 37.0, 43.0, 53.0, 39.0, 52.0, 49.0, 48.0, 34.0, 31.0, 25.0, 28.0, 28.0, 28.0, 22.0, 22.0, 24.0, 25.0, 15.0, 16.0, 14.0, 8.0, 8.0, 5.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.498703002929688, -26.61612319946289, -25.733543395996094, -24.850963592529297, -23.9683837890625, -23.085803985595703, -22.203222274780273, -21.320642471313477, -20.43806266784668, -19.555482864379883, -18.672903060913086, -17.79032325744629, -16.90774154663086, -16.025161743164062, -15.142581939697266, -14.260002136230469, -13.377422332763672, -12.494842529296875, -11.612262725830078, -10.729681968688965, -9.847102165222168, -8.964522361755371, -8.081941604614258, -7.199361801147461, -6.316781997680664, -5.434202194213867, -4.551621913909912, -3.669041872024536, -2.78646183013916, -1.9038820266723633, -1.0213017463684082, -0.13872146606445312, 0.7438583374023438, 1.6264383792877197, 2.5090184211730957, 3.3915984630584717, 4.274178504943848, 5.1567583084106445, 6.0393385887146, 6.921918869018555, 7.804498672485352, 8.687078475952148, 9.569658279418945, 10.452239036560059, 11.334818840026855, 12.217398643493652, 13.099979400634766, 13.982559204101562, 14.86513900756836, 15.747718811035156, 16.630298614501953, 17.51287841796875, 18.395458221435547, 19.278038024902344, 20.160619735717773, 21.04319953918457, 21.925779342651367, 22.808359146118164, 23.69093894958496, 24.573518753051758, 25.456100463867188, 26.338680267333984, 27.22126007080078, 28.103839874267578, 28.986419677734375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 1.0, 5.0, 8.0, 10.0, 9.0, 9.0, 16.0, 17.0, 20.0, 18.0, 29.0, 39.0, 26.0, 40.0, 39.0, 38.0, 42.0, 45.0, 57.0, 40.0, 45.0, 55.0, 39.0, 47.0, 31.0, 36.0, 43.0, 37.0, 30.0, 25.0, 24.0, 17.0, 13.0, 9.0, 8.0, 9.0, 8.0, 6.0, 3.0, 2.0, 1.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.921875, -2.83978271484375, -2.7576904296875, -2.67559814453125, -2.593505859375, -2.51141357421875, -2.4293212890625, -2.34722900390625, -2.26513671875, -2.18304443359375, -2.1009521484375, -2.01885986328125, -1.936767578125, -1.85467529296875, -1.7725830078125, -1.69049072265625, -1.6083984375, -1.52630615234375, -1.4442138671875, -1.36212158203125, -1.280029296875, -1.19793701171875, -1.1158447265625, -1.03375244140625, -0.95166015625, -0.86956787109375, -0.7874755859375, -0.70538330078125, -0.623291015625, -0.54119873046875, -0.4591064453125, -0.37701416015625, -0.294921875, -0.21282958984375, -0.1307373046875, -0.04864501953125, 0.033447265625, 0.11553955078125, 0.1976318359375, 0.27972412109375, 0.36181640625, 0.44390869140625, 0.5260009765625, 0.60809326171875, 0.690185546875, 0.77227783203125, 0.8543701171875, 0.93646240234375, 1.0185546875, 1.10064697265625, 1.1827392578125, 1.26483154296875, 1.346923828125, 1.42901611328125, 1.5111083984375, 1.59320068359375, 1.67529296875, 1.75738525390625, 1.8394775390625, 1.92156982421875, 2.003662109375, 2.08575439453125, 2.1678466796875, 2.24993896484375, 2.33203125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 4.0, 2.0, 7.0, 9.0, 18.0, 26.0, 30.0, 47.0, 58.0, 110.0, 143.0, 242.0, 373.0, 623.0, 1208.0, 2147.0, 4592.0, 10749.0, 28554.0, 88735.0, 338832.0, 1601647.0, 1627736.0, 347646.0, 90778.0, 29420.0, 10783.0, 4668.0, 2270.0, 1171.0, 684.0, 341.0, 220.0, 132.0, 83.0, 62.0, 48.0, 30.0, 17.0, 16.0, 10.0, 6.0, 3.0, 6.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.25, -5.0806884765625, -4.911376953125, -4.7420654296875, -4.57275390625, -4.4034423828125, -4.234130859375, -4.0648193359375, -3.8955078125, -3.7261962890625, -3.556884765625, -3.3875732421875, -3.21826171875, -3.0489501953125, -2.879638671875, -2.7103271484375, -2.541015625, -2.3717041015625, -2.202392578125, -2.0330810546875, -1.86376953125, -1.6944580078125, -1.525146484375, -1.3558349609375, -1.1865234375, -1.0172119140625, -0.847900390625, -0.6785888671875, -0.50927734375, -0.3399658203125, -0.170654296875, -0.0013427734375, 0.16796875, 0.3372802734375, 0.506591796875, 0.6759033203125, 0.84521484375, 1.0145263671875, 1.183837890625, 1.3531494140625, 1.5224609375, 1.6917724609375, 1.861083984375, 2.0303955078125, 2.19970703125, 2.3690185546875, 2.538330078125, 2.7076416015625, 2.876953125, 3.0462646484375, 3.215576171875, 3.3848876953125, 3.55419921875, 3.7235107421875, 3.892822265625, 4.0621337890625, 4.2314453125, 4.4007568359375, 4.570068359375, 4.7393798828125, 4.90869140625, 5.0780029296875, 5.247314453125, 5.4166259765625, 5.5859375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 7.0, 11.0, 12.0, 23.0, 27.0, 36.0, 76.0, 95.0, 147.0, 175.0, 279.0, 328.0, 479.0, 550.0, 468.0, 409.0, 277.0, 212.0, 164.0, 99.0, 71.0, 48.0, 22.0, 11.0, 20.0, 11.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.4140625, -9.16363525390625, -8.9132080078125, -8.66278076171875, -8.412353515625, -8.16192626953125, -7.9114990234375, -7.66107177734375, -7.41064453125, -7.16021728515625, -6.9097900390625, -6.65936279296875, -6.408935546875, -6.15850830078125, -5.9080810546875, -5.65765380859375, -5.4072265625, -5.15679931640625, -4.9063720703125, -4.65594482421875, -4.405517578125, -4.15509033203125, -3.9046630859375, -3.65423583984375, -3.40380859375, -3.15338134765625, -2.9029541015625, -2.65252685546875, -2.402099609375, -2.15167236328125, -1.9012451171875, -1.65081787109375, -1.400390625, -1.14996337890625, -0.8995361328125, -0.64910888671875, -0.398681640625, -0.14825439453125, 0.1021728515625, 0.35260009765625, 0.60302734375, 0.85345458984375, 1.1038818359375, 1.35430908203125, 1.604736328125, 1.85516357421875, 2.1055908203125, 2.35601806640625, 2.6064453125, 2.85687255859375, 3.1072998046875, 3.35772705078125, 3.608154296875, 3.85858154296875, 4.1090087890625, 4.35943603515625, 4.60986328125, 4.86029052734375, 5.1107177734375, 5.36114501953125, 5.611572265625, 5.86199951171875, 6.1124267578125, 6.36285400390625, 6.61328125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 7.0, 7.0, 13.0, 11.0, 12.0, 26.0, 17.0, 38.0, 40.0, 63.0, 99.0, 119.0, 214.0, 338.0, 592.0, 1071.0, 2202.0, 5498.0, 17693.0, 71066.0, 358900.0, 1900467.0, 1489859.0, 268098.0, 54639.0, 14235.0, 4642.0, 1926.0, 941.0, 513.0, 321.0, 178.0, 125.0, 77.0, 53.0, 31.0, 33.0, 22.0, 23.0, 14.0, 16.0, 17.0, 7.0, 5.0, 10.0, 0.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.140625, -9.8228759765625, -9.505126953125, -9.1873779296875, -8.86962890625, -8.5518798828125, -8.234130859375, -7.9163818359375, -7.5986328125, -7.2808837890625, -6.963134765625, -6.6453857421875, -6.32763671875, -6.0098876953125, -5.692138671875, -5.3743896484375, -5.056640625, -4.7388916015625, -4.421142578125, -4.1033935546875, -3.78564453125, -3.4678955078125, -3.150146484375, -2.8323974609375, -2.5146484375, -2.1968994140625, -1.879150390625, -1.5614013671875, -1.24365234375, -0.9259033203125, -0.608154296875, -0.2904052734375, 0.02734375, 0.3450927734375, 0.662841796875, 0.9805908203125, 1.29833984375, 1.6160888671875, 1.933837890625, 2.2515869140625, 2.5693359375, 2.8870849609375, 3.204833984375, 3.5225830078125, 3.84033203125, 4.1580810546875, 4.475830078125, 4.7935791015625, 5.111328125, 5.4290771484375, 5.746826171875, 6.0645751953125, 6.38232421875, 6.7000732421875, 7.017822265625, 7.3355712890625, 7.6533203125, 7.9710693359375, 8.288818359375, 8.6065673828125, 8.92431640625, 9.2420654296875, 9.559814453125, 9.8775634765625, 10.1953125]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 14.0, 36.0, 83.0, 155.0, 189.0, 203.0, 167.0, 99.0, 43.0, 15.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.00029373168945, -38.296077728271484, -35.59185791015625, -32.88764190673828, -30.183422088623047, -27.479206085205078, -24.774988174438477, -22.070770263671875, -19.366552352905273, -16.662334442138672, -13.95811653137207, -11.253899574279785, -8.549681663513184, -5.845463752746582, -3.141246795654297, -0.4370288848876953, 2.2671890258789062, 4.971406936645508, 7.675624370574951, 10.379841804504395, 13.084059715270996, 15.788277626037598, 18.492494583129883, 21.196712493896484, 23.900930404663086, 26.605148315429688, 29.30936622619629, 32.01358413696289, 34.71780014038086, 37.422019958496094, 40.12623596191406, 42.83045196533203, 45.53467559814453, 48.2388916015625, 50.943111419677734, 53.6473274230957, 56.35154724121094, 59.055763244628906, 61.759979248046875, 64.46420288085938, 67.16841888427734, 69.87263488769531, 72.57685089111328, 75.28107452392578, 77.98529052734375, 80.68950653076172, 83.39372253417969, 86.09794616699219, 88.80215454101562, 91.5063705444336, 94.21058654785156, 96.91481018066406, 99.61902618408203, 102.3232421875, 105.02745819091797, 107.73167419433594, 110.43589782714844, 113.1401138305664, 115.84432983398438, 118.54855346679688, 121.25276947021484, 123.95698547363281, 126.66120147705078, 129.36541748046875, 132.06964111328125]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 2.0, 4.0, 4.0, 3.0, 12.0, 3.0, 12.0, 11.0, 10.0, 21.0, 19.0, 22.0, 13.0, 22.0, 26.0, 25.0, 34.0, 28.0, 33.0, 41.0, 38.0, 30.0, 31.0, 36.0, 40.0, 46.0, 33.0, 30.0, 31.0, 46.0, 27.0, 37.0, 28.0, 32.0, 23.0, 18.0, 17.0, 17.0, 20.0, 13.0, 11.0, 17.0, 10.0, 8.0, 3.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0], "bins": [-25.74560546875, -25.035871505737305, -24.32613754272461, -23.616405487060547, -22.90667152404785, -22.196937561035156, -21.48720359802246, -20.777469635009766, -20.067737579345703, -19.358003616333008, -18.648269653320312, -17.93853759765625, -17.228803634643555, -16.51906967163086, -15.809335708618164, -15.099601745605469, -14.389867782592773, -13.680133819580078, -12.9704008102417, -12.260666847229004, -11.550933837890625, -10.84119987487793, -10.131465911865234, -9.421731948852539, -8.71199893951416, -8.002264976501465, -7.292531967163086, -6.582798004150391, -5.8730645179748535, -5.163331031799316, -4.453597068786621, -3.743863582611084, -3.034130096435547, -2.3243966102600098, -1.6146628856658936, -0.9049291610717773, -0.19519567489624023, 0.5145378112792969, 1.2242717742919922, 1.9340052604675293, 2.6437387466430664, 3.3534722328186035, 4.063205718994141, 4.772939682006836, 5.482673168182373, 6.19240665435791, 6.9021406173706055, 7.611874103546143, 8.32160758972168, 9.031341552734375, 9.741074562072754, 10.45080852508545, 11.160541534423828, 11.870275497436523, 12.580009460449219, 13.289743423461914, 13.999476432800293, 14.709210395812988, 15.418943405151367, 16.128677368164062, 16.838411331176758, 17.548145294189453, 18.257877349853516, 18.96761131286621, 19.677345275878906]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 0.0, 5.0, 5.0, 13.0, 7.0, 17.0, 16.0, 14.0, 18.0, 30.0, 21.0, 18.0, 28.0, 33.0, 36.0, 49.0, 43.0, 49.0, 54.0, 55.0, 35.0, 37.0, 46.0, 41.0, 40.0, 42.0, 30.0, 31.0, 34.0, 34.0, 28.0, 17.0, 9.0, 15.0, 12.0, 10.0, 3.0, 5.0, 4.0, 10.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.748046875, -2.66461181640625, -2.5811767578125, -2.49774169921875, -2.414306640625, -2.33087158203125, -2.2474365234375, -2.16400146484375, -2.08056640625, -1.99713134765625, -1.9136962890625, -1.83026123046875, -1.746826171875, -1.66339111328125, -1.5799560546875, -1.49652099609375, -1.4130859375, -1.32965087890625, -1.2462158203125, -1.16278076171875, -1.079345703125, -0.99591064453125, -0.9124755859375, -0.82904052734375, -0.74560546875, -0.66217041015625, -0.5787353515625, -0.49530029296875, -0.411865234375, -0.32843017578125, -0.2449951171875, -0.16156005859375, -0.078125, 0.00531005859375, 0.0887451171875, 0.17218017578125, 0.255615234375, 0.33905029296875, 0.4224853515625, 0.50592041015625, 0.58935546875, 0.67279052734375, 0.7562255859375, 0.83966064453125, 0.923095703125, 1.00653076171875, 1.0899658203125, 1.17340087890625, 1.2568359375, 1.34027099609375, 1.4237060546875, 1.50714111328125, 1.590576171875, 1.67401123046875, 1.7574462890625, 1.84088134765625, 1.92431640625, 2.00775146484375, 2.0911865234375, 2.17462158203125, 2.258056640625, 2.34149169921875, 2.4249267578125, 2.50836181640625, 2.591796875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 5.0, 9.0, 15.0, 12.0, 29.0, 35.0, 69.0, 100.0, 146.0, 197.0, 350.0, 475.0, 707.0, 1047.0, 1559.0, 2426.0, 3775.0, 5978.0, 9393.0, 14680.0, 23543.0, 39386.0, 70109.0, 137571.0, 280601.0, 214469.0, 102225.0, 54540.0, 31938.0, 19399.0, 12004.0, 7542.0, 4899.0, 3169.0, 2095.0, 1357.0, 947.0, 579.0, 355.0, 277.0, 170.0, 115.0, 85.0, 57.0, 34.0, 34.0, 23.0, 8.0, 12.0, 2.0, 2.0, 7.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0198822021484375, -0.0192568302154541, -0.018631458282470703, -0.018006086349487305, -0.017380714416503906, -0.016755342483520508, -0.01612997055053711, -0.015504598617553711, -0.014879226684570312, -0.014253854751586914, -0.013628482818603516, -0.013003110885620117, -0.012377738952636719, -0.01175236701965332, -0.011126995086669922, -0.010501623153686523, -0.009876251220703125, -0.009250879287719727, -0.008625507354736328, -0.00800013542175293, -0.007374763488769531, -0.006749391555786133, -0.006124019622802734, -0.005498647689819336, -0.0048732757568359375, -0.004247903823852539, -0.0036225318908691406, -0.002997159957885742, -0.0023717880249023438, -0.0017464160919189453, -0.0011210441589355469, -0.0004956722259521484, 0.00012969970703125, 0.0007550716400146484, 0.0013804435729980469, 0.0020058155059814453, 0.0026311874389648438, 0.003256559371948242, 0.0038819313049316406, 0.004507303237915039, 0.0051326751708984375, 0.005758047103881836, 0.006383419036865234, 0.007008790969848633, 0.007634162902832031, 0.00825953483581543, 0.008884906768798828, 0.009510278701782227, 0.010135650634765625, 0.010761022567749023, 0.011386394500732422, 0.01201176643371582, 0.012637138366699219, 0.013262510299682617, 0.013887882232666016, 0.014513254165649414, 0.015138626098632812, 0.01576399803161621, 0.01638936996459961, 0.017014741897583008, 0.017640113830566406, 0.018265485763549805, 0.018890857696533203, 0.0195162296295166, 0.0201416015625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 9.0, 8.0, 2.0, 14.0, 11.0, 12.0, 21.0, 17.0, 32.0, 25.0, 28.0, 27.0, 36.0, 35.0, 45.0, 27.0, 43.0, 50.0, 1078.0, 38.0, 45.0, 43.0, 31.0, 36.0, 45.0, 30.0, 31.0, 27.0, 29.0, 19.0, 23.0, 21.0, 19.0, 17.0, 14.0, 9.0, 9.0, 3.0, 6.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.951171875, -1.888092041015625, -1.82501220703125, -1.761932373046875, -1.6988525390625, -1.635772705078125, -1.57269287109375, -1.509613037109375, -1.446533203125, -1.383453369140625, -1.32037353515625, -1.257293701171875, -1.1942138671875, -1.131134033203125, -1.06805419921875, -1.004974365234375, -0.94189453125, -0.878814697265625, -0.81573486328125, -0.752655029296875, -0.6895751953125, -0.626495361328125, -0.56341552734375, -0.500335693359375, -0.437255859375, -0.374176025390625, -0.31109619140625, -0.248016357421875, -0.1849365234375, -0.121856689453125, -0.05877685546875, 0.004302978515625, 0.0673828125, 0.130462646484375, 0.19354248046875, 0.256622314453125, 0.3197021484375, 0.382781982421875, 0.44586181640625, 0.508941650390625, 0.572021484375, 0.635101318359375, 0.69818115234375, 0.761260986328125, 0.8243408203125, 0.887420654296875, 0.95050048828125, 1.013580322265625, 1.07666015625, 1.139739990234375, 1.20281982421875, 1.265899658203125, 1.3289794921875, 1.392059326171875, 1.45513916015625, 1.518218994140625, 1.581298828125, 1.644378662109375, 1.70745849609375, 1.770538330078125, 1.8336181640625, 1.896697998046875, 1.95977783203125, 2.022857666015625, 2.0859375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 5.0, 8.0, 17.0, 12.0, 32.0, 39.0, 38.0, 85.0, 86.0, 154.0, 237.0, 314.0, 423.0, 629.0, 915.0, 1462.0, 1970.0, 2882.0, 4336.0, 6236.0, 9400.0, 14248.0, 21677.0, 32710.0, 49995.0, 76836.0, 122110.0, 1239452.0, 181921.0, 115776.0, 72908.0, 47602.0, 30718.0, 20289.0, 13513.0, 8911.0, 6085.0, 4125.0, 2850.0, 1916.0, 1285.0, 850.0, 631.0, 469.0, 297.0, 223.0, 146.0, 91.0, 73.0, 50.0, 28.0, 23.0, 16.0, 9.0, 11.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0], "bins": [-0.006374359130859375, -0.00616830587387085, -0.005962252616882324, -0.005756199359893799, -0.0055501461029052734, -0.005344092845916748, -0.005138039588928223, -0.004931986331939697, -0.004725933074951172, -0.0045198798179626465, -0.004313826560974121, -0.004107773303985596, -0.0039017200469970703, -0.003695666790008545, -0.0034896135330200195, -0.003283560276031494, -0.0030775070190429688, -0.0028714537620544434, -0.002665400505065918, -0.0024593472480773926, -0.002253293991088867, -0.002047240734100342, -0.0018411874771118164, -0.001635134220123291, -0.0014290809631347656, -0.0012230277061462402, -0.0010169744491577148, -0.0008109211921691895, -0.0006048679351806641, -0.00039881467819213867, -0.00019276142120361328, 1.329183578491211e-05, 0.0002193450927734375, 0.0004253983497619629, 0.0006314516067504883, 0.0008375048637390137, 0.001043558120727539, 0.0012496113777160645, 0.0014556646347045898, 0.0016617178916931152, 0.0018677711486816406, 0.002073824405670166, 0.0022798776626586914, 0.002485930919647217, 0.002691984176635742, 0.0028980374336242676, 0.003104090690612793, 0.0033101439476013184, 0.0035161972045898438, 0.003722250461578369, 0.0039283037185668945, 0.00413435697555542, 0.004340410232543945, 0.004546463489532471, 0.004752516746520996, 0.0049585700035095215, 0.005164623260498047, 0.005370676517486572, 0.005576729774475098, 0.005782783031463623, 0.0059888362884521484, 0.006194889545440674, 0.006400942802429199, 0.006606996059417725, 0.00681304931640625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 0.0, 8.0, 0.0, 7.0, 8.0, 0.0, 17.0, 0.0, 21.0, 30.0, 0.0, 69.0, 119.0, 0.0, 420.0, 0.0, 140.0, 67.0, 0.0, 40.0, 0.0, 20.0, 14.0, 0.0, 10.0, 0.0, 10.0, 5.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.940696716308594e-07, -8.577480912208557e-07, -8.21426510810852e-07, -7.851049304008484e-07, -7.487833499908447e-07, -7.124617695808411e-07, -6.761401891708374e-07, -6.398186087608337e-07, -6.034970283508301e-07, -5.671754479408264e-07, -5.308538675308228e-07, -4.945322871208191e-07, -4.5821070671081543e-07, -4.2188912630081177e-07, -3.855675458908081e-07, -3.4924596548080444e-07, -3.129243850708008e-07, -2.766028046607971e-07, -2.4028122425079346e-07, -2.039596438407898e-07, -1.6763806343078613e-07, -1.3131648302078247e-07, -9.499490261077881e-08, -5.8673322200775146e-08, -2.2351741790771484e-08, 1.3969838619232178e-08, 5.029141902923584e-08, 8.66129994392395e-08, 1.2293457984924316e-07, 1.5925616025924683e-07, 1.955777406692505e-07, 2.3189932107925415e-07, 2.682209014892578e-07, 3.045424818992615e-07, 3.4086406230926514e-07, 3.771856427192688e-07, 4.1350722312927246e-07, 4.498288035392761e-07, 4.861503839492798e-07, 5.224719643592834e-07, 5.587935447692871e-07, 5.951151251792908e-07, 6.314367055892944e-07, 6.677582859992981e-07, 7.040798664093018e-07, 7.404014468193054e-07, 7.767230272293091e-07, 8.130446076393127e-07, 8.493661880493164e-07, 8.856877684593201e-07, 9.220093488693237e-07, 9.583309292793274e-07, 9.94652509689331e-07, 1.0309740900993347e-06, 1.0672956705093384e-06, 1.103617250919342e-06, 1.1399388313293457e-06, 1.1762604117393494e-06, 1.212581992149353e-06, 1.2489035725593567e-06, 1.2852251529693604e-06, 1.321546733379364e-06, 1.3578683137893677e-06, 1.3941898941993713e-06, 1.430511474609375e-06]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 9.0, 19.0, 20.0, 22.0, 48.0, 43.0, 93.0, 104.0, 209.0, 602.0, 11232.0, 1000464.0, 34165.0, 815.0, 293.0, 146.0, 84.0, 55.0, 40.0, 21.0, 20.0, 12.0, 10.0, 5.0, 4.0, 5.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9729137420654297e-05, -1.9189901649951935e-05, -1.8650665879249573e-05, -1.811143010854721e-05, -1.757219433784485e-05, -1.7032958567142487e-05, -1.6493722796440125e-05, -1.5954487025737762e-05, -1.54152512550354e-05, -1.4876015484333038e-05, -1.4336779713630676e-05, -1.3797543942928314e-05, -1.3258308172225952e-05, -1.271907240152359e-05, -1.2179836630821228e-05, -1.1640600860118866e-05, -1.1101365089416504e-05, -1.0562129318714142e-05, -1.002289354801178e-05, -9.483657777309418e-06, -8.944422006607056e-06, -8.405186235904694e-06, -7.865950465202332e-06, -7.3267146944999695e-06, -6.787478923797607e-06, -6.248243153095245e-06, -5.709007382392883e-06, -5.169771611690521e-06, -4.630535840988159e-06, -4.091300070285797e-06, -3.552064299583435e-06, -3.012828528881073e-06, -2.473592758178711e-06, -1.934356987476349e-06, -1.3951212167739868e-06, -8.558854460716248e-07, -3.166496753692627e-07, 2.2258609533309937e-07, 7.618218660354614e-07, 1.3010576367378235e-06, 1.8402934074401855e-06, 2.3795291781425476e-06, 2.9187649488449097e-06, 3.4580007195472717e-06, 3.997236490249634e-06, 4.536472260951996e-06, 5.075708031654358e-06, 5.61494380235672e-06, 6.154179573059082e-06, 6.693415343761444e-06, 7.232651114463806e-06, 7.771886885166168e-06, 8.31112265586853e-06, 8.850358426570892e-06, 9.389594197273254e-06, 9.928829967975616e-06, 1.0468065738677979e-05, 1.100730150938034e-05, 1.1546537280082703e-05, 1.2085773050785065e-05, 1.2625008821487427e-05, 1.3164244592189789e-05, 1.3703480362892151e-05, 1.4242716133594513e-05, 1.4781951904296875e-05]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 5.0, 67.0, 627.0, 296.0, 21.0], "bins": [-7.136484327929793e-06, -7.021114470262546e-06, -6.90574506734265e-06, -6.790375209675403e-06, -6.675005806755507e-06, -6.5596359490882605e-06, -6.444266546168365e-06, -6.328896688501118e-06, -6.213526830833871e-06, -6.098156973166624e-06, -5.982787570246728e-06, -5.867417712579481e-06, -5.752048309659585e-06, -5.6366784519923385e-06, -5.521308594325092e-06, -5.405939191405196e-06, -5.2905697884853e-06, -5.175199930818053e-06, -5.059830527898157e-06, -4.94446067023091e-06, -4.829091267311014e-06, -4.713721409643767e-06, -4.5983515519765206e-06, -4.482982149056625e-06, -4.367612291389378e-06, -4.252242433722131e-06, -4.136873030802235e-06, -4.021503173134988e-06, -3.906133770215092e-06, -3.7907639125478454e-06, -3.675394282254274e-06, -3.5600246519607026e-06, -3.4446545669197803e-06, -3.329284936626209e-06, -3.2139153063326376e-06, -3.098545676039066e-06, -2.9831758183718193e-06, -2.867806188078248e-06, -2.7524365577846766e-06, -2.637066927491105e-06, -2.5216972971975338e-06, -2.4063276669039624e-06, -2.290958036610391e-06, -2.175588178943144e-06, -2.0602185486495728e-06, -1.9448489183560014e-06, -1.82947928806243e-06, -1.7141096577688586e-06, -1.5987398001016118e-06, -1.4833701698080404e-06, -1.3680004258276313e-06, -1.2526307955340599e-06, -1.1372610515536508e-06, -1.0218914212600794e-06, -9.06521790966508e-07, -7.911521038295177e-07, -6.757824735359463e-07, -5.604127863989561e-07, -4.4504312768367527e-07, -3.2967346896839445e-07, -2.143037818314042e-07, -9.893409469441394e-08, 1.6435535599157447e-08, 1.318052227361477e-07, 2.4717490987313795e-07]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 18.0, 0.0, 0.0, 0.0, 39.0, 0.0, 0.0, 0.0, 0.0, 107.0, 0.0, 0.0, 0.0, 189.0, 0.0, 0.0, 0.0, 0.0, 315.0, 0.0, 0.0, 0.0, 0.0, 172.0, 0.0, 0.0, 0.0, 95.0, 0.0, 0.0, 0.0, 0.0, 49.0, 0.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, -3.4458935260772705e-07, -3.3155083656311035e-07, -3.1851232051849365e-07, -3.0547380447387695e-07, -2.9243528842926025e-07, -2.7939677238464355e-07, -2.6635825634002686e-07, -2.5331974029541016e-07, -2.4028122425079346e-07, -2.2724270820617676e-07, -2.1420419216156006e-07, -2.0116567611694336e-07, -1.8812716007232666e-07, -1.7508864402770996e-07, -1.6205012798309326e-07, -1.4901161193847656e-07, -1.3597309589385986e-07, -1.2293457984924316e-07, -1.0989606380462646e-07, -9.685754776000977e-08, -8.381903171539307e-08, -7.078051567077637e-08, -5.774199962615967e-08, -4.470348358154297e-08, -3.166496753692627e-08, -1.862645149230957e-08, -5.587935447692871e-09, 7.450580596923828e-09, 2.0489096641540527e-08, 3.3527612686157227e-08, 4.6566128730773926e-08, 5.960464477539063e-08, 7.264316082000732e-08, 8.568167686462402e-08, 9.872019290924072e-08, 1.1175870895385742e-07, 1.2479722499847412e-07, 1.3783574104309082e-07, 1.5087425708770752e-07, 1.6391277313232422e-07, 1.7695128917694092e-07, 1.8998980522155762e-07, 2.0302832126617432e-07, 2.1606683731079102e-07, 2.2910535335540771e-07, 2.421438694000244e-07, 2.551823854446411e-07, 2.682209014892578e-07, 2.812594175338745e-07, 2.942979335784912e-07, 3.073364496231079e-07, 3.203749656677246e-07, 3.334134817123413e-07, 3.46451997756958e-07, 3.594905138015747e-07, 3.725290298461914e-07, 3.855675458908081e-07, 3.986060619354248e-07, 4.116445779800415e-07, 4.246830940246582e-07, 4.377216100692749e-07, 4.507601261138916e-07, 4.637986421585083e-07, 4.76837158203125e-07]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 0.0, 5.0, 5.0, 13.0, 7.0, 17.0, 16.0, 14.0, 18.0, 30.0, 21.0, 18.0, 28.0, 33.0, 36.0, 49.0, 43.0, 49.0, 54.0, 55.0, 35.0, 37.0, 46.0, 41.0, 40.0, 42.0, 30.0, 31.0, 34.0, 34.0, 28.0, 17.0, 9.0, 15.0, 12.0, 10.0, 3.0, 5.0, 4.0, 10.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.748046875, -2.66461181640625, -2.5811767578125, -2.49774169921875, -2.414306640625, -2.33087158203125, -2.2474365234375, -2.16400146484375, -2.08056640625, -1.99713134765625, -1.9136962890625, -1.83026123046875, -1.746826171875, -1.66339111328125, -1.5799560546875, -1.49652099609375, -1.4130859375, -1.32965087890625, -1.2462158203125, -1.16278076171875, -1.079345703125, -0.99591064453125, -0.9124755859375, -0.82904052734375, -0.74560546875, -0.66217041015625, -0.5787353515625, -0.49530029296875, -0.411865234375, -0.32843017578125, -0.2449951171875, -0.16156005859375, -0.078125, 0.00531005859375, 0.0887451171875, 0.17218017578125, 0.255615234375, 0.33905029296875, 0.4224853515625, 0.50592041015625, 0.58935546875, 0.67279052734375, 0.7562255859375, 0.83966064453125, 0.923095703125, 1.00653076171875, 1.0899658203125, 1.17340087890625, 1.2568359375, 1.34027099609375, 1.4237060546875, 1.50714111328125, 1.590576171875, 1.67401123046875, 1.7574462890625, 1.84088134765625, 1.92431640625, 2.00775146484375, 2.0911865234375, 2.17462158203125, 2.258056640625, 2.34149169921875, 2.4249267578125, 2.50836181640625, 2.591796875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 7.0, 17.0, 19.0, 40.0, 61.0, 91.0, 137.0, 220.0, 309.0, 523.0, 823.0, 1283.0, 1961.0, 3028.0, 4542.0, 7099.0, 11344.0, 19666.0, 37971.0, 95018.0, 418067.0, 292169.0, 75878.0, 32297.0, 17134.0, 10534.0, 6493.0, 4156.0, 2657.0, 1824.0, 1138.0, 687.0, 490.0, 322.0, 194.0, 131.0, 78.0, 56.0, 36.0, 27.0, 10.0, 5.0, 12.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.509765625, -3.39971923828125, -3.2896728515625, -3.17962646484375, -3.069580078125, -2.95953369140625, -2.8494873046875, -2.73944091796875, -2.62939453125, -2.51934814453125, -2.4093017578125, -2.29925537109375, -2.189208984375, -2.07916259765625, -1.9691162109375, -1.85906982421875, -1.7490234375, -1.63897705078125, -1.5289306640625, -1.41888427734375, -1.308837890625, -1.19879150390625, -1.0887451171875, -0.97869873046875, -0.86865234375, -0.75860595703125, -0.6485595703125, -0.53851318359375, -0.428466796875, -0.31842041015625, -0.2083740234375, -0.09832763671875, 0.01171875, 0.12176513671875, 0.2318115234375, 0.34185791015625, 0.451904296875, 0.56195068359375, 0.6719970703125, 0.78204345703125, 0.89208984375, 1.00213623046875, 1.1121826171875, 1.22222900390625, 1.332275390625, 1.44232177734375, 1.5523681640625, 1.66241455078125, 1.7724609375, 1.88250732421875, 1.9925537109375, 2.10260009765625, 2.212646484375, 2.32269287109375, 2.4327392578125, 2.54278564453125, 2.65283203125, 2.76287841796875, 2.8729248046875, 2.98297119140625, 3.093017578125, 3.20306396484375, 3.3131103515625, 3.42315673828125, 3.533203125]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 5.0, 1.0, 10.0, 10.0, 11.0, 11.0, 18.0, 24.0, 22.0, 23.0, 29.0, 25.0, 24.0, 43.0, 41.0, 54.0, 66.0, 74.0, 167.0, 1493.0, 291.0, 119.0, 78.0, 59.0, 57.0, 45.0, 39.0, 26.0, 20.0, 30.0, 22.0, 26.0, 17.0, 15.0, 6.0, 13.0, 5.0, 8.0, 4.0, 1.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1015625, -7.82958984375, -7.5576171875, -7.28564453125, -7.013671875, -6.74169921875, -6.4697265625, -6.19775390625, -5.92578125, -5.65380859375, -5.3818359375, -5.10986328125, -4.837890625, -4.56591796875, -4.2939453125, -4.02197265625, -3.75, -3.47802734375, -3.2060546875, -2.93408203125, -2.662109375, -2.39013671875, -2.1181640625, -1.84619140625, -1.57421875, -1.30224609375, -1.0302734375, -0.75830078125, -0.486328125, -0.21435546875, 0.0576171875, 0.32958984375, 0.6015625, 0.87353515625, 1.1455078125, 1.41748046875, 1.689453125, 1.96142578125, 2.2333984375, 2.50537109375, 2.77734375, 3.04931640625, 3.3212890625, 3.59326171875, 3.865234375, 4.13720703125, 4.4091796875, 4.68115234375, 4.953125, 5.22509765625, 5.4970703125, 5.76904296875, 6.041015625, 6.31298828125, 6.5849609375, 6.85693359375, 7.12890625, 7.40087890625, 7.6728515625, 7.94482421875, 8.216796875, 8.48876953125, 8.7607421875, 9.03271484375, 9.3046875]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 3.0, 6.0, 6.0, 13.0, 9.0, 15.0, 16.0, 23.0, 30.0, 40.0, 47.0, 50.0, 85.0, 124.0, 206.0, 383.0, 988.0, 4584.0, 34247.0, 1769883.0, 1297256.0, 31349.0, 4390.0, 941.0, 314.0, 182.0, 149.0, 86.0, 67.0, 39.0, 28.0, 33.0, 20.0, 22.0, 14.0, 13.0, 12.0, 6.0, 9.0, 1.0, 7.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.734375, -15.2713623046875, -14.808349609375, -14.3453369140625, -13.88232421875, -13.4193115234375, -12.956298828125, -12.4932861328125, -12.0302734375, -11.5672607421875, -11.104248046875, -10.6412353515625, -10.17822265625, -9.7152099609375, -9.252197265625, -8.7891845703125, -8.326171875, -7.8631591796875, -7.400146484375, -6.9371337890625, -6.47412109375, -6.0111083984375, -5.548095703125, -5.0850830078125, -4.6220703125, -4.1590576171875, -3.696044921875, -3.2330322265625, -2.77001953125, -2.3070068359375, -1.843994140625, -1.3809814453125, -0.91796875, -0.4549560546875, 0.008056640625, 0.4710693359375, 0.93408203125, 1.3970947265625, 1.860107421875, 2.3231201171875, 2.7861328125, 3.2491455078125, 3.712158203125, 4.1751708984375, 4.63818359375, 5.1011962890625, 5.564208984375, 6.0272216796875, 6.490234375, 6.9532470703125, 7.416259765625, 7.8792724609375, 8.34228515625, 8.8052978515625, 9.268310546875, 9.7313232421875, 10.1943359375, 10.6573486328125, 11.120361328125, 11.5833740234375, 12.04638671875, 12.5093994140625, 12.972412109375, 13.4354248046875, 13.8984375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 28.0, 65.0, 194.0, 315.0, 234.0, 117.0, 45.0, 10.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.07544708251953, -31.556636810302734, -30.03782844543457, -28.519018173217773, -27.000207901000977, -25.481399536132812, -23.962589263916016, -22.44377899169922, -20.924968719482422, -19.406158447265625, -17.88735008239746, -16.368539810180664, -14.849729537963867, -13.330920219421387, -11.812110900878906, -10.29330062866211, -8.774492263793945, -7.255682468414307, -5.736872673034668, -4.2180633544921875, -2.699253559112549, -1.1804437637329102, 0.3383655548095703, 1.8571758270263672, 3.3759851455688477, 4.894794940948486, 6.413604736328125, 7.9324140548706055, 9.451223373413086, 10.970033645629883, 12.488842964172363, 14.00765323638916, 15.52646255493164, 17.045272827148438, 18.5640811920166, 20.0828914642334, 21.601701736450195, 23.12051010131836, 24.639320373535156, 26.158130645751953, 27.67694091796875, 29.195751190185547, 30.71455955505371, 32.233367919921875, 33.75217819213867, 35.27098846435547, 36.789798736572266, 38.30860900878906, 39.827415466308594, 41.34622573852539, 42.86503601074219, 44.38384246826172, 45.902652740478516, 47.42146301269531, 48.94027328491211, 50.459083557128906, 51.9778938293457, 53.4967041015625, 55.0155143737793, 56.534324645996094, 58.053131103515625, 59.57194137573242, 61.09075164794922, 62.609561920166016, 64.12837219238281]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 4.0, 8.0, 6.0, 7.0, 8.0, 15.0, 19.0, 19.0, 20.0, 16.0, 20.0, 32.0, 22.0, 34.0, 37.0, 61.0, 25.0, 54.0, 45.0, 57.0, 44.0, 43.0, 49.0, 47.0, 36.0, 34.0, 28.0, 27.0, 26.0, 26.0, 30.0, 23.0, 17.0, 14.0, 10.0, 9.0, 5.0, 8.0, 3.0, 4.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.180925369262695, -21.36521339416504, -20.549503326416016, -19.73379135131836, -18.918079376220703, -18.102367401123047, -17.286657333374023, -16.470945358276367, -15.655233383178711, -14.839522361755371, -14.023810386657715, -13.208099365234375, -12.392387390136719, -11.576676368713379, -10.760965347290039, -9.945253372192383, -9.129542350769043, -8.313831329345703, -7.498119354248047, -6.682408332824707, -5.866696357727051, -5.050985336303711, -4.235273838043213, -3.419562339782715, -2.603850841522217, -1.7881393432617188, -0.9724279642105103, -0.15671658515930176, 0.6589949131011963, 1.4747061729431152, 2.2904176712036133, 3.1061291694641113, 3.9218406677246094, 4.737552165985107, 5.5532636642456055, 6.368974685668945, 7.184686660766602, 8.000397682189941, 8.816108703613281, 9.631820678710938, 10.447532653808594, 11.263243675231934, 12.07895565032959, 12.89466667175293, 13.710378646850586, 14.526089668273926, 15.341800689697266, 16.157512664794922, 16.973224639892578, 17.788936614990234, 18.604646682739258, 19.420358657836914, 20.23607063293457, 21.051780700683594, 21.86749267578125, 22.683204650878906, 23.49891471862793, 24.314626693725586, 25.13033676147461, 25.946048736572266, 26.761760711669922, 27.577472686767578, 28.3931827545166, 29.208894729614258, 30.024606704711914]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 4.0, 9.0, 8.0, 15.0, 14.0, 17.0, 24.0, 23.0, 20.0, 19.0, 29.0, 35.0, 37.0, 35.0, 45.0, 60.0, 47.0, 54.0, 44.0, 42.0, 29.0, 45.0, 47.0, 45.0, 33.0, 32.0, 38.0, 27.0, 24.0, 20.0, 15.0, 11.0, 11.0, 8.0, 8.0, 5.0, 5.0, 8.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.79296875, -2.706024169921875, -2.61907958984375, -2.532135009765625, -2.4451904296875, -2.358245849609375, -2.27130126953125, -2.184356689453125, -2.097412109375, -2.010467529296875, -1.92352294921875, -1.836578369140625, -1.7496337890625, -1.662689208984375, -1.57574462890625, -1.488800048828125, -1.40185546875, -1.314910888671875, -1.22796630859375, -1.141021728515625, -1.0540771484375, -0.967132568359375, -0.88018798828125, -0.793243408203125, -0.706298828125, -0.619354248046875, -0.53240966796875, -0.445465087890625, -0.3585205078125, -0.271575927734375, -0.18463134765625, -0.097686767578125, -0.0107421875, 0.076202392578125, 0.16314697265625, 0.250091552734375, 0.3370361328125, 0.423980712890625, 0.51092529296875, 0.597869873046875, 0.684814453125, 0.771759033203125, 0.85870361328125, 0.945648193359375, 1.0325927734375, 1.119537353515625, 1.20648193359375, 1.293426513671875, 1.38037109375, 1.467315673828125, 1.55426025390625, 1.641204833984375, 1.7281494140625, 1.815093994140625, 1.90203857421875, 1.988983154296875, 2.075927734375, 2.162872314453125, 2.24981689453125, 2.336761474609375, 2.4237060546875, 2.510650634765625, 2.59759521484375, 2.684539794921875, 2.771484375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 6.0, 3.0, 10.0, 4.0, 11.0, 2.0, 13.0, 16.0, 24.0, 28.0, 42.0, 59.0, 73.0, 141.0, 219.0, 459.0, 1138.0, 2987.0, 10215.0, 47130.0, 349899.0, 2862391.0, 809894.0, 85754.0, 16344.0, 4520.0, 1556.0, 571.0, 273.0, 169.0, 103.0, 61.0, 49.0, 25.0, 26.0, 13.0, 11.0, 9.0, 9.0, 7.0, 4.0, 9.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.59375, -9.300048828125, -9.00634765625, -8.712646484375, -8.4189453125, -8.125244140625, -7.83154296875, -7.537841796875, -7.244140625, -6.950439453125, -6.65673828125, -6.363037109375, -6.0693359375, -5.775634765625, -5.48193359375, -5.188232421875, -4.89453125, -4.600830078125, -4.30712890625, -4.013427734375, -3.7197265625, -3.426025390625, -3.13232421875, -2.838623046875, -2.544921875, -2.251220703125, -1.95751953125, -1.663818359375, -1.3701171875, -1.076416015625, -0.78271484375, -0.489013671875, -0.1953125, 0.098388671875, 0.39208984375, 0.685791015625, 0.9794921875, 1.273193359375, 1.56689453125, 1.860595703125, 2.154296875, 2.447998046875, 2.74169921875, 3.035400390625, 3.3291015625, 3.622802734375, 3.91650390625, 4.210205078125, 4.50390625, 4.797607421875, 5.09130859375, 5.385009765625, 5.6787109375, 5.972412109375, 6.26611328125, 6.559814453125, 6.853515625, 7.147216796875, 7.44091796875, 7.734619140625, 8.0283203125, 8.322021484375, 8.61572265625, 8.909423828125, 9.203125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 10.0, 10.0, 11.0, 14.0, 26.0, 44.0, 68.0, 92.0, 158.0, 200.0, 254.0, 337.0, 457.0, 540.0, 513.0, 408.0, 267.0, 206.0, 131.0, 94.0, 65.0, 53.0, 37.0, 32.0, 13.0, 14.0, 10.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.38671875, -7.14520263671875, -6.9036865234375, -6.66217041015625, -6.420654296875, -6.17913818359375, -5.9376220703125, -5.69610595703125, -5.45458984375, -5.21307373046875, -4.9715576171875, -4.73004150390625, -4.488525390625, -4.24700927734375, -4.0054931640625, -3.76397705078125, -3.5224609375, -3.28094482421875, -3.0394287109375, -2.79791259765625, -2.556396484375, -2.31488037109375, -2.0733642578125, -1.83184814453125, -1.59033203125, -1.34881591796875, -1.1072998046875, -0.86578369140625, -0.624267578125, -0.38275146484375, -0.1412353515625, 0.10028076171875, 0.341796875, 0.58331298828125, 0.8248291015625, 1.06634521484375, 1.307861328125, 1.54937744140625, 1.7908935546875, 2.03240966796875, 2.27392578125, 2.51544189453125, 2.7569580078125, 2.99847412109375, 3.239990234375, 3.48150634765625, 3.7230224609375, 3.96453857421875, 4.2060546875, 4.44757080078125, 4.6890869140625, 4.93060302734375, 5.172119140625, 5.41363525390625, 5.6551513671875, 5.89666748046875, 6.13818359375, 6.37969970703125, 6.6212158203125, 6.86273193359375, 7.104248046875, 7.34576416015625, 7.5872802734375, 7.82879638671875, 8.0703125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 16.0, 19.0, 23.0, 41.0, 52.0, 107.0, 194.0, 338.0, 630.0, 1606.0, 7380.0, 85722.0, 2039203.0, 1966070.0, 82789.0, 7127.0, 1536.0, 658.0, 348.0, 192.0, 90.0, 61.0, 28.0, 12.0, 16.0, 7.0, 11.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0], "bins": [-22.109375, -21.4951171875, -20.880859375, -20.2666015625, -19.65234375, -19.0380859375, -18.423828125, -17.8095703125, -17.1953125, -16.5810546875, -15.966796875, -15.3525390625, -14.73828125, -14.1240234375, -13.509765625, -12.8955078125, -12.28125, -11.6669921875, -11.052734375, -10.4384765625, -9.82421875, -9.2099609375, -8.595703125, -7.9814453125, -7.3671875, -6.7529296875, -6.138671875, -5.5244140625, -4.91015625, -4.2958984375, -3.681640625, -3.0673828125, -2.453125, -1.8388671875, -1.224609375, -0.6103515625, 0.00390625, 0.6181640625, 1.232421875, 1.8466796875, 2.4609375, 3.0751953125, 3.689453125, 4.3037109375, 4.91796875, 5.5322265625, 6.146484375, 6.7607421875, 7.375, 7.9892578125, 8.603515625, 9.2177734375, 9.83203125, 10.4462890625, 11.060546875, 11.6748046875, 12.2890625, 12.9033203125, 13.517578125, 14.1318359375, 14.74609375, 15.3603515625, 15.974609375, 16.5888671875, 17.203125]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [2.0, 12.0, 50.0, 112.0, 264.0, 281.0, 190.0, 78.0, 22.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.87179183959961, -15.284139633178711, -11.696486473083496, -8.108833312988281, -4.521181106567383, -0.9335289001464844, 2.654125213623047, 6.241777420043945, 9.829429626464844, 13.417081832885742, 17.00473403930664, 20.592388153076172, 24.18004035949707, 27.76769256591797, 31.3553466796875, 34.94300079345703, 38.5306510925293, 42.11830520629883, 45.705955505371094, 49.293609619140625, 52.881263732910156, 56.46891403198242, 60.05656814575195, 63.64421844482422, 67.23187255859375, 70.81952667236328, 74.40718078613281, 77.99482727050781, 81.58248138427734, 85.17013549804688, 88.7577896118164, 92.34544372558594, 95.93309020996094, 99.52074432373047, 103.1083984375, 106.696044921875, 110.28369903564453, 113.87135314941406, 117.4590072631836, 121.04666137695312, 124.63430786132812, 128.22195434570312, 131.8096160888672, 135.3972625732422, 138.98492431640625, 142.57257080078125, 146.16021728515625, 149.7478790283203, 153.33554077148438, 156.92318725585938, 160.51084899902344, 164.09849548339844, 167.6861572265625, 171.2738037109375, 174.8614501953125, 178.44911193847656, 182.03675842285156, 185.62440490722656, 189.21206665039062, 192.79971313476562, 196.3873748779297, 199.9750213623047, 203.56268310546875, 207.15032958984375, 210.73797607421875]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 4.0, 8.0, 6.0, 8.0, 9.0, 9.0, 15.0, 18.0, 23.0, 18.0, 26.0, 27.0, 31.0, 42.0, 35.0, 55.0, 46.0, 42.0, 65.0, 40.0, 39.0, 38.0, 46.0, 44.0, 33.0, 39.0, 30.0, 37.0, 28.0, 24.0, 27.0, 21.0, 17.0, 12.0, 17.0, 3.0, 4.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.712013244628906, -22.931381225585938, -22.1507511138916, -21.370121002197266, -20.589488983154297, -19.808856964111328, -19.028226852416992, -18.247596740722656, -17.466964721679688, -16.68633270263672, -15.905702590942383, -15.12507152557373, -14.344440460205078, -13.563809394836426, -12.783178329467773, -12.002547264099121, -11.221916198730469, -10.441285133361816, -9.660654067993164, -8.880023002624512, -8.09939193725586, -7.318760871887207, -6.538129806518555, -5.757498741149902, -4.97686767578125, -4.196236610412598, -3.4156055450439453, -2.634974479675293, -1.8543434143066406, -1.0737123489379883, -0.29308128356933594, 0.4875497817993164, 1.2681808471679688, 2.048811912536621, 2.8294429779052734, 3.610074043273926, 4.390705108642578, 5.1713361740112305, 5.951967239379883, 6.732598304748535, 7.5132293701171875, 8.29386043548584, 9.074491500854492, 9.855122566223145, 10.635753631591797, 11.41638469696045, 12.197015762329102, 12.977646827697754, 13.758277893066406, 14.538908958435059, 15.319540023803711, 16.100170135498047, 16.880802154541016, 17.661434173583984, 18.44206428527832, 19.222694396972656, 20.003326416015625, 20.783958435058594, 21.56458854675293, 22.345218658447266, 23.125850677490234, 23.906482696533203, 24.68711280822754, 25.467742919921875, 26.248374938964844]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 8.0, 8.0, 10.0, 9.0, 16.0, 17.0, 21.0, 20.0, 22.0, 32.0, 20.0, 26.0, 35.0, 41.0, 53.0, 40.0, 48.0, 51.0, 40.0, 56.0, 39.0, 41.0, 38.0, 46.0, 34.0, 33.0, 37.0, 30.0, 22.0, 28.0, 12.0, 16.0, 12.0, 7.0, 6.0, 5.0, 3.0, 5.0, 5.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.880859375, -2.7918701171875, -2.702880859375, -2.6138916015625, -2.52490234375, -2.4359130859375, -2.346923828125, -2.2579345703125, -2.1689453125, -2.0799560546875, -1.990966796875, -1.9019775390625, -1.81298828125, -1.7239990234375, -1.635009765625, -1.5460205078125, -1.45703125, -1.3680419921875, -1.279052734375, -1.1900634765625, -1.10107421875, -1.0120849609375, -0.923095703125, -0.8341064453125, -0.7451171875, -0.6561279296875, -0.567138671875, -0.4781494140625, -0.38916015625, -0.3001708984375, -0.211181640625, -0.1221923828125, -0.033203125, 0.0557861328125, 0.144775390625, 0.2337646484375, 0.32275390625, 0.4117431640625, 0.500732421875, 0.5897216796875, 0.6787109375, 0.7677001953125, 0.856689453125, 0.9456787109375, 1.03466796875, 1.1236572265625, 1.212646484375, 1.3016357421875, 1.390625, 1.4796142578125, 1.568603515625, 1.6575927734375, 1.74658203125, 1.8355712890625, 1.924560546875, 2.0135498046875, 2.1025390625, 2.1915283203125, 2.280517578125, 2.3695068359375, 2.45849609375, 2.5474853515625, 2.636474609375, 2.7254638671875, 2.814453125]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 8.0, 7.0, 9.0, 19.0, 22.0, 36.0, 61.0, 89.0, 101.0, 154.0, 234.0, 321.0, 492.0, 719.0, 1121.0, 1646.0, 2564.0, 3869.0, 6192.0, 9859.0, 15740.0, 25766.0, 44479.0, 79245.0, 148954.0, 270778.0, 194906.0, 101002.0, 56125.0, 32278.0, 19127.0, 11638.0, 7423.0, 4678.0, 2985.0, 1892.0, 1315.0, 871.0, 569.0, 383.0, 281.0, 204.0, 119.0, 93.0, 55.0, 37.0, 31.0, 20.0, 15.0, 6.0, 12.0, 0.0, 3.0, 4.0, 3.0, 2.0, 1.0], "bins": [-0.021026611328125, -0.020383596420288086, -0.019740581512451172, -0.019097566604614258, -0.018454551696777344, -0.01781153678894043, -0.017168521881103516, -0.0165255069732666, -0.015882492065429688, -0.015239477157592773, -0.01459646224975586, -0.013953447341918945, -0.013310432434082031, -0.012667417526245117, -0.012024402618408203, -0.011381387710571289, -0.010738372802734375, -0.010095357894897461, -0.009452342987060547, -0.008809328079223633, -0.008166313171386719, -0.007523298263549805, -0.006880283355712891, -0.0062372684478759766, -0.0055942535400390625, -0.0049512386322021484, -0.004308223724365234, -0.0036652088165283203, -0.0030221939086914062, -0.002379179000854492, -0.0017361640930175781, -0.001093149185180664, -0.00045013427734375, 0.00019288063049316406, 0.0008358955383300781, 0.0014789104461669922, 0.0021219253540039062, 0.0027649402618408203, 0.0034079551696777344, 0.0040509700775146484, 0.0046939849853515625, 0.0053369998931884766, 0.005980014801025391, 0.006623029708862305, 0.007266044616699219, 0.007909059524536133, 0.008552074432373047, 0.009195089340209961, 0.009838104248046875, 0.010481119155883789, 0.011124134063720703, 0.011767148971557617, 0.012410163879394531, 0.013053178787231445, 0.01369619369506836, 0.014339208602905273, 0.014982223510742188, 0.0156252384185791, 0.016268253326416016, 0.01691126823425293, 0.017554283142089844, 0.018197298049926758, 0.018840312957763672, 0.019483327865600586, 0.0201263427734375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 7.0, 4.0, 10.0, 6.0, 9.0, 8.0, 13.0, 17.0, 13.0, 23.0, 14.0, 21.0, 28.0, 31.0, 27.0, 21.0, 30.0, 28.0, 31.0, 46.0, 29.0, 40.0, 38.0, 1064.0, 41.0, 39.0, 32.0, 30.0, 30.0, 31.0, 27.0, 23.0, 22.0, 34.0, 14.0, 20.0, 24.0, 15.0, 16.0, 20.0, 12.0, 3.0, 9.0, 10.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7353515625, -1.6803741455078125, -1.625396728515625, -1.5704193115234375, -1.51544189453125, -1.4604644775390625, -1.405487060546875, -1.3505096435546875, -1.2955322265625, -1.2405548095703125, -1.185577392578125, -1.1305999755859375, -1.07562255859375, -1.0206451416015625, -0.965667724609375, -0.9106903076171875, -0.855712890625, -0.8007354736328125, -0.745758056640625, -0.6907806396484375, -0.63580322265625, -0.5808258056640625, -0.525848388671875, -0.4708709716796875, -0.4158935546875, -0.3609161376953125, -0.305938720703125, -0.2509613037109375, -0.19598388671875, -0.1410064697265625, -0.086029052734375, -0.0310516357421875, 0.02392578125, 0.0789031982421875, 0.133880615234375, 0.1888580322265625, 0.24383544921875, 0.2988128662109375, 0.353790283203125, 0.4087677001953125, 0.4637451171875, 0.5187225341796875, 0.573699951171875, 0.6286773681640625, 0.68365478515625, 0.7386322021484375, 0.793609619140625, 0.8485870361328125, 0.903564453125, 0.9585418701171875, 1.013519287109375, 1.0684967041015625, 1.12347412109375, 1.1784515380859375, 1.233428955078125, 1.2884063720703125, 1.3433837890625, 1.3983612060546875, 1.453338623046875, 1.5083160400390625, 1.56329345703125, 1.6182708740234375, 1.673248291015625, 1.7282257080078125, 1.783203125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 7.0, 13.0, 28.0, 33.0, 45.0, 71.0, 82.0, 126.0, 183.0, 336.0, 446.0, 687.0, 967.0, 1513.0, 2252.0, 3179.0, 5026.0, 7502.0, 11332.0, 17503.0, 26539.0, 40020.0, 60475.0, 92853.0, 146375.0, 1245461.0, 152208.0, 96928.0, 62689.0, 41650.0, 27400.0, 17994.0, 11878.0, 7825.0, 5099.0, 3404.0, 2302.0, 1548.0, 1062.0, 670.0, 478.0, 310.0, 204.0, 158.0, 78.0, 76.0, 48.0, 26.0, 24.0, 11.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.00675201416015625, -0.006544530391693115, -0.0063370466232299805, -0.006129562854766846, -0.005922079086303711, -0.005714595317840576, -0.005507111549377441, -0.005299627780914307, -0.005092144012451172, -0.004884660243988037, -0.004677176475524902, -0.004469692707061768, -0.004262208938598633, -0.004054725170135498, -0.0038472414016723633, -0.0036397576332092285, -0.0034322738647460938, -0.003224790096282959, -0.0030173063278198242, -0.0028098225593566895, -0.0026023387908935547, -0.00239485502243042, -0.002187371253967285, -0.0019798874855041504, -0.0017724037170410156, -0.0015649199485778809, -0.001357436180114746, -0.0011499524116516113, -0.0009424686431884766, -0.0007349848747253418, -0.000527501106262207, -0.00032001733779907227, -0.0001125335693359375, 9.495019912719727e-05, 0.00030243396759033203, 0.0005099177360534668, 0.0007174015045166016, 0.0009248852729797363, 0.001132369041442871, 0.0013398528099060059, 0.0015473365783691406, 0.0017548203468322754, 0.00196230411529541, 0.002169787883758545, 0.0023772716522216797, 0.0025847554206848145, 0.0027922391891479492, 0.002999722957611084, 0.0032072067260742188, 0.0034146904945373535, 0.0036221742630004883, 0.003829658031463623, 0.004037141799926758, 0.004244625568389893, 0.004452109336853027, 0.004659593105316162, 0.004867076873779297, 0.005074560642242432, 0.005282044410705566, 0.005489528179168701, 0.005697011947631836, 0.005904495716094971, 0.0061119794845581055, 0.00631946325302124, 0.006526947021484375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 6.0, 0.0, 0.0, 4.0, 0.0, 0.0, 11.0, 0.0, 9.0, 0.0, 0.0, 12.0, 0.0, 0.0, 8.0, 0.0, 14.0, 0.0, 0.0, 25.0, 0.0, 0.0, 33.0, 0.0, 69.0, 0.0, 0.0, 116.0, 0.0, 0.0, 399.0, 0.0, 113.0, 0.0, 0.0, 77.0, 0.0, 0.0, 29.0, 0.0, 27.0, 0.0, 0.0, 13.0, 0.0, 0.0, 21.0, 0.0, 11.0, 0.0, 0.0, 6.0, 0.0, 0.0, 7.0, 0.0, 5.0, 0.0, 0.0, 5.0, 0.0, 2.0], "bins": [-7.152557373046875e-07, -6.92903995513916e-07, -6.705522537231445e-07, -6.48200511932373e-07, -6.258487701416016e-07, -6.034970283508301e-07, -5.811452865600586e-07, -5.587935447692871e-07, -5.364418029785156e-07, -5.140900611877441e-07, -4.917383193969727e-07, -4.6938657760620117e-07, -4.470348358154297e-07, -4.246830940246582e-07, -4.023313522338867e-07, -3.7997961044311523e-07, -3.5762786865234375e-07, -3.3527612686157227e-07, -3.129243850708008e-07, -2.905726432800293e-07, -2.682209014892578e-07, -2.4586915969848633e-07, -2.2351741790771484e-07, -2.0116567611694336e-07, -1.7881393432617188e-07, -1.564621925354004e-07, -1.341104507446289e-07, -1.1175870895385742e-07, -8.940696716308594e-08, -6.705522537231445e-08, -4.470348358154297e-08, -2.2351741790771484e-08, 0.0, 2.2351741790771484e-08, 4.470348358154297e-08, 6.705522537231445e-08, 8.940696716308594e-08, 1.1175870895385742e-07, 1.341104507446289e-07, 1.564621925354004e-07, 1.7881393432617188e-07, 2.0116567611694336e-07, 2.2351741790771484e-07, 2.4586915969848633e-07, 2.682209014892578e-07, 2.905726432800293e-07, 3.129243850708008e-07, 3.3527612686157227e-07, 3.5762786865234375e-07, 3.7997961044311523e-07, 4.023313522338867e-07, 4.246830940246582e-07, 4.470348358154297e-07, 4.6938657760620117e-07, 4.917383193969727e-07, 5.140900611877441e-07, 5.364418029785156e-07, 5.587935447692871e-07, 5.811452865600586e-07, 6.034970283508301e-07, 6.258487701416016e-07, 6.48200511932373e-07, 6.705522537231445e-07, 6.92903995513916e-07, 7.152557373046875e-07]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 7.0, 5.0, 6.0, 11.0, 11.0, 13.0, 16.0, 22.0, 33.0, 37.0, 33.0, 48.0, 96.0, 130.0, 178.0, 328.0, 846.0, 13193.0, 763329.0, 264311.0, 4578.0, 471.0, 256.0, 149.0, 105.0, 84.0, 73.0, 29.0, 35.0, 24.0, 15.0, 15.0, 10.0, 6.0, 3.0, 2.0, 7.0, 4.0, 7.0, 3.0, 4.0, 5.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.1980533599853516e-05, -1.1604279279708862e-05, -1.1228024959564209e-05, -1.0851770639419556e-05, -1.0475516319274902e-05, -1.0099261999130249e-05, -9.723007678985596e-06, -9.346753358840942e-06, -8.970499038696289e-06, -8.594244718551636e-06, -8.217990398406982e-06, -7.841736078262329e-06, -7.465481758117676e-06, -7.0892274379730225e-06, -6.712973117828369e-06, -6.336718797683716e-06, -5.9604644775390625e-06, -5.584210157394409e-06, -5.207955837249756e-06, -4.8317015171051025e-06, -4.455447196960449e-06, -4.079192876815796e-06, -3.7029385566711426e-06, -3.3266842365264893e-06, -2.950429916381836e-06, -2.5741755962371826e-06, -2.1979212760925293e-06, -1.821666955947876e-06, -1.4454126358032227e-06, -1.0691583156585693e-06, -6.92903995513916e-07, -3.166496753692627e-07, 5.960464477539063e-08, 4.3585896492004395e-07, 8.121132850646973e-07, 1.1883676052093506e-06, 1.564621925354004e-06, 1.9408762454986572e-06, 2.3171305656433105e-06, 2.693384885787964e-06, 3.069639205932617e-06, 3.4458935260772705e-06, 3.822147846221924e-06, 4.198402166366577e-06, 4.5746564865112305e-06, 4.950910806655884e-06, 5.327165126800537e-06, 5.7034194469451904e-06, 6.079673767089844e-06, 6.455928087234497e-06, 6.83218240737915e-06, 7.208436727523804e-06, 7.584691047668457e-06, 7.96094536781311e-06, 8.337199687957764e-06, 8.713454008102417e-06, 9.08970832824707e-06, 9.465962648391724e-06, 9.842216968536377e-06, 1.021847128868103e-05, 1.0594725608825684e-05, 1.0970979928970337e-05, 1.134723424911499e-05, 1.1723488569259644e-05, 1.2099742889404297e-05]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 20.0, 26.0, 74.0, 118.0, 404.0, 168.0, 100.0, 49.0, 30.0, 11.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.429752374970121e-07, -6.088771442591678e-07, -5.747790510213235e-07, -5.406809009400604e-07, -5.065828077022161e-07, -4.724847144643718e-07, -4.3838659280481806e-07, -4.0428847114526434e-07, -3.7019037790742004e-07, -3.3609228466957575e-07, -3.01994163010022e-07, -2.678960413504683e-07, -2.33797948112624e-07, -1.99699840663925e-07, -1.6560173321522598e-07, -1.3150361155567225e-07, -9.740551831782795e-08, -6.330741086912894e-08, -2.9209303420429933e-08, 4.888804028269078e-09, 3.898691147696809e-08, 7.30850189256671e-08, 1.0718312637436611e-07, 1.4128124803391984e-07, 1.7537934127176413e-07, 2.0947744872046314e-07, 2.4357555616916216e-07, 2.776736778287159e-07, 3.117717710665602e-07, 3.4586986430440447e-07, 3.799679859639582e-07, 4.140661076235119e-07, 4.481640871745185e-07, 4.822621804123628e-07, 5.163602736502071e-07, 5.504584237314702e-07, 5.845565169693145e-07, 6.186546102071588e-07, 6.52752760288422e-07, 6.868508535262663e-07, 7.209489467641106e-07, 7.550470400019549e-07, 7.891451332397992e-07, 8.232432833210623e-07, 8.573413765589066e-07, 8.914394697967509e-07, 9.255376198780141e-07, 9.596357131158584e-07, 9.937338063537027e-07, 1.027831899591547e-06, 1.0619299928293913e-06, 1.0960280860672356e-06, 1.1301262929919176e-06, 1.1642243862297619e-06, 1.1983224794676062e-06, 1.2324205727054505e-06, 1.2665186659432948e-06, 1.300616759181139e-06, 1.3347148524189834e-06, 1.3688129456568277e-06, 1.402911038894672e-06, 1.437009245819354e-06, 1.4711073390571983e-06, 1.5052054322950426e-06, 1.5393035255328869e-06]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 0.0, 26.0, 0.0, 0.0, 0.0, 80.0, 0.0, 0.0, 0.0, 0.0, 198.0, 0.0, 0.0, 0.0, 0.0, 355.0, 0.0, 0.0, 0.0, 207.0, 0.0, 0.0, 0.0, 0.0, 78.0, 0.0, 0.0, 0.0, 31.0, 0.0, 0.0, 0.0, 0.0, 17.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.172325134277344e-07, -4.041939973831177e-07, -3.91155481338501e-07, -3.781169652938843e-07, -3.650784492492676e-07, -3.520399332046509e-07, -3.390014171600342e-07, -3.259629011154175e-07, -3.129243850708008e-07, -2.998858690261841e-07, -2.868473529815674e-07, -2.738088369369507e-07, -2.60770320892334e-07, -2.477318048477173e-07, -2.3469328880310059e-07, -2.2165477275848389e-07, -2.086162567138672e-07, -1.955777406692505e-07, -1.825392246246338e-07, -1.695007085800171e-07, -1.564621925354004e-07, -1.434236764907837e-07, -1.30385160446167e-07, -1.1734664440155029e-07, -1.043081283569336e-07, -9.12696123123169e-08, -7.82310962677002e-08, -6.51925802230835e-08, -5.21540641784668e-08, -3.91155481338501e-08, -2.60770320892334e-08, -1.30385160446167e-08, 0.0, 1.30385160446167e-08, 2.60770320892334e-08, 3.91155481338501e-08, 5.21540641784668e-08, 6.51925802230835e-08, 7.82310962677002e-08, 9.12696123123169e-08, 1.043081283569336e-07, 1.1734664440155029e-07, 1.30385160446167e-07, 1.434236764907837e-07, 1.564621925354004e-07, 1.695007085800171e-07, 1.825392246246338e-07, 1.955777406692505e-07, 2.086162567138672e-07, 2.2165477275848389e-07, 2.3469328880310059e-07, 2.477318048477173e-07, 2.60770320892334e-07, 2.738088369369507e-07, 2.868473529815674e-07, 2.998858690261841e-07, 3.129243850708008e-07, 3.259629011154175e-07, 3.390014171600342e-07, 3.520399332046509e-07, 3.650784492492676e-07, 3.781169652938843e-07, 3.91155481338501e-07, 4.041939973831177e-07, 4.172325134277344e-07]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 8.0, 8.0, 10.0, 9.0, 16.0, 17.0, 21.0, 20.0, 22.0, 32.0, 20.0, 26.0, 35.0, 41.0, 53.0, 40.0, 48.0, 51.0, 40.0, 56.0, 39.0, 41.0, 38.0, 46.0, 34.0, 33.0, 37.0, 30.0, 22.0, 28.0, 12.0, 16.0, 12.0, 7.0, 6.0, 5.0, 3.0, 5.0, 5.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.880859375, -2.7918701171875, -2.702880859375, -2.6138916015625, -2.52490234375, -2.4359130859375, -2.346923828125, -2.2579345703125, -2.1689453125, -2.0799560546875, -1.990966796875, -1.9019775390625, -1.81298828125, -1.7239990234375, -1.635009765625, -1.5460205078125, -1.45703125, -1.3680419921875, -1.279052734375, -1.1900634765625, -1.10107421875, -1.0120849609375, -0.923095703125, -0.8341064453125, -0.7451171875, -0.6561279296875, -0.567138671875, -0.4781494140625, -0.38916015625, -0.3001708984375, -0.211181640625, -0.1221923828125, -0.033203125, 0.0557861328125, 0.144775390625, 0.2337646484375, 0.32275390625, 0.4117431640625, 0.500732421875, 0.5897216796875, 0.6787109375, 0.7677001953125, 0.856689453125, 0.9456787109375, 1.03466796875, 1.1236572265625, 1.212646484375, 1.3016357421875, 1.390625, 1.4796142578125, 1.568603515625, 1.6575927734375, 1.74658203125, 1.8355712890625, 1.924560546875, 2.0135498046875, 2.1025390625, 2.1915283203125, 2.280517578125, 2.3695068359375, 2.45849609375, 2.5474853515625, 2.636474609375, 2.7254638671875, 2.814453125]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 14.0, 12.0, 19.0, 25.0, 32.0, 48.0, 63.0, 96.0, 149.0, 225.0, 296.0, 476.0, 662.0, 938.0, 1399.0, 2053.0, 2884.0, 4212.0, 6340.0, 9244.0, 14200.0, 22617.0, 38498.0, 78928.0, 324343.0, 352038.0, 81705.0, 39426.0, 23185.0, 14551.0, 9517.0, 6362.0, 4372.0, 3047.0, 2056.0, 1410.0, 925.0, 692.0, 455.0, 341.0, 244.0, 130.0, 113.0, 68.0, 46.0, 33.0, 32.0, 10.0, 7.0, 7.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.54296875, -2.46099853515625, -2.3790283203125, -2.29705810546875, -2.215087890625, -2.13311767578125, -2.0511474609375, -1.96917724609375, -1.88720703125, -1.80523681640625, -1.7232666015625, -1.64129638671875, -1.559326171875, -1.47735595703125, -1.3953857421875, -1.31341552734375, -1.2314453125, -1.14947509765625, -1.0675048828125, -0.98553466796875, -0.903564453125, -0.82159423828125, -0.7396240234375, -0.65765380859375, -0.57568359375, -0.49371337890625, -0.4117431640625, -0.32977294921875, -0.247802734375, -0.16583251953125, -0.0838623046875, -0.00189208984375, 0.080078125, 0.16204833984375, 0.2440185546875, 0.32598876953125, 0.407958984375, 0.48992919921875, 0.5718994140625, 0.65386962890625, 0.73583984375, 0.81781005859375, 0.8997802734375, 0.98175048828125, 1.063720703125, 1.14569091796875, 1.2276611328125, 1.30963134765625, 1.3916015625, 1.47357177734375, 1.5555419921875, 1.63751220703125, 1.719482421875, 1.80145263671875, 1.8834228515625, 1.96539306640625, 2.04736328125, 2.12933349609375, 2.2113037109375, 2.29327392578125, 2.375244140625, 2.45721435546875, 2.5391845703125, 2.62115478515625, 2.703125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 6.0, 10.0, 14.0, 16.0, 20.0, 11.0, 21.0, 28.0, 19.0, 18.0, 28.0, 31.0, 35.0, 29.0, 34.0, 53.0, 57.0, 116.0, 247.0, 1518.0, 169.0, 83.0, 56.0, 49.0, 28.0, 35.0, 43.0, 32.0, 34.0, 28.0, 18.0, 25.0, 18.0, 23.0, 13.0, 13.0, 15.0, 9.0, 12.0, 6.0, 5.0, 3.0, 3.0, 4.0, 0.0, 0.0, 3.0, 5.0, 2.0, 2.0], "bins": [-8.0546875, -7.81268310546875, -7.5706787109375, -7.32867431640625, -7.086669921875, -6.84466552734375, -6.6026611328125, -6.36065673828125, -6.11865234375, -5.87664794921875, -5.6346435546875, -5.39263916015625, -5.150634765625, -4.90863037109375, -4.6666259765625, -4.42462158203125, -4.1826171875, -3.94061279296875, -3.6986083984375, -3.45660400390625, -3.214599609375, -2.97259521484375, -2.7305908203125, -2.48858642578125, -2.24658203125, -2.00457763671875, -1.7625732421875, -1.52056884765625, -1.278564453125, -1.03656005859375, -0.7945556640625, -0.55255126953125, -0.310546875, -0.06854248046875, 0.1734619140625, 0.41546630859375, 0.657470703125, 0.89947509765625, 1.1414794921875, 1.38348388671875, 1.62548828125, 1.86749267578125, 2.1094970703125, 2.35150146484375, 2.593505859375, 2.83551025390625, 3.0775146484375, 3.31951904296875, 3.5615234375, 3.80352783203125, 4.0455322265625, 4.28753662109375, 4.529541015625, 4.77154541015625, 5.0135498046875, 5.25555419921875, 5.49755859375, 5.73956298828125, 5.9815673828125, 6.22357177734375, 6.465576171875, 6.70758056640625, 6.9495849609375, 7.19158935546875, 7.43359375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 1.0, 2.0, 7.0, 5.0, 10.0, 10.0, 10.0, 9.0, 12.0, 22.0, 26.0, 35.0, 41.0, 57.0, 71.0, 84.0, 111.0, 161.0, 243.0, 502.0, 1729.0, 9469.0, 98556.0, 2871154.0, 147948.0, 11967.0, 2018.0, 541.0, 282.0, 152.0, 125.0, 83.0, 49.0, 42.0, 39.0, 38.0, 23.0, 20.0, 13.0, 13.0, 13.0, 1.0, 1.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0], "bins": [-15.28125, -14.839111328125, -14.39697265625, -13.954833984375, -13.5126953125, -13.070556640625, -12.62841796875, -12.186279296875, -11.744140625, -11.302001953125, -10.85986328125, -10.417724609375, -9.9755859375, -9.533447265625, -9.09130859375, -8.649169921875, -8.20703125, -7.764892578125, -7.32275390625, -6.880615234375, -6.4384765625, -5.996337890625, -5.55419921875, -5.112060546875, -4.669921875, -4.227783203125, -3.78564453125, -3.343505859375, -2.9013671875, -2.459228515625, -2.01708984375, -1.574951171875, -1.1328125, -0.690673828125, -0.24853515625, 0.193603515625, 0.6357421875, 1.077880859375, 1.52001953125, 1.962158203125, 2.404296875, 2.846435546875, 3.28857421875, 3.730712890625, 4.1728515625, 4.614990234375, 5.05712890625, 5.499267578125, 5.94140625, 6.383544921875, 6.82568359375, 7.267822265625, 7.7099609375, 8.152099609375, 8.59423828125, 9.036376953125, 9.478515625, 9.920654296875, 10.36279296875, 10.804931640625, 11.2470703125, 11.689208984375, 12.13134765625, 12.573486328125, 13.015625]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 51.0, 428.0, 441.0, 88.0, 7.0], "bins": [-173.51063537597656, -170.66748046875, -167.82432556152344, -164.98117065429688, -162.13803100585938, -159.2948760986328, -156.45172119140625, -153.6085662841797, -150.76541137695312, -147.92225646972656, -145.0791015625, -142.23594665527344, -139.39279174804688, -136.54965209960938, -133.7064971923828, -130.86334228515625, -128.0201873779297, -125.17703247070312, -122.33387756347656, -119.49073028564453, -116.64757537841797, -113.8044204711914, -110.96127319335938, -108.11811828613281, -105.27496337890625, -102.43180847167969, -99.58865356445312, -96.7455062866211, -93.90235137939453, -91.05919647216797, -88.21604919433594, -85.37289428710938, -82.52973937988281, -79.68658447265625, -76.84342956542969, -74.00028228759766, -71.1571273803711, -68.31397247314453, -65.4708251953125, -62.62767028808594, -59.784515380859375, -56.94136047363281, -54.098209381103516, -51.25505828857422, -48.411903381347656, -45.568748474121094, -42.7255973815918, -39.8824462890625, -37.03929138183594, -34.196136474609375, -31.352985382080078, -28.50983238220215, -25.66667938232422, -22.82352638244629, -19.98037338256836, -17.13722038269043, -14.2940673828125, -11.45091438293457, -8.60776138305664, -5.764608383178711, -2.9214553833007812, -0.07830238342285156, 2.764850616455078, 5.608003616333008, 8.451156616210938]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 5.0, 2.0, 3.0, 5.0, 2.0, 9.0, 10.0, 7.0, 7.0, 15.0, 10.0, 22.0, 17.0, 22.0, 26.0, 22.0, 32.0, 28.0, 48.0, 32.0, 42.0, 42.0, 45.0, 44.0, 45.0, 47.0, 34.0, 46.0, 27.0, 30.0, 43.0, 22.0, 24.0, 19.0, 33.0, 15.0, 22.0, 9.0, 14.0, 10.0, 9.0, 16.0, 12.0, 14.0, 2.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 5.0, 0.0, 0.0, 1.0, 2.0], "bins": [-24.727693557739258, -23.95778465270996, -23.187877655029297, -22.41796875, -21.648059844970703, -20.878150939941406, -20.108243942260742, -19.338335037231445, -18.56842613220215, -17.79851722717285, -17.028610229492188, -16.25870132446289, -15.488792419433594, -14.718884468078613, -13.948976516723633, -13.179067611694336, -12.409159660339355, -11.639251708984375, -10.869342803955078, -10.099434852600098, -9.3295259475708, -8.55961799621582, -7.789709568023682, -7.019801139831543, -6.249892711639404, -5.479984283447266, -4.710075855255127, -3.9401676654815674, -3.1702592372894287, -2.40035080909729, -1.6304426193237305, -0.8605341911315918, -0.09062576293945312, 0.6792826056480408, 1.4491909742355347, 2.219099283218384, 2.9890077114105225, 3.758916139602661, 4.528824329376221, 5.298732757568359, 6.068641185760498, 6.838549613952637, 7.608458042144775, 8.378366470336914, 9.148274421691895, 9.918183326721191, 10.688091278076172, 11.458000183105469, 12.22790813446045, 12.99781608581543, 13.767724990844727, 14.537632942199707, 15.307541847229004, 16.077449798583984, 16.84735870361328, 17.617267608642578, 18.387174606323242, 19.15708351135254, 19.926990509033203, 20.6968994140625, 21.466808319091797, 22.236717224121094, 23.006624221801758, 23.776533126831055, 24.54644203186035]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 4.0, 10.0, 14.0, 13.0, 21.0, 16.0, 29.0, 21.0, 22.0, 30.0, 32.0, 36.0, 39.0, 48.0, 43.0, 47.0, 53.0, 57.0, 54.0, 26.0, 44.0, 51.0, 42.0, 37.0, 25.0, 39.0, 26.0, 23.0, 23.0, 14.0, 10.0, 8.0, 8.0, 2.0, 4.0, 8.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.98828125, -2.894805908203125, -2.80133056640625, -2.707855224609375, -2.6143798828125, -2.520904541015625, -2.42742919921875, -2.333953857421875, -2.240478515625, -2.147003173828125, -2.05352783203125, -1.960052490234375, -1.8665771484375, -1.773101806640625, -1.67962646484375, -1.586151123046875, -1.49267578125, -1.399200439453125, -1.30572509765625, -1.212249755859375, -1.1187744140625, -1.025299072265625, -0.93182373046875, -0.838348388671875, -0.744873046875, -0.651397705078125, -0.55792236328125, -0.464447021484375, -0.3709716796875, -0.277496337890625, -0.18402099609375, -0.090545654296875, 0.0029296875, 0.096405029296875, 0.18988037109375, 0.283355712890625, 0.3768310546875, 0.470306396484375, 0.56378173828125, 0.657257080078125, 0.750732421875, 0.844207763671875, 0.93768310546875, 1.031158447265625, 1.1246337890625, 1.218109130859375, 1.31158447265625, 1.405059814453125, 1.49853515625, 1.592010498046875, 1.68548583984375, 1.778961181640625, 1.8724365234375, 1.965911865234375, 2.05938720703125, 2.152862548828125, 2.246337890625, 2.339813232421875, 2.43328857421875, 2.526763916015625, 2.6202392578125, 2.713714599609375, 2.80718994140625, 2.900665283203125, 2.994140625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 4.0, 11.0, 11.0, 22.0, 15.0, 30.0, 38.0, 46.0, 64.0, 117.0, 133.0, 189.0, 289.0, 429.0, 771.0, 1361.0, 2410.0, 4966.0, 10401.0, 24482.0, 64533.0, 206539.0, 828174.0, 1966499.0, 779391.0, 196430.0, 62711.0, 23819.0, 9902.0, 4660.0, 2432.0, 1295.0, 680.0, 473.0, 295.0, 186.0, 127.0, 104.0, 62.0, 43.0, 31.0, 25.0, 17.0, 14.0, 11.0, 15.0, 9.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0], "bins": [-5.296875, -5.14324951171875, -4.9896240234375, -4.83599853515625, -4.682373046875, -4.52874755859375, -4.3751220703125, -4.22149658203125, -4.06787109375, -3.91424560546875, -3.7606201171875, -3.60699462890625, -3.453369140625, -3.29974365234375, -3.1461181640625, -2.99249267578125, -2.8388671875, -2.68524169921875, -2.5316162109375, -2.37799072265625, -2.224365234375, -2.07073974609375, -1.9171142578125, -1.76348876953125, -1.60986328125, -1.45623779296875, -1.3026123046875, -1.14898681640625, -0.995361328125, -0.84173583984375, -0.6881103515625, -0.53448486328125, -0.380859375, -0.22723388671875, -0.0736083984375, 0.08001708984375, 0.233642578125, 0.38726806640625, 0.5408935546875, 0.69451904296875, 0.84814453125, 1.00177001953125, 1.1553955078125, 1.30902099609375, 1.462646484375, 1.61627197265625, 1.7698974609375, 1.92352294921875, 2.0771484375, 2.23077392578125, 2.3843994140625, 2.53802490234375, 2.691650390625, 2.84527587890625, 2.9989013671875, 3.15252685546875, 3.30615234375, 3.45977783203125, 3.6134033203125, 3.76702880859375, 3.920654296875, 4.07427978515625, 4.2279052734375, 4.38153076171875, 4.53515625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 8.0, 4.0, 6.0, 9.0, 12.0, 20.0, 31.0, 56.0, 82.0, 127.0, 182.0, 269.0, 440.0, 573.0, 656.0, 519.0, 358.0, 245.0, 181.0, 101.0, 63.0, 49.0, 29.0, 31.0, 5.0, 7.0, 9.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.1484375, -10.871826171875, -10.59521484375, -10.318603515625, -10.0419921875, -9.765380859375, -9.48876953125, -9.212158203125, -8.935546875, -8.658935546875, -8.38232421875, -8.105712890625, -7.8291015625, -7.552490234375, -7.27587890625, -6.999267578125, -6.72265625, -6.446044921875, -6.16943359375, -5.892822265625, -5.6162109375, -5.339599609375, -5.06298828125, -4.786376953125, -4.509765625, -4.233154296875, -3.95654296875, -3.679931640625, -3.4033203125, -3.126708984375, -2.85009765625, -2.573486328125, -2.296875, -2.020263671875, -1.74365234375, -1.467041015625, -1.1904296875, -0.913818359375, -0.63720703125, -0.360595703125, -0.083984375, 0.192626953125, 0.46923828125, 0.745849609375, 1.0224609375, 1.299072265625, 1.57568359375, 1.852294921875, 2.12890625, 2.405517578125, 2.68212890625, 2.958740234375, 3.2353515625, 3.511962890625, 3.78857421875, 4.065185546875, 4.341796875, 4.618408203125, 4.89501953125, 5.171630859375, 5.4482421875, 5.724853515625, 6.00146484375, 6.278076171875, 6.5546875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 9.0, 20.0, 19.0, 32.0, 72.0, 111.0, 173.0, 305.0, 763.0, 2226.0, 13651.0, 176868.0, 3071076.0, 877040.0, 44686.0, 4999.0, 1190.0, 481.0, 247.0, 123.0, 65.0, 38.0, 28.0, 17.0, 13.0, 14.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.140625, -13.5693359375, -12.998046875, -12.4267578125, -11.85546875, -11.2841796875, -10.712890625, -10.1416015625, -9.5703125, -8.9990234375, -8.427734375, -7.8564453125, -7.28515625, -6.7138671875, -6.142578125, -5.5712890625, -5.0, -4.4287109375, -3.857421875, -3.2861328125, -2.71484375, -2.1435546875, -1.572265625, -1.0009765625, -0.4296875, 0.1416015625, 0.712890625, 1.2841796875, 1.85546875, 2.4267578125, 2.998046875, 3.5693359375, 4.140625, 4.7119140625, 5.283203125, 5.8544921875, 6.42578125, 6.9970703125, 7.568359375, 8.1396484375, 8.7109375, 9.2822265625, 9.853515625, 10.4248046875, 10.99609375, 11.5673828125, 12.138671875, 12.7099609375, 13.28125, 13.8525390625, 14.423828125, 14.9951171875, 15.56640625, 16.1376953125, 16.708984375, 17.2802734375, 17.8515625, 18.4228515625, 18.994140625, 19.5654296875, 20.13671875, 20.7080078125, 21.279296875, 21.8505859375, 22.421875]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 11.0, 22.0, 38.0, 58.0, 84.0, 89.0, 130.0, 116.0, 125.0, 99.0, 72.0, 66.0, 39.0, 24.0, 18.0, 8.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.1524658203125, -49.63003921508789, -48.107608795166016, -46.585182189941406, -45.0627555847168, -43.54032897949219, -42.01789855957031, -40.4954719543457, -38.973045349121094, -37.450618743896484, -35.92818832397461, -34.40576171875, -32.88333511352539, -31.36090660095215, -29.838478088378906, -28.316051483154297, -26.793621063232422, -25.27119255065918, -23.74876594543457, -22.226337432861328, -20.70391082763672, -19.181482315063477, -17.659053802490234, -16.136627197265625, -14.614198684692383, -13.091771125793457, -11.569343566894531, -10.046915054321289, -8.524487495422363, -7.0020599365234375, -5.479631423950195, -3.9572038650512695, -2.4347763061523438, -0.9123485088348389, 0.610079288482666, 2.13250732421875, 3.654934883117676, 5.177362442016602, 6.699790954589844, 8.22221851348877, 9.744646072387695, 11.267073631286621, 12.789501190185547, 14.311929702758789, 15.834357261657715, 17.35678482055664, 18.879213333129883, 20.401641845703125, 21.924068450927734, 23.446496963500977, 24.968923568725586, 26.491352081298828, 28.013778686523438, 29.53620719909668, 31.058635711669922, 32.58106231689453, 34.103492736816406, 35.625919342041016, 37.14834976196289, 38.6707763671875, 40.19320297241211, 41.71562957763672, 43.238059997558594, 44.7604866027832, 46.28291320800781]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 6.0, 5.0, 4.0, 8.0, 4.0, 8.0, 9.0, 18.0, 12.0, 13.0, 27.0, 13.0, 21.0, 24.0, 26.0, 31.0, 38.0, 43.0, 42.0, 35.0, 42.0, 36.0, 38.0, 45.0, 38.0, 42.0, 44.0, 39.0, 37.0, 31.0, 32.0, 25.0, 28.0, 23.0, 22.0, 12.0, 14.0, 14.0, 12.0, 12.0, 4.0, 5.0, 6.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-21.444656372070312, -20.770015716552734, -20.095375061035156, -19.420732498168945, -18.746091842651367, -18.07145118713379, -17.396808624267578, -16.72216796875, -16.047527313232422, -15.372886657714844, -14.69824504852295, -14.023603439331055, -13.348962783813477, -12.674322128295898, -11.999680519104004, -11.32503890991211, -10.650398254394531, -9.975757598876953, -9.301115989685059, -8.626474380493164, -7.951833724975586, -7.27719259262085, -6.602551460266113, -5.927910327911377, -5.253269195556641, -4.578628063201904, -3.903986930847168, -3.2293457984924316, -2.5547046661376953, -1.880063533782959, -1.2054224014282227, -0.5307812690734863, 0.14385986328125, 0.8185009956359863, 1.4931421279907227, 2.167783260345459, 2.8424243927001953, 3.5170655250549316, 4.191706657409668, 4.866347789764404, 5.540988922119141, 6.215630054473877, 6.890271186828613, 7.56491231918335, 8.239553451538086, 8.914194107055664, 9.588835716247559, 10.263477325439453, 10.938117980957031, 11.61275863647461, 12.287400245666504, 12.962041854858398, 13.636682510375977, 14.311323165893555, 14.98596477508545, 15.660606384277344, 16.335247039794922, 17.0098876953125, 17.684528350830078, 18.35917091369629, 19.033811569213867, 19.708452224731445, 20.383094787597656, 21.057735443115234, 21.732376098632812]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 7.0, 4.0, 9.0, 7.0, 9.0, 21.0, 13.0, 20.0, 14.0, 20.0, 28.0, 25.0, 35.0, 39.0, 36.0, 40.0, 36.0, 44.0, 59.0, 41.0, 52.0, 43.0, 40.0, 45.0, 42.0, 42.0, 34.0, 36.0, 24.0, 26.0, 20.0, 21.0, 16.0, 11.0, 11.0, 6.0, 4.0, 6.0, 7.0, 7.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.736328125, -2.64422607421875, -2.5521240234375, -2.46002197265625, -2.367919921875, -2.27581787109375, -2.1837158203125, -2.09161376953125, -1.99951171875, -1.90740966796875, -1.8153076171875, -1.72320556640625, -1.631103515625, -1.53900146484375, -1.4468994140625, -1.35479736328125, -1.2626953125, -1.17059326171875, -1.0784912109375, -0.98638916015625, -0.894287109375, -0.80218505859375, -0.7100830078125, -0.61798095703125, -0.52587890625, -0.43377685546875, -0.3416748046875, -0.24957275390625, -0.157470703125, -0.06536865234375, 0.0267333984375, 0.11883544921875, 0.2109375, 0.30303955078125, 0.3951416015625, 0.48724365234375, 0.579345703125, 0.67144775390625, 0.7635498046875, 0.85565185546875, 0.94775390625, 1.03985595703125, 1.1319580078125, 1.22406005859375, 1.316162109375, 1.40826416015625, 1.5003662109375, 1.59246826171875, 1.6845703125, 1.77667236328125, 1.8687744140625, 1.96087646484375, 2.052978515625, 2.14508056640625, 2.2371826171875, 2.32928466796875, 2.42138671875, 2.51348876953125, 2.6055908203125, 2.69769287109375, 2.789794921875, 2.88189697265625, 2.9739990234375, 3.06610107421875, 3.158203125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 2.0, 7.0, 5.0, 13.0, 17.0, 19.0, 32.0, 57.0, 75.0, 87.0, 151.0, 210.0, 347.0, 539.0, 879.0, 1411.0, 2207.0, 3724.0, 6135.0, 10572.0, 18215.0, 32543.0, 62250.0, 128957.0, 304194.0, 248561.0, 106992.0, 52668.0, 28192.0, 15892.0, 9260.0, 5563.0, 3380.0, 2018.0, 1242.0, 755.0, 492.0, 284.0, 192.0, 120.0, 95.0, 71.0, 35.0, 36.0, 29.0, 11.0, 4.0, 9.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.025665283203125, -0.024834156036376953, -0.024003028869628906, -0.02317190170288086, -0.022340774536132812, -0.021509647369384766, -0.02067852020263672, -0.019847393035888672, -0.019016265869140625, -0.018185138702392578, -0.01735401153564453, -0.016522884368896484, -0.015691757202148438, -0.01486063003540039, -0.014029502868652344, -0.013198375701904297, -0.01236724853515625, -0.011536121368408203, -0.010704994201660156, -0.00987386703491211, -0.009042739868164062, -0.008211612701416016, -0.007380485534667969, -0.006549358367919922, -0.005718231201171875, -0.004887104034423828, -0.004055976867675781, -0.0032248497009277344, -0.0023937225341796875, -0.0015625953674316406, -0.0007314682006835938, 9.965896606445312e-05, 0.0009307861328125, 0.0017619132995605469, 0.0025930404663085938, 0.0034241676330566406, 0.0042552947998046875, 0.005086421966552734, 0.005917549133300781, 0.006748676300048828, 0.007579803466796875, 0.008410930633544922, 0.009242057800292969, 0.010073184967041016, 0.010904312133789062, 0.01173543930053711, 0.012566566467285156, 0.013397693634033203, 0.01422882080078125, 0.015059947967529297, 0.015891075134277344, 0.01672220230102539, 0.017553329467773438, 0.018384456634521484, 0.01921558380126953, 0.020046710968017578, 0.020877838134765625, 0.021708965301513672, 0.02254009246826172, 0.023371219635009766, 0.024202346801757812, 0.02503347396850586, 0.025864601135253906, 0.026695728302001953, 0.02752685546875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 4.0, 10.0, 13.0, 16.0, 16.0, 15.0, 20.0, 19.0, 23.0, 33.0, 21.0, 25.0, 33.0, 37.0, 30.0, 27.0, 40.0, 37.0, 28.0, 1073.0, 36.0, 28.0, 36.0, 39.0, 37.0, 36.0, 40.0, 21.0, 23.0, 27.0, 22.0, 20.0, 25.0, 18.0, 12.0, 17.0, 10.0, 9.0, 10.0, 6.0, 5.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-1.931640625, -1.8748016357421875, -1.817962646484375, -1.7611236572265625, -1.70428466796875, -1.6474456787109375, -1.590606689453125, -1.5337677001953125, -1.4769287109375, -1.4200897216796875, -1.363250732421875, -1.3064117431640625, -1.24957275390625, -1.1927337646484375, -1.135894775390625, -1.0790557861328125, -1.022216796875, -0.9653778076171875, -0.908538818359375, -0.8516998291015625, -0.79486083984375, -0.7380218505859375, -0.681182861328125, -0.6243438720703125, -0.5675048828125, -0.5106658935546875, -0.453826904296875, -0.3969879150390625, -0.34014892578125, -0.2833099365234375, -0.226470947265625, -0.1696319580078125, -0.11279296875, -0.0559539794921875, 0.000885009765625, 0.0577239990234375, 0.11456298828125, 0.1714019775390625, 0.228240966796875, 0.2850799560546875, 0.3419189453125, 0.3987579345703125, 0.455596923828125, 0.5124359130859375, 0.56927490234375, 0.6261138916015625, 0.682952880859375, 0.7397918701171875, 0.796630859375, 0.8534698486328125, 0.910308837890625, 0.9671478271484375, 1.02398681640625, 1.0808258056640625, 1.137664794921875, 1.1945037841796875, 1.2513427734375, 1.3081817626953125, 1.365020751953125, 1.4218597412109375, 1.47869873046875, 1.5355377197265625, 1.592376708984375, 1.6492156982421875, 1.7060546875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 4.0, 7.0, 10.0, 8.0, 19.0, 26.0, 41.0, 69.0, 76.0, 120.0, 181.0, 250.0, 344.0, 489.0, 741.0, 1062.0, 1510.0, 2206.0, 3279.0, 4785.0, 7088.0, 10668.0, 15536.0, 23248.0, 35246.0, 53335.0, 81398.0, 125341.0, 1228896.0, 169504.0, 113221.0, 73586.0, 47609.0, 31746.0, 21446.0, 14224.0, 9552.0, 6363.0, 4428.0, 2947.0, 1997.0, 1455.0, 966.0, 657.0, 426.0, 295.0, 200.0, 164.0, 131.0, 67.0, 57.0, 35.0, 26.0, 26.0, 11.0, 11.0, 5.0, 3.0, 1.0, 1.0], "bins": [-0.00658416748046875, -0.0063838958740234375, -0.006183624267578125, -0.0059833526611328125, -0.0057830810546875, -0.0055828094482421875, -0.005382537841796875, -0.0051822662353515625, -0.00498199462890625, -0.0047817230224609375, -0.004581451416015625, -0.0043811798095703125, -0.004180908203125, -0.0039806365966796875, -0.003780364990234375, -0.0035800933837890625, -0.00337982177734375, -0.0031795501708984375, -0.002979278564453125, -0.0027790069580078125, -0.0025787353515625, -0.0023784637451171875, -0.002178192138671875, -0.0019779205322265625, -0.00177764892578125, -0.0015773773193359375, -0.001377105712890625, -0.0011768341064453125, -0.0009765625, -0.0007762908935546875, -0.000576019287109375, -0.0003757476806640625, -0.00017547607421875, 2.47955322265625e-05, 0.000225067138671875, 0.0004253387451171875, 0.0006256103515625, 0.0008258819580078125, 0.001026153564453125, 0.0012264251708984375, 0.00142669677734375, 0.0016269683837890625, 0.001827239990234375, 0.0020275115966796875, 0.002227783203125, 0.0024280548095703125, 0.002628326416015625, 0.0028285980224609375, 0.00302886962890625, 0.0032291412353515625, 0.003429412841796875, 0.0036296844482421875, 0.0038299560546875, 0.0040302276611328125, 0.004230499267578125, 0.0044307708740234375, 0.00463104248046875, 0.0048313140869140625, 0.005031585693359375, 0.0052318572998046875, 0.00543212890625, 0.0056324005126953125, 0.005832672119140625, 0.0060329437255859375, 0.00623321533203125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 5.0, 0.0, 5.0, 0.0, 6.0, 0.0, 10.0, 0.0, 0.0, 15.0, 0.0, 22.0, 0.0, 33.0, 0.0, 68.0, 0.0, 143.0, 0.0, 399.0, 0.0, 140.0, 0.0, 71.0, 0.0, 38.0, 0.0, 23.0, 0.0, 10.0, 0.0, 9.0, 0.0, 8.0, 0.0, 5.0, 0.0, 4.0, 0.0, 3.0], "bins": [-1.2516975402832031e-06, -1.2228265404701233e-06, -1.1939555406570435e-06, -1.1650845408439636e-06, -1.1362135410308838e-06, -1.107342541217804e-06, -1.0784715414047241e-06, -1.0496005415916443e-06, -1.0207295417785645e-06, -9.918585419654846e-07, -9.629875421524048e-07, -9.34116542339325e-07, -9.052455425262451e-07, -8.763745427131653e-07, -8.475035429000854e-07, -8.186325430870056e-07, -7.897615432739258e-07, -7.60890543460846e-07, -7.320195436477661e-07, -7.031485438346863e-07, -6.742775440216064e-07, -6.454065442085266e-07, -6.165355443954468e-07, -5.876645445823669e-07, -5.587935447692871e-07, -5.299225449562073e-07, -5.010515451431274e-07, -4.721805453300476e-07, -4.4330954551696777e-07, -4.1443854570388794e-07, -3.855675458908081e-07, -3.5669654607772827e-07, -3.2782554626464844e-07, -2.989545464515686e-07, -2.7008354663848877e-07, -2.4121254682540894e-07, -2.123415470123291e-07, -1.8347054719924927e-07, -1.5459954738616943e-07, -1.257285475730896e-07, -9.685754776000977e-08, -6.798654794692993e-08, -3.91155481338501e-08, -1.0244548320770264e-08, 1.862645149230957e-08, 4.7497451305389404e-08, 7.636845111846924e-08, 1.0523945093154907e-07, 1.341104507446289e-07, 1.6298145055770874e-07, 1.9185245037078857e-07, 2.207234501838684e-07, 2.4959444999694824e-07, 2.784654498100281e-07, 3.073364496231079e-07, 3.3620744943618774e-07, 3.650784492492676e-07, 3.939494490623474e-07, 4.2282044887542725e-07, 4.516914486885071e-07, 4.805624485015869e-07, 5.094334483146667e-07, 5.383044481277466e-07, 5.671754479408264e-07, 5.960464477539062e-07]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 6.0, 5.0, 13.0, 18.0, 10.0, 43.0, 68.0, 86.0, 154.0, 350.0, 2532.0, 273010.0, 767677.0, 3749.0, 395.0, 163.0, 88.0, 63.0, 44.0, 13.0, 16.0, 10.0, 10.0, 5.0, 3.0, 6.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.138448715209961e-05, -1.0868534445762634e-05, -1.035258173942566e-05, -9.836629033088684e-06, -9.320676326751709e-06, -8.804723620414734e-06, -8.288770914077759e-06, -7.772818207740784e-06, -7.256865501403809e-06, -6.7409127950668335e-06, -6.224960088729858e-06, -5.709007382392883e-06, -5.193054676055908e-06, -4.677101969718933e-06, -4.161149263381958e-06, -3.645196557044983e-06, -3.129243850708008e-06, -2.6132911443710327e-06, -2.0973384380340576e-06, -1.5813857316970825e-06, -1.0654330253601074e-06, -5.494803190231323e-07, -3.3527612686157227e-08, 4.824250936508179e-07, 9.98377799987793e-07, 1.514330506324768e-06, 2.030283212661743e-06, 2.5462359189987183e-06, 3.0621886253356934e-06, 3.5781413316726685e-06, 4.0940940380096436e-06, 4.610046744346619e-06, 5.125999450683594e-06, 5.641952157020569e-06, 6.157904863357544e-06, 6.673857569694519e-06, 7.189810276031494e-06, 7.70576298236847e-06, 8.221715688705444e-06, 8.73766839504242e-06, 9.253621101379395e-06, 9.76957380771637e-06, 1.0285526514053345e-05, 1.080147922039032e-05, 1.1317431926727295e-05, 1.183338463306427e-05, 1.2349337339401245e-05, 1.286529004573822e-05, 1.3381242752075195e-05, 1.389719545841217e-05, 1.4413148164749146e-05, 1.492910087108612e-05, 1.5445053577423096e-05, 1.596100628376007e-05, 1.6476958990097046e-05, 1.699291169643402e-05, 1.7508864402770996e-05, 1.802481710910797e-05, 1.8540769815444946e-05, 1.905672252178192e-05, 1.9572675228118896e-05, 2.008862793445587e-05, 2.0604580640792847e-05, 2.1120533347129822e-05, 2.1636486053466797e-05]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 15.0, 111.0, 555.0, 278.0, 51.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.494871402333956e-06, -5.396424512582598e-06, -5.297977168083889e-06, -5.1995302783325315e-06, -5.1010833885811735e-06, -5.002636044082465e-06, -4.904189154331107e-06, -4.805742264579749e-06, -4.70729492008104e-06, -4.608848030329682e-06, -4.510400685830973e-06, -4.411953796079615e-06, -4.313506906328257e-06, -4.215059561829548e-06, -4.11661267207819e-06, -4.018165782326832e-06, -3.9197188925754745e-06, -3.8212720028241165e-06, -3.722824885699083e-06, -3.6243777685740497e-06, -3.5259306514490163e-06, -3.4274837616976583e-06, -3.329036644572625e-06, -3.230589754821267e-06, -3.132142410322558e-06, -3.0336952931975247e-06, -2.9352484034461668e-06, -2.8368012863211334e-06, -2.7383541691961e-06, -2.639907279444742e-06, -2.5414601623197086e-06, -2.4430132725683507e-06, -2.3445663828169927e-06, -2.2461192656919593e-06, -2.1476723759406013e-06, -2.049225258815568e-06, -1.9507781416905345e-06, -1.8523312519391766e-06, -1.7538841348141432e-06, -1.6554371313759475e-06, -1.5569899005640764e-06, -1.4585428971258807e-06, -1.3600957800008473e-06, -1.2616487765626516e-06, -1.163201773124456e-06, -1.0647547696862603e-06, -9.663076525612269e-07, -8.678606491230312e-07, -7.694136456848355e-07, -6.70966585403221e-07, -5.725195819650253e-07, -4.7407252168341074e-07, -3.7562548982350563e-07, -2.771784579636005e-07, -1.7873139768198598e-07, -8.02843942437903e-08, 1.8162666037824238e-08, 1.166097050031567e-07, 2.1505674396848917e-07, 3.13503790039249e-07, 4.119508218991541e-07, 5.103978537590592e-07, 6.088449140406738e-07, 7.072919174788694e-07, 8.05738977760484e-07]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 11.0, 0.0, 0.0, 0.0, 0.0, 32.0, 0.0, 0.0, 0.0, 0.0, 93.0, 0.0, 0.0, 0.0, 0.0, 217.0, 0.0, 0.0, 0.0, 0.0, 323.0, 0.0, 0.0, 0.0, 0.0, 200.0, 0.0, 0.0, 0.0, 0.0, 84.0, 0.0, 0.0, 0.0, 0.0, 36.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.5762786865234375e-07, -3.4552067518234253e-07, -3.334134817123413e-07, -3.213062882423401e-07, -3.0919909477233887e-07, -2.9709190130233765e-07, -2.849847078323364e-07, -2.728775143623352e-07, -2.60770320892334e-07, -2.4866312742233276e-07, -2.3655593395233154e-07, -2.2444874048233032e-07, -2.123415470123291e-07, -2.0023435354232788e-07, -1.8812716007232666e-07, -1.7601996660232544e-07, -1.6391277313232422e-07, -1.51805579662323e-07, -1.3969838619232178e-07, -1.2759119272232056e-07, -1.1548399925231934e-07, -1.0337680578231812e-07, -9.12696123123169e-08, -7.916241884231567e-08, -6.705522537231445e-08, -5.494803190231323e-08, -4.284083843231201e-08, -3.073364496231079e-08, -1.862645149230957e-08, -6.51925802230835e-09, 5.587935447692871e-09, 1.7695128917694092e-08, 2.9802322387695312e-08, 4.190951585769653e-08, 5.4016709327697754e-08, 6.612390279769897e-08, 7.82310962677002e-08, 9.033828973770142e-08, 1.0244548320770264e-07, 1.1455267667770386e-07, 1.2665987014770508e-07, 1.387670636177063e-07, 1.5087425708770752e-07, 1.6298145055770874e-07, 1.7508864402770996e-07, 1.8719583749771118e-07, 1.993030309677124e-07, 2.1141022443771362e-07, 2.2351741790771484e-07, 2.3562461137771606e-07, 2.477318048477173e-07, 2.598389983177185e-07, 2.7194619178771973e-07, 2.8405338525772095e-07, 2.9616057872772217e-07, 3.082677721977234e-07, 3.203749656677246e-07, 3.3248215913772583e-07, 3.4458935260772705e-07, 3.5669654607772827e-07, 3.688037395477295e-07, 3.809109330177307e-07, 3.9301812648773193e-07, 4.0512531995773315e-07, 4.172325134277344e-07]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 7.0, 4.0, 9.0, 7.0, 9.0, 21.0, 13.0, 20.0, 14.0, 20.0, 28.0, 25.0, 35.0, 39.0, 36.0, 40.0, 36.0, 44.0, 59.0, 41.0, 52.0, 43.0, 40.0, 45.0, 42.0, 42.0, 34.0, 36.0, 24.0, 26.0, 20.0, 21.0, 16.0, 11.0, 11.0, 6.0, 4.0, 6.0, 7.0, 7.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.736328125, -2.64422607421875, -2.5521240234375, -2.46002197265625, -2.367919921875, -2.27581787109375, -2.1837158203125, -2.09161376953125, -1.99951171875, -1.90740966796875, -1.8153076171875, -1.72320556640625, -1.631103515625, -1.53900146484375, -1.4468994140625, -1.35479736328125, -1.2626953125, -1.17059326171875, -1.0784912109375, -0.98638916015625, -0.894287109375, -0.80218505859375, -0.7100830078125, -0.61798095703125, -0.52587890625, -0.43377685546875, -0.3416748046875, -0.24957275390625, -0.157470703125, -0.06536865234375, 0.0267333984375, 0.11883544921875, 0.2109375, 0.30303955078125, 0.3951416015625, 0.48724365234375, 0.579345703125, 0.67144775390625, 0.7635498046875, 0.85565185546875, 0.94775390625, 1.03985595703125, 1.1319580078125, 1.22406005859375, 1.316162109375, 1.40826416015625, 1.5003662109375, 1.59246826171875, 1.6845703125, 1.77667236328125, 1.8687744140625, 1.96087646484375, 2.052978515625, 2.14508056640625, 2.2371826171875, 2.32928466796875, 2.42138671875, 2.51348876953125, 2.6055908203125, 2.69769287109375, 2.789794921875, 2.88189697265625, 2.9739990234375, 3.06610107421875, 3.158203125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 6.0, 5.0, 15.0, 24.0, 40.0, 48.0, 82.0, 122.0, 180.0, 230.0, 398.0, 586.0, 881.0, 1287.0, 1851.0, 2783.0, 4172.0, 6280.0, 9782.0, 14900.0, 22460.0, 34396.0, 54104.0, 96864.0, 233302.0, 279519.0, 113787.0, 60257.0, 37792.0, 24432.0, 16390.0, 10640.0, 7022.0, 4669.0, 3137.0, 1995.0, 1373.0, 890.0, 597.0, 400.0, 304.0, 176.0, 119.0, 78.0, 62.0, 42.0, 27.0, 17.0, 10.0, 11.0, 8.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.931640625, -2.84033203125, -2.7490234375, -2.65771484375, -2.56640625, -2.47509765625, -2.3837890625, -2.29248046875, -2.201171875, -2.10986328125, -2.0185546875, -1.92724609375, -1.8359375, -1.74462890625, -1.6533203125, -1.56201171875, -1.470703125, -1.37939453125, -1.2880859375, -1.19677734375, -1.10546875, -1.01416015625, -0.9228515625, -0.83154296875, -0.740234375, -0.64892578125, -0.5576171875, -0.46630859375, -0.375, -0.28369140625, -0.1923828125, -0.10107421875, -0.009765625, 0.08154296875, 0.1728515625, 0.26416015625, 0.35546875, 0.44677734375, 0.5380859375, 0.62939453125, 0.720703125, 0.81201171875, 0.9033203125, 0.99462890625, 1.0859375, 1.17724609375, 1.2685546875, 1.35986328125, 1.451171875, 1.54248046875, 1.6337890625, 1.72509765625, 1.81640625, 1.90771484375, 1.9990234375, 2.09033203125, 2.181640625, 2.27294921875, 2.3642578125, 2.45556640625, 2.546875, 2.63818359375, 2.7294921875, 2.82080078125, 2.912109375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 9.0, 10.0, 12.0, 22.0, 19.0, 22.0, 25.0, 18.0, 32.0, 36.0, 58.0, 37.0, 66.0, 64.0, 81.0, 166.0, 301.0, 1379.0, 171.0, 89.0, 65.0, 59.0, 40.0, 33.0, 26.0, 24.0, 27.0, 21.0, 18.0, 23.0, 17.0, 10.0, 8.0, 12.0, 8.0, 7.0, 2.0, 4.0, 6.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.75, -9.4639892578125, -9.177978515625, -8.8919677734375, -8.60595703125, -8.3199462890625, -8.033935546875, -7.7479248046875, -7.4619140625, -7.1759033203125, -6.889892578125, -6.6038818359375, -6.31787109375, -6.0318603515625, -5.745849609375, -5.4598388671875, -5.173828125, -4.8878173828125, -4.601806640625, -4.3157958984375, -4.02978515625, -3.7437744140625, -3.457763671875, -3.1717529296875, -2.8857421875, -2.5997314453125, -2.313720703125, -2.0277099609375, -1.74169921875, -1.4556884765625, -1.169677734375, -0.8836669921875, -0.59765625, -0.3116455078125, -0.025634765625, 0.2603759765625, 0.54638671875, 0.8323974609375, 1.118408203125, 1.4044189453125, 1.6904296875, 1.9764404296875, 2.262451171875, 2.5484619140625, 2.83447265625, 3.1204833984375, 3.406494140625, 3.6925048828125, 3.978515625, 4.2645263671875, 4.550537109375, 4.8365478515625, 5.12255859375, 5.4085693359375, 5.694580078125, 5.9805908203125, 6.2666015625, 6.5526123046875, 6.838623046875, 7.1246337890625, 7.41064453125, 7.6966552734375, 7.982666015625, 8.2686767578125, 8.5546875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 9.0, 8.0, 17.0, 19.0, 22.0, 31.0, 51.0, 52.0, 79.0, 80.0, 104.0, 174.0, 274.0, 606.0, 1743.0, 9028.0, 96521.0, 2714278.0, 298031.0, 19469.0, 3077.0, 916.0, 364.0, 213.0, 138.0, 99.0, 77.0, 54.0, 46.0, 32.0, 24.0, 12.0, 12.0, 7.0, 9.0, 4.0, 8.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.03125, -16.49365234375, -15.9560546875, -15.41845703125, -14.880859375, -14.34326171875, -13.8056640625, -13.26806640625, -12.73046875, -12.19287109375, -11.6552734375, -11.11767578125, -10.580078125, -10.04248046875, -9.5048828125, -8.96728515625, -8.4296875, -7.89208984375, -7.3544921875, -6.81689453125, -6.279296875, -5.74169921875, -5.2041015625, -4.66650390625, -4.12890625, -3.59130859375, -3.0537109375, -2.51611328125, -1.978515625, -1.44091796875, -0.9033203125, -0.36572265625, 0.171875, 0.70947265625, 1.2470703125, 1.78466796875, 2.322265625, 2.85986328125, 3.3974609375, 3.93505859375, 4.47265625, 5.01025390625, 5.5478515625, 6.08544921875, 6.623046875, 7.16064453125, 7.6982421875, 8.23583984375, 8.7734375, 9.31103515625, 9.8486328125, 10.38623046875, 10.923828125, 11.46142578125, 11.9990234375, 12.53662109375, 13.07421875, 13.61181640625, 14.1494140625, 14.68701171875, 15.224609375, 15.76220703125, 16.2998046875, 16.83740234375, 17.375]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 12.0, 157.0, 570.0, 255.0, 23.0, 1.0], "bins": [-258.2127685546875, -253.9541015625, -249.6954345703125, -245.436767578125, -241.1781005859375, -236.91943359375, -232.6607666015625, -228.40211486816406, -224.14344787597656, -219.88478088378906, -215.62611389160156, -211.36744689941406, -207.10877990722656, -202.85012817382812, -198.59146118164062, -194.33279418945312, -190.07412719726562, -185.81546020507812, -181.55679321289062, -177.29812622070312, -173.03945922851562, -168.78079223632812, -164.52212524414062, -160.2634735107422, -156.00479125976562, -151.74612426757812, -147.48745727539062, -143.22879028320312, -138.97012329101562, -134.71145629882812, -130.45278930664062, -126.19412994384766, -121.93548583984375, -117.67681884765625, -113.41815185546875, -109.15948486328125, -104.90082550048828, -100.64215850830078, -96.38349151611328, -92.12482452392578, -87.86615753173828, -83.60749053955078, -79.34882354736328, -75.09016418457031, -70.83149719238281, -66.57283020019531, -62.31416320800781, -58.05549621582031, -53.796836853027344, -49.538169860839844, -45.27950668334961, -41.02083969116211, -36.762176513671875, -32.503509521484375, -28.244842529296875, -23.986177444458008, -19.727510452270508, -15.46884536743164, -11.210179328918457, -6.951513290405273, -2.6928482055664062, 1.565816879272461, 5.824483871459961, 10.083148956298828, 14.341814041137695]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 6.0, 8.0, 11.0, 8.0, 11.0, 14.0, 14.0, 21.0, 26.0, 24.0, 24.0, 32.0, 30.0, 25.0, 31.0, 46.0, 40.0, 42.0, 37.0, 33.0, 45.0, 31.0, 44.0, 40.0, 48.0, 42.0, 27.0, 31.0, 33.0, 23.0, 23.0, 16.0, 17.0, 16.0, 9.0, 10.0, 5.0, 10.0, 6.0, 15.0, 12.0, 5.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.24087142944336, -23.45634651184082, -22.67181968688965, -21.88729476928711, -21.102767944335938, -20.3182430267334, -19.533716201782227, -18.749191284179688, -17.964664459228516, -17.180139541625977, -16.395612716674805, -15.61108684539795, -14.826560974121094, -14.042035102844238, -13.257509231567383, -12.472984313964844, -11.688458442687988, -10.903932571411133, -10.119406700134277, -9.334880828857422, -8.550354957580566, -7.765829086303711, -6.981303691864014, -6.196777820587158, -5.412251949310303, -4.627726078033447, -3.843200206756592, -3.0586745738983154, -2.27414870262146, -1.4896228313446045, -0.7050971984863281, 0.07942867279052734, 0.8639545440673828, 1.6484804153442383, 2.4330062866210938, 3.21753191947937, 4.002058029174805, 4.78658390045166, 5.571109294891357, 6.355635166168213, 7.140161037445068, 7.924686908721924, 8.709212303161621, 9.493738174438477, 10.278264045715332, 11.062789916992188, 11.847315788269043, 12.631841659545898, 13.416367530822754, 14.20089340209961, 14.985419273376465, 15.76994514465332, 16.55447006225586, 17.33899688720703, 18.12352180480957, 18.908048629760742, 19.69257354736328, 20.47709846496582, 21.261625289916992, 22.04615020751953, 22.830677032470703, 23.615201950073242, 24.399728775024414, 25.184253692626953, 25.968780517578125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 9.0, 9.0, 8.0, 11.0, 10.0, 18.0, 15.0, 22.0, 20.0, 22.0, 23.0, 34.0, 39.0, 38.0, 41.0, 40.0, 41.0, 57.0, 45.0, 58.0, 42.0, 49.0, 39.0, 42.0, 39.0, 34.0, 29.0, 35.0, 23.0, 23.0, 18.0, 15.0, 11.0, 8.0, 9.0, 5.0, 5.0, 6.0, 6.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.896484375, -2.799224853515625, -2.70196533203125, -2.604705810546875, -2.5074462890625, -2.410186767578125, -2.31292724609375, -2.215667724609375, -2.118408203125, -2.021148681640625, -1.92388916015625, -1.826629638671875, -1.7293701171875, -1.632110595703125, -1.53485107421875, -1.437591552734375, -1.34033203125, -1.243072509765625, -1.14581298828125, -1.048553466796875, -0.9512939453125, -0.854034423828125, -0.75677490234375, -0.659515380859375, -0.562255859375, -0.464996337890625, -0.36773681640625, -0.270477294921875, -0.1732177734375, -0.075958251953125, 0.02130126953125, 0.118560791015625, 0.2158203125, 0.313079833984375, 0.41033935546875, 0.507598876953125, 0.6048583984375, 0.702117919921875, 0.79937744140625, 0.896636962890625, 0.993896484375, 1.091156005859375, 1.18841552734375, 1.285675048828125, 1.3829345703125, 1.480194091796875, 1.57745361328125, 1.674713134765625, 1.77197265625, 1.869232177734375, 1.96649169921875, 2.063751220703125, 2.1610107421875, 2.258270263671875, 2.35552978515625, 2.452789306640625, 2.550048828125, 2.647308349609375, 2.74456787109375, 2.841827392578125, 2.9390869140625, 3.036346435546875, 3.13360595703125, 3.230865478515625, 3.328125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 4.0, 6.0, 9.0, 11.0, 8.0, 16.0, 16.0, 19.0, 19.0, 35.0, 42.0, 65.0, 103.0, 261.0, 514.0, 1240.0, 3506.0, 11812.0, 56103.0, 394842.0, 2666773.0, 922823.0, 107962.0, 19949.0, 5101.0, 1716.0, 632.0, 305.0, 128.0, 67.0, 41.0, 32.0, 15.0, 24.0, 18.0, 7.0, 10.0, 12.0, 5.0, 4.0, 2.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.90625, -8.6251220703125, -8.343994140625, -8.0628662109375, -7.78173828125, -7.5006103515625, -7.219482421875, -6.9383544921875, -6.6572265625, -6.3760986328125, -6.094970703125, -5.8138427734375, -5.53271484375, -5.2515869140625, -4.970458984375, -4.6893310546875, -4.408203125, -4.1270751953125, -3.845947265625, -3.5648193359375, -3.28369140625, -3.0025634765625, -2.721435546875, -2.4403076171875, -2.1591796875, -1.8780517578125, -1.596923828125, -1.3157958984375, -1.03466796875, -0.7535400390625, -0.472412109375, -0.1912841796875, 0.08984375, 0.3709716796875, 0.652099609375, 0.9332275390625, 1.21435546875, 1.4954833984375, 1.776611328125, 2.0577392578125, 2.3388671875, 2.6199951171875, 2.901123046875, 3.1822509765625, 3.46337890625, 3.7445068359375, 4.025634765625, 4.3067626953125, 4.587890625, 4.8690185546875, 5.150146484375, 5.4312744140625, 5.71240234375, 5.9935302734375, 6.274658203125, 6.5557861328125, 6.8369140625, 7.1180419921875, 7.399169921875, 7.6802978515625, 7.96142578125, 8.2425537109375, 8.523681640625, 8.8048095703125, 9.0859375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 6.0, 5.0, 8.0, 11.0, 9.0, 14.0, 33.0, 43.0, 36.0, 57.0, 81.0, 133.0, 150.0, 190.0, 271.0, 326.0, 393.0, 452.0, 417.0, 370.0, 264.0, 205.0, 140.0, 113.0, 104.0, 63.0, 56.0, 38.0, 28.0, 22.0, 13.0, 4.0, 9.0, 1.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.19140625, -6.99493408203125, -6.7984619140625, -6.60198974609375, -6.405517578125, -6.20904541015625, -6.0125732421875, -5.81610107421875, -5.61962890625, -5.42315673828125, -5.2266845703125, -5.03021240234375, -4.833740234375, -4.63726806640625, -4.4407958984375, -4.24432373046875, -4.0478515625, -3.85137939453125, -3.6549072265625, -3.45843505859375, -3.261962890625, -3.06549072265625, -2.8690185546875, -2.67254638671875, -2.47607421875, -2.27960205078125, -2.0831298828125, -1.88665771484375, -1.690185546875, -1.49371337890625, -1.2972412109375, -1.10076904296875, -0.904296875, -0.70782470703125, -0.5113525390625, -0.31488037109375, -0.118408203125, 0.07806396484375, 0.2745361328125, 0.47100830078125, 0.66748046875, 0.86395263671875, 1.0604248046875, 1.25689697265625, 1.453369140625, 1.64984130859375, 1.8463134765625, 2.04278564453125, 2.2392578125, 2.43572998046875, 2.6322021484375, 2.82867431640625, 3.025146484375, 3.22161865234375, 3.4180908203125, 3.61456298828125, 3.81103515625, 4.00750732421875, 4.2039794921875, 4.40045166015625, 4.596923828125, 4.79339599609375, 4.9898681640625, 5.18634033203125, 5.3828125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 1.0, 2.0, 9.0, 4.0, 8.0, 17.0, 26.0, 31.0, 49.0, 61.0, 99.0, 174.0, 201.0, 373.0, 598.0, 1315.0, 3396.0, 12396.0, 63373.0, 427525.0, 2492910.0, 1021449.0, 136982.0, 23687.0, 5677.0, 1854.0, 819.0, 416.0, 255.0, 180.0, 110.0, 81.0, 65.0, 42.0, 28.0, 22.0, 16.0, 4.0, 9.0, 6.0, 0.0, 5.0, 0.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.984375, -10.626708984375, -10.26904296875, -9.911376953125, -9.5537109375, -9.196044921875, -8.83837890625, -8.480712890625, -8.123046875, -7.765380859375, -7.40771484375, -7.050048828125, -6.6923828125, -6.334716796875, -5.97705078125, -5.619384765625, -5.26171875, -4.904052734375, -4.54638671875, -4.188720703125, -3.8310546875, -3.473388671875, -3.11572265625, -2.758056640625, -2.400390625, -2.042724609375, -1.68505859375, -1.327392578125, -0.9697265625, -0.612060546875, -0.25439453125, 0.103271484375, 0.4609375, 0.818603515625, 1.17626953125, 1.533935546875, 1.8916015625, 2.249267578125, 2.60693359375, 2.964599609375, 3.322265625, 3.679931640625, 4.03759765625, 4.395263671875, 4.7529296875, 5.110595703125, 5.46826171875, 5.825927734375, 6.18359375, 6.541259765625, 6.89892578125, 7.256591796875, 7.6142578125, 7.971923828125, 8.32958984375, 8.687255859375, 9.044921875, 9.402587890625, 9.76025390625, 10.117919921875, 10.4755859375, 10.833251953125, 11.19091796875, 11.548583984375, 11.90625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 7.0, 22.0, 65.0, 87.0, 147.0, 128.0, 177.0, 156.0, 107.0, 57.0, 32.0, 14.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.0333251953125, -16.081329345703125, -14.129332542419434, -12.177335739135742, -10.225339889526367, -8.273344039916992, -6.321347236633301, -4.369350433349609, -2.4173545837402344, -0.46535825729370117, 1.486638069152832, 3.4386343955993652, 5.390630722045898, 7.342626571655273, 9.294623374938965, 11.246620178222656, 13.198616027832031, 15.150611877441406, 17.10260772705078, 19.05460548400879, 21.006601333618164, 22.95859718322754, 24.910594940185547, 26.862590789794922, 28.814586639404297, 30.766582489013672, 32.71857833862305, 34.67057418823242, 36.62257385253906, 38.57456970214844, 40.52656555175781, 42.47856140136719, 44.43055725097656, 46.38255310058594, 48.33454895019531, 50.28654479980469, 52.23854064941406, 54.19053649902344, 56.14253616333008, 58.09453201293945, 60.04652786254883, 61.9985237121582, 63.95051956176758, 65.90251922607422, 67.8545150756836, 69.80651092529297, 71.75850677490234, 73.71050262451172, 75.6624984741211, 77.61449432373047, 79.56649017333984, 81.51848602294922, 83.4704818725586, 85.42247772216797, 87.37447357177734, 89.32647705078125, 91.27847290039062, 93.23046875, 95.18246459960938, 97.13446044921875, 99.08645629882812, 101.0384521484375, 102.99044799804688, 104.94244384765625, 106.89443969726562]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 4.0, 9.0, 7.0, 7.0, 8.0, 16.0, 14.0, 15.0, 18.0, 26.0, 20.0, 29.0, 45.0, 31.0, 32.0, 39.0, 37.0, 37.0, 33.0, 47.0, 43.0, 36.0, 44.0, 27.0, 39.0, 49.0, 30.0, 38.0, 29.0, 25.0, 30.0, 33.0, 24.0, 11.0, 11.0, 16.0, 11.0, 8.0, 3.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-19.985031127929688, -19.326824188232422, -18.668617248535156, -18.01041030883789, -17.352203369140625, -16.69399642944336, -16.035789489746094, -15.377582550048828, -14.719375610351562, -14.061168670654297, -13.402961730957031, -12.744754791259766, -12.0865478515625, -11.428340911865234, -10.770133972167969, -10.111927032470703, -9.453720092773438, -8.795513153076172, -8.137306213378906, -7.479099273681641, -6.820892333984375, -6.162685394287109, -5.504478454589844, -4.846271514892578, -4.1880645751953125, -3.529857635498047, -2.8716506958007812, -2.2134437561035156, -1.55523681640625, -0.8970298767089844, -0.23882293701171875, 0.4193840026855469, 1.0775909423828125, 1.7357978820800781, 2.3940048217773438, 3.0522117614746094, 3.710418701171875, 4.368625640869141, 5.026832580566406, 5.685039520263672, 6.3432464599609375, 7.001453399658203, 7.659660339355469, 8.317867279052734, 8.97607421875, 9.634281158447266, 10.292488098144531, 10.950695037841797, 11.608901977539062, 12.267108917236328, 12.925315856933594, 13.58352279663086, 14.241729736328125, 14.89993667602539, 15.558143615722656, 16.216350555419922, 16.874557495117188, 17.532764434814453, 18.19097137451172, 18.849178314208984, 19.50738525390625, 20.165592193603516, 20.82379913330078, 21.482006072998047, 22.140213012695312]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 10.0, 8.0, 8.0, 10.0, 16.0, 20.0, 27.0, 16.0, 38.0, 26.0, 32.0, 36.0, 44.0, 41.0, 53.0, 59.0, 42.0, 65.0, 49.0, 42.0, 52.0, 39.0, 43.0, 27.0, 31.0, 37.0, 21.0, 23.0, 11.0, 14.0, 12.0, 10.0, 9.0, 4.0, 4.0, 5.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.216796875, -3.112548828125, -3.00830078125, -2.904052734375, -2.7998046875, -2.695556640625, -2.59130859375, -2.487060546875, -2.3828125, -2.278564453125, -2.17431640625, -2.070068359375, -1.9658203125, -1.861572265625, -1.75732421875, -1.653076171875, -1.548828125, -1.444580078125, -1.34033203125, -1.236083984375, -1.1318359375, -1.027587890625, -0.92333984375, -0.819091796875, -0.71484375, -0.610595703125, -0.50634765625, -0.402099609375, -0.2978515625, -0.193603515625, -0.08935546875, 0.014892578125, 0.119140625, 0.223388671875, 0.32763671875, 0.431884765625, 0.5361328125, 0.640380859375, 0.74462890625, 0.848876953125, 0.953125, 1.057373046875, 1.16162109375, 1.265869140625, 1.3701171875, 1.474365234375, 1.57861328125, 1.682861328125, 1.787109375, 1.891357421875, 1.99560546875, 2.099853515625, 2.2041015625, 2.308349609375, 2.41259765625, 2.516845703125, 2.62109375, 2.725341796875, 2.82958984375, 2.933837890625, 3.0380859375, 3.142333984375, 3.24658203125, 3.350830078125, 3.455078125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 2.0, 7.0, 0.0, 7.0, 11.0, 19.0, 20.0, 46.0, 45.0, 90.0, 121.0, 143.0, 241.0, 336.0, 492.0, 746.0, 1103.0, 1721.0, 2499.0, 3735.0, 5557.0, 8775.0, 13359.0, 20868.0, 33870.0, 57767.0, 104752.0, 199423.0, 259957.0, 140813.0, 75652.0, 42901.0, 25968.0, 16217.0, 10659.0, 6845.0, 4568.0, 2971.0, 2072.0, 1374.0, 872.0, 642.0, 392.0, 295.0, 191.0, 137.0, 104.0, 60.0, 41.0, 24.0, 24.0, 5.0, 7.0, 8.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0], "bins": [-0.021240234375, -0.02058124542236328, -0.019922256469726562, -0.019263267517089844, -0.018604278564453125, -0.017945289611816406, -0.017286300659179688, -0.01662731170654297, -0.01596832275390625, -0.015309333801269531, -0.014650344848632812, -0.013991355895996094, -0.013332366943359375, -0.012673377990722656, -0.012014389038085938, -0.011355400085449219, -0.0106964111328125, -0.010037422180175781, -0.009378433227539062, -0.008719444274902344, -0.008060455322265625, -0.007401466369628906, -0.0067424774169921875, -0.006083488464355469, -0.00542449951171875, -0.004765510559082031, -0.0041065216064453125, -0.0034475326538085938, -0.002788543701171875, -0.0021295547485351562, -0.0014705657958984375, -0.0008115768432617188, -0.000152587890625, 0.0005064010620117188, 0.0011653900146484375, 0.0018243789672851562, 0.002483367919921875, 0.0031423568725585938, 0.0038013458251953125, 0.004460334777832031, 0.00511932373046875, 0.005778312683105469, 0.0064373016357421875, 0.007096290588378906, 0.007755279541015625, 0.008414268493652344, 0.009073257446289062, 0.009732246398925781, 0.0103912353515625, 0.011050224304199219, 0.011709213256835938, 0.012368202209472656, 0.013027191162109375, 0.013686180114746094, 0.014345169067382812, 0.015004158020019531, 0.01566314697265625, 0.01632213592529297, 0.016981124877929688, 0.017640113830566406, 0.018299102783203125, 0.018958091735839844, 0.019617080688476562, 0.02027606964111328, 0.02093505859375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 9.0, 6.0, 4.0, 9.0, 10.0, 9.0, 17.0, 15.0, 15.0, 25.0, 29.0, 27.0, 29.0, 33.0, 31.0, 33.0, 50.0, 41.0, 31.0, 48.0, 1071.0, 44.0, 40.0, 30.0, 47.0, 33.0, 25.0, 30.0, 34.0, 29.0, 19.0, 23.0, 15.0, 29.0, 15.0, 8.0, 13.0, 6.0, 8.0, 9.0, 5.0, 4.0, 3.0, 3.0, 3.0, 5.0, 3.0, 2.0], "bins": [-2.4921875, -2.4244384765625, -2.356689453125, -2.2889404296875, -2.22119140625, -2.1534423828125, -2.085693359375, -2.0179443359375, -1.9501953125, -1.8824462890625, -1.814697265625, -1.7469482421875, -1.67919921875, -1.6114501953125, -1.543701171875, -1.4759521484375, -1.408203125, -1.3404541015625, -1.272705078125, -1.2049560546875, -1.13720703125, -1.0694580078125, -1.001708984375, -0.9339599609375, -0.8662109375, -0.7984619140625, -0.730712890625, -0.6629638671875, -0.59521484375, -0.5274658203125, -0.459716796875, -0.3919677734375, -0.32421875, -0.2564697265625, -0.188720703125, -0.1209716796875, -0.05322265625, 0.0145263671875, 0.082275390625, 0.1500244140625, 0.2177734375, 0.2855224609375, 0.353271484375, 0.4210205078125, 0.48876953125, 0.5565185546875, 0.624267578125, 0.6920166015625, 0.759765625, 0.8275146484375, 0.895263671875, 0.9630126953125, 1.03076171875, 1.0985107421875, 1.166259765625, 1.2340087890625, 1.3017578125, 1.3695068359375, 1.437255859375, 1.5050048828125, 1.57275390625, 1.6405029296875, 1.708251953125, 1.7760009765625, 1.84375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 15.0, 12.0, 21.0, 49.0, 55.0, 90.0, 116.0, 186.0, 247.0, 362.0, 519.0, 779.0, 1127.0, 1775.0, 2491.0, 3778.0, 5599.0, 8373.0, 13209.0, 19944.0, 30753.0, 47714.0, 76385.0, 124732.0, 1247160.0, 190729.0, 117746.0, 71987.0, 45624.0, 29100.0, 19220.0, 12520.0, 8127.0, 5443.0, 3723.0, 2350.0, 1608.0, 1127.0, 717.0, 496.0, 338.0, 275.0, 159.0, 118.0, 57.0, 61.0, 44.0, 21.0, 25.0, 12.0, 5.0, 5.0, 2.0, 4.0, 3.0], "bins": [-0.0082550048828125, -0.008011817932128906, -0.0077686309814453125, -0.007525444030761719, -0.007282257080078125, -0.007039070129394531, -0.0067958831787109375, -0.006552696228027344, -0.00630950927734375, -0.006066322326660156, -0.0058231353759765625, -0.005579948425292969, -0.005336761474609375, -0.005093574523925781, -0.0048503875732421875, -0.004607200622558594, -0.004364013671875, -0.004120826721191406, -0.0038776397705078125, -0.0036344528198242188, -0.003391265869140625, -0.0031480789184570312, -0.0029048919677734375, -0.0026617050170898438, -0.00241851806640625, -0.0021753311157226562, -0.0019321441650390625, -0.0016889572143554688, -0.001445770263671875, -0.0012025833129882812, -0.0009593963623046875, -0.0007162094116210938, -0.0004730224609375, -0.00022983551025390625, 1.33514404296875e-05, 0.00025653839111328125, 0.000499725341796875, 0.0007429122924804688, 0.0009860992431640625, 0.0012292861938476562, 0.00147247314453125, 0.0017156600952148438, 0.0019588470458984375, 0.0022020339965820312, 0.002445220947265625, 0.0026884078979492188, 0.0029315948486328125, 0.0031747817993164062, 0.00341796875, 0.0036611557006835938, 0.0039043426513671875, 0.004147529602050781, 0.004390716552734375, 0.004633903503417969, 0.0048770904541015625, 0.005120277404785156, 0.00536346435546875, 0.005606651306152344, 0.0058498382568359375, 0.006093025207519531, 0.006336212158203125, 0.006579399108886719, 0.0068225860595703125, 0.007065773010253906, 0.0073089599609375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 6.0, 0.0, 0.0, 6.0, 0.0, 6.0, 0.0, 9.0, 0.0, 0.0, 8.0, 0.0, 12.0, 0.0, 18.0, 0.0, 0.0, 19.0, 0.0, 29.0, 0.0, 0.0, 29.0, 0.0, 76.0, 0.0, 135.0, 0.0, 0.0, 309.0, 0.0, 161.0, 0.0, 78.0, 0.0, 0.0, 36.0, 0.0, 12.0, 0.0, 0.0, 16.0, 0.0, 14.0, 0.0, 10.0, 0.0, 0.0, 9.0, 0.0, 12.0, 0.0, 7.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.344650268554688e-07, -8.093193173408508e-07, -7.841736078262329e-07, -7.59027898311615e-07, -7.338821887969971e-07, -7.087364792823792e-07, -6.835907697677612e-07, -6.584450602531433e-07, -6.332993507385254e-07, -6.081536412239075e-07, -5.830079317092896e-07, -5.578622221946716e-07, -5.327165126800537e-07, -5.075708031654358e-07, -4.824250936508179e-07, -4.5727938413619995e-07, -4.3213367462158203e-07, -4.069879651069641e-07, -3.818422555923462e-07, -3.5669654607772827e-07, -3.3155083656311035e-07, -3.0640512704849243e-07, -2.812594175338745e-07, -2.561137080192566e-07, -2.3096799850463867e-07, -2.0582228899002075e-07, -1.8067657947540283e-07, -1.555308699607849e-07, -1.30385160446167e-07, -1.0523945093154907e-07, -8.009374141693115e-08, -5.494803190231323e-08, -2.9802322387695312e-08, -4.6566128730773926e-09, 2.0489096641540527e-08, 4.563480615615845e-08, 7.078051567077637e-08, 9.592622518539429e-08, 1.210719347000122e-07, 1.4621764421463013e-07, 1.7136335372924805e-07, 1.9650906324386597e-07, 2.2165477275848389e-07, 2.468004822731018e-07, 2.7194619178771973e-07, 2.9709190130233765e-07, 3.2223761081695557e-07, 3.473833203315735e-07, 3.725290298461914e-07, 3.976747393608093e-07, 4.2282044887542725e-07, 4.4796615839004517e-07, 4.731118679046631e-07, 4.98257577419281e-07, 5.234032869338989e-07, 5.485489964485168e-07, 5.736947059631348e-07, 5.988404154777527e-07, 6.239861249923706e-07, 6.491318345069885e-07, 6.742775440216064e-07, 6.994232535362244e-07, 7.245689630508423e-07, 7.497146725654602e-07, 7.748603820800781e-07]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 6.0, 2.0, 5.0, 3.0, 4.0, 2.0, 9.0, 6.0, 6.0, 6.0, 8.0, 11.0, 18.0, 17.0, 26.0, 40.0, 68.0, 118.0, 168.0, 329.0, 1606.0, 67539.0, 934463.0, 41656.0, 1625.0, 299.0, 165.0, 94.0, 50.0, 42.0, 31.0, 23.0, 16.0, 5.0, 19.0, 6.0, 12.0, 3.0, 5.0, 6.0, 7.0, 2.0, 7.0, 3.0, 1.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0], "bins": [-1.5556812286376953e-05, -1.5062279999256134e-05, -1.4567747712135315e-05, -1.4073215425014496e-05, -1.3578683137893677e-05, -1.3084150850772858e-05, -1.2589618563652039e-05, -1.209508627653122e-05, -1.16005539894104e-05, -1.1106021702289581e-05, -1.0611489415168762e-05, -1.0116957128047943e-05, -9.622424840927124e-06, -9.127892553806305e-06, -8.633360266685486e-06, -8.138827979564667e-06, -7.644295692443848e-06, -7.1497634053230286e-06, -6.6552311182022095e-06, -6.16069883108139e-06, -5.666166543960571e-06, -5.171634256839752e-06, -4.677101969718933e-06, -4.182569682598114e-06, -3.688037395477295e-06, -3.193505108356476e-06, -2.6989728212356567e-06, -2.2044405341148376e-06, -1.7099082469940186e-06, -1.2153759598731995e-06, -7.208436727523804e-07, -2.2631138563156128e-07, 2.682209014892578e-07, 7.627531886100769e-07, 1.257285475730896e-06, 1.751817762851715e-06, 2.246350049972534e-06, 2.7408823370933533e-06, 3.2354146242141724e-06, 3.7299469113349915e-06, 4.2244791984558105e-06, 4.71901148557663e-06, 5.213543772697449e-06, 5.708076059818268e-06, 6.202608346939087e-06, 6.697140634059906e-06, 7.191672921180725e-06, 7.686205208301544e-06, 8.180737495422363e-06, 8.675269782543182e-06, 9.169802069664001e-06, 9.66433435678482e-06, 1.015886664390564e-05, 1.0653398931026459e-05, 1.1147931218147278e-05, 1.1642463505268097e-05, 1.2136995792388916e-05, 1.2631528079509735e-05, 1.3126060366630554e-05, 1.3620592653751373e-05, 1.4115124940872192e-05, 1.4609657227993011e-05, 1.510418951511383e-05, 1.559872180223465e-05, 1.609325408935547e-05]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 14.0, 557.0, 436.0, 15.0], "bins": [-1.4749783076695167e-05, -1.4511805602523964e-05, -1.4273829037847463e-05, -1.403585156367626e-05, -1.379787499899976e-05, -1.3559897524828557e-05, -1.3321920050657354e-05, -1.3083943485980853e-05, -1.284596601180965e-05, -1.2607988537638448e-05, -1.2370011972961947e-05, -1.2132034498790745e-05, -1.1894057024619542e-05, -1.1656080459943041e-05, -1.1418102985771839e-05, -1.1180126421095338e-05, -1.0942148946924135e-05, -1.0704171472752932e-05, -1.0466194908076432e-05, -1.0228217433905229e-05, -9.990240869228728e-06, -9.752263395057525e-06, -9.514285920886323e-06, -9.276309356209822e-06, -9.03833188203862e-06, -8.800354407867417e-06, -8.562377843190916e-06, -8.324400369019713e-06, -8.08642289484851e-06, -7.84844633017201e-06, -7.610468856000807e-06, -7.372491836576955e-06, -7.1345152719004545e-06, -6.896538252476603e-06, -6.6585607783054e-06, -6.420583758881548e-06, -6.182606739457697e-06, -5.944629720033845e-06, -5.706652700609993e-06, -5.4686752264387906e-06, -5.230698207014939e-06, -4.992721187591087e-06, -4.7547437134198844e-06, -4.516766693996033e-06, -4.278789674572181e-06, -4.040812655148329e-06, -3.802835408350802e-06, -3.564858161553275e-06, -3.326881142129423e-06, -3.0889041227055714e-06, -2.850926875908044e-06, -2.612949629110517e-06, -2.3749726096866652e-06, -2.1369955902628135e-06, -1.8990183434652863e-06, -1.6610412103545968e-06, -1.4230640772439074e-06, -1.185086944133218e-06, -9.471098110225284e-07, -7.09132677911839e-07, -4.711555448011495e-07, -2.3317841169046005e-07, 4.798721420229413e-09, 2.427758545309189e-07, 4.807529876416083e-07]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 4.0, 0.0, 0.0, 14.0, 0.0, 0.0, 49.0, 0.0, 0.0, 114.0, 0.0, 0.0, 197.0, 0.0, 0.0, 255.0, 0.0, 0.0, 212.0, 0.0, 105.0, 0.0, 0.0, 42.0, 0.0, 0.0, 15.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539062e-07, -5.755573511123657e-07, -5.550682544708252e-07, -5.345791578292847e-07, -5.140900611877441e-07, -4.936009645462036e-07, -4.731118679046631e-07, -4.5262277126312256e-07, -4.3213367462158203e-07, -4.116445779800415e-07, -3.91155481338501e-07, -3.7066638469696045e-07, -3.501772880554199e-07, -3.296881914138794e-07, -3.0919909477233887e-07, -2.8870999813079834e-07, -2.682209014892578e-07, -2.477318048477173e-07, -2.2724270820617676e-07, -2.0675361156463623e-07, -1.862645149230957e-07, -1.6577541828155518e-07, -1.4528632164001465e-07, -1.2479722499847412e-07, -1.043081283569336e-07, -8.381903171539307e-08, -6.332993507385254e-08, -4.284083843231201e-08, -2.2351741790771484e-08, -1.862645149230957e-09, 1.862645149230957e-08, 3.91155481338501e-08, 5.960464477539063e-08, 8.009374141693115e-08, 1.0058283805847168e-07, 1.210719347000122e-07, 1.4156103134155273e-07, 1.6205012798309326e-07, 1.825392246246338e-07, 2.0302832126617432e-07, 2.2351741790771484e-07, 2.4400651454925537e-07, 2.644956111907959e-07, 2.849847078323364e-07, 3.0547380447387695e-07, 3.259629011154175e-07, 3.46451997756958e-07, 3.6694109439849854e-07, 3.8743019104003906e-07, 4.079192876815796e-07, 4.284083843231201e-07, 4.4889748096466064e-07, 4.6938657760620117e-07, 4.898756742477417e-07, 5.103647708892822e-07, 5.308538675308228e-07, 5.513429641723633e-07, 5.718320608139038e-07, 5.923211574554443e-07, 6.128102540969849e-07, 6.332993507385254e-07, 6.537884473800659e-07, 6.742775440216064e-07, 6.94766640663147e-07, 7.152557373046875e-07]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 10.0, 8.0, 8.0, 10.0, 16.0, 20.0, 27.0, 16.0, 38.0, 26.0, 32.0, 36.0, 44.0, 41.0, 53.0, 59.0, 42.0, 65.0, 49.0, 42.0, 52.0, 39.0, 43.0, 27.0, 31.0, 37.0, 21.0, 23.0, 11.0, 14.0, 12.0, 10.0, 9.0, 4.0, 4.0, 5.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.216796875, -3.112548828125, -3.00830078125, -2.904052734375, -2.7998046875, -2.695556640625, -2.59130859375, -2.487060546875, -2.3828125, -2.278564453125, -2.17431640625, -2.070068359375, -1.9658203125, -1.861572265625, -1.75732421875, -1.653076171875, -1.548828125, -1.444580078125, -1.34033203125, -1.236083984375, -1.1318359375, -1.027587890625, -0.92333984375, -0.819091796875, -0.71484375, -0.610595703125, -0.50634765625, -0.402099609375, -0.2978515625, -0.193603515625, -0.08935546875, 0.014892578125, 0.119140625, 0.223388671875, 0.32763671875, 0.431884765625, 0.5361328125, 0.640380859375, 0.74462890625, 0.848876953125, 0.953125, 1.057373046875, 1.16162109375, 1.265869140625, 1.3701171875, 1.474365234375, 1.57861328125, 1.682861328125, 1.787109375, 1.891357421875, 1.99560546875, 2.099853515625, 2.2041015625, 2.308349609375, 2.41259765625, 2.516845703125, 2.62109375, 2.725341796875, 2.82958984375, 2.933837890625, 3.0380859375, 3.142333984375, 3.24658203125, 3.350830078125, 3.455078125]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 13.0, 13.0, 28.0, 25.0, 52.0, 84.0, 132.0, 220.0, 328.0, 590.0, 938.0, 1537.0, 2369.0, 3801.0, 6246.0, 10002.0, 16018.0, 25299.0, 40877.0, 69737.0, 144521.0, 347585.0, 177670.0, 79820.0, 45388.0, 27950.0, 17751.0, 11412.0, 6861.0, 4333.0, 2736.0, 1597.0, 1006.0, 596.0, 405.0, 220.0, 137.0, 87.0, 69.0, 36.0, 28.0, 19.0, 9.0, 6.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.08984375, -2.992095947265625, -2.89434814453125, -2.796600341796875, -2.6988525390625, -2.601104736328125, -2.50335693359375, -2.405609130859375, -2.307861328125, -2.210113525390625, -2.11236572265625, -2.014617919921875, -1.9168701171875, -1.819122314453125, -1.72137451171875, -1.623626708984375, -1.52587890625, -1.428131103515625, -1.33038330078125, -1.232635498046875, -1.1348876953125, -1.037139892578125, -0.93939208984375, -0.841644287109375, -0.743896484375, -0.646148681640625, -0.54840087890625, -0.450653076171875, -0.3529052734375, -0.255157470703125, -0.15740966796875, -0.059661865234375, 0.0380859375, 0.135833740234375, 0.23358154296875, 0.331329345703125, 0.4290771484375, 0.526824951171875, 0.62457275390625, 0.722320556640625, 0.820068359375, 0.917816162109375, 1.01556396484375, 1.113311767578125, 1.2110595703125, 1.308807373046875, 1.40655517578125, 1.504302978515625, 1.60205078125, 1.699798583984375, 1.79754638671875, 1.895294189453125, 1.9930419921875, 2.090789794921875, 2.18853759765625, 2.286285400390625, 2.384033203125, 2.481781005859375, 2.57952880859375, 2.677276611328125, 2.7750244140625, 2.872772216796875, 2.97052001953125, 3.068267822265625, 3.166015625]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 1.0, 7.0, 6.0, 15.0, 8.0, 14.0, 13.0, 23.0, 19.0, 18.0, 29.0, 29.0, 25.0, 39.0, 27.0, 68.0, 63.0, 93.0, 174.0, 1559.0, 248.0, 137.0, 56.0, 56.0, 39.0, 38.0, 33.0, 40.0, 28.0, 25.0, 16.0, 26.0, 14.0, 16.0, 14.0, 10.0, 5.0, 6.0, 3.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.015625, -9.69970703125, -9.3837890625, -9.06787109375, -8.751953125, -8.43603515625, -8.1201171875, -7.80419921875, -7.48828125, -7.17236328125, -6.8564453125, -6.54052734375, -6.224609375, -5.90869140625, -5.5927734375, -5.27685546875, -4.9609375, -4.64501953125, -4.3291015625, -4.01318359375, -3.697265625, -3.38134765625, -3.0654296875, -2.74951171875, -2.43359375, -2.11767578125, -1.8017578125, -1.48583984375, -1.169921875, -0.85400390625, -0.5380859375, -0.22216796875, 0.09375, 0.40966796875, 0.7255859375, 1.04150390625, 1.357421875, 1.67333984375, 1.9892578125, 2.30517578125, 2.62109375, 2.93701171875, 3.2529296875, 3.56884765625, 3.884765625, 4.20068359375, 4.5166015625, 4.83251953125, 5.1484375, 5.46435546875, 5.7802734375, 6.09619140625, 6.412109375, 6.72802734375, 7.0439453125, 7.35986328125, 7.67578125, 7.99169921875, 8.3076171875, 8.62353515625, 8.939453125, 9.25537109375, 9.5712890625, 9.88720703125, 10.203125]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 11.0, 15.0, 9.0, 26.0, 17.0, 28.0, 31.0, 48.0, 43.0, 83.0, 109.0, 112.0, 173.0, 236.0, 526.0, 2041.0, 20179.0, 549162.0, 2519264.0, 47947.0, 3792.0, 752.0, 323.0, 186.0, 114.0, 102.0, 86.0, 68.0, 35.0, 34.0, 25.0, 25.0, 23.0, 13.0, 12.0, 14.0, 9.0, 7.0, 5.0, 1.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-17.71875, -17.167724609375, -16.61669921875, -16.065673828125, -15.5146484375, -14.963623046875, -14.41259765625, -13.861572265625, -13.310546875, -12.759521484375, -12.20849609375, -11.657470703125, -11.1064453125, -10.555419921875, -10.00439453125, -9.453369140625, -8.90234375, -8.351318359375, -7.80029296875, -7.249267578125, -6.6982421875, -6.147216796875, -5.59619140625, -5.045166015625, -4.494140625, -3.943115234375, -3.39208984375, -2.841064453125, -2.2900390625, -1.739013671875, -1.18798828125, -0.636962890625, -0.0859375, 0.465087890625, 1.01611328125, 1.567138671875, 2.1181640625, 2.669189453125, 3.22021484375, 3.771240234375, 4.322265625, 4.873291015625, 5.42431640625, 5.975341796875, 6.5263671875, 7.077392578125, 7.62841796875, 8.179443359375, 8.73046875, 9.281494140625, 9.83251953125, 10.383544921875, 10.9345703125, 11.485595703125, 12.03662109375, 12.587646484375, 13.138671875, 13.689697265625, 14.24072265625, 14.791748046875, 15.3427734375, 15.893798828125, 16.44482421875, 16.995849609375, 17.546875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 7.0, 5.0, 7.0, 11.0, 15.0, 15.0, 29.0, 39.0, 36.0, 47.0, 44.0, 60.0, 64.0, 69.0, 73.0, 54.0, 50.0, 52.0, 60.0, 45.0, 46.0, 33.0, 35.0, 30.0, 18.0, 18.0, 7.0, 13.0, 8.0, 7.0, 3.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.862521171569824, -13.496307373046875, -13.13009262084961, -12.76387882232666, -12.397665023803711, -12.031450271606445, -11.665236473083496, -11.299022674560547, -10.932807922363281, -10.566594123840332, -10.200379371643066, -9.834165573120117, -9.467950820922852, -9.101737022399902, -8.735523223876953, -8.369308471679688, -8.003094673156738, -7.636880397796631, -7.270666122436523, -6.904452323913574, -6.538238048553467, -6.172023773193359, -5.80580997467041, -5.439595699310303, -5.073381423950195, -4.707167148590088, -4.3409528732299805, -3.9747390747070312, -3.608524799346924, -3.2423105239868164, -2.876096487045288, -2.5098824501037598, -2.143667221069336, -1.777453064918518, -1.4112389087677002, -1.0450247526168823, -0.6788105964660645, -0.3125964403152466, 0.05361771583557129, 0.4198317527770996, 0.786046028137207, 1.152260184288025, 1.5184743404388428, 1.8846884965896606, 2.2509026527404785, 2.617116928100586, 2.9833309650421143, 3.3495450019836426, 3.71575927734375, 4.081973552703857, 4.448187828063965, 4.814401626586914, 5.1806159019470215, 5.546830177307129, 5.913043975830078, 6.2792582511901855, 6.645472526550293, 7.0116868019104, 7.377901077270508, 7.744114875793457, 8.110328674316406, 8.476543426513672, 8.842757225036621, 9.20897102355957, 9.575185775756836]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 3.0, 11.0, 12.0, 8.0, 14.0, 21.0, 20.0, 25.0, 21.0, 31.0, 28.0, 35.0, 34.0, 38.0, 38.0, 35.0, 51.0, 43.0, 49.0, 48.0, 32.0, 42.0, 39.0, 40.0, 34.0, 37.0, 16.0, 33.0, 20.0, 23.0, 19.0, 9.0, 17.0, 11.0, 11.0, 13.0, 6.0, 5.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-30.117591857910156, -29.18962287902832, -28.261655807495117, -27.33368682861328, -26.405719757080078, -25.477750778198242, -24.549781799316406, -23.621814727783203, -22.69384765625, -21.765878677368164, -20.83791160583496, -19.909942626953125, -18.981975555419922, -18.054006576538086, -17.12603759765625, -16.198070526123047, -15.270101547241211, -14.342133522033691, -13.414165496826172, -12.486196517944336, -11.558229446411133, -10.630260467529297, -9.702292442321777, -8.774324417114258, -7.846356391906738, -6.918388366699219, -5.990420341491699, -5.0624518394470215, -4.134483814239502, -3.2065157890319824, -2.2785472869873047, -1.3505792617797852, -0.42261314392089844, 0.5053550004959106, 1.4333231449127197, 2.3612914085388184, 3.289259433746338, 4.217227458953857, 5.145195960998535, 6.073163986206055, 7.001132011413574, 7.929100036621094, 8.857068061828613, 9.785036087036133, 10.713005065917969, 11.640972137451172, 12.568941116333008, 13.496909141540527, 14.424877166748047, 15.352845191955566, 16.280813217163086, 17.208782196044922, 18.136749267578125, 19.06471824645996, 19.992687225341797, 20.920654296875, 21.848621368408203, 22.77659034729004, 23.704557418823242, 24.632526397705078, 25.56049346923828, 26.488462448120117, 27.416431427001953, 28.344398498535156, 29.272367477416992]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 6.0, 5.0, 7.0, 18.0, 14.0, 23.0, 13.0, 24.0, 24.0, 28.0, 37.0, 32.0, 43.0, 39.0, 39.0, 54.0, 59.0, 52.0, 54.0, 53.0, 55.0, 33.0, 40.0, 35.0, 37.0, 34.0, 28.0, 20.0, 18.0, 15.0, 12.0, 10.0, 10.0, 5.0, 6.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.185546875, -3.077178955078125, -2.96881103515625, -2.860443115234375, -2.7520751953125, -2.643707275390625, -2.53533935546875, -2.426971435546875, -2.318603515625, -2.210235595703125, -2.10186767578125, -1.993499755859375, -1.8851318359375, -1.776763916015625, -1.66839599609375, -1.560028076171875, -1.45166015625, -1.343292236328125, -1.23492431640625, -1.126556396484375, -1.0181884765625, -0.909820556640625, -0.80145263671875, -0.693084716796875, -0.584716796875, -0.476348876953125, -0.36798095703125, -0.259613037109375, -0.1512451171875, -0.042877197265625, 0.06549072265625, 0.173858642578125, 0.2822265625, 0.390594482421875, 0.49896240234375, 0.607330322265625, 0.7156982421875, 0.824066162109375, 0.93243408203125, 1.040802001953125, 1.149169921875, 1.257537841796875, 1.36590576171875, 1.474273681640625, 1.5826416015625, 1.691009521484375, 1.79937744140625, 1.907745361328125, 2.01611328125, 2.124481201171875, 2.23284912109375, 2.341217041015625, 2.4495849609375, 2.557952880859375, 2.66632080078125, 2.774688720703125, 2.883056640625, 2.991424560546875, 3.09979248046875, 3.208160400390625, 3.3165283203125, 3.424896240234375, 3.53326416015625, 3.641632080078125, 3.75]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 4.0, 4.0, 10.0, 14.0, 19.0, 24.0, 43.0, 47.0, 70.0, 87.0, 138.0, 218.0, 371.0, 609.0, 1343.0, 3279.0, 9382.0, 31020.0, 137409.0, 868842.0, 2413792.0, 590936.0, 100293.0, 23660.0, 7342.0, 2709.0, 1211.0, 501.0, 316.0, 194.0, 119.0, 73.0, 53.0, 41.0, 22.0, 24.0, 13.0, 11.0, 5.0, 9.0, 3.0, 4.0, 3.0, 7.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.58203125, -7.3480224609375, -7.114013671875, -6.8800048828125, -6.64599609375, -6.4119873046875, -6.177978515625, -5.9439697265625, -5.7099609375, -5.4759521484375, -5.241943359375, -5.0079345703125, -4.77392578125, -4.5399169921875, -4.305908203125, -4.0718994140625, -3.837890625, -3.6038818359375, -3.369873046875, -3.1358642578125, -2.90185546875, -2.6678466796875, -2.433837890625, -2.1998291015625, -1.9658203125, -1.7318115234375, -1.497802734375, -1.2637939453125, -1.02978515625, -0.7957763671875, -0.561767578125, -0.3277587890625, -0.09375, 0.1402587890625, 0.374267578125, 0.6082763671875, 0.84228515625, 1.0762939453125, 1.310302734375, 1.5443115234375, 1.7783203125, 2.0123291015625, 2.246337890625, 2.4803466796875, 2.71435546875, 2.9483642578125, 3.182373046875, 3.4163818359375, 3.650390625, 3.8843994140625, 4.118408203125, 4.3524169921875, 4.58642578125, 4.8204345703125, 5.054443359375, 5.2884521484375, 5.5224609375, 5.7564697265625, 5.990478515625, 6.2244873046875, 6.45849609375, 6.6925048828125, 6.926513671875, 7.1605224609375, 7.39453125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 8.0, 5.0, 14.0, 8.0, 21.0, 27.0, 39.0, 73.0, 82.0, 113.0, 175.0, 235.0, 345.0, 403.0, 528.0, 488.0, 385.0, 313.0, 253.0, 176.0, 123.0, 77.0, 50.0, 46.0, 34.0, 21.0, 18.0, 6.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.078125, -8.84515380859375, -8.6121826171875, -8.37921142578125, -8.146240234375, -7.91326904296875, -7.6802978515625, -7.44732666015625, -7.21435546875, -6.98138427734375, -6.7484130859375, -6.51544189453125, -6.282470703125, -6.04949951171875, -5.8165283203125, -5.58355712890625, -5.3505859375, -5.11761474609375, -4.8846435546875, -4.65167236328125, -4.418701171875, -4.18572998046875, -3.9527587890625, -3.71978759765625, -3.48681640625, -3.25384521484375, -3.0208740234375, -2.78790283203125, -2.554931640625, -2.32196044921875, -2.0889892578125, -1.85601806640625, -1.623046875, -1.39007568359375, -1.1571044921875, -0.92413330078125, -0.691162109375, -0.45819091796875, -0.2252197265625, 0.00775146484375, 0.24072265625, 0.47369384765625, 0.7066650390625, 0.93963623046875, 1.172607421875, 1.40557861328125, 1.6385498046875, 1.87152099609375, 2.1044921875, 2.33746337890625, 2.5704345703125, 2.80340576171875, 3.036376953125, 3.26934814453125, 3.5023193359375, 3.73529052734375, 3.96826171875, 4.20123291015625, 4.4342041015625, 4.66717529296875, 4.900146484375, 5.13311767578125, 5.3660888671875, 5.59906005859375, 5.83203125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 3.0, 13.0, 14.0, 18.0, 22.0, 37.0, 42.0, 60.0, 104.0, 119.0, 244.0, 361.0, 753.0, 1935.0, 14287.0, 275164.0, 3401121.0, 474061.0, 21415.0, 2619.0, 754.0, 379.0, 232.0, 150.0, 106.0, 83.0, 57.0, 34.0, 25.0, 15.0, 10.0, 10.0, 10.0, 6.0, 8.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8671875, -14.2623291015625, -13.657470703125, -13.0526123046875, -12.44775390625, -11.8428955078125, -11.238037109375, -10.6331787109375, -10.0283203125, -9.4234619140625, -8.818603515625, -8.2137451171875, -7.60888671875, -7.0040283203125, -6.399169921875, -5.7943115234375, -5.189453125, -4.5845947265625, -3.979736328125, -3.3748779296875, -2.77001953125, -2.1651611328125, -1.560302734375, -0.9554443359375, -0.3505859375, 0.2542724609375, 0.859130859375, 1.4639892578125, 2.06884765625, 2.6737060546875, 3.278564453125, 3.8834228515625, 4.48828125, 5.0931396484375, 5.697998046875, 6.3028564453125, 6.90771484375, 7.5125732421875, 8.117431640625, 8.7222900390625, 9.3271484375, 9.9320068359375, 10.536865234375, 11.1417236328125, 11.74658203125, 12.3514404296875, 12.956298828125, 13.5611572265625, 14.166015625, 14.7708740234375, 15.375732421875, 15.9805908203125, 16.58544921875, 17.1903076171875, 17.795166015625, 18.4000244140625, 19.0048828125, 19.6097412109375, 20.214599609375, 20.8194580078125, 21.42431640625, 22.0291748046875, 22.634033203125, 23.2388916015625, 23.84375]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 13.0, 14.0, 28.0, 41.0, 60.0, 71.0, 85.0, 96.0, 98.0, 114.0, 101.0, 74.0, 67.0, 43.0, 35.0, 24.0, 16.0, 13.0, 10.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.36457633972168, -21.12825584411621, -19.891935348510742, -18.655614852905273, -17.419294357299805, -16.182973861694336, -14.946653366088867, -13.710332870483398, -12.47401237487793, -11.237691879272461, -10.001371383666992, -8.765050888061523, -7.528730392456055, -6.292409896850586, -5.056089401245117, -3.8197689056396484, -2.5834484100341797, -1.347127914428711, -0.11080741882324219, 1.1255130767822266, 2.3618335723876953, 3.598154067993164, 4.834474563598633, 6.070795059204102, 7.30711555480957, 8.543436050415039, 9.779756546020508, 11.016077041625977, 12.252397537231445, 13.488718032836914, 14.725038528442383, 15.961359024047852, 17.197681427001953, 18.434001922607422, 19.67032241821289, 20.90664291381836, 22.142963409423828, 23.379283905029297, 24.615604400634766, 25.851924896240234, 27.088245391845703, 28.324565887451172, 29.56088638305664, 30.79720687866211, 32.03352737426758, 33.26984786987305, 34.506168365478516, 35.742488861083984, 36.97880935668945, 38.21512985229492, 39.45145034790039, 40.68777084350586, 41.92409133911133, 43.1604118347168, 44.396732330322266, 45.633052825927734, 46.8693733215332, 48.10569381713867, 49.34201431274414, 50.57833480834961, 51.81465530395508, 53.05097579956055, 54.287296295166016, 55.523616790771484, 56.75993728637695]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 4.0, 5.0, 2.0, 10.0, 11.0, 10.0, 17.0, 17.0, 18.0, 20.0, 23.0, 25.0, 25.0, 35.0, 35.0, 38.0, 44.0, 42.0, 38.0, 32.0, 42.0, 41.0, 34.0, 40.0, 37.0, 33.0, 41.0, 33.0, 31.0, 20.0, 24.0, 33.0, 26.0, 17.0, 14.0, 15.0, 15.0, 22.0, 9.0, 6.0, 9.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.292266845703125, -19.617502212524414, -18.942737579345703, -18.267972946166992, -17.59320831298828, -16.918445587158203, -16.243680953979492, -15.568916320800781, -14.89415168762207, -14.21938705444336, -13.544622421264648, -12.869858741760254, -12.195094108581543, -11.520329475402832, -10.845565795898438, -10.170801162719727, -9.496036529541016, -8.821271896362305, -8.146507263183594, -7.471743583679199, -6.796978950500488, -6.122214317321777, -5.447450160980225, -4.772686004638672, -4.097921371459961, -3.423156976699829, -2.7483925819396973, -2.0736281871795654, -1.3988637924194336, -0.7240993976593018, -0.04933500289916992, 0.6254291534423828, 1.3001937866210938, 1.9749581813812256, 2.6497225761413574, 3.3244869709014893, 3.999251365661621, 4.674015998840332, 5.348780155181885, 6.0235443115234375, 6.698308944702148, 7.373073577880859, 8.04783821105957, 8.722601890563965, 9.397366523742676, 10.072131156921387, 10.746894836425781, 11.421659469604492, 12.096424102783203, 12.771188735961914, 13.445953369140625, 14.12071704864502, 14.79548168182373, 15.470246315002441, 16.145009994506836, 16.819774627685547, 17.494539260864258, 18.16930389404297, 18.84406852722168, 19.51883316040039, 20.19359588623047, 20.86836051940918, 21.54312515258789, 22.2178897857666, 22.892654418945312]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 8.0, 9.0, 17.0, 17.0, 13.0, 25.0, 18.0, 23.0, 22.0, 35.0, 33.0, 35.0, 49.0, 46.0, 43.0, 55.0, 54.0, 53.0, 53.0, 49.0, 40.0, 40.0, 42.0, 30.0, 36.0, 30.0, 21.0, 21.0, 17.0, 12.0, 16.0, 10.0, 6.0, 5.0, 3.0, 2.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.99609375, -2.88812255859375, -2.7801513671875, -2.67218017578125, -2.564208984375, -2.45623779296875, -2.3482666015625, -2.24029541015625, -2.13232421875, -2.02435302734375, -1.9163818359375, -1.80841064453125, -1.700439453125, -1.59246826171875, -1.4844970703125, -1.37652587890625, -1.2685546875, -1.16058349609375, -1.0526123046875, -0.94464111328125, -0.836669921875, -0.72869873046875, -0.6207275390625, -0.51275634765625, -0.40478515625, -0.29681396484375, -0.1888427734375, -0.08087158203125, 0.027099609375, 0.13507080078125, 0.2430419921875, 0.35101318359375, 0.458984375, 0.56695556640625, 0.6749267578125, 0.78289794921875, 0.890869140625, 0.99884033203125, 1.1068115234375, 1.21478271484375, 1.32275390625, 1.43072509765625, 1.5386962890625, 1.64666748046875, 1.754638671875, 1.86260986328125, 1.9705810546875, 2.07855224609375, 2.1865234375, 2.29449462890625, 2.4024658203125, 2.51043701171875, 2.618408203125, 2.72637939453125, 2.8343505859375, 2.94232177734375, 3.05029296875, 3.15826416015625, 3.2662353515625, 3.37420654296875, 3.482177734375, 3.59014892578125, 3.6981201171875, 3.80609130859375, 3.9140625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 7.0, 9.0, 12.0, 24.0, 29.0, 43.0, 67.0, 107.0, 129.0, 216.0, 369.0, 510.0, 830.0, 1264.0, 1855.0, 2822.0, 4251.0, 6854.0, 10624.0, 17129.0, 28195.0, 48015.0, 84003.0, 158603.0, 273268.0, 179847.0, 93977.0, 53097.0, 31310.0, 18792.0, 11362.0, 7270.0, 4723.0, 3031.0, 2055.0, 1359.0, 855.0, 544.0, 336.0, 244.0, 176.0, 126.0, 77.0, 50.0, 33.0, 15.0, 12.0, 9.0, 5.0, 5.0, 2.0, 6.0, 0.0, 3.0, 5.0, 0.0, 1.0], "bins": [-0.0206756591796875, -0.02002120018005371, -0.019366741180419922, -0.018712282180786133, -0.018057823181152344, -0.017403364181518555, -0.016748905181884766, -0.016094446182250977, -0.015439987182617188, -0.014785528182983398, -0.01413106918334961, -0.01347661018371582, -0.012822151184082031, -0.012167692184448242, -0.011513233184814453, -0.010858774185180664, -0.010204315185546875, -0.009549856185913086, -0.008895397186279297, -0.008240938186645508, -0.007586479187011719, -0.00693202018737793, -0.006277561187744141, -0.0056231021881103516, -0.0049686431884765625, -0.0043141841888427734, -0.0036597251892089844, -0.0030052661895751953, -0.0023508071899414062, -0.0016963481903076172, -0.0010418891906738281, -0.00038743019104003906, 0.00026702880859375, 0.0009214878082275391, 0.0015759468078613281, 0.002230405807495117, 0.0028848648071289062, 0.0035393238067626953, 0.004193782806396484, 0.0048482418060302734, 0.0055027008056640625, 0.0061571598052978516, 0.006811618804931641, 0.00746607780456543, 0.008120536804199219, 0.008774995803833008, 0.009429454803466797, 0.010083913803100586, 0.010738372802734375, 0.011392831802368164, 0.012047290802001953, 0.012701749801635742, 0.013356208801269531, 0.01401066780090332, 0.01466512680053711, 0.015319585800170898, 0.015974044799804688, 0.016628503799438477, 0.017282962799072266, 0.017937421798706055, 0.018591880798339844, 0.019246339797973633, 0.019900798797607422, 0.02055525779724121, 0.021209716796875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 7.0, 9.0, 12.0, 8.0, 13.0, 13.0, 17.0, 27.0, 28.0, 35.0, 30.0, 27.0, 44.0, 32.0, 35.0, 40.0, 37.0, 42.0, 1059.0, 52.0, 52.0, 43.0, 33.0, 43.0, 32.0, 43.0, 34.0, 29.0, 28.0, 18.0, 18.0, 21.0, 22.0, 13.0, 6.0, 6.0, 5.0, 7.0, 1.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7890625, -2.708740234375, -2.62841796875, -2.548095703125, -2.4677734375, -2.387451171875, -2.30712890625, -2.226806640625, -2.146484375, -2.066162109375, -1.98583984375, -1.905517578125, -1.8251953125, -1.744873046875, -1.66455078125, -1.584228515625, -1.50390625, -1.423583984375, -1.34326171875, -1.262939453125, -1.1826171875, -1.102294921875, -1.02197265625, -0.941650390625, -0.861328125, -0.781005859375, -0.70068359375, -0.620361328125, -0.5400390625, -0.459716796875, -0.37939453125, -0.299072265625, -0.21875, -0.138427734375, -0.05810546875, 0.022216796875, 0.1025390625, 0.182861328125, 0.26318359375, 0.343505859375, 0.423828125, 0.504150390625, 0.58447265625, 0.664794921875, 0.7451171875, 0.825439453125, 0.90576171875, 0.986083984375, 1.06640625, 1.146728515625, 1.22705078125, 1.307373046875, 1.3876953125, 1.468017578125, 1.54833984375, 1.628662109375, 1.708984375, 1.789306640625, 1.86962890625, 1.949951171875, 2.0302734375, 2.110595703125, 2.19091796875, 2.271240234375, 2.3515625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 5.0, 5.0, 16.0, 27.0, 29.0, 56.0, 97.0, 123.0, 178.0, 301.0, 430.0, 618.0, 1029.0, 1654.0, 2505.0, 3915.0, 6323.0, 10089.0, 16115.0, 25685.0, 41760.0, 66430.0, 108868.0, 179760.0, 1261693.0, 142289.0, 85391.0, 52979.0, 33188.0, 20493.0, 13061.0, 8163.0, 5041.0, 3154.0, 2056.0, 1237.0, 804.0, 527.0, 393.0, 228.0, 127.0, 83.0, 73.0, 44.0, 34.0, 16.0, 8.0, 7.0, 9.0, 4.0, 5.0, 2.0, 5.0, 0.0, 0.0, 1.0], "bins": [-0.008941650390625, -0.008664488792419434, -0.008387327194213867, -0.0081101655960083, -0.007833003997802734, -0.007555842399597168, -0.0072786808013916016, -0.007001519203186035, -0.006724357604980469, -0.006447196006774902, -0.006170034408569336, -0.0058928728103637695, -0.005615711212158203, -0.005338549613952637, -0.00506138801574707, -0.004784226417541504, -0.0045070648193359375, -0.004229903221130371, -0.003952741622924805, -0.0036755800247192383, -0.003398418426513672, -0.0031212568283081055, -0.002844095230102539, -0.0025669336318969727, -0.0022897720336914062, -0.00201261043548584, -0.0017354488372802734, -0.001458287239074707, -0.0011811256408691406, -0.0009039640426635742, -0.0006268024444580078, -0.0003496408462524414, -7.2479248046875e-05, 0.0002046823501586914, 0.0004818439483642578, 0.0007590055465698242, 0.0010361671447753906, 0.001313328742980957, 0.0015904903411865234, 0.0018676519393920898, 0.0021448135375976562, 0.0024219751358032227, 0.002699136734008789, 0.0029762983322143555, 0.003253459930419922, 0.0035306215286254883, 0.0038077831268310547, 0.004084944725036621, 0.0043621063232421875, 0.004639267921447754, 0.00491642951965332, 0.005193591117858887, 0.005470752716064453, 0.0057479143142700195, 0.006025075912475586, 0.006302237510681152, 0.006579399108886719, 0.006856560707092285, 0.0071337223052978516, 0.007410883903503418, 0.007688045501708984, 0.00796520709991455, 0.008242368698120117, 0.008519530296325684, 0.00879669189453125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 0.0, 11.0, 13.0, 0.0, 16.0, 23.0, 0.0, 25.0, 26.0, 0.0, 34.0, 0.0, 63.0, 149.0, 0.0, 261.0, 130.0, 0.0, 66.0, 34.0, 0.0, 35.0, 24.0, 0.0, 26.0, 13.0, 0.0, 8.0, 11.0, 0.0, 6.0, 8.0, 0.0, 2.0, 1.0, 0.0, 3.0, 8.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.3709068298339844e-06, -1.3317912817001343e-06, -1.2926757335662842e-06, -1.253560185432434e-06, -1.214444637298584e-06, -1.1753290891647339e-06, -1.1362135410308838e-06, -1.0970979928970337e-06, -1.0579824447631836e-06, -1.0188668966293335e-06, -9.797513484954834e-07, -9.406358003616333e-07, -9.015202522277832e-07, -8.624047040939331e-07, -8.23289155960083e-07, -7.841736078262329e-07, -7.450580596923828e-07, -7.059425115585327e-07, -6.668269634246826e-07, -6.277114152908325e-07, -5.885958671569824e-07, -5.494803190231323e-07, -5.103647708892822e-07, -4.7124922275543213e-07, -4.3213367462158203e-07, -3.9301812648773193e-07, -3.5390257835388184e-07, -3.1478703022003174e-07, -2.7567148208618164e-07, -2.3655593395233154e-07, -1.9744038581848145e-07, -1.5832483768463135e-07, -1.1920928955078125e-07, -8.009374141693115e-08, -4.0978193283081055e-08, -1.862645149230957e-09, 3.725290298461914e-08, 7.636845111846924e-08, 1.1548399925231934e-07, 1.5459954738616943e-07, 1.9371509552001953e-07, 2.3283064365386963e-07, 2.7194619178771973e-07, 3.110617399215698e-07, 3.501772880554199e-07, 3.8929283618927e-07, 4.284083843231201e-07, 4.675239324569702e-07, 5.066394805908203e-07, 5.457550287246704e-07, 5.848705768585205e-07, 6.239861249923706e-07, 6.631016731262207e-07, 7.022172212600708e-07, 7.413327693939209e-07, 7.80448317527771e-07, 8.195638656616211e-07, 8.586794137954712e-07, 8.977949619293213e-07, 9.369105100631714e-07, 9.760260581970215e-07, 1.0151416063308716e-06, 1.0542571544647217e-06, 1.0933727025985718e-06, 1.1324882507324219e-06]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 4.0, 4.0, 0.0, 6.0, 6.0, 6.0, 9.0, 2.0, 11.0, 13.0, 18.0, 16.0, 26.0, 35.0, 62.0, 80.0, 171.0, 372.0, 2182.0, 855843.0, 187524.0, 1440.0, 304.0, 142.0, 85.0, 52.0, 24.0, 21.0, 18.0, 18.0, 10.0, 9.0, 11.0, 6.0, 7.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.282857894897461e-05, -2.2038817405700684e-05, -2.1249055862426758e-05, -2.0459294319152832e-05, -1.9669532775878906e-05, -1.887977123260498e-05, -1.8090009689331055e-05, -1.730024814605713e-05, -1.6510486602783203e-05, -1.5720725059509277e-05, -1.4930963516235352e-05, -1.4141201972961426e-05, -1.33514404296875e-05, -1.2561678886413574e-05, -1.1771917343139648e-05, -1.0982155799865723e-05, -1.0192394256591797e-05, -9.402632713317871e-06, -8.612871170043945e-06, -7.82310962677002e-06, -7.033348083496094e-06, -6.243586540222168e-06, -5.453824996948242e-06, -4.664063453674316e-06, -3.874301910400391e-06, -3.084540367126465e-06, -2.294778823852539e-06, -1.5050172805786133e-06, -7.152557373046875e-07, 7.450580596923828e-08, 8.642673492431641e-07, 1.6540288925170898e-06, 2.4437904357910156e-06, 3.2335519790649414e-06, 4.023313522338867e-06, 4.813075065612793e-06, 5.602836608886719e-06, 6.3925981521606445e-06, 7.18235969543457e-06, 7.972121238708496e-06, 8.761882781982422e-06, 9.551644325256348e-06, 1.0341405868530273e-05, 1.11311674118042e-05, 1.1920928955078125e-05, 1.271069049835205e-05, 1.3500452041625977e-05, 1.4290213584899902e-05, 1.5079975128173828e-05, 1.5869736671447754e-05, 1.665949821472168e-05, 1.7449259757995605e-05, 1.823902130126953e-05, 1.9028782844543457e-05, 1.9818544387817383e-05, 2.060830593109131e-05, 2.1398067474365234e-05, 2.218782901763916e-05, 2.2977590560913086e-05, 2.3767352104187012e-05, 2.4557113647460938e-05, 2.5346875190734863e-05, 2.613663673400879e-05, 2.6926398277282715e-05, 2.771615982055664e-05]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 29.0, 433.0, 525.0, 28.0], "bins": [-1.2334198800090235e-05, -1.2135421457060147e-05, -1.193664411403006e-05, -1.1737867680494674e-05, -1.1539090337464586e-05, -1.1340312994434498e-05, -1.114153565140441e-05, -1.0942758308374323e-05, -1.0743980965344235e-05, -1.0545203622314148e-05, -1.034642627928406e-05, -1.0147648936253972e-05, -9.948872502718586e-06, -9.750095159688499e-06, -9.551317816658411e-06, -9.352540473628324e-06, -9.153764040092938e-06, -8.95498669706285e-06, -8.756209354032762e-06, -8.557432011002675e-06, -8.358655577467289e-06, -8.159878234437201e-06, -7.961100891407114e-06, -7.762323548377026e-06, -7.563546205346938e-06, -7.3647688623168506e-06, -7.165991974034114e-06, -6.967214631004026e-06, -6.7684372879739385e-06, -6.569660399691202e-06, -6.370883056661114e-06, -6.1721057136310264e-06, -5.97332882534829e-06, -5.774551482318202e-06, -5.575774594035465e-06, -5.376997251005378e-06, -5.17821990797529e-06, -4.979443019692553e-06, -4.7806656766624656e-06, -4.581888788379729e-06, -4.383111445349641e-06, -4.1843341023195535e-06, -3.985557214036817e-06, -3.786779871006729e-06, -3.588002755350317e-06, -3.3892256396939047e-06, -3.190448296663817e-06, -2.991671181007405e-06, -2.7928940653509926e-06, -2.5941169496945804e-06, -2.3953396066644927e-06, -2.1965624910080805e-06, -1.9977853753516683e-06, -1.7990081460084184e-06, -1.6002309166651685e-06, -1.4014538010087563e-06, -1.2026764579786686e-06, -1.0038992286354187e-06, -8.051221129790065e-07, -6.063448836357566e-07, -4.075677111359255e-07, -2.0879053863609442e-07, -1.0013309292844497e-08, 1.887638063635677e-07, 3.875410072851082e-07]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 9.0, 0.0, 0.0, 25.0, 0.0, 0.0, 53.0, 0.0, 0.0, 121.0, 0.0, 0.0, 184.0, 0.0, 0.0, 0.0, 253.0, 0.0, 0.0, 170.0, 0.0, 0.0, 103.0, 0.0, 0.0, 47.0, 0.0, 0.0, 23.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 7.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539062e-07, -5.774199962615967e-07, -5.587935447692871e-07, -5.401670932769775e-07, -5.21540641784668e-07, -5.029141902923584e-07, -4.842877388000488e-07, -4.6566128730773926e-07, -4.470348358154297e-07, -4.284083843231201e-07, -4.0978193283081055e-07, -3.91155481338501e-07, -3.725290298461914e-07, -3.5390257835388184e-07, -3.3527612686157227e-07, -3.166496753692627e-07, -2.980232238769531e-07, -2.7939677238464355e-07, -2.60770320892334e-07, -2.421438694000244e-07, -2.2351741790771484e-07, -2.0489096641540527e-07, -1.862645149230957e-07, -1.6763806343078613e-07, -1.4901161193847656e-07, -1.30385160446167e-07, -1.1175870895385742e-07, -9.313225746154785e-08, -7.450580596923828e-08, -5.587935447692871e-08, -3.725290298461914e-08, -1.862645149230957e-08, 0.0, 1.862645149230957e-08, 3.725290298461914e-08, 5.587935447692871e-08, 7.450580596923828e-08, 9.313225746154785e-08, 1.1175870895385742e-07, 1.30385160446167e-07, 1.4901161193847656e-07, 1.6763806343078613e-07, 1.862645149230957e-07, 2.0489096641540527e-07, 2.2351741790771484e-07, 2.421438694000244e-07, 2.60770320892334e-07, 2.7939677238464355e-07, 2.980232238769531e-07, 3.166496753692627e-07, 3.3527612686157227e-07, 3.5390257835388184e-07, 3.725290298461914e-07, 3.91155481338501e-07, 4.0978193283081055e-07, 4.284083843231201e-07, 4.470348358154297e-07, 4.6566128730773926e-07, 4.842877388000488e-07, 5.029141902923584e-07, 5.21540641784668e-07, 5.401670932769775e-07, 5.587935447692871e-07, 5.774199962615967e-07, 5.960464477539062e-07]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 8.0, 9.0, 17.0, 17.0, 13.0, 25.0, 18.0, 23.0, 22.0, 35.0, 33.0, 35.0, 49.0, 46.0, 43.0, 55.0, 54.0, 53.0, 53.0, 49.0, 40.0, 40.0, 42.0, 30.0, 36.0, 30.0, 21.0, 21.0, 17.0, 12.0, 16.0, 10.0, 6.0, 5.0, 3.0, 2.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.99609375, -2.88812255859375, -2.7801513671875, -2.67218017578125, -2.564208984375, -2.45623779296875, -2.3482666015625, -2.24029541015625, -2.13232421875, -2.02435302734375, -1.9163818359375, -1.80841064453125, -1.700439453125, -1.59246826171875, -1.4844970703125, -1.37652587890625, -1.2685546875, -1.16058349609375, -1.0526123046875, -0.94464111328125, -0.836669921875, -0.72869873046875, -0.6207275390625, -0.51275634765625, -0.40478515625, -0.29681396484375, -0.1888427734375, -0.08087158203125, 0.027099609375, 0.13507080078125, 0.2430419921875, 0.35101318359375, 0.458984375, 0.56695556640625, 0.6749267578125, 0.78289794921875, 0.890869140625, 0.99884033203125, 1.1068115234375, 1.21478271484375, 1.32275390625, 1.43072509765625, 1.5386962890625, 1.64666748046875, 1.754638671875, 1.86260986328125, 1.9705810546875, 2.07855224609375, 2.1865234375, 2.29449462890625, 2.4024658203125, 2.51043701171875, 2.618408203125, 2.72637939453125, 2.8343505859375, 2.94232177734375, 3.05029296875, 3.15826416015625, 3.2662353515625, 3.37420654296875, 3.482177734375, 3.59014892578125, 3.6981201171875, 3.80609130859375, 3.9140625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 8.0, 8.0, 15.0, 17.0, 20.0, 33.0, 37.0, 71.0, 87.0, 159.0, 241.0, 364.0, 513.0, 734.0, 1096.0, 1730.0, 2550.0, 4217.0, 6902.0, 11832.0, 21736.0, 44782.0, 101185.0, 246222.0, 322295.0, 150385.0, 63253.0, 29619.0, 15321.0, 8743.0, 5087.0, 3318.0, 2012.0, 1243.0, 921.0, 567.0, 403.0, 267.0, 191.0, 107.0, 83.0, 56.0, 41.0, 31.0, 17.0, 18.0, 8.0, 9.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.751953125, -3.639007568359375, -3.52606201171875, -3.413116455078125, -3.3001708984375, -3.187225341796875, -3.07427978515625, -2.961334228515625, -2.848388671875, -2.735443115234375, -2.62249755859375, -2.509552001953125, -2.3966064453125, -2.283660888671875, -2.17071533203125, -2.057769775390625, -1.94482421875, -1.831878662109375, -1.71893310546875, -1.605987548828125, -1.4930419921875, -1.380096435546875, -1.26715087890625, -1.154205322265625, -1.041259765625, -0.928314208984375, -0.81536865234375, -0.702423095703125, -0.5894775390625, -0.476531982421875, -0.36358642578125, -0.250640869140625, -0.1376953125, -0.024749755859375, 0.08819580078125, 0.201141357421875, 0.3140869140625, 0.427032470703125, 0.53997802734375, 0.652923583984375, 0.765869140625, 0.878814697265625, 0.99176025390625, 1.104705810546875, 1.2176513671875, 1.330596923828125, 1.44354248046875, 1.556488037109375, 1.66943359375, 1.782379150390625, 1.89532470703125, 2.008270263671875, 2.1212158203125, 2.234161376953125, 2.34710693359375, 2.460052490234375, 2.572998046875, 2.685943603515625, 2.79888916015625, 2.911834716796875, 3.0247802734375, 3.137725830078125, 3.25067138671875, 3.363616943359375, 3.4765625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 4.0, 8.0, 2.0, 8.0, 5.0, 13.0, 7.0, 12.0, 15.0, 12.0, 27.0, 22.0, 27.0, 27.0, 28.0, 34.0, 46.0, 40.0, 20.0, 56.0, 84.0, 139.0, 330.0, 1360.0, 195.0, 83.0, 55.0, 49.0, 42.0, 32.0, 32.0, 31.0, 33.0, 22.0, 21.0, 20.0, 17.0, 22.0, 6.0, 14.0, 9.0, 7.0, 6.0, 8.0, 8.0, 2.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5, -8.2352294921875, -7.970458984375, -7.7056884765625, -7.44091796875, -7.1761474609375, -6.911376953125, -6.6466064453125, -6.3818359375, -6.1170654296875, -5.852294921875, -5.5875244140625, -5.32275390625, -5.0579833984375, -4.793212890625, -4.5284423828125, -4.263671875, -3.9989013671875, -3.734130859375, -3.4693603515625, -3.20458984375, -2.9398193359375, -2.675048828125, -2.4102783203125, -2.1455078125, -1.8807373046875, -1.615966796875, -1.3511962890625, -1.08642578125, -0.8216552734375, -0.556884765625, -0.2921142578125, -0.02734375, 0.2374267578125, 0.502197265625, 0.7669677734375, 1.03173828125, 1.2965087890625, 1.561279296875, 1.8260498046875, 2.0908203125, 2.3555908203125, 2.620361328125, 2.8851318359375, 3.14990234375, 3.4146728515625, 3.679443359375, 3.9442138671875, 4.208984375, 4.4737548828125, 4.738525390625, 5.0032958984375, 5.26806640625, 5.5328369140625, 5.797607421875, 6.0623779296875, 6.3271484375, 6.5919189453125, 6.856689453125, 7.1214599609375, 7.38623046875, 7.6510009765625, 7.915771484375, 8.1805419921875, 8.4453125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 10.0, 6.0, 14.0, 14.0, 15.0, 26.0, 31.0, 28.0, 52.0, 60.0, 71.0, 84.0, 97.0, 165.0, 200.0, 289.0, 682.0, 1810.0, 6733.0, 50677.0, 2278920.0, 773761.0, 24600.0, 4405.0, 1302.0, 560.0, 282.0, 202.0, 135.0, 94.0, 92.0, 71.0, 48.0, 28.0, 34.0, 22.0, 24.0, 13.0, 13.0, 10.0, 4.0, 9.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.015625, -12.5797119140625, -12.143798828125, -11.7078857421875, -11.27197265625, -10.8360595703125, -10.400146484375, -9.9642333984375, -9.5283203125, -9.0924072265625, -8.656494140625, -8.2205810546875, -7.78466796875, -7.3487548828125, -6.912841796875, -6.4769287109375, -6.041015625, -5.6051025390625, -5.169189453125, -4.7332763671875, -4.29736328125, -3.8614501953125, -3.425537109375, -2.9896240234375, -2.5537109375, -2.1177978515625, -1.681884765625, -1.2459716796875, -0.81005859375, -0.3741455078125, 0.061767578125, 0.4976806640625, 0.93359375, 1.3695068359375, 1.805419921875, 2.2413330078125, 2.67724609375, 3.1131591796875, 3.549072265625, 3.9849853515625, 4.4208984375, 4.8568115234375, 5.292724609375, 5.7286376953125, 6.16455078125, 6.6004638671875, 7.036376953125, 7.4722900390625, 7.908203125, 8.3441162109375, 8.780029296875, 9.2159423828125, 9.65185546875, 10.0877685546875, 10.523681640625, 10.9595947265625, 11.3955078125, 11.8314208984375, 12.267333984375, 12.7032470703125, 13.13916015625, 13.5750732421875, 14.010986328125, 14.4468994140625, 14.8828125]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 52.0, 279.0, 531.0, 141.0, 8.0, 1.0, 1.0, 1.0], "bins": [-172.35409545898438, -169.39540100097656, -166.4366912841797, -163.47799682617188, -160.51930236816406, -157.56060791015625, -154.60189819335938, -151.64320373535156, -148.68450927734375, -145.72581481933594, -142.76710510253906, -139.80841064453125, -136.84971618652344, -133.89102172851562, -130.93231201171875, -127.97361755371094, -125.0149154663086, -122.05621337890625, -119.09751892089844, -116.1388168334961, -113.18012237548828, -110.22142028808594, -107.26272583007812, -104.30402374267578, -101.34532165527344, -98.3866195678711, -95.42792510986328, -92.46922302246094, -89.51052856445312, -86.55182647705078, -83.59312438964844, -80.63442993164062, -77.67574310302734, -74.717041015625, -71.75834655761719, -68.79964447021484, -65.84095001220703, -62.88224792480469, -59.92354965209961, -56.96485137939453, -54.00615310668945, -51.047454833984375, -48.0887565612793, -45.13005828857422, -42.171356201171875, -39.21266174316406, -36.25395965576172, -33.29526138305664, -30.336563110351562, -27.377864837646484, -24.419166564941406, -21.460466384887695, -18.501768112182617, -15.543069839477539, -12.584369659423828, -9.62567138671875, -6.666973114013672, -3.7082743644714355, -0.7495756149291992, 2.2091236114501953, 5.167821884155273, 8.126520156860352, 11.085220336914062, 14.04391860961914, 17.00261688232422]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 4.0, 0.0, 7.0, 12.0, 14.0, 19.0, 15.0, 22.0, 24.0, 17.0, 37.0, 36.0, 35.0, 33.0, 41.0, 52.0, 49.0, 59.0, 58.0, 43.0, 55.0, 47.0, 43.0, 41.0, 54.0, 28.0, 22.0, 20.0, 25.0, 22.0, 18.0, 13.0, 6.0, 3.0, 10.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-32.12200927734375, -31.067209243774414, -30.012407302856445, -28.95760726928711, -27.90280532836914, -26.848005294799805, -25.79320526123047, -24.7384033203125, -23.683603286743164, -22.628803253173828, -21.57400131225586, -20.519201278686523, -19.464401245117188, -18.40959930419922, -17.354799270629883, -16.299999237060547, -15.245197296142578, -14.190396308898926, -13.135595321655273, -12.080795288085938, -11.025994300842285, -9.971193313598633, -8.916393280029297, -7.8615922927856445, -6.806791305541992, -5.75199031829834, -4.697189807891846, -3.6423890590667725, -2.587588310241699, -1.5327873229980469, -0.47798681259155273, 0.5768136978149414, 1.6316146850585938, 2.686415433883667, 3.7412161827087402, 4.796016693115234, 5.850817680358887, 6.905618667602539, 7.960419178009033, 9.015219688415527, 10.07002067565918, 11.124821662902832, 12.179622650146484, 13.23442268371582, 14.289223670959473, 15.344024658203125, 16.39882469177246, 17.453624725341797, 18.508426666259766, 19.5632266998291, 20.61802864074707, 21.672828674316406, 22.727630615234375, 23.78243064880371, 24.837230682373047, 25.892032623291016, 26.94683265686035, 28.001632690429688, 29.056434631347656, 30.111234664916992, 31.166034698486328, 32.2208366394043, 33.275638580322266, 34.33043670654297, 35.38523864746094]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 8.0, 6.0, 8.0, 12.0, 24.0, 15.0, 19.0, 17.0, 27.0, 23.0, 26.0, 30.0, 41.0, 40.0, 54.0, 38.0, 43.0, 67.0, 46.0, 57.0, 45.0, 42.0, 45.0, 43.0, 30.0, 34.0, 33.0, 24.0, 20.0, 17.0, 19.0, 11.0, 9.0, 9.0, 4.0, 5.0, 2.0, 5.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.923828125, -2.815643310546875, -2.70745849609375, -2.599273681640625, -2.4910888671875, -2.382904052734375, -2.27471923828125, -2.166534423828125, -2.058349609375, -1.950164794921875, -1.84197998046875, -1.733795166015625, -1.6256103515625, -1.517425537109375, -1.40924072265625, -1.301055908203125, -1.19287109375, -1.084686279296875, -0.97650146484375, -0.868316650390625, -0.7601318359375, -0.651947021484375, -0.54376220703125, -0.435577392578125, -0.327392578125, -0.219207763671875, -0.11102294921875, -0.002838134765625, 0.1053466796875, 0.213531494140625, 0.32171630859375, 0.429901123046875, 0.5380859375, 0.646270751953125, 0.75445556640625, 0.862640380859375, 0.9708251953125, 1.079010009765625, 1.18719482421875, 1.295379638671875, 1.403564453125, 1.511749267578125, 1.61993408203125, 1.728118896484375, 1.8363037109375, 1.944488525390625, 2.05267333984375, 2.160858154296875, 2.26904296875, 2.377227783203125, 2.48541259765625, 2.593597412109375, 2.7017822265625, 2.809967041015625, 2.91815185546875, 3.026336669921875, 3.134521484375, 3.242706298828125, 3.35089111328125, 3.459075927734375, 3.5672607421875, 3.675445556640625, 3.78363037109375, 3.891815185546875, 4.0]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 9.0, 15.0, 7.0, 23.0, 17.0, 37.0, 41.0, 71.0, 98.0, 147.0, 206.0, 338.0, 566.0, 882.0, 1577.0, 2863.0, 5695.0, 11478.0, 25417.0, 63192.0, 184269.0, 640077.0, 1744201.0, 1055210.0, 295689.0, 94677.0, 36323.0, 15557.0, 7271.0, 3644.0, 1883.0, 1056.0, 598.0, 353.0, 240.0, 142.0, 125.0, 81.0, 55.0, 35.0, 25.0, 21.0, 20.0, 9.0, 11.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.55859375, -4.41009521484375, -4.2615966796875, -4.11309814453125, -3.964599609375, -3.81610107421875, -3.6676025390625, -3.51910400390625, -3.37060546875, -3.22210693359375, -3.0736083984375, -2.92510986328125, -2.776611328125, -2.62811279296875, -2.4796142578125, -2.33111572265625, -2.1826171875, -2.03411865234375, -1.8856201171875, -1.73712158203125, -1.588623046875, -1.44012451171875, -1.2916259765625, -1.14312744140625, -0.99462890625, -0.84613037109375, -0.6976318359375, -0.54913330078125, -0.400634765625, -0.25213623046875, -0.1036376953125, 0.04486083984375, 0.193359375, 0.34185791015625, 0.4903564453125, 0.63885498046875, 0.787353515625, 0.93585205078125, 1.0843505859375, 1.23284912109375, 1.38134765625, 1.52984619140625, 1.6783447265625, 1.82684326171875, 1.975341796875, 2.12384033203125, 2.2723388671875, 2.42083740234375, 2.5693359375, 2.71783447265625, 2.8663330078125, 3.01483154296875, 3.163330078125, 3.31182861328125, 3.4603271484375, 3.60882568359375, 3.75732421875, 3.90582275390625, 4.0543212890625, 4.20281982421875, 4.351318359375, 4.49981689453125, 4.6483154296875, 4.79681396484375, 4.9453125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 8.0, 14.0, 13.0, 14.0, 23.0, 37.0, 28.0, 47.0, 69.0, 98.0, 125.0, 168.0, 294.0, 353.0, 470.0, 527.0, 435.0, 357.0, 311.0, 208.0, 136.0, 90.0, 68.0, 60.0, 36.0, 28.0, 21.0, 11.0, 13.0, 4.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.25, -8.0465087890625, -7.843017578125, -7.6395263671875, -7.43603515625, -7.2325439453125, -7.029052734375, -6.8255615234375, -6.6220703125, -6.4185791015625, -6.215087890625, -6.0115966796875, -5.80810546875, -5.6046142578125, -5.401123046875, -5.1976318359375, -4.994140625, -4.7906494140625, -4.587158203125, -4.3836669921875, -4.18017578125, -3.9766845703125, -3.773193359375, -3.5697021484375, -3.3662109375, -3.1627197265625, -2.959228515625, -2.7557373046875, -2.55224609375, -2.3487548828125, -2.145263671875, -1.9417724609375, -1.73828125, -1.5347900390625, -1.331298828125, -1.1278076171875, -0.92431640625, -0.7208251953125, -0.517333984375, -0.3138427734375, -0.1103515625, 0.0931396484375, 0.296630859375, 0.5001220703125, 0.70361328125, 0.9071044921875, 1.110595703125, 1.3140869140625, 1.517578125, 1.7210693359375, 1.924560546875, 2.1280517578125, 2.33154296875, 2.5350341796875, 2.738525390625, 2.9420166015625, 3.1455078125, 3.3489990234375, 3.552490234375, 3.7559814453125, 3.95947265625, 4.1629638671875, 4.366455078125, 4.5699462890625, 4.7734375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 6.0, 11.0, 10.0, 19.0, 26.0, 28.0, 39.0, 58.0, 90.0, 133.0, 211.0, 345.0, 732.0, 2173.0, 13863.0, 228651.0, 3379683.0, 536788.0, 26129.0, 3224.0, 911.0, 418.0, 221.0, 152.0, 101.0, 71.0, 48.0, 39.0, 20.0, 21.0, 11.0, 18.0, 10.0, 9.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5859375, -15.0006103515625, -14.415283203125, -13.8299560546875, -13.24462890625, -12.6593017578125, -12.073974609375, -11.4886474609375, -10.9033203125, -10.3179931640625, -9.732666015625, -9.1473388671875, -8.56201171875, -7.9766845703125, -7.391357421875, -6.8060302734375, -6.220703125, -5.6353759765625, -5.050048828125, -4.4647216796875, -3.87939453125, -3.2940673828125, -2.708740234375, -2.1234130859375, -1.5380859375, -0.9527587890625, -0.367431640625, 0.2178955078125, 0.80322265625, 1.3885498046875, 1.973876953125, 2.5592041015625, 3.14453125, 3.7298583984375, 4.315185546875, 4.9005126953125, 5.48583984375, 6.0711669921875, 6.656494140625, 7.2418212890625, 7.8271484375, 8.4124755859375, 8.997802734375, 9.5831298828125, 10.16845703125, 10.7537841796875, 11.339111328125, 11.9244384765625, 12.509765625, 13.0950927734375, 13.680419921875, 14.2657470703125, 14.85107421875, 15.4364013671875, 16.021728515625, 16.6070556640625, 17.1923828125, 17.7777099609375, 18.363037109375, 18.9483642578125, 19.53369140625, 20.1190185546875, 20.704345703125, 21.2896728515625, 21.875]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 6.0, 10.0, 8.0, 20.0, 19.0, 31.0, 29.0, 44.0, 50.0, 72.0, 78.0, 98.0, 94.0, 79.0, 80.0, 69.0, 56.0, 40.0, 38.0, 26.0, 15.0, 16.0, 9.0, 5.0, 5.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.686321258544922, -15.83186149597168, -14.977402687072754, -14.122942924499512, -13.26848316192627, -12.414024353027344, -11.559564590454102, -10.70510482788086, -9.850645065307617, -8.996185302734375, -8.14172649383545, -7.287266731262207, -6.432806968688965, -5.578347682952881, -4.723888397216797, -3.8694286346435547, -3.014969825744629, -2.160510301589966, -1.3060508966445923, -0.45159149169921875, 0.40286803245544434, 1.2573275566101074, 2.1117868423461914, 2.9662466049194336, 3.8207058906555176, 4.675165176391602, 5.529624938964844, 6.384084224700928, 7.238543510437012, 8.093003273010254, 8.94746208190918, 9.801921844482422, 10.656381607055664, 11.510841369628906, 12.365300178527832, 13.219759941101074, 14.074219703674316, 14.928678512573242, 15.783138275146484, 16.637598037719727, 17.49205780029297, 18.34651756286621, 19.200977325439453, 20.055435180664062, 20.909894943237305, 21.764354705810547, 22.61881446838379, 23.47327423095703, 24.32773208618164, 25.182191848754883, 26.036651611328125, 26.891109466552734, 27.745569229125977, 28.60002899169922, 29.45448875427246, 30.308948516845703, 31.163408279418945, 32.01786804199219, 32.8723258972168, 33.72678756713867, 34.58124542236328, 35.435707092285156, 36.290164947509766, 37.144622802734375, 37.99908447265625]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 7.0, 5.0, 9.0, 11.0, 13.0, 10.0, 16.0, 20.0, 21.0, 17.0, 23.0, 28.0, 34.0, 36.0, 31.0, 31.0, 30.0, 41.0, 28.0, 45.0, 46.0, 52.0, 37.0, 45.0, 34.0, 30.0, 34.0, 32.0, 34.0, 30.0, 33.0, 28.0, 18.0, 12.0, 13.0, 17.0, 18.0, 6.0, 3.0, 4.0, 6.0, 1.0, 0.0, 7.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.021026611328125, -19.350439071655273, -18.679851531982422, -18.00926399230957, -17.33867645263672, -16.6680908203125, -15.997502326965332, -15.326915740966797, -14.656328201293945, -13.985740661621094, -13.315153121948242, -12.64456558227539, -11.973978996276855, -11.303391456604004, -10.632803916931152, -9.962217330932617, -9.29162883758545, -8.621041297912598, -7.950454235076904, -7.279866695404053, -6.609279632568359, -5.938692092895508, -5.268104553222656, -4.597517490386963, -3.9269299507141113, -3.256342649459839, -2.5857553482055664, -1.9151678085327148, -1.2445805072784424, -0.5739932060241699, 0.09659433364868164, 0.767181396484375, 1.4377689361572266, 2.108356237411499, 2.7789435386657715, 3.449531078338623, 4.120118141174316, 4.790705680847168, 5.4612932205200195, 6.131880283355713, 6.8024678230285645, 7.473055362701416, 8.14364242553711, 8.814229965209961, 9.484817504882812, 10.155405044555664, 10.825992584228516, 11.49657917022705, 12.167166709899902, 12.837754249572754, 13.508341789245605, 14.17892837524414, 14.849515914916992, 15.520103454589844, 16.190690994262695, 16.861278533935547, 17.5318660736084, 18.20245361328125, 18.8730411529541, 19.543628692626953, 20.214216232299805, 20.884803771972656, 21.555389404296875, 22.225976943969727, 22.896564483642578]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 6.0, 14.0, 10.0, 14.0, 18.0, 22.0, 24.0, 25.0, 32.0, 29.0, 34.0, 42.0, 43.0, 44.0, 56.0, 47.0, 58.0, 49.0, 64.0, 54.0, 46.0, 47.0, 35.0, 24.0, 28.0, 24.0, 32.0, 16.0, 13.0, 18.0, 9.0, 6.0, 3.0, 6.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.44921875, -3.3319091796875, -3.214599609375, -3.0972900390625, -2.97998046875, -2.8626708984375, -2.745361328125, -2.6280517578125, -2.5107421875, -2.3934326171875, -2.276123046875, -2.1588134765625, -2.04150390625, -1.9241943359375, -1.806884765625, -1.6895751953125, -1.572265625, -1.4549560546875, -1.337646484375, -1.2203369140625, -1.10302734375, -0.9857177734375, -0.868408203125, -0.7510986328125, -0.6337890625, -0.5164794921875, -0.399169921875, -0.2818603515625, -0.16455078125, -0.0472412109375, 0.070068359375, 0.1873779296875, 0.3046875, 0.4219970703125, 0.539306640625, 0.6566162109375, 0.77392578125, 0.8912353515625, 1.008544921875, 1.1258544921875, 1.2431640625, 1.3604736328125, 1.477783203125, 1.5950927734375, 1.71240234375, 1.8297119140625, 1.947021484375, 2.0643310546875, 2.181640625, 2.2989501953125, 2.416259765625, 2.5335693359375, 2.65087890625, 2.7681884765625, 2.885498046875, 3.0028076171875, 3.1201171875, 3.2374267578125, 3.354736328125, 3.4720458984375, 3.58935546875, 3.7066650390625, 3.823974609375, 3.9412841796875, 4.05859375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 9.0, 11.0, 10.0, 18.0, 26.0, 17.0, 35.0, 56.0, 98.0, 161.0, 262.0, 419.0, 598.0, 1030.0, 1714.0, 2666.0, 4668.0, 8363.0, 14584.0, 26489.0, 48453.0, 96082.0, 207880.0, 321786.0, 152113.0, 73483.0, 38716.0, 20793.0, 11528.0, 6626.0, 3949.0, 2281.0, 1377.0, 857.0, 491.0, 309.0, 172.0, 142.0, 105.0, 63.0, 50.0, 28.0, 15.0, 8.0, 6.0, 6.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0273895263671875, -0.02656722068786621, -0.025744915008544922, -0.024922609329223633, -0.024100303649902344, -0.023277997970581055, -0.022455692291259766, -0.021633386611938477, -0.020811080932617188, -0.0199887752532959, -0.01916646957397461, -0.01834416389465332, -0.01752185821533203, -0.016699552536010742, -0.015877246856689453, -0.015054941177368164, -0.014232635498046875, -0.013410329818725586, -0.012588024139404297, -0.011765718460083008, -0.010943412780761719, -0.01012110710144043, -0.00929880142211914, -0.008476495742797852, -0.0076541900634765625, -0.0068318843841552734, -0.006009578704833984, -0.005187273025512695, -0.004364967346191406, -0.003542661666870117, -0.002720355987548828, -0.001898050308227539, -0.00107574462890625, -0.00025343894958496094, 0.0005688667297363281, 0.0013911724090576172, 0.0022134780883789062, 0.0030357837677001953, 0.0038580894470214844, 0.0046803951263427734, 0.0055027008056640625, 0.0063250064849853516, 0.007147312164306641, 0.00796961784362793, 0.008791923522949219, 0.009614229202270508, 0.010436534881591797, 0.011258840560913086, 0.012081146240234375, 0.012903451919555664, 0.013725757598876953, 0.014548063278198242, 0.015370368957519531, 0.01619267463684082, 0.01701498031616211, 0.0178372859954834, 0.018659591674804688, 0.019481897354125977, 0.020304203033447266, 0.021126508712768555, 0.021948814392089844, 0.022771120071411133, 0.023593425750732422, 0.02441573143005371, 0.025238037109375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 3.0, 8.0, 6.0, 6.0, 9.0, 14.0, 17.0, 17.0, 20.0, 18.0, 27.0, 24.0, 33.0, 20.0, 26.0, 31.0, 33.0, 27.0, 41.0, 40.0, 36.0, 1060.0, 36.0, 34.0, 35.0, 44.0, 35.0, 37.0, 39.0, 28.0, 37.0, 26.0, 22.0, 19.0, 18.0, 17.0, 12.0, 11.0, 11.0, 10.0, 9.0, 6.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.193359375, -2.12420654296875, -2.0550537109375, -1.98590087890625, -1.916748046875, -1.84759521484375, -1.7784423828125, -1.70928955078125, -1.64013671875, -1.57098388671875, -1.5018310546875, -1.43267822265625, -1.363525390625, -1.29437255859375, -1.2252197265625, -1.15606689453125, -1.0869140625, -1.01776123046875, -0.9486083984375, -0.87945556640625, -0.810302734375, -0.74114990234375, -0.6719970703125, -0.60284423828125, -0.53369140625, -0.46453857421875, -0.3953857421875, -0.32623291015625, -0.257080078125, -0.18792724609375, -0.1187744140625, -0.04962158203125, 0.01953125, 0.08868408203125, 0.1578369140625, 0.22698974609375, 0.296142578125, 0.36529541015625, 0.4344482421875, 0.50360107421875, 0.57275390625, 0.64190673828125, 0.7110595703125, 0.78021240234375, 0.849365234375, 0.91851806640625, 0.9876708984375, 1.05682373046875, 1.1259765625, 1.19512939453125, 1.2642822265625, 1.33343505859375, 1.402587890625, 1.47174072265625, 1.5408935546875, 1.61004638671875, 1.67919921875, 1.74835205078125, 1.8175048828125, 1.88665771484375, 1.955810546875, 2.02496337890625, 2.0941162109375, 2.16326904296875, 2.232421875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 7.0, 7.0, 11.0, 17.0, 21.0, 31.0, 44.0, 78.0, 87.0, 134.0, 206.0, 280.0, 419.0, 617.0, 861.0, 1316.0, 1969.0, 2854.0, 4377.0, 6599.0, 10199.0, 15397.0, 23936.0, 36372.0, 56493.0, 88011.0, 140622.0, 1249659.0, 164833.0, 102920.0, 65708.0, 42585.0, 27834.0, 17920.0, 11655.0, 7626.0, 5153.0, 3350.0, 2236.0, 1492.0, 994.0, 686.0, 469.0, 326.0, 226.0, 162.0, 105.0, 63.0, 59.0, 34.0, 22.0, 18.0, 16.0, 9.0, 5.0, 5.0, 4.0, 0.0, 2.0, 1.0], "bins": [-0.00811767578125, -0.00786137580871582, -0.007605075836181641, -0.007348775863647461, -0.007092475891113281, -0.0068361759185791016, -0.006579875946044922, -0.006323575973510742, -0.0060672760009765625, -0.005810976028442383, -0.005554676055908203, -0.0052983760833740234, -0.005042076110839844, -0.004785776138305664, -0.004529476165771484, -0.004273176193237305, -0.004016876220703125, -0.0037605762481689453, -0.0035042762756347656, -0.003247976303100586, -0.0029916763305664062, -0.0027353763580322266, -0.002479076385498047, -0.002222776412963867, -0.0019664764404296875, -0.0017101764678955078, -0.0014538764953613281, -0.0011975765228271484, -0.0009412765502929688, -0.0006849765777587891, -0.0004286766052246094, -0.0001723766326904297, 8.392333984375e-05, 0.0003402233123779297, 0.0005965232849121094, 0.0008528232574462891, 0.0011091232299804688, 0.0013654232025146484, 0.0016217231750488281, 0.0018780231475830078, 0.0021343231201171875, 0.002390623092651367, 0.002646923065185547, 0.0029032230377197266, 0.0031595230102539062, 0.003415822982788086, 0.0036721229553222656, 0.003928422927856445, 0.004184722900390625, 0.004441022872924805, 0.004697322845458984, 0.004953622817993164, 0.005209922790527344, 0.0054662227630615234, 0.005722522735595703, 0.005978822708129883, 0.0062351226806640625, 0.006491422653198242, 0.006747722625732422, 0.0070040225982666016, 0.007260322570800781, 0.007516622543334961, 0.007772922515869141, 0.00802922248840332, 0.0082855224609375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 2.0, 6.0, 0.0, 5.0, 11.0, 9.0, 5.0, 0.0, 11.0, 15.0, 7.0, 0.0, 12.0, 8.0, 30.0, 0.0, 32.0, 45.0, 65.0, 0.0, 142.0, 220.0, 124.0, 73.0, 0.0, 39.0, 28.0, 19.0, 0.0, 16.0, 10.0, 12.0, 0.0, 10.0, 12.0, 8.0, 0.0, 9.0, 3.0, 6.0, 10.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.430511474609375e-06, -1.3848766684532166e-06, -1.339241862297058e-06, -1.2936070561408997e-06, -1.2479722499847412e-06, -1.2023374438285828e-06, -1.1567026376724243e-06, -1.1110678315162659e-06, -1.0654330253601074e-06, -1.019798219203949e-06, -9.741634130477905e-07, -9.285286068916321e-07, -8.828938007354736e-07, -8.372589945793152e-07, -7.916241884231567e-07, -7.459893822669983e-07, -7.003545761108398e-07, -6.547197699546814e-07, -6.09084963798523e-07, -5.634501576423645e-07, -5.178153514862061e-07, -4.721805453300476e-07, -4.2654573917388916e-07, -3.809109330177307e-07, -3.3527612686157227e-07, -2.896413207054138e-07, -2.4400651454925537e-07, -1.9837170839309692e-07, -1.5273690223693848e-07, -1.0710209608078003e-07, -6.146728992462158e-08, -1.5832483768463135e-08, 2.9802322387695312e-08, 7.543712854385376e-08, 1.210719347000122e-07, 1.6670674085617065e-07, 2.123415470123291e-07, 2.5797635316848755e-07, 3.03611159324646e-07, 3.4924596548080444e-07, 3.948807716369629e-07, 4.4051557779312134e-07, 4.861503839492798e-07, 5.317851901054382e-07, 5.774199962615967e-07, 6.230548024177551e-07, 6.686896085739136e-07, 7.14324414730072e-07, 7.599592208862305e-07, 8.055940270423889e-07, 8.512288331985474e-07, 8.968636393547058e-07, 9.424984455108643e-07, 9.881332516670227e-07, 1.0337680578231812e-06, 1.0794028639793396e-06, 1.125037670135498e-06, 1.1706724762916565e-06, 1.216307282447815e-06, 1.2619420886039734e-06, 1.3075768947601318e-06, 1.3532117009162903e-06, 1.3988465070724487e-06, 1.4444813132286072e-06, 1.4901161193847656e-06]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 6.0, 2.0, 9.0, 3.0, 7.0, 7.0, 13.0, 7.0, 11.0, 14.0, 13.0, 32.0, 40.0, 73.0, 143.0, 264.0, 788.0, 75989.0, 967226.0, 2988.0, 393.0, 187.0, 123.0, 51.0, 40.0, 20.0, 19.0, 10.0, 8.0, 6.0, 9.0, 9.0, 2.0, 5.0, 6.0, 12.0, 4.0, 3.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0219554901123047e-05, -2.928171306848526e-05, -2.8343871235847473e-05, -2.7406029403209686e-05, -2.64681875705719e-05, -2.5530345737934113e-05, -2.4592503905296326e-05, -2.365466207265854e-05, -2.2716820240020752e-05, -2.1778978407382965e-05, -2.0841136574745178e-05, -1.990329474210739e-05, -1.8965452909469604e-05, -1.8027611076831818e-05, -1.708976924419403e-05, -1.6151927411556244e-05, -1.5214085578918457e-05, -1.427624374628067e-05, -1.3338401913642883e-05, -1.2400560081005096e-05, -1.146271824836731e-05, -1.0524876415729523e-05, -9.587034583091736e-06, -8.649192750453949e-06, -7.711350917816162e-06, -6.773509085178375e-06, -5.835667252540588e-06, -4.8978254199028015e-06, -3.959983587265015e-06, -3.0221417546272278e-06, -2.084299921989441e-06, -1.146458089351654e-06, -2.086162567138672e-07, 7.292255759239197e-07, 1.6670674085617065e-06, 2.6049092411994934e-06, 3.5427510738372803e-06, 4.480592906475067e-06, 5.418434739112854e-06, 6.356276571750641e-06, 7.294118404388428e-06, 8.231960237026215e-06, 9.169802069664001e-06, 1.0107643902301788e-05, 1.1045485734939575e-05, 1.1983327567577362e-05, 1.2921169400215149e-05, 1.3859011232852936e-05, 1.4796853065490723e-05, 1.573469489812851e-05, 1.6672536730766296e-05, 1.7610378563404083e-05, 1.854822039604187e-05, 1.9486062228679657e-05, 2.0423904061317444e-05, 2.136174589395523e-05, 2.2299587726593018e-05, 2.3237429559230804e-05, 2.417527139186859e-05, 2.5113113224506378e-05, 2.6050955057144165e-05, 2.6988796889781952e-05, 2.792663872241974e-05, 2.8864480555057526e-05, 2.9802322387695312e-05]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 74.0, 905.0, 38.0, 1.0], "bins": [-2.0190791474306025e-05, -1.9862396584358066e-05, -1.9534001694410108e-05, -1.920560680446215e-05, -1.887721191451419e-05, -1.8548817024566233e-05, -1.822042031562887e-05, -1.7892025425680913e-05, -1.7563630535732955e-05, -1.7235235645784996e-05, -1.6906840755837038e-05, -1.657844586588908e-05, -1.625005097594112e-05, -1.592165426700376e-05, -1.5593261196045205e-05, -1.5264864487107843e-05, -1.4936470506654587e-05, -1.4608075616706628e-05, -1.427968072675867e-05, -1.395128492731601e-05, -1.3622890037368052e-05, -1.3294495147420093e-05, -1.2966100257472135e-05, -1.2637705367524177e-05, -1.2309310477576219e-05, -1.198091558762826e-05, -1.1652520697680302e-05, -1.1324125807732344e-05, -1.0995730008289684e-05, -1.0667335118341725e-05, -1.0338940228393767e-05, -1.0010545338445809e-05, -9.68215044849785e-06, -9.353755558549892e-06, -9.025360668601934e-06, -8.696964869159274e-06, -8.368569979211316e-06, -8.040175089263357e-06, -7.711780199315399e-06, -7.383385309367441e-06, -7.054989509924781e-06, -6.726594619976822e-06, -6.398199275281513e-06, -6.069804385333555e-06, -5.741409040638246e-06, -5.413014150690287e-06, -5.084619260742329e-06, -4.756224370794371e-06, -4.427829026099062e-06, -4.099434136151103e-06, -3.771038791455794e-06, -3.442643901507836e-06, -3.114248784186202e-06, -2.7858536668645684e-06, -2.45745877691661e-06, -2.1290636595949763e-06, -1.800668769647018e-06, -1.4722736523253843e-06, -1.1438786486905883e-06, -8.154836450557923e-07, -4.870885277341586e-07, -1.5869341041252483e-07, 1.6970147953543346e-07, 4.980965968570672e-07, 8.264917710221198e-07]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 9.0, 0.0, 9.0, 0.0, 0.0, 8.0, 0.0, 24.0, 0.0, 0.0, 28.0, 0.0, 56.0, 0.0, 0.0, 118.0, 0.0, 135.0, 0.0, 0.0, 217.0, 0.0, 145.0, 0.0, 0.0, 102.0, 0.0, 63.0, 0.0, 44.0, 0.0, 0.0, 26.0, 0.0, 9.0, 0.0, 0.0, 4.0, 0.0, 9.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.556510925292969e-07, -6.314367055892944e-07, -6.07222318649292e-07, -5.830079317092896e-07, -5.587935447692871e-07, -5.345791578292847e-07, -5.103647708892822e-07, -4.861503839492798e-07, -4.6193599700927734e-07, -4.377216100692749e-07, -4.1350722312927246e-07, -3.8929283618927e-07, -3.650784492492676e-07, -3.4086406230926514e-07, -3.166496753692627e-07, -2.9243528842926025e-07, -2.682209014892578e-07, -2.4400651454925537e-07, -2.1979212760925293e-07, -1.955777406692505e-07, -1.7136335372924805e-07, -1.471489667892456e-07, -1.2293457984924316e-07, -9.872019290924072e-08, -7.450580596923828e-08, -5.029141902923584e-08, -2.60770320892334e-08, -1.862645149230957e-09, 2.2351741790771484e-08, 4.6566128730773926e-08, 7.078051567077637e-08, 9.499490261077881e-08, 1.1920928955078125e-07, 1.434236764907837e-07, 1.6763806343078613e-07, 1.9185245037078857e-07, 2.1606683731079102e-07, 2.4028122425079346e-07, 2.644956111907959e-07, 2.8870999813079834e-07, 3.129243850708008e-07, 3.371387720108032e-07, 3.6135315895080566e-07, 3.855675458908081e-07, 4.0978193283081055e-07, 4.33996319770813e-07, 4.5821070671081543e-07, 4.824250936508179e-07, 5.066394805908203e-07, 5.308538675308228e-07, 5.550682544708252e-07, 5.792826414108276e-07, 6.034970283508301e-07, 6.277114152908325e-07, 6.51925802230835e-07, 6.761401891708374e-07, 7.003545761108398e-07, 7.245689630508423e-07, 7.487833499908447e-07, 7.729977369308472e-07, 7.972121238708496e-07, 8.21426510810852e-07, 8.456408977508545e-07, 8.698552846908569e-07, 8.940696716308594e-07]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 6.0, 14.0, 10.0, 14.0, 18.0, 22.0, 24.0, 25.0, 32.0, 29.0, 34.0, 42.0, 43.0, 44.0, 56.0, 47.0, 58.0, 49.0, 64.0, 54.0, 46.0, 47.0, 35.0, 24.0, 28.0, 24.0, 32.0, 16.0, 13.0, 18.0, 9.0, 6.0, 3.0, 6.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.44921875, -3.3319091796875, -3.214599609375, -3.0972900390625, -2.97998046875, -2.8626708984375, -2.745361328125, -2.6280517578125, -2.5107421875, -2.3934326171875, -2.276123046875, -2.1588134765625, -2.04150390625, -1.9241943359375, -1.806884765625, -1.6895751953125, -1.572265625, -1.4549560546875, -1.337646484375, -1.2203369140625, -1.10302734375, -0.9857177734375, -0.868408203125, -0.7510986328125, -0.6337890625, -0.5164794921875, -0.399169921875, -0.2818603515625, -0.16455078125, -0.0472412109375, 0.070068359375, 0.1873779296875, 0.3046875, 0.4219970703125, 0.539306640625, 0.6566162109375, 0.77392578125, 0.8912353515625, 1.008544921875, 1.1258544921875, 1.2431640625, 1.3604736328125, 1.477783203125, 1.5950927734375, 1.71240234375, 1.8297119140625, 1.947021484375, 2.0643310546875, 2.181640625, 2.2989501953125, 2.416259765625, 2.5335693359375, 2.65087890625, 2.7681884765625, 2.885498046875, 3.0028076171875, 3.1201171875, 3.2374267578125, 3.354736328125, 3.4720458984375, 3.58935546875, 3.7066650390625, 3.823974609375, 3.9412841796875, 4.05859375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 8.0, 5.0, 15.0, 10.0, 16.0, 26.0, 32.0, 45.0, 69.0, 92.0, 140.0, 191.0, 300.0, 399.0, 554.0, 844.0, 1158.0, 1669.0, 2348.0, 3672.0, 5827.0, 10050.0, 18897.0, 40409.0, 94434.0, 238008.0, 356344.0, 148276.0, 61579.0, 27751.0, 13649.0, 7614.0, 4629.0, 2964.0, 1931.0, 1351.0, 1006.0, 644.0, 464.0, 333.0, 231.0, 175.0, 141.0, 81.0, 59.0, 43.0, 28.0, 19.0, 6.0, 12.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.12890625, -3.025482177734375, -2.92205810546875, -2.818634033203125, -2.7152099609375, -2.611785888671875, -2.50836181640625, -2.404937744140625, -2.301513671875, -2.198089599609375, -2.09466552734375, -1.991241455078125, -1.8878173828125, -1.784393310546875, -1.68096923828125, -1.577545166015625, -1.47412109375, -1.370697021484375, -1.26727294921875, -1.163848876953125, -1.0604248046875, -0.957000732421875, -0.85357666015625, -0.750152587890625, -0.646728515625, -0.543304443359375, -0.43988037109375, -0.336456298828125, -0.2330322265625, -0.129608154296875, -0.02618408203125, 0.077239990234375, 0.1806640625, 0.284088134765625, 0.38751220703125, 0.490936279296875, 0.5943603515625, 0.697784423828125, 0.80120849609375, 0.904632568359375, 1.008056640625, 1.111480712890625, 1.21490478515625, 1.318328857421875, 1.4217529296875, 1.525177001953125, 1.62860107421875, 1.732025146484375, 1.83544921875, 1.938873291015625, 2.04229736328125, 2.145721435546875, 2.2491455078125, 2.352569580078125, 2.45599365234375, 2.559417724609375, 2.662841796875, 2.766265869140625, 2.86968994140625, 2.973114013671875, 3.0765380859375, 3.179962158203125, 3.28338623046875, 3.386810302734375, 3.490234375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 3.0, 13.0, 9.0, 13.0, 10.0, 21.0, 19.0, 19.0, 27.0, 37.0, 42.0, 46.0, 50.0, 68.0, 115.0, 223.0, 1547.0, 278.0, 110.0, 59.0, 54.0, 46.0, 40.0, 35.0, 37.0, 28.0, 22.0, 20.0, 11.0, 14.0, 6.0, 13.0, 4.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6328125, -10.260986328125, -9.88916015625, -9.517333984375, -9.1455078125, -8.773681640625, -8.40185546875, -8.030029296875, -7.658203125, -7.286376953125, -6.91455078125, -6.542724609375, -6.1708984375, -5.799072265625, -5.42724609375, -5.055419921875, -4.68359375, -4.311767578125, -3.93994140625, -3.568115234375, -3.1962890625, -2.824462890625, -2.45263671875, -2.080810546875, -1.708984375, -1.337158203125, -0.96533203125, -0.593505859375, -0.2216796875, 0.150146484375, 0.52197265625, 0.893798828125, 1.265625, 1.637451171875, 2.00927734375, 2.381103515625, 2.7529296875, 3.124755859375, 3.49658203125, 3.868408203125, 4.240234375, 4.612060546875, 4.98388671875, 5.355712890625, 5.7275390625, 6.099365234375, 6.47119140625, 6.843017578125, 7.21484375, 7.586669921875, 7.95849609375, 8.330322265625, 8.7021484375, 9.073974609375, 9.44580078125, 9.817626953125, 10.189453125, 10.561279296875, 10.93310546875, 11.304931640625, 11.6767578125, 12.048583984375, 12.42041015625, 12.792236328125, 13.1640625]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 4.0, 2.0, 6.0, 13.0, 14.0, 20.0, 30.0, 37.0, 50.0, 77.0, 122.0, 185.0, 302.0, 698.0, 2484.0, 18169.0, 2705061.0, 407408.0, 8242.0, 1570.0, 478.0, 252.0, 159.0, 95.0, 59.0, 40.0, 29.0, 30.0, 19.0, 16.0, 9.0, 6.0, 8.0, 1.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.40625, -19.744384765625, -19.08251953125, -18.420654296875, -17.7587890625, -17.096923828125, -16.43505859375, -15.773193359375, -15.111328125, -14.449462890625, -13.78759765625, -13.125732421875, -12.4638671875, -11.802001953125, -11.14013671875, -10.478271484375, -9.81640625, -9.154541015625, -8.49267578125, -7.830810546875, -7.1689453125, -6.507080078125, -5.84521484375, -5.183349609375, -4.521484375, -3.859619140625, -3.19775390625, -2.535888671875, -1.8740234375, -1.212158203125, -0.55029296875, 0.111572265625, 0.7734375, 1.435302734375, 2.09716796875, 2.759033203125, 3.4208984375, 4.082763671875, 4.74462890625, 5.406494140625, 6.068359375, 6.730224609375, 7.39208984375, 8.053955078125, 8.7158203125, 9.377685546875, 10.03955078125, 10.701416015625, 11.36328125, 12.025146484375, 12.68701171875, 13.348876953125, 14.0107421875, 14.672607421875, 15.33447265625, 15.996337890625, 16.658203125, 17.320068359375, 17.98193359375, 18.643798828125, 19.3056640625, 19.967529296875, 20.62939453125, 21.291259765625, 21.953125]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 329.0, 688.0], "bins": [-439.1383972167969, -432.17840576171875, -425.2184143066406, -418.2584228515625, -411.2984619140625, -404.3384704589844, -397.37847900390625, -390.4184875488281, -383.45849609375, -376.4985046386719, -369.53851318359375, -362.57855224609375, -355.6185607910156, -348.6585693359375, -341.6985778808594, -334.73858642578125, -327.77862548828125, -320.8186340332031, -313.858642578125, -306.898681640625, -299.9386901855469, -292.97869873046875, -286.0187072753906, -279.0587158203125, -272.0987243652344, -265.13873291015625, -258.1787414550781, -251.21876525878906, -244.25877380371094, -237.29879760742188, -230.33880615234375, -223.37881469726562, -216.41883850097656, -209.45884704589844, -202.49887084960938, -195.53887939453125, -188.57888793945312, -181.618896484375, -174.65892028808594, -167.6989288330078, -160.7389373779297, -153.77894592285156, -146.8189697265625, -139.85897827148438, -132.89898681640625, -125.93900299072266, -118.97901916503906, -112.01902770996094, -105.05905151367188, -98.09906768798828, -91.13907623291016, -84.17909240722656, -77.21910095214844, -70.25911712646484, -63.29913330078125, -56.33914566040039, -49.37915802001953, -42.41917037963867, -35.45918273925781, -28.49919891357422, -21.53921127319336, -14.5792236328125, -7.619239807128906, -0.6592521667480469, 6.300736904144287]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 4.0, 7.0, 5.0, 7.0, 10.0, 12.0, 21.0, 22.0, 25.0, 16.0, 24.0, 22.0, 34.0, 26.0, 34.0, 48.0, 43.0, 42.0, 53.0, 42.0, 43.0, 60.0, 38.0, 42.0, 38.0, 36.0, 39.0, 31.0, 29.0, 26.0, 22.0, 21.0, 12.0, 16.0, 12.0, 10.0, 10.0, 4.0, 5.0, 8.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.695337295532227, -28.728042602539062, -27.760746002197266, -26.79344940185547, -25.826154708862305, -24.85886001586914, -23.891563415527344, -22.924266815185547, -21.956972122192383, -20.98967742919922, -20.022380828857422, -19.055084228515625, -18.08778953552246, -17.120494842529297, -16.1531982421875, -15.18590259552002, -14.218606948852539, -13.251311302185059, -12.284015655517578, -11.316720008850098, -10.349424362182617, -9.382128715515137, -8.414833068847656, -7.447537422180176, -6.480241775512695, -5.512946128845215, -4.545650482177734, -3.578354835510254, -2.6110591888427734, -1.643763542175293, -0.6764678955078125, 0.29082775115966797, 1.2581253051757812, 2.2254209518432617, 3.192716598510742, 4.160012245178223, 5.127307891845703, 6.094603538513184, 7.061899185180664, 8.029194831848145, 8.996490478515625, 9.963786125183105, 10.931081771850586, 11.898377418518066, 12.865673065185547, 13.832968711853027, 14.800264358520508, 15.767560005187988, 16.73485565185547, 17.702152252197266, 18.66944694519043, 19.636741638183594, 20.60403823852539, 21.571334838867188, 22.53862953186035, 23.505924224853516, 24.473220825195312, 25.44051742553711, 26.407812118530273, 27.375106811523438, 28.342403411865234, 29.30970001220703, 30.276994705200195, 31.24428939819336, 32.211585998535156]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 10.0, 9.0, 14.0, 11.0, 21.0, 24.0, 30.0, 37.0, 32.0, 41.0, 35.0, 51.0, 50.0, 54.0, 41.0, 54.0, 63.0, 61.0, 55.0, 46.0, 37.0, 44.0, 27.0, 30.0, 26.0, 23.0, 16.0, 17.0, 12.0, 6.0, 7.0, 3.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.751953125, -3.628204345703125, -3.50445556640625, -3.380706787109375, -3.2569580078125, -3.133209228515625, -3.00946044921875, -2.885711669921875, -2.761962890625, -2.638214111328125, -2.51446533203125, -2.390716552734375, -2.2669677734375, -2.143218994140625, -2.01947021484375, -1.895721435546875, -1.77197265625, -1.648223876953125, -1.52447509765625, -1.400726318359375, -1.2769775390625, -1.153228759765625, -1.02947998046875, -0.905731201171875, -0.781982421875, -0.658233642578125, -0.53448486328125, -0.410736083984375, -0.2869873046875, -0.163238525390625, -0.03948974609375, 0.084259033203125, 0.2080078125, 0.331756591796875, 0.45550537109375, 0.579254150390625, 0.7030029296875, 0.826751708984375, 0.95050048828125, 1.074249267578125, 1.197998046875, 1.321746826171875, 1.44549560546875, 1.569244384765625, 1.6929931640625, 1.816741943359375, 1.94049072265625, 2.064239501953125, 2.18798828125, 2.311737060546875, 2.43548583984375, 2.559234619140625, 2.6829833984375, 2.806732177734375, 2.93048095703125, 3.054229736328125, 3.177978515625, 3.301727294921875, 3.42547607421875, 3.549224853515625, 3.6729736328125, 3.796722412109375, 3.92047119140625, 4.044219970703125, 4.16796875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 4.0, 4.0, 3.0, 6.0, 6.0, 11.0, 22.0, 28.0, 35.0, 52.0, 60.0, 92.0, 155.0, 249.0, 409.0, 639.0, 1094.0, 2062.0, 4024.0, 8969.0, 22586.0, 66099.0, 239046.0, 1041899.0, 1971188.0, 614388.0, 147739.0, 44116.0, 15903.0, 6488.0, 3049.0, 1554.0, 864.0, 519.0, 328.0, 183.0, 130.0, 81.0, 51.0, 52.0, 22.0, 28.0, 10.0, 12.0, 7.0, 2.0, 8.0, 5.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.05859375, -5.87677001953125, -5.6949462890625, -5.51312255859375, -5.331298828125, -5.14947509765625, -4.9676513671875, -4.78582763671875, -4.60400390625, -4.42218017578125, -4.2403564453125, -4.05853271484375, -3.876708984375, -3.69488525390625, -3.5130615234375, -3.33123779296875, -3.1494140625, -2.96759033203125, -2.7857666015625, -2.60394287109375, -2.422119140625, -2.24029541015625, -2.0584716796875, -1.87664794921875, -1.69482421875, -1.51300048828125, -1.3311767578125, -1.14935302734375, -0.967529296875, -0.78570556640625, -0.6038818359375, -0.42205810546875, -0.240234375, -0.05841064453125, 0.1234130859375, 0.30523681640625, 0.487060546875, 0.66888427734375, 0.8507080078125, 1.03253173828125, 1.21435546875, 1.39617919921875, 1.5780029296875, 1.75982666015625, 1.941650390625, 2.12347412109375, 2.3052978515625, 2.48712158203125, 2.6689453125, 2.85076904296875, 3.0325927734375, 3.21441650390625, 3.396240234375, 3.57806396484375, 3.7598876953125, 3.94171142578125, 4.12353515625, 4.30535888671875, 4.4871826171875, 4.66900634765625, 4.850830078125, 5.03265380859375, 5.2144775390625, 5.39630126953125, 5.578125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 6.0, 5.0, 9.0, 11.0, 18.0, 12.0, 26.0, 35.0, 36.0, 43.0, 66.0, 63.0, 115.0, 130.0, 174.0, 227.0, 250.0, 322.0, 401.0, 399.0, 346.0, 284.0, 247.0, 189.0, 160.0, 117.0, 95.0, 70.0, 52.0, 41.0, 30.0, 19.0, 24.0, 15.0, 10.0, 8.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.28515625, -6.1162109375, -5.947265625, -5.7783203125, -5.609375, -5.4404296875, -5.271484375, -5.1025390625, -4.93359375, -4.7646484375, -4.595703125, -4.4267578125, -4.2578125, -4.0888671875, -3.919921875, -3.7509765625, -3.58203125, -3.4130859375, -3.244140625, -3.0751953125, -2.90625, -2.7373046875, -2.568359375, -2.3994140625, -2.23046875, -2.0615234375, -1.892578125, -1.7236328125, -1.5546875, -1.3857421875, -1.216796875, -1.0478515625, -0.87890625, -0.7099609375, -0.541015625, -0.3720703125, -0.203125, -0.0341796875, 0.134765625, 0.3037109375, 0.47265625, 0.6416015625, 0.810546875, 0.9794921875, 1.1484375, 1.3173828125, 1.486328125, 1.6552734375, 1.82421875, 1.9931640625, 2.162109375, 2.3310546875, 2.5, 2.6689453125, 2.837890625, 3.0068359375, 3.17578125, 3.3447265625, 3.513671875, 3.6826171875, 3.8515625, 4.0205078125, 4.189453125, 4.3583984375, 4.52734375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 11.0, 13.0, 19.0, 15.0, 28.0, 30.0, 39.0, 57.0, 70.0, 115.0, 157.0, 194.0, 385.0, 947.0, 5814.0, 121376.0, 3559243.0, 488899.0, 13935.0, 1604.0, 439.0, 254.0, 156.0, 119.0, 72.0, 64.0, 48.0, 40.0, 35.0, 21.0, 21.0, 11.0, 12.0, 6.0, 6.0, 4.0, 2.0, 5.0, 4.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.015625, -18.27490234375, -17.5341796875, -16.79345703125, -16.052734375, -15.31201171875, -14.5712890625, -13.83056640625, -13.08984375, -12.34912109375, -11.6083984375, -10.86767578125, -10.126953125, -9.38623046875, -8.6455078125, -7.90478515625, -7.1640625, -6.42333984375, -5.6826171875, -4.94189453125, -4.201171875, -3.46044921875, -2.7197265625, -1.97900390625, -1.23828125, -0.49755859375, 0.2431640625, 0.98388671875, 1.724609375, 2.46533203125, 3.2060546875, 3.94677734375, 4.6875, 5.42822265625, 6.1689453125, 6.90966796875, 7.650390625, 8.39111328125, 9.1318359375, 9.87255859375, 10.61328125, 11.35400390625, 12.0947265625, 12.83544921875, 13.576171875, 14.31689453125, 15.0576171875, 15.79833984375, 16.5390625, 17.27978515625, 18.0205078125, 18.76123046875, 19.501953125, 20.24267578125, 20.9833984375, 21.72412109375, 22.46484375, 23.20556640625, 23.9462890625, 24.68701171875, 25.427734375, 26.16845703125, 26.9091796875, 27.64990234375, 28.390625]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 8.0, 10.0, 7.0, 21.0, 34.0, 70.0, 67.0, 81.0, 97.0, 127.0, 116.0, 107.0, 84.0, 62.0, 44.0, 29.0, 22.0, 17.0, 8.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.76214027404785, -21.62501335144043, -20.487886428833008, -19.350759506225586, -18.213634490966797, -17.076507568359375, -15.939380645751953, -14.802253723144531, -13.66512680053711, -12.527999877929688, -11.390872955322266, -10.25374698638916, -9.116620063781738, -7.979493141174316, -6.842366695404053, -5.705240249633789, -4.568113327026367, -3.4309866428375244, -2.2938599586486816, -1.1567332744598389, -0.019606590270996094, 1.1175203323364258, 2.2546467781066895, 3.391773223876953, 4.528900146484375, 5.666027069091797, 6.8031535148620605, 7.940279960632324, 9.077406883239746, 10.214533805847168, 11.351659774780273, 12.488786697387695, 13.625911712646484, 14.763038635253906, 15.900165557861328, 17.03729248046875, 18.174419403076172, 19.311546325683594, 20.448671340942383, 21.585798263549805, 22.722925186157227, 23.86005210876465, 24.99717903137207, 26.134305953979492, 27.27143096923828, 28.408557891845703, 29.545684814453125, 30.682811737060547, 31.81993865966797, 32.95706558227539, 34.09419250488281, 35.231319427490234, 36.368446350097656, 37.50557327270508, 38.6427001953125, 39.779823303222656, 40.916954040527344, 42.054080963134766, 43.19120788574219, 44.32833480834961, 45.46546173095703, 46.60258865356445, 47.739715576171875, 48.87683868408203, 50.01396560668945]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 6.0, 4.0, 6.0, 13.0, 7.0, 14.0, 8.0, 25.0, 22.0, 28.0, 25.0, 26.0, 23.0, 32.0, 38.0, 50.0, 53.0, 44.0, 47.0, 43.0, 43.0, 48.0, 40.0, 39.0, 35.0, 31.0, 31.0, 30.0, 29.0, 27.0, 30.0, 24.0, 20.0, 17.0, 10.0, 11.0, 8.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0], "bins": [-24.647010803222656, -23.960922241210938, -23.27483367919922, -22.5887451171875, -21.90265655517578, -21.21656608581543, -20.53047752380371, -19.844388961791992, -19.158300399780273, -18.472211837768555, -17.786123275756836, -17.100034713745117, -16.413944244384766, -15.727856636047363, -15.041767120361328, -14.35567855834961, -13.66958999633789, -12.983501434326172, -12.297412872314453, -11.611323356628418, -10.9252347946167, -10.23914623260498, -9.553056716918945, -8.866968154907227, -8.180879592895508, -7.494791030883789, -6.808701992034912, -6.122612953186035, -5.436524391174316, -4.750435829162598, -4.064346790313721, -3.3782577514648438, -2.692169189453125, -2.006080389022827, -1.3199915885925293, -0.6339027881622314, 0.052186012268066406, 0.7382748126983643, 1.424363613128662, 2.110452651977539, 2.796541213989258, 3.4826300144195557, 4.1687188148498535, 4.8548078536987305, 5.540896415710449, 6.226984977722168, 6.913074016571045, 7.599163055419922, 8.28525161743164, 8.97134017944336, 9.657428741455078, 10.343518257141113, 11.029606819152832, 11.71569538116455, 12.401784896850586, 13.087873458862305, 13.773962020874023, 14.460050582885742, 15.146139144897461, 15.832228660583496, 16.51831817626953, 17.20440673828125, 17.89049530029297, 18.576583862304688, 19.262672424316406]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 5.0, 5.0, 11.0, 8.0, 12.0, 19.0, 26.0, 28.0, 29.0, 35.0, 42.0, 44.0, 38.0, 47.0, 52.0, 46.0, 58.0, 45.0, 57.0, 57.0, 49.0, 35.0, 40.0, 40.0, 34.0, 26.0, 26.0, 20.0, 26.0, 5.0, 15.0, 4.0, 7.0, 5.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.798828125, -3.675811767578125, -3.55279541015625, -3.429779052734375, -3.3067626953125, -3.183746337890625, -3.06072998046875, -2.937713623046875, -2.814697265625, -2.691680908203125, -2.56866455078125, -2.445648193359375, -2.3226318359375, -2.199615478515625, -2.07659912109375, -1.953582763671875, -1.83056640625, -1.707550048828125, -1.58453369140625, -1.461517333984375, -1.3385009765625, -1.215484619140625, -1.09246826171875, -0.969451904296875, -0.846435546875, -0.723419189453125, -0.60040283203125, -0.477386474609375, -0.3543701171875, -0.231353759765625, -0.10833740234375, 0.014678955078125, 0.1376953125, 0.260711669921875, 0.38372802734375, 0.506744384765625, 0.6297607421875, 0.752777099609375, 0.87579345703125, 0.998809814453125, 1.121826171875, 1.244842529296875, 1.36785888671875, 1.490875244140625, 1.6138916015625, 1.736907958984375, 1.85992431640625, 1.982940673828125, 2.10595703125, 2.228973388671875, 2.35198974609375, 2.475006103515625, 2.5980224609375, 2.721038818359375, 2.84405517578125, 2.967071533203125, 3.090087890625, 3.213104248046875, 3.33612060546875, 3.459136962890625, 3.5821533203125, 3.705169677734375, 3.82818603515625, 3.951202392578125, 4.07421875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 13.0, 5.0, 6.0, 8.0, 16.0, 24.0, 31.0, 49.0, 67.0, 83.0, 157.0, 213.0, 311.0, 508.0, 802.0, 1224.0, 1862.0, 2806.0, 4532.0, 7057.0, 11148.0, 17907.0, 29474.0, 49576.0, 86947.0, 163233.0, 275186.0, 172044.0, 91017.0, 51166.0, 30430.0, 18637.0, 11614.0, 7277.0, 4653.0, 2975.0, 1952.0, 1204.0, 772.0, 496.0, 342.0, 233.0, 172.0, 104.0, 56.0, 38.0, 39.0, 18.0, 14.0, 18.0, 6.0, 8.0, 7.0, 6.0, 6.0, 2.0, 6.0], "bins": [-0.024810791015625, -0.02407097816467285, -0.023331165313720703, -0.022591352462768555, -0.021851539611816406, -0.021111726760864258, -0.02037191390991211, -0.01963210105895996, -0.018892288208007812, -0.018152475357055664, -0.017412662506103516, -0.016672849655151367, -0.01593303680419922, -0.01519322395324707, -0.014453411102294922, -0.013713598251342773, -0.012973785400390625, -0.012233972549438477, -0.011494159698486328, -0.01075434684753418, -0.010014533996582031, -0.009274721145629883, -0.008534908294677734, -0.007795095443725586, -0.0070552825927734375, -0.006315469741821289, -0.005575656890869141, -0.004835844039916992, -0.004096031188964844, -0.0033562183380126953, -0.002616405487060547, -0.0018765926361083984, -0.00113677978515625, -0.00039696693420410156, 0.0003428459167480469, 0.0010826587677001953, 0.0018224716186523438, 0.002562284469604492, 0.0033020973205566406, 0.004041910171508789, 0.0047817230224609375, 0.005521535873413086, 0.006261348724365234, 0.007001161575317383, 0.007740974426269531, 0.00848078727722168, 0.009220600128173828, 0.009960412979125977, 0.010700225830078125, 0.011440038681030273, 0.012179851531982422, 0.01291966438293457, 0.013659477233886719, 0.014399290084838867, 0.015139102935791016, 0.015878915786743164, 0.016618728637695312, 0.01735854148864746, 0.01809835433959961, 0.018838167190551758, 0.019577980041503906, 0.020317792892456055, 0.021057605743408203, 0.02179741859436035, 0.0225372314453125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 12.0, 8.0, 9.0, 10.0, 11.0, 21.0, 17.0, 22.0, 16.0, 27.0, 32.0, 34.0, 27.0, 28.0, 28.0, 43.0, 31.0, 46.0, 32.0, 1064.0, 50.0, 33.0, 40.0, 43.0, 38.0, 35.0, 38.0, 35.0, 35.0, 28.0, 20.0, 16.0, 9.0, 15.0, 6.0, 11.0, 10.0, 13.0, 4.0, 4.0, 5.0, 7.0, 0.0, 6.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.3671875, -2.291900634765625, -2.21661376953125, -2.141326904296875, -2.0660400390625, -1.990753173828125, -1.91546630859375, -1.840179443359375, -1.764892578125, -1.689605712890625, -1.61431884765625, -1.539031982421875, -1.4637451171875, -1.388458251953125, -1.31317138671875, -1.237884521484375, -1.16259765625, -1.087310791015625, -1.01202392578125, -0.936737060546875, -0.8614501953125, -0.786163330078125, -0.71087646484375, -0.635589599609375, -0.560302734375, -0.485015869140625, -0.40972900390625, -0.334442138671875, -0.2591552734375, -0.183868408203125, -0.10858154296875, -0.033294677734375, 0.0419921875, 0.117279052734375, 0.19256591796875, 0.267852783203125, 0.3431396484375, 0.418426513671875, 0.49371337890625, 0.569000244140625, 0.644287109375, 0.719573974609375, 0.79486083984375, 0.870147705078125, 0.9454345703125, 1.020721435546875, 1.09600830078125, 1.171295166015625, 1.24658203125, 1.321868896484375, 1.39715576171875, 1.472442626953125, 1.5477294921875, 1.623016357421875, 1.69830322265625, 1.773590087890625, 1.848876953125, 1.924163818359375, 1.99945068359375, 2.074737548828125, 2.1500244140625, 2.225311279296875, 2.30059814453125, 2.375885009765625, 2.451171875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 9.0, 10.0, 11.0, 20.0, 27.0, 41.0, 68.0, 86.0, 121.0, 175.0, 222.0, 336.0, 450.0, 668.0, 918.0, 1316.0, 1833.0, 2817.0, 3912.0, 5582.0, 8288.0, 12186.0, 18050.0, 26571.0, 39912.0, 59659.0, 91103.0, 137263.0, 1230176.0, 150792.0, 101191.0, 66533.0, 44202.0, 29576.0, 19849.0, 13494.0, 9096.0, 6249.0, 4319.0, 2999.0, 2105.0, 1470.0, 1009.0, 726.0, 536.0, 338.0, 246.0, 156.0, 131.0, 91.0, 74.0, 39.0, 28.0, 22.0, 11.0, 16.0, 7.0, 4.0, 3.0, 2.0], "bins": [-0.00789642333984375, -0.007654428482055664, -0.007412433624267578, -0.007170438766479492, -0.006928443908691406, -0.00668644905090332, -0.006444454193115234, -0.0062024593353271484, -0.0059604644775390625, -0.0057184696197509766, -0.005476474761962891, -0.005234479904174805, -0.004992485046386719, -0.004750490188598633, -0.004508495330810547, -0.004266500473022461, -0.004024505615234375, -0.003782510757446289, -0.003540515899658203, -0.003298521041870117, -0.0030565261840820312, -0.0028145313262939453, -0.0025725364685058594, -0.0023305416107177734, -0.0020885467529296875, -0.0018465518951416016, -0.0016045570373535156, -0.0013625621795654297, -0.0011205673217773438, -0.0008785724639892578, -0.0006365776062011719, -0.00039458274841308594, -0.000152587890625, 8.940696716308594e-05, 0.0003314018249511719, 0.0005733966827392578, 0.0008153915405273438, 0.0010573863983154297, 0.0012993812561035156, 0.0015413761138916016, 0.0017833709716796875, 0.0020253658294677734, 0.0022673606872558594, 0.0025093555450439453, 0.0027513504028320312, 0.002993345260620117, 0.003235340118408203, 0.003477334976196289, 0.003719329833984375, 0.003961324691772461, 0.004203319549560547, 0.004445314407348633, 0.004687309265136719, 0.004929304122924805, 0.005171298980712891, 0.0054132938385009766, 0.0056552886962890625, 0.0058972835540771484, 0.006139278411865234, 0.00638127326965332, 0.006623268127441406, 0.006865262985229492, 0.007107257843017578, 0.007349252700805664, 0.00759124755859375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 0.0, 5.0, 0.0, 16.0, 0.0, 12.0, 0.0, 17.0, 16.0, 0.0, 35.0, 0.0, 41.0, 0.0, 50.0, 65.0, 0.0, 139.0, 0.0, 212.0, 0.0, 142.0, 0.0, 92.0, 42.0, 0.0, 39.0, 0.0, 21.0, 0.0, 28.0, 8.0, 0.0, 6.0, 0.0, 6.0, 0.0, 1.0, 0.0, 5.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5367431640625e-07, -9.201467037200928e-07, -8.866190910339355e-07, -8.530914783477783e-07, -8.195638656616211e-07, -7.860362529754639e-07, -7.525086402893066e-07, -7.189810276031494e-07, -6.854534149169922e-07, -6.51925802230835e-07, -6.183981895446777e-07, -5.848705768585205e-07, -5.513429641723633e-07, -5.178153514862061e-07, -4.842877388000488e-07, -4.507601261138916e-07, -4.172325134277344e-07, -3.8370490074157715e-07, -3.501772880554199e-07, -3.166496753692627e-07, -2.8312206268310547e-07, -2.4959444999694824e-07, -2.1606683731079102e-07, -1.825392246246338e-07, -1.4901161193847656e-07, -1.1548399925231934e-07, -8.195638656616211e-08, -4.842877388000488e-08, -1.4901161193847656e-08, 1.862645149230957e-08, 5.21540641784668e-08, 8.568167686462402e-08, 1.1920928955078125e-07, 1.5273690223693848e-07, 1.862645149230957e-07, 2.1979212760925293e-07, 2.5331974029541016e-07, 2.868473529815674e-07, 3.203749656677246e-07, 3.5390257835388184e-07, 3.8743019104003906e-07, 4.209578037261963e-07, 4.544854164123535e-07, 4.880130290985107e-07, 5.21540641784668e-07, 5.550682544708252e-07, 5.885958671569824e-07, 6.221234798431396e-07, 6.556510925292969e-07, 6.891787052154541e-07, 7.227063179016113e-07, 7.562339305877686e-07, 7.897615432739258e-07, 8.23289155960083e-07, 8.568167686462402e-07, 8.903443813323975e-07, 9.238719940185547e-07, 9.57399606704712e-07, 9.909272193908691e-07, 1.0244548320770264e-06, 1.0579824447631836e-06, 1.0915100574493408e-06, 1.125037670135498e-06, 1.1585652828216553e-06, 1.1920928955078125e-06]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 5.0, 5.0, 8.0, 7.0, 15.0, 21.0, 22.0, 36.0, 45.0, 87.0, 168.0, 344.0, 2435.0, 215796.0, 822799.0, 5768.0, 466.0, 172.0, 92.0, 68.0, 47.0, 20.0, 26.0, 13.0, 10.0, 15.0, 4.0, 6.0, 9.0, 9.0, 8.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-2.580881118774414e-05, -2.5093555450439453e-05, -2.4378299713134766e-05, -2.3663043975830078e-05, -2.294778823852539e-05, -2.2232532501220703e-05, -2.1517276763916016e-05, -2.0802021026611328e-05, -2.008676528930664e-05, -1.9371509552001953e-05, -1.8656253814697266e-05, -1.7940998077392578e-05, -1.722574234008789e-05, -1.6510486602783203e-05, -1.5795230865478516e-05, -1.5079975128173828e-05, -1.436471939086914e-05, -1.3649463653564453e-05, -1.2934207916259766e-05, -1.2218952178955078e-05, -1.150369644165039e-05, -1.0788440704345703e-05, -1.0073184967041016e-05, -9.357929229736328e-06, -8.64267349243164e-06, -7.927417755126953e-06, -7.212162017822266e-06, -6.496906280517578e-06, -5.781650543212891e-06, -5.066394805908203e-06, -4.351139068603516e-06, -3.635883331298828e-06, -2.9206275939941406e-06, -2.205371856689453e-06, -1.4901161193847656e-06, -7.748603820800781e-07, -5.960464477539063e-08, 6.556510925292969e-07, 1.3709068298339844e-06, 2.086162567138672e-06, 2.8014183044433594e-06, 3.516674041748047e-06, 4.231929779052734e-06, 4.947185516357422e-06, 5.662441253662109e-06, 6.377696990966797e-06, 7.092952728271484e-06, 7.808208465576172e-06, 8.52346420288086e-06, 9.238719940185547e-06, 9.953975677490234e-06, 1.0669231414794922e-05, 1.138448715209961e-05, 1.2099742889404297e-05, 1.2814998626708984e-05, 1.3530254364013672e-05, 1.424551010131836e-05, 1.4960765838623047e-05, 1.5676021575927734e-05, 1.6391277313232422e-05, 1.710653305053711e-05, 1.7821788787841797e-05, 1.8537044525146484e-05, 1.9252300262451172e-05, 1.996755599975586e-05]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 9.0, 36.0, 129.0, 375.0, 321.0, 122.0, 19.0, 5.0, 4.0], "bins": [-6.3115667217061855e-06, -6.2043445723247714e-06, -6.097122422943357e-06, -5.989900728309294e-06, -5.88267857892788e-06, -5.775456429546466e-06, -5.668234280165052e-06, -5.561012585530989e-06, -5.453790436149575e-06, -5.346568286768161e-06, -5.239346137386747e-06, -5.1321244427526835e-06, -5.0249022933712695e-06, -4.9176801439898554e-06, -4.810457994608441e-06, -4.703236299974378e-06, -4.596014150592964e-06, -4.48879200121155e-06, -4.381569851830136e-06, -4.274348157196073e-06, -4.167126007814659e-06, -4.059903858433245e-06, -3.952681709051831e-06, -3.8454600144177675e-06, -3.738237637662678e-06, -3.631015488281264e-06, -3.5237935662735254e-06, -3.4165714168921113e-06, -3.3093494948843727e-06, -3.2021273455029586e-06, -3.09490542349522e-06, -2.987683274113806e-06, -2.8804613521060674e-06, -2.7732392027246533e-06, -2.6660172807169147e-06, -2.5587951313355006e-06, -2.451573209327762e-06, -2.344351059946348e-06, -2.2371291379386093e-06, -2.1299069885571953e-06, -2.0226848391757812e-06, -1.915462689794367e-06, -1.8082407677866286e-06, -1.7010187320920522e-06, -1.593796696397476e-06, -1.4865745470160618e-06, -1.3793526250083232e-06, -1.2721304756269092e-06, -1.1649085536191706e-06, -1.0576865179245942e-06, -9.504644822300179e-07, -8.432424465354416e-07, -7.360204108408652e-07, -6.2879831830287e-07, -5.215762826082937e-07, -4.1435424691371736e-07, -3.071322680625599e-07, -1.9991023236798355e-07, -9.26881824625525e-08, 1.4533867442878545e-08, 1.2175590313745488e-07, 2.2897796725374064e-07, 3.36200002948317e-07, 4.434220386428933e-07, 5.506440743374696e-07]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 13.0, 0.0, 0.0, 40.0, 0.0, 0.0, 60.0, 0.0, 0.0, 118.0, 0.0, 0.0, 0.0, 172.0, 0.0, 0.0, 186.0, 0.0, 0.0, 148.0, 0.0, 0.0, 115.0, 0.0, 0.0, 70.0, 0.0, 0.0, 0.0, 39.0, 0.0, 0.0, 21.0, 0.0, 0.0, 12.0, 0.0, 0.0, 6.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.556510925292969e-07, -6.370246410369873e-07, -6.183981895446777e-07, -5.997717380523682e-07, -5.811452865600586e-07, -5.62518835067749e-07, -5.438923835754395e-07, -5.252659320831299e-07, -5.066394805908203e-07, -4.880130290985107e-07, -4.6938657760620117e-07, -4.507601261138916e-07, -4.3213367462158203e-07, -4.1350722312927246e-07, -3.948807716369629e-07, -3.762543201446533e-07, -3.5762786865234375e-07, -3.390014171600342e-07, -3.203749656677246e-07, -3.0174851417541504e-07, -2.8312206268310547e-07, -2.644956111907959e-07, -2.4586915969848633e-07, -2.2724270820617676e-07, -2.086162567138672e-07, -1.8998980522155762e-07, -1.7136335372924805e-07, -1.5273690223693848e-07, -1.341104507446289e-07, -1.1548399925231934e-07, -9.685754776000977e-08, -7.82310962677002e-08, -5.960464477539063e-08, -4.0978193283081055e-08, -2.2351741790771484e-08, -3.725290298461914e-09, 1.4901161193847656e-08, 3.3527612686157227e-08, 5.21540641784668e-08, 7.078051567077637e-08, 8.940696716308594e-08, 1.0803341865539551e-07, 1.2665987014770508e-07, 1.4528632164001465e-07, 1.6391277313232422e-07, 1.825392246246338e-07, 2.0116567611694336e-07, 2.1979212760925293e-07, 2.384185791015625e-07, 2.5704503059387207e-07, 2.7567148208618164e-07, 2.942979335784912e-07, 3.129243850708008e-07, 3.3155083656311035e-07, 3.501772880554199e-07, 3.688037395477295e-07, 3.8743019104003906e-07, 4.0605664253234863e-07, 4.246830940246582e-07, 4.4330954551696777e-07, 4.6193599700927734e-07, 4.805624485015869e-07, 4.991888999938965e-07, 5.178153514862061e-07, 5.364418029785156e-07]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 5.0, 5.0, 11.0, 8.0, 12.0, 19.0, 26.0, 28.0, 29.0, 35.0, 42.0, 44.0, 38.0, 47.0, 52.0, 46.0, 58.0, 45.0, 57.0, 57.0, 49.0, 35.0, 40.0, 40.0, 34.0, 26.0, 26.0, 20.0, 26.0, 5.0, 15.0, 4.0, 7.0, 5.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.798828125, -3.675811767578125, -3.55279541015625, -3.429779052734375, -3.3067626953125, -3.183746337890625, -3.06072998046875, -2.937713623046875, -2.814697265625, -2.691680908203125, -2.56866455078125, -2.445648193359375, -2.3226318359375, -2.199615478515625, -2.07659912109375, -1.953582763671875, -1.83056640625, -1.707550048828125, -1.58453369140625, -1.461517333984375, -1.3385009765625, -1.215484619140625, -1.09246826171875, -0.969451904296875, -0.846435546875, -0.723419189453125, -0.60040283203125, -0.477386474609375, -0.3543701171875, -0.231353759765625, -0.10833740234375, 0.014678955078125, 0.1376953125, 0.260711669921875, 0.38372802734375, 0.506744384765625, 0.6297607421875, 0.752777099609375, 0.87579345703125, 0.998809814453125, 1.121826171875, 1.244842529296875, 1.36785888671875, 1.490875244140625, 1.6138916015625, 1.736907958984375, 1.85992431640625, 1.982940673828125, 2.10595703125, 2.228973388671875, 2.35198974609375, 2.475006103515625, 2.5980224609375, 2.721038818359375, 2.84405517578125, 2.967071533203125, 3.090087890625, 3.213104248046875, 3.33612060546875, 3.459136962890625, 3.5821533203125, 3.705169677734375, 3.82818603515625, 3.951202392578125, 4.07421875]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 10.0, 17.0, 24.0, 32.0, 62.0, 91.0, 151.0, 219.0, 359.0, 483.0, 779.0, 1178.0, 1830.0, 2827.0, 4223.0, 6614.0, 10804.0, 18373.0, 33154.0, 67223.0, 180458.0, 439811.0, 146155.0, 59300.0, 30003.0, 16852.0, 9964.0, 6174.0, 3931.0, 2614.0, 1746.0, 1075.0, 668.0, 482.0, 318.0, 181.0, 142.0, 78.0, 64.0, 46.0, 11.0, 15.0, 9.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.82421875, -3.70977783203125, -3.5953369140625, -3.48089599609375, -3.366455078125, -3.25201416015625, -3.1375732421875, -3.02313232421875, -2.90869140625, -2.79425048828125, -2.6798095703125, -2.56536865234375, -2.450927734375, -2.33648681640625, -2.2220458984375, -2.10760498046875, -1.9931640625, -1.87872314453125, -1.7642822265625, -1.64984130859375, -1.535400390625, -1.42095947265625, -1.3065185546875, -1.19207763671875, -1.07763671875, -0.96319580078125, -0.8487548828125, -0.73431396484375, -0.619873046875, -0.50543212890625, -0.3909912109375, -0.27655029296875, -0.162109375, -0.04766845703125, 0.0667724609375, 0.18121337890625, 0.295654296875, 0.41009521484375, 0.5245361328125, 0.63897705078125, 0.75341796875, 0.86785888671875, 0.9822998046875, 1.09674072265625, 1.211181640625, 1.32562255859375, 1.4400634765625, 1.55450439453125, 1.6689453125, 1.78338623046875, 1.8978271484375, 2.01226806640625, 2.126708984375, 2.24114990234375, 2.3555908203125, 2.47003173828125, 2.58447265625, 2.69891357421875, 2.8133544921875, 2.92779541015625, 3.042236328125, 3.15667724609375, 3.2711181640625, 3.38555908203125, 3.5]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 5.0, 4.0, 4.0, 4.0, 5.0, 9.0, 8.0, 22.0, 22.0, 26.0, 28.0, 30.0, 28.0, 27.0, 32.0, 35.0, 40.0, 39.0, 53.0, 84.0, 192.0, 1539.0, 217.0, 126.0, 68.0, 54.0, 44.0, 35.0, 34.0, 31.0, 27.0, 31.0, 23.0, 17.0, 17.0, 14.0, 14.0, 16.0, 10.0, 6.0, 4.0, 8.0, 8.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.328125, -8.0369873046875, -7.745849609375, -7.4547119140625, -7.16357421875, -6.8724365234375, -6.581298828125, -6.2901611328125, -5.9990234375, -5.7078857421875, -5.416748046875, -5.1256103515625, -4.83447265625, -4.5433349609375, -4.252197265625, -3.9610595703125, -3.669921875, -3.3787841796875, -3.087646484375, -2.7965087890625, -2.50537109375, -2.2142333984375, -1.923095703125, -1.6319580078125, -1.3408203125, -1.0496826171875, -0.758544921875, -0.4674072265625, -0.17626953125, 0.1148681640625, 0.406005859375, 0.6971435546875, 0.98828125, 1.2794189453125, 1.570556640625, 1.8616943359375, 2.15283203125, 2.4439697265625, 2.735107421875, 3.0262451171875, 3.3173828125, 3.6085205078125, 3.899658203125, 4.1907958984375, 4.48193359375, 4.7730712890625, 5.064208984375, 5.3553466796875, 5.646484375, 5.9376220703125, 6.228759765625, 6.5198974609375, 6.81103515625, 7.1021728515625, 7.393310546875, 7.6844482421875, 7.9755859375, 8.2667236328125, 8.557861328125, 8.8489990234375, 9.14013671875, 9.4312744140625, 9.722412109375, 10.0135498046875, 10.3046875]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 6.0, 6.0, 6.0, 5.0, 11.0, 9.0, 15.0, 19.0, 23.0, 22.0, 34.0, 28.0, 56.0, 64.0, 65.0, 93.0, 140.0, 165.0, 256.0, 552.0, 2321.0, 20963.0, 989638.0, 2100359.0, 26401.0, 2806.0, 603.0, 250.0, 167.0, 139.0, 115.0, 87.0, 67.0, 42.0, 39.0, 30.0, 31.0, 28.0, 10.0, 8.0, 5.0, 5.0, 4.0, 5.0, 6.0, 3.0, 1.0, 2.0, 4.0, 1.0], "bins": [-20.328125, -19.7794189453125, -19.230712890625, -18.6820068359375, -18.13330078125, -17.5845947265625, -17.035888671875, -16.4871826171875, -15.9384765625, -15.3897705078125, -14.841064453125, -14.2923583984375, -13.74365234375, -13.1949462890625, -12.646240234375, -12.0975341796875, -11.548828125, -11.0001220703125, -10.451416015625, -9.9027099609375, -9.35400390625, -8.8052978515625, -8.256591796875, -7.7078857421875, -7.1591796875, -6.6104736328125, -6.061767578125, -5.5130615234375, -4.96435546875, -4.4156494140625, -3.866943359375, -3.3182373046875, -2.76953125, -2.2208251953125, -1.672119140625, -1.1234130859375, -0.57470703125, -0.0260009765625, 0.522705078125, 1.0714111328125, 1.6201171875, 2.1688232421875, 2.717529296875, 3.2662353515625, 3.81494140625, 4.3636474609375, 4.912353515625, 5.4610595703125, 6.009765625, 6.5584716796875, 7.107177734375, 7.6558837890625, 8.20458984375, 8.7532958984375, 9.302001953125, 9.8507080078125, 10.3994140625, 10.9481201171875, 11.496826171875, 12.0455322265625, 12.59423828125, 13.1429443359375, 13.691650390625, 14.2403564453125, 14.7890625]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 17.0, 77.0, 208.0, 288.0, 243.0, 125.0, 42.0, 8.0, 2.0, 4.0], "bins": [-77.77172088623047, -76.42308807373047, -75.07445526123047, -73.72582244873047, -72.37718963623047, -71.02855682373047, -69.67992401123047, -68.331298828125, -66.982666015625, -65.634033203125, -64.285400390625, -62.936767578125, -61.588134765625, -60.239505767822266, -58.890872955322266, -57.542240142822266, -56.193603515625, -54.844970703125, -53.496337890625, -52.147705078125, -50.799072265625, -49.450443267822266, -48.101810455322266, -46.753177642822266, -45.404544830322266, -44.055912017822266, -42.707279205322266, -41.358646392822266, -40.01001739501953, -38.66138458251953, -37.31275177001953, -35.96411895751953, -34.6154899597168, -33.2668571472168, -31.918224334716797, -30.56959342956543, -29.22096061706543, -27.87232780456543, -26.523696899414062, -25.175064086914062, -23.826431274414062, -22.477798461914062, -21.129165649414062, -19.780534744262695, -18.431901931762695, -17.083269119262695, -15.734637260437012, -14.386005401611328, -13.037371635437012, -11.688739776611328, -10.340106964111328, -8.991474151611328, -7.6428422927856445, -6.294209957122803, -4.945577621459961, -3.5969457626342773, -2.2483129501342773, -0.8996806144714355, 0.44895172119140625, 1.797584056854248, 3.14621639251709, 4.494848728179932, 5.843481063842773, 7.192112922668457, 8.540745735168457]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 6.0, 2.0, 2.0, 3.0, 7.0, 3.0, 5.0, 11.0, 8.0, 12.0, 10.0, 14.0, 14.0, 20.0, 22.0, 30.0, 18.0, 22.0, 30.0, 26.0, 22.0, 24.0, 30.0, 22.0, 40.0, 31.0, 46.0, 32.0, 45.0, 41.0, 31.0, 29.0, 36.0, 32.0, 38.0, 26.0, 35.0, 28.0, 26.0, 11.0, 23.0, 23.0, 11.0, 11.0, 7.0, 6.0, 9.0, 7.0, 4.0, 4.0, 2.0, 5.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-21.958168029785156, -21.232492446899414, -20.506818771362305, -19.781143188476562, -19.05546760559082, -18.329792022705078, -17.60411834716797, -16.878442764282227, -16.152767181396484, -15.427092552185059, -14.701416969299316, -13.97574234008789, -13.250066757202148, -12.524392127990723, -11.798717498779297, -11.073041915893555, -10.347368240356445, -9.62169361114502, -8.896018028259277, -8.170343399047852, -7.444668292999268, -6.718993186950684, -5.993318557739258, -5.267643451690674, -4.54196834564209, -3.816293239593506, -3.090618371963501, -2.364943504333496, -1.639268398284912, -0.9135932922363281, -0.18791866302490234, 0.5377564430236816, 1.2634315490722656, 1.98910653591156, 2.7147815227508545, 3.4404563903808594, 4.166131496429443, 4.891806602478027, 5.617481231689453, 6.343156337738037, 7.068831443786621, 7.794506549835205, 8.520181655883789, 9.245856285095215, 9.97153091430664, 10.697206497192383, 11.422881126403809, 12.148555755615234, 12.874231338500977, 13.599905967712402, 14.325581550598145, 15.05125617980957, 15.776931762695312, 16.502605438232422, 17.228281021118164, 17.953956604003906, 18.679630279541016, 19.405305862426758, 20.130979537963867, 20.85665512084961, 21.58233070373535, 22.308006286621094, 23.033679962158203, 23.759355545043945, 24.485031127929688]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 11.0, 10.0, 9.0, 13.0, 30.0, 26.0, 31.0, 34.0, 38.0, 43.0, 38.0, 48.0, 53.0, 34.0, 61.0, 50.0, 55.0, 53.0, 55.0, 36.0, 41.0, 37.0, 37.0, 26.0, 23.0, 17.0, 27.0, 19.0, 10.0, 10.0, 4.0, 5.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.859375, -3.7354736328125, -3.611572265625, -3.4876708984375, -3.36376953125, -3.2398681640625, -3.115966796875, -2.9920654296875, -2.8681640625, -2.7442626953125, -2.620361328125, -2.4964599609375, -2.37255859375, -2.2486572265625, -2.124755859375, -2.0008544921875, -1.876953125, -1.7530517578125, -1.629150390625, -1.5052490234375, -1.38134765625, -1.2574462890625, -1.133544921875, -1.0096435546875, -0.8857421875, -0.7618408203125, -0.637939453125, -0.5140380859375, -0.39013671875, -0.2662353515625, -0.142333984375, -0.0184326171875, 0.10546875, 0.2293701171875, 0.353271484375, 0.4771728515625, 0.60107421875, 0.7249755859375, 0.848876953125, 0.9727783203125, 1.0966796875, 1.2205810546875, 1.344482421875, 1.4683837890625, 1.59228515625, 1.7161865234375, 1.840087890625, 1.9639892578125, 2.087890625, 2.2117919921875, 2.335693359375, 2.4595947265625, 2.58349609375, 2.7073974609375, 2.831298828125, 2.9552001953125, 3.0791015625, 3.2030029296875, 3.326904296875, 3.4508056640625, 3.57470703125, 3.6986083984375, 3.822509765625, 3.9464111328125, 4.0703125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 3.0, 8.0, 7.0, 19.0, 12.0, 23.0, 29.0, 34.0, 59.0, 72.0, 109.0, 189.0, 457.0, 1027.0, 2668.0, 7185.0, 22943.0, 95775.0, 624438.0, 2575965.0, 718075.0, 107954.0, 24765.0, 7634.0, 2788.0, 1054.0, 441.0, 203.0, 100.0, 76.0, 44.0, 34.0, 20.0, 18.0, 13.0, 5.0, 9.0, 9.0, 4.0, 2.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-8.21875, -7.96612548828125, -7.7135009765625, -7.46087646484375, -7.208251953125, -6.95562744140625, -6.7030029296875, -6.45037841796875, -6.19775390625, -5.94512939453125, -5.6925048828125, -5.43988037109375, -5.187255859375, -4.93463134765625, -4.6820068359375, -4.42938232421875, -4.1767578125, -3.92413330078125, -3.6715087890625, -3.41888427734375, -3.166259765625, -2.91363525390625, -2.6610107421875, -2.40838623046875, -2.15576171875, -1.90313720703125, -1.6505126953125, -1.39788818359375, -1.145263671875, -0.89263916015625, -0.6400146484375, -0.38739013671875, -0.134765625, 0.11785888671875, 0.3704833984375, 0.62310791015625, 0.875732421875, 1.12835693359375, 1.3809814453125, 1.63360595703125, 1.88623046875, 2.13885498046875, 2.3914794921875, 2.64410400390625, 2.896728515625, 3.14935302734375, 3.4019775390625, 3.65460205078125, 3.9072265625, 4.15985107421875, 4.4124755859375, 4.66510009765625, 4.917724609375, 5.17034912109375, 5.4229736328125, 5.67559814453125, 5.92822265625, 6.18084716796875, 6.4334716796875, 6.68609619140625, 6.938720703125, 7.19134521484375, 7.4439697265625, 7.69659423828125, 7.94921875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 9.0, 7.0, 23.0, 23.0, 45.0, 35.0, 82.0, 118.0, 159.0, 250.0, 365.0, 498.0, 653.0, 574.0, 390.0, 293.0, 203.0, 115.0, 63.0, 59.0, 37.0, 30.0, 17.0, 10.0, 8.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.37109375, -6.11285400390625, -5.8546142578125, -5.59637451171875, -5.338134765625, -5.07989501953125, -4.8216552734375, -4.56341552734375, -4.30517578125, -4.04693603515625, -3.7886962890625, -3.53045654296875, -3.272216796875, -3.01397705078125, -2.7557373046875, -2.49749755859375, -2.2392578125, -1.98101806640625, -1.7227783203125, -1.46453857421875, -1.206298828125, -0.94805908203125, -0.6898193359375, -0.43157958984375, -0.17333984375, 0.08489990234375, 0.3431396484375, 0.60137939453125, 0.859619140625, 1.11785888671875, 1.3760986328125, 1.63433837890625, 1.892578125, 2.15081787109375, 2.4090576171875, 2.66729736328125, 2.925537109375, 3.18377685546875, 3.4420166015625, 3.70025634765625, 3.95849609375, 4.21673583984375, 4.4749755859375, 4.73321533203125, 4.991455078125, 5.24969482421875, 5.5079345703125, 5.76617431640625, 6.0244140625, 6.28265380859375, 6.5408935546875, 6.79913330078125, 7.057373046875, 7.31561279296875, 7.5738525390625, 7.83209228515625, 8.09033203125, 8.34857177734375, 8.6068115234375, 8.86505126953125, 9.123291015625, 9.38153076171875, 9.6397705078125, 9.89801025390625, 10.15625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 5.0, 4.0, 7.0, 13.0, 17.0, 26.0, 43.0, 51.0, 85.0, 118.0, 217.0, 395.0, 847.0, 5118.0, 332208.0, 3804788.0, 46799.0, 2103.0, 605.0, 313.0, 172.0, 113.0, 79.0, 52.0, 34.0, 27.0, 17.0, 13.0, 10.0, 2.0, 5.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.78125, -34.767822265625, -33.75439453125, -32.740966796875, -31.7275390625, -30.714111328125, -29.70068359375, -28.687255859375, -27.673828125, -26.660400390625, -25.64697265625, -24.633544921875, -23.6201171875, -22.606689453125, -21.59326171875, -20.579833984375, -19.56640625, -18.552978515625, -17.53955078125, -16.526123046875, -15.5126953125, -14.499267578125, -13.48583984375, -12.472412109375, -11.458984375, -10.445556640625, -9.43212890625, -8.418701171875, -7.4052734375, -6.391845703125, -5.37841796875, -4.364990234375, -3.3515625, -2.338134765625, -1.32470703125, -0.311279296875, 0.7021484375, 1.715576171875, 2.72900390625, 3.742431640625, 4.755859375, 5.769287109375, 6.78271484375, 7.796142578125, 8.8095703125, 9.822998046875, 10.83642578125, 11.849853515625, 12.86328125, 13.876708984375, 14.89013671875, 15.903564453125, 16.9169921875, 17.930419921875, 18.94384765625, 19.957275390625, 20.970703125, 21.984130859375, 22.99755859375, 24.010986328125, 25.0244140625, 26.037841796875, 27.05126953125, 28.064697265625, 29.078125]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 8.0, 17.0, 38.0, 49.0, 93.0, 109.0, 143.0, 147.0, 131.0, 107.0, 68.0, 41.0, 33.0, 8.0, 9.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-70.85023498535156, -69.44483947753906, -68.03943634033203, -66.63404083251953, -65.22864532470703, -63.823246002197266, -62.4178466796875, -61.012451171875, -59.607051849365234, -58.20165252685547, -56.79625701904297, -55.3908576965332, -53.9854621887207, -52.58006286621094, -51.17466735839844, -49.76926803588867, -48.363868713378906, -46.95846939086914, -45.55307388305664, -44.147674560546875, -42.742279052734375, -41.33687973022461, -39.931480407714844, -38.526084899902344, -37.120689392089844, -35.71529006958008, -34.30989456176758, -32.90449523925781, -31.49909782409668, -30.093700408935547, -28.688302993774414, -27.28290557861328, -25.877504348754883, -24.47210693359375, -23.066709518432617, -21.661312103271484, -20.25591278076172, -18.850515365600586, -17.445117950439453, -16.039718627929688, -14.634322166442871, -13.228924751281738, -11.823526382446289, -10.418128967285156, -9.012731552124023, -7.607333183288574, -6.201935768127441, -4.796537399291992, -3.3911399841308594, -1.985742211341858, -0.5803444385528564, 0.8250532150268555, 2.2304511070251465, 3.6358489990234375, 5.04124641418457, 6.4466447830200195, 7.852042198181152, 9.257439613342285, 10.662837982177734, 12.068235397338867, 13.4736328125, 14.87903118133545, 16.284427642822266, 17.68982696533203, 19.095224380493164]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 8.0, 2.0, 7.0, 7.0, 9.0, 4.0, 7.0, 7.0, 16.0, 12.0, 13.0, 21.0, 25.0, 23.0, 23.0, 33.0, 37.0, 33.0, 40.0, 44.0, 54.0, 52.0, 50.0, 44.0, 57.0, 32.0, 42.0, 33.0, 38.0, 39.0, 29.0, 28.0, 26.0, 20.0, 16.0, 16.0, 14.0, 11.0, 8.0, 18.0, 2.0, 3.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.21916961669922, -25.479211807250977, -24.739255905151367, -23.999298095703125, -23.259340286254883, -22.51938247680664, -21.77942657470703, -21.03946876525879, -20.299510955810547, -19.559553146362305, -18.819597244262695, -18.079639434814453, -17.33968162536621, -16.59972381591797, -15.85976791381836, -15.119810104370117, -14.379854202270508, -13.639897346496582, -12.89993953704834, -12.159982681274414, -11.420024871826172, -10.680068016052246, -9.94011116027832, -9.200153350830078, -8.460196495056152, -7.720239162445068, -6.980281829833984, -6.240324974060059, -5.500367641448975, -4.760410308837891, -4.020453453063965, -3.280496120452881, -2.540538787841797, -1.8005815744400024, -1.060624361038208, -0.3206672668457031, 0.41929006576538086, 1.1592473983764648, 1.8992042541503906, 2.6391615867614746, 3.3791189193725586, 4.119076251983643, 4.859033584594727, 5.598990440368652, 6.338947772979736, 7.07890510559082, 7.818861961364746, 8.558818817138672, 9.298776626586914, 10.03873348236084, 10.778691291809082, 11.518648147583008, 12.25860595703125, 12.998562812805176, 13.738519668579102, 14.478477478027344, 15.21843433380127, 15.958391189575195, 16.698348999023438, 17.438304901123047, 18.17826271057129, 18.91822052001953, 19.65817642211914, 20.398134231567383, 21.138092041015625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 5.0, 6.0, 2.0, 4.0, 7.0, 6.0, 13.0, 13.0, 11.0, 23.0, 30.0, 36.0, 21.0, 37.0, 36.0, 36.0, 39.0, 41.0, 51.0, 48.0, 48.0, 40.0, 45.0, 37.0, 49.0, 44.0, 33.0, 37.0, 31.0, 33.0, 27.0, 21.0, 19.0, 16.0, 17.0, 11.0, 11.0, 6.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.484375, -3.371337890625, -3.25830078125, -3.145263671875, -3.0322265625, -2.919189453125, -2.80615234375, -2.693115234375, -2.580078125, -2.467041015625, -2.35400390625, -2.240966796875, -2.1279296875, -2.014892578125, -1.90185546875, -1.788818359375, -1.67578125, -1.562744140625, -1.44970703125, -1.336669921875, -1.2236328125, -1.110595703125, -0.99755859375, -0.884521484375, -0.771484375, -0.658447265625, -0.54541015625, -0.432373046875, -0.3193359375, -0.206298828125, -0.09326171875, 0.019775390625, 0.1328125, 0.245849609375, 0.35888671875, 0.471923828125, 0.5849609375, 0.697998046875, 0.81103515625, 0.924072265625, 1.037109375, 1.150146484375, 1.26318359375, 1.376220703125, 1.4892578125, 1.602294921875, 1.71533203125, 1.828369140625, 1.94140625, 2.054443359375, 2.16748046875, 2.280517578125, 2.3935546875, 2.506591796875, 2.61962890625, 2.732666015625, 2.845703125, 2.958740234375, 3.07177734375, 3.184814453125, 3.2978515625, 3.410888671875, 3.52392578125, 3.636962890625, 3.75]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 8.0, 10.0, 13.0, 16.0, 32.0, 38.0, 62.0, 119.0, 186.0, 297.0, 480.0, 860.0, 1432.0, 2475.0, 4249.0, 7955.0, 15053.0, 28498.0, 57613.0, 124255.0, 306941.0, 275974.0, 112141.0, 52361.0, 26570.0, 13764.0, 7550.0, 4057.0, 2304.0, 1311.0, 740.0, 460.0, 289.0, 155.0, 102.0, 64.0, 48.0, 22.0, 20.0, 7.0, 13.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03289794921875, -0.03183460235595703, -0.030771255493164062, -0.029707908630371094, -0.028644561767578125, -0.027581214904785156, -0.026517868041992188, -0.02545452117919922, -0.02439117431640625, -0.02332782745361328, -0.022264480590820312, -0.021201133728027344, -0.020137786865234375, -0.019074440002441406, -0.018011093139648438, -0.01694774627685547, -0.0158843994140625, -0.014821052551269531, -0.013757705688476562, -0.012694358825683594, -0.011631011962890625, -0.010567665100097656, -0.009504318237304688, -0.008440971374511719, -0.00737762451171875, -0.006314277648925781, -0.0052509307861328125, -0.004187583923339844, -0.003124237060546875, -0.0020608901977539062, -0.0009975433349609375, 6.580352783203125e-05, 0.001129150390625, 0.0021924972534179688, 0.0032558441162109375, 0.004319190979003906, 0.005382537841796875, 0.006445884704589844, 0.0075092315673828125, 0.008572578430175781, 0.00963592529296875, 0.010699272155761719, 0.011762619018554688, 0.012825965881347656, 0.013889312744140625, 0.014952659606933594, 0.016016006469726562, 0.01707935333251953, 0.0181427001953125, 0.01920604705810547, 0.020269393920898438, 0.021332740783691406, 0.022396087646484375, 0.023459434509277344, 0.024522781372070312, 0.02558612823486328, 0.02664947509765625, 0.02771282196044922, 0.028776168823242188, 0.029839515686035156, 0.030902862548828125, 0.031966209411621094, 0.03302955627441406, 0.03409290313720703, 0.03515625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 4.0, 5.0, 5.0, 9.0, 15.0, 18.0, 21.0, 20.0, 31.0, 31.0, 38.0, 32.0, 35.0, 48.0, 34.0, 42.0, 48.0, 36.0, 1061.0, 53.0, 49.0, 32.0, 43.0, 33.0, 42.0, 36.0, 32.0, 23.0, 22.0, 24.0, 23.0, 10.0, 13.0, 19.0, 6.0, 7.0, 11.0, 4.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.890625, -2.7991943359375, -2.707763671875, -2.6163330078125, -2.52490234375, -2.4334716796875, -2.342041015625, -2.2506103515625, -2.1591796875, -2.0677490234375, -1.976318359375, -1.8848876953125, -1.79345703125, -1.7020263671875, -1.610595703125, -1.5191650390625, -1.427734375, -1.3363037109375, -1.244873046875, -1.1534423828125, -1.06201171875, -0.9705810546875, -0.879150390625, -0.7877197265625, -0.6962890625, -0.6048583984375, -0.513427734375, -0.4219970703125, -0.33056640625, -0.2391357421875, -0.147705078125, -0.0562744140625, 0.03515625, 0.1265869140625, 0.218017578125, 0.3094482421875, 0.40087890625, 0.4923095703125, 0.583740234375, 0.6751708984375, 0.7666015625, 0.8580322265625, 0.949462890625, 1.0408935546875, 1.13232421875, 1.2237548828125, 1.315185546875, 1.4066162109375, 1.498046875, 1.5894775390625, 1.680908203125, 1.7723388671875, 1.86376953125, 1.9552001953125, 2.046630859375, 2.1380615234375, 2.2294921875, 2.3209228515625, 2.412353515625, 2.5037841796875, 2.59521484375, 2.6866455078125, 2.778076171875, 2.8695068359375, 2.9609375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 5.0, 7.0, 8.0, 21.0, 22.0, 22.0, 53.0, 63.0, 115.0, 147.0, 247.0, 342.0, 525.0, 775.0, 1153.0, 1723.0, 2722.0, 4152.0, 6355.0, 10198.0, 15983.0, 25092.0, 39969.0, 64394.0, 105689.0, 176607.0, 1264156.0, 145061.0, 86783.0, 53275.0, 33155.0, 20871.0, 13257.0, 8457.0, 5464.0, 3510.0, 2274.0, 1475.0, 1007.0, 673.0, 423.0, 278.0, 191.0, 141.0, 87.0, 72.0, 38.0, 34.0, 24.0, 14.0, 8.0, 5.0, 1.0, 5.0, 2.0, 3.0, 2.0, 2.0], "bins": [-0.0098419189453125, -0.009537220001220703, -0.009232521057128906, -0.00892782211303711, -0.008623123168945312, -0.008318424224853516, -0.008013725280761719, -0.007709026336669922, -0.007404327392578125, -0.007099628448486328, -0.006794929504394531, -0.006490230560302734, -0.0061855316162109375, -0.005880832672119141, -0.005576133728027344, -0.005271434783935547, -0.00496673583984375, -0.004662036895751953, -0.004357337951660156, -0.004052639007568359, -0.0037479400634765625, -0.0034432411193847656, -0.0031385421752929688, -0.002833843231201172, -0.002529144287109375, -0.002224445343017578, -0.0019197463989257812, -0.0016150474548339844, -0.0013103485107421875, -0.0010056495666503906, -0.0007009506225585938, -0.0003962516784667969, -9.1552734375e-05, 0.00021314620971679688, 0.0005178451538085938, 0.0008225440979003906, 0.0011272430419921875, 0.0014319419860839844, 0.0017366409301757812, 0.002041339874267578, 0.002346038818359375, 0.002650737762451172, 0.0029554367065429688, 0.0032601356506347656, 0.0035648345947265625, 0.0038695335388183594, 0.004174232482910156, 0.004478931427001953, 0.00478363037109375, 0.005088329315185547, 0.005393028259277344, 0.005697727203369141, 0.0060024261474609375, 0.006307125091552734, 0.006611824035644531, 0.006916522979736328, 0.007221221923828125, 0.007525920867919922, 0.007830619812011719, 0.008135318756103516, 0.008440017700195312, 0.00874471664428711, 0.009049415588378906, 0.009354114532470703, 0.0096588134765625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 10.0, 0.0, 12.0, 12.0, 0.0, 15.0, 0.0, 30.0, 32.0, 0.0, 52.0, 0.0, 84.0, 0.0, 137.0, 228.0, 0.0, 150.0, 0.0, 80.0, 0.0, 56.0, 49.0, 0.0, 22.0, 0.0, 14.0, 11.0, 0.0, 3.0, 0.0, 3.0, 0.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1324882507324219e-06, -1.0980293154716492e-06, -1.0635703802108765e-06, -1.0291114449501038e-06, -9.94652509689331e-07, -9.601935744285583e-07, -9.257346391677856e-07, -8.912757039070129e-07, -8.568167686462402e-07, -8.223578333854675e-07, -7.878988981246948e-07, -7.534399628639221e-07, -7.189810276031494e-07, -6.845220923423767e-07, -6.50063157081604e-07, -6.156042218208313e-07, -5.811452865600586e-07, -5.466863512992859e-07, -5.122274160385132e-07, -4.777684807777405e-07, -4.4330954551696777e-07, -4.0885061025619507e-07, -3.7439167499542236e-07, -3.3993273973464966e-07, -3.0547380447387695e-07, -2.7101486921310425e-07, -2.3655593395233154e-07, -2.0209699869155884e-07, -1.6763806343078613e-07, -1.3317912817001343e-07, -9.872019290924072e-08, -6.426125764846802e-08, -2.9802322387695312e-08, 4.6566128730773926e-09, 3.91155481338501e-08, 7.35744833946228e-08, 1.0803341865539551e-07, 1.424923539161682e-07, 1.7695128917694092e-07, 2.1141022443771362e-07, 2.4586915969848633e-07, 2.8032809495925903e-07, 3.1478703022003174e-07, 3.4924596548080444e-07, 3.8370490074157715e-07, 4.1816383600234985e-07, 4.5262277126312256e-07, 4.870817065238953e-07, 5.21540641784668e-07, 5.559995770454407e-07, 5.904585123062134e-07, 6.249174475669861e-07, 6.593763828277588e-07, 6.938353180885315e-07, 7.282942533493042e-07, 7.627531886100769e-07, 7.972121238708496e-07, 8.316710591316223e-07, 8.66129994392395e-07, 9.005889296531677e-07, 9.350478649139404e-07, 9.695068001747131e-07, 1.0039657354354858e-06, 1.0384246706962585e-06, 1.0728836059570312e-06]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 2.0, 4.0, 4.0, 14.0, 16.0, 14.0, 40.0, 38.0, 54.0, 101.0, 252.0, 2001.0, 354813.0, 688045.0, 2552.0, 251.0, 116.0, 74.0, 40.0, 24.0, 13.0, 27.0, 12.0, 5.0, 3.0, 10.0, 7.0, 3.0, 1.0, 4.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.396106719970703e-05, -2.31890007853508e-05, -2.2416934370994568e-05, -2.1644867956638336e-05, -2.0872801542282104e-05, -2.0100735127925873e-05, -1.932866871356964e-05, -1.855660229921341e-05, -1.7784535884857178e-05, -1.7012469470500946e-05, -1.6240403056144714e-05, -1.5468336641788483e-05, -1.4696270227432251e-05, -1.392420381307602e-05, -1.3152137398719788e-05, -1.2380070984363556e-05, -1.1608004570007324e-05, -1.0835938155651093e-05, -1.006387174129486e-05, -9.291805326938629e-06, -8.519738912582397e-06, -7.747672498226166e-06, -6.975606083869934e-06, -6.203539669513702e-06, -5.431473255157471e-06, -4.659406840801239e-06, -3.887340426445007e-06, -3.1152740120887756e-06, -2.343207597732544e-06, -1.5711411833763123e-06, -7.990747690200806e-07, -2.7008354663848877e-08, 7.450580596923828e-07, 1.5171244740486145e-06, 2.289190888404846e-06, 3.061257302761078e-06, 3.8333237171173096e-06, 4.605390131473541e-06, 5.377456545829773e-06, 6.149522960186005e-06, 6.921589374542236e-06, 7.693655788898468e-06, 8.4657222032547e-06, 9.237788617610931e-06, 1.0009855031967163e-05, 1.0781921446323395e-05, 1.1553987860679626e-05, 1.2326054275035858e-05, 1.309812068939209e-05, 1.3870187103748322e-05, 1.4642253518104553e-05, 1.5414319932460785e-05, 1.6186386346817017e-05, 1.6958452761173248e-05, 1.773051917552948e-05, 1.850258558988571e-05, 1.9274652004241943e-05, 2.0046718418598175e-05, 2.0818784832954407e-05, 2.159085124731064e-05, 2.236291766166687e-05, 2.3134984076023102e-05, 2.3907050490379333e-05, 2.4679116904735565e-05, 2.5451183319091797e-05]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 15.0, 32.0, 99.0, 217.0, 295.0, 215.0, 88.0, 25.0, 17.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.2235677736025536e-06, -3.1608997232979164e-06, -3.098231672993279e-06, -3.0355636226886418e-06, -2.97289579975768e-06, -2.9102277494530426e-06, -2.8475596991484053e-06, -2.784891648843768e-06, -2.7222235985391308e-06, -2.6595555482344935e-06, -2.596887497929856e-06, -2.534219447625219e-06, -2.4715513973205816e-06, -2.4088835743896198e-06, -2.3462155240849825e-06, -2.283547473780345e-06, -2.220879423475708e-06, -2.1582113731710706e-06, -2.0955433228664333e-06, -2.032875272561796e-06, -1.970207449630834e-06, -1.907539399326197e-06, -1.8448713490215596e-06, -1.7822032987169223e-06, -1.719535248412285e-06, -1.6568671981076477e-06, -1.5941991478030104e-06, -1.5315312111852109e-06, -1.4688631608805736e-06, -1.4061951105759363e-06, -1.3435271739581367e-06, -1.2808591236534994e-06, -1.2181911870356998e-06, -1.1555231367310626e-06, -1.092855200113263e-06, -1.0301871498086257e-06, -9.675190995039884e-07, -9.048510491993511e-07, -8.421830557381327e-07, -7.795150622769143e-07, -7.16847011972277e-07, -6.541789616676397e-07, -5.915109682064212e-07, -5.288429747452028e-07, -4.661749244405655e-07, -4.0350690255763766e-07, -3.408388806747098e-07, -2.7817085879178194e-07, -2.1550283690885408e-07, -1.5283481502592622e-07, -9.016679314299836e-08, -2.7498771260070498e-08, 3.516925062285736e-08, 9.783727250578522e-08, 1.6050529438871308e-07, 2.2317331627164094e-07, 2.858413381545688e-07, 3.4850936003749666e-07, 4.111773819204245e-07, 4.738454038033524e-07, 5.365134256862802e-07, 5.991814759909175e-07, 6.61849469452136e-07, 7.245174629133544e-07, 7.871855132179917e-07]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 15.0, 0.0, 0.0, 0.0, 27.0, 0.0, 0.0, 0.0, 64.0, 0.0, 0.0, 0.0, 109.0, 0.0, 0.0, 0.0, 192.0, 0.0, 0.0, 0.0, 217.0, 0.0, 0.0, 0.0, 189.0, 0.0, 0.0, 0.0, 104.0, 0.0, 0.0, 0.0, 54.0, 0.0, 0.0, 0.0, 27.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-07, -4.6193599700927734e-07, -4.470348358154297e-07, -4.3213367462158203e-07, -4.172325134277344e-07, -4.023313522338867e-07, -3.8743019104003906e-07, -3.725290298461914e-07, -3.5762786865234375e-07, -3.427267074584961e-07, -3.2782554626464844e-07, -3.129243850708008e-07, -2.980232238769531e-07, -2.8312206268310547e-07, -2.682209014892578e-07, -2.5331974029541016e-07, -2.384185791015625e-07, -2.2351741790771484e-07, -2.086162567138672e-07, -1.9371509552001953e-07, -1.7881393432617188e-07, -1.6391277313232422e-07, -1.4901161193847656e-07, -1.341104507446289e-07, -1.1920928955078125e-07, -1.043081283569336e-07, -8.940696716308594e-08, -7.450580596923828e-08, -5.960464477539063e-08, -4.470348358154297e-08, -2.9802322387695312e-08, -1.4901161193847656e-08, 0.0, 1.4901161193847656e-08, 2.9802322387695312e-08, 4.470348358154297e-08, 5.960464477539063e-08, 7.450580596923828e-08, 8.940696716308594e-08, 1.043081283569336e-07, 1.1920928955078125e-07, 1.341104507446289e-07, 1.4901161193847656e-07, 1.6391277313232422e-07, 1.7881393432617188e-07, 1.9371509552001953e-07, 2.086162567138672e-07, 2.2351741790771484e-07, 2.384185791015625e-07, 2.5331974029541016e-07, 2.682209014892578e-07, 2.8312206268310547e-07, 2.980232238769531e-07, 3.129243850708008e-07, 3.2782554626464844e-07, 3.427267074584961e-07, 3.5762786865234375e-07, 3.725290298461914e-07, 3.8743019104003906e-07, 4.023313522338867e-07, 4.172325134277344e-07, 4.3213367462158203e-07, 4.470348358154297e-07, 4.6193599700927734e-07, 4.76837158203125e-07]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 5.0, 6.0, 2.0, 4.0, 7.0, 6.0, 13.0, 13.0, 11.0, 23.0, 30.0, 36.0, 21.0, 37.0, 36.0, 36.0, 39.0, 41.0, 51.0, 48.0, 48.0, 40.0, 45.0, 37.0, 49.0, 44.0, 33.0, 37.0, 31.0, 33.0, 27.0, 21.0, 19.0, 16.0, 17.0, 11.0, 11.0, 6.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.484375, -3.371337890625, -3.25830078125, -3.145263671875, -3.0322265625, -2.919189453125, -2.80615234375, -2.693115234375, -2.580078125, -2.467041015625, -2.35400390625, -2.240966796875, -2.1279296875, -2.014892578125, -1.90185546875, -1.788818359375, -1.67578125, -1.562744140625, -1.44970703125, -1.336669921875, -1.2236328125, -1.110595703125, -0.99755859375, -0.884521484375, -0.771484375, -0.658447265625, -0.54541015625, -0.432373046875, -0.3193359375, -0.206298828125, -0.09326171875, 0.019775390625, 0.1328125, 0.245849609375, 0.35888671875, 0.471923828125, 0.5849609375, 0.697998046875, 0.81103515625, 0.924072265625, 1.037109375, 1.150146484375, 1.26318359375, 1.376220703125, 1.4892578125, 1.602294921875, 1.71533203125, 1.828369140625, 1.94140625, 2.054443359375, 2.16748046875, 2.280517578125, 2.3935546875, 2.506591796875, 2.61962890625, 2.732666015625, 2.845703125, 2.958740234375, 3.07177734375, 3.184814453125, 3.2978515625, 3.410888671875, 3.52392578125, 3.636962890625, 3.75]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 9.0, 8.0, 8.0, 11.0, 15.0, 23.0, 46.0, 81.0, 139.0, 219.0, 320.0, 606.0, 915.0, 1372.0, 2234.0, 3562.0, 5609.0, 9200.0, 14500.0, 24102.0, 43947.0, 86170.0, 227802.0, 375069.0, 118786.0, 56375.0, 30585.0, 17610.0, 11037.0, 6752.0, 4284.0, 2618.0, 1732.0, 1060.0, 646.0, 442.0, 260.0, 141.0, 112.0, 65.0, 35.0, 31.0, 15.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.736328125, -2.642608642578125, -2.54888916015625, -2.455169677734375, -2.3614501953125, -2.267730712890625, -2.17401123046875, -2.080291748046875, -1.986572265625, -1.892852783203125, -1.79913330078125, -1.705413818359375, -1.6116943359375, -1.517974853515625, -1.42425537109375, -1.330535888671875, -1.23681640625, -1.143096923828125, -1.04937744140625, -0.955657958984375, -0.8619384765625, -0.768218994140625, -0.67449951171875, -0.580780029296875, -0.487060546875, -0.393341064453125, -0.29962158203125, -0.205902099609375, -0.1121826171875, -0.018463134765625, 0.07525634765625, 0.168975830078125, 0.2626953125, 0.356414794921875, 0.45013427734375, 0.543853759765625, 0.6375732421875, 0.731292724609375, 0.82501220703125, 0.918731689453125, 1.012451171875, 1.106170654296875, 1.19989013671875, 1.293609619140625, 1.3873291015625, 1.481048583984375, 1.57476806640625, 1.668487548828125, 1.76220703125, 1.855926513671875, 1.94964599609375, 2.043365478515625, 2.1370849609375, 2.230804443359375, 2.32452392578125, 2.418243408203125, 2.511962890625, 2.605682373046875, 2.69940185546875, 2.793121337890625, 2.8868408203125, 2.980560302734375, 3.07427978515625, 3.167999267578125, 3.26171875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 7.0, 5.0, 14.0, 15.0, 12.0, 14.0, 13.0, 21.0, 22.0, 35.0, 28.0, 36.0, 31.0, 39.0, 56.0, 56.0, 87.0, 178.0, 1581.0, 264.0, 79.0, 54.0, 45.0, 63.0, 34.0, 38.0, 27.0, 24.0, 17.0, 27.0, 23.0, 19.0, 17.0, 15.0, 9.0, 11.0, 8.0, 8.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.671875, -9.365966796875, -9.06005859375, -8.754150390625, -8.4482421875, -8.142333984375, -7.83642578125, -7.530517578125, -7.224609375, -6.918701171875, -6.61279296875, -6.306884765625, -6.0009765625, -5.695068359375, -5.38916015625, -5.083251953125, -4.77734375, -4.471435546875, -4.16552734375, -3.859619140625, -3.5537109375, -3.247802734375, -2.94189453125, -2.635986328125, -2.330078125, -2.024169921875, -1.71826171875, -1.412353515625, -1.1064453125, -0.800537109375, -0.49462890625, -0.188720703125, 0.1171875, 0.423095703125, 0.72900390625, 1.034912109375, 1.3408203125, 1.646728515625, 1.95263671875, 2.258544921875, 2.564453125, 2.870361328125, 3.17626953125, 3.482177734375, 3.7880859375, 4.093994140625, 4.39990234375, 4.705810546875, 5.01171875, 5.317626953125, 5.62353515625, 5.929443359375, 6.2353515625, 6.541259765625, 6.84716796875, 7.153076171875, 7.458984375, 7.764892578125, 8.07080078125, 8.376708984375, 8.6826171875, 8.988525390625, 9.29443359375, 9.600341796875, 9.90625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 6.0, 5.0, 10.0, 15.0, 18.0, 31.0, 29.0, 56.0, 49.0, 66.0, 108.0, 118.0, 204.0, 257.0, 475.0, 1214.0, 6324.0, 87333.0, 2863403.0, 172818.0, 10011.0, 1558.0, 558.0, 289.0, 199.0, 140.0, 117.0, 59.0, 50.0, 46.0, 26.0, 32.0, 20.0, 11.0, 12.0, 9.0, 8.0, 6.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.359375, -15.8575439453125, -15.355712890625, -14.8538818359375, -14.35205078125, -13.8502197265625, -13.348388671875, -12.8465576171875, -12.3447265625, -11.8428955078125, -11.341064453125, -10.8392333984375, -10.33740234375, -9.8355712890625, -9.333740234375, -8.8319091796875, -8.330078125, -7.8282470703125, -7.326416015625, -6.8245849609375, -6.32275390625, -5.8209228515625, -5.319091796875, -4.8172607421875, -4.3154296875, -3.8135986328125, -3.311767578125, -2.8099365234375, -2.30810546875, -1.8062744140625, -1.304443359375, -0.8026123046875, -0.30078125, 0.2010498046875, 0.702880859375, 1.2047119140625, 1.70654296875, 2.2083740234375, 2.710205078125, 3.2120361328125, 3.7138671875, 4.2156982421875, 4.717529296875, 5.2193603515625, 5.72119140625, 6.2230224609375, 6.724853515625, 7.2266845703125, 7.728515625, 8.2303466796875, 8.732177734375, 9.2340087890625, 9.73583984375, 10.2376708984375, 10.739501953125, 11.2413330078125, 11.7431640625, 12.2449951171875, 12.746826171875, 13.2486572265625, 13.75048828125, 14.2523193359375, 14.754150390625, 15.2559814453125, 15.7578125]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 15.0, 176.0, 509.0, 281.0, 28.0, 5.0, 0.0, 0.0, 1.0], "bins": [-152.0040283203125, -149.3657684326172, -146.72750854492188, -144.08924865722656, -141.45098876953125, -138.812744140625, -136.1744842529297, -133.53622436523438, -130.89796447753906, -128.25970458984375, -125.62144470214844, -122.98319244384766, -120.34493255615234, -117.70667266845703, -115.06842041015625, -112.43016052246094, -109.79190063476562, -107.15364074707031, -104.515380859375, -101.87712860107422, -99.2388687133789, -96.6006088256836, -93.96235656738281, -91.3240966796875, -88.68583679199219, -86.04757690429688, -83.40931701660156, -80.77106475830078, -78.13280487060547, -75.49454498291016, -72.85629272460938, -70.21803283691406, -67.57976531982422, -64.9415054321289, -62.30324935913086, -59.66499328613281, -57.0267333984375, -54.38847351074219, -51.75021743774414, -49.111961364746094, -46.47370147705078, -43.83544158935547, -41.19718551635742, -38.558929443359375, -35.92066955566406, -33.28240966796875, -30.644153594970703, -28.005895614624023, -25.367639541625977, -22.729381561279297, -20.091123580932617, -17.452865600585938, -14.814607620239258, -12.176349639892578, -9.538091659545898, -6.899833679199219, -4.261575698852539, -1.6233177185058594, 1.0149402618408203, 3.6531982421875, 6.29145622253418, 8.92971420288086, 11.567972183227539, 14.206230163574219, 16.8444881439209]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 2.0, 5.0, 12.0, 9.0, 16.0, 20.0, 13.0, 25.0, 26.0, 34.0, 18.0, 38.0, 38.0, 53.0, 31.0, 43.0, 33.0, 38.0, 44.0, 49.0, 43.0, 44.0, 55.0, 43.0, 36.0, 32.0, 37.0, 28.0, 29.0, 25.0, 18.0, 13.0, 9.0, 8.0, 11.0, 11.0, 7.0, 4.0, 3.0, 7.0, 0.0, 0.0, 1.0, 2.0], "bins": [-38.28861999511719, -37.29345703125, -36.29829406738281, -35.303131103515625, -34.30796432495117, -33.312801361083984, -32.3176383972168, -31.32247543334961, -30.327312469482422, -29.332149505615234, -28.336984634399414, -27.341821670532227, -26.34665870666504, -25.35149383544922, -24.35633087158203, -23.361167907714844, -22.366003036499023, -21.370840072631836, -20.375675201416016, -19.380512237548828, -18.38534927368164, -17.390186309814453, -16.395021438598633, -15.399858474731445, -14.404694557189941, -13.409530639648438, -12.41436767578125, -11.419203758239746, -10.424039840698242, -9.428876876831055, -8.43371295928955, -7.438549518585205, -6.443386077880859, -5.448222637176514, -4.453059196472168, -3.457895278930664, -2.4627318382263184, -1.4675683975219727, -0.47240447998046875, 0.522758960723877, 1.5179224014282227, 2.5130858421325684, 3.508249521255493, 4.503413200378418, 5.498576641082764, 6.493740081787109, 7.488903999328613, 8.484067916870117, 9.479230880737305, 10.474394798278809, 11.469557762145996, 12.4647216796875, 13.459884643554688, 14.455048561096191, 15.450212478637695, 16.445375442504883, 17.440540313720703, 18.43570327758789, 19.43086814880371, 20.4260311126709, 21.421194076538086, 22.416358947753906, 23.411521911621094, 24.40668487548828, 25.40184783935547]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 4.0, 1.0, 9.0, 6.0, 14.0, 9.0, 16.0, 21.0, 16.0, 24.0, 39.0, 31.0, 35.0, 46.0, 42.0, 40.0, 48.0, 56.0, 38.0, 45.0, 50.0, 46.0, 30.0, 42.0, 47.0, 40.0, 37.0, 30.0, 21.0, 25.0, 23.0, 18.0, 13.0, 11.0, 7.0, 8.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.763671875, -3.642486572265625, -3.52130126953125, -3.400115966796875, -3.2789306640625, -3.157745361328125, -3.03656005859375, -2.915374755859375, -2.794189453125, -2.673004150390625, -2.55181884765625, -2.430633544921875, -2.3094482421875, -2.188262939453125, -2.06707763671875, -1.945892333984375, -1.82470703125, -1.703521728515625, -1.58233642578125, -1.461151123046875, -1.3399658203125, -1.218780517578125, -1.09759521484375, -0.976409912109375, -0.855224609375, -0.734039306640625, -0.61285400390625, -0.491668701171875, -0.3704833984375, -0.249298095703125, -0.12811279296875, -0.006927490234375, 0.1142578125, 0.235443115234375, 0.35662841796875, 0.477813720703125, 0.5989990234375, 0.720184326171875, 0.84136962890625, 0.962554931640625, 1.083740234375, 1.204925537109375, 1.32611083984375, 1.447296142578125, 1.5684814453125, 1.689666748046875, 1.81085205078125, 1.932037353515625, 2.05322265625, 2.174407958984375, 2.29559326171875, 2.416778564453125, 2.5379638671875, 2.659149169921875, 2.78033447265625, 2.901519775390625, 3.022705078125, 3.143890380859375, 3.26507568359375, 3.386260986328125, 3.5074462890625, 3.628631591796875, 3.74981689453125, 3.871002197265625, 3.9921875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 2.0, 15.0, 11.0, 13.0, 27.0, 34.0, 37.0, 52.0, 67.0, 98.0, 170.0, 299.0, 451.0, 853.0, 1754.0, 3871.0, 10810.0, 34493.0, 152549.0, 1047642.0, 2404297.0, 428335.0, 76246.0, 19911.0, 6648.0, 2699.0, 1254.0, 620.0, 372.0, 197.0, 137.0, 83.0, 66.0, 31.0, 34.0, 35.0, 23.0, 11.0, 8.0, 6.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-8.4765625, -8.22186279296875, -7.9671630859375, -7.71246337890625, -7.457763671875, -7.20306396484375, -6.9483642578125, -6.69366455078125, -6.43896484375, -6.18426513671875, -5.9295654296875, -5.67486572265625, -5.420166015625, -5.16546630859375, -4.9107666015625, -4.65606689453125, -4.4013671875, -4.14666748046875, -3.8919677734375, -3.63726806640625, -3.382568359375, -3.12786865234375, -2.8731689453125, -2.61846923828125, -2.36376953125, -2.10906982421875, -1.8543701171875, -1.59967041015625, -1.344970703125, -1.09027099609375, -0.8355712890625, -0.58087158203125, -0.326171875, -0.07147216796875, 0.1832275390625, 0.43792724609375, 0.692626953125, 0.94732666015625, 1.2020263671875, 1.45672607421875, 1.71142578125, 1.96612548828125, 2.2208251953125, 2.47552490234375, 2.730224609375, 2.98492431640625, 3.2396240234375, 3.49432373046875, 3.7490234375, 4.00372314453125, 4.2584228515625, 4.51312255859375, 4.767822265625, 5.02252197265625, 5.2772216796875, 5.53192138671875, 5.78662109375, 6.04132080078125, 6.2960205078125, 6.55072021484375, 6.805419921875, 7.06011962890625, 7.3148193359375, 7.56951904296875, 7.82421875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 0.0, 5.0, 15.0, 14.0, 28.0, 44.0, 51.0, 77.0, 98.0, 169.0, 211.0, 289.0, 405.0, 565.0, 560.0, 478.0, 327.0, 221.0, 164.0, 113.0, 82.0, 47.0, 30.0, 25.0, 14.0, 15.0, 4.0, 7.0, 4.0, 1.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.859375, -8.62109375, -8.3828125, -8.14453125, -7.90625, -7.66796875, -7.4296875, -7.19140625, -6.953125, -6.71484375, -6.4765625, -6.23828125, -6.0, -5.76171875, -5.5234375, -5.28515625, -5.046875, -4.80859375, -4.5703125, -4.33203125, -4.09375, -3.85546875, -3.6171875, -3.37890625, -3.140625, -2.90234375, -2.6640625, -2.42578125, -2.1875, -1.94921875, -1.7109375, -1.47265625, -1.234375, -0.99609375, -0.7578125, -0.51953125, -0.28125, -0.04296875, 0.1953125, 0.43359375, 0.671875, 0.91015625, 1.1484375, 1.38671875, 1.625, 1.86328125, 2.1015625, 2.33984375, 2.578125, 2.81640625, 3.0546875, 3.29296875, 3.53125, 3.76953125, 4.0078125, 4.24609375, 4.484375, 4.72265625, 4.9609375, 5.19921875, 5.4375, 5.67578125, 5.9140625, 6.15234375, 6.390625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 10.0, 19.0, 25.0, 34.0, 43.0, 89.0, 120.0, 182.0, 311.0, 1009.0, 12094.0, 3055910.0, 1116114.0, 6660.0, 766.0, 318.0, 181.0, 127.0, 80.0, 52.0, 45.0, 27.0, 20.0, 13.0, 8.0, 2.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.8125, -33.5654296875, -32.318359375, -31.0712890625, -29.82421875, -28.5771484375, -27.330078125, -26.0830078125, -24.8359375, -23.5888671875, -22.341796875, -21.0947265625, -19.84765625, -18.6005859375, -17.353515625, -16.1064453125, -14.859375, -13.6123046875, -12.365234375, -11.1181640625, -9.87109375, -8.6240234375, -7.376953125, -6.1298828125, -4.8828125, -3.6357421875, -2.388671875, -1.1416015625, 0.10546875, 1.3525390625, 2.599609375, 3.8466796875, 5.09375, 6.3408203125, 7.587890625, 8.8349609375, 10.08203125, 11.3291015625, 12.576171875, 13.8232421875, 15.0703125, 16.3173828125, 17.564453125, 18.8115234375, 20.05859375, 21.3056640625, 22.552734375, 23.7998046875, 25.046875, 26.2939453125, 27.541015625, 28.7880859375, 30.03515625, 31.2822265625, 32.529296875, 33.7763671875, 35.0234375, 36.2705078125, 37.517578125, 38.7646484375, 40.01171875, 41.2587890625, 42.505859375, 43.7529296875, 45.0]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 10.0, 20.0, 34.0, 42.0, 58.0, 84.0, 100.0, 110.0, 119.0, 106.0, 80.0, 85.0, 55.0, 51.0, 22.0, 14.0, 11.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.600330352783203, -20.448476791381836, -19.29662322998047, -18.144771575927734, -16.992918014526367, -15.841064453125, -14.689210891723633, -13.537358283996582, -12.385504722595215, -11.233651161193848, -10.081798553466797, -8.92994499206543, -7.778091907501221, -6.626238822937012, -5.4743852615356445, -4.322532653808594, -3.1706790924072266, -2.0188260078430176, -0.8669726848602295, 0.2848806381225586, 1.4367337226867676, 2.5885868072509766, 3.7404403686523438, 4.8922929763793945, 6.044146537780762, 7.195999622344971, 8.34785270690918, 9.499706268310547, 10.651559829711914, 11.803412437438965, 12.955265998840332, 14.107118606567383, 15.25897216796875, 16.410825729370117, 17.562679290771484, 18.71453094482422, 19.866384506225586, 21.018238067626953, 22.17009162902832, 23.321945190429688, 24.473796844482422, 25.62565040588379, 26.777503967285156, 27.92935562133789, 29.081209182739258, 30.233062744140625, 31.384916305541992, 32.53676986694336, 33.688621520996094, 34.84047317504883, 35.99232864379883, 37.14418029785156, 38.29603576660156, 39.4478874206543, 40.59973907470703, 41.75159454345703, 42.90345001220703, 44.055301666259766, 45.207157135009766, 46.3590087890625, 47.5108642578125, 48.662715911865234, 49.81456756591797, 50.96642303466797, 52.1182746887207]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 2.0, 5.0, 5.0, 10.0, 14.0, 8.0, 14.0, 14.0, 21.0, 13.0, 22.0, 19.0, 24.0, 30.0, 43.0, 40.0, 35.0, 45.0, 54.0, 49.0, 41.0, 43.0, 40.0, 34.0, 32.0, 23.0, 43.0, 37.0, 32.0, 30.0, 23.0, 17.0, 18.0, 16.0, 16.0, 18.0, 9.0, 16.0, 14.0, 4.0, 10.0, 8.0, 2.0, 3.0, 6.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.611778259277344, -21.919265747070312, -21.22675323486328, -20.53424072265625, -19.841726303100586, -19.149213790893555, -18.456701278686523, -17.764188766479492, -17.071674346923828, -16.379161834716797, -15.68664836883545, -14.994135856628418, -14.30162239074707, -13.609109878540039, -12.916597366333008, -12.224084854125977, -11.531572341918945, -10.839059829711914, -10.146546363830566, -9.454033851623535, -8.761520385742188, -8.069007873535156, -7.376495361328125, -6.6839823722839355, -5.991469383239746, -5.298956394195557, -4.606443405151367, -3.913930892944336, -3.2214179039001465, -2.528904914855957, -1.8363924026489258, -1.1438794136047363, -0.45136451721191406, 0.24114835262298584, 0.9336612224578857, 1.626173973083496, 2.3186869621276855, 3.011199951171875, 3.7037124633789062, 4.396225452423096, 5.088738441467285, 5.781251430511475, 6.473764419555664, 7.166276931762695, 7.858789920806885, 8.551302909851074, 9.243815422058105, 9.936328887939453, 10.628841400146484, 11.321353912353516, 12.013867378234863, 12.706379890441895, 13.398893356323242, 14.091405868530273, 14.783918380737305, 15.476430892944336, 16.1689453125, 16.86145782470703, 17.553970336914062, 18.246482849121094, 18.938997268676758, 19.63150978088379, 20.32402229309082, 21.01653480529785, 21.709047317504883]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 6.0, 6.0, 9.0, 12.0, 9.0, 4.0, 12.0, 21.0, 17.0, 18.0, 38.0, 32.0, 44.0, 59.0, 54.0, 34.0, 47.0, 56.0, 54.0, 55.0, 47.0, 50.0, 44.0, 56.0, 34.0, 33.0, 16.0, 35.0, 24.0, 28.0, 11.0, 18.0, 2.0, 9.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.36328125, -4.2288818359375, -4.094482421875, -3.9600830078125, -3.82568359375, -3.6912841796875, -3.556884765625, -3.4224853515625, -3.2880859375, -3.1536865234375, -3.019287109375, -2.8848876953125, -2.75048828125, -2.6160888671875, -2.481689453125, -2.3472900390625, -2.212890625, -2.0784912109375, -1.944091796875, -1.8096923828125, -1.67529296875, -1.5408935546875, -1.406494140625, -1.2720947265625, -1.1376953125, -1.0032958984375, -0.868896484375, -0.7344970703125, -0.60009765625, -0.4656982421875, -0.331298828125, -0.1968994140625, -0.0625, 0.0718994140625, 0.206298828125, 0.3406982421875, 0.47509765625, 0.6094970703125, 0.743896484375, 0.8782958984375, 1.0126953125, 1.1470947265625, 1.281494140625, 1.4158935546875, 1.55029296875, 1.6846923828125, 1.819091796875, 1.9534912109375, 2.087890625, 2.2222900390625, 2.356689453125, 2.4910888671875, 2.62548828125, 2.7598876953125, 2.894287109375, 3.0286865234375, 3.1630859375, 3.2974853515625, 3.431884765625, 3.5662841796875, 3.70068359375, 3.8350830078125, 3.969482421875, 4.1038818359375, 4.23828125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 4.0, 5.0, 10.0, 13.0, 15.0, 25.0, 47.0, 61.0, 92.0, 145.0, 256.0, 381.0, 634.0, 1019.0, 1747.0, 2906.0, 5014.0, 8693.0, 15161.0, 27513.0, 53400.0, 107975.0, 232777.0, 300490.0, 141963.0, 68574.0, 35019.0, 19032.0, 10617.0, 6084.0, 3500.0, 2130.0, 1254.0, 760.0, 475.0, 265.0, 168.0, 108.0, 81.0, 46.0, 38.0, 17.0, 11.0, 9.0, 11.0, 9.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.030792236328125, -0.02986431121826172, -0.028936386108398438, -0.028008460998535156, -0.027080535888671875, -0.026152610778808594, -0.025224685668945312, -0.02429676055908203, -0.02336883544921875, -0.02244091033935547, -0.021512985229492188, -0.020585060119628906, -0.019657135009765625, -0.018729209899902344, -0.017801284790039062, -0.01687335968017578, -0.0159454345703125, -0.015017509460449219, -0.014089584350585938, -0.013161659240722656, -0.012233734130859375, -0.011305809020996094, -0.010377883911132812, -0.009449958801269531, -0.00852203369140625, -0.007594108581542969, -0.0066661834716796875, -0.005738258361816406, -0.004810333251953125, -0.0038824081420898438, -0.0029544830322265625, -0.0020265579223632812, -0.0010986328125, -0.00017070770263671875, 0.0007572174072265625, 0.0016851425170898438, 0.002613067626953125, 0.0035409927368164062, 0.0044689178466796875, 0.005396842956542969, 0.00632476806640625, 0.007252693176269531, 0.008180618286132812, 0.009108543395996094, 0.010036468505859375, 0.010964393615722656, 0.011892318725585938, 0.012820243835449219, 0.0137481689453125, 0.014676094055175781, 0.015604019165039062, 0.016531944274902344, 0.017459869384765625, 0.018387794494628906, 0.019315719604492188, 0.02024364471435547, 0.02117156982421875, 0.02209949493408203, 0.023027420043945312, 0.023955345153808594, 0.024883270263671875, 0.025811195373535156, 0.026739120483398438, 0.02766704559326172, 0.028594970703125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 5.0, 5.0, 7.0, 8.0, 15.0, 12.0, 10.0, 17.0, 20.0, 25.0, 40.0, 21.0, 29.0, 27.0, 32.0, 43.0, 55.0, 47.0, 46.0, 44.0, 1064.0, 33.0, 33.0, 33.0, 50.0, 23.0, 36.0, 23.0, 24.0, 20.0, 29.0, 19.0, 22.0, 15.0, 16.0, 15.0, 15.0, 4.0, 5.0, 6.0, 4.0, 8.0, 3.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.640625, -2.55615234375, -2.4716796875, -2.38720703125, -2.302734375, -2.21826171875, -2.1337890625, -2.04931640625, -1.96484375, -1.88037109375, -1.7958984375, -1.71142578125, -1.626953125, -1.54248046875, -1.4580078125, -1.37353515625, -1.2890625, -1.20458984375, -1.1201171875, -1.03564453125, -0.951171875, -0.86669921875, -0.7822265625, -0.69775390625, -0.61328125, -0.52880859375, -0.4443359375, -0.35986328125, -0.275390625, -0.19091796875, -0.1064453125, -0.02197265625, 0.0625, 0.14697265625, 0.2314453125, 0.31591796875, 0.400390625, 0.48486328125, 0.5693359375, 0.65380859375, 0.73828125, 0.82275390625, 0.9072265625, 0.99169921875, 1.076171875, 1.16064453125, 1.2451171875, 1.32958984375, 1.4140625, 1.49853515625, 1.5830078125, 1.66748046875, 1.751953125, 1.83642578125, 1.9208984375, 2.00537109375, 2.08984375, 2.17431640625, 2.2587890625, 2.34326171875, 2.427734375, 2.51220703125, 2.5966796875, 2.68115234375, 2.765625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 7.0, 12.0, 22.0, 33.0, 52.0, 71.0, 80.0, 124.0, 182.0, 257.0, 323.0, 549.0, 740.0, 1066.0, 1597.0, 2470.0, 3667.0, 5412.0, 8015.0, 12240.0, 18519.0, 28481.0, 44568.0, 71075.0, 117896.0, 189888.0, 1247939.0, 127852.0, 77102.0, 47617.0, 30507.0, 19670.0, 12877.0, 8578.0, 5669.0, 3934.0, 2529.0, 1757.0, 1150.0, 821.0, 550.0, 367.0, 274.0, 196.0, 118.0, 85.0, 56.0, 44.0, 37.0, 27.0, 16.0, 10.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0], "bins": [-0.0096282958984375, -0.009328126907348633, -0.009027957916259766, -0.008727788925170898, -0.008427619934082031, -0.008127450942993164, -0.007827281951904297, -0.00752711296081543, -0.0072269439697265625, -0.006926774978637695, -0.006626605987548828, -0.006326436996459961, -0.006026268005371094, -0.0057260990142822266, -0.005425930023193359, -0.005125761032104492, -0.004825592041015625, -0.004525423049926758, -0.004225254058837891, -0.0039250850677490234, -0.0036249160766601562, -0.003324747085571289, -0.003024578094482422, -0.0027244091033935547, -0.0024242401123046875, -0.0021240711212158203, -0.0018239021301269531, -0.001523733139038086, -0.0012235641479492188, -0.0009233951568603516, -0.0006232261657714844, -0.0003230571746826172, -2.288818359375e-05, 0.0002772808074951172, 0.0005774497985839844, 0.0008776187896728516, 0.0011777877807617188, 0.001477956771850586, 0.0017781257629394531, 0.0020782947540283203, 0.0023784637451171875, 0.0026786327362060547, 0.002978801727294922, 0.003278970718383789, 0.0035791397094726562, 0.0038793087005615234, 0.004179477691650391, 0.004479646682739258, 0.004779815673828125, 0.005079984664916992, 0.005380153656005859, 0.0056803226470947266, 0.005980491638183594, 0.006280660629272461, 0.006580829620361328, 0.006880998611450195, 0.0071811676025390625, 0.00748133659362793, 0.007781505584716797, 0.008081674575805664, 0.008381843566894531, 0.008682012557983398, 0.008982181549072266, 0.009282350540161133, 0.00958251953125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 6.0, 2.0, 6.0, 0.0, 6.0, 7.0, 12.0, 0.0, 19.0, 42.0, 46.0, 0.0, 77.0, 144.0, 245.0, 0.0, 136.0, 98.0, 51.0, 0.0, 41.0, 15.0, 13.0, 0.0, 10.0, 4.0, 4.0, 0.0, 5.0, 9.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5497207641601562e-06, -1.5050172805786133e-06, -1.4603137969970703e-06, -1.4156103134155273e-06, -1.3709068298339844e-06, -1.3262033462524414e-06, -1.2814998626708984e-06, -1.2367963790893555e-06, -1.1920928955078125e-06, -1.1473894119262695e-06, -1.1026859283447266e-06, -1.0579824447631836e-06, -1.0132789611816406e-06, -9.685754776000977e-07, -9.238719940185547e-07, -8.791685104370117e-07, -8.344650268554688e-07, -7.897615432739258e-07, -7.450580596923828e-07, -7.003545761108398e-07, -6.556510925292969e-07, -6.109476089477539e-07, -5.662441253662109e-07, -5.21540641784668e-07, -4.76837158203125e-07, -4.3213367462158203e-07, -3.8743019104003906e-07, -3.427267074584961e-07, -2.980232238769531e-07, -2.5331974029541016e-07, -2.086162567138672e-07, -1.6391277313232422e-07, -1.1920928955078125e-07, -7.450580596923828e-08, -2.9802322387695312e-08, 1.4901161193847656e-08, 5.960464477539063e-08, 1.043081283569336e-07, 1.4901161193847656e-07, 1.9371509552001953e-07, 2.384185791015625e-07, 2.8312206268310547e-07, 3.2782554626464844e-07, 3.725290298461914e-07, 4.172325134277344e-07, 4.6193599700927734e-07, 5.066394805908203e-07, 5.513429641723633e-07, 5.960464477539062e-07, 6.407499313354492e-07, 6.854534149169922e-07, 7.301568984985352e-07, 7.748603820800781e-07, 8.195638656616211e-07, 8.642673492431641e-07, 9.08970832824707e-07, 9.5367431640625e-07, 9.98377799987793e-07, 1.043081283569336e-06, 1.087784767150879e-06, 1.1324882507324219e-06, 1.1771917343139648e-06, 1.2218952178955078e-06, 1.2665987014770508e-06, 1.3113021850585938e-06]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 8.0, 4.0, 3.0, 6.0, 3.0, 12.0, 10.0, 16.0, 32.0, 60.0, 82.0, 218.0, 1043.0, 707537.0, 338427.0, 681.0, 164.0, 95.0, 55.0, 30.0, 21.0, 9.0, 7.0, 5.0, 10.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.9265880584716797e-05, -2.828892320394516e-05, -2.7311965823173523e-05, -2.6335008442401886e-05, -2.535805106163025e-05, -2.4381093680858612e-05, -2.3404136300086975e-05, -2.2427178919315338e-05, -2.14502215385437e-05, -2.0473264157772064e-05, -1.9496306777000427e-05, -1.851934939622879e-05, -1.7542392015457153e-05, -1.6565434634685516e-05, -1.558847725391388e-05, -1.4611519873142242e-05, -1.3634562492370605e-05, -1.2657605111598969e-05, -1.1680647730827332e-05, -1.0703690350055695e-05, -9.726732969284058e-06, -8.74977558851242e-06, -7.772818207740784e-06, -6.795860826969147e-06, -5.81890344619751e-06, -4.841946065425873e-06, -3.864988684654236e-06, -2.888031303882599e-06, -1.911073923110962e-06, -9.34116542339325e-07, 4.284083843231201e-08, 1.019798219203949e-06, 1.996755599975586e-06, 2.973712980747223e-06, 3.95067036151886e-06, 4.927627742290497e-06, 5.904585123062134e-06, 6.881542503833771e-06, 7.858499884605408e-06, 8.835457265377045e-06, 9.812414646148682e-06, 1.0789372026920319e-05, 1.1766329407691956e-05, 1.2743286788463593e-05, 1.372024416923523e-05, 1.4697201550006866e-05, 1.5674158930778503e-05, 1.665111631155014e-05, 1.7628073692321777e-05, 1.8605031073093414e-05, 1.958198845386505e-05, 2.0558945834636688e-05, 2.1535903215408325e-05, 2.2512860596179962e-05, 2.34898179769516e-05, 2.4466775357723236e-05, 2.5443732738494873e-05, 2.642069011926651e-05, 2.7397647500038147e-05, 2.8374604880809784e-05, 2.935156226158142e-05, 3.0328519642353058e-05, 3.1305477023124695e-05, 3.228243440389633e-05, 3.325939178466797e-05]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 12.0, 36.0, 149.0, 381.0, 290.0, 113.0, 31.0, 2.0, 2.0, 1.0, 4.0], "bins": [-4.538730536296498e-06, -4.45892055722652e-06, -4.379110578156542e-06, -4.299300144339213e-06, -4.219490165269235e-06, -4.139680186199257e-06, -4.059870207129279e-06, -3.980060228059301e-06, -3.900249794241972e-06, -3.820439815171994e-06, -3.740629608728341e-06, -3.660819629658363e-06, -3.5810094232147094e-06, -3.5011994441447314e-06, -3.4213894650747534e-06, -3.3415794860047754e-06, -3.2617695069347974e-06, -3.1819595278648194e-06, -3.102149321421166e-06, -3.022339342351188e-06, -2.9425291359075345e-06, -2.8627191568375565e-06, -2.7829091777675785e-06, -2.7030991986976005e-06, -2.623288992253947e-06, -2.543479013183969e-06, -2.4636688067403156e-06, -2.3838588276703376e-06, -2.3040488486003596e-06, -2.224238642156706e-06, -2.144428663086728e-06, -2.0646184566430748e-06, -1.9848084775730968e-06, -1.904998384816281e-06, -1.8251882920594653e-06, -1.7453783129894873e-06, -1.6655682202326716e-06, -1.5857581274758559e-06, -1.5059481484058779e-06, -1.4261380556490622e-06, -1.3463279628922464e-06, -1.2665178701354307e-06, -1.186707777378615e-06, -1.106897798308637e-06, -1.0270877055518213e-06, -9.472776127950056e-07, -8.674675768816087e-07, -7.876575409682118e-07, -7.07847505054815e-07, -6.280374691414181e-07, -5.482273763846024e-07, -4.684173120494961e-07, -3.886072477143898e-07, -3.087971833792835e-07, -2.2898711904417723e-07, -1.4917708313078037e-07, -6.936699037396465e-08, 1.0443073961141636e-08, 9.025313829624793e-08, 1.7006320263135422e-07, 2.498732669664605e-07, 3.296833313015668e-07, 4.094933956366731e-07, 4.893034315500699e-07, 5.691135243068857e-07]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 0.0, 65.0, 0.0, 0.0, 112.0, 0.0, 0.0, 0.0, 167.0, 0.0, 0.0, 0.0, 221.0, 0.0, 0.0, 0.0, 185.0, 0.0, 0.0, 132.0, 0.0, 0.0, 0.0, 52.0, 0.0, 0.0, 0.0, 34.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.172325134277344e-07, -4.0140002965927124e-07, -3.855675458908081e-07, -3.6973506212234497e-07, -3.5390257835388184e-07, -3.380700945854187e-07, -3.2223761081695557e-07, -3.0640512704849243e-07, -2.905726432800293e-07, -2.7474015951156616e-07, -2.5890767574310303e-07, -2.430751919746399e-07, -2.2724270820617676e-07, -2.1141022443771362e-07, -1.955777406692505e-07, -1.7974525690078735e-07, -1.6391277313232422e-07, -1.4808028936386108e-07, -1.3224780559539795e-07, -1.1641532182693481e-07, -1.0058283805847168e-07, -8.475035429000854e-08, -6.891787052154541e-08, -5.3085386753082275e-08, -3.725290298461914e-08, -2.1420419216156006e-08, -5.587935447692871e-09, 1.0244548320770264e-08, 2.60770320892334e-08, 4.190951585769653e-08, 5.774199962615967e-08, 7.35744833946228e-08, 8.940696716308594e-08, 1.0523945093154907e-07, 1.210719347000122e-07, 1.3690441846847534e-07, 1.5273690223693848e-07, 1.685693860054016e-07, 1.8440186977386475e-07, 2.0023435354232788e-07, 2.1606683731079102e-07, 2.3189932107925415e-07, 2.477318048477173e-07, 2.635642886161804e-07, 2.7939677238464355e-07, 2.952292561531067e-07, 3.110617399215698e-07, 3.2689422369003296e-07, 3.427267074584961e-07, 3.5855919122695923e-07, 3.7439167499542236e-07, 3.902241587638855e-07, 4.0605664253234863e-07, 4.2188912630081177e-07, 4.377216100692749e-07, 4.5355409383773804e-07, 4.6938657760620117e-07, 4.852190613746643e-07, 5.010515451431274e-07, 5.168840289115906e-07, 5.327165126800537e-07, 5.485489964485168e-07, 5.6438148021698e-07, 5.802139639854431e-07, 5.960464477539062e-07]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 6.0, 6.0, 9.0, 12.0, 9.0, 4.0, 12.0, 21.0, 17.0, 18.0, 38.0, 32.0, 44.0, 59.0, 54.0, 34.0, 47.0, 56.0, 54.0, 55.0, 47.0, 50.0, 44.0, 56.0, 34.0, 33.0, 16.0, 35.0, 24.0, 28.0, 11.0, 18.0, 2.0, 9.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.36328125, -4.2288818359375, -4.094482421875, -3.9600830078125, -3.82568359375, -3.6912841796875, -3.556884765625, -3.4224853515625, -3.2880859375, -3.1536865234375, -3.019287109375, -2.8848876953125, -2.75048828125, -2.6160888671875, -2.481689453125, -2.3472900390625, -2.212890625, -2.0784912109375, -1.944091796875, -1.8096923828125, -1.67529296875, -1.5408935546875, -1.406494140625, -1.2720947265625, -1.1376953125, -1.0032958984375, -0.868896484375, -0.7344970703125, -0.60009765625, -0.4656982421875, -0.331298828125, -0.1968994140625, -0.0625, 0.0718994140625, 0.206298828125, 0.3406982421875, 0.47509765625, 0.6094970703125, 0.743896484375, 0.8782958984375, 1.0126953125, 1.1470947265625, 1.281494140625, 1.4158935546875, 1.55029296875, 1.6846923828125, 1.819091796875, 1.9534912109375, 2.087890625, 2.2222900390625, 2.356689453125, 2.4910888671875, 2.62548828125, 2.7598876953125, 2.894287109375, 3.0286865234375, 3.1630859375, 3.2974853515625, 3.431884765625, 3.5662841796875, 3.70068359375, 3.8350830078125, 3.969482421875, 4.1038818359375, 4.23828125]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 1.0, 6.0, 6.0, 10.0, 12.0, 10.0, 21.0, 31.0, 31.0, 52.0, 51.0, 83.0, 127.0, 184.0, 258.0, 387.0, 610.0, 867.0, 1316.0, 2048.0, 3171.0, 5078.0, 8454.0, 14790.0, 27272.0, 56413.0, 165846.0, 514303.0, 136205.0, 50845.0, 24956.0, 13624.0, 8061.0, 4661.0, 3053.0, 1960.0, 1203.0, 780.0, 550.0, 367.0, 254.0, 174.0, 127.0, 95.0, 50.0, 46.0, 34.0, 24.0, 22.0, 7.0, 10.0, 3.0, 5.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.9921875, -3.86517333984375, -3.7381591796875, -3.61114501953125, -3.484130859375, -3.35711669921875, -3.2301025390625, -3.10308837890625, -2.97607421875, -2.84906005859375, -2.7220458984375, -2.59503173828125, -2.468017578125, -2.34100341796875, -2.2139892578125, -2.08697509765625, -1.9599609375, -1.83294677734375, -1.7059326171875, -1.57891845703125, -1.451904296875, -1.32489013671875, -1.1978759765625, -1.07086181640625, -0.94384765625, -0.81683349609375, -0.6898193359375, -0.56280517578125, -0.435791015625, -0.30877685546875, -0.1817626953125, -0.05474853515625, 0.072265625, 0.19927978515625, 0.3262939453125, 0.45330810546875, 0.580322265625, 0.70733642578125, 0.8343505859375, 0.96136474609375, 1.08837890625, 1.21539306640625, 1.3424072265625, 1.46942138671875, 1.596435546875, 1.72344970703125, 1.8504638671875, 1.97747802734375, 2.1044921875, 2.23150634765625, 2.3585205078125, 2.48553466796875, 2.612548828125, 2.73956298828125, 2.8665771484375, 2.99359130859375, 3.12060546875, 3.24761962890625, 3.3746337890625, 3.50164794921875, 3.628662109375, 3.75567626953125, 3.8826904296875, 4.00970458984375, 4.13671875]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 5.0, 6.0, 7.0, 7.0, 8.0, 10.0, 15.0, 17.0, 16.0, 27.0, 28.0, 19.0, 35.0, 31.0, 29.0, 58.0, 64.0, 68.0, 74.0, 163.0, 1544.0, 266.0, 101.0, 75.0, 42.0, 46.0, 24.0, 36.0, 29.0, 27.0, 17.0, 17.0, 19.0, 16.0, 24.0, 12.0, 11.0, 11.0, 5.0, 7.0, 9.0, 5.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-10.765625, -10.4468994140625, -10.128173828125, -9.8094482421875, -9.49072265625, -9.1719970703125, -8.853271484375, -8.5345458984375, -8.2158203125, -7.8970947265625, -7.578369140625, -7.2596435546875, -6.94091796875, -6.6221923828125, -6.303466796875, -5.9847412109375, -5.666015625, -5.3472900390625, -5.028564453125, -4.7098388671875, -4.39111328125, -4.0723876953125, -3.753662109375, -3.4349365234375, -3.1162109375, -2.7974853515625, -2.478759765625, -2.1600341796875, -1.84130859375, -1.5225830078125, -1.203857421875, -0.8851318359375, -0.56640625, -0.2476806640625, 0.071044921875, 0.3897705078125, 0.70849609375, 1.0272216796875, 1.345947265625, 1.6646728515625, 1.9833984375, 2.3021240234375, 2.620849609375, 2.9395751953125, 3.25830078125, 3.5770263671875, 3.895751953125, 4.2144775390625, 4.533203125, 4.8519287109375, 5.170654296875, 5.4893798828125, 5.80810546875, 6.1268310546875, 6.445556640625, 6.7642822265625, 7.0830078125, 7.4017333984375, 7.720458984375, 8.0391845703125, 8.35791015625, 8.6766357421875, 8.995361328125, 9.3140869140625, 9.6328125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 3.0, 3.0, 7.0, 5.0, 8.0, 10.0, 9.0, 20.0, 20.0, 24.0, 26.0, 27.0, 30.0, 33.0, 62.0, 67.0, 108.0, 151.0, 333.0, 733.0, 2821.0, 15735.0, 189543.0, 2809978.0, 110939.0, 11262.0, 2174.0, 665.0, 287.0, 148.0, 114.0, 78.0, 54.0, 58.0, 34.0, 26.0, 29.0, 16.0, 15.0, 6.0, 8.0, 10.0, 4.0, 2.0, 7.0, 5.0, 1.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-15.28125, -14.77880859375, -14.2763671875, -13.77392578125, -13.271484375, -12.76904296875, -12.2666015625, -11.76416015625, -11.26171875, -10.75927734375, -10.2568359375, -9.75439453125, -9.251953125, -8.74951171875, -8.2470703125, -7.74462890625, -7.2421875, -6.73974609375, -6.2373046875, -5.73486328125, -5.232421875, -4.72998046875, -4.2275390625, -3.72509765625, -3.22265625, -2.72021484375, -2.2177734375, -1.71533203125, -1.212890625, -0.71044921875, -0.2080078125, 0.29443359375, 0.796875, 1.29931640625, 1.8017578125, 2.30419921875, 2.806640625, 3.30908203125, 3.8115234375, 4.31396484375, 4.81640625, 5.31884765625, 5.8212890625, 6.32373046875, 6.826171875, 7.32861328125, 7.8310546875, 8.33349609375, 8.8359375, 9.33837890625, 9.8408203125, 10.34326171875, 10.845703125, 11.34814453125, 11.8505859375, 12.35302734375, 12.85546875, 13.35791015625, 13.8603515625, 14.36279296875, 14.865234375, 15.36767578125, 15.8701171875, 16.37255859375, 16.875]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.0, 133.0, 370.0, 333.0, 123.0, 19.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.88629913330078, -65.94255828857422, -63.99882125854492, -62.05508041381836, -60.11134338378906, -58.1676025390625, -56.22386169433594, -54.280120849609375, -52.33638381958008, -50.392642974853516, -48.44890594482422, -46.505165100097656, -44.561424255371094, -42.6176872253418, -40.673946380615234, -38.73020935058594, -36.786468505859375, -34.84272766113281, -32.898990631103516, -30.955249786376953, -29.011510848999023, -27.067771911621094, -25.12403106689453, -23.1802921295166, -21.236553192138672, -19.292814254760742, -17.349075317382812, -15.40533447265625, -13.46159553527832, -11.51785659790039, -9.574116706848145, -7.630376815795898, -5.686641693115234, -3.7429022789001465, -1.7991628646850586, 0.1445765495300293, 2.088315963745117, 4.032054901123047, 5.975794792175293, 7.919534683227539, 9.863273620605469, 11.807012557983398, 13.750752449035645, 15.69449234008789, 17.63823127746582, 19.58197021484375, 21.525711059570312, 23.469449996948242, 25.413188934326172, 27.3569278717041, 29.30066680908203, 31.244407653808594, 33.188148498535156, 35.13188552856445, 37.075626373291016, 39.01936340332031, 40.963104248046875, 42.90684509277344, 44.850582122802734, 46.7943229675293, 48.738059997558594, 50.681800842285156, 52.62554168701172, 54.56928253173828, 56.51301956176758]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 8.0, 3.0, 3.0, 11.0, 4.0, 7.0, 8.0, 8.0, 7.0, 25.0, 16.0, 25.0, 29.0, 34.0, 35.0, 34.0, 33.0, 31.0, 33.0, 43.0, 40.0, 49.0, 57.0, 49.0, 53.0, 40.0, 36.0, 26.0, 36.0, 28.0, 27.0, 27.0, 28.0, 19.0, 19.0, 17.0, 11.0, 19.0, 9.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.740440368652344, -33.620113372802734, -32.499786376953125, -31.379457473754883, -30.25912857055664, -29.13880157470703, -28.018474578857422, -26.898147583007812, -25.77781867980957, -24.65749168395996, -23.53716278076172, -22.41683578491211, -21.2965087890625, -20.176179885864258, -19.05585289001465, -17.935523986816406, -16.815196990966797, -15.694869041442871, -14.574541091918945, -13.454214096069336, -12.33388614654541, -11.213558197021484, -10.093231201171875, -8.97290325164795, -7.852575302124023, -6.732247352600098, -5.61191987991333, -4.4915924072265625, -3.3712644577026367, -2.250936508178711, -1.1306090354919434, -0.010281562805175781, 1.1100425720214844, 2.230370283126831, 3.3506979942321777, 4.471025466918945, 5.591353416442871, 6.711681365966797, 7.8320088386535645, 8.952336311340332, 10.072664260864258, 11.192992210388184, 12.31332015991211, 13.433647155761719, 14.553975105285645, 15.67430305480957, 16.79463005065918, 17.914958953857422, 19.03528594970703, 20.15561294555664, 21.275941848754883, 22.396268844604492, 23.516597747802734, 24.636924743652344, 25.757251739501953, 26.877578735351562, 27.997907638549805, 29.118234634399414, 30.238563537597656, 31.358890533447266, 32.479217529296875, 33.59954833984375, 34.71987533569336, 35.84020233154297, 36.96052932739258]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 7.0, 9.0, 10.0, 7.0, 14.0, 8.0, 16.0, 17.0, 16.0, 34.0, 36.0, 39.0, 48.0, 49.0, 34.0, 48.0, 46.0, 39.0, 50.0, 51.0, 56.0, 41.0, 36.0, 35.0, 39.0, 34.0, 30.0, 28.0, 28.0, 23.0, 13.0, 18.0, 11.0, 10.0, 8.0, 3.0, 5.0, 0.0, 0.0, 8.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.22265625, -4.095611572265625, -3.96856689453125, -3.841522216796875, -3.7144775390625, -3.587432861328125, -3.46038818359375, -3.333343505859375, -3.206298828125, -3.079254150390625, -2.95220947265625, -2.825164794921875, -2.6981201171875, -2.571075439453125, -2.44403076171875, -2.316986083984375, -2.18994140625, -2.062896728515625, -1.93585205078125, -1.808807373046875, -1.6817626953125, -1.554718017578125, -1.42767333984375, -1.300628662109375, -1.173583984375, -1.046539306640625, -0.91949462890625, -0.792449951171875, -0.6654052734375, -0.538360595703125, -0.41131591796875, -0.284271240234375, -0.1572265625, -0.030181884765625, 0.09686279296875, 0.223907470703125, 0.3509521484375, 0.477996826171875, 0.60504150390625, 0.732086181640625, 0.859130859375, 0.986175537109375, 1.11322021484375, 1.240264892578125, 1.3673095703125, 1.494354248046875, 1.62139892578125, 1.748443603515625, 1.87548828125, 2.002532958984375, 2.12957763671875, 2.256622314453125, 2.3836669921875, 2.510711669921875, 2.63775634765625, 2.764801025390625, 2.891845703125, 3.018890380859375, 3.14593505859375, 3.272979736328125, 3.4000244140625, 3.527069091796875, 3.65411376953125, 3.781158447265625, 3.908203125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 4.0, 8.0, 10.0, 17.0, 33.0, 47.0, 70.0, 86.0, 138.0, 260.0, 394.0, 548.0, 827.0, 1340.0, 2279.0, 3525.0, 6110.0, 10495.0, 19181.0, 37373.0, 79999.0, 188504.0, 475043.0, 1105554.0, 1253570.0, 585309.0, 231622.0, 96429.0, 44179.0, 22393.0, 11834.0, 6591.0, 3919.0, 2383.0, 1497.0, 968.0, 602.0, 404.0, 253.0, 169.0, 112.0, 70.0, 43.0, 40.0, 20.0, 13.0, 6.0, 5.0, 3.0, 1.0, 4.0, 1.0], "bins": [-4.3828125, -4.261444091796875, -4.14007568359375, -4.018707275390625, -3.8973388671875, -3.775970458984375, -3.65460205078125, -3.533233642578125, -3.411865234375, -3.290496826171875, -3.16912841796875, -3.047760009765625, -2.9263916015625, -2.805023193359375, -2.68365478515625, -2.562286376953125, -2.44091796875, -2.319549560546875, -2.19818115234375, -2.076812744140625, -1.9554443359375, -1.834075927734375, -1.71270751953125, -1.591339111328125, -1.469970703125, -1.348602294921875, -1.22723388671875, -1.105865478515625, -0.9844970703125, -0.863128662109375, -0.74176025390625, -0.620391845703125, -0.4990234375, -0.377655029296875, -0.25628662109375, -0.134918212890625, -0.0135498046875, 0.107818603515625, 0.22918701171875, 0.350555419921875, 0.471923828125, 0.593292236328125, 0.71466064453125, 0.836029052734375, 0.9573974609375, 1.078765869140625, 1.20013427734375, 1.321502685546875, 1.44287109375, 1.564239501953125, 1.68560791015625, 1.806976318359375, 1.9283447265625, 2.049713134765625, 2.17108154296875, 2.292449951171875, 2.413818359375, 2.535186767578125, 2.65655517578125, 2.777923583984375, 2.8992919921875, 3.020660400390625, 3.14202880859375, 3.263397216796875, 3.384765625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 1.0, 8.0, 6.0, 10.0, 13.0, 19.0, 28.0, 19.0, 47.0, 41.0, 64.0, 81.0, 90.0, 120.0, 178.0, 222.0, 264.0, 357.0, 374.0, 441.0, 329.0, 298.0, 242.0, 188.0, 131.0, 112.0, 85.0, 69.0, 54.0, 45.0, 25.0, 26.0, 14.0, 13.0, 14.0, 12.0, 9.0, 8.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.61328125, -5.4439697265625, -5.274658203125, -5.1053466796875, -4.93603515625, -4.7667236328125, -4.597412109375, -4.4281005859375, -4.2587890625, -4.0894775390625, -3.920166015625, -3.7508544921875, -3.58154296875, -3.4122314453125, -3.242919921875, -3.0736083984375, -2.904296875, -2.7349853515625, -2.565673828125, -2.3963623046875, -2.22705078125, -2.0577392578125, -1.888427734375, -1.7191162109375, -1.5498046875, -1.3804931640625, -1.211181640625, -1.0418701171875, -0.87255859375, -0.7032470703125, -0.533935546875, -0.3646240234375, -0.1953125, -0.0260009765625, 0.143310546875, 0.3126220703125, 0.48193359375, 0.6512451171875, 0.820556640625, 0.9898681640625, 1.1591796875, 1.3284912109375, 1.497802734375, 1.6671142578125, 1.83642578125, 2.0057373046875, 2.175048828125, 2.3443603515625, 2.513671875, 2.6829833984375, 2.852294921875, 3.0216064453125, 3.19091796875, 3.3602294921875, 3.529541015625, 3.6988525390625, 3.8681640625, 4.0374755859375, 4.206787109375, 4.3760986328125, 4.54541015625, 4.7147216796875, 4.884033203125, 5.0533447265625, 5.22265625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 8.0, 6.0, 9.0, 7.0, 18.0, 21.0, 27.0, 35.0, 42.0, 67.0, 102.0, 134.0, 196.0, 321.0, 610.0, 1542.0, 6671.0, 69963.0, 2326284.0, 1724043.0, 55435.0, 5732.0, 1439.0, 590.0, 329.0, 191.0, 118.0, 83.0, 66.0, 41.0, 35.0, 23.0, 24.0, 17.0, 9.0, 7.0, 6.0, 7.0, 5.0, 5.0, 2.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.265625, -18.643310546875, -18.02099609375, -17.398681640625, -16.7763671875, -16.154052734375, -15.53173828125, -14.909423828125, -14.287109375, -13.664794921875, -13.04248046875, -12.420166015625, -11.7978515625, -11.175537109375, -10.55322265625, -9.930908203125, -9.30859375, -8.686279296875, -8.06396484375, -7.441650390625, -6.8193359375, -6.197021484375, -5.57470703125, -4.952392578125, -4.330078125, -3.707763671875, -3.08544921875, -2.463134765625, -1.8408203125, -1.218505859375, -0.59619140625, 0.026123046875, 0.6484375, 1.270751953125, 1.89306640625, 2.515380859375, 3.1376953125, 3.760009765625, 4.38232421875, 5.004638671875, 5.626953125, 6.249267578125, 6.87158203125, 7.493896484375, 8.1162109375, 8.738525390625, 9.36083984375, 9.983154296875, 10.60546875, 11.227783203125, 11.85009765625, 12.472412109375, 13.0947265625, 13.717041015625, 14.33935546875, 14.961669921875, 15.583984375, 16.206298828125, 16.82861328125, 17.450927734375, 18.0732421875, 18.695556640625, 19.31787109375, 19.940185546875, 20.5625]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 16.0, 78.0, 248.0, 331.0, 233.0, 88.0, 18.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-172.13938903808594, -168.85865783691406, -165.5779266357422, -162.2971954345703, -159.01646423339844, -155.73573303222656, -152.4550018310547, -149.1742706298828, -145.89353942871094, -142.61280822753906, -139.3320770263672, -136.0513458251953, -132.77061462402344, -129.48988342285156, -126.20915222167969, -122.92842102050781, -119.64768981933594, -116.36695861816406, -113.08622741699219, -109.80549621582031, -106.52476501464844, -103.24403381347656, -99.96330261230469, -96.68257141113281, -93.4018325805664, -90.12110137939453, -86.84037017822266, -83.55963897705078, -80.2789077758789, -76.99817657470703, -73.71744537353516, -70.43671417236328, -67.1559829711914, -63.87525177001953, -60.594520568847656, -57.31378936767578, -54.033058166503906, -50.75232696533203, -47.471595764160156, -44.19086456298828, -40.910133361816406, -37.62940216064453, -34.348670959472656, -31.06793975830078, -27.787208557128906, -24.5064754486084, -21.225744247436523, -17.94501304626465, -14.66427993774414, -11.383548736572266, -8.10281753540039, -4.822085380554199, -1.5413541793823242, 1.7393779754638672, 5.020109176635742, 8.300840377807617, 11.581571578979492, 14.862302780151367, 18.143033981323242, 21.42376708984375, 24.704498291015625, 27.9852294921875, 31.265960693359375, 34.54669189453125, 37.827423095703125]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 3.0, 9.0, 7.0, 17.0, 11.0, 15.0, 16.0, 22.0, 17.0, 15.0, 25.0, 23.0, 27.0, 32.0, 50.0, 41.0, 45.0, 32.0, 46.0, 50.0, 34.0, 40.0, 39.0, 36.0, 32.0, 28.0, 39.0, 35.0, 27.0, 23.0, 26.0, 20.0, 10.0, 20.0, 14.0, 13.0, 14.0, 12.0, 10.0, 7.0, 4.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.730224609375, -21.10227394104004, -20.474321365356445, -19.846370697021484, -19.21841812133789, -18.59046745300293, -17.962514877319336, -17.334564208984375, -16.70661163330078, -16.07866096496582, -15.450708389282227, -14.82275676727295, -14.194805145263672, -13.566854476928711, -12.938902854919434, -12.310951232910156, -11.683000564575195, -11.055048942565918, -10.42709732055664, -9.799145698547363, -9.171194076538086, -8.543243408203125, -7.915291786193848, -7.28734016418457, -6.659388542175293, -6.031436920166016, -5.403485298156738, -4.775534152984619, -4.147582530975342, -3.5196309089660645, -2.891679525375366, -2.263728141784668, -1.6357765197753906, -1.0078250169754028, -0.37987351417541504, 0.24807798862457275, 0.8760294914245605, 1.503981113433838, 2.131932497024536, 2.7598838806152344, 3.3878355026245117, 4.015787124633789, 4.643738746643066, 5.2716898918151855, 5.899641513824463, 6.52759313583374, 7.155544281005859, 7.783495903015137, 8.411447525024414, 9.039399147033691, 9.667350769042969, 10.295302391052246, 10.923254013061523, 11.551204681396484, 12.179156303405762, 12.807107925415039, 13.435059547424316, 14.063011169433594, 14.690962791442871, 15.318914413452148, 15.94686508178711, 16.574817657470703, 17.202768325805664, 17.830718994140625, 18.45867156982422]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 4.0, 3.0, 9.0, 8.0, 10.0, 9.0, 18.0, 15.0, 23.0, 9.0, 19.0, 27.0, 28.0, 34.0, 46.0, 36.0, 54.0, 45.0, 40.0, 43.0, 39.0, 49.0, 37.0, 46.0, 46.0, 41.0, 33.0, 37.0, 24.0, 24.0, 28.0, 21.0, 23.0, 18.0, 15.0, 10.0, 10.0, 5.0, 5.0, 3.0, 5.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.87890625, -3.759674072265625, -3.64044189453125, -3.521209716796875, -3.4019775390625, -3.282745361328125, -3.16351318359375, -3.044281005859375, -2.925048828125, -2.805816650390625, -2.68658447265625, -2.567352294921875, -2.4481201171875, -2.328887939453125, -2.20965576171875, -2.090423583984375, -1.97119140625, -1.851959228515625, -1.73272705078125, -1.613494873046875, -1.4942626953125, -1.375030517578125, -1.25579833984375, -1.136566162109375, -1.017333984375, -0.898101806640625, -0.77886962890625, -0.659637451171875, -0.5404052734375, -0.421173095703125, -0.30194091796875, -0.182708740234375, -0.0634765625, 0.055755615234375, 0.17498779296875, 0.294219970703125, 0.4134521484375, 0.532684326171875, 0.65191650390625, 0.771148681640625, 0.890380859375, 1.009613037109375, 1.12884521484375, 1.248077392578125, 1.3673095703125, 1.486541748046875, 1.60577392578125, 1.725006103515625, 1.84423828125, 1.963470458984375, 2.08270263671875, 2.201934814453125, 2.3211669921875, 2.440399169921875, 2.55963134765625, 2.678863525390625, 2.798095703125, 2.917327880859375, 3.03656005859375, 3.155792236328125, 3.2750244140625, 3.394256591796875, 3.51348876953125, 3.632720947265625, 3.751953125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 10.0, 11.0, 9.0, 27.0, 36.0, 38.0, 60.0, 85.0, 143.0, 193.0, 366.0, 470.0, 742.0, 1282.0, 1928.0, 3009.0, 5156.0, 8281.0, 13524.0, 23544.0, 42242.0, 82175.0, 173123.0, 307131.0, 188411.0, 88507.0, 45385.0, 25330.0, 14486.0, 8681.0, 5258.0, 3222.0, 2054.0, 1262.0, 817.0, 542.0, 337.0, 213.0, 166.0, 95.0, 57.0, 45.0, 29.0, 24.0, 15.0, 12.0, 11.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.0290985107421875, -0.028204679489135742, -0.027310848236083984, -0.026417016983032227, -0.02552318572998047, -0.02462935447692871, -0.023735523223876953, -0.022841691970825195, -0.021947860717773438, -0.02105402946472168, -0.020160198211669922, -0.019266366958618164, -0.018372535705566406, -0.01747870445251465, -0.01658487319946289, -0.015691041946411133, -0.014797210693359375, -0.013903379440307617, -0.01300954818725586, -0.012115716934204102, -0.011221885681152344, -0.010328054428100586, -0.009434223175048828, -0.00854039192199707, -0.0076465606689453125, -0.006752729415893555, -0.005858898162841797, -0.004965066909790039, -0.004071235656738281, -0.0031774044036865234, -0.0022835731506347656, -0.0013897418975830078, -0.00049591064453125, 0.0003979206085205078, 0.0012917518615722656, 0.0021855831146240234, 0.0030794143676757812, 0.003973245620727539, 0.004867076873779297, 0.005760908126831055, 0.0066547393798828125, 0.00754857063293457, 0.008442401885986328, 0.009336233139038086, 0.010230064392089844, 0.011123895645141602, 0.01201772689819336, 0.012911558151245117, 0.013805389404296875, 0.014699220657348633, 0.01559305191040039, 0.01648688316345215, 0.017380714416503906, 0.018274545669555664, 0.019168376922607422, 0.02006220817565918, 0.020956039428710938, 0.021849870681762695, 0.022743701934814453, 0.02363753318786621, 0.02453136444091797, 0.025425195693969727, 0.026319026947021484, 0.027212858200073242, 0.028106689453125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 8.0, 3.0, 3.0, 5.0, 5.0, 3.0, 13.0, 4.0, 10.0, 9.0, 15.0, 15.0, 14.0, 21.0, 18.0, 20.0, 27.0, 28.0, 34.0, 27.0, 31.0, 33.0, 47.0, 42.0, 38.0, 27.0, 1079.0, 28.0, 35.0, 43.0, 29.0, 26.0, 35.0, 29.0, 33.0, 29.0, 22.0, 23.0, 14.0, 21.0, 21.0, 14.0, 10.0, 6.0, 8.0, 13.0, 2.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.60546875, -2.522430419921875, -2.43939208984375, -2.356353759765625, -2.2733154296875, -2.190277099609375, -2.10723876953125, -2.024200439453125, -1.941162109375, -1.858123779296875, -1.77508544921875, -1.692047119140625, -1.6090087890625, -1.525970458984375, -1.44293212890625, -1.359893798828125, -1.27685546875, -1.193817138671875, -1.11077880859375, -1.027740478515625, -0.9447021484375, -0.861663818359375, -0.77862548828125, -0.695587158203125, -0.612548828125, -0.529510498046875, -0.44647216796875, -0.363433837890625, -0.2803955078125, -0.197357177734375, -0.11431884765625, -0.031280517578125, 0.0517578125, 0.134796142578125, 0.21783447265625, 0.300872802734375, 0.3839111328125, 0.466949462890625, 0.54998779296875, 0.633026123046875, 0.716064453125, 0.799102783203125, 0.88214111328125, 0.965179443359375, 1.0482177734375, 1.131256103515625, 1.21429443359375, 1.297332763671875, 1.38037109375, 1.463409423828125, 1.54644775390625, 1.629486083984375, 1.7125244140625, 1.795562744140625, 1.87860107421875, 1.961639404296875, 2.044677734375, 2.127716064453125, 2.21075439453125, 2.293792724609375, 2.3768310546875, 2.459869384765625, 2.54290771484375, 2.625946044921875, 2.708984375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 3.0, 5.0, 4.0, 14.0, 28.0, 41.0, 68.0, 65.0, 108.0, 141.0, 237.0, 326.0, 502.0, 703.0, 1155.0, 1696.0, 2553.0, 3930.0, 6188.0, 9447.0, 15185.0, 23862.0, 38394.0, 61938.0, 102020.0, 171177.0, 1267023.0, 151168.0, 90133.0, 55187.0, 34479.0, 21351.0, 13405.0, 8627.0, 5485.0, 3498.0, 2329.0, 1524.0, 1027.0, 698.0, 463.0, 314.0, 192.0, 159.0, 103.0, 76.0, 40.0, 23.0, 19.0, 10.0, 8.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.01013946533203125, -0.009805679321289062, -0.009471893310546875, -0.009138107299804688, -0.0088043212890625, -0.008470535278320312, -0.008136749267578125, -0.0078029632568359375, -0.00746917724609375, -0.0071353912353515625, -0.006801605224609375, -0.0064678192138671875, -0.006134033203125, -0.0058002471923828125, -0.005466461181640625, -0.0051326751708984375, -0.00479888916015625, -0.0044651031494140625, -0.004131317138671875, -0.0037975311279296875, -0.0034637451171875, -0.0031299591064453125, -0.002796173095703125, -0.0024623870849609375, -0.00212860107421875, -0.0017948150634765625, -0.001461029052734375, -0.0011272430419921875, -0.00079345703125, -0.0004596710205078125, -0.000125885009765625, 0.0002079010009765625, 0.00054168701171875, 0.0008754730224609375, 0.001209259033203125, 0.0015430450439453125, 0.0018768310546875, 0.0022106170654296875, 0.002544403076171875, 0.0028781890869140625, 0.00321197509765625, 0.0035457611083984375, 0.003879547119140625, 0.0042133331298828125, 0.004547119140625, 0.0048809051513671875, 0.005214691162109375, 0.0055484771728515625, 0.00588226318359375, 0.0062160491943359375, 0.006549835205078125, 0.0068836212158203125, 0.0072174072265625, 0.0075511932373046875, 0.007884979248046875, 0.008218765258789062, 0.00855255126953125, 0.008886337280273438, 0.009220123291015625, 0.009553909301757812, 0.0098876953125, 0.010221481323242188, 0.010555267333984375, 0.010889053344726562, 0.01122283935546875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 0.0, 2.0, 0.0, 6.0, 0.0, 8.0, 0.0, 13.0, 0.0, 10.0, 0.0, 32.0, 0.0, 25.0, 41.0, 0.0, 98.0, 0.0, 125.0, 0.0, 260.0, 0.0, 136.0, 0.0, 89.0, 0.0, 50.0, 0.0, 40.0, 0.0, 23.0, 0.0, 18.0, 0.0, 13.0, 0.0, 5.0, 0.0, 7.0, 0.0, 3.0, 0.0, 4.0, 0.0, 3.0, 1.0], "bins": [-1.1920928955078125e-06, -1.1613592505455017e-06, -1.130625605583191e-06, -1.0998919606208801e-06, -1.0691583156585693e-06, -1.0384246706962585e-06, -1.0076910257339478e-06, -9.76957380771637e-07, -9.462237358093262e-07, -9.154900908470154e-07, -8.847564458847046e-07, -8.540228009223938e-07, -8.23289155960083e-07, -7.925555109977722e-07, -7.618218660354614e-07, -7.310882210731506e-07, -7.003545761108398e-07, -6.69620931148529e-07, -6.388872861862183e-07, -6.081536412239075e-07, -5.774199962615967e-07, -5.466863512992859e-07, -5.159527063369751e-07, -4.852190613746643e-07, -4.544854164123535e-07, -4.237517714500427e-07, -3.9301812648773193e-07, -3.6228448152542114e-07, -3.3155083656311035e-07, -3.0081719160079956e-07, -2.7008354663848877e-07, -2.39349901676178e-07, -2.086162567138672e-07, -1.778826117515564e-07, -1.471489667892456e-07, -1.1641532182693481e-07, -8.568167686462402e-08, -5.494803190231323e-08, -2.421438694000244e-08, 6.51925802230835e-09, 3.725290298461914e-08, 6.798654794692993e-08, 9.872019290924072e-08, 1.2945383787155151e-07, 1.601874828338623e-07, 1.909211277961731e-07, 2.2165477275848389e-07, 2.523884177207947e-07, 2.8312206268310547e-07, 3.1385570764541626e-07, 3.4458935260772705e-07, 3.7532299757003784e-07, 4.0605664253234863e-07, 4.367902874946594e-07, 4.675239324569702e-07, 4.98257577419281e-07, 5.289912223815918e-07, 5.597248673439026e-07, 5.904585123062134e-07, 6.211921572685242e-07, 6.51925802230835e-07, 6.826594471931458e-07, 7.133930921554565e-07, 7.441267371177673e-07, 7.748603820800781e-07]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 3.0, 7.0, 10.0, 5.0, 19.0, 8.0, 20.0, 37.0, 36.0, 58.0, 95.0, 179.0, 459.0, 17120.0, 1019398.0, 10270.0, 362.0, 175.0, 92.0, 61.0, 22.0, 25.0, 14.0, 14.0, 18.0, 3.0, 4.0, 10.0, 6.0, 5.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7404556274414062e-05, -1.669209450483322e-05, -1.597963273525238e-05, -1.526717096567154e-05, -1.4554709196090698e-05, -1.3842247426509857e-05, -1.3129785656929016e-05, -1.2417323887348175e-05, -1.1704862117767334e-05, -1.0992400348186493e-05, -1.0279938578605652e-05, -9.56747680902481e-06, -8.85501503944397e-06, -8.142553269863129e-06, -7.430091500282288e-06, -6.7176297307014465e-06, -6.0051679611206055e-06, -5.292706191539764e-06, -4.580244421958923e-06, -3.867782652378082e-06, -3.155320882797241e-06, -2.4428591132164e-06, -1.730397343635559e-06, -1.017935574054718e-06, -3.0547380447387695e-07, 4.069879651069641e-07, 1.1194497346878052e-06, 1.8319115042686462e-06, 2.5443732738494873e-06, 3.2568350434303284e-06, 3.9692968130111694e-06, 4.6817585825920105e-06, 5.3942203521728516e-06, 6.106682121753693e-06, 6.819143891334534e-06, 7.531605660915375e-06, 8.244067430496216e-06, 8.956529200077057e-06, 9.668990969657898e-06, 1.0381452739238739e-05, 1.109391450881958e-05, 1.1806376278400421e-05, 1.2518838047981262e-05, 1.3231299817562103e-05, 1.3943761587142944e-05, 1.4656223356723785e-05, 1.5368685126304626e-05, 1.6081146895885468e-05, 1.679360866546631e-05, 1.750607043504715e-05, 1.821853220462799e-05, 1.8930993974208832e-05, 1.9643455743789673e-05, 2.0355917513370514e-05, 2.1068379282951355e-05, 2.1780841052532196e-05, 2.2493302822113037e-05, 2.3205764591693878e-05, 2.391822636127472e-05, 2.463068813085556e-05, 2.53431499004364e-05, 2.6055611670017242e-05, 2.6768073439598083e-05, 2.7480535209178925e-05, 2.8192996978759766e-05]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 30.0, 96.0, 286.0, 426.0, 131.0, 32.0, 7.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.9762257983966265e-06, -3.904108780261595e-06, -3.831991762126563e-06, -3.759874516617856e-06, -3.6877574984828243e-06, -3.6156404803477926e-06, -3.543523462212761e-06, -3.4714064440777292e-06, -3.399289198569022e-06, -3.3271721804339904e-06, -3.2550551622989587e-06, -3.1829379167902516e-06, -3.11082089865522e-06, -3.0387038805201882e-06, -2.9665868623851566e-06, -2.894469844250125e-06, -2.822352826115093e-06, -2.7502358079800615e-06, -2.67811878984503e-06, -2.6060015443363227e-06, -2.533884526201291e-06, -2.4617675080662593e-06, -2.3896504899312276e-06, -2.317533471796196e-06, -2.2454164536611643e-06, -2.1732994355261326e-06, -2.101182417391101e-06, -2.0290651718823938e-06, -1.956948153747362e-06, -1.8848311356123304e-06, -1.8127141174772987e-06, -1.740597099342267e-06, -1.6684796264598845e-06, -1.5963626083248528e-06, -1.5242454765029834e-06, -1.4521284583679517e-06, -1.3800113265460823e-06, -1.3078943084110506e-06, -1.235777290276019e-06, -1.1636602721409872e-06, -1.0915432540059555e-06, -1.0194262358709238e-06, -9.473091040490544e-07, -8.751920859140228e-07, -8.030750109355722e-07, -7.309579359571217e-07, -6.5884091782209e-07, -5.867238428436394e-07, -5.1460671102177e-07, -4.424896360433195e-07, -3.7037258948657836e-07, -2.9825554292983725e-07, -2.261384679513867e-07, -1.5402139297293616e-07, -8.190434641619504e-08, -9.787299859453924e-09, 6.232977511899662e-08, 1.3444683588659245e-07, 2.0656389665418828e-07, 2.786809432109294e-07, 3.5079801818937995e-07, 4.229150931678305e-07, 4.95032168146281e-07, 5.671491862813127e-07, 6.392662612597633e-07]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 56.0, 0.0, 0.0, 0.0, 103.0, 0.0, 0.0, 0.0, 206.0, 0.0, 0.0, 0.0, 0.0, 239.0, 0.0, 0.0, 0.0, 184.0, 0.0, 0.0, 0.0, 122.0, 0.0, 0.0, 0.0, 48.0, 0.0, 0.0, 0.0, 0.0, 19.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.76837158203125e-07, -4.628673195838928e-07, -4.4889748096466064e-07, -4.3492764234542847e-07, -4.209578037261963e-07, -4.069879651069641e-07, -3.9301812648773193e-07, -3.7904828786849976e-07, -3.650784492492676e-07, -3.511086106300354e-07, -3.371387720108032e-07, -3.2316893339157104e-07, -3.0919909477233887e-07, -2.952292561531067e-07, -2.812594175338745e-07, -2.6728957891464233e-07, -2.5331974029541016e-07, -2.39349901676178e-07, -2.253800630569458e-07, -2.1141022443771362e-07, -1.9744038581848145e-07, -1.8347054719924927e-07, -1.695007085800171e-07, -1.555308699607849e-07, -1.4156103134155273e-07, -1.2759119272232056e-07, -1.1362135410308838e-07, -9.96515154838562e-08, -8.568167686462402e-08, -7.171183824539185e-08, -5.774199962615967e-08, -4.377216100692749e-08, -2.9802322387695312e-08, -1.5832483768463135e-08, -1.862645149230957e-09, 1.210719347000122e-08, 2.60770320892334e-08, 4.0046870708465576e-08, 5.4016709327697754e-08, 6.798654794692993e-08, 8.195638656616211e-08, 9.592622518539429e-08, 1.0989606380462646e-07, 1.2386590242385864e-07, 1.3783574104309082e-07, 1.51805579662323e-07, 1.6577541828155518e-07, 1.7974525690078735e-07, 1.9371509552001953e-07, 2.076849341392517e-07, 2.2165477275848389e-07, 2.3562461137771606e-07, 2.4959444999694824e-07, 2.635642886161804e-07, 2.775341272354126e-07, 2.915039658546448e-07, 3.0547380447387695e-07, 3.1944364309310913e-07, 3.334134817123413e-07, 3.473833203315735e-07, 3.6135315895080566e-07, 3.7532299757003784e-07, 3.8929283618927e-07, 4.032626748085022e-07, 4.172325134277344e-07]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 4.0, 3.0, 9.0, 8.0, 10.0, 9.0, 18.0, 15.0, 23.0, 9.0, 19.0, 27.0, 28.0, 34.0, 46.0, 36.0, 54.0, 45.0, 40.0, 43.0, 39.0, 49.0, 37.0, 46.0, 46.0, 41.0, 33.0, 37.0, 24.0, 24.0, 28.0, 21.0, 23.0, 18.0, 15.0, 10.0, 10.0, 5.0, 5.0, 3.0, 5.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.87890625, -3.759674072265625, -3.64044189453125, -3.521209716796875, -3.4019775390625, -3.282745361328125, -3.16351318359375, -3.044281005859375, -2.925048828125, -2.805816650390625, -2.68658447265625, -2.567352294921875, -2.4481201171875, -2.328887939453125, -2.20965576171875, -2.090423583984375, -1.97119140625, -1.851959228515625, -1.73272705078125, -1.613494873046875, -1.4942626953125, -1.375030517578125, -1.25579833984375, -1.136566162109375, -1.017333984375, -0.898101806640625, -0.77886962890625, -0.659637451171875, -0.5404052734375, -0.421173095703125, -0.30194091796875, -0.182708740234375, -0.0634765625, 0.055755615234375, 0.17498779296875, 0.294219970703125, 0.4134521484375, 0.532684326171875, 0.65191650390625, 0.771148681640625, 0.890380859375, 1.009613037109375, 1.12884521484375, 1.248077392578125, 1.3673095703125, 1.486541748046875, 1.60577392578125, 1.725006103515625, 1.84423828125, 1.963470458984375, 2.08270263671875, 2.201934814453125, 2.3211669921875, 2.440399169921875, 2.55963134765625, 2.678863525390625, 2.798095703125, 2.917327880859375, 3.03656005859375, 3.155792236328125, 3.2750244140625, 3.394256591796875, 3.51348876953125, 3.632720947265625, 3.751953125]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 5.0, 6.0, 10.0, 27.0, 21.0, 24.0, 53.0, 68.0, 120.0, 148.0, 205.0, 327.0, 467.0, 680.0, 1000.0, 1509.0, 2352.0, 3523.0, 5434.0, 8473.0, 14204.0, 24426.0, 44029.0, 83841.0, 175314.0, 326400.0, 169772.0, 81485.0, 42499.0, 23849.0, 14052.0, 8477.0, 5413.0, 3434.0, 2223.0, 1572.0, 1005.0, 639.0, 475.0, 321.0, 212.0, 165.0, 80.0, 70.0, 48.0, 37.0, 30.0, 12.0, 13.0, 3.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.294921875, -3.179229736328125, -3.06353759765625, -2.947845458984375, -2.8321533203125, -2.716461181640625, -2.60076904296875, -2.485076904296875, -2.369384765625, -2.253692626953125, -2.13800048828125, -2.022308349609375, -1.9066162109375, -1.790924072265625, -1.67523193359375, -1.559539794921875, -1.44384765625, -1.328155517578125, -1.21246337890625, -1.096771240234375, -0.9810791015625, -0.865386962890625, -0.74969482421875, -0.634002685546875, -0.518310546875, -0.402618408203125, -0.28692626953125, -0.171234130859375, -0.0555419921875, 0.060150146484375, 0.17584228515625, 0.291534423828125, 0.4072265625, 0.522918701171875, 0.63861083984375, 0.754302978515625, 0.8699951171875, 0.985687255859375, 1.10137939453125, 1.217071533203125, 1.332763671875, 1.448455810546875, 1.56414794921875, 1.679840087890625, 1.7955322265625, 1.911224365234375, 2.02691650390625, 2.142608642578125, 2.25830078125, 2.373992919921875, 2.48968505859375, 2.605377197265625, 2.7210693359375, 2.836761474609375, 2.95245361328125, 3.068145751953125, 3.183837890625, 3.299530029296875, 3.41522216796875, 3.530914306640625, 3.6466064453125, 3.762298583984375, 3.87799072265625, 3.993682861328125, 4.109375]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 4.0, 4.0, 6.0, 16.0, 10.0, 14.0, 20.0, 22.0, 26.0, 26.0, 36.0, 34.0, 34.0, 37.0, 50.0, 53.0, 91.0, 169.0, 1391.0, 327.0, 151.0, 81.0, 54.0, 34.0, 59.0, 32.0, 27.0, 30.0, 41.0, 28.0, 18.0, 14.0, 22.0, 22.0, 7.0, 10.0, 10.0, 10.0, 4.0, 5.0, 4.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.59375, -9.2626953125, -8.931640625, -8.6005859375, -8.26953125, -7.9384765625, -7.607421875, -7.2763671875, -6.9453125, -6.6142578125, -6.283203125, -5.9521484375, -5.62109375, -5.2900390625, -4.958984375, -4.6279296875, -4.296875, -3.9658203125, -3.634765625, -3.3037109375, -2.97265625, -2.6416015625, -2.310546875, -1.9794921875, -1.6484375, -1.3173828125, -0.986328125, -0.6552734375, -0.32421875, 0.0068359375, 0.337890625, 0.6689453125, 1.0, 1.3310546875, 1.662109375, 1.9931640625, 2.32421875, 2.6552734375, 2.986328125, 3.3173828125, 3.6484375, 3.9794921875, 4.310546875, 4.6416015625, 4.97265625, 5.3037109375, 5.634765625, 5.9658203125, 6.296875, 6.6279296875, 6.958984375, 7.2900390625, 7.62109375, 7.9521484375, 8.283203125, 8.6142578125, 8.9453125, 9.2763671875, 9.607421875, 9.9384765625, 10.26953125, 10.6005859375, 10.931640625, 11.2626953125, 11.59375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 6.0, 10.0, 11.0, 15.0, 17.0, 23.0, 26.0, 41.0, 62.0, 66.0, 85.0, 150.0, 199.0, 354.0, 626.0, 1575.0, 5374.0, 28479.0, 273984.0, 2587046.0, 215353.0, 24414.0, 4772.0, 1458.0, 594.0, 326.0, 225.0, 135.0, 74.0, 41.0, 56.0, 20.0, 24.0, 14.0, 11.0, 10.0, 7.0, 4.0, 5.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.5625, -11.182861328125, -10.80322265625, -10.423583984375, -10.0439453125, -9.664306640625, -9.28466796875, -8.905029296875, -8.525390625, -8.145751953125, -7.76611328125, -7.386474609375, -7.0068359375, -6.627197265625, -6.24755859375, -5.867919921875, -5.48828125, -5.108642578125, -4.72900390625, -4.349365234375, -3.9697265625, -3.590087890625, -3.21044921875, -2.830810546875, -2.451171875, -2.071533203125, -1.69189453125, -1.312255859375, -0.9326171875, -0.552978515625, -0.17333984375, 0.206298828125, 0.5859375, 0.965576171875, 1.34521484375, 1.724853515625, 2.1044921875, 2.484130859375, 2.86376953125, 3.243408203125, 3.623046875, 4.002685546875, 4.38232421875, 4.761962890625, 5.1416015625, 5.521240234375, 5.90087890625, 6.280517578125, 6.66015625, 7.039794921875, 7.41943359375, 7.799072265625, 8.1787109375, 8.558349609375, 8.93798828125, 9.317626953125, 9.697265625, 10.076904296875, 10.45654296875, 10.836181640625, 11.2158203125, 11.595458984375, 11.97509765625, 12.354736328125, 12.734375]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 18.0, 70.0, 170.0, 291.0, 254.0, 131.0, 61.0, 13.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.1630973815918, -59.54860305786133, -57.934104919433594, -56.319610595703125, -54.70511245727539, -53.09061813354492, -51.47611999511719, -49.86162567138672, -48.24713134765625, -46.63263702392578, -45.01813888549805, -43.40364456176758, -41.789146423339844, -40.174652099609375, -38.560157775878906, -36.94565963745117, -35.33116149902344, -33.71666717529297, -32.102169036865234, -30.487674713134766, -28.873178482055664, -27.258682250976562, -25.64418601989746, -24.02968978881836, -22.41519546508789, -20.80069923400879, -19.186203002929688, -17.57170867919922, -15.957212448120117, -14.342716217041016, -12.728219985961914, -11.113724708557129, -9.499229431152344, -7.8847336769104, -6.270237922668457, -4.6557416915893555, -3.041245937347412, -1.4267501831054688, 0.1877460479736328, 1.802241325378418, 3.4167375564575195, 5.031233310699463, 6.645729064941406, 8.260225296020508, 9.87472152709961, 11.489216804504395, 13.103713035583496, 14.718208312988281, 16.332704544067383, 17.947200775146484, 19.561697006225586, 21.176193237304688, 22.790687561035156, 24.405183792114258, 26.01968002319336, 27.634174346923828, 29.248672485351562, 30.863168716430664, 32.477664947509766, 34.092159271240234, 35.70665740966797, 37.32115173339844, 38.935646057128906, 40.55014419555664, 42.16463851928711]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 8.0, 6.0, 6.0, 6.0, 19.0, 17.0, 19.0, 22.0, 18.0, 21.0, 27.0, 32.0, 31.0, 45.0, 47.0, 42.0, 27.0, 38.0, 44.0, 54.0, 34.0, 48.0, 47.0, 36.0, 35.0, 38.0, 38.0, 27.0, 24.0, 26.0, 24.0, 17.0, 14.0, 7.0, 23.0, 12.0, 4.0, 5.0, 3.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-32.847381591796875, -31.868642807006836, -30.88990592956543, -29.91116714477539, -28.932430267333984, -27.953691482543945, -26.974952697753906, -25.9962158203125, -25.017478942871094, -24.038740158081055, -23.06000328063965, -22.08126449584961, -21.102527618408203, -20.123788833618164, -19.145050048828125, -18.16631317138672, -17.18757438659668, -16.20883560180664, -15.230098724365234, -14.251359939575195, -13.272623062133789, -12.29388427734375, -11.315146446228027, -10.336408615112305, -9.357670783996582, -8.37893295288086, -7.400195121765137, -6.421456813812256, -5.442718982696533, -4.4639811515808105, -3.4852428436279297, -2.506505012512207, -1.5277671813964844, -0.5490292310714722, 0.42970871925354004, 1.4084467887878418, 2.3871846199035645, 3.365922451019287, 4.344660758972168, 5.323398590087891, 6.302136421203613, 7.280874252319336, 8.259612083435059, 9.238349914550781, 10.21708869934082, 11.195825576782227, 12.174564361572266, 13.153302192687988, 14.132040023803711, 15.110777854919434, 16.089515686035156, 17.068254470825195, 18.0469913482666, 19.02573013305664, 20.004467010498047, 20.983205795288086, 21.961944580078125, 22.940683364868164, 23.91942024230957, 24.89815902709961, 25.876895904541016, 26.855634689331055, 27.834373474121094, 28.8131103515625, 29.791847229003906]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 10.0, 5.0, 11.0, 11.0, 21.0, 11.0, 17.0, 17.0, 24.0, 21.0, 26.0, 46.0, 40.0, 47.0, 54.0, 39.0, 50.0, 35.0, 42.0, 46.0, 46.0, 50.0, 40.0, 41.0, 33.0, 25.0, 28.0, 24.0, 26.0, 24.0, 13.0, 18.0, 13.0, 8.0, 5.0, 5.0, 8.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.015625, -3.894073486328125, -3.77252197265625, -3.650970458984375, -3.5294189453125, -3.407867431640625, -3.28631591796875, -3.164764404296875, -3.043212890625, -2.921661376953125, -2.80010986328125, -2.678558349609375, -2.5570068359375, -2.435455322265625, -2.31390380859375, -2.192352294921875, -2.07080078125, -1.949249267578125, -1.82769775390625, -1.706146240234375, -1.5845947265625, -1.463043212890625, -1.34149169921875, -1.219940185546875, -1.098388671875, -0.976837158203125, -0.85528564453125, -0.733734130859375, -0.6121826171875, -0.490631103515625, -0.36907958984375, -0.247528076171875, -0.1259765625, -0.004425048828125, 0.11712646484375, 0.238677978515625, 0.3602294921875, 0.481781005859375, 0.60333251953125, 0.724884033203125, 0.846435546875, 0.967987060546875, 1.08953857421875, 1.211090087890625, 1.3326416015625, 1.454193115234375, 1.57574462890625, 1.697296142578125, 1.81884765625, 1.940399169921875, 2.06195068359375, 2.183502197265625, 2.3050537109375, 2.426605224609375, 2.54815673828125, 2.669708251953125, 2.791259765625, 2.912811279296875, 3.03436279296875, 3.155914306640625, 3.2774658203125, 3.399017333984375, 3.52056884765625, 3.642120361328125, 3.763671875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 7.0, 4.0, 6.0, 7.0, 6.0, 15.0, 15.0, 23.0, 29.0, 48.0, 55.0, 126.0, 228.0, 445.0, 902.0, 2148.0, 5572.0, 15704.0, 55088.0, 269880.0, 1926734.0, 1619431.0, 226474.0, 48555.0, 14008.0, 4981.0, 1982.0, 870.0, 417.0, 198.0, 103.0, 55.0, 47.0, 27.0, 25.0, 15.0, 8.0, 12.0, 10.0, 8.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.9765625, -8.712158203125, -8.44775390625, -8.183349609375, -7.9189453125, -7.654541015625, -7.39013671875, -7.125732421875, -6.861328125, -6.596923828125, -6.33251953125, -6.068115234375, -5.8037109375, -5.539306640625, -5.27490234375, -5.010498046875, -4.74609375, -4.481689453125, -4.21728515625, -3.952880859375, -3.6884765625, -3.424072265625, -3.15966796875, -2.895263671875, -2.630859375, -2.366455078125, -2.10205078125, -1.837646484375, -1.5732421875, -1.308837890625, -1.04443359375, -0.780029296875, -0.515625, -0.251220703125, 0.01318359375, 0.277587890625, 0.5419921875, 0.806396484375, 1.07080078125, 1.335205078125, 1.599609375, 1.864013671875, 2.12841796875, 2.392822265625, 2.6572265625, 2.921630859375, 3.18603515625, 3.450439453125, 3.71484375, 3.979248046875, 4.24365234375, 4.508056640625, 4.7724609375, 5.036865234375, 5.30126953125, 5.565673828125, 5.830078125, 6.094482421875, 6.35888671875, 6.623291015625, 6.8876953125, 7.152099609375, 7.41650390625, 7.680908203125, 7.9453125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 7.0, 12.0, 16.0, 15.0, 19.0, 27.0, 58.0, 84.0, 123.0, 174.0, 241.0, 402.0, 579.0, 649.0, 491.0, 350.0, 282.0, 165.0, 102.0, 95.0, 52.0, 45.0, 29.0, 20.0, 14.0, 4.0, 9.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.20703125, -6.96270751953125, -6.7183837890625, -6.47406005859375, -6.229736328125, -5.98541259765625, -5.7410888671875, -5.49676513671875, -5.25244140625, -5.00811767578125, -4.7637939453125, -4.51947021484375, -4.275146484375, -4.03082275390625, -3.7864990234375, -3.54217529296875, -3.2978515625, -3.05352783203125, -2.8092041015625, -2.56488037109375, -2.320556640625, -2.07623291015625, -1.8319091796875, -1.58758544921875, -1.34326171875, -1.09893798828125, -0.8546142578125, -0.61029052734375, -0.365966796875, -0.12164306640625, 0.1226806640625, 0.36700439453125, 0.611328125, 0.85565185546875, 1.0999755859375, 1.34429931640625, 1.588623046875, 1.83294677734375, 2.0772705078125, 2.32159423828125, 2.56591796875, 2.81024169921875, 3.0545654296875, 3.29888916015625, 3.543212890625, 3.78753662109375, 4.0318603515625, 4.27618408203125, 4.5205078125, 4.76483154296875, 5.0091552734375, 5.25347900390625, 5.497802734375, 5.74212646484375, 5.9864501953125, 6.23077392578125, 6.47509765625, 6.71942138671875, 6.9637451171875, 7.20806884765625, 7.452392578125, 7.69671630859375, 7.9410400390625, 8.18536376953125, 8.4296875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 6.0, 8.0, 7.0, 21.0, 27.0, 51.0, 66.0, 112.0, 206.0, 428.0, 1377.0, 8413.0, 212779.0, 3800108.0, 161231.0, 7284.0, 1285.0, 396.0, 192.0, 106.0, 69.0, 39.0, 23.0, 17.0, 10.0, 14.0, 6.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.6875, -29.822265625, -28.95703125, -28.091796875, -27.2265625, -26.361328125, -25.49609375, -24.630859375, -23.765625, -22.900390625, -22.03515625, -21.169921875, -20.3046875, -19.439453125, -18.57421875, -17.708984375, -16.84375, -15.978515625, -15.11328125, -14.248046875, -13.3828125, -12.517578125, -11.65234375, -10.787109375, -9.921875, -9.056640625, -8.19140625, -7.326171875, -6.4609375, -5.595703125, -4.73046875, -3.865234375, -3.0, -2.134765625, -1.26953125, -0.404296875, 0.4609375, 1.326171875, 2.19140625, 3.056640625, 3.921875, 4.787109375, 5.65234375, 6.517578125, 7.3828125, 8.248046875, 9.11328125, 9.978515625, 10.84375, 11.708984375, 12.57421875, 13.439453125, 14.3046875, 15.169921875, 16.03515625, 16.900390625, 17.765625, 18.630859375, 19.49609375, 20.361328125, 21.2265625, 22.091796875, 22.95703125, 23.822265625, 24.6875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 7.0, 46.0, 97.0, 228.0, 253.0, 193.0, 124.0, 49.0, 7.0, 7.0, 0.0, 2.0, 1.0, 1.0], "bins": [-129.52093505859375, -127.14391326904297, -124.76689910888672, -122.38987731933594, -120.01285552978516, -117.6358413696289, -115.25881958007812, -112.88180541992188, -110.5047836303711, -108.12776184082031, -105.75074768066406, -103.37372589111328, -100.9967041015625, -98.61968994140625, -96.24266815185547, -93.86564636230469, -91.48863220214844, -89.11161041259766, -86.7345962524414, -84.35757446289062, -81.98055267333984, -79.6035385131836, -77.22651672363281, -74.84950256347656, -72.47247314453125, -70.09545135498047, -67.71843719482422, -65.34141540527344, -62.96439743041992, -60.587379455566406, -58.210357666015625, -55.83333969116211, -53.456321716308594, -51.07930374145508, -48.7022819519043, -46.32526397705078, -43.948246002197266, -41.57122802734375, -39.19420623779297, -36.81718826293945, -34.44017028808594, -32.06315231323242, -29.686132431030273, -27.309112548828125, -24.93209457397461, -22.55507469177246, -20.178054809570312, -17.801036834716797, -15.424016952514648, -13.046998023986816, -10.669979095458984, -8.292959213256836, -5.915940284729004, -3.538921356201172, -1.1619014739990234, 1.2151165008544922, 3.5921363830566406, 5.969155311584473, 8.346174240112305, 10.723194122314453, 13.100213050842285, 15.477231979370117, 17.854251861572266, 20.23126983642578, 22.60828971862793]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 5.0, 6.0, 0.0, 11.0, 14.0, 14.0, 13.0, 15.0, 17.0, 22.0, 19.0, 23.0, 23.0, 42.0, 39.0, 31.0, 36.0, 38.0, 40.0, 37.0, 39.0, 31.0, 29.0, 38.0, 27.0, 43.0, 52.0, 37.0, 37.0, 33.0, 30.0, 29.0, 22.0, 10.0, 16.0, 10.0, 14.0, 15.0, 10.0, 10.0, 3.0, 4.0, 7.0, 6.0, 1.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.04638671875, -21.394601821899414, -20.742816925048828, -20.091032028198242, -19.439247131347656, -18.78746223449707, -18.135677337646484, -17.48389434814453, -16.832107543945312, -16.180322647094727, -15.52853775024414, -14.876752853393555, -14.224967956542969, -13.573183059692383, -12.921399116516113, -12.269614219665527, -11.617830276489258, -10.966045379638672, -10.314260482788086, -9.6624755859375, -9.010690689086914, -8.358905792236328, -7.707121849060059, -7.055336952209473, -6.403552055358887, -5.751767158508301, -5.099982261657715, -4.448197841644287, -3.796412944793701, -3.1446280479431152, -2.4928433895111084, -1.8410587310791016, -1.1892738342285156, -0.5374890565872192, 0.11429572105407715, 0.7660804986953735, 1.41786527633667, 2.069650173187256, 2.7214348316192627, 3.3732194900512695, 4.0250043869018555, 4.676789283752441, 5.328574180603027, 5.980358600616455, 6.632143497467041, 7.283928394317627, 7.935712814331055, 8.58749771118164, 9.239282608032227, 9.891067504882812, 10.542852401733398, 11.194637298583984, 11.84642219543457, 12.498207092285156, 13.149991035461426, 13.801775932312012, 14.453560829162598, 15.105345726013184, 15.75713062286377, 16.40891456604004, 17.060699462890625, 17.71248435974121, 18.364269256591797, 19.016054153442383, 19.66783905029297]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 4.0, 10.0, 7.0, 7.0, 9.0, 13.0, 17.0, 19.0, 18.0, 18.0, 27.0, 19.0, 30.0, 31.0, 34.0, 31.0, 54.0, 54.0, 51.0, 44.0, 38.0, 39.0, 53.0, 32.0, 35.0, 42.0, 24.0, 26.0, 29.0, 26.0, 35.0, 19.0, 27.0, 12.0, 14.0, 15.0, 10.0, 11.0, 2.0, 8.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.88671875, -3.7667236328125, -3.646728515625, -3.5267333984375, -3.40673828125, -3.2867431640625, -3.166748046875, -3.0467529296875, -2.9267578125, -2.8067626953125, -2.686767578125, -2.5667724609375, -2.44677734375, -2.3267822265625, -2.206787109375, -2.0867919921875, -1.966796875, -1.8468017578125, -1.726806640625, -1.6068115234375, -1.48681640625, -1.3668212890625, -1.246826171875, -1.1268310546875, -1.0068359375, -0.8868408203125, -0.766845703125, -0.6468505859375, -0.52685546875, -0.4068603515625, -0.286865234375, -0.1668701171875, -0.046875, 0.0731201171875, 0.193115234375, 0.3131103515625, 0.43310546875, 0.5531005859375, 0.673095703125, 0.7930908203125, 0.9130859375, 1.0330810546875, 1.153076171875, 1.2730712890625, 1.39306640625, 1.5130615234375, 1.633056640625, 1.7530517578125, 1.873046875, 1.9930419921875, 2.113037109375, 2.2330322265625, 2.35302734375, 2.4730224609375, 2.593017578125, 2.7130126953125, 2.8330078125, 2.9530029296875, 3.072998046875, 3.1929931640625, 3.31298828125, 3.4329833984375, 3.552978515625, 3.6729736328125, 3.79296875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 9.0, 6.0, 8.0, 17.0, 13.0, 24.0, 47.0, 56.0, 72.0, 115.0, 203.0, 254.0, 344.0, 554.0, 876.0, 1314.0, 1940.0, 3048.0, 4645.0, 7312.0, 11670.0, 18224.0, 28931.0, 47650.0, 82464.0, 147939.0, 255492.0, 183010.0, 101539.0, 57146.0, 34518.0, 21354.0, 13415.0, 8541.0, 5516.0, 3530.0, 2298.0, 1438.0, 1002.0, 658.0, 420.0, 323.0, 211.0, 131.0, 82.0, 63.0, 50.0, 26.0, 16.0, 22.0, 10.0, 5.0, 6.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.025238037109375, -0.024441242218017578, -0.023644447326660156, -0.022847652435302734, -0.022050857543945312, -0.02125406265258789, -0.02045726776123047, -0.019660472869873047, -0.018863677978515625, -0.018066883087158203, -0.01727008819580078, -0.01647329330444336, -0.015676498413085938, -0.014879703521728516, -0.014082908630371094, -0.013286113739013672, -0.01248931884765625, -0.011692523956298828, -0.010895729064941406, -0.010098934173583984, -0.009302139282226562, -0.00850534439086914, -0.007708549499511719, -0.006911754608154297, -0.006114959716796875, -0.005318164825439453, -0.004521369934082031, -0.0037245750427246094, -0.0029277801513671875, -0.0021309852600097656, -0.0013341903686523438, -0.0005373954772949219, 0.0002593994140625, 0.0010561943054199219, 0.0018529891967773438, 0.0026497840881347656, 0.0034465789794921875, 0.004243373870849609, 0.005040168762207031, 0.005836963653564453, 0.006633758544921875, 0.007430553436279297, 0.008227348327636719, 0.00902414321899414, 0.009820938110351562, 0.010617733001708984, 0.011414527893066406, 0.012211322784423828, 0.01300811767578125, 0.013804912567138672, 0.014601707458496094, 0.015398502349853516, 0.016195297241210938, 0.01699209213256836, 0.01778888702392578, 0.018585681915283203, 0.019382476806640625, 0.020179271697998047, 0.02097606658935547, 0.02177286148071289, 0.022569656372070312, 0.023366451263427734, 0.024163246154785156, 0.024960041046142578, 0.0257568359375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 3.0, 0.0, 1.0, 6.0, 6.0, 5.0, 6.0, 9.0, 13.0, 14.0, 13.0, 21.0, 21.0, 19.0, 20.0, 20.0, 35.0, 34.0, 26.0, 32.0, 45.0, 38.0, 40.0, 34.0, 1065.0, 50.0, 44.0, 34.0, 45.0, 40.0, 30.0, 35.0, 26.0, 32.0, 27.0, 25.0, 21.0, 15.0, 17.0, 16.0, 11.0, 8.0, 8.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.2734375, -3.168914794921875, -3.06439208984375, -2.959869384765625, -2.8553466796875, -2.750823974609375, -2.64630126953125, -2.541778564453125, -2.437255859375, -2.332733154296875, -2.22821044921875, -2.123687744140625, -2.0191650390625, -1.914642333984375, -1.81011962890625, -1.705596923828125, -1.60107421875, -1.496551513671875, -1.39202880859375, -1.287506103515625, -1.1829833984375, -1.078460693359375, -0.97393798828125, -0.869415283203125, -0.764892578125, -0.660369873046875, -0.55584716796875, -0.451324462890625, -0.3468017578125, -0.242279052734375, -0.13775634765625, -0.033233642578125, 0.0712890625, 0.175811767578125, 0.28033447265625, 0.384857177734375, 0.4893798828125, 0.593902587890625, 0.69842529296875, 0.802947998046875, 0.907470703125, 1.011993408203125, 1.11651611328125, 1.221038818359375, 1.3255615234375, 1.430084228515625, 1.53460693359375, 1.639129638671875, 1.74365234375, 1.848175048828125, 1.95269775390625, 2.057220458984375, 2.1617431640625, 2.266265869140625, 2.37078857421875, 2.475311279296875, 2.579833984375, 2.684356689453125, 2.78887939453125, 2.893402099609375, 2.9979248046875, 3.102447509765625, 3.20697021484375, 3.311492919921875, 3.416015625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 5.0, 3.0, 6.0, 12.0, 11.0, 20.0, 18.0, 37.0, 47.0, 78.0, 90.0, 125.0, 189.0, 210.0, 380.0, 535.0, 716.0, 1028.0, 1572.0, 2177.0, 3077.0, 4431.0, 6765.0, 10007.0, 15081.0, 22758.0, 34779.0, 54396.0, 86785.0, 143799.0, 1263456.0, 166463.0, 98845.0, 61632.0, 39460.0, 25876.0, 16974.0, 11342.0, 7493.0, 5133.0, 3479.0, 2345.0, 1661.0, 1106.0, 795.0, 557.0, 382.0, 270.0, 222.0, 137.0, 110.0, 89.0, 61.0, 31.0, 27.0, 20.0, 20.0, 11.0, 6.0, 5.0, 2.0, 0.0, 2.0], "bins": [-0.01081085205078125, -0.010469198226928711, -0.010127544403076172, -0.009785890579223633, -0.009444236755371094, -0.009102582931518555, -0.008760929107666016, -0.008419275283813477, -0.008077621459960938, -0.0077359676361083984, -0.007394313812255859, -0.00705265998840332, -0.006711006164550781, -0.006369352340698242, -0.006027698516845703, -0.005686044692993164, -0.005344390869140625, -0.005002737045288086, -0.004661083221435547, -0.004319429397583008, -0.003977775573730469, -0.0036361217498779297, -0.0032944679260253906, -0.0029528141021728516, -0.0026111602783203125, -0.0022695064544677734, -0.0019278526306152344, -0.0015861988067626953, -0.0012445449829101562, -0.0009028911590576172, -0.0005612373352050781, -0.00021958351135253906, 0.0001220703125, 0.00046372413635253906, 0.0008053779602050781, 0.0011470317840576172, 0.0014886856079101562, 0.0018303394317626953, 0.0021719932556152344, 0.0025136470794677734, 0.0028553009033203125, 0.0031969547271728516, 0.0035386085510253906, 0.0038802623748779297, 0.004221916198730469, 0.004563570022583008, 0.004905223846435547, 0.005246877670288086, 0.005588531494140625, 0.005930185317993164, 0.006271839141845703, 0.006613492965698242, 0.006955146789550781, 0.00729680061340332, 0.007638454437255859, 0.007980108261108398, 0.008321762084960938, 0.008663415908813477, 0.009005069732666016, 0.009346723556518555, 0.009688377380371094, 0.010030031204223633, 0.010371685028076172, 0.010713338851928711, 0.01105499267578125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 8.0, 0.0, 3.0, 9.0, 0.0, 5.0, 9.0, 0.0, 26.0, 35.0, 0.0, 30.0, 45.0, 0.0, 94.0, 0.0, 128.0, 230.0, 0.0, 146.0, 81.0, 0.0, 48.0, 43.0, 0.0, 21.0, 0.0, 18.0, 16.0, 0.0, 12.0, 1.0, 0.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.1324882507324219e-06, -1.0943040251731873e-06, -1.0561197996139526e-06, -1.017935574054718e-06, -9.797513484954834e-07, -9.415671229362488e-07, -9.033828973770142e-07, -8.651986718177795e-07, -8.270144462585449e-07, -7.888302206993103e-07, -7.506459951400757e-07, -7.124617695808411e-07, -6.742775440216064e-07, -6.360933184623718e-07, -5.979090929031372e-07, -5.597248673439026e-07, -5.21540641784668e-07, -4.833564162254333e-07, -4.4517219066619873e-07, -4.069879651069641e-07, -3.688037395477295e-07, -3.3061951398849487e-07, -2.9243528842926025e-07, -2.5425106287002563e-07, -2.1606683731079102e-07, -1.778826117515564e-07, -1.3969838619232178e-07, -1.0151416063308716e-07, -6.332993507385254e-08, -2.514570951461792e-08, 1.30385160446167e-08, 5.122274160385132e-08, 8.940696716308594e-08, 1.2759119272232056e-07, 1.6577541828155518e-07, 2.039596438407898e-07, 2.421438694000244e-07, 2.8032809495925903e-07, 3.1851232051849365e-07, 3.5669654607772827e-07, 3.948807716369629e-07, 4.330649971961975e-07, 4.7124922275543213e-07, 5.094334483146667e-07, 5.476176738739014e-07, 5.85801899433136e-07, 6.239861249923706e-07, 6.621703505516052e-07, 7.003545761108398e-07, 7.385388016700745e-07, 7.767230272293091e-07, 8.149072527885437e-07, 8.530914783477783e-07, 8.912757039070129e-07, 9.294599294662476e-07, 9.676441550254822e-07, 1.0058283805847168e-06, 1.0440126061439514e-06, 1.082196831703186e-06, 1.1203810572624207e-06, 1.1585652828216553e-06, 1.1967495083808899e-06, 1.2349337339401245e-06, 1.2731179594993591e-06, 1.3113021850585938e-06]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 8.0, 12.0, 16.0, 12.0, 17.0, 21.0, 45.0, 64.0, 98.0, 204.0, 1458.0, 854987.0, 190355.0, 762.0, 215.0, 83.0, 47.0, 40.0, 29.0, 19.0, 24.0, 10.0, 3.0, 5.0, 5.0, 4.0, 4.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9921531677246094e-05, -2.903863787651062e-05, -2.8155744075775146e-05, -2.7272850275039673e-05, -2.63899564743042e-05, -2.5507062673568726e-05, -2.4624168872833252e-05, -2.374127507209778e-05, -2.2858381271362305e-05, -2.197548747062683e-05, -2.1092593669891357e-05, -2.0209699869155884e-05, -1.932680606842041e-05, -1.8443912267684937e-05, -1.7561018466949463e-05, -1.667812466621399e-05, -1.5795230865478516e-05, -1.4912337064743042e-05, -1.4029443264007568e-05, -1.3146549463272095e-05, -1.2263655662536621e-05, -1.1380761861801147e-05, -1.0497868061065674e-05, -9.6149742603302e-06, -8.732080459594727e-06, -7.849186658859253e-06, -6.966292858123779e-06, -6.083399057388306e-06, -5.200505256652832e-06, -4.317611455917358e-06, -3.4347176551818848e-06, -2.551823854446411e-06, -1.6689300537109375e-06, -7.860362529754639e-07, 9.685754776000977e-08, 9.797513484954834e-07, 1.862645149230957e-06, 2.7455389499664307e-06, 3.6284327507019043e-06, 4.511326551437378e-06, 5.3942203521728516e-06, 6.277114152908325e-06, 7.160007953643799e-06, 8.042901754379272e-06, 8.925795555114746e-06, 9.80868935585022e-06, 1.0691583156585693e-05, 1.1574476957321167e-05, 1.245737075805664e-05, 1.3340264558792114e-05, 1.4223158359527588e-05, 1.5106052160263062e-05, 1.5988945960998535e-05, 1.687183976173401e-05, 1.7754733562469482e-05, 1.8637627363204956e-05, 1.952052116394043e-05, 2.0403414964675903e-05, 2.1286308765411377e-05, 2.216920256614685e-05, 2.3052096366882324e-05, 2.3934990167617798e-05, 2.481788396835327e-05, 2.5700777769088745e-05, 2.658367156982422e-05]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [6.0, 11.0, 35.0, 99.0, 279.0, 350.0, 159.0, 51.0, 22.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8575390703954326e-07, -3.1141877343543456e-07, -2.3708366825303528e-07, -1.627485488597813e-07, -8.84134294665273e-08, -1.407832428412803e-08, 6.025680931998068e-08, 1.3459194292408938e-07, 2.0892704810648866e-07, 2.8326218171059736e-07, 3.5759728689299664e-07, 4.319323920753959e-07, 5.062674972577952e-07, 5.806026592836133e-07, 6.549377644660126e-07, 7.292728696484119e-07, 8.0360803167423e-07, 8.779431368566293e-07, 9.522782420390286e-07, 1.0266134040648467e-06, 1.1009485660906648e-06, 1.1752836144296452e-06, 1.2496187764554634e-06, 1.3239539384812815e-06, 1.398288986820262e-06, 1.47262414884608e-06, 1.5469591971850605e-06, 1.6212943592108786e-06, 1.695629407549859e-06, 1.7699645695756772e-06, 1.8442997316014953e-06, 1.9186347799404757e-06, 1.992969828279456e-06, 2.0673048766184365e-06, 2.1416401523310924e-06, 2.215975200670073e-06, 2.2903102490090532e-06, 2.3646452973480336e-06, 2.4389805730606895e-06, 2.51331562139967e-06, 2.5876506697386503e-06, 2.6619857180776307e-06, 2.7363209937902866e-06, 2.810656042129267e-06, 2.8849910904682474e-06, 2.959326138807228e-06, 3.0336614145198837e-06, 3.107996462858864e-06, 3.18233173857152e-06, 3.2566667869105004e-06, 3.3310020626231562e-06, 3.4053371109621366e-06, 3.479672159301117e-06, 3.554007435013773e-06, 3.6283424833527533e-06, 3.7026775316917337e-06, 3.7770128074043896e-06, 3.8513480831170455e-06, 3.9256829040823504e-06, 4.000018179795006e-06, 4.074353455507662e-06, 4.148688276472967e-06, 4.223023552185623e-06, 4.297358827898279e-06, 4.371693648863584e-06]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 35.0, 0.0, 0.0, 0.0, 67.0, 0.0, 0.0, 0.0, 105.0, 0.0, 0.0, 0.0, 168.0, 0.0, 0.0, 0.0, 207.0, 0.0, 0.0, 0.0, 166.0, 0.0, 0.0, 0.0, 123.0, 0.0, 0.0, 0.0, 68.0, 0.0, 0.0, 0.0, 36.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-07, -4.6193599700927734e-07, -4.470348358154297e-07, -4.3213367462158203e-07, -4.172325134277344e-07, -4.023313522338867e-07, -3.8743019104003906e-07, -3.725290298461914e-07, -3.5762786865234375e-07, -3.427267074584961e-07, -3.2782554626464844e-07, -3.129243850708008e-07, -2.980232238769531e-07, -2.8312206268310547e-07, -2.682209014892578e-07, -2.5331974029541016e-07, -2.384185791015625e-07, -2.2351741790771484e-07, -2.086162567138672e-07, -1.9371509552001953e-07, -1.7881393432617188e-07, -1.6391277313232422e-07, -1.4901161193847656e-07, -1.341104507446289e-07, -1.1920928955078125e-07, -1.043081283569336e-07, -8.940696716308594e-08, -7.450580596923828e-08, -5.960464477539063e-08, -4.470348358154297e-08, -2.9802322387695312e-08, -1.4901161193847656e-08, 0.0, 1.4901161193847656e-08, 2.9802322387695312e-08, 4.470348358154297e-08, 5.960464477539063e-08, 7.450580596923828e-08, 8.940696716308594e-08, 1.043081283569336e-07, 1.1920928955078125e-07, 1.341104507446289e-07, 1.4901161193847656e-07, 1.6391277313232422e-07, 1.7881393432617188e-07, 1.9371509552001953e-07, 2.086162567138672e-07, 2.2351741790771484e-07, 2.384185791015625e-07, 2.5331974029541016e-07, 2.682209014892578e-07, 2.8312206268310547e-07, 2.980232238769531e-07, 3.129243850708008e-07, 3.2782554626464844e-07, 3.427267074584961e-07, 3.5762786865234375e-07, 3.725290298461914e-07, 3.8743019104003906e-07, 4.023313522338867e-07, 4.172325134277344e-07, 4.3213367462158203e-07, 4.470348358154297e-07, 4.6193599700927734e-07, 4.76837158203125e-07]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 4.0, 10.0, 7.0, 7.0, 9.0, 13.0, 17.0, 19.0, 18.0, 18.0, 27.0, 19.0, 30.0, 31.0, 34.0, 31.0, 54.0, 54.0, 51.0, 44.0, 38.0, 39.0, 53.0, 32.0, 35.0, 42.0, 24.0, 26.0, 29.0, 26.0, 35.0, 19.0, 27.0, 12.0, 14.0, 15.0, 10.0, 11.0, 2.0, 8.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.88671875, -3.7667236328125, -3.646728515625, -3.5267333984375, -3.40673828125, -3.2867431640625, -3.166748046875, -3.0467529296875, -2.9267578125, -2.8067626953125, -2.686767578125, -2.5667724609375, -2.44677734375, -2.3267822265625, -2.206787109375, -2.0867919921875, -1.966796875, -1.8468017578125, -1.726806640625, -1.6068115234375, -1.48681640625, -1.3668212890625, -1.246826171875, -1.1268310546875, -1.0068359375, -0.8868408203125, -0.766845703125, -0.6468505859375, -0.52685546875, -0.4068603515625, -0.286865234375, -0.1668701171875, -0.046875, 0.0731201171875, 0.193115234375, 0.3131103515625, 0.43310546875, 0.5531005859375, 0.673095703125, 0.7930908203125, 0.9130859375, 1.0330810546875, 1.153076171875, 1.2730712890625, 1.39306640625, 1.5130615234375, 1.633056640625, 1.7530517578125, 1.873046875, 1.9930419921875, 2.113037109375, 2.2330322265625, 2.35302734375, 2.4730224609375, 2.593017578125, 2.7130126953125, 2.8330078125, 2.9530029296875, 3.072998046875, 3.1929931640625, 3.31298828125, 3.4329833984375, 3.552978515625, 3.6729736328125, 3.79296875]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 1.0, 4.0, 6.0, 14.0, 21.0, 26.0, 41.0, 56.0, 108.0, 164.0, 257.0, 418.0, 695.0, 1019.0, 1895.0, 3085.0, 5060.0, 8407.0, 15094.0, 28542.0, 73623.0, 300296.0, 431562.0, 100828.0, 35560.0, 17506.0, 9615.0, 5881.0, 3442.0, 2042.0, 1248.0, 762.0, 496.0, 305.0, 178.0, 126.0, 70.0, 43.0, 22.0, 14.0, 9.0, 5.0, 7.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.859375, -4.7081298828125, -4.556884765625, -4.4056396484375, -4.25439453125, -4.1031494140625, -3.951904296875, -3.8006591796875, -3.6494140625, -3.4981689453125, -3.346923828125, -3.1956787109375, -3.04443359375, -2.8931884765625, -2.741943359375, -2.5906982421875, -2.439453125, -2.2882080078125, -2.136962890625, -1.9857177734375, -1.83447265625, -1.6832275390625, -1.531982421875, -1.3807373046875, -1.2294921875, -1.0782470703125, -0.927001953125, -0.7757568359375, -0.62451171875, -0.4732666015625, -0.322021484375, -0.1707763671875, -0.01953125, 0.1317138671875, 0.282958984375, 0.4342041015625, 0.58544921875, 0.7366943359375, 0.887939453125, 1.0391845703125, 1.1904296875, 1.3416748046875, 1.492919921875, 1.6441650390625, 1.79541015625, 1.9466552734375, 2.097900390625, 2.2491455078125, 2.400390625, 2.5516357421875, 2.702880859375, 2.8541259765625, 3.00537109375, 3.1566162109375, 3.307861328125, 3.4591064453125, 3.6103515625, 3.7615966796875, 3.912841796875, 4.0640869140625, 4.21533203125, 4.3665771484375, 4.517822265625, 4.6690673828125, 4.8203125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 4.0, 5.0, 10.0, 8.0, 16.0, 13.0, 15.0, 16.0, 22.0, 26.0, 17.0, 28.0, 33.0, 40.0, 41.0, 29.0, 46.0, 71.0, 114.0, 385.0, 1510.0, 166.0, 63.0, 36.0, 40.0, 36.0, 31.0, 27.0, 36.0, 33.0, 29.0, 21.0, 14.0, 19.0, 10.0, 13.0, 6.0, 5.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1015625, -10.7452392578125, -10.388916015625, -10.0325927734375, -9.67626953125, -9.3199462890625, -8.963623046875, -8.6072998046875, -8.2509765625, -7.8946533203125, -7.538330078125, -7.1820068359375, -6.82568359375, -6.4693603515625, -6.113037109375, -5.7567138671875, -5.400390625, -5.0440673828125, -4.687744140625, -4.3314208984375, -3.97509765625, -3.6187744140625, -3.262451171875, -2.9061279296875, -2.5498046875, -2.1934814453125, -1.837158203125, -1.4808349609375, -1.12451171875, -0.7681884765625, -0.411865234375, -0.0555419921875, 0.30078125, 0.6571044921875, 1.013427734375, 1.3697509765625, 1.72607421875, 2.0823974609375, 2.438720703125, 2.7950439453125, 3.1513671875, 3.5076904296875, 3.864013671875, 4.2203369140625, 4.57666015625, 4.9329833984375, 5.289306640625, 5.6456298828125, 6.001953125, 6.3582763671875, 6.714599609375, 7.0709228515625, 7.42724609375, 7.7835693359375, 8.139892578125, 8.4962158203125, 8.8525390625, 9.2088623046875, 9.565185546875, 9.9215087890625, 10.27783203125, 10.6341552734375, 10.990478515625, 11.3468017578125, 11.703125]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 5.0, 9.0, 13.0, 22.0, 34.0, 41.0, 52.0, 66.0, 103.0, 111.0, 166.0, 318.0, 847.0, 3134.0, 14541.0, 146782.0, 2832732.0, 128140.0, 13923.0, 2782.0, 856.0, 323.0, 206.0, 114.0, 80.0, 78.0, 54.0, 39.0, 33.0, 29.0, 18.0, 9.0, 11.0, 7.0, 8.0, 1.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.484375, -13.0560302734375, -12.627685546875, -12.1993408203125, -11.77099609375, -11.3426513671875, -10.914306640625, -10.4859619140625, -10.0576171875, -9.6292724609375, -9.200927734375, -8.7725830078125, -8.34423828125, -7.9158935546875, -7.487548828125, -7.0592041015625, -6.630859375, -6.2025146484375, -5.774169921875, -5.3458251953125, -4.91748046875, -4.4891357421875, -4.060791015625, -3.6324462890625, -3.2041015625, -2.7757568359375, -2.347412109375, -1.9190673828125, -1.49072265625, -1.0623779296875, -0.634033203125, -0.2056884765625, 0.22265625, 0.6510009765625, 1.079345703125, 1.5076904296875, 1.93603515625, 2.3643798828125, 2.792724609375, 3.2210693359375, 3.6494140625, 4.0777587890625, 4.506103515625, 4.9344482421875, 5.36279296875, 5.7911376953125, 6.219482421875, 6.6478271484375, 7.076171875, 7.5045166015625, 7.932861328125, 8.3612060546875, 8.78955078125, 9.2178955078125, 9.646240234375, 10.0745849609375, 10.5029296875, 10.9312744140625, 11.359619140625, 11.7879638671875, 12.21630859375, 12.6446533203125, 13.072998046875, 13.5013427734375, 13.9296875]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [36.0, 437.0, 512.0, 32.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.806355953216553, -3.492382764816284, -0.17840957641601562, 3.135563373565674, 6.4495368003845215, 9.763509750366211, 13.077482223510742, 16.391456604003906, 19.705429077148438, 23.01940155029297, 26.333375930786133, 29.647348403930664, 32.96132278442383, 36.27529525756836, 39.58926773071289, 42.90324401855469, 46.21721649169922, 49.53118896484375, 52.84516143798828, 56.15913391113281, 59.47311019897461, 62.78708267211914, 66.10105895996094, 69.41503143310547, 72.72900390625, 76.04297637939453, 79.35694885253906, 82.6709213256836, 85.98489379882812, 89.29887390136719, 92.61283874511719, 95.92681884765625, 99.24079132080078, 102.55476379394531, 105.86873626708984, 109.18270874023438, 112.4966812133789, 115.81065368652344, 119.1246337890625, 122.43860626220703, 125.75257873535156, 129.06655883789062, 132.38052368164062, 135.6945037841797, 139.0084686279297, 142.32244873046875, 145.63641357421875, 148.9503936767578, 152.2643585205078, 155.57833862304688, 158.89230346679688, 162.20628356933594, 165.52024841308594, 168.834228515625, 172.148193359375, 175.46217346191406, 178.77615356445312, 182.0901336669922, 185.4040985107422, 188.71807861328125, 192.03204345703125, 195.3460235595703, 198.6599884033203, 201.97396850585938, 205.28793334960938]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 9.0, 8.0, 17.0, 17.0, 9.0, 8.0, 18.0, 24.0, 28.0, 25.0, 49.0, 30.0, 38.0, 41.0, 31.0, 33.0, 59.0, 49.0, 46.0, 49.0, 36.0, 41.0, 41.0, 35.0, 37.0, 35.0, 25.0, 23.0, 26.0, 20.0, 19.0, 16.0, 10.0, 5.0, 12.0, 8.0, 5.0, 7.0, 0.0, 2.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.620820999145508, -28.647905349731445, -27.67498779296875, -26.702072143554688, -25.729154586791992, -24.75623893737793, -23.783321380615234, -22.810405731201172, -21.83749008178711, -20.864574432373047, -19.89165687561035, -18.91874122619629, -17.945823669433594, -16.97290802001953, -15.999991416931152, -15.027074813842773, -14.054157257080078, -13.0812406539917, -12.10832405090332, -11.135408401489258, -10.162490844726562, -9.1895751953125, -8.216658592224121, -7.243741989135742, -6.270825386047363, -5.297908782958984, -4.3249921798706055, -3.3520760536193848, -2.379159450531006, -1.406242847442627, -0.43332672119140625, 0.5395898818969727, 1.5125083923339844, 2.4854249954223633, 3.458341360092163, 4.431257724761963, 5.404174327850342, 6.377090930938721, 7.350007057189941, 8.32292366027832, 9.2958402633667, 10.268756866455078, 11.241673469543457, 12.214590072631836, 13.187505722045898, 14.160423278808594, 15.133338928222656, 16.10625457763672, 17.079172134399414, 18.052087783813477, 19.025005340576172, 19.997920989990234, 20.97083854675293, 21.943754196166992, 22.916671752929688, 23.88958740234375, 24.862503051757812, 25.835418701171875, 26.80833625793457, 27.781251907348633, 28.754169464111328, 29.72708511352539, 30.700000762939453, 31.67291831970215, 32.645835876464844]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 3.0, 7.0, 5.0, 11.0, 15.0, 17.0, 15.0, 20.0, 23.0, 19.0, 21.0, 24.0, 31.0, 27.0, 32.0, 39.0, 44.0, 53.0, 53.0, 44.0, 37.0, 33.0, 45.0, 40.0, 34.0, 35.0, 29.0, 33.0, 23.0, 25.0, 31.0, 15.0, 23.0, 17.0, 15.0, 15.0, 9.0, 10.0, 5.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.9765625, -3.856170654296875, -3.73577880859375, -3.615386962890625, -3.4949951171875, -3.374603271484375, -3.25421142578125, -3.133819580078125, -3.013427734375, -2.893035888671875, -2.77264404296875, -2.652252197265625, -2.5318603515625, -2.411468505859375, -2.29107666015625, -2.170684814453125, -2.05029296875, -1.929901123046875, -1.80950927734375, -1.689117431640625, -1.5687255859375, -1.448333740234375, -1.32794189453125, -1.207550048828125, -1.087158203125, -0.966766357421875, -0.84637451171875, -0.725982666015625, -0.6055908203125, -0.485198974609375, -0.36480712890625, -0.244415283203125, -0.1240234375, -0.003631591796875, 0.11676025390625, 0.237152099609375, 0.3575439453125, 0.477935791015625, 0.59832763671875, 0.718719482421875, 0.839111328125, 0.959503173828125, 1.07989501953125, 1.200286865234375, 1.3206787109375, 1.441070556640625, 1.56146240234375, 1.681854248046875, 1.80224609375, 1.922637939453125, 2.04302978515625, 2.163421630859375, 2.2838134765625, 2.404205322265625, 2.52459716796875, 2.644989013671875, 2.765380859375, 2.885772705078125, 3.00616455078125, 3.126556396484375, 3.2469482421875, 3.367340087890625, 3.48773193359375, 3.608123779296875, 3.728515625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 5.0, 1.0, 2.0, 4.0, 6.0, 15.0, 12.0, 18.0, 26.0, 42.0, 46.0, 75.0, 99.0, 135.0, 224.0, 331.0, 463.0, 685.0, 1171.0, 1979.0, 3397.0, 5811.0, 11036.0, 22702.0, 52305.0, 140142.0, 470734.0, 1599023.0, 1324111.0, 359749.0, 112734.0, 43659.0, 19988.0, 10068.0, 5459.0, 3075.0, 1753.0, 1086.0, 689.0, 447.0, 294.0, 195.0, 132.0, 93.0, 60.0, 66.0, 43.0, 29.0, 23.0, 9.0, 9.0, 10.0, 7.0, 5.0, 4.0, 3.0, 2.0, 3.0], "bins": [-5.95703125, -5.78131103515625, -5.6055908203125, -5.42987060546875, -5.254150390625, -5.07843017578125, -4.9027099609375, -4.72698974609375, -4.55126953125, -4.37554931640625, -4.1998291015625, -4.02410888671875, -3.848388671875, -3.67266845703125, -3.4969482421875, -3.32122802734375, -3.1455078125, -2.96978759765625, -2.7940673828125, -2.61834716796875, -2.442626953125, -2.26690673828125, -2.0911865234375, -1.91546630859375, -1.73974609375, -1.56402587890625, -1.3883056640625, -1.21258544921875, -1.036865234375, -0.86114501953125, -0.6854248046875, -0.50970458984375, -0.333984375, -0.15826416015625, 0.0174560546875, 0.19317626953125, 0.368896484375, 0.54461669921875, 0.7203369140625, 0.89605712890625, 1.07177734375, 1.24749755859375, 1.4232177734375, 1.59893798828125, 1.774658203125, 1.95037841796875, 2.1260986328125, 2.30181884765625, 2.4775390625, 2.65325927734375, 2.8289794921875, 3.00469970703125, 3.180419921875, 3.35614013671875, 3.5318603515625, 3.70758056640625, 3.88330078125, 4.05902099609375, 4.2347412109375, 4.41046142578125, 4.586181640625, 4.76190185546875, 4.9376220703125, 5.11334228515625, 5.2890625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 9.0, 9.0, 16.0, 12.0, 23.0, 47.0, 45.0, 64.0, 82.0, 118.0, 161.0, 195.0, 316.0, 393.0, 495.0, 517.0, 414.0, 283.0, 241.0, 164.0, 111.0, 93.0, 60.0, 47.0, 47.0, 19.0, 22.0, 16.0, 11.0, 7.0, 5.0, 11.0, 9.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.109375, -6.90020751953125, -6.6910400390625, -6.48187255859375, -6.272705078125, -6.06353759765625, -5.8543701171875, -5.64520263671875, -5.43603515625, -5.22686767578125, -5.0177001953125, -4.80853271484375, -4.599365234375, -4.39019775390625, -4.1810302734375, -3.97186279296875, -3.7626953125, -3.55352783203125, -3.3443603515625, -3.13519287109375, -2.926025390625, -2.71685791015625, -2.5076904296875, -2.29852294921875, -2.08935546875, -1.88018798828125, -1.6710205078125, -1.46185302734375, -1.252685546875, -1.04351806640625, -0.8343505859375, -0.62518310546875, -0.416015625, -0.20684814453125, 0.0023193359375, 0.21148681640625, 0.420654296875, 0.62982177734375, 0.8389892578125, 1.04815673828125, 1.25732421875, 1.46649169921875, 1.6756591796875, 1.88482666015625, 2.093994140625, 2.30316162109375, 2.5123291015625, 2.72149658203125, 2.9306640625, 3.13983154296875, 3.3489990234375, 3.55816650390625, 3.767333984375, 3.97650146484375, 4.1856689453125, 4.39483642578125, 4.60400390625, 4.81317138671875, 5.0223388671875, 5.23150634765625, 5.440673828125, 5.64984130859375, 5.8590087890625, 6.06817626953125, 6.27734375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 9.0, 8.0, 13.0, 13.0, 19.0, 18.0, 33.0, 42.0, 66.0, 118.0, 184.0, 305.0, 541.0, 1269.0, 3242.0, 11446.0, 64011.0, 689405.0, 3071211.0, 304870.0, 35425.0, 7602.0, 2367.0, 947.0, 437.0, 241.0, 159.0, 81.0, 56.0, 44.0, 25.0, 25.0, 14.0, 10.0, 9.0, 3.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.984375, -14.50634765625, -14.0283203125, -13.55029296875, -13.072265625, -12.59423828125, -12.1162109375, -11.63818359375, -11.16015625, -10.68212890625, -10.2041015625, -9.72607421875, -9.248046875, -8.77001953125, -8.2919921875, -7.81396484375, -7.3359375, -6.85791015625, -6.3798828125, -5.90185546875, -5.423828125, -4.94580078125, -4.4677734375, -3.98974609375, -3.51171875, -3.03369140625, -2.5556640625, -2.07763671875, -1.599609375, -1.12158203125, -0.6435546875, -0.16552734375, 0.3125, 0.79052734375, 1.2685546875, 1.74658203125, 2.224609375, 2.70263671875, 3.1806640625, 3.65869140625, 4.13671875, 4.61474609375, 5.0927734375, 5.57080078125, 6.048828125, 6.52685546875, 7.0048828125, 7.48291015625, 7.9609375, 8.43896484375, 8.9169921875, 9.39501953125, 9.873046875, 10.35107421875, 10.8291015625, 11.30712890625, 11.78515625, 12.26318359375, 12.7412109375, 13.21923828125, 13.697265625, 14.17529296875, 14.6533203125, 15.13134765625, 15.609375]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 17.0, 61.0, 212.0, 353.0, 264.0, 86.0, 15.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-170.74615478515625, -167.5551300048828, -164.36410522460938, -161.17308044433594, -157.98207092285156, -154.79104614257812, -151.6000213623047, -148.40899658203125, -145.2179718017578, -142.02694702148438, -138.83592224121094, -135.6448974609375, -132.45388793945312, -129.2628631591797, -126.07183837890625, -122.88081359863281, -119.68978881835938, -116.49876403808594, -113.30774688720703, -110.1167221069336, -106.92569732666016, -103.73467254638672, -100.54365539550781, -97.35263061523438, -94.16161346435547, -90.97058868408203, -87.77957153320312, -84.58854675292969, -81.39752197265625, -78.20649719238281, -75.0154800415039, -71.82445526123047, -68.63343048095703, -65.4424057006836, -62.25138473510742, -59.06036376953125, -55.86933898925781, -52.67831802368164, -49.48729705810547, -46.29627227783203, -43.105247497558594, -39.91422653198242, -36.723201751708984, -33.53218078613281, -30.341156005859375, -27.150135040283203, -23.9591121673584, -20.768089294433594, -17.577068328857422, -14.386045455932617, -11.195022583007812, -8.004000663757324, -4.8129777908325195, -1.6219549179077148, 1.5690670013427734, 4.760089874267578, 7.951112747192383, 11.142135620117188, 14.333158493041992, 17.524181365966797, 20.71520233154297, 23.906227111816406, 27.097248077392578, 30.288270950317383, 33.47929382324219]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 3.0, 8.0, 4.0, 13.0, 9.0, 9.0, 6.0, 20.0, 13.0, 15.0, 22.0, 19.0, 27.0, 20.0, 36.0, 37.0, 32.0, 49.0, 48.0, 44.0, 44.0, 40.0, 60.0, 45.0, 39.0, 38.0, 39.0, 32.0, 43.0, 24.0, 24.0, 26.0, 28.0, 23.0, 13.0, 15.0, 6.0, 6.0, 8.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.090110778808594, -22.3328914642334, -21.575674057006836, -20.81845474243164, -20.061235427856445, -19.30401611328125, -18.546798706054688, -17.789579391479492, -17.032360076904297, -16.2751407623291, -15.517922401428223, -14.760704040527344, -14.003484725952148, -13.24626636505127, -12.48904800415039, -11.731828689575195, -10.974611282348633, -10.217392921447754, -9.460173606872559, -8.70295524597168, -7.945736408233643, -7.1885175704956055, -6.431299209594727, -5.6740803718566895, -4.916861534118652, -4.159642696380615, -3.4024240970611572, -2.645205497741699, -1.887986660003662, -1.130767822265625, -0.3735494613647461, 0.383669376373291, 1.1408882141113281, 1.8981069326400757, 2.6553256511688232, 3.4125442504882812, 4.169763088226318, 4.9269819259643555, 5.684200286865234, 6.4414191246032715, 7.198637962341309, 7.955856800079346, 8.713075637817383, 9.470293998718262, 10.22751235961914, 10.984731674194336, 11.741950035095215, 12.499168395996094, 13.256387710571289, 14.013606071472168, 14.770825386047363, 15.528043746948242, 16.285263061523438, 17.04248046875, 17.799699783325195, 18.55691909790039, 19.314136505126953, 20.07135581970215, 20.82857322692871, 21.585792541503906, 22.3430118560791, 23.100231170654297, 23.85744857788086, 24.614667892456055, 25.37188720703125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 1.0, 3.0, 5.0, 6.0, 5.0, 4.0, 12.0, 15.0, 21.0, 23.0, 16.0, 22.0, 27.0, 24.0, 33.0, 34.0, 33.0, 27.0, 48.0, 49.0, 41.0, 44.0, 54.0, 47.0, 52.0, 27.0, 48.0, 32.0, 33.0, 29.0, 26.0, 29.0, 28.0, 14.0, 15.0, 12.0, 9.0, 16.0, 4.0, 9.0, 13.0, 7.0, 6.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.896484375, -3.766815185546875, -3.63714599609375, -3.507476806640625, -3.3778076171875, -3.248138427734375, -3.11846923828125, -2.988800048828125, -2.859130859375, -2.729461669921875, -2.59979248046875, -2.470123291015625, -2.3404541015625, -2.210784912109375, -2.08111572265625, -1.951446533203125, -1.82177734375, -1.692108154296875, -1.56243896484375, -1.432769775390625, -1.3031005859375, -1.173431396484375, -1.04376220703125, -0.914093017578125, -0.784423828125, -0.654754638671875, -0.52508544921875, -0.395416259765625, -0.2657470703125, -0.136077880859375, -0.00640869140625, 0.123260498046875, 0.2529296875, 0.382598876953125, 0.51226806640625, 0.641937255859375, 0.7716064453125, 0.901275634765625, 1.03094482421875, 1.160614013671875, 1.290283203125, 1.419952392578125, 1.54962158203125, 1.679290771484375, 1.8089599609375, 1.938629150390625, 2.06829833984375, 2.197967529296875, 2.32763671875, 2.457305908203125, 2.58697509765625, 2.716644287109375, 2.8463134765625, 2.975982666015625, 3.10565185546875, 3.235321044921875, 3.364990234375, 3.494659423828125, 3.62432861328125, 3.753997802734375, 3.8836669921875, 4.013336181640625, 4.14300537109375, 4.272674560546875, 4.40234375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 6.0, 3.0, 7.0, 6.0, 15.0, 23.0, 28.0, 45.0, 59.0, 76.0, 142.0, 166.0, 238.0, 336.0, 484.0, 718.0, 949.0, 1453.0, 2032.0, 3038.0, 4137.0, 5982.0, 8689.0, 12872.0, 19053.0, 28976.0, 45226.0, 73658.0, 126919.0, 221421.0, 195757.0, 109671.0, 64975.0, 40383.0, 25914.0, 17329.0, 11605.0, 8081.0, 5509.0, 3779.0, 2618.0, 1836.0, 1296.0, 923.0, 670.0, 449.0, 296.0, 192.0, 153.0, 112.0, 86.0, 53.0, 31.0, 41.0, 20.0, 9.0, 14.0, 4.0, 5.0, 1.0, 2.0], "bins": [-0.0235595703125, -0.022842884063720703, -0.022126197814941406, -0.02140951156616211, -0.020692825317382812, -0.019976139068603516, -0.01925945281982422, -0.018542766571044922, -0.017826080322265625, -0.017109394073486328, -0.01639270782470703, -0.015676021575927734, -0.014959335327148438, -0.01424264907836914, -0.013525962829589844, -0.012809276580810547, -0.01209259033203125, -0.011375904083251953, -0.010659217834472656, -0.00994253158569336, -0.009225845336914062, -0.008509159088134766, -0.007792472839355469, -0.007075786590576172, -0.006359100341796875, -0.005642414093017578, -0.004925727844238281, -0.004209041595458984, -0.0034923553466796875, -0.0027756690979003906, -0.0020589828491210938, -0.0013422966003417969, -0.0006256103515625, 9.107589721679688e-05, 0.0008077621459960938, 0.0015244483947753906, 0.0022411346435546875, 0.0029578208923339844, 0.0036745071411132812, 0.004391193389892578, 0.005107879638671875, 0.005824565887451172, 0.006541252136230469, 0.007257938385009766, 0.007974624633789062, 0.00869131088256836, 0.009407997131347656, 0.010124683380126953, 0.01084136962890625, 0.011558055877685547, 0.012274742126464844, 0.01299142837524414, 0.013708114624023438, 0.014424800872802734, 0.015141487121582031, 0.015858173370361328, 0.016574859619140625, 0.017291545867919922, 0.01800823211669922, 0.018724918365478516, 0.019441604614257812, 0.02015829086303711, 0.020874977111816406, 0.021591663360595703, 0.022308349609375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 7.0, 1.0, 3.0, 9.0, 18.0, 10.0, 12.0, 5.0, 21.0, 13.0, 18.0, 34.0, 22.0, 23.0, 22.0, 31.0, 36.0, 28.0, 30.0, 46.0, 40.0, 32.0, 48.0, 1060.0, 32.0, 38.0, 34.0, 31.0, 28.0, 34.0, 30.0, 33.0, 24.0, 28.0, 25.0, 24.0, 15.0, 16.0, 13.0, 8.0, 7.0, 8.0, 8.0, 8.0, 1.0, 6.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.486328125, -3.378021240234375, -3.26971435546875, -3.161407470703125, -3.0531005859375, -2.944793701171875, -2.83648681640625, -2.728179931640625, -2.619873046875, -2.511566162109375, -2.40325927734375, -2.294952392578125, -2.1866455078125, -2.078338623046875, -1.97003173828125, -1.861724853515625, -1.75341796875, -1.645111083984375, -1.53680419921875, -1.428497314453125, -1.3201904296875, -1.211883544921875, -1.10357666015625, -0.995269775390625, -0.886962890625, -0.778656005859375, -0.67034912109375, -0.562042236328125, -0.4537353515625, -0.345428466796875, -0.23712158203125, -0.128814697265625, -0.0205078125, 0.087799072265625, 0.19610595703125, 0.304412841796875, 0.4127197265625, 0.521026611328125, 0.62933349609375, 0.737640380859375, 0.845947265625, 0.954254150390625, 1.06256103515625, 1.170867919921875, 1.2791748046875, 1.387481689453125, 1.49578857421875, 1.604095458984375, 1.71240234375, 1.820709228515625, 1.92901611328125, 2.037322998046875, 2.1456298828125, 2.253936767578125, 2.36224365234375, 2.470550537109375, 2.578857421875, 2.687164306640625, 2.79547119140625, 2.903778076171875, 3.0120849609375, 3.120391845703125, 3.22869873046875, 3.337005615234375, 3.4453125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 14.0, 6.0, 23.0, 38.0, 34.0, 67.0, 91.0, 127.0, 166.0, 248.0, 386.0, 555.0, 729.0, 1124.0, 1582.0, 2344.0, 3392.0, 5299.0, 7841.0, 11614.0, 17411.0, 27463.0, 42470.0, 67740.0, 113124.0, 194589.0, 1259575.0, 127986.0, 75648.0, 46810.0, 30423.0, 19333.0, 12706.0, 8554.0, 5730.0, 3642.0, 2576.0, 1775.0, 1206.0, 754.0, 603.0, 424.0, 302.0, 167.0, 112.0, 101.0, 74.0, 59.0, 38.0, 21.0, 13.0, 6.0, 5.0, 9.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.012420654296875, -0.012033820152282715, -0.01164698600769043, -0.011260151863098145, -0.01087331771850586, -0.010486483573913574, -0.010099649429321289, -0.009712815284729004, -0.009325981140136719, -0.008939146995544434, -0.008552312850952148, -0.008165478706359863, -0.007778644561767578, -0.007391810417175293, -0.007004976272583008, -0.006618142127990723, -0.0062313079833984375, -0.005844473838806152, -0.005457639694213867, -0.005070805549621582, -0.004683971405029297, -0.004297137260437012, -0.0039103031158447266, -0.0035234689712524414, -0.0031366348266601562, -0.002749800682067871, -0.002362966537475586, -0.0019761323928833008, -0.0015892982482910156, -0.0012024641036987305, -0.0008156299591064453, -0.00042879581451416016, -4.1961669921875e-05, 0.00034487247467041016, 0.0007317066192626953, 0.0011185407638549805, 0.0015053749084472656, 0.0018922090530395508, 0.002279043197631836, 0.002665877342224121, 0.0030527114868164062, 0.0034395456314086914, 0.0038263797760009766, 0.004213213920593262, 0.004600048065185547, 0.004986882209777832, 0.005373716354370117, 0.005760550498962402, 0.0061473846435546875, 0.006534218788146973, 0.006921052932739258, 0.007307887077331543, 0.007694721221923828, 0.008081555366516113, 0.008468389511108398, 0.008855223655700684, 0.009242057800292969, 0.009628891944885254, 0.010015726089477539, 0.010402560234069824, 0.01078939437866211, 0.011176228523254395, 0.01156306266784668, 0.011949896812438965, 0.01233673095703125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 5.0, 5.0, 0.0, 4.0, 8.0, 0.0, 8.0, 8.0, 0.0, 21.0, 24.0, 0.0, 39.0, 80.0, 0.0, 154.0, 267.0, 0.0, 148.0, 79.0, 0.0, 52.0, 33.0, 0.0, 29.0, 12.0, 0.0, 8.0, 9.0, 0.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-06, -1.152046024799347e-06, -1.1119991540908813e-06, -1.0719522833824158e-06, -1.0319054126739502e-06, -9.918585419654846e-07, -9.51811671257019e-07, -9.117648005485535e-07, -8.717179298400879e-07, -8.316710591316223e-07, -7.916241884231567e-07, -7.515773177146912e-07, -7.115304470062256e-07, -6.7148357629776e-07, -6.314367055892944e-07, -5.913898348808289e-07, -5.513429641723633e-07, -5.112960934638977e-07, -4.7124922275543213e-07, -4.3120235204696655e-07, -3.91155481338501e-07, -3.511086106300354e-07, -3.110617399215698e-07, -2.7101486921310425e-07, -2.3096799850463867e-07, -1.909211277961731e-07, -1.5087425708770752e-07, -1.1082738637924194e-07, -7.078051567077637e-08, -3.073364496231079e-08, 9.313225746154785e-09, 4.936009645462036e-08, 8.940696716308594e-08, 1.2945383787155151e-07, 1.695007085800171e-07, 2.0954757928848267e-07, 2.4959444999694824e-07, 2.896413207054138e-07, 3.296881914138794e-07, 3.6973506212234497e-07, 4.0978193283081055e-07, 4.498288035392761e-07, 4.898756742477417e-07, 5.299225449562073e-07, 5.699694156646729e-07, 6.100162863731384e-07, 6.50063157081604e-07, 6.901100277900696e-07, 7.301568984985352e-07, 7.702037692070007e-07, 8.102506399154663e-07, 8.502975106239319e-07, 8.903443813323975e-07, 9.30391252040863e-07, 9.704381227493286e-07, 1.0104849934577942e-06, 1.0505318641662598e-06, 1.0905787348747253e-06, 1.130625605583191e-06, 1.1706724762916565e-06, 1.210719347000122e-06, 1.2507662177085876e-06, 1.2908130884170532e-06, 1.3308599591255188e-06, 1.3709068298339844e-06]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 7.0, 7.0, 7.0, 10.0, 19.0, 22.0, 40.0, 66.0, 82.0, 185.0, 712.0, 170858.0, 875121.0, 982.0, 187.0, 87.0, 49.0, 25.0, 22.0, 19.0, 6.0, 8.0, 5.0, 4.0, 4.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.1948089599609375e-05, -3.101024776697159e-05, -3.00724059343338e-05, -2.9134564101696014e-05, -2.8196722269058228e-05, -2.725888043642044e-05, -2.6321038603782654e-05, -2.5383196771144867e-05, -2.444535493850708e-05, -2.3507513105869293e-05, -2.2569671273231506e-05, -2.163182944059372e-05, -2.0693987607955933e-05, -1.9756145775318146e-05, -1.881830394268036e-05, -1.7880462110042572e-05, -1.6942620277404785e-05, -1.6004778444766998e-05, -1.5066936612129211e-05, -1.4129094779491425e-05, -1.3191252946853638e-05, -1.225341111421585e-05, -1.1315569281578064e-05, -1.0377727448940277e-05, -9.43988561630249e-06, -8.502043783664703e-06, -7.5642019510269165e-06, -6.62636011838913e-06, -5.688518285751343e-06, -4.750676453113556e-06, -3.812834620475769e-06, -2.874992787837982e-06, -1.9371509552001953e-06, -9.993091225624084e-07, -6.146728992462158e-08, 8.763745427131653e-07, 1.8142163753509521e-06, 2.752058207988739e-06, 3.689900040626526e-06, 4.627741873264313e-06, 5.5655837059021e-06, 6.5034255385398865e-06, 7.441267371177673e-06, 8.37910920381546e-06, 9.316951036453247e-06, 1.0254792869091034e-05, 1.119263470172882e-05, 1.2130476534366608e-05, 1.3068318367004395e-05, 1.4006160199642181e-05, 1.4944002032279968e-05, 1.5881843864917755e-05, 1.6819685697555542e-05, 1.775752753019333e-05, 1.8695369362831116e-05, 1.9633211195468903e-05, 2.057105302810669e-05, 2.1508894860744476e-05, 2.2446736693382263e-05, 2.338457852602005e-05, 2.4322420358657837e-05, 2.5260262191295624e-05, 2.619810402393341e-05, 2.7135945856571198e-05, 2.8073787689208984e-05]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 6.0, 6.0, 17.0, 51.0, 131.0, 204.0, 288.0, 167.0, 78.0, 34.0, 17.0, 9.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.900216481473763e-07, -4.425238842031831e-07, -3.9502612025899e-07, -3.475283278930874e-07, -3.0003056394889427e-07, -2.5253280000470113e-07, -2.0503500763879856e-07, -1.5753724369460542e-07, -1.1003947975041228e-07, -6.254170870079179e-08, -1.504393765117129e-08, 3.245384050387656e-08, 7.99516044480697e-08, 1.2744936839226284e-07, 1.749471607581654e-07, 2.2244492470235855e-07, 2.699426886465517e-07, 3.174404525907448e-07, 3.6493821653493796e-07, 4.1243600890084053e-07, 4.5993377284503367e-07, 5.074315367892268e-07, 5.549293291551294e-07, 6.02427121521032e-07, 6.499248570435157e-07, 6.974226494094182e-07, 7.449203849319019e-07, 7.924181772978045e-07, 8.399159696637071e-07, 8.874137051861908e-07, 9.349114975520934e-07, 9.82409233074577e-07, 1.0299070254404796e-06, 1.0774048178063822e-06, 1.1249026101722848e-06, 1.1724002888513496e-06, 1.2198980812172522e-06, 1.2673958735831548e-06, 1.3148936659490573e-06, 1.3623914583149599e-06, 1.4098891369940247e-06, 1.4573869293599273e-06, 1.5048847217258299e-06, 1.5523824004048947e-06, 1.5998801927707973e-06, 1.6473779851366999e-06, 1.6948757775026024e-06, 1.742373569868505e-06, 1.7898713622344076e-06, 1.8373691546003101e-06, 1.8848669469662127e-06, 1.9323647393321153e-06, 1.97986241801118e-06, 2.027360096690245e-06, 2.0748580027429853e-06, 2.12235568142205e-06, 2.1698535874747904e-06, 2.2173512661538552e-06, 2.2648491722065955e-06, 2.3123468508856604e-06, 2.3598447569384007e-06, 2.4073424356174655e-06, 2.454840341670206e-06, 2.5023380203492707e-06, 2.5498356990283355e-06]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 30.0, 0.0, 0.0, 0.0, 0.0, 43.0, 0.0, 0.0, 0.0, 103.0, 0.0, 0.0, 0.0, 192.0, 0.0, 0.0, 0.0, 228.0, 0.0, 0.0, 0.0, 0.0, 203.0, 0.0, 0.0, 0.0, 110.0, 0.0, 0.0, 0.0, 66.0, 0.0, 0.0, 0.0, 18.0, 0.0, 0.0, 0.0, 0.0, 11.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.172325134277344e-07, -4.032626748085022e-07, -3.8929283618927e-07, -3.7532299757003784e-07, -3.6135315895080566e-07, -3.473833203315735e-07, -3.334134817123413e-07, -3.1944364309310913e-07, -3.0547380447387695e-07, -2.915039658546448e-07, -2.775341272354126e-07, -2.635642886161804e-07, -2.4959444999694824e-07, -2.3562461137771606e-07, -2.2165477275848389e-07, -2.076849341392517e-07, -1.9371509552001953e-07, -1.7974525690078735e-07, -1.6577541828155518e-07, -1.51805579662323e-07, -1.3783574104309082e-07, -1.2386590242385864e-07, -1.0989606380462646e-07, -9.592622518539429e-08, -8.195638656616211e-08, -6.798654794692993e-08, -5.4016709327697754e-08, -4.0046870708465576e-08, -2.60770320892334e-08, -1.210719347000122e-08, 1.862645149230957e-09, 1.5832483768463135e-08, 2.9802322387695312e-08, 4.377216100692749e-08, 5.774199962615967e-08, 7.171183824539185e-08, 8.568167686462402e-08, 9.96515154838562e-08, 1.1362135410308838e-07, 1.2759119272232056e-07, 1.4156103134155273e-07, 1.555308699607849e-07, 1.695007085800171e-07, 1.8347054719924927e-07, 1.9744038581848145e-07, 2.1141022443771362e-07, 2.253800630569458e-07, 2.39349901676178e-07, 2.5331974029541016e-07, 2.6728957891464233e-07, 2.812594175338745e-07, 2.952292561531067e-07, 3.0919909477233887e-07, 3.2316893339157104e-07, 3.371387720108032e-07, 3.511086106300354e-07, 3.650784492492676e-07, 3.7904828786849976e-07, 3.9301812648773193e-07, 4.069879651069641e-07, 4.209578037261963e-07, 4.3492764234542847e-07, 4.4889748096466064e-07, 4.628673195838928e-07, 4.76837158203125e-07]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 1.0, 3.0, 5.0, 6.0, 5.0, 4.0, 12.0, 15.0, 21.0, 23.0, 16.0, 22.0, 27.0, 24.0, 33.0, 34.0, 33.0, 27.0, 48.0, 49.0, 41.0, 44.0, 54.0, 47.0, 52.0, 27.0, 48.0, 32.0, 33.0, 29.0, 26.0, 29.0, 28.0, 14.0, 15.0, 12.0, 9.0, 16.0, 4.0, 9.0, 13.0, 7.0, 6.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.896484375, -3.766815185546875, -3.63714599609375, -3.507476806640625, -3.3778076171875, -3.248138427734375, -3.11846923828125, -2.988800048828125, -2.859130859375, -2.729461669921875, -2.59979248046875, -2.470123291015625, -2.3404541015625, -2.210784912109375, -2.08111572265625, -1.951446533203125, -1.82177734375, -1.692108154296875, -1.56243896484375, -1.432769775390625, -1.3031005859375, -1.173431396484375, -1.04376220703125, -0.914093017578125, -0.784423828125, -0.654754638671875, -0.52508544921875, -0.395416259765625, -0.2657470703125, -0.136077880859375, -0.00640869140625, 0.123260498046875, 0.2529296875, 0.382598876953125, 0.51226806640625, 0.641937255859375, 0.7716064453125, 0.901275634765625, 1.03094482421875, 1.160614013671875, 1.290283203125, 1.419952392578125, 1.54962158203125, 1.679290771484375, 1.8089599609375, 1.938629150390625, 2.06829833984375, 2.197967529296875, 2.32763671875, 2.457305908203125, 2.58697509765625, 2.716644287109375, 2.8463134765625, 2.975982666015625, 3.10565185546875, 3.235321044921875, 3.364990234375, 3.494659423828125, 3.62432861328125, 3.753997802734375, 3.8836669921875, 4.013336181640625, 4.14300537109375, 4.272674560546875, 4.40234375]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 6.0, 2.0, 14.0, 6.0, 15.0, 16.0, 29.0, 26.0, 44.0, 58.0, 93.0, 133.0, 200.0, 275.0, 433.0, 611.0, 896.0, 1450.0, 2226.0, 3546.0, 5311.0, 8293.0, 13026.0, 21130.0, 37355.0, 91105.0, 572685.0, 171428.0, 48967.0, 25637.0, 15533.0, 9931.0, 6268.0, 4170.0, 2651.0, 1653.0, 1084.0, 756.0, 449.0, 313.0, 216.0, 164.0, 106.0, 70.0, 45.0, 48.0, 32.0, 16.0, 15.0, 7.0, 8.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.890625, -4.72589111328125, -4.5611572265625, -4.39642333984375, -4.231689453125, -4.06695556640625, -3.9022216796875, -3.73748779296875, -3.57275390625, -3.40802001953125, -3.2432861328125, -3.07855224609375, -2.913818359375, -2.74908447265625, -2.5843505859375, -2.41961669921875, -2.2548828125, -2.09014892578125, -1.9254150390625, -1.76068115234375, -1.595947265625, -1.43121337890625, -1.2664794921875, -1.10174560546875, -0.93701171875, -0.77227783203125, -0.6075439453125, -0.44281005859375, -0.278076171875, -0.11334228515625, 0.0513916015625, 0.21612548828125, 0.380859375, 0.54559326171875, 0.7103271484375, 0.87506103515625, 1.039794921875, 1.20452880859375, 1.3692626953125, 1.53399658203125, 1.69873046875, 1.86346435546875, 2.0281982421875, 2.19293212890625, 2.357666015625, 2.52239990234375, 2.6871337890625, 2.85186767578125, 3.0166015625, 3.18133544921875, 3.3460693359375, 3.51080322265625, 3.675537109375, 3.84027099609375, 4.0050048828125, 4.16973876953125, 4.33447265625, 4.49920654296875, 4.6639404296875, 4.82867431640625, 4.993408203125, 5.15814208984375, 5.3228759765625, 5.48760986328125, 5.65234375]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 8.0, 4.0, 15.0, 7.0, 9.0, 17.0, 14.0, 26.0, 28.0, 22.0, 16.0, 29.0, 32.0, 46.0, 29.0, 52.0, 34.0, 78.0, 106.0, 291.0, 1494.0, 116.0, 97.0, 50.0, 53.0, 43.0, 33.0, 37.0, 33.0, 25.0, 32.0, 22.0, 15.0, 15.0, 24.0, 21.0, 14.0, 11.0, 14.0, 6.0, 7.0, 6.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-11.28125, -10.9501953125, -10.619140625, -10.2880859375, -9.95703125, -9.6259765625, -9.294921875, -8.9638671875, -8.6328125, -8.3017578125, -7.970703125, -7.6396484375, -7.30859375, -6.9775390625, -6.646484375, -6.3154296875, -5.984375, -5.6533203125, -5.322265625, -4.9912109375, -4.66015625, -4.3291015625, -3.998046875, -3.6669921875, -3.3359375, -3.0048828125, -2.673828125, -2.3427734375, -2.01171875, -1.6806640625, -1.349609375, -1.0185546875, -0.6875, -0.3564453125, -0.025390625, 0.3056640625, 0.63671875, 0.9677734375, 1.298828125, 1.6298828125, 1.9609375, 2.2919921875, 2.623046875, 2.9541015625, 3.28515625, 3.6162109375, 3.947265625, 4.2783203125, 4.609375, 4.9404296875, 5.271484375, 5.6025390625, 5.93359375, 6.2646484375, 6.595703125, 6.9267578125, 7.2578125, 7.5888671875, 7.919921875, 8.2509765625, 8.58203125, 8.9130859375, 9.244140625, 9.5751953125, 9.90625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 9.0, 12.0, 13.0, 25.0, 37.0, 53.0, 72.0, 81.0, 145.0, 235.0, 350.0, 910.0, 3741.0, 20809.0, 205423.0, 2792103.0, 104153.0, 13362.0, 2594.0, 753.0, 311.0, 158.0, 125.0, 88.0, 35.0, 36.0, 24.0, 18.0, 8.0, 3.0, 10.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.25, -16.71728515625, -16.1845703125, -15.65185546875, -15.119140625, -14.58642578125, -14.0537109375, -13.52099609375, -12.98828125, -12.45556640625, -11.9228515625, -11.39013671875, -10.857421875, -10.32470703125, -9.7919921875, -9.25927734375, -8.7265625, -8.19384765625, -7.6611328125, -7.12841796875, -6.595703125, -6.06298828125, -5.5302734375, -4.99755859375, -4.46484375, -3.93212890625, -3.3994140625, -2.86669921875, -2.333984375, -1.80126953125, -1.2685546875, -0.73583984375, -0.203125, 0.32958984375, 0.8623046875, 1.39501953125, 1.927734375, 2.46044921875, 2.9931640625, 3.52587890625, 4.05859375, 4.59130859375, 5.1240234375, 5.65673828125, 6.189453125, 6.72216796875, 7.2548828125, 7.78759765625, 8.3203125, 8.85302734375, 9.3857421875, 9.91845703125, 10.451171875, 10.98388671875, 11.5166015625, 12.04931640625, 12.58203125, 13.11474609375, 13.6474609375, 14.18017578125, 14.712890625, 15.24560546875, 15.7783203125, 16.31103515625, 16.84375]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 8.0, 3.0, 9.0, 18.0, 14.0, 26.0, 41.0, 50.0, 59.0, 87.0, 90.0, 101.0, 94.0, 92.0, 71.0, 69.0, 46.0, 40.0, 30.0, 19.0, 11.0, 14.0, 6.0, 5.0, 0.0, 4.0, 1.0, 3.0], "bins": [-23.106103897094727, -22.62194061279297, -22.137779235839844, -21.653615951538086, -21.16945457458496, -20.685291290283203, -20.201129913330078, -19.71696662902832, -19.232805252075195, -18.748641967773438, -18.264480590820312, -17.780317306518555, -17.29615592956543, -16.811992645263672, -16.327831268310547, -15.843667984008789, -15.359504699707031, -14.87534236907959, -14.391180038452148, -13.907017707824707, -13.422855377197266, -12.938692092895508, -12.454530715942383, -11.970367431640625, -11.4862060546875, -11.002043724060059, -10.517881393432617, -10.033719062805176, -9.549556732177734, -9.065393447875977, -8.581232070922852, -8.097068786621094, -7.612906455993652, -7.128744125366211, -6.6445817947387695, -6.160419464111328, -5.6762566566467285, -5.192094326019287, -4.707931995391846, -4.223769187927246, -3.739607095718384, -3.2554447650909424, -2.771282196044922, -2.2871198654174805, -1.8029574155807495, -1.3187949657440186, -0.8346326351165771, -0.35047006607055664, 0.13369226455688477, 0.6178547143936157, 1.1020171642303467, 1.586179494857788, 2.0703420639038086, 2.55450439453125, 3.0386667251586914, 3.522829294204712, 4.006991386413574, 4.491153717041016, 4.975316047668457, 5.459478378295898, 5.943641185760498, 6.4278035163879395, 6.911965847015381, 7.3961286544799805, 7.880290985107422]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 5.0, 4.0, 6.0, 5.0, 13.0, 17.0, 18.0, 16.0, 25.0, 29.0, 22.0, 21.0, 28.0, 37.0, 28.0, 33.0, 31.0, 51.0, 36.0, 47.0, 47.0, 37.0, 42.0, 33.0, 40.0, 32.0, 41.0, 38.0, 31.0, 20.0, 22.0, 20.0, 21.0, 15.0, 18.0, 15.0, 11.0, 14.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 6.0, 4.0, 2.0, 4.0, 0.0, 3.0, 0.0, 2.0], "bins": [-30.62610626220703, -29.68626594543457, -28.746423721313477, -27.806583404541016, -26.866743087768555, -25.926902770996094, -24.987060546875, -24.04722023010254, -23.107379913330078, -22.167539596557617, -21.227697372436523, -20.287857055664062, -19.3480167388916, -18.40817642211914, -17.468334197998047, -16.528493881225586, -15.588652610778809, -14.648811340332031, -13.70897102355957, -12.769129753112793, -11.829289436340332, -10.889448165893555, -9.949607849121094, -9.009766578674316, -8.069925308227539, -7.13008451461792, -6.190243721008301, -5.250402450561523, -4.3105621337890625, -3.370720863342285, -2.430880069732666, -1.4910392761230469, -0.5511989593505859, 0.388641893863678, 1.328482747077942, 2.2683236598968506, 3.2081644535064697, 4.148005485534668, 5.087846279144287, 6.027687072753906, 6.967527866363525, 7.9073686599731445, 8.847209930419922, 9.787050247192383, 10.72689151763916, 11.666732788085938, 12.606573104858398, 13.54641342163086, 14.486254692077637, 15.426095962524414, 16.365936279296875, 17.305776596069336, 18.24561882019043, 19.18545913696289, 20.12529945373535, 21.065139770507812, 22.004981994628906, 22.944822311401367, 23.88466453552246, 24.824504852294922, 25.764345169067383, 26.704185485839844, 27.644027709960938, 28.5838680267334, 29.52370834350586]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 6.0, 1.0, 7.0, 4.0, 6.0, 7.0, 12.0, 10.0, 18.0, 22.0, 15.0, 23.0, 24.0, 13.0, 28.0, 28.0, 37.0, 35.0, 40.0, 38.0, 44.0, 41.0, 25.0, 58.0, 44.0, 31.0, 44.0, 26.0, 41.0, 29.0, 37.0, 34.0, 31.0, 23.0, 14.0, 21.0, 15.0, 11.0, 14.0, 4.0, 7.0, 10.0, 10.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.662109375, -3.536529541015625, -3.41094970703125, -3.285369873046875, -3.1597900390625, -3.034210205078125, -2.90863037109375, -2.783050537109375, -2.657470703125, -2.531890869140625, -2.40631103515625, -2.280731201171875, -2.1551513671875, -2.029571533203125, -1.90399169921875, -1.778411865234375, -1.65283203125, -1.527252197265625, -1.40167236328125, -1.276092529296875, -1.1505126953125, -1.024932861328125, -0.89935302734375, -0.773773193359375, -0.648193359375, -0.522613525390625, -0.39703369140625, -0.271453857421875, -0.1458740234375, -0.020294189453125, 0.10528564453125, 0.230865478515625, 0.3564453125, 0.482025146484375, 0.60760498046875, 0.733184814453125, 0.8587646484375, 0.984344482421875, 1.10992431640625, 1.235504150390625, 1.361083984375, 1.486663818359375, 1.61224365234375, 1.737823486328125, 1.8634033203125, 1.988983154296875, 2.11456298828125, 2.240142822265625, 2.36572265625, 2.491302490234375, 2.61688232421875, 2.742462158203125, 2.8680419921875, 2.993621826171875, 3.11920166015625, 3.244781494140625, 3.370361328125, 3.495941162109375, 3.62152099609375, 3.747100830078125, 3.8726806640625, 3.998260498046875, 4.12384033203125, 4.249420166015625, 4.375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 13.0, 24.0, 25.0, 28.0, 51.0, 78.0, 115.0, 145.0, 196.0, 282.0, 428.0, 583.0, 904.0, 1347.0, 2119.0, 3508.0, 6048.0, 10629.0, 20813.0, 43880.0, 103609.0, 283978.0, 890806.0, 1686886.0, 734457.0, 233958.0, 87618.0, 38012.0, 18800.0, 9837.0, 5463.0, 3282.0, 2115.0, 1331.0, 909.0, 603.0, 388.0, 320.0, 212.0, 145.0, 92.0, 71.0, 46.0, 40.0, 29.0, 19.0, 9.0, 10.0, 2.0, 5.0, 4.0, 3.0, 2.0, 3.0], "bins": [-5.3046875, -5.14593505859375, -4.9871826171875, -4.82843017578125, -4.669677734375, -4.51092529296875, -4.3521728515625, -4.19342041015625, -4.03466796875, -3.87591552734375, -3.7171630859375, -3.55841064453125, -3.399658203125, -3.24090576171875, -3.0821533203125, -2.92340087890625, -2.7646484375, -2.60589599609375, -2.4471435546875, -2.28839111328125, -2.129638671875, -1.97088623046875, -1.8121337890625, -1.65338134765625, -1.49462890625, -1.33587646484375, -1.1771240234375, -1.01837158203125, -0.859619140625, -0.70086669921875, -0.5421142578125, -0.38336181640625, -0.224609375, -0.06585693359375, 0.0928955078125, 0.25164794921875, 0.410400390625, 0.56915283203125, 0.7279052734375, 0.88665771484375, 1.04541015625, 1.20416259765625, 1.3629150390625, 1.52166748046875, 1.680419921875, 1.83917236328125, 1.9979248046875, 2.15667724609375, 2.3154296875, 2.47418212890625, 2.6329345703125, 2.79168701171875, 2.950439453125, 3.10919189453125, 3.2679443359375, 3.42669677734375, 3.58544921875, 3.74420166015625, 3.9029541015625, 4.06170654296875, 4.220458984375, 4.37921142578125, 4.5379638671875, 4.69671630859375, 4.85546875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 11.0, 8.0, 25.0, 27.0, 42.0, 77.0, 127.0, 194.0, 304.0, 503.0, 788.0, 737.0, 490.0, 299.0, 182.0, 93.0, 52.0, 47.0, 27.0, 18.0, 6.0, 7.0, 6.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.7890625, -11.4420166015625, -11.094970703125, -10.7479248046875, -10.40087890625, -10.0538330078125, -9.706787109375, -9.3597412109375, -9.0126953125, -8.6656494140625, -8.318603515625, -7.9715576171875, -7.62451171875, -7.2774658203125, -6.930419921875, -6.5833740234375, -6.236328125, -5.8892822265625, -5.542236328125, -5.1951904296875, -4.84814453125, -4.5010986328125, -4.154052734375, -3.8070068359375, -3.4599609375, -3.1129150390625, -2.765869140625, -2.4188232421875, -2.07177734375, -1.7247314453125, -1.377685546875, -1.0306396484375, -0.68359375, -0.3365478515625, 0.010498046875, 0.3575439453125, 0.70458984375, 1.0516357421875, 1.398681640625, 1.7457275390625, 2.0927734375, 2.4398193359375, 2.786865234375, 3.1339111328125, 3.48095703125, 3.8280029296875, 4.175048828125, 4.5220947265625, 4.869140625, 5.2161865234375, 5.563232421875, 5.9102783203125, 6.25732421875, 6.6043701171875, 6.951416015625, 7.2984619140625, 7.6455078125, 7.9925537109375, 8.339599609375, 8.6866455078125, 9.03369140625, 9.3807373046875, 9.727783203125, 10.0748291015625, 10.421875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 7.0, 15.0, 29.0, 37.0, 66.0, 121.0, 208.0, 359.0, 730.0, 1711.0, 5582.0, 34162.0, 696045.0, 3300701.0, 136130.0, 13018.0, 3045.0, 1183.0, 494.0, 274.0, 151.0, 80.0, 50.0, 36.0, 14.0, 13.0, 7.0, 7.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.421875, -18.734619140625, -18.04736328125, -17.360107421875, -16.6728515625, -15.985595703125, -15.29833984375, -14.611083984375, -13.923828125, -13.236572265625, -12.54931640625, -11.862060546875, -11.1748046875, -10.487548828125, -9.80029296875, -9.113037109375, -8.42578125, -7.738525390625, -7.05126953125, -6.364013671875, -5.6767578125, -4.989501953125, -4.30224609375, -3.614990234375, -2.927734375, -2.240478515625, -1.55322265625, -0.865966796875, -0.1787109375, 0.508544921875, 1.19580078125, 1.883056640625, 2.5703125, 3.257568359375, 3.94482421875, 4.632080078125, 5.3193359375, 6.006591796875, 6.69384765625, 7.381103515625, 8.068359375, 8.755615234375, 9.44287109375, 10.130126953125, 10.8173828125, 11.504638671875, 12.19189453125, 12.879150390625, 13.56640625, 14.253662109375, 14.94091796875, 15.628173828125, 16.3154296875, 17.002685546875, 17.68994140625, 18.377197265625, 19.064453125, 19.751708984375, 20.43896484375, 21.126220703125, 21.8134765625, 22.500732421875, 23.18798828125, 23.875244140625, 24.5625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 15.0, 29.0, 133.0, 321.0, 366.0, 118.0, 31.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.84858703613281, -79.87300109863281, -75.89741516113281, -71.92182922363281, -67.94624328613281, -63.97065734863281, -59.99507141113281, -56.01948547363281, -52.04389953613281, -48.06831359863281, -44.09272766113281, -40.11714172363281, -36.14155578613281, -32.16596984863281, -28.190383911132812, -24.214797973632812, -20.239212036132812, -16.263626098632812, -12.288040161132812, -8.312454223632812, -4.3368682861328125, -0.3612823486328125, 3.6143035888671875, 7.5898895263671875, 11.565475463867188, 15.541061401367188, 19.516647338867188, 23.492233276367188, 27.467819213867188, 31.443405151367188, 35.41899108886719, 39.39457702636719, 43.37016296386719, 47.34574890136719, 51.32133483886719, 55.29692077636719, 59.27250671386719, 63.24809265136719, 67.22367858886719, 71.19926452636719, 75.17485046386719, 79.15043640136719, 83.12602233886719, 87.10160827636719, 91.07719421386719, 95.05278015136719, 99.02836608886719, 103.00395202636719, 106.97953796386719, 110.95512390136719, 114.93070983886719, 118.90629577636719, 122.88188171386719, 126.85746765136719, 130.8330535888672, 134.8086395263672, 138.7842254638672, 142.7598114013672, 146.7353973388672, 150.7109832763672, 154.6865692138672, 158.6621551513672, 162.6377410888672, 166.6133270263672, 170.5889129638672]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 3.0, 6.0, 6.0, 8.0, 11.0, 14.0, 21.0, 18.0, 19.0, 17.0, 28.0, 38.0, 31.0, 40.0, 48.0, 32.0, 51.0, 40.0, 45.0, 42.0, 33.0, 53.0, 48.0, 37.0, 30.0, 33.0, 33.0, 20.0, 33.0, 27.0, 30.0, 20.0, 14.0, 13.0, 13.0, 6.0, 9.0, 9.0, 7.0, 2.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.58300018310547, -27.684797286987305, -26.78659439086914, -25.888391494750977, -24.990188598632812, -24.091983795166016, -23.19378089904785, -22.295578002929688, -21.397375106811523, -20.49917221069336, -19.600969314575195, -18.70276641845703, -17.804561614990234, -16.906360626220703, -16.008155822753906, -15.109952926635742, -14.211750030517578, -13.313547134399414, -12.41534423828125, -11.51714038848877, -10.618937492370605, -9.720734596252441, -8.822530746459961, -7.924327850341797, -7.026124954223633, -6.127922058105469, -5.2297186851501465, -4.331515312194824, -3.43331241607666, -2.535109519958496, -1.6369061470031738, -0.7387027740478516, 0.1595001220703125, 1.0577032566070557, 1.9559063911437988, 2.854109525680542, 3.752312660217285, 4.650515556335449, 5.5487189292907715, 6.446922302246094, 7.345125198364258, 8.243328094482422, 9.141530990600586, 10.039734840393066, 10.93793773651123, 11.836140632629395, 12.734344482421875, 13.632547378540039, 14.530750274658203, 15.428953170776367, 16.32715606689453, 17.225358963012695, 18.12356185913086, 19.021766662597656, 19.91996955871582, 20.818172454833984, 21.71637535095215, 22.614578247070312, 23.512781143188477, 24.41098403930664, 25.309188842773438, 26.20738983154297, 27.105594635009766, 28.00379753112793, 28.902000427246094]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 3.0, 10.0, 6.0, 8.0, 9.0, 8.0, 11.0, 22.0, 24.0, 13.0, 25.0, 32.0, 29.0, 30.0, 32.0, 39.0, 33.0, 33.0, 35.0, 40.0, 38.0, 50.0, 49.0, 34.0, 33.0, 43.0, 35.0, 44.0, 26.0, 32.0, 25.0, 25.0, 28.0, 12.0, 22.0, 8.0, 13.0, 8.0, 7.0, 9.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.953125, -3.821044921875, -3.68896484375, -3.556884765625, -3.4248046875, -3.292724609375, -3.16064453125, -3.028564453125, -2.896484375, -2.764404296875, -2.63232421875, -2.500244140625, -2.3681640625, -2.236083984375, -2.10400390625, -1.971923828125, -1.83984375, -1.707763671875, -1.57568359375, -1.443603515625, -1.3115234375, -1.179443359375, -1.04736328125, -0.915283203125, -0.783203125, -0.651123046875, -0.51904296875, -0.386962890625, -0.2548828125, -0.122802734375, 0.00927734375, 0.141357421875, 0.2734375, 0.405517578125, 0.53759765625, 0.669677734375, 0.8017578125, 0.933837890625, 1.06591796875, 1.197998046875, 1.330078125, 1.462158203125, 1.59423828125, 1.726318359375, 1.8583984375, 1.990478515625, 2.12255859375, 2.254638671875, 2.38671875, 2.518798828125, 2.65087890625, 2.782958984375, 2.9150390625, 3.047119140625, 3.17919921875, 3.311279296875, 3.443359375, 3.575439453125, 3.70751953125, 3.839599609375, 3.9716796875, 4.103759765625, 4.23583984375, 4.367919921875, 4.5]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 14.0, 15.0, 29.0, 40.0, 48.0, 76.0, 121.0, 173.0, 248.0, 354.0, 549.0, 791.0, 1125.0, 1668.0, 2643.0, 3829.0, 5846.0, 9214.0, 14151.0, 22713.0, 36307.0, 59143.0, 99594.0, 184623.0, 254161.0, 141169.0, 79476.0, 47775.0, 29510.0, 18582.0, 11897.0, 7558.0, 5022.0, 3310.0, 2219.0, 1484.0, 971.0, 693.0, 452.0, 287.0, 204.0, 161.0, 96.0, 57.0, 45.0, 46.0, 21.0, 13.0, 8.0, 6.0, 3.0, 5.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.0261688232421875, -0.02535843849182129, -0.024548053741455078, -0.023737668991088867, -0.022927284240722656, -0.022116899490356445, -0.021306514739990234, -0.020496129989624023, -0.019685745239257812, -0.0188753604888916, -0.01806497573852539, -0.01725459098815918, -0.01644420623779297, -0.015633821487426758, -0.014823436737060547, -0.014013051986694336, -0.013202667236328125, -0.012392282485961914, -0.011581897735595703, -0.010771512985229492, -0.009961128234863281, -0.00915074348449707, -0.00834035873413086, -0.0075299739837646484, -0.0067195892333984375, -0.0059092044830322266, -0.005098819732666016, -0.004288434982299805, -0.0034780502319335938, -0.002667665481567383, -0.0018572807312011719, -0.001046895980834961, -0.00023651123046875, 0.0005738735198974609, 0.0013842582702636719, 0.002194643020629883, 0.0030050277709960938, 0.0038154125213623047, 0.004625797271728516, 0.0054361820220947266, 0.0062465667724609375, 0.0070569515228271484, 0.00786733627319336, 0.00867772102355957, 0.009488105773925781, 0.010298490524291992, 0.011108875274658203, 0.011919260025024414, 0.012729644775390625, 0.013540029525756836, 0.014350414276123047, 0.015160799026489258, 0.01597118377685547, 0.01678156852722168, 0.01759195327758789, 0.0184023380279541, 0.019212722778320312, 0.020023107528686523, 0.020833492279052734, 0.021643877029418945, 0.022454261779785156, 0.023264646530151367, 0.024075031280517578, 0.02488541603088379, 0.02569580078125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 7.0, 8.0, 12.0, 16.0, 13.0, 19.0, 11.0, 20.0, 25.0, 41.0, 27.0, 31.0, 33.0, 43.0, 41.0, 33.0, 38.0, 31.0, 42.0, 1056.0, 28.0, 36.0, 44.0, 34.0, 29.0, 33.0, 37.0, 35.0, 25.0, 28.0, 21.0, 18.0, 18.0, 15.0, 15.0, 10.0, 13.0, 5.0, 4.0, 9.0, 6.0, 1.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0], "bins": [-4.46875, -4.342376708984375, -4.21600341796875, -4.089630126953125, -3.9632568359375, -3.836883544921875, -3.71051025390625, -3.584136962890625, -3.457763671875, -3.331390380859375, -3.20501708984375, -3.078643798828125, -2.9522705078125, -2.825897216796875, -2.69952392578125, -2.573150634765625, -2.44677734375, -2.320404052734375, -2.19403076171875, -2.067657470703125, -1.9412841796875, -1.814910888671875, -1.68853759765625, -1.562164306640625, -1.435791015625, -1.309417724609375, -1.18304443359375, -1.056671142578125, -0.9302978515625, -0.803924560546875, -0.67755126953125, -0.551177978515625, -0.4248046875, -0.298431396484375, -0.17205810546875, -0.045684814453125, 0.0806884765625, 0.207061767578125, 0.33343505859375, 0.459808349609375, 0.586181640625, 0.712554931640625, 0.83892822265625, 0.965301513671875, 1.0916748046875, 1.218048095703125, 1.34442138671875, 1.470794677734375, 1.59716796875, 1.723541259765625, 1.84991455078125, 1.976287841796875, 2.1026611328125, 2.229034423828125, 2.35540771484375, 2.481781005859375, 2.608154296875, 2.734527587890625, 2.86090087890625, 2.987274169921875, 3.1136474609375, 3.240020751953125, 3.36639404296875, 3.492767333984375, 3.619140625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 11.0, 16.0, 38.0, 34.0, 64.0, 91.0, 123.0, 185.0, 278.0, 412.0, 577.0, 886.0, 1267.0, 1857.0, 2843.0, 4306.0, 6483.0, 9964.0, 15560.0, 24412.0, 38519.0, 62383.0, 102196.0, 176130.0, 1276326.0, 143255.0, 85234.0, 52248.0, 32572.0, 20425.0, 13196.0, 8571.0, 5590.0, 3577.0, 2401.0, 1637.0, 1129.0, 757.0, 497.0, 344.0, 239.0, 154.0, 107.0, 68.0, 58.0, 41.0, 28.0, 21.0, 10.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0], "bins": [-0.01488494873046875, -0.014438152313232422, -0.013991355895996094, -0.013544559478759766, -0.013097763061523438, -0.01265096664428711, -0.012204170227050781, -0.011757373809814453, -0.011310577392578125, -0.010863780975341797, -0.010416984558105469, -0.00997018814086914, -0.009523391723632812, -0.009076595306396484, -0.008629798889160156, -0.008183002471923828, -0.0077362060546875, -0.007289409637451172, -0.006842613220214844, -0.006395816802978516, -0.0059490203857421875, -0.005502223968505859, -0.005055427551269531, -0.004608631134033203, -0.004161834716796875, -0.003715038299560547, -0.0032682418823242188, -0.0028214454650878906, -0.0023746490478515625, -0.0019278526306152344, -0.0014810562133789062, -0.0010342597961425781, -0.00058746337890625, -0.00014066696166992188, 0.00030612945556640625, 0.0007529258728027344, 0.0011997222900390625, 0.0016465187072753906, 0.0020933151245117188, 0.002540111541748047, 0.002986907958984375, 0.003433704376220703, 0.0038805007934570312, 0.004327297210693359, 0.0047740936279296875, 0.005220890045166016, 0.005667686462402344, 0.006114482879638672, 0.006561279296875, 0.007008075714111328, 0.007454872131347656, 0.007901668548583984, 0.008348464965820312, 0.00879526138305664, 0.009242057800292969, 0.009688854217529297, 0.010135650634765625, 0.010582447052001953, 0.011029243469238281, 0.01147603988647461, 0.011922836303710938, 0.012369632720947266, 0.012816429138183594, 0.013263225555419922, 0.01371002197265625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 4.0, 0.0, 3.0, 7.0, 0.0, 4.0, 8.0, 0.0, 16.0, 12.0, 0.0, 19.0, 31.0, 0.0, 46.0, 0.0, 77.0, 157.0, 0.0, 198.0, 144.0, 0.0, 91.0, 59.0, 0.0, 30.0, 0.0, 19.0, 17.0, 0.0, 8.0, 8.0, 0.0, 8.0, 5.0, 0.0, 6.0, 7.0, 0.0, 4.0, 0.0, 6.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-06, -1.1539086699485779e-06, -1.1157244443893433e-06, -1.0775402188301086e-06, -1.039355993270874e-06, -1.0011717677116394e-06, -9.629875421524048e-07, -9.248033165931702e-07, -8.866190910339355e-07, -8.484348654747009e-07, -8.102506399154663e-07, -7.720664143562317e-07, -7.338821887969971e-07, -6.956979632377625e-07, -6.575137376785278e-07, -6.193295121192932e-07, -5.811452865600586e-07, -5.42961061000824e-07, -5.047768354415894e-07, -4.6659260988235474e-07, -4.284083843231201e-07, -3.902241587638855e-07, -3.520399332046509e-07, -3.1385570764541626e-07, -2.7567148208618164e-07, -2.3748725652694702e-07, -1.993030309677124e-07, -1.6111880540847778e-07, -1.2293457984924316e-07, -8.475035429000854e-08, -4.6566128730773926e-08, -8.381903171539307e-09, 2.9802322387695312e-08, 6.798654794692993e-08, 1.0617077350616455e-07, 1.4435499906539917e-07, 1.825392246246338e-07, 2.207234501838684e-07, 2.5890767574310303e-07, 2.9709190130233765e-07, 3.3527612686157227e-07, 3.734603524208069e-07, 4.116445779800415e-07, 4.498288035392761e-07, 4.880130290985107e-07, 5.261972546577454e-07, 5.6438148021698e-07, 6.025657057762146e-07, 6.407499313354492e-07, 6.789341568946838e-07, 7.171183824539185e-07, 7.553026080131531e-07, 7.934868335723877e-07, 8.316710591316223e-07, 8.698552846908569e-07, 9.080395102500916e-07, 9.462237358093262e-07, 9.844079613685608e-07, 1.0225921869277954e-06, 1.06077641248703e-06, 1.0989606380462646e-06, 1.1371448636054993e-06, 1.1753290891647339e-06, 1.2135133147239685e-06, 1.2516975402832031e-06]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 4.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 4.0, 6.0, 7.0, 5.0, 5.0, 6.0, 9.0, 16.0, 27.0, 28.0, 38.0, 69.0, 112.0, 245.0, 712.0, 39768.0, 1002439.0, 4308.0, 299.0, 149.0, 89.0, 51.0, 25.0, 23.0, 18.0, 13.0, 10.0, 14.0, 4.0, 5.0, 5.0, 2.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-2.8252601623535156e-05, -2.7377158403396606e-05, -2.6501715183258057e-05, -2.5626271963119507e-05, -2.4750828742980957e-05, -2.3875385522842407e-05, -2.2999942302703857e-05, -2.2124499082565308e-05, -2.1249055862426758e-05, -2.0373612642288208e-05, -1.9498169422149658e-05, -1.862272620201111e-05, -1.774728298187256e-05, -1.687183976173401e-05, -1.599639654159546e-05, -1.512095332145691e-05, -1.424551010131836e-05, -1.337006688117981e-05, -1.249462366104126e-05, -1.161918044090271e-05, -1.074373722076416e-05, -9.86829400062561e-06, -8.99285078048706e-06, -8.11740756034851e-06, -7.241964340209961e-06, -6.366521120071411e-06, -5.491077899932861e-06, -4.6156346797943115e-06, -3.7401914596557617e-06, -2.864748239517212e-06, -1.989305019378662e-06, -1.1138617992401123e-06, -2.384185791015625e-07, 6.370246410369873e-07, 1.5124678611755371e-06, 2.387911081314087e-06, 3.2633543014526367e-06, 4.1387975215911865e-06, 5.014240741729736e-06, 5.889683961868286e-06, 6.765127182006836e-06, 7.640570402145386e-06, 8.516013622283936e-06, 9.391456842422485e-06, 1.0266900062561035e-05, 1.1142343282699585e-05, 1.2017786502838135e-05, 1.2893229722976685e-05, 1.3768672943115234e-05, 1.4644116163253784e-05, 1.5519559383392334e-05, 1.6395002603530884e-05, 1.7270445823669434e-05, 1.8145889043807983e-05, 1.9021332263946533e-05, 1.9896775484085083e-05, 2.0772218704223633e-05, 2.1647661924362183e-05, 2.2523105144500732e-05, 2.3398548364639282e-05, 2.4273991584777832e-05, 2.5149434804916382e-05, 2.602487802505493e-05, 2.690032124519348e-05, 2.777576446533203e-05]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [11.0, 51.0, 328.0, 505.0, 108.0, 16.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.076991615420411e-07, -2.7785171141658793e-07, -1.4800423286942532e-07, -1.8156782743972144e-08, 1.1169069580319047e-07, 2.415381743503531e-07, 3.713855960540968e-07, 5.012331030229689e-07, 6.310805247267126e-07, 7.609280032738752e-07, 8.907754818210378e-07, 1.0206229035247816e-06, 1.1504703252285253e-06, 1.2803178606191068e-06, 1.4101652823228505e-06, 1.540012817713432e-06, 1.6698602394171758e-06, 1.7997076611209195e-06, 1.9295550828246633e-06, 2.059402504528407e-06, 2.189250153605826e-06, 2.31909757530957e-06, 2.4489449970133137e-06, 2.5787924187170574e-06, 2.7086400677944766e-06, 2.8384874894982204e-06, 2.968334911201964e-06, 3.098182332905708e-06, 3.228029981983127e-06, 3.357877403686871e-06, 3.4877248253906146e-06, 3.6175722470943583e-06, 3.747419668798102e-06, 3.877267317875521e-06, 4.0071145122055896e-06, 4.136962161283009e-06, 4.266809355613077e-06, 4.396657004690496e-06, 4.5265041990205646e-06, 4.656351848097984e-06, 4.786199497175403e-06, 4.916047146252822e-06, 5.0458943405828904e-06, 5.17574198966031e-06, 5.305589183990378e-06, 5.435436833067797e-06, 5.565284482145216e-06, 5.695131676475285e-06, 5.824978870805353e-06, 5.954826519882772e-06, 6.08467371421284e-06, 6.21452136329026e-06, 6.344368557620328e-06, 6.474216206697747e-06, 6.604063855775166e-06, 6.733911050105235e-06, 6.863758699182654e-06, 6.993606348260073e-06, 7.123453542590141e-06, 7.2533011916675605e-06, 7.383148385997629e-06, 7.512996035075048e-06, 7.642843229405116e-06, 7.772690878482535e-06, 7.902538527559955e-06]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 25.0, 0.0, 0.0, 33.0, 0.0, 0.0, 74.0, 0.0, 0.0, 128.0, 0.0, 0.0, 176.0, 0.0, 0.0, 0.0, 178.0, 0.0, 0.0, 156.0, 0.0, 0.0, 112.0, 0.0, 0.0, 60.0, 0.0, 0.0, 42.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539062e-07, -5.774199962615967e-07, -5.587935447692871e-07, -5.401670932769775e-07, -5.21540641784668e-07, -5.029141902923584e-07, -4.842877388000488e-07, -4.6566128730773926e-07, -4.470348358154297e-07, -4.284083843231201e-07, -4.0978193283081055e-07, -3.91155481338501e-07, -3.725290298461914e-07, -3.5390257835388184e-07, -3.3527612686157227e-07, -3.166496753692627e-07, -2.980232238769531e-07, -2.7939677238464355e-07, -2.60770320892334e-07, -2.421438694000244e-07, -2.2351741790771484e-07, -2.0489096641540527e-07, -1.862645149230957e-07, -1.6763806343078613e-07, -1.4901161193847656e-07, -1.30385160446167e-07, -1.1175870895385742e-07, -9.313225746154785e-08, -7.450580596923828e-08, -5.587935447692871e-08, -3.725290298461914e-08, -1.862645149230957e-08, 0.0, 1.862645149230957e-08, 3.725290298461914e-08, 5.587935447692871e-08, 7.450580596923828e-08, 9.313225746154785e-08, 1.1175870895385742e-07, 1.30385160446167e-07, 1.4901161193847656e-07, 1.6763806343078613e-07, 1.862645149230957e-07, 2.0489096641540527e-07, 2.2351741790771484e-07, 2.421438694000244e-07, 2.60770320892334e-07, 2.7939677238464355e-07, 2.980232238769531e-07, 3.166496753692627e-07, 3.3527612686157227e-07, 3.5390257835388184e-07, 3.725290298461914e-07, 3.91155481338501e-07, 4.0978193283081055e-07, 4.284083843231201e-07, 4.470348358154297e-07, 4.6566128730773926e-07, 4.842877388000488e-07, 5.029141902923584e-07, 5.21540641784668e-07, 5.401670932769775e-07, 5.587935447692871e-07, 5.774199962615967e-07, 5.960464477539062e-07]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 3.0, 10.0, 6.0, 8.0, 9.0, 8.0, 11.0, 22.0, 24.0, 13.0, 25.0, 32.0, 29.0, 30.0, 32.0, 39.0, 33.0, 33.0, 35.0, 40.0, 38.0, 50.0, 49.0, 34.0, 33.0, 43.0, 35.0, 44.0, 26.0, 32.0, 25.0, 25.0, 28.0, 12.0, 22.0, 8.0, 13.0, 8.0, 7.0, 9.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.953125, -3.821044921875, -3.68896484375, -3.556884765625, -3.4248046875, -3.292724609375, -3.16064453125, -3.028564453125, -2.896484375, -2.764404296875, -2.63232421875, -2.500244140625, -2.3681640625, -2.236083984375, -2.10400390625, -1.971923828125, -1.83984375, -1.707763671875, -1.57568359375, -1.443603515625, -1.3115234375, -1.179443359375, -1.04736328125, -0.915283203125, -0.783203125, -0.651123046875, -0.51904296875, -0.386962890625, -0.2548828125, -0.122802734375, 0.00927734375, 0.141357421875, 0.2734375, 0.405517578125, 0.53759765625, 0.669677734375, 0.8017578125, 0.933837890625, 1.06591796875, 1.197998046875, 1.330078125, 1.462158203125, 1.59423828125, 1.726318359375, 1.8583984375, 1.990478515625, 2.12255859375, 2.254638671875, 2.38671875, 2.518798828125, 2.65087890625, 2.782958984375, 2.9150390625, 3.047119140625, 3.17919921875, 3.311279296875, 3.443359375, 3.575439453125, 3.70751953125, 3.839599609375, 3.9716796875, 4.103759765625, 4.23583984375, 4.367919921875, 4.5]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 6.0, 5.0, 5.0, 10.0, 13.0, 21.0, 26.0, 43.0, 49.0, 96.0, 121.0, 178.0, 256.0, 387.0, 589.0, 884.0, 1349.0, 2027.0, 3309.0, 5247.0, 8853.0, 14886.0, 24917.0, 42103.0, 72370.0, 140928.0, 313351.0, 197321.0, 90921.0, 51558.0, 30651.0, 17833.0, 10696.0, 6415.0, 3894.0, 2550.0, 1571.0, 1015.0, 675.0, 421.0, 324.0, 202.0, 151.0, 117.0, 75.0, 41.0, 31.0, 23.0, 16.0, 15.0, 2.0, 2.0, 4.0, 1.0, 4.0, 3.0], "bins": [-5.56640625, -5.40594482421875, -5.2454833984375, -5.08502197265625, -4.924560546875, -4.76409912109375, -4.6036376953125, -4.44317626953125, -4.28271484375, -4.12225341796875, -3.9617919921875, -3.80133056640625, -3.640869140625, -3.48040771484375, -3.3199462890625, -3.15948486328125, -2.9990234375, -2.83856201171875, -2.6781005859375, -2.51763916015625, -2.357177734375, -2.19671630859375, -2.0362548828125, -1.87579345703125, -1.71533203125, -1.55487060546875, -1.3944091796875, -1.23394775390625, -1.073486328125, -0.91302490234375, -0.7525634765625, -0.59210205078125, -0.431640625, -0.27117919921875, -0.1107177734375, 0.04974365234375, 0.210205078125, 0.37066650390625, 0.5311279296875, 0.69158935546875, 0.85205078125, 1.01251220703125, 1.1729736328125, 1.33343505859375, 1.493896484375, 1.65435791015625, 1.8148193359375, 1.97528076171875, 2.1357421875, 2.29620361328125, 2.4566650390625, 2.61712646484375, 2.777587890625, 2.93804931640625, 3.0985107421875, 3.25897216796875, 3.41943359375, 3.57989501953125, 3.7403564453125, 3.90081787109375, 4.061279296875, 4.22174072265625, 4.3822021484375, 4.54266357421875, 4.703125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 6.0, 4.0, 12.0, 10.0, 11.0, 11.0, 10.0, 21.0, 21.0, 20.0, 31.0, 32.0, 30.0, 37.0, 38.0, 50.0, 63.0, 74.0, 110.0, 171.0, 1440.0, 235.0, 113.0, 82.0, 49.0, 43.0, 43.0, 35.0, 29.0, 30.0, 25.0, 30.0, 26.0, 13.0, 12.0, 15.0, 10.0, 10.0, 9.0, 7.0, 6.0, 4.0, 4.0, 3.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.390625, -11.0302734375, -10.669921875, -10.3095703125, -9.94921875, -9.5888671875, -9.228515625, -8.8681640625, -8.5078125, -8.1474609375, -7.787109375, -7.4267578125, -7.06640625, -6.7060546875, -6.345703125, -5.9853515625, -5.625, -5.2646484375, -4.904296875, -4.5439453125, -4.18359375, -3.8232421875, -3.462890625, -3.1025390625, -2.7421875, -2.3818359375, -2.021484375, -1.6611328125, -1.30078125, -0.9404296875, -0.580078125, -0.2197265625, 0.140625, 0.5009765625, 0.861328125, 1.2216796875, 1.58203125, 1.9423828125, 2.302734375, 2.6630859375, 3.0234375, 3.3837890625, 3.744140625, 4.1044921875, 4.46484375, 4.8251953125, 5.185546875, 5.5458984375, 5.90625, 6.2666015625, 6.626953125, 6.9873046875, 7.34765625, 7.7080078125, 8.068359375, 8.4287109375, 8.7890625, 9.1494140625, 9.509765625, 9.8701171875, 10.23046875, 10.5908203125, 10.951171875, 11.3115234375, 11.671875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 8.0, 11.0, 12.0, 12.0, 13.0, 19.0, 29.0, 37.0, 59.0, 64.0, 88.0, 187.0, 354.0, 780.0, 2004.0, 6341.0, 23321.0, 126200.0, 1890579.0, 981782.0, 87736.0, 17908.0, 4923.0, 1743.0, 660.0, 322.0, 161.0, 107.0, 62.0, 43.0, 29.0, 28.0, 20.0, 13.0, 16.0, 5.0, 6.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.375, -10.99462890625, -10.6142578125, -10.23388671875, -9.853515625, -9.47314453125, -9.0927734375, -8.71240234375, -8.33203125, -7.95166015625, -7.5712890625, -7.19091796875, -6.810546875, -6.43017578125, -6.0498046875, -5.66943359375, -5.2890625, -4.90869140625, -4.5283203125, -4.14794921875, -3.767578125, -3.38720703125, -3.0068359375, -2.62646484375, -2.24609375, -1.86572265625, -1.4853515625, -1.10498046875, -0.724609375, -0.34423828125, 0.0361328125, 0.41650390625, 0.796875, 1.17724609375, 1.5576171875, 1.93798828125, 2.318359375, 2.69873046875, 3.0791015625, 3.45947265625, 3.83984375, 4.22021484375, 4.6005859375, 4.98095703125, 5.361328125, 5.74169921875, 6.1220703125, 6.50244140625, 6.8828125, 7.26318359375, 7.6435546875, 8.02392578125, 8.404296875, 8.78466796875, 9.1650390625, 9.54541015625, 9.92578125, 10.30615234375, 10.6865234375, 11.06689453125, 11.447265625, 11.82763671875, 12.2080078125, 12.58837890625, 12.96875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 35.0, 60.0, 128.0, 201.0, 234.0, 177.0, 100.0, 54.0, 15.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.812421798706055, -10.224956512451172, -8.637491226196289, -7.050025939941406, -5.462560653686523, -3.8750953674316406, -2.287630081176758, -0.700164794921875, 0.8873004913330078, 2.4747657775878906, 4.062231063842773, 5.649696350097656, 7.237161636352539, 8.824626922607422, 10.412092208862305, 11.999557495117188, 13.58702278137207, 15.174488067626953, 16.761953353881836, 18.34941864013672, 19.9368839263916, 21.524349212646484, 23.111814498901367, 24.69927978515625, 26.286745071411133, 27.874210357666016, 29.4616756439209, 31.04914093017578, 32.63660430908203, 34.22407150268555, 35.81153869628906, 37.39900207519531, 38.98646545410156, 40.57392883300781, 42.16139602661133, 43.748863220214844, 45.336326599121094, 46.923789978027344, 48.51125717163086, 50.098724365234375, 51.686187744140625, 53.273651123046875, 54.86111831665039, 56.448585510253906, 58.036048889160156, 59.623512268066406, 61.21097946166992, 62.79844665527344, 64.38591003417969, 65.97337341308594, 67.56083679199219, 69.14830780029297, 70.73577117919922, 72.32323455810547, 73.91070556640625, 75.4981689453125, 77.08563232421875, 78.673095703125, 80.26055908203125, 81.84803009033203, 83.43549346923828, 85.02295684814453, 86.61042785644531, 88.19789123535156, 89.78535461425781]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 0.0, 0.0, 1.0, 2.0, 7.0, 4.0, 10.0, 8.0, 10.0, 11.0, 11.0, 17.0, 13.0, 11.0, 24.0, 21.0, 21.0, 25.0, 24.0, 32.0, 33.0, 39.0, 39.0, 40.0, 48.0, 41.0, 44.0, 36.0, 26.0, 27.0, 36.0, 30.0, 29.0, 35.0, 29.0, 26.0, 26.0, 32.0, 30.0, 17.0, 15.0, 10.0, 14.0, 14.0, 11.0, 6.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-30.29950714111328, -29.36054229736328, -28.42157745361328, -27.48261260986328, -26.543649673461914, -25.604684829711914, -24.665719985961914, -23.726755142211914, -22.787792205810547, -21.848827362060547, -20.909862518310547, -19.970897674560547, -19.03193473815918, -18.09296989440918, -17.15400505065918, -16.21504020690918, -15.27607536315918, -14.33711051940918, -13.398146629333496, -12.459181785583496, -11.520217895507812, -10.581253051757812, -9.642288208007812, -8.703323364257812, -7.764359474182129, -6.825395107269287, -5.886430740356445, -4.947465896606445, -4.0085015296936035, -3.0695371627807617, -2.1305723190307617, -1.19160795211792, -0.2526435852050781, 0.6863209009170532, 1.6252853870391846, 2.5642499923706055, 3.5032143592834473, 4.442178726196289, 5.381143569946289, 6.320107936859131, 7.259072303771973, 8.198037147521973, 9.137001037597656, 10.075965881347656, 11.014930725097656, 11.95389461517334, 12.89285945892334, 13.831823348999023, 14.770788192749023, 15.709753036499023, 16.648717880249023, 17.58768081665039, 18.52664566040039, 19.46561050415039, 20.40457534790039, 21.34354019165039, 22.28250503540039, 23.22146987915039, 24.16043472290039, 25.09939956665039, 26.038362503051758, 26.977327346801758, 27.916292190551758, 28.855257034301758, 29.794219970703125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 7.0, 8.0, 12.0, 8.0, 9.0, 17.0, 15.0, 20.0, 26.0, 24.0, 31.0, 33.0, 31.0, 32.0, 35.0, 42.0, 35.0, 37.0, 30.0, 53.0, 51.0, 44.0, 35.0, 52.0, 42.0, 29.0, 32.0, 33.0, 31.0, 26.0, 27.0, 21.0, 13.0, 8.0, 10.0, 13.0, 6.0, 5.0, 5.0, 0.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01953125, -3.87762451171875, -3.7357177734375, -3.59381103515625, -3.451904296875, -3.30999755859375, -3.1680908203125, -3.02618408203125, -2.88427734375, -2.74237060546875, -2.6004638671875, -2.45855712890625, -2.316650390625, -2.17474365234375, -2.0328369140625, -1.89093017578125, -1.7490234375, -1.60711669921875, -1.4652099609375, -1.32330322265625, -1.181396484375, -1.03948974609375, -0.8975830078125, -0.75567626953125, -0.61376953125, -0.47186279296875, -0.3299560546875, -0.18804931640625, -0.046142578125, 0.09576416015625, 0.2376708984375, 0.37957763671875, 0.521484375, 0.66339111328125, 0.8052978515625, 0.94720458984375, 1.089111328125, 1.23101806640625, 1.3729248046875, 1.51483154296875, 1.65673828125, 1.79864501953125, 1.9405517578125, 2.08245849609375, 2.224365234375, 2.36627197265625, 2.5081787109375, 2.65008544921875, 2.7919921875, 2.93389892578125, 3.0758056640625, 3.21771240234375, 3.359619140625, 3.50152587890625, 3.6434326171875, 3.78533935546875, 3.92724609375, 4.06915283203125, 4.2110595703125, 4.35296630859375, 4.494873046875, 4.63677978515625, 4.7786865234375, 4.92059326171875, 5.0625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 10.0, 9.0, 11.0, 19.0, 24.0, 41.0, 64.0, 107.0, 142.0, 211.0, 360.0, 600.0, 1027.0, 1959.0, 4147.0, 9678.0, 26984.0, 101953.0, 682500.0, 2739272.0, 502834.0, 82923.0, 23163.0, 8374.0, 3667.0, 1846.0, 979.0, 529.0, 294.0, 195.0, 122.0, 77.0, 45.0, 33.0, 29.0, 16.0, 12.0, 7.0, 8.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.21875, -8.905517578125, -8.59228515625, -8.279052734375, -7.9658203125, -7.652587890625, -7.33935546875, -7.026123046875, -6.712890625, -6.399658203125, -6.08642578125, -5.773193359375, -5.4599609375, -5.146728515625, -4.83349609375, -4.520263671875, -4.20703125, -3.893798828125, -3.58056640625, -3.267333984375, -2.9541015625, -2.640869140625, -2.32763671875, -2.014404296875, -1.701171875, -1.387939453125, -1.07470703125, -0.761474609375, -0.4482421875, -0.135009765625, 0.17822265625, 0.491455078125, 0.8046875, 1.117919921875, 1.43115234375, 1.744384765625, 2.0576171875, 2.370849609375, 2.68408203125, 2.997314453125, 3.310546875, 3.623779296875, 3.93701171875, 4.250244140625, 4.5634765625, 4.876708984375, 5.18994140625, 5.503173828125, 5.81640625, 6.129638671875, 6.44287109375, 6.756103515625, 7.0693359375, 7.382568359375, 7.69580078125, 8.009033203125, 8.322265625, 8.635498046875, 8.94873046875, 9.261962890625, 9.5751953125, 9.888427734375, 10.20166015625, 10.514892578125, 10.828125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 4.0, 5.0, 9.0, 12.0, 14.0, 25.0, 24.0, 32.0, 47.0, 56.0, 69.0, 95.0, 121.0, 165.0, 256.0, 315.0, 459.0, 514.0, 432.0, 365.0, 241.0, 198.0, 139.0, 111.0, 100.0, 48.0, 46.0, 29.0, 28.0, 28.0, 20.0, 14.0, 14.0, 7.0, 14.0, 5.0, 6.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.265625, -5.0748291015625, -4.884033203125, -4.6932373046875, -4.50244140625, -4.3116455078125, -4.120849609375, -3.9300537109375, -3.7392578125, -3.5484619140625, -3.357666015625, -3.1668701171875, -2.97607421875, -2.7852783203125, -2.594482421875, -2.4036865234375, -2.212890625, -2.0220947265625, -1.831298828125, -1.6405029296875, -1.44970703125, -1.2589111328125, -1.068115234375, -0.8773193359375, -0.6865234375, -0.4957275390625, -0.304931640625, -0.1141357421875, 0.07666015625, 0.2674560546875, 0.458251953125, 0.6490478515625, 0.83984375, 1.0306396484375, 1.221435546875, 1.4122314453125, 1.60302734375, 1.7938232421875, 1.984619140625, 2.1754150390625, 2.3662109375, 2.5570068359375, 2.747802734375, 2.9385986328125, 3.12939453125, 3.3201904296875, 3.510986328125, 3.7017822265625, 3.892578125, 4.0833740234375, 4.274169921875, 4.4649658203125, 4.65576171875, 4.8465576171875, 5.037353515625, 5.2281494140625, 5.4189453125, 5.6097412109375, 5.800537109375, 5.9913330078125, 6.18212890625, 6.3729248046875, 6.563720703125, 6.7545166015625, 6.9453125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 7.0, 8.0, 15.0, 13.0, 34.0, 32.0, 52.0, 79.0, 108.0, 169.0, 266.0, 437.0, 716.0, 1310.0, 2560.0, 5203.0, 12172.0, 32731.0, 106639.0, 449253.0, 2337547.0, 965616.0, 191874.0, 53867.0, 18426.0, 7550.0, 3482.0, 1663.0, 1013.0, 542.0, 305.0, 194.0, 134.0, 95.0, 57.0, 37.0, 21.0, 15.0, 15.0, 8.0, 3.0, 4.0, 3.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.4122314453125, -8.129150390625, -7.8460693359375, -7.56298828125, -7.2799072265625, -6.996826171875, -6.7137451171875, -6.4306640625, -6.1475830078125, -5.864501953125, -5.5814208984375, -5.29833984375, -5.0152587890625, -4.732177734375, -4.4490966796875, -4.166015625, -3.8829345703125, -3.599853515625, -3.3167724609375, -3.03369140625, -2.7506103515625, -2.467529296875, -2.1844482421875, -1.9013671875, -1.6182861328125, -1.335205078125, -1.0521240234375, -0.76904296875, -0.4859619140625, -0.202880859375, 0.0802001953125, 0.36328125, 0.6463623046875, 0.929443359375, 1.2125244140625, 1.49560546875, 1.7786865234375, 2.061767578125, 2.3448486328125, 2.6279296875, 2.9110107421875, 3.194091796875, 3.4771728515625, 3.76025390625, 4.0433349609375, 4.326416015625, 4.6094970703125, 4.892578125, 5.1756591796875, 5.458740234375, 5.7418212890625, 6.02490234375, 6.3079833984375, 6.591064453125, 6.8741455078125, 7.1572265625, 7.4403076171875, 7.723388671875, 8.0064697265625, 8.28955078125, 8.5726318359375, 8.855712890625, 9.1387939453125, 9.421875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 23.0, 202.0, 437.0, 296.0, 51.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-228.0792236328125, -223.8254852294922, -219.57176208496094, -215.31802368164062, -211.0642852783203, -206.810546875, -202.55682373046875, -198.30308532714844, -194.04934692382812, -189.7956085205078, -185.54188537597656, -181.28814697265625, -177.03440856933594, -172.78067016601562, -168.52694702148438, -164.27320861816406, -160.01947021484375, -155.76573181152344, -151.5120086669922, -147.25827026367188, -143.00453186035156, -138.75079345703125, -134.4970703125, -130.2433319091797, -125.98960876464844, -121.73587799072266, -117.48213958740234, -113.22840881347656, -108.97467041015625, -104.72093963623047, -100.46720886230469, -96.21347045898438, -91.95973205566406, -87.70600128173828, -83.45226287841797, -79.19853210449219, -74.94479370117188, -70.6910629272461, -66.43733215332031, -62.18359375, -57.92985916137695, -53.676124572753906, -49.42238998413086, -45.16865539550781, -40.91492462158203, -36.66118621826172, -32.40745544433594, -28.15372085571289, -23.899986267089844, -19.646251678466797, -15.392518043518066, -11.138784408569336, -6.885049819946289, -2.631315231323242, 1.6224174499511719, 5.876152038574219, 10.129886627197266, 14.383621215820312, 18.63735580444336, 22.891088485717773, 27.14482307434082, 31.398557662963867, 35.65229034423828, 39.90602493286133, 44.159759521484375]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 12.0, 9.0, 14.0, 17.0, 15.0, 25.0, 27.0, 23.0, 23.0, 40.0, 40.0, 45.0, 41.0, 47.0, 33.0, 44.0, 42.0, 55.0, 53.0, 43.0, 47.0, 29.0, 32.0, 30.0, 34.0, 23.0, 28.0, 21.0, 20.0, 11.0, 8.0, 18.0, 10.0, 9.0, 9.0, 6.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.772537231445312, -26.928003311157227, -26.08346939086914, -25.238933563232422, -24.394399642944336, -23.54986572265625, -22.70532989501953, -21.860795974731445, -21.01626205444336, -20.171728134155273, -19.327194213867188, -18.48265838623047, -17.638124465942383, -16.793590545654297, -15.949055671691895, -15.104520797729492, -14.259986877441406, -13.41545295715332, -12.570918083190918, -11.726383209228516, -10.88184928894043, -10.037315368652344, -9.192780494689941, -8.348245620727539, -7.503711700439453, -6.659177303314209, -5.814642906188965, -4.970108509063721, -4.125574111938477, -3.2810397148132324, -2.4365053176879883, -1.5919709205627441, -0.7474365234375, 0.09709787368774414, 0.9416322708129883, 1.7861666679382324, 2.6307010650634766, 3.4752354621887207, 4.319769859313965, 5.164304256439209, 6.008838653564453, 6.853373050689697, 7.697907447814941, 8.542442321777344, 9.38697624206543, 10.231510162353516, 11.076045036315918, 11.92057991027832, 12.765113830566406, 13.609647750854492, 14.454182624816895, 15.298717498779297, 16.143251419067383, 16.98778533935547, 17.832321166992188, 18.676855087280273, 19.52138900756836, 20.365922927856445, 21.21045684814453, 22.05499267578125, 22.899526596069336, 23.744060516357422, 24.58859634399414, 25.433130264282227, 26.277664184570312]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 7.0, 4.0, 5.0, 10.0, 9.0, 14.0, 15.0, 16.0, 20.0, 20.0, 14.0, 27.0, 27.0, 31.0, 43.0, 27.0, 40.0, 39.0, 34.0, 47.0, 49.0, 39.0, 46.0, 26.0, 45.0, 35.0, 45.0, 43.0, 35.0, 36.0, 26.0, 22.0, 22.0, 13.0, 21.0, 12.0, 10.0, 13.0, 4.0, 3.0, 5.0, 3.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.77734375, -3.6337890625, -3.490234375, -3.3466796875, -3.203125, -3.0595703125, -2.916015625, -2.7724609375, -2.62890625, -2.4853515625, -2.341796875, -2.1982421875, -2.0546875, -1.9111328125, -1.767578125, -1.6240234375, -1.48046875, -1.3369140625, -1.193359375, -1.0498046875, -0.90625, -0.7626953125, -0.619140625, -0.4755859375, -0.33203125, -0.1884765625, -0.044921875, 0.0986328125, 0.2421875, 0.3857421875, 0.529296875, 0.6728515625, 0.81640625, 0.9599609375, 1.103515625, 1.2470703125, 1.390625, 1.5341796875, 1.677734375, 1.8212890625, 1.96484375, 2.1083984375, 2.251953125, 2.3955078125, 2.5390625, 2.6826171875, 2.826171875, 2.9697265625, 3.11328125, 3.2568359375, 3.400390625, 3.5439453125, 3.6875, 3.8310546875, 3.974609375, 4.1181640625, 4.26171875, 4.4052734375, 4.548828125, 4.6923828125, 4.8359375, 4.9794921875, 5.123046875, 5.2666015625, 5.41015625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 4.0, 4.0, 3.0, 7.0, 8.0, 11.0, 15.0, 27.0, 52.0, 64.0, 95.0, 147.0, 226.0, 328.0, 470.0, 716.0, 1140.0, 1751.0, 2745.0, 4109.0, 6326.0, 9837.0, 16274.0, 26956.0, 45675.0, 78398.0, 136040.0, 245950.0, 200151.0, 110109.0, 64070.0, 37222.0, 22286.0, 13550.0, 8259.0, 5364.0, 3403.0, 2374.0, 1487.0, 962.0, 649.0, 441.0, 283.0, 194.0, 137.0, 70.0, 49.0, 42.0, 22.0, 20.0, 15.0, 8.0, 6.0, 9.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.026519775390625, -0.02563023567199707, -0.02474069595336914, -0.02385115623474121, -0.02296161651611328, -0.02207207679748535, -0.021182537078857422, -0.020292997360229492, -0.019403457641601562, -0.018513917922973633, -0.017624378204345703, -0.016734838485717773, -0.015845298767089844, -0.014955759048461914, -0.014066219329833984, -0.013176679611206055, -0.012287139892578125, -0.011397600173950195, -0.010508060455322266, -0.009618520736694336, -0.008728981018066406, -0.007839441299438477, -0.006949901580810547, -0.006060361862182617, -0.0051708221435546875, -0.004281282424926758, -0.003391742706298828, -0.0025022029876708984, -0.0016126632690429688, -0.0007231235504150391, 0.00016641616821289062, 0.0010559558868408203, 0.00194549560546875, 0.0028350353240966797, 0.0037245750427246094, 0.004614114761352539, 0.005503654479980469, 0.0063931941986083984, 0.007282733917236328, 0.008172273635864258, 0.009061813354492188, 0.009951353073120117, 0.010840892791748047, 0.011730432510375977, 0.012619972229003906, 0.013509511947631836, 0.014399051666259766, 0.015288591384887695, 0.016178131103515625, 0.017067670822143555, 0.017957210540771484, 0.018846750259399414, 0.019736289978027344, 0.020625829696655273, 0.021515369415283203, 0.022404909133911133, 0.023294448852539062, 0.024183988571166992, 0.025073528289794922, 0.02596306800842285, 0.02685260772705078, 0.02774214744567871, 0.02863168716430664, 0.02952122688293457, 0.0304107666015625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 6.0, 1.0, 8.0, 5.0, 8.0, 9.0, 4.0, 11.0, 11.0, 13.0, 17.0, 13.0, 23.0, 21.0, 28.0, 20.0, 40.0, 26.0, 25.0, 33.0, 32.0, 29.0, 37.0, 32.0, 39.0, 1053.0, 39.0, 32.0, 44.0, 43.0, 31.0, 34.0, 26.0, 26.0, 28.0, 24.0, 19.0, 15.0, 12.0, 27.0, 15.0, 13.0, 13.0, 5.0, 9.0, 4.0, 8.0, 5.0, 5.0, 5.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-4.16015625, -4.0313720703125, -3.902587890625, -3.7738037109375, -3.64501953125, -3.5162353515625, -3.387451171875, -3.2586669921875, -3.1298828125, -3.0010986328125, -2.872314453125, -2.7435302734375, -2.61474609375, -2.4859619140625, -2.357177734375, -2.2283935546875, -2.099609375, -1.9708251953125, -1.842041015625, -1.7132568359375, -1.58447265625, -1.4556884765625, -1.326904296875, -1.1981201171875, -1.0693359375, -0.9405517578125, -0.811767578125, -0.6829833984375, -0.55419921875, -0.4254150390625, -0.296630859375, -0.1678466796875, -0.0390625, 0.0897216796875, 0.218505859375, 0.3472900390625, 0.47607421875, 0.6048583984375, 0.733642578125, 0.8624267578125, 0.9912109375, 1.1199951171875, 1.248779296875, 1.3775634765625, 1.50634765625, 1.6351318359375, 1.763916015625, 1.8927001953125, 2.021484375, 2.1502685546875, 2.279052734375, 2.4078369140625, 2.53662109375, 2.6654052734375, 2.794189453125, 2.9229736328125, 3.0517578125, 3.1805419921875, 3.309326171875, 3.4381103515625, 3.56689453125, 3.6956787109375, 3.824462890625, 3.9532470703125, 4.08203125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 9.0, 11.0, 19.0, 26.0, 33.0, 53.0, 62.0, 98.0, 124.0, 194.0, 244.0, 323.0, 472.0, 649.0, 943.0, 1339.0, 1790.0, 2588.0, 3590.0, 5094.0, 7336.0, 10543.0, 15321.0, 21905.0, 33232.0, 49156.0, 75730.0, 121485.0, 1240097.0, 179470.0, 110470.0, 69672.0, 45921.0, 30838.0, 20844.0, 13919.0, 10022.0, 6876.0, 4819.0, 3471.0, 2370.0, 1706.0, 1190.0, 876.0, 614.0, 445.0, 339.0, 226.0, 173.0, 133.0, 89.0, 60.0, 56.0, 32.0, 18.0, 18.0, 7.0, 2.0, 4.0, 0.0, 2.0], "bins": [-0.01357269287109375, -0.013147354125976562, -0.012722015380859375, -0.012296676635742188, -0.011871337890625, -0.011445999145507812, -0.011020660400390625, -0.010595321655273438, -0.01016998291015625, -0.009744644165039062, -0.009319305419921875, -0.008893966674804688, -0.0084686279296875, -0.008043289184570312, -0.007617950439453125, -0.0071926116943359375, -0.00676727294921875, -0.0063419342041015625, -0.005916595458984375, -0.0054912567138671875, -0.00506591796875, -0.0046405792236328125, -0.004215240478515625, -0.0037899017333984375, -0.00336456298828125, -0.0029392242431640625, -0.002513885498046875, -0.0020885467529296875, -0.0016632080078125, -0.0012378692626953125, -0.000812530517578125, -0.0003871917724609375, 3.814697265625e-05, 0.0004634857177734375, 0.000888824462890625, 0.0013141632080078125, 0.001739501953125, 0.0021648406982421875, 0.002590179443359375, 0.0030155181884765625, 0.00344085693359375, 0.0038661956787109375, 0.004291534423828125, 0.0047168731689453125, 0.0051422119140625, 0.0055675506591796875, 0.005992889404296875, 0.0064182281494140625, 0.00684356689453125, 0.0072689056396484375, 0.007694244384765625, 0.008119583129882812, 0.008544921875, 0.008970260620117188, 0.009395599365234375, 0.009820938110351562, 0.01024627685546875, 0.010671615600585938, 0.011096954345703125, 0.011522293090820312, 0.0119476318359375, 0.012372970581054688, 0.012798309326171875, 0.013223648071289062, 0.01364898681640625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 2.0, 4.0, 0.0, 6.0, 6.0, 10.0, 7.0, 13.0, 17.0, 15.0, 13.0, 22.0, 22.0, 20.0, 20.0, 38.0, 53.0, 79.0, 106.0, 118.0, 78.0, 72.0, 57.0, 31.0, 26.0, 22.0, 24.0, 20.0, 11.0, 10.0, 14.0, 4.0, 12.0, 8.0, 8.0, 3.0, 9.0, 3.0, 4.0, 2.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0265579223632812e-06, -1.9669532775878906e-06, -1.9073486328125e-06, -1.8477439880371094e-06, -1.7881393432617188e-06, -1.7285346984863281e-06, -1.6689300537109375e-06, -1.6093254089355469e-06, -1.5497207641601562e-06, -1.4901161193847656e-06, -1.430511474609375e-06, -1.3709068298339844e-06, -1.3113021850585938e-06, -1.2516975402832031e-06, -1.1920928955078125e-06, -1.1324882507324219e-06, -1.0728836059570312e-06, -1.0132789611816406e-06, -9.5367431640625e-07, -8.940696716308594e-07, -8.344650268554688e-07, -7.748603820800781e-07, -7.152557373046875e-07, -6.556510925292969e-07, -5.960464477539062e-07, -5.364418029785156e-07, -4.76837158203125e-07, -4.172325134277344e-07, -3.5762786865234375e-07, -2.980232238769531e-07, -2.384185791015625e-07, -1.7881393432617188e-07, -1.1920928955078125e-07, -5.960464477539063e-08, 0.0, 5.960464477539063e-08, 1.1920928955078125e-07, 1.7881393432617188e-07, 2.384185791015625e-07, 2.980232238769531e-07, 3.5762786865234375e-07, 4.172325134277344e-07, 4.76837158203125e-07, 5.364418029785156e-07, 5.960464477539062e-07, 6.556510925292969e-07, 7.152557373046875e-07, 7.748603820800781e-07, 8.344650268554688e-07, 8.940696716308594e-07, 9.5367431640625e-07, 1.0132789611816406e-06, 1.0728836059570312e-06, 1.1324882507324219e-06, 1.1920928955078125e-06, 1.2516975402832031e-06, 1.3113021850585938e-06, 1.3709068298339844e-06, 1.430511474609375e-06, 1.4901161193847656e-06, 1.5497207641601562e-06, 1.6093254089355469e-06, 1.6689300537109375e-06, 1.7285346984863281e-06, 1.7881393432617188e-06]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 5.0, 5.0, 5.0, 8.0, 6.0, 12.0, 10.0, 6.0, 13.0, 14.0, 19.0, 24.0, 33.0, 42.0, 69.0, 105.0, 241.0, 496.0, 8826.0, 1033589.0, 3968.0, 440.0, 213.0, 130.0, 56.0, 39.0, 23.0, 26.0, 21.0, 21.0, 18.0, 16.0, 8.0, 9.0, 7.0, 7.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.208087921142578e-05, -4.065129905939102e-05, -3.922171890735626e-05, -3.77921387553215e-05, -3.636255860328674e-05, -3.4932978451251984e-05, -3.3503398299217224e-05, -3.2073818147182465e-05, -3.0644237995147705e-05, -2.9214657843112946e-05, -2.7785077691078186e-05, -2.6355497539043427e-05, -2.4925917387008667e-05, -2.3496337234973907e-05, -2.2066757082939148e-05, -2.063717693090439e-05, -1.920759677886963e-05, -1.777801662683487e-05, -1.634843647480011e-05, -1.491885632276535e-05, -1.348927617073059e-05, -1.2059696018695831e-05, -1.0630115866661072e-05, -9.200535714626312e-06, -7.770955562591553e-06, -6.341375410556793e-06, -4.911795258522034e-06, -3.482215106487274e-06, -2.0526349544525146e-06, -6.230548024177551e-07, 8.065253496170044e-07, 2.236105501651764e-06, 3.6656856536865234e-06, 5.095265805721283e-06, 6.5248459577560425e-06, 7.954426109790802e-06, 9.384006261825562e-06, 1.0813586413860321e-05, 1.224316656589508e-05, 1.367274671792984e-05, 1.51023268699646e-05, 1.653190702199936e-05, 1.796148717403412e-05, 1.9391067326068878e-05, 2.0820647478103638e-05, 2.2250227630138397e-05, 2.3679807782173157e-05, 2.5109387934207916e-05, 2.6538968086242676e-05, 2.7968548238277435e-05, 2.9398128390312195e-05, 3.0827708542346954e-05, 3.2257288694381714e-05, 3.3686868846416473e-05, 3.511644899845123e-05, 3.654602915048599e-05, 3.797560930252075e-05, 3.940518945455551e-05, 4.083476960659027e-05, 4.226434975862503e-05, 4.369392991065979e-05, 4.512351006269455e-05, 4.655309021472931e-05, 4.798267036676407e-05, 4.941225051879883e-05]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [135.0, 852.0, 33.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.440404606815719e-07, -1.346054148143594e-07, 2.748296310528531e-07, 6.842646484983561e-07, 1.0936996659438591e-06, 1.5031348539196188e-06, 1.912569814521703e-06, 2.3220050024974626e-06, 2.7314399630995467e-06, 3.140874923701631e-06, 3.5503101116773905e-06, 3.95974529965315e-06, 4.369180260255234e-06, 4.7786152208573185e-06, 5.188050181459403e-06, 5.597485142061487e-06, 6.006920102663571e-06, 6.416355063265655e-06, 6.825790023867739e-06, 7.2352249844698235e-06, 7.644660399819259e-06, 8.054095815168694e-06, 8.463530321023427e-06, 8.872965736372862e-06, 9.282400242227595e-06, 9.69183565757703e-06, 1.0101270163431764e-05, 1.0510705578781199e-05, 1.0920140084635932e-05, 1.1329575499985367e-05, 1.17390100058401e-05, 1.2148445421189535e-05, 1.2557881746033672e-05, 1.2967317161383107e-05, 1.337675166723784e-05, 1.3786187082587276e-05, 1.4195621588442009e-05, 1.4605057003791444e-05, 1.5014491509646177e-05, 1.5423927834490314e-05, 1.5833362340345047e-05, 1.624279684619978e-05, 1.6652233171043918e-05, 1.706166767689865e-05, 1.7471102182753384e-05, 1.788053850759752e-05, 1.8289973013452254e-05, 1.8699407519306988e-05, 1.910884202516172e-05, 1.9518276531016454e-05, 1.992771285586059e-05, 2.0337147361715324e-05, 2.0746581867570058e-05, 2.1156018192414194e-05, 2.1565452698268928e-05, 2.197488720412366e-05, 2.2384323528967798e-05, 2.279375803482253e-05, 2.3203194359666668e-05, 2.36126288655214e-05, 2.4022063371376134e-05, 2.4431497877230868e-05, 2.4840934202075005e-05, 2.5250368707929738e-05, 2.565980321378447e-05]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 6.0, 0.0, 9.0, 0.0, 12.0, 0.0, 11.0, 13.0, 0.0, 23.0, 0.0, 33.0, 0.0, 41.0, 0.0, 53.0, 0.0, 76.0, 0.0, 81.0, 0.0, 109.0, 0.0, 102.0, 95.0, 0.0, 85.0, 0.0, 67.0, 0.0, 52.0, 0.0, 42.0, 0.0, 32.0, 0.0, 20.0, 0.0, 15.0, 13.0, 0.0, 8.0, 0.0, 6.0, 0.0, 6.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.0132789611816406e-06, -9.816139936447144e-07, -9.499490261077881e-07, -9.182840585708618e-07, -8.866190910339355e-07, -8.549541234970093e-07, -8.23289155960083e-07, -7.916241884231567e-07, -7.599592208862305e-07, -7.282942533493042e-07, -6.966292858123779e-07, -6.649643182754517e-07, -6.332993507385254e-07, -6.016343832015991e-07, -5.699694156646729e-07, -5.383044481277466e-07, -5.066394805908203e-07, -4.7497451305389404e-07, -4.4330954551696777e-07, -4.116445779800415e-07, -3.7997961044311523e-07, -3.4831464290618896e-07, -3.166496753692627e-07, -2.849847078323364e-07, -2.5331974029541016e-07, -2.2165477275848389e-07, -1.8998980522155762e-07, -1.5832483768463135e-07, -1.2665987014770508e-07, -9.499490261077881e-08, -6.332993507385254e-08, -3.166496753692627e-08, 0.0, 3.166496753692627e-08, 6.332993507385254e-08, 9.499490261077881e-08, 1.2665987014770508e-07, 1.5832483768463135e-07, 1.8998980522155762e-07, 2.2165477275848389e-07, 2.5331974029541016e-07, 2.849847078323364e-07, 3.166496753692627e-07, 3.4831464290618896e-07, 3.7997961044311523e-07, 4.116445779800415e-07, 4.4330954551696777e-07, 4.7497451305389404e-07, 5.066394805908203e-07, 5.383044481277466e-07, 5.699694156646729e-07, 6.016343832015991e-07, 6.332993507385254e-07, 6.649643182754517e-07, 6.966292858123779e-07, 7.282942533493042e-07, 7.599592208862305e-07, 7.916241884231567e-07, 8.23289155960083e-07, 8.549541234970093e-07, 8.866190910339355e-07, 9.182840585708618e-07, 9.499490261077881e-07, 9.816139936447144e-07, 1.0132789611816406e-06]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 7.0, 4.0, 5.0, 10.0, 9.0, 14.0, 15.0, 16.0, 20.0, 20.0, 14.0, 27.0, 27.0, 31.0, 43.0, 27.0, 40.0, 39.0, 34.0, 47.0, 49.0, 39.0, 46.0, 26.0, 45.0, 35.0, 45.0, 43.0, 35.0, 36.0, 26.0, 22.0, 22.0, 13.0, 21.0, 12.0, 10.0, 13.0, 4.0, 3.0, 5.0, 3.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.77734375, -3.6337890625, -3.490234375, -3.3466796875, -3.203125, -3.0595703125, -2.916015625, -2.7724609375, -2.62890625, -2.4853515625, -2.341796875, -2.1982421875, -2.0546875, -1.9111328125, -1.767578125, -1.6240234375, -1.48046875, -1.3369140625, -1.193359375, -1.0498046875, -0.90625, -0.7626953125, -0.619140625, -0.4755859375, -0.33203125, -0.1884765625, -0.044921875, 0.0986328125, 0.2421875, 0.3857421875, 0.529296875, 0.6728515625, 0.81640625, 0.9599609375, 1.103515625, 1.2470703125, 1.390625, 1.5341796875, 1.677734375, 1.8212890625, 1.96484375, 2.1083984375, 2.251953125, 2.3955078125, 2.5390625, 2.6826171875, 2.826171875, 2.9697265625, 3.11328125, 3.2568359375, 3.400390625, 3.5439453125, 3.6875, 3.8310546875, 3.974609375, 4.1181640625, 4.26171875, 4.4052734375, 4.548828125, 4.6923828125, 4.8359375, 4.9794921875, 5.123046875, 5.2666015625, 5.41015625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 5.0, 5.0, 13.0, 13.0, 20.0, 21.0, 33.0, 63.0, 73.0, 101.0, 136.0, 192.0, 307.0, 426.0, 701.0, 1008.0, 1549.0, 2288.0, 3599.0, 5671.0, 8651.0, 13540.0, 21440.0, 34932.0, 57832.0, 100797.0, 182807.0, 274526.0, 136405.0, 78568.0, 46082.0, 27662.0, 17400.0, 11204.0, 7150.0, 4594.0, 2989.0, 1918.0, 1248.0, 856.0, 538.0, 376.0, 250.0, 167.0, 121.0, 78.0, 61.0, 46.0, 29.0, 25.0, 14.0, 12.0, 5.0, 4.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.4921875, -4.34381103515625, -4.1954345703125, -4.04705810546875, -3.898681640625, -3.75030517578125, -3.6019287109375, -3.45355224609375, -3.30517578125, -3.15679931640625, -3.0084228515625, -2.86004638671875, -2.711669921875, -2.56329345703125, -2.4149169921875, -2.26654052734375, -2.1181640625, -1.96978759765625, -1.8214111328125, -1.67303466796875, -1.524658203125, -1.37628173828125, -1.2279052734375, -1.07952880859375, -0.93115234375, -0.78277587890625, -0.6343994140625, -0.48602294921875, -0.337646484375, -0.18927001953125, -0.0408935546875, 0.10748291015625, 0.255859375, 0.40423583984375, 0.5526123046875, 0.70098876953125, 0.849365234375, 0.99774169921875, 1.1461181640625, 1.29449462890625, 1.44287109375, 1.59124755859375, 1.7396240234375, 1.88800048828125, 2.036376953125, 2.18475341796875, 2.3331298828125, 2.48150634765625, 2.6298828125, 2.77825927734375, 2.9266357421875, 3.07501220703125, 3.223388671875, 3.37176513671875, 3.5201416015625, 3.66851806640625, 3.81689453125, 3.96527099609375, 4.1136474609375, 4.26202392578125, 4.410400390625, 4.55877685546875, 4.7071533203125, 4.85552978515625, 5.00390625]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 1.0, 5.0, 4.0, 8.0, 8.0, 7.0, 3.0, 8.0, 9.0, 10.0, 10.0, 11.0, 28.0, 14.0, 23.0, 22.0, 23.0, 32.0, 30.0, 34.0, 30.0, 62.0, 54.0, 87.0, 108.0, 190.0, 1350.0, 244.0, 129.0, 81.0, 67.0, 48.0, 28.0, 26.0, 40.0, 39.0, 24.0, 19.0, 31.0, 14.0, 16.0, 14.0, 9.0, 14.0, 8.0, 7.0, 10.0, 2.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.8046875, -9.4847412109375, -9.164794921875, -8.8448486328125, -8.52490234375, -8.2049560546875, -7.885009765625, -7.5650634765625, -7.2451171875, -6.9251708984375, -6.605224609375, -6.2852783203125, -5.96533203125, -5.6453857421875, -5.325439453125, -5.0054931640625, -4.685546875, -4.3656005859375, -4.045654296875, -3.7257080078125, -3.40576171875, -3.0858154296875, -2.765869140625, -2.4459228515625, -2.1259765625, -1.8060302734375, -1.486083984375, -1.1661376953125, -0.84619140625, -0.5262451171875, -0.206298828125, 0.1136474609375, 0.43359375, 0.7535400390625, 1.073486328125, 1.3934326171875, 1.71337890625, 2.0333251953125, 2.353271484375, 2.6732177734375, 2.9931640625, 3.3131103515625, 3.633056640625, 3.9530029296875, 4.27294921875, 4.5928955078125, 4.912841796875, 5.2327880859375, 5.552734375, 5.8726806640625, 6.192626953125, 6.5125732421875, 6.83251953125, 7.1524658203125, 7.472412109375, 7.7923583984375, 8.1123046875, 8.4322509765625, 8.752197265625, 9.0721435546875, 9.39208984375, 9.7120361328125, 10.031982421875, 10.3519287109375, 10.671875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 8.0, 9.0, 9.0, 8.0, 11.0, 15.0, 27.0, 29.0, 32.0, 42.0, 76.0, 69.0, 143.0, 188.0, 469.0, 1269.0, 4846.0, 23911.0, 164034.0, 2398536.0, 489662.0, 49519.0, 9188.0, 2107.0, 657.0, 275.0, 155.0, 94.0, 60.0, 51.0, 48.0, 40.0, 32.0, 15.0, 13.0, 15.0, 8.0, 6.0, 7.0, 8.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-13.90625, -13.4676513671875, -13.029052734375, -12.5904541015625, -12.15185546875, -11.7132568359375, -11.274658203125, -10.8360595703125, -10.3974609375, -9.9588623046875, -9.520263671875, -9.0816650390625, -8.64306640625, -8.2044677734375, -7.765869140625, -7.3272705078125, -6.888671875, -6.4500732421875, -6.011474609375, -5.5728759765625, -5.13427734375, -4.6956787109375, -4.257080078125, -3.8184814453125, -3.3798828125, -2.9412841796875, -2.502685546875, -2.0640869140625, -1.62548828125, -1.1868896484375, -0.748291015625, -0.3096923828125, 0.12890625, 0.5675048828125, 1.006103515625, 1.4447021484375, 1.88330078125, 2.3218994140625, 2.760498046875, 3.1990966796875, 3.6376953125, 4.0762939453125, 4.514892578125, 4.9534912109375, 5.39208984375, 5.8306884765625, 6.269287109375, 6.7078857421875, 7.146484375, 7.5850830078125, 8.023681640625, 8.4622802734375, 8.90087890625, 9.3394775390625, 9.778076171875, 10.2166748046875, 10.6552734375, 11.0938720703125, 11.532470703125, 11.9710693359375, 12.40966796875, 12.8482666015625, 13.286865234375, 13.7254638671875, 14.1640625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 17.0, 79.0, 310.0, 385.0, 180.0, 36.0, 6.0, 2.0, 1.0], "bins": [-177.2153778076172, -174.1724395751953, -171.12950134277344, -168.08656311035156, -165.0436248779297, -162.0006866455078, -158.95774841308594, -155.91481018066406, -152.8718719482422, -149.8289337158203, -146.78599548339844, -143.74305725097656, -140.7001190185547, -137.6571807861328, -134.61424255371094, -131.57130432128906, -128.52838134765625, -125.48544311523438, -122.4425048828125, -119.39956665039062, -116.35662841796875, -113.31369018554688, -110.270751953125, -107.22782135009766, -104.18487548828125, -101.14193725585938, -98.0989990234375, -95.05606079101562, -92.01312255859375, -88.97018432617188, -85.92724609375, -82.88431549072266, -79.84138488769531, -76.79844665527344, -73.75550842285156, -70.71257019042969, -67.66963195800781, -64.62669372558594, -61.58375930786133, -58.54082489013672, -55.49788284301758, -52.4549446105957, -49.41200637817383, -46.36907196044922, -43.326133728027344, -40.28319549560547, -37.240257263183594, -34.19731903076172, -31.154382705688477, -28.1114444732666, -25.06850814819336, -22.025569915771484, -18.98263168334961, -15.939695358276367, -12.896757125854492, -9.85382080078125, -6.810882568359375, -3.7679450511932373, -0.7250075340270996, 2.317930221557617, 5.360867500305176, 8.403804779052734, 11.44674301147461, 14.489679336547852, 17.532617568969727]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 2.0, 4.0, 2.0, 3.0, 7.0, 4.0, 8.0, 15.0, 13.0, 13.0, 24.0, 20.0, 23.0, 40.0, 49.0, 34.0, 44.0, 40.0, 41.0, 43.0, 41.0, 42.0, 44.0, 51.0, 54.0, 52.0, 42.0, 34.0, 38.0, 33.0, 24.0, 25.0, 18.0, 19.0, 8.0, 10.0, 11.0, 7.0, 13.0, 5.0, 5.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.805797576904297, -28.655921936035156, -27.506046295166016, -26.356168746948242, -25.2062931060791, -24.05641746520996, -22.906539916992188, -21.756664276123047, -20.606788635253906, -19.456912994384766, -18.307037353515625, -17.15715980529785, -16.00728416442871, -14.85740852355957, -13.707531929016113, -12.557655334472656, -11.407779693603516, -10.257904052734375, -9.108027458190918, -7.958151340484619, -6.80827522277832, -5.6583991050720215, -4.508522987365723, -3.3586463928222656, -2.208770751953125, -1.0588946342468262, 0.09098148345947266, 1.2408576011657715, 2.3907337188720703, 3.540609836578369, 4.690485954284668, 5.840362548828125, 6.990234375, 8.14011001586914, 9.289986610412598, 10.439863204956055, 11.589738845825195, 12.739614486694336, 13.889491081237793, 15.03936767578125, 16.18924331665039, 17.33911895751953, 18.488994598388672, 19.638872146606445, 20.788747787475586, 21.938623428344727, 23.0885009765625, 24.23837661743164, 25.38825225830078, 26.538127899169922, 27.688003540039062, 28.837881088256836, 29.987756729125977, 31.137632369995117, 32.28750991821289, 33.43738555908203, 34.58726119995117, 35.73713684082031, 36.88701248168945, 38.036888122558594, 39.186767578125, 40.33664321899414, 41.48651885986328, 42.63639450073242, 43.78627014160156]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 8.0, 11.0, 8.0, 21.0, 17.0, 22.0, 15.0, 23.0, 29.0, 35.0, 33.0, 31.0, 41.0, 40.0, 39.0, 53.0, 56.0, 39.0, 46.0, 43.0, 41.0, 53.0, 49.0, 40.0, 36.0, 33.0, 29.0, 18.0, 18.0, 16.0, 13.0, 13.0, 8.0, 5.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.51171875, -4.35260009765625, -4.1934814453125, -4.03436279296875, -3.875244140625, -3.71612548828125, -3.5570068359375, -3.39788818359375, -3.23876953125, -3.07965087890625, -2.9205322265625, -2.76141357421875, -2.602294921875, -2.44317626953125, -2.2840576171875, -2.12493896484375, -1.9658203125, -1.80670166015625, -1.6475830078125, -1.48846435546875, -1.329345703125, -1.17022705078125, -1.0111083984375, -0.85198974609375, -0.69287109375, -0.53375244140625, -0.3746337890625, -0.21551513671875, -0.056396484375, 0.10272216796875, 0.2618408203125, 0.42095947265625, 0.580078125, 0.73919677734375, 0.8983154296875, 1.05743408203125, 1.216552734375, 1.37567138671875, 1.5347900390625, 1.69390869140625, 1.85302734375, 2.01214599609375, 2.1712646484375, 2.33038330078125, 2.489501953125, 2.64862060546875, 2.8077392578125, 2.96685791015625, 3.1259765625, 3.28509521484375, 3.4442138671875, 3.60333251953125, 3.762451171875, 3.92156982421875, 4.0806884765625, 4.23980712890625, 4.39892578125, 4.55804443359375, 4.7171630859375, 4.87628173828125, 5.035400390625, 5.19451904296875, 5.3536376953125, 5.51275634765625, 5.671875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 11.0, 12.0, 14.0, 15.0, 24.0, 21.0, 31.0, 36.0, 61.0, 78.0, 78.0, 119.0, 219.0, 270.0, 444.0, 1688.0, 283132.0, 3902240.0, 4147.0, 509.0, 326.0, 202.0, 165.0, 94.0, 62.0, 62.0, 46.0, 37.0, 28.0, 23.0, 18.0, 13.0, 13.0, 11.0, 8.0, 5.0, 7.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.4375, -58.4326171875, -56.427734375, -54.4228515625, -52.41796875, -50.4130859375, -48.408203125, -46.4033203125, -44.3984375, -42.3935546875, -40.388671875, -38.3837890625, -36.37890625, -34.3740234375, -32.369140625, -30.3642578125, -28.359375, -26.3544921875, -24.349609375, -22.3447265625, -20.33984375, -18.3349609375, -16.330078125, -14.3251953125, -12.3203125, -10.3154296875, -8.310546875, -6.3056640625, -4.30078125, -2.2958984375, -0.291015625, 1.7138671875, 3.71875, 5.7236328125, 7.728515625, 9.7333984375, 11.73828125, 13.7431640625, 15.748046875, 17.7529296875, 19.7578125, 21.7626953125, 23.767578125, 25.7724609375, 27.77734375, 29.7822265625, 31.787109375, 33.7919921875, 35.796875, 37.8017578125, 39.806640625, 41.8115234375, 43.81640625, 45.8212890625, 47.826171875, 49.8310546875, 51.8359375, 53.8408203125, 55.845703125, 57.8505859375, 59.85546875, 61.8603515625, 63.865234375, 65.8701171875, 67.875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 6.0, 4.0, 7.0, 10.0, 9.0, 12.0, 22.0, 32.0, 26.0, 58.0, 64.0, 82.0, 151.0, 159.0, 225.0, 337.0, 497.0, 613.0, 521.0, 366.0, 223.0, 152.0, 133.0, 82.0, 72.0, 49.0, 42.0, 24.0, 20.0, 16.0, 21.0, 8.0, 9.0, 7.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3671875, -6.1583251953125, -5.949462890625, -5.7406005859375, -5.53173828125, -5.3228759765625, -5.114013671875, -4.9051513671875, -4.6962890625, -4.4874267578125, -4.278564453125, -4.0697021484375, -3.86083984375, -3.6519775390625, -3.443115234375, -3.2342529296875, -3.025390625, -2.8165283203125, -2.607666015625, -2.3988037109375, -2.18994140625, -1.9810791015625, -1.772216796875, -1.5633544921875, -1.3544921875, -1.1456298828125, -0.936767578125, -0.7279052734375, -0.51904296875, -0.3101806640625, -0.101318359375, 0.1075439453125, 0.31640625, 0.5252685546875, 0.734130859375, 0.9429931640625, 1.15185546875, 1.3607177734375, 1.569580078125, 1.7784423828125, 1.9873046875, 2.1961669921875, 2.405029296875, 2.6138916015625, 2.82275390625, 3.0316162109375, 3.240478515625, 3.4493408203125, 3.658203125, 3.8670654296875, 4.075927734375, 4.2847900390625, 4.49365234375, 4.7025146484375, 4.911376953125, 5.1202392578125, 5.3291015625, 5.5379638671875, 5.746826171875, 5.9556884765625, 6.16455078125, 6.3734130859375, 6.582275390625, 6.7911376953125, 7.0]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 7.0, 2.0, 9.0, 14.0, 13.0, 21.0, 20.0, 33.0, 51.0, 116.0, 280.0, 1128.0, 7638.0, 174921.0, 3908421.0, 94840.0, 5405.0, 918.0, 205.0, 97.0, 58.0, 31.0, 21.0, 14.0, 8.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.8125, -33.80126953125, -32.7900390625, -31.77880859375, -30.767578125, -29.75634765625, -28.7451171875, -27.73388671875, -26.72265625, -25.71142578125, -24.7001953125, -23.68896484375, -22.677734375, -21.66650390625, -20.6552734375, -19.64404296875, -18.6328125, -17.62158203125, -16.6103515625, -15.59912109375, -14.587890625, -13.57666015625, -12.5654296875, -11.55419921875, -10.54296875, -9.53173828125, -8.5205078125, -7.50927734375, -6.498046875, -5.48681640625, -4.4755859375, -3.46435546875, -2.453125, -1.44189453125, -0.4306640625, 0.58056640625, 1.591796875, 2.60302734375, 3.6142578125, 4.62548828125, 5.63671875, 6.64794921875, 7.6591796875, 8.67041015625, 9.681640625, 10.69287109375, 11.7041015625, 12.71533203125, 13.7265625, 14.73779296875, 15.7490234375, 16.76025390625, 17.771484375, 18.78271484375, 19.7939453125, 20.80517578125, 21.81640625, 22.82763671875, 23.8388671875, 24.85009765625, 25.861328125, 26.87255859375, 27.8837890625, 28.89501953125, 29.90625]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 9.0, 22.0, 104.0, 295.0, 369.0, 163.0, 39.0, 17.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-157.0868377685547, -154.0750732421875, -151.06329345703125, -148.05152893066406, -145.03976440429688, -142.02798461914062, -139.01622009277344, -136.00445556640625, -132.99267578125, -129.9809112548828, -126.9691390991211, -123.95736694335938, -120.94559478759766, -117.93382263183594, -114.92205810546875, -111.91028594970703, -108.89851379394531, -105.8867416381836, -102.8749771118164, -99.86320495605469, -96.85143280029297, -93.83966064453125, -90.82789611816406, -87.81612396240234, -84.80435943603516, -81.79258728027344, -78.78082275390625, -75.76905059814453, -72.75727844238281, -69.7455062866211, -66.7337417602539, -63.72196960449219, -60.71019744873047, -57.698429107666016, -54.6866569519043, -51.674888610839844, -48.663116455078125, -45.65134811401367, -42.63957977294922, -39.6278076171875, -36.61603546142578, -33.60426712036133, -30.59249496459961, -27.580726623535156, -24.568954467773438, -21.557186126708984, -18.5454158782959, -15.533645629882812, -12.52187728881836, -9.510107040405273, -6.498337268829346, -3.486567497253418, -0.47479724884033203, 2.536972999572754, 5.548742294311523, 8.56051254272461, 11.572282791137695, 14.584053039550781, 17.595823287963867, 20.607593536376953, 23.619361877441406, 26.631134033203125, 29.642902374267578, 32.65467071533203, 35.66644287109375]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 3.0, 4.0, 11.0, 5.0, 12.0, 8.0, 15.0, 13.0, 17.0, 18.0, 26.0, 22.0, 28.0, 24.0, 33.0, 34.0, 40.0, 44.0, 42.0, 33.0, 36.0, 39.0, 49.0, 39.0, 37.0, 37.0, 42.0, 29.0, 20.0, 37.0, 34.0, 34.0, 23.0, 17.0, 16.0, 16.0, 7.0, 7.0, 9.0, 8.0, 6.0, 4.0, 2.0, 6.0, 2.0, 1.0, 0.0, 4.0, 3.0, 1.0, 0.0, 2.0], "bins": [-21.501502990722656, -20.853721618652344, -20.20594024658203, -19.55815887451172, -18.910377502441406, -18.262596130371094, -17.61481475830078, -16.96703338623047, -16.319252014160156, -15.671470642089844, -15.023689270019531, -14.375907897949219, -13.728126525878906, -13.080345153808594, -12.432564735412598, -11.784783363342285, -11.137002944946289, -10.489221572875977, -9.841440200805664, -9.193658828735352, -8.545877456665039, -7.898096561431885, -7.2503156661987305, -6.602534294128418, -5.9547529220581055, -5.306971549987793, -4.6591901779174805, -4.011409282684326, -3.3636279106140137, -2.715846538543701, -2.0680654048919678, -1.4202842712402344, -0.7725028991699219, -0.12472164630889893, 0.523059606552124, 1.170840859413147, 1.81862211227417, 2.4664034843444824, 3.114184617996216, 3.761965751647949, 4.409747123718262, 5.057528495788574, 5.705309867858887, 6.353090763092041, 7.0008721351623535, 7.648653507232666, 8.29643440246582, 8.944215774536133, 9.591997146606445, 10.239778518676758, 10.88755989074707, 11.535341262817383, 12.183122634887695, 12.830904006958008, 13.478684425354004, 14.126465797424316, 14.774247169494629, 15.422028541564941, 16.069808959960938, 16.71759033203125, 17.365371704101562, 18.013153076171875, 18.660934448242188, 19.3087158203125, 19.956497192382812]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 11.0, 9.0, 4.0, 9.0, 12.0, 14.0, 15.0, 20.0, 22.0, 30.0, 23.0, 45.0, 34.0, 38.0, 41.0, 38.0, 39.0, 39.0, 42.0, 47.0, 36.0, 58.0, 55.0, 43.0, 45.0, 39.0, 22.0, 31.0, 28.0, 26.0, 14.0, 12.0, 18.0, 13.0, 7.0, 2.0, 9.0, 6.0, 2.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.55859375, -4.40673828125, -4.2548828125, -4.10302734375, -3.951171875, -3.79931640625, -3.6474609375, -3.49560546875, -3.34375, -3.19189453125, -3.0400390625, -2.88818359375, -2.736328125, -2.58447265625, -2.4326171875, -2.28076171875, -2.12890625, -1.97705078125, -1.8251953125, -1.67333984375, -1.521484375, -1.36962890625, -1.2177734375, -1.06591796875, -0.9140625, -0.76220703125, -0.6103515625, -0.45849609375, -0.306640625, -0.15478515625, -0.0029296875, 0.14892578125, 0.30078125, 0.45263671875, 0.6044921875, 0.75634765625, 0.908203125, 1.06005859375, 1.2119140625, 1.36376953125, 1.515625, 1.66748046875, 1.8193359375, 1.97119140625, 2.123046875, 2.27490234375, 2.4267578125, 2.57861328125, 2.73046875, 2.88232421875, 3.0341796875, 3.18603515625, 3.337890625, 3.48974609375, 3.6416015625, 3.79345703125, 3.9453125, 4.09716796875, 4.2490234375, 4.40087890625, 4.552734375, 4.70458984375, 4.8564453125, 5.00830078125, 5.16015625]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 13.0, 20.0, 9.0, 24.0, 44.0, 50.0, 75.0, 120.0, 169.0, 270.0, 404.0, 578.0, 881.0, 1270.0, 1945.0, 3017.0, 4546.0, 6918.0, 10764.0, 16554.0, 25736.0, 41536.0, 67785.0, 115162.0, 196834.0, 220348.0, 130470.0, 76498.0, 45798.0, 28449.0, 18214.0, 11709.0, 7494.0, 5018.0, 3235.0, 2176.0, 1397.0, 1040.0, 684.0, 432.0, 301.0, 181.0, 124.0, 91.0, 55.0, 29.0, 22.0, 28.0, 16.0, 7.0, 7.0, 1.0, 3.0, 2.0, 5.0], "bins": [-0.03131103515625, -0.030393123626708984, -0.02947521209716797, -0.028557300567626953, -0.027639389038085938, -0.026721477508544922, -0.025803565979003906, -0.02488565444946289, -0.023967742919921875, -0.02304983139038086, -0.022131919860839844, -0.021214008331298828, -0.020296096801757812, -0.019378185272216797, -0.01846027374267578, -0.017542362213134766, -0.01662445068359375, -0.015706539154052734, -0.014788627624511719, -0.013870716094970703, -0.012952804565429688, -0.012034893035888672, -0.011116981506347656, -0.01019906997680664, -0.009281158447265625, -0.00836324691772461, -0.007445335388183594, -0.006527423858642578, -0.0056095123291015625, -0.004691600799560547, -0.0037736892700195312, -0.0028557777404785156, -0.0019378662109375, -0.0010199546813964844, -0.00010204315185546875, 0.0008158683776855469, 0.0017337799072265625, 0.002651691436767578, 0.0035696029663085938, 0.004487514495849609, 0.005405426025390625, 0.006323337554931641, 0.007241249084472656, 0.008159160614013672, 0.009077072143554688, 0.009994983673095703, 0.010912895202636719, 0.011830806732177734, 0.01274871826171875, 0.013666629791259766, 0.014584541320800781, 0.015502452850341797, 0.016420364379882812, 0.017338275909423828, 0.018256187438964844, 0.01917409896850586, 0.020092010498046875, 0.02100992202758789, 0.021927833557128906, 0.022845745086669922, 0.023763656616210938, 0.024681568145751953, 0.02559947967529297, 0.026517391204833984, 0.027435302734375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 7.0, 4.0, 12.0, 8.0, 5.0, 12.0, 9.0, 9.0, 18.0, 17.0, 21.0, 16.0, 25.0, 24.0, 24.0, 38.0, 31.0, 38.0, 38.0, 26.0, 33.0, 28.0, 45.0, 1064.0, 43.0, 30.0, 34.0, 38.0, 43.0, 38.0, 29.0, 38.0, 21.0, 25.0, 20.0, 16.0, 17.0, 18.0, 12.0, 14.0, 7.0, 12.0, 5.0, 1.0, 4.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.455078125, -3.344146728515625, -3.23321533203125, -3.122283935546875, -3.0113525390625, -2.900421142578125, -2.78948974609375, -2.678558349609375, -2.567626953125, -2.456695556640625, -2.34576416015625, -2.234832763671875, -2.1239013671875, -2.012969970703125, -1.90203857421875, -1.791107177734375, -1.68017578125, -1.569244384765625, -1.45831298828125, -1.347381591796875, -1.2364501953125, -1.125518798828125, -1.01458740234375, -0.903656005859375, -0.792724609375, -0.681793212890625, -0.57086181640625, -0.459930419921875, -0.3489990234375, -0.238067626953125, -0.12713623046875, -0.016204833984375, 0.0947265625, 0.205657958984375, 0.31658935546875, 0.427520751953125, 0.5384521484375, 0.649383544921875, 0.76031494140625, 0.871246337890625, 0.982177734375, 1.093109130859375, 1.20404052734375, 1.314971923828125, 1.4259033203125, 1.536834716796875, 1.64776611328125, 1.758697509765625, 1.86962890625, 1.980560302734375, 2.09149169921875, 2.202423095703125, 2.3133544921875, 2.424285888671875, 2.53521728515625, 2.646148681640625, 2.757080078125, 2.868011474609375, 2.97894287109375, 3.089874267578125, 3.2008056640625, 3.311737060546875, 3.42266845703125, 3.533599853515625, 3.64453125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 4.0, 3.0, 10.0, 16.0, 8.0, 15.0, 20.0, 31.0, 57.0, 82.0, 129.0, 167.0, 226.0, 313.0, 460.0, 679.0, 936.0, 1324.0, 1967.0, 2946.0, 4105.0, 6119.0, 8909.0, 13251.0, 19582.0, 29283.0, 44892.0, 69324.0, 107847.0, 169693.0, 1240814.0, 130051.0, 82679.0, 53906.0, 34815.0, 23231.0, 15695.0, 10540.0, 7291.0, 4872.0, 3340.0, 2292.0, 1529.0, 1124.0, 753.0, 559.0, 393.0, 259.0, 183.0, 118.0, 110.0, 64.0, 41.0, 32.0, 20.0, 9.0, 11.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.01202392578125, -0.011638641357421875, -0.01125335693359375, -0.010868072509765625, -0.0104827880859375, -0.010097503662109375, -0.00971221923828125, -0.009326934814453125, -0.008941650390625, -0.008556365966796875, -0.00817108154296875, -0.007785797119140625, -0.0074005126953125, -0.007015228271484375, -0.00662994384765625, -0.006244659423828125, -0.005859375, -0.005474090576171875, -0.00508880615234375, -0.004703521728515625, -0.0043182373046875, -0.003932952880859375, -0.00354766845703125, -0.003162384033203125, -0.002777099609375, -0.002391815185546875, -0.00200653076171875, -0.001621246337890625, -0.0012359619140625, -0.000850677490234375, -0.00046539306640625, -8.0108642578125e-05, 0.00030517578125, 0.000690460205078125, 0.00107574462890625, 0.001461029052734375, 0.0018463134765625, 0.002231597900390625, 0.00261688232421875, 0.003002166748046875, 0.003387451171875, 0.003772735595703125, 0.00415802001953125, 0.004543304443359375, 0.0049285888671875, 0.005313873291015625, 0.00569915771484375, 0.006084442138671875, 0.0064697265625, 0.006855010986328125, 0.00724029541015625, 0.007625579833984375, 0.0080108642578125, 0.008396148681640625, 0.00878143310546875, 0.009166717529296875, 0.009552001953125, 0.009937286376953125, 0.01032257080078125, 0.010707855224609375, 0.0110931396484375, 0.011478424072265625, 0.01186370849609375, 0.012248992919921875, 0.01263427734375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 12.0, 0.0, 9.0, 3.0, 8.0, 0.0, 11.0, 20.0, 20.0, 0.0, 12.0, 13.0, 19.0, 0.0, 27.0, 52.0, 56.0, 84.0, 0.0, 107.0, 123.0, 106.0, 0.0, 83.0, 45.0, 45.0, 0.0, 30.0, 27.0, 23.0, 0.0, 14.0, 15.0, 8.0, 4.0, 0.0, 12.0, 8.0, 3.0, 0.0, 2.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.6689300537109375e-06, -1.623295247554779e-06, -1.5776604413986206e-06, -1.5320256352424622e-06, -1.4863908290863037e-06, -1.4407560229301453e-06, -1.3951212167739868e-06, -1.3494864106178284e-06, -1.30385160446167e-06, -1.2582167983055115e-06, -1.212581992149353e-06, -1.1669471859931946e-06, -1.1213123798370361e-06, -1.0756775736808777e-06, -1.0300427675247192e-06, -9.844079613685608e-07, -9.387731552124023e-07, -8.931383490562439e-07, -8.475035429000854e-07, -8.01868736743927e-07, -7.562339305877686e-07, -7.105991244316101e-07, -6.649643182754517e-07, -6.193295121192932e-07, -5.736947059631348e-07, -5.280598998069763e-07, -4.824250936508179e-07, -4.367902874946594e-07, -3.91155481338501e-07, -3.4552067518234253e-07, -2.998858690261841e-07, -2.5425106287002563e-07, -2.086162567138672e-07, -1.6298145055770874e-07, -1.1734664440155029e-07, -7.171183824539185e-08, -2.60770320892334e-08, 1.955777406692505e-08, 6.51925802230835e-08, 1.1082738637924194e-07, 1.564621925354004e-07, 2.0209699869155884e-07, 2.477318048477173e-07, 2.9336661100387573e-07, 3.390014171600342e-07, 3.8463622331619263e-07, 4.302710294723511e-07, 4.759058356285095e-07, 5.21540641784668e-07, 5.671754479408264e-07, 6.128102540969849e-07, 6.584450602531433e-07, 7.040798664093018e-07, 7.497146725654602e-07, 7.953494787216187e-07, 8.409842848777771e-07, 8.866190910339355e-07, 9.32253897190094e-07, 9.778887033462524e-07, 1.0235235095024109e-06, 1.0691583156585693e-06, 1.1147931218147278e-06, 1.1604279279708862e-06, 1.2060627341270447e-06, 1.2516975402832031e-06]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 5.0, 12.0, 5.0, 7.0, 7.0, 8.0, 15.0, 16.0, 26.0, 36.0, 39.0, 53.0, 99.0, 189.0, 419.0, 4292.0, 935321.0, 105947.0, 1243.0, 346.0, 134.0, 86.0, 49.0, 46.0, 30.0, 27.0, 12.0, 12.0, 18.0, 15.0, 8.0, 5.0, 4.0, 8.0, 9.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9802322387695312e-05, -2.864748239517212e-05, -2.7492642402648926e-05, -2.6337802410125732e-05, -2.518296241760254e-05, -2.4028122425079346e-05, -2.2873282432556152e-05, -2.171844244003296e-05, -2.0563602447509766e-05, -1.9408762454986572e-05, -1.825392246246338e-05, -1.7099082469940186e-05, -1.5944242477416992e-05, -1.4789402484893799e-05, -1.3634562492370605e-05, -1.2479722499847412e-05, -1.1324882507324219e-05, -1.0170042514801025e-05, -9.015202522277832e-06, -7.860362529754639e-06, -6.705522537231445e-06, -5.550682544708252e-06, -4.395842552185059e-06, -3.2410025596618652e-06, -2.086162567138672e-06, -9.313225746154785e-07, 2.2351741790771484e-07, 1.3783574104309082e-06, 2.5331974029541016e-06, 3.688037395477295e-06, 4.842877388000488e-06, 5.997717380523682e-06, 7.152557373046875e-06, 8.307397365570068e-06, 9.462237358093262e-06, 1.0617077350616455e-05, 1.1771917343139648e-05, 1.2926757335662842e-05, 1.4081597328186035e-05, 1.5236437320709229e-05, 1.6391277313232422e-05, 1.7546117305755615e-05, 1.870095729827881e-05, 1.9855797290802002e-05, 2.1010637283325195e-05, 2.216547727584839e-05, 2.3320317268371582e-05, 2.4475157260894775e-05, 2.562999725341797e-05, 2.6784837245941162e-05, 2.7939677238464355e-05, 2.909451723098755e-05, 3.0249357223510742e-05, 3.1404197216033936e-05, 3.255903720855713e-05, 3.371387720108032e-05, 3.4868717193603516e-05, 3.602355718612671e-05, 3.71783971786499e-05, 3.8333237171173096e-05, 3.948807716369629e-05, 4.064291715621948e-05, 4.1797757148742676e-05, 4.295259714126587e-05, 4.410743713378906e-05]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [136.0, 852.0, 32.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.463166985464341e-07, -1.3300893897394417e-07, 2.802988205985457e-07, 6.936065233276167e-07, 1.1069143965869443e-06, 1.520222213002853e-06, 1.9335298020450864e-06, 2.346837618460995e-06, 2.760145434876904e-06, 3.1734532512928126e-06, 3.5867610677087214e-06, 4.000068656750955e-06, 4.413376700540539e-06, 4.826684289582772e-06, 5.2399918786250055e-06, 5.65329992241459e-06, 6.066607511456823e-06, 6.479915100499056e-06, 6.8932231442886405e-06, 7.306530733330874e-06, 7.719838322373107e-06, 8.133146366162691e-06, 8.546454409952275e-06, 8.959761544247158e-06, 9.373069588036742e-06, 9.786377631826326e-06, 1.0199684766121209e-05, 1.0612992809910793e-05, 1.1026300853700377e-05, 1.143960798799526e-05, 1.1852916031784844e-05, 1.2266224075574428e-05, 1.267953120986931e-05, 1.3092839253658894e-05, 1.3506146387953777e-05, 1.3919454431743361e-05, 1.4332762475532945e-05, 1.474607051932253e-05, 1.5159377653617412e-05, 1.5572684787912294e-05, 1.598599374119658e-05, 1.6399300875491463e-05, 1.681260982877575e-05, 1.722591696307063e-05, 1.7639224097365513e-05, 1.80525330506498e-05, 1.8465840184944682e-05, 1.8879147319239564e-05, 1.929245627252385e-05, 1.9705763406818733e-05, 2.011907236010302e-05, 2.05323794943979e-05, 2.0945686628692783e-05, 2.135899558197707e-05, 2.1772302716271952e-05, 2.2185609850566834e-05, 2.2598916984861717e-05, 2.30122241191566e-05, 2.3425533072440885e-05, 2.3838840206735767e-05, 2.425214734103065e-05, 2.4665456294314936e-05, 2.5078763428609818e-05, 2.54920705629047e-05, 2.5905379516188987e-05]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 4.0, 0.0, 10.0, 0.0, 21.0, 0.0, 25.0, 0.0, 32.0, 0.0, 50.0, 0.0, 46.0, 0.0, 64.0, 0.0, 70.0, 0.0, 92.0, 113.0, 0.0, 99.0, 0.0, 82.0, 0.0, 88.0, 0.0, 66.0, 0.0, 44.0, 0.0, 43.0, 0.0, 18.0, 0.0, 17.0, 0.0, 16.0, 0.0, 4.0, 0.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0132789611816406e-06, -9.825453162193298e-07, -9.51811671257019e-07, -9.210780262947083e-07, -8.903443813323975e-07, -8.596107363700867e-07, -8.288770914077759e-07, -7.981434464454651e-07, -7.674098014831543e-07, -7.366761565208435e-07, -7.059425115585327e-07, -6.752088665962219e-07, -6.444752216339111e-07, -6.137415766716003e-07, -5.830079317092896e-07, -5.522742867469788e-07, -5.21540641784668e-07, -4.908069968223572e-07, -4.600733518600464e-07, -4.293397068977356e-07, -3.986060619354248e-07, -3.67872416973114e-07, -3.371387720108032e-07, -3.0640512704849243e-07, -2.7567148208618164e-07, -2.4493783712387085e-07, -2.1420419216156006e-07, -1.8347054719924927e-07, -1.5273690223693848e-07, -1.2200325727462769e-07, -9.12696123123169e-08, -6.05359673500061e-08, -2.9802322387695312e-08, 9.313225746154785e-10, 3.166496753692627e-08, 6.239861249923706e-08, 9.313225746154785e-08, 1.2386590242385864e-07, 1.5459954738616943e-07, 1.8533319234848022e-07, 2.1606683731079102e-07, 2.468004822731018e-07, 2.775341272354126e-07, 3.082677721977234e-07, 3.390014171600342e-07, 3.6973506212234497e-07, 4.0046870708465576e-07, 4.3120235204696655e-07, 4.6193599700927734e-07, 4.926696419715881e-07, 5.234032869338989e-07, 5.541369318962097e-07, 5.848705768585205e-07, 6.156042218208313e-07, 6.463378667831421e-07, 6.770715117454529e-07, 7.078051567077637e-07, 7.385388016700745e-07, 7.692724466323853e-07, 8.00006091594696e-07, 8.307397365570068e-07, 8.614733815193176e-07, 8.922070264816284e-07, 9.229406714439392e-07, 9.5367431640625e-07]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 11.0, 9.0, 4.0, 9.0, 12.0, 14.0, 15.0, 20.0, 22.0, 30.0, 23.0, 45.0, 34.0, 38.0, 41.0, 38.0, 39.0, 39.0, 42.0, 47.0, 36.0, 58.0, 55.0, 43.0, 45.0, 39.0, 22.0, 31.0, 28.0, 26.0, 14.0, 12.0, 18.0, 13.0, 7.0, 2.0, 9.0, 6.0, 2.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.55859375, -4.40673828125, -4.2548828125, -4.10302734375, -3.951171875, -3.79931640625, -3.6474609375, -3.49560546875, -3.34375, -3.19189453125, -3.0400390625, -2.88818359375, -2.736328125, -2.58447265625, -2.4326171875, -2.28076171875, -2.12890625, -1.97705078125, -1.8251953125, -1.67333984375, -1.521484375, -1.36962890625, -1.2177734375, -1.06591796875, -0.9140625, -0.76220703125, -0.6103515625, -0.45849609375, -0.306640625, -0.15478515625, -0.0029296875, 0.14892578125, 0.30078125, 0.45263671875, 0.6044921875, 0.75634765625, 0.908203125, 1.06005859375, 1.2119140625, 1.36376953125, 1.515625, 1.66748046875, 1.8193359375, 1.97119140625, 2.123046875, 2.27490234375, 2.4267578125, 2.57861328125, 2.73046875, 2.88232421875, 3.0341796875, 3.18603515625, 3.337890625, 3.48974609375, 3.6416015625, 3.79345703125, 3.9453125, 4.09716796875, 4.2490234375, 4.40087890625, 4.552734375, 4.70458984375, 4.8564453125, 5.00830078125, 5.16015625]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 7.0, 8.0, 18.0, 34.0, 27.0, 43.0, 59.0, 93.0, 137.0, 224.0, 274.0, 404.0, 631.0, 896.0, 1266.0, 2019.0, 3139.0, 4976.0, 8238.0, 13297.0, 22020.0, 37223.0, 63813.0, 110842.0, 188719.0, 225198.0, 151375.0, 86712.0, 50430.0, 29529.0, 17843.0, 10790.0, 6451.0, 4159.0, 2604.0, 1667.0, 1085.0, 706.0, 471.0, 329.0, 234.0, 176.0, 115.0, 83.0, 63.0, 36.0, 29.0, 19.0, 17.0, 5.0, 8.0, 5.0, 3.0, 3.0, 0.0, 5.0, 1.0, 2.0], "bins": [-4.5859375, -4.4393310546875, -4.292724609375, -4.1461181640625, -3.99951171875, -3.8529052734375, -3.706298828125, -3.5596923828125, -3.4130859375, -3.2664794921875, -3.119873046875, -2.9732666015625, -2.82666015625, -2.6800537109375, -2.533447265625, -2.3868408203125, -2.240234375, -2.0936279296875, -1.947021484375, -1.8004150390625, -1.65380859375, -1.5072021484375, -1.360595703125, -1.2139892578125, -1.0673828125, -0.9207763671875, -0.774169921875, -0.6275634765625, -0.48095703125, -0.3343505859375, -0.187744140625, -0.0411376953125, 0.10546875, 0.2520751953125, 0.398681640625, 0.5452880859375, 0.69189453125, 0.8385009765625, 0.985107421875, 1.1317138671875, 1.2783203125, 1.4249267578125, 1.571533203125, 1.7181396484375, 1.86474609375, 2.0113525390625, 2.157958984375, 2.3045654296875, 2.451171875, 2.5977783203125, 2.744384765625, 2.8909912109375, 3.03759765625, 3.1842041015625, 3.330810546875, 3.4774169921875, 3.6240234375, 3.7706298828125, 3.917236328125, 4.0638427734375, 4.21044921875, 4.3570556640625, 4.503662109375, 4.6502685546875, 4.796875]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 3.0, 4.0, 1.0, 4.0, 3.0, 4.0, 8.0, 9.0, 9.0, 9.0, 9.0, 12.0, 19.0, 22.0, 22.0, 17.0, 30.0, 32.0, 42.0, 27.0, 40.0, 67.0, 84.0, 129.0, 209.0, 1338.0, 219.0, 162.0, 89.0, 62.0, 51.0, 47.0, 37.0, 33.0, 34.0, 20.0, 17.0, 13.0, 20.0, 12.0, 19.0, 15.0, 13.0, 12.0, 6.0, 7.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.546875, -9.22607421875, -8.9052734375, -8.58447265625, -8.263671875, -7.94287109375, -7.6220703125, -7.30126953125, -6.98046875, -6.65966796875, -6.3388671875, -6.01806640625, -5.697265625, -5.37646484375, -5.0556640625, -4.73486328125, -4.4140625, -4.09326171875, -3.7724609375, -3.45166015625, -3.130859375, -2.81005859375, -2.4892578125, -2.16845703125, -1.84765625, -1.52685546875, -1.2060546875, -0.88525390625, -0.564453125, -0.24365234375, 0.0771484375, 0.39794921875, 0.71875, 1.03955078125, 1.3603515625, 1.68115234375, 2.001953125, 2.32275390625, 2.6435546875, 2.96435546875, 3.28515625, 3.60595703125, 3.9267578125, 4.24755859375, 4.568359375, 4.88916015625, 5.2099609375, 5.53076171875, 5.8515625, 6.17236328125, 6.4931640625, 6.81396484375, 7.134765625, 7.45556640625, 7.7763671875, 8.09716796875, 8.41796875, 8.73876953125, 9.0595703125, 9.38037109375, 9.701171875, 10.02197265625, 10.3427734375, 10.66357421875, 10.984375]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 2.0, 5.0, 3.0, 5.0, 7.0, 16.0, 13.0, 23.0, 17.0, 39.0, 38.0, 53.0, 97.0, 147.0, 269.0, 534.0, 1349.0, 22939.0, 2995740.0, 120322.0, 2483.0, 689.0, 358.0, 158.0, 112.0, 76.0, 44.0, 36.0, 32.0, 26.0, 18.0, 14.0, 8.0, 9.0, 3.0, 2.0, 2.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.9375, -26.962890625, -25.98828125, -25.013671875, -24.0390625, -23.064453125, -22.08984375, -21.115234375, -20.140625, -19.166015625, -18.19140625, -17.216796875, -16.2421875, -15.267578125, -14.29296875, -13.318359375, -12.34375, -11.369140625, -10.39453125, -9.419921875, -8.4453125, -7.470703125, -6.49609375, -5.521484375, -4.546875, -3.572265625, -2.59765625, -1.623046875, -0.6484375, 0.326171875, 1.30078125, 2.275390625, 3.25, 4.224609375, 5.19921875, 6.173828125, 7.1484375, 8.123046875, 9.09765625, 10.072265625, 11.046875, 12.021484375, 12.99609375, 13.970703125, 14.9453125, 15.919921875, 16.89453125, 17.869140625, 18.84375, 19.818359375, 20.79296875, 21.767578125, 22.7421875, 23.716796875, 24.69140625, 25.666015625, 26.640625, 27.615234375, 28.58984375, 29.564453125, 30.5390625, 31.513671875, 32.48828125, 33.462890625, 34.4375]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 8.0, 18.0, 64.0, 177.0, 258.0, 246.0, 151.0, 68.0, 18.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.480012893676758, -17.034095764160156, -14.588180541992188, -12.142264366149902, -9.696348190307617, -7.250432014465332, -4.804515838623047, -2.3585987091064453, 0.08731651306152344, 2.5332326889038086, 4.979148864746094, 7.425065040588379, 9.870981216430664, 12.31689739227295, 14.762813568115234, 17.208730697631836, 19.654645919799805, 22.100563049316406, 24.546478271484375, 26.992393493652344, 29.438310623168945, 31.884227752685547, 34.330142974853516, 36.77606201171875, 39.22197723388672, 41.66789245605469, 44.113807678222656, 46.55972671508789, 49.00564193725586, 51.45155715942383, 53.89747619628906, 56.34339141845703, 58.789306640625, 61.23522186279297, 63.68113708496094, 66.1270523071289, 68.57296752929688, 71.01889038085938, 73.46480560302734, 75.91072082519531, 78.35663604736328, 80.80255126953125, 83.24846649169922, 85.69438171386719, 88.14030456542969, 90.58621978759766, 93.03213500976562, 95.4780502319336, 97.92396545410156, 100.36988067626953, 102.8157958984375, 105.26171112060547, 107.70762634277344, 110.15354919433594, 112.5994644165039, 115.04537963867188, 117.49129486083984, 119.93721008300781, 122.38312530517578, 124.82904052734375, 127.27496337890625, 129.7208709716797, 132.1667938232422, 134.61270141601562, 137.05862426757812]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 5.0, 10.0, 10.0, 4.0, 9.0, 19.0, 24.0, 13.0, 19.0, 34.0, 25.0, 30.0, 21.0, 29.0, 32.0, 27.0, 49.0, 34.0, 47.0, 49.0, 36.0, 35.0, 34.0, 27.0, 33.0, 37.0, 30.0, 38.0, 36.0, 33.0, 21.0, 24.0, 28.0, 13.0, 10.0, 20.0, 12.0, 7.0, 8.0, 5.0, 4.0, 7.0, 1.0, 5.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-35.830047607421875, -34.75184631347656, -33.67364501953125, -32.59544372558594, -31.517240524291992, -30.43903923034668, -29.360836029052734, -28.282634735107422, -27.20443344116211, -26.126232147216797, -25.048030853271484, -23.96982765197754, -22.891626358032227, -21.813425064086914, -20.73522186279297, -19.657020568847656, -18.578819274902344, -17.50061798095703, -16.42241668701172, -15.344213485717773, -14.266012191772461, -13.187810897827148, -12.10960865020752, -11.03140640258789, -9.953205108642578, -8.875003814697266, -7.796801567077637, -6.718599796295166, -5.640398025512695, -4.562196254730225, -3.483994483947754, -2.405792713165283, -1.3275909423828125, -0.2493891716003418, 0.8288125991821289, 1.9070143699645996, 2.9852161407470703, 4.063417911529541, 5.141619682312012, 6.219821453094482, 7.298023223876953, 8.376224517822266, 9.454426765441895, 10.532629013061523, 11.610830307006836, 12.689031600952148, 13.767233848571777, 14.845436096191406, 15.923637390136719, 17.00183868408203, 18.080039978027344, 19.15824317932129, 20.2364444732666, 21.314645767211914, 22.39284896850586, 23.471050262451172, 24.549251556396484, 25.627452850341797, 26.70565414428711, 27.783857345581055, 28.862058639526367, 29.94025993347168, 31.018463134765625, 32.09666442871094, 33.17486572265625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 5.0, 5.0, 8.0, 4.0, 7.0, 9.0, 15.0, 11.0, 19.0, 19.0, 22.0, 28.0, 31.0, 36.0, 44.0, 33.0, 39.0, 48.0, 43.0, 42.0, 36.0, 47.0, 46.0, 52.0, 45.0, 42.0, 37.0, 37.0, 30.0, 26.0, 24.0, 20.0, 23.0, 16.0, 10.0, 9.0, 7.0, 11.0, 3.0, 4.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6640625, -4.51202392578125, -4.3599853515625, -4.20794677734375, -4.055908203125, -3.90386962890625, -3.7518310546875, -3.59979248046875, -3.44775390625, -3.29571533203125, -3.1436767578125, -2.99163818359375, -2.839599609375, -2.68756103515625, -2.5355224609375, -2.38348388671875, -2.2314453125, -2.07940673828125, -1.9273681640625, -1.77532958984375, -1.623291015625, -1.47125244140625, -1.3192138671875, -1.16717529296875, -1.01513671875, -0.86309814453125, -0.7110595703125, -0.55902099609375, -0.406982421875, -0.25494384765625, -0.1029052734375, 0.04913330078125, 0.201171875, 0.35321044921875, 0.5052490234375, 0.65728759765625, 0.809326171875, 0.96136474609375, 1.1134033203125, 1.26544189453125, 1.41748046875, 1.56951904296875, 1.7215576171875, 1.87359619140625, 2.025634765625, 2.17767333984375, 2.3297119140625, 2.48175048828125, 2.6337890625, 2.78582763671875, 2.9378662109375, 3.08990478515625, 3.241943359375, 3.39398193359375, 3.5460205078125, 3.69805908203125, 3.85009765625, 4.00213623046875, 4.1541748046875, 4.30621337890625, 4.458251953125, 4.61029052734375, 4.7623291015625, 4.91436767578125, 5.06640625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 2.0, 5.0, 7.0, 4.0, 9.0, 13.0, 15.0, 14.0, 22.0, 36.0, 48.0, 56.0, 89.0, 128.0, 196.0, 285.0, 450.0, 767.0, 1373.0, 2873.0, 6042.0, 15533.0, 54168.0, 422949.0, 2687621.0, 872569.0, 91348.0, 22022.0, 7962.0, 3534.0, 1656.0, 866.0, 552.0, 323.0, 223.0, 156.0, 95.0, 69.0, 52.0, 40.0, 31.0, 19.0, 19.0, 11.0, 11.0, 5.0, 5.0, 6.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3046875, -9.968505859375, -9.63232421875, -9.296142578125, -8.9599609375, -8.623779296875, -8.28759765625, -7.951416015625, -7.615234375, -7.279052734375, -6.94287109375, -6.606689453125, -6.2705078125, -5.934326171875, -5.59814453125, -5.261962890625, -4.92578125, -4.589599609375, -4.25341796875, -3.917236328125, -3.5810546875, -3.244873046875, -2.90869140625, -2.572509765625, -2.236328125, -1.900146484375, -1.56396484375, -1.227783203125, -0.8916015625, -0.555419921875, -0.21923828125, 0.116943359375, 0.453125, 0.789306640625, 1.12548828125, 1.461669921875, 1.7978515625, 2.134033203125, 2.47021484375, 2.806396484375, 3.142578125, 3.478759765625, 3.81494140625, 4.151123046875, 4.4873046875, 4.823486328125, 5.15966796875, 5.495849609375, 5.83203125, 6.168212890625, 6.50439453125, 6.840576171875, 7.1767578125, 7.512939453125, 7.84912109375, 8.185302734375, 8.521484375, 8.857666015625, 9.19384765625, 9.530029296875, 9.8662109375, 10.202392578125, 10.53857421875, 10.874755859375, 11.2109375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 9.0, 6.0, 14.0, 14.0, 22.0, 30.0, 35.0, 42.0, 66.0, 64.0, 110.0, 134.0, 192.0, 278.0, 337.0, 489.0, 530.0, 448.0, 303.0, 268.0, 159.0, 117.0, 104.0, 69.0, 55.0, 49.0, 40.0, 25.0, 16.0, 12.0, 6.0, 12.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.46875, -8.24114990234375, -8.0135498046875, -7.78594970703125, -7.558349609375, -7.33074951171875, -7.1031494140625, -6.87554931640625, -6.64794921875, -6.42034912109375, -6.1927490234375, -5.96514892578125, -5.737548828125, -5.50994873046875, -5.2823486328125, -5.05474853515625, -4.8271484375, -4.59954833984375, -4.3719482421875, -4.14434814453125, -3.916748046875, -3.68914794921875, -3.4615478515625, -3.23394775390625, -3.00634765625, -2.77874755859375, -2.5511474609375, -2.32354736328125, -2.095947265625, -1.86834716796875, -1.6407470703125, -1.41314697265625, -1.185546875, -0.95794677734375, -0.7303466796875, -0.50274658203125, -0.275146484375, -0.04754638671875, 0.1800537109375, 0.40765380859375, 0.63525390625, 0.86285400390625, 1.0904541015625, 1.31805419921875, 1.545654296875, 1.77325439453125, 2.0008544921875, 2.22845458984375, 2.4560546875, 2.68365478515625, 2.9112548828125, 3.13885498046875, 3.366455078125, 3.59405517578125, 3.8216552734375, 4.04925537109375, 4.27685546875, 4.50445556640625, 4.7320556640625, 4.95965576171875, 5.187255859375, 5.41485595703125, 5.6424560546875, 5.87005615234375, 6.09765625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 11.0, 10.0, 21.0, 31.0, 51.0, 64.0, 116.0, 197.0, 302.0, 536.0, 812.0, 1658.0, 3245.0, 7679.0, 21376.0, 77732.0, 408489.0, 2603189.0, 878950.0, 136713.0, 33311.0, 10853.0, 4352.0, 1979.0, 1060.0, 592.0, 359.0, 204.0, 125.0, 91.0, 66.0, 32.0, 24.0, 15.0, 10.0, 10.0, 5.0, 7.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.296875, -7.9859619140625, -7.675048828125, -7.3641357421875, -7.05322265625, -6.7423095703125, -6.431396484375, -6.1204833984375, -5.8095703125, -5.4986572265625, -5.187744140625, -4.8768310546875, -4.56591796875, -4.2550048828125, -3.944091796875, -3.6331787109375, -3.322265625, -3.0113525390625, -2.700439453125, -2.3895263671875, -2.07861328125, -1.7677001953125, -1.456787109375, -1.1458740234375, -0.8349609375, -0.5240478515625, -0.213134765625, 0.0977783203125, 0.40869140625, 0.7196044921875, 1.030517578125, 1.3414306640625, 1.65234375, 1.9632568359375, 2.274169921875, 2.5850830078125, 2.89599609375, 3.2069091796875, 3.517822265625, 3.8287353515625, 4.1396484375, 4.4505615234375, 4.761474609375, 5.0723876953125, 5.38330078125, 5.6942138671875, 6.005126953125, 6.3160400390625, 6.626953125, 6.9378662109375, 7.248779296875, 7.5596923828125, 7.87060546875, 8.1815185546875, 8.492431640625, 8.8033447265625, 9.1142578125, 9.4251708984375, 9.736083984375, 10.0469970703125, 10.35791015625, 10.6688232421875, 10.979736328125, 11.2906494140625, 11.6015625]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 28.0, 277.0, 544.0, 151.0, 15.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-268.76300048828125, -263.0848693847656, -257.4067077636719, -251.72857666015625, -246.05043029785156, -240.37228393554688, -234.69415283203125, -229.01600646972656, -223.33786010742188, -217.6597137451172, -211.98158264160156, -206.30343627929688, -200.6252899169922, -194.9471435546875, -189.26901245117188, -183.5908660888672, -177.91273498535156, -172.23458862304688, -166.55645751953125, -160.87831115722656, -155.20016479492188, -149.52203369140625, -143.84388732910156, -138.16574096679688, -132.48760986328125, -126.8094711303711, -121.1313247680664, -115.45318603515625, -109.77503967285156, -104.0969009399414, -98.41876220703125, -92.74061584472656, -87.06248474121094, -81.38434600830078, -75.7061996459961, -70.02806091308594, -64.34991455078125, -58.671775817871094, -52.99363708496094, -47.315494537353516, -41.637351989746094, -35.95920944213867, -30.281068801879883, -24.602928161621094, -18.924785614013672, -13.24664306640625, -7.568504333496094, -1.8903617858886719, 3.78778076171875, 9.465922355651855, 15.144063949584961, 20.82220458984375, 26.500347137451172, 32.178489685058594, 37.85662841796875, 43.53477096557617, 49.212913513183594, 54.891056060791016, 60.56919860839844, 66.2473373413086, 71.92547607421875, 77.60362243652344, 83.2817611694336, 88.95989990234375, 94.63804626464844]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 8.0, 4.0, 2.0, 4.0, 8.0, 14.0, 14.0, 16.0, 13.0, 19.0, 23.0, 23.0, 21.0, 23.0, 40.0, 31.0, 29.0, 47.0, 39.0, 42.0, 41.0, 50.0, 45.0, 31.0, 31.0, 37.0, 44.0, 37.0, 29.0, 21.0, 27.0, 27.0, 28.0, 31.0, 15.0, 23.0, 11.0, 17.0, 9.0, 4.0, 2.0, 10.0, 5.0, 5.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.735641479492188, -26.862028121948242, -25.98841667175293, -25.114803314208984, -24.241191864013672, -23.367578506469727, -22.49396514892578, -21.62035369873047, -20.746740341186523, -19.873126983642578, -18.999515533447266, -18.12590217590332, -17.252288818359375, -16.378677368164062, -15.505064010620117, -14.631451606750488, -13.75783920288086, -12.88422679901123, -12.010614395141602, -11.137001037597656, -10.263388633728027, -9.389776229858398, -8.516162872314453, -7.642550468444824, -6.768938064575195, -5.895325660705566, -5.021712779998779, -4.148099899291992, -3.2744874954223633, -2.4008750915527344, -1.5272622108459473, -0.6536493301391602, 0.21996307373046875, 1.0935757160186768, 1.9671883583068848, 2.8408010005950928, 3.714413642883301, 4.58802604675293, 5.461638927459717, 6.335251808166504, 7.208864212036133, 8.082476615905762, 8.95608901977539, 9.829702377319336, 10.703314781188965, 11.576927185058594, 12.450540542602539, 13.324152946472168, 14.197765350341797, 15.071377754211426, 15.944990158081055, 16.818603515625, 17.692214965820312, 18.565828323364258, 19.439441680908203, 20.313053131103516, 21.18666648864746, 22.060279846191406, 22.93389129638672, 23.807504653930664, 24.68111801147461, 25.554729461669922, 26.428342819213867, 27.301956176757812, 28.175567626953125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 5.0, 5.0, 2.0, 7.0, 8.0, 15.0, 8.0, 11.0, 15.0, 19.0, 19.0, 28.0, 27.0, 27.0, 40.0, 38.0, 36.0, 41.0, 48.0, 42.0, 40.0, 52.0, 37.0, 35.0, 56.0, 41.0, 48.0, 39.0, 33.0, 26.0, 33.0, 15.0, 22.0, 9.0, 15.0, 16.0, 8.0, 13.0, 11.0, 6.0, 6.0, 2.0, 5.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.484375, -4.34210205078125, -4.1998291015625, -4.05755615234375, -3.915283203125, -3.77301025390625, -3.6307373046875, -3.48846435546875, -3.34619140625, -3.20391845703125, -3.0616455078125, -2.91937255859375, -2.777099609375, -2.63482666015625, -2.4925537109375, -2.35028076171875, -2.2080078125, -2.06573486328125, -1.9234619140625, -1.78118896484375, -1.638916015625, -1.49664306640625, -1.3543701171875, -1.21209716796875, -1.06982421875, -0.92755126953125, -0.7852783203125, -0.64300537109375, -0.500732421875, -0.35845947265625, -0.2161865234375, -0.07391357421875, 0.068359375, 0.21063232421875, 0.3529052734375, 0.49517822265625, 0.637451171875, 0.77972412109375, 0.9219970703125, 1.06427001953125, 1.20654296875, 1.34881591796875, 1.4910888671875, 1.63336181640625, 1.775634765625, 1.91790771484375, 2.0601806640625, 2.20245361328125, 2.3447265625, 2.48699951171875, 2.6292724609375, 2.77154541015625, 2.913818359375, 3.05609130859375, 3.1983642578125, 3.34063720703125, 3.48291015625, 3.62518310546875, 3.7674560546875, 3.90972900390625, 4.052001953125, 4.19427490234375, 4.3365478515625, 4.47882080078125, 4.62109375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 9.0, 4.0, 12.0, 24.0, 18.0, 42.0, 50.0, 93.0, 124.0, 181.0, 305.0, 429.0, 669.0, 1059.0, 1634.0, 2546.0, 4067.0, 6642.0, 10913.0, 17853.0, 30575.0, 52344.0, 94638.0, 171384.0, 259714.0, 170164.0, 93918.0, 52434.0, 30262.0, 17849.0, 10698.0, 6593.0, 4056.0, 2627.0, 1605.0, 1034.0, 682.0, 464.0, 264.0, 167.0, 144.0, 97.0, 51.0, 31.0, 35.0, 15.0, 9.0, 12.0, 12.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.032318115234375, -0.031291961669921875, -0.03026580810546875, -0.029239654541015625, -0.0282135009765625, -0.027187347412109375, -0.02616119384765625, -0.025135040283203125, -0.02410888671875, -0.023082733154296875, -0.02205657958984375, -0.021030426025390625, -0.0200042724609375, -0.018978118896484375, -0.01795196533203125, -0.016925811767578125, -0.015899658203125, -0.014873504638671875, -0.01384735107421875, -0.012821197509765625, -0.0117950439453125, -0.010768890380859375, -0.00974273681640625, -0.008716583251953125, -0.0076904296875, -0.006664276123046875, -0.00563812255859375, -0.004611968994140625, -0.0035858154296875, -0.002559661865234375, -0.00153350830078125, -0.000507354736328125, 0.000518798828125, 0.001544952392578125, 0.00257110595703125, 0.003597259521484375, 0.0046234130859375, 0.005649566650390625, 0.00667572021484375, 0.007701873779296875, 0.00872802734375, 0.009754180908203125, 0.01078033447265625, 0.011806488037109375, 0.0128326416015625, 0.013858795166015625, 0.01488494873046875, 0.015911102294921875, 0.016937255859375, 0.017963409423828125, 0.01898956298828125, 0.020015716552734375, 0.0210418701171875, 0.022068023681640625, 0.02309417724609375, 0.024120330810546875, 0.025146484375, 0.026172637939453125, 0.02719879150390625, 0.028224945068359375, 0.0292510986328125, 0.030277252197265625, 0.03130340576171875, 0.032329559326171875, 0.033355712890625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 13.0, 15.0, 7.0, 17.0, 16.0, 13.0, 20.0, 20.0, 31.0, 33.0, 28.0, 32.0, 44.0, 30.0, 42.0, 36.0, 49.0, 43.0, 1074.0, 48.0, 50.0, 41.0, 39.0, 32.0, 30.0, 36.0, 30.0, 19.0, 27.0, 23.0, 14.0, 15.0, 16.0, 10.0, 10.0, 5.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.76953125, -3.6590576171875, -3.548583984375, -3.4381103515625, -3.32763671875, -3.2171630859375, -3.106689453125, -2.9962158203125, -2.8857421875, -2.7752685546875, -2.664794921875, -2.5543212890625, -2.44384765625, -2.3333740234375, -2.222900390625, -2.1124267578125, -2.001953125, -1.8914794921875, -1.781005859375, -1.6705322265625, -1.56005859375, -1.4495849609375, -1.339111328125, -1.2286376953125, -1.1181640625, -1.0076904296875, -0.897216796875, -0.7867431640625, -0.67626953125, -0.5657958984375, -0.455322265625, -0.3448486328125, -0.234375, -0.1239013671875, -0.013427734375, 0.0970458984375, 0.20751953125, 0.3179931640625, 0.428466796875, 0.5389404296875, 0.6494140625, 0.7598876953125, 0.870361328125, 0.9808349609375, 1.09130859375, 1.2017822265625, 1.312255859375, 1.4227294921875, 1.533203125, 1.6436767578125, 1.754150390625, 1.8646240234375, 1.97509765625, 2.0855712890625, 2.196044921875, 2.3065185546875, 2.4169921875, 2.5274658203125, 2.637939453125, 2.7484130859375, 2.85888671875, 2.9693603515625, 3.079833984375, 3.1903076171875, 3.30078125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 8.0, 11.0, 11.0, 30.0, 30.0, 34.0, 55.0, 63.0, 109.0, 142.0, 219.0, 321.0, 437.0, 691.0, 971.0, 1473.0, 2144.0, 3105.0, 4834.0, 7389.0, 11251.0, 17136.0, 26850.0, 41948.0, 65198.0, 105121.0, 171724.0, 1258321.0, 139409.0, 85390.0, 54248.0, 34534.0, 22130.0, 14152.0, 9211.0, 6086.0, 3923.0, 2737.0, 1808.0, 1218.0, 830.0, 543.0, 413.0, 265.0, 191.0, 120.0, 90.0, 60.0, 34.0, 39.0, 29.0, 20.0, 12.0, 7.0, 7.0, 3.0, 4.0, 2.0], "bins": [-0.01258087158203125, -0.012202858924865723, -0.011824846267700195, -0.011446833610534668, -0.01106882095336914, -0.010690808296203613, -0.010312795639038086, -0.009934782981872559, -0.009556770324707031, -0.009178757667541504, -0.008800745010375977, -0.00842273235321045, -0.008044719696044922, -0.0076667070388793945, -0.007288694381713867, -0.00691068172454834, -0.0065326690673828125, -0.006154656410217285, -0.005776643753051758, -0.0053986310958862305, -0.005020618438720703, -0.004642605781555176, -0.0042645931243896484, -0.003886580467224121, -0.0035085678100585938, -0.0031305551528930664, -0.002752542495727539, -0.0023745298385620117, -0.0019965171813964844, -0.001618504524230957, -0.0012404918670654297, -0.0008624792098999023, -0.000484466552734375, -0.00010645389556884766, 0.0002715587615966797, 0.000649571418762207, 0.0010275840759277344, 0.0014055967330932617, 0.001783609390258789, 0.0021616220474243164, 0.0025396347045898438, 0.002917647361755371, 0.0032956600189208984, 0.0036736726760864258, 0.004051685333251953, 0.0044296979904174805, 0.004807710647583008, 0.005185723304748535, 0.0055637359619140625, 0.00594174861907959, 0.006319761276245117, 0.0066977739334106445, 0.007075786590576172, 0.007453799247741699, 0.007831811904907227, 0.008209824562072754, 0.008587837219238281, 0.008965849876403809, 0.009343862533569336, 0.009721875190734863, 0.01009988784790039, 0.010477900505065918, 0.010855913162231445, 0.011233925819396973, 0.0116119384765625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 12.0, 5.0, 4.0, 10.0, 8.0, 15.0, 14.0, 20.0, 27.0, 46.0, 61.0, 92.0, 126.0, 124.0, 130.0, 85.0, 60.0, 31.0, 27.0, 24.0, 15.0, 16.0, 10.0, 7.0, 8.0, 1.0, 8.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.4437904357910156e-06, -2.3832544684410095e-06, -2.3227185010910034e-06, -2.2621825337409973e-06, -2.201646566390991e-06, -2.141110599040985e-06, -2.080574631690979e-06, -2.020038664340973e-06, -1.959502696990967e-06, -1.8989667296409607e-06, -1.8384307622909546e-06, -1.7778947949409485e-06, -1.7173588275909424e-06, -1.6568228602409363e-06, -1.5962868928909302e-06, -1.535750925540924e-06, -1.475214958190918e-06, -1.4146789908409119e-06, -1.3541430234909058e-06, -1.2936070561408997e-06, -1.2330710887908936e-06, -1.1725351214408875e-06, -1.1119991540908813e-06, -1.0514631867408752e-06, -9.909272193908691e-07, -9.30391252040863e-07, -8.698552846908569e-07, -8.093193173408508e-07, -7.487833499908447e-07, -6.882473826408386e-07, -6.277114152908325e-07, -5.671754479408264e-07, -5.066394805908203e-07, -4.461035132408142e-07, -3.855675458908081e-07, -3.25031578540802e-07, -2.644956111907959e-07, -2.039596438407898e-07, -1.434236764907837e-07, -8.288770914077759e-08, -2.2351741790771484e-08, 3.818422555923462e-08, 9.872019290924072e-08, 1.5925616025924683e-07, 2.1979212760925293e-07, 2.8032809495925903e-07, 3.4086406230926514e-07, 4.0140002965927124e-07, 4.6193599700927734e-07, 5.224719643592834e-07, 5.830079317092896e-07, 6.435438990592957e-07, 7.040798664093018e-07, 7.646158337593079e-07, 8.25151801109314e-07, 8.856877684593201e-07, 9.462237358093262e-07, 1.0067597031593323e-06, 1.0672956705093384e-06, 1.1278316378593445e-06, 1.1883676052093506e-06, 1.2489035725593567e-06, 1.3094395399093628e-06, 1.369975507259369e-06, 1.430511474609375e-06]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 8.0, 3.0, 2.0, 9.0, 5.0, 8.0, 10.0, 9.0, 17.0, 26.0, 25.0, 23.0, 47.0, 72.0, 163.0, 259.0, 1212.0, 122033.0, 920486.0, 3236.0, 401.0, 191.0, 104.0, 46.0, 47.0, 23.0, 19.0, 16.0, 16.0, 12.0, 7.0, 7.0, 10.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8967857360839844e-05, -2.7816742658615112e-05, -2.666562795639038e-05, -2.551451325416565e-05, -2.4363398551940918e-05, -2.3212283849716187e-05, -2.2061169147491455e-05, -2.0910054445266724e-05, -1.9758939743041992e-05, -1.860782504081726e-05, -1.745671033859253e-05, -1.6305595636367798e-05, -1.5154480934143066e-05, -1.4003366231918335e-05, -1.2852251529693604e-05, -1.1701136827468872e-05, -1.055002212524414e-05, -9.39890742301941e-06, -8.247792720794678e-06, -7.096678018569946e-06, -5.945563316345215e-06, -4.794448614120483e-06, -3.643333911895752e-06, -2.4922192096710205e-06, -1.341104507446289e-06, -1.8998980522155762e-07, 9.611248970031738e-07, 2.1122395992279053e-06, 3.2633543014526367e-06, 4.414469003677368e-06, 5.5655837059021e-06, 6.716698408126831e-06, 7.867813110351562e-06, 9.018927812576294e-06, 1.0170042514801025e-05, 1.1321157217025757e-05, 1.2472271919250488e-05, 1.362338662147522e-05, 1.4774501323699951e-05, 1.5925616025924683e-05, 1.7076730728149414e-05, 1.8227845430374146e-05, 1.9378960132598877e-05, 2.053007483482361e-05, 2.168118953704834e-05, 2.283230423927307e-05, 2.3983418941497803e-05, 2.5134533643722534e-05, 2.6285648345947266e-05, 2.7436763048171997e-05, 2.858787775039673e-05, 2.973899245262146e-05, 3.089010715484619e-05, 3.204122185707092e-05, 3.3192336559295654e-05, 3.4343451261520386e-05, 3.549456596374512e-05, 3.664568066596985e-05, 3.779679536819458e-05, 3.894791007041931e-05, 4.009902477264404e-05, 4.1250139474868774e-05, 4.2401254177093506e-05, 4.355236887931824e-05, 4.470348358154297e-05]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 10.0, 2.0, 12.0, 12.0, 12.0, 25.0, 46.0, 66.0, 140.0, 157.0, 174.0, 130.0, 89.0, 46.0, 39.0, 16.0, 13.0, 9.0, 3.0, 3.0, 4.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.810659556322207e-07, -6.328792210297252e-07, -5.846925432706485e-07, -5.365058086681529e-07, -4.883190740656573e-07, -4.401323678848712e-07, -3.9194566170408507e-07, -3.437589271015895e-07, -2.955722209208034e-07, -2.4738551474001724e-07, -1.9919878013752168e-07, -1.5101207395673555e-07, -1.028253535650947e-07, -5.4638633173453854e-08, -6.4519269926677225e-09, 4.173480760982784e-08, 8.992151379061397e-08, 1.3810823418225482e-07, 1.8629495457389567e-07, 2.344816607546818e-07, 2.8266839535717736e-07, 3.308551015379635e-07, 3.790418077187496e-07, 4.272285423212452e-07, 4.754152485020313e-07, 5.236019546828174e-07, 5.71788689285313e-07, 6.199753670443897e-07, 6.681621016468853e-07, 7.163488362493808e-07, 7.645355708518764e-07, 8.12722305454372e-07, 8.609089263700298e-07, 9.090956609725254e-07, 9.57282395575021e-07, 1.0054691301775165e-06, 1.0536557510931743e-06, 1.1018424856956699e-06, 1.1500292202981655e-06, 1.198215954900661e-06, 1.2464026895031566e-06, 1.2945894241056521e-06, 1.3427761587081477e-06, 1.3909627796238055e-06, 1.4391495142263011e-06, 1.4873362488287967e-06, 1.5355229834312922e-06, 1.5837097180337878e-06, 1.6318963389494456e-06, 1.6800830735519412e-06, 1.7282698081544368e-06, 1.7764564290700946e-06, 1.8246431636725902e-06, 1.8728298982750857e-06, 1.9210165191907436e-06, 1.969203367480077e-06, 2.01739021576941e-06, 2.065576836685068e-06, 2.1137636849744013e-06, 2.161950305890059e-06, 2.2101371541793924e-06, 2.2583237750950502e-06, 2.306510396010708e-06, 2.3546972443000413e-06, 2.402883865215699e-06]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 0.0, 16.0, 0.0, 27.0, 0.0, 0.0, 33.0, 0.0, 54.0, 0.0, 0.0, 85.0, 0.0, 110.0, 0.0, 106.0, 0.0, 0.0, 113.0, 0.0, 129.0, 0.0, 101.0, 0.0, 0.0, 73.0, 0.0, 66.0, 0.0, 0.0, 36.0, 0.0, 28.0, 0.0, 22.0, 0.0, 0.0, 5.0, 0.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.344650268554688e-07, -8.093193173408508e-07, -7.841736078262329e-07, -7.59027898311615e-07, -7.338821887969971e-07, -7.087364792823792e-07, -6.835907697677612e-07, -6.584450602531433e-07, -6.332993507385254e-07, -6.081536412239075e-07, -5.830079317092896e-07, -5.578622221946716e-07, -5.327165126800537e-07, -5.075708031654358e-07, -4.824250936508179e-07, -4.5727938413619995e-07, -4.3213367462158203e-07, -4.069879651069641e-07, -3.818422555923462e-07, -3.5669654607772827e-07, -3.3155083656311035e-07, -3.0640512704849243e-07, -2.812594175338745e-07, -2.561137080192566e-07, -2.3096799850463867e-07, -2.0582228899002075e-07, -1.8067657947540283e-07, -1.555308699607849e-07, -1.30385160446167e-07, -1.0523945093154907e-07, -8.009374141693115e-08, -5.494803190231323e-08, -2.9802322387695312e-08, -4.6566128730773926e-09, 2.0489096641540527e-08, 4.563480615615845e-08, 7.078051567077637e-08, 9.592622518539429e-08, 1.210719347000122e-07, 1.4621764421463013e-07, 1.7136335372924805e-07, 1.9650906324386597e-07, 2.2165477275848389e-07, 2.468004822731018e-07, 2.7194619178771973e-07, 2.9709190130233765e-07, 3.2223761081695557e-07, 3.473833203315735e-07, 3.725290298461914e-07, 3.976747393608093e-07, 4.2282044887542725e-07, 4.4796615839004517e-07, 4.731118679046631e-07, 4.98257577419281e-07, 5.234032869338989e-07, 5.485489964485168e-07, 5.736947059631348e-07, 5.988404154777527e-07, 6.239861249923706e-07, 6.491318345069885e-07, 6.742775440216064e-07, 6.994232535362244e-07, 7.245689630508423e-07, 7.497146725654602e-07, 7.748603820800781e-07]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 5.0, 5.0, 2.0, 7.0, 8.0, 15.0, 8.0, 11.0, 15.0, 19.0, 19.0, 28.0, 27.0, 27.0, 40.0, 38.0, 36.0, 41.0, 48.0, 42.0, 40.0, 52.0, 37.0, 35.0, 56.0, 41.0, 48.0, 39.0, 33.0, 26.0, 33.0, 15.0, 22.0, 9.0, 15.0, 16.0, 8.0, 13.0, 11.0, 6.0, 6.0, 2.0, 5.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.484375, -4.34210205078125, -4.1998291015625, -4.05755615234375, -3.915283203125, -3.77301025390625, -3.6307373046875, -3.48846435546875, -3.34619140625, -3.20391845703125, -3.0616455078125, -2.91937255859375, -2.777099609375, -2.63482666015625, -2.4925537109375, -2.35028076171875, -2.2080078125, -2.06573486328125, -1.9234619140625, -1.78118896484375, -1.638916015625, -1.49664306640625, -1.3543701171875, -1.21209716796875, -1.06982421875, -0.92755126953125, -0.7852783203125, -0.64300537109375, -0.500732421875, -0.35845947265625, -0.2161865234375, -0.07391357421875, 0.068359375, 0.21063232421875, 0.3529052734375, 0.49517822265625, 0.637451171875, 0.77972412109375, 0.9219970703125, 1.06427001953125, 1.20654296875, 1.34881591796875, 1.4910888671875, 1.63336181640625, 1.775634765625, 1.91790771484375, 2.0601806640625, 2.20245361328125, 2.3447265625, 2.48699951171875, 2.6292724609375, 2.77154541015625, 2.913818359375, 3.05609130859375, 3.1983642578125, 3.34063720703125, 3.48291015625, 3.62518310546875, 3.7674560546875, 3.90972900390625, 4.052001953125, 4.19427490234375, 4.3365478515625, 4.47882080078125, 4.62109375]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 2.0, 4.0, 10.0, 12.0, 25.0, 27.0, 50.0, 49.0, 98.0, 146.0, 215.0, 324.0, 542.0, 941.0, 1764.0, 3423.0, 6588.0, 14489.0, 33050.0, 87130.0, 286521.0, 409163.0, 123255.0, 44583.0, 18635.0, 8366.0, 4078.0, 2143.0, 1117.0, 655.0, 416.0, 261.0, 140.0, 114.0, 73.0, 40.0, 30.0, 21.0, 22.0, 13.0, 5.0, 8.0, 6.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-8.0859375, -7.8623046875, -7.638671875, -7.4150390625, -7.19140625, -6.9677734375, -6.744140625, -6.5205078125, -6.296875, -6.0732421875, -5.849609375, -5.6259765625, -5.40234375, -5.1787109375, -4.955078125, -4.7314453125, -4.5078125, -4.2841796875, -4.060546875, -3.8369140625, -3.61328125, -3.3896484375, -3.166015625, -2.9423828125, -2.71875, -2.4951171875, -2.271484375, -2.0478515625, -1.82421875, -1.6005859375, -1.376953125, -1.1533203125, -0.9296875, -0.7060546875, -0.482421875, -0.2587890625, -0.03515625, 0.1884765625, 0.412109375, 0.6357421875, 0.859375, 1.0830078125, 1.306640625, 1.5302734375, 1.75390625, 1.9775390625, 2.201171875, 2.4248046875, 2.6484375, 2.8720703125, 3.095703125, 3.3193359375, 3.54296875, 3.7666015625, 3.990234375, 4.2138671875, 4.4375, 4.6611328125, 4.884765625, 5.1083984375, 5.33203125, 5.5556640625, 5.779296875, 6.0029296875, 6.2265625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 3.0, 5.0, 6.0, 6.0, 6.0, 4.0, 8.0, 9.0, 11.0, 15.0, 20.0, 24.0, 19.0, 40.0, 39.0, 33.0, 48.0, 66.0, 97.0, 172.0, 245.0, 1440.0, 173.0, 131.0, 90.0, 51.0, 38.0, 45.0, 25.0, 30.0, 21.0, 27.0, 19.0, 15.0, 7.0, 17.0, 16.0, 11.0, 4.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-12.125, -11.7813720703125, -11.437744140625, -11.0941162109375, -10.75048828125, -10.4068603515625, -10.063232421875, -9.7196044921875, -9.3759765625, -9.0323486328125, -8.688720703125, -8.3450927734375, -8.00146484375, -7.6578369140625, -7.314208984375, -6.9705810546875, -6.626953125, -6.2833251953125, -5.939697265625, -5.5960693359375, -5.25244140625, -4.9088134765625, -4.565185546875, -4.2215576171875, -3.8779296875, -3.5343017578125, -3.190673828125, -2.8470458984375, -2.50341796875, -2.1597900390625, -1.816162109375, -1.4725341796875, -1.12890625, -0.7852783203125, -0.441650390625, -0.0980224609375, 0.24560546875, 0.5892333984375, 0.932861328125, 1.2764892578125, 1.6201171875, 1.9637451171875, 2.307373046875, 2.6510009765625, 2.99462890625, 3.3382568359375, 3.681884765625, 4.0255126953125, 4.369140625, 4.7127685546875, 5.056396484375, 5.4000244140625, 5.74365234375, 6.0872802734375, 6.430908203125, 6.7745361328125, 7.1181640625, 7.4617919921875, 7.805419921875, 8.1490478515625, 8.49267578125, 8.8363037109375, 9.179931640625, 9.5235595703125, 9.8671875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 4.0, 6.0, 10.0, 10.0, 10.0, 23.0, 27.0, 25.0, 31.0, 58.0, 77.0, 105.0, 199.0, 290.0, 476.0, 911.0, 5800.0, 1557229.0, 1572268.0, 5916.0, 932.0, 474.0, 265.0, 167.0, 98.0, 80.0, 47.0, 38.0, 23.0, 24.0, 15.0, 14.0, 8.0, 8.0, 9.0, 8.0, 4.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.515625, -24.742431640625, -23.96923828125, -23.196044921875, -22.4228515625, -21.649658203125, -20.87646484375, -20.103271484375, -19.330078125, -18.556884765625, -17.78369140625, -17.010498046875, -16.2373046875, -15.464111328125, -14.69091796875, -13.917724609375, -13.14453125, -12.371337890625, -11.59814453125, -10.824951171875, -10.0517578125, -9.278564453125, -8.50537109375, -7.732177734375, -6.958984375, -6.185791015625, -5.41259765625, -4.639404296875, -3.8662109375, -3.093017578125, -2.31982421875, -1.546630859375, -0.7734375, -0.000244140625, 0.77294921875, 1.546142578125, 2.3193359375, 3.092529296875, 3.86572265625, 4.638916015625, 5.412109375, 6.185302734375, 6.95849609375, 7.731689453125, 8.5048828125, 9.278076171875, 10.05126953125, 10.824462890625, 11.59765625, 12.370849609375, 13.14404296875, 13.917236328125, 14.6904296875, 15.463623046875, 16.23681640625, 17.010009765625, 17.783203125, 18.556396484375, 19.32958984375, 20.102783203125, 20.8759765625, 21.649169921875, 22.42236328125, 23.195556640625, 23.96875]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 14.0, 67.0, 218.0, 367.0, 253.0, 80.0, 10.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.10261917114258, -44.062416076660156, -41.022216796875, -37.98201370239258, -34.941810607910156, -31.901607513427734, -28.861406326293945, -25.821205139160156, -22.781002044677734, -19.740798950195312, -16.700597763061523, -13.660395622253418, -10.620193481445312, -7.579991340637207, -4.539789199829102, -1.4995880126953125, 1.5406150817871094, 4.580817222595215, 7.62101936340332, 10.661221504211426, 13.701423645019531, 16.741626739501953, 19.781827926635742, 22.82202911376953, 25.862232208251953, 28.902435302734375, 31.942636489868164, 34.98283767700195, 38.023040771484375, 41.0632438659668, 44.10344696044922, 47.143646240234375, 50.18385314941406, 53.224056243896484, 56.264259338378906, 59.30445861816406, 62.344661712646484, 65.3848648071289, 68.42506408691406, 71.46527099609375, 74.5054702758789, 77.54566955566406, 80.58587646484375, 83.6260757446289, 86.66627502441406, 89.70648193359375, 92.7466812133789, 95.78688049316406, 98.82708740234375, 101.8672866821289, 104.9074935913086, 107.94769287109375, 110.98789978027344, 114.0280990600586, 117.06829833984375, 120.10850524902344, 123.1487045288086, 126.18890380859375, 129.22911071777344, 132.26931762695312, 135.30950927734375, 138.34971618652344, 141.38992309570312, 144.43011474609375, 147.47032165527344]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 3.0, 8.0, 10.0, 5.0, 11.0, 7.0, 12.0, 17.0, 20.0, 15.0, 17.0, 32.0, 28.0, 20.0, 33.0, 34.0, 36.0, 44.0, 43.0, 36.0, 39.0, 49.0, 44.0, 44.0, 38.0, 40.0, 37.0, 39.0, 28.0, 28.0, 25.0, 20.0, 26.0, 18.0, 23.0, 10.0, 13.0, 14.0, 11.0, 8.0, 7.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-34.33778381347656, -33.19041442871094, -32.04304885864258, -30.895681381225586, -29.748313903808594, -28.6009464263916, -27.45357894897461, -26.306209564208984, -25.158843994140625, -24.011476516723633, -22.86410903930664, -21.71674156188965, -20.569374084472656, -19.422006607055664, -18.274639129638672, -17.127269744873047, -15.979902267456055, -14.832534790039062, -13.68516731262207, -12.537799835205078, -11.390432357788086, -10.243064880371094, -9.095696449279785, -7.948328971862793, -6.800961494445801, -5.653594017028809, -4.506226539611816, -3.358858585357666, -2.211491107940674, -1.0641236305236816, 0.08324432373046875, 1.230611801147461, 2.377979278564453, 3.5253467559814453, 4.6727142333984375, 5.820082187652588, 6.96744966506958, 8.114816665649414, 9.262185096740723, 10.409552574157715, 11.556920051574707, 12.7042875289917, 13.851655006408691, 14.9990234375, 16.146390914916992, 17.293758392333984, 18.441125869750977, 19.58849334716797, 20.73586082458496, 21.883228302001953, 23.030595779418945, 24.177963256835938, 25.32533073425293, 26.472698211669922, 27.620067596435547, 28.767433166503906, 29.91480255126953, 31.062170028686523, 32.209537506103516, 33.35690689086914, 34.5042724609375, 35.651641845703125, 36.799007415771484, 37.94637680053711, 39.09374237060547]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 6.0, 10.0, 4.0, 8.0, 14.0, 10.0, 17.0, 24.0, 20.0, 32.0, 37.0, 39.0, 19.0, 38.0, 30.0, 49.0, 42.0, 46.0, 45.0, 44.0, 51.0, 41.0, 39.0, 40.0, 42.0, 34.0, 30.0, 28.0, 32.0, 18.0, 19.0, 16.0, 16.0, 10.0, 14.0, 9.0, 7.0, 4.0, 6.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.9765625, -4.83026123046875, -4.6839599609375, -4.53765869140625, -4.391357421875, -4.24505615234375, -4.0987548828125, -3.95245361328125, -3.80615234375, -3.65985107421875, -3.5135498046875, -3.36724853515625, -3.220947265625, -3.07464599609375, -2.9283447265625, -2.78204345703125, -2.6357421875, -2.48944091796875, -2.3431396484375, -2.19683837890625, -2.050537109375, -1.90423583984375, -1.7579345703125, -1.61163330078125, -1.46533203125, -1.31903076171875, -1.1727294921875, -1.02642822265625, -0.880126953125, -0.73382568359375, -0.5875244140625, -0.44122314453125, -0.294921875, -0.14862060546875, -0.0023193359375, 0.14398193359375, 0.290283203125, 0.43658447265625, 0.5828857421875, 0.72918701171875, 0.87548828125, 1.02178955078125, 1.1680908203125, 1.31439208984375, 1.460693359375, 1.60699462890625, 1.7532958984375, 1.89959716796875, 2.0458984375, 2.19219970703125, 2.3385009765625, 2.48480224609375, 2.631103515625, 2.77740478515625, 2.9237060546875, 3.07000732421875, 3.21630859375, 3.36260986328125, 3.5089111328125, 3.65521240234375, 3.801513671875, 3.94781494140625, 4.0941162109375, 4.24041748046875, 4.38671875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 5.0, 5.0, 10.0, 12.0, 21.0, 30.0, 31.0, 60.0, 69.0, 124.0, 166.0, 242.0, 324.0, 479.0, 739.0, 1085.0, 1644.0, 2691.0, 4313.0, 7365.0, 13253.0, 27867.0, 99820.0, 619629.0, 2252770.0, 931467.0, 155070.0, 36962.0, 15763.0, 8626.0, 4911.0, 3020.0, 1919.0, 1235.0, 809.0, 565.0, 368.0, 235.0, 188.0, 117.0, 83.0, 59.0, 52.0, 25.0, 18.0, 17.0, 10.0, 7.0, 5.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.859375, -6.6197509765625, -6.380126953125, -6.1405029296875, -5.90087890625, -5.6612548828125, -5.421630859375, -5.1820068359375, -4.9423828125, -4.7027587890625, -4.463134765625, -4.2235107421875, -3.98388671875, -3.7442626953125, -3.504638671875, -3.2650146484375, -3.025390625, -2.7857666015625, -2.546142578125, -2.3065185546875, -2.06689453125, -1.8272705078125, -1.587646484375, -1.3480224609375, -1.1083984375, -0.8687744140625, -0.629150390625, -0.3895263671875, -0.14990234375, 0.0897216796875, 0.329345703125, 0.5689697265625, 0.80859375, 1.0482177734375, 1.287841796875, 1.5274658203125, 1.76708984375, 2.0067138671875, 2.246337890625, 2.4859619140625, 2.7255859375, 2.9652099609375, 3.204833984375, 3.4444580078125, 3.68408203125, 3.9237060546875, 4.163330078125, 4.4029541015625, 4.642578125, 4.8822021484375, 5.121826171875, 5.3614501953125, 5.60107421875, 5.8406982421875, 6.080322265625, 6.3199462890625, 6.5595703125, 6.7991943359375, 7.038818359375, 7.2784423828125, 7.51806640625, 7.7576904296875, 7.997314453125, 8.2369384765625, 8.4765625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 9.0, 5.0, 10.0, 11.0, 10.0, 28.0, 20.0, 38.0, 52.0, 66.0, 124.0, 151.0, 215.0, 322.0, 377.0, 561.0, 520.0, 436.0, 316.0, 236.0, 165.0, 104.0, 92.0, 72.0, 26.0, 30.0, 20.0, 15.0, 7.0, 6.0, 9.0, 10.0, 4.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-7.95703125, -7.7576904296875, -7.558349609375, -7.3590087890625, -7.15966796875, -6.9603271484375, -6.760986328125, -6.5616455078125, -6.3623046875, -6.1629638671875, -5.963623046875, -5.7642822265625, -5.56494140625, -5.3656005859375, -5.166259765625, -4.9669189453125, -4.767578125, -4.5682373046875, -4.368896484375, -4.1695556640625, -3.97021484375, -3.7708740234375, -3.571533203125, -3.3721923828125, -3.1728515625, -2.9735107421875, -2.774169921875, -2.5748291015625, -2.37548828125, -2.1761474609375, -1.976806640625, -1.7774658203125, -1.578125, -1.3787841796875, -1.179443359375, -0.9801025390625, -0.78076171875, -0.5814208984375, -0.382080078125, -0.1827392578125, 0.0166015625, 0.2159423828125, 0.415283203125, 0.6146240234375, 0.81396484375, 1.0133056640625, 1.212646484375, 1.4119873046875, 1.611328125, 1.8106689453125, 2.010009765625, 2.2093505859375, 2.40869140625, 2.6080322265625, 2.807373046875, 3.0067138671875, 3.2060546875, 3.4053955078125, 3.604736328125, 3.8040771484375, 4.00341796875, 4.2027587890625, 4.402099609375, 4.6014404296875, 4.80078125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 8.0, 7.0, 10.0, 17.0, 30.0, 25.0, 52.0, 82.0, 197.0, 355.0, 734.0, 1851.0, 5511.0, 28089.0, 379659.0, 3532465.0, 217866.0, 20124.0, 4423.0, 1486.0, 623.0, 292.0, 131.0, 79.0, 58.0, 31.0, 15.0, 12.0, 18.0, 6.0, 5.0, 6.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.1875, -10.747314453125, -10.30712890625, -9.866943359375, -9.4267578125, -8.986572265625, -8.54638671875, -8.106201171875, -7.666015625, -7.225830078125, -6.78564453125, -6.345458984375, -5.9052734375, -5.465087890625, -5.02490234375, -4.584716796875, -4.14453125, -3.704345703125, -3.26416015625, -2.823974609375, -2.3837890625, -1.943603515625, -1.50341796875, -1.063232421875, -0.623046875, -0.182861328125, 0.25732421875, 0.697509765625, 1.1376953125, 1.577880859375, 2.01806640625, 2.458251953125, 2.8984375, 3.338623046875, 3.77880859375, 4.218994140625, 4.6591796875, 5.099365234375, 5.53955078125, 5.979736328125, 6.419921875, 6.860107421875, 7.30029296875, 7.740478515625, 8.1806640625, 8.620849609375, 9.06103515625, 9.501220703125, 9.94140625, 10.381591796875, 10.82177734375, 11.261962890625, 11.7021484375, 12.142333984375, 12.58251953125, 13.022705078125, 13.462890625, 13.903076171875, 14.34326171875, 14.783447265625, 15.2236328125, 15.663818359375, 16.10400390625, 16.544189453125, 16.984375]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 10.0, 111.0, 558.0, 301.0, 38.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.09686279296875, -135.38832092285156, -129.6797637939453, -123.97122192382812, -118.26268005371094, -112.55413055419922, -106.8455810546875, -101.13703918457031, -95.4284896850586, -89.71994018554688, -84.01139831542969, -78.30284881591797, -72.59429931640625, -66.88575744628906, -61.177207946777344, -55.46866226196289, -49.76011657714844, -44.051570892333984, -38.34302520751953, -32.63447570800781, -26.92593002319336, -21.217384338378906, -15.508834838867188, -9.800289154052734, -4.091743469238281, 1.6168031692504883, 7.325349807739258, 13.033897399902344, 18.742443084716797, 24.45098876953125, 30.15953826904297, 35.86808395385742, 41.576629638671875, 47.28517532348633, 52.99372100830078, 58.7022705078125, 64.41081237792969, 70.1193618774414, 75.82791137695312, 81.53645324707031, 87.24500274658203, 92.95355224609375, 98.66209411621094, 104.37064361572266, 110.07919311523438, 115.78773498535156, 121.49628448486328, 127.204833984375, 132.9133758544922, 138.62191772460938, 144.33047485351562, 150.0390167236328, 155.74755859375, 161.45611572265625, 167.16465759277344, 172.87319946289062, 178.58175659179688, 184.29029846191406, 189.9988555908203, 195.7073974609375, 201.4159393310547, 207.12448120117188, 212.83303833007812, 218.5415802001953, 224.2501220703125]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 4.0, 2.0, 0.0, 2.0, 6.0, 5.0, 4.0, 7.0, 16.0, 15.0, 13.0, 11.0, 18.0, 19.0, 22.0, 36.0, 30.0, 21.0, 23.0, 23.0, 32.0, 37.0, 37.0, 41.0, 33.0, 42.0, 37.0, 37.0, 38.0, 36.0, 43.0, 23.0, 36.0, 31.0, 31.0, 24.0, 25.0, 18.0, 15.0, 16.0, 19.0, 13.0, 12.0, 9.0, 9.0, 12.0, 7.0, 5.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.692291259765625, -20.019268035888672, -19.34624481201172, -18.673221588134766, -18.000200271606445, -17.327177047729492, -16.65415382385254, -15.981130599975586, -15.30810832977295, -14.635085105895996, -13.96206283569336, -13.289039611816406, -12.616016387939453, -11.942994117736816, -11.269970893859863, -10.596948623657227, -9.923925399780273, -9.25090217590332, -8.577879905700684, -7.9048566818237305, -7.2318339347839355, -6.558811187744141, -5.8857879638671875, -5.212765216827393, -4.539742469787598, -3.8667197227478027, -3.1936967372894287, -2.5206737518310547, -1.8476510047912598, -1.1746282577514648, -0.5016050338745117, 0.1714177131652832, 0.8444404602050781, 1.5174633264541626, 2.190486192703247, 2.863509178161621, 3.536531925201416, 4.209554672241211, 4.882577896118164, 5.555600643157959, 6.228623390197754, 6.901646137237549, 7.574668884277344, 8.247692108154297, 8.92071533203125, 9.593737602233887, 10.26676082611084, 10.939783096313477, 11.61280632019043, 12.285829544067383, 12.95885181427002, 13.631875038146973, 14.30489730834961, 14.977920532226562, 15.650943756103516, 16.32396697998047, 16.996990203857422, 17.670013427734375, 18.343036651611328, 19.01605987548828, 19.6890811920166, 20.362104415893555, 21.035127639770508, 21.70815086364746, 22.38117218017578]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 7.0, 8.0, 4.0, 5.0, 16.0, 17.0, 13.0, 19.0, 14.0, 30.0, 38.0, 30.0, 30.0, 38.0, 32.0, 48.0, 35.0, 47.0, 44.0, 51.0, 58.0, 35.0, 31.0, 55.0, 32.0, 30.0, 37.0, 30.0, 26.0, 28.0, 17.0, 18.0, 22.0, 17.0, 9.0, 10.0, 4.0, 6.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5078125, -4.3638916015625, -4.219970703125, -4.0760498046875, -3.93212890625, -3.7882080078125, -3.644287109375, -3.5003662109375, -3.3564453125, -3.2125244140625, -3.068603515625, -2.9246826171875, -2.78076171875, -2.6368408203125, -2.492919921875, -2.3489990234375, -2.205078125, -2.0611572265625, -1.917236328125, -1.7733154296875, -1.62939453125, -1.4854736328125, -1.341552734375, -1.1976318359375, -1.0537109375, -0.9097900390625, -0.765869140625, -0.6219482421875, -0.47802734375, -0.3341064453125, -0.190185546875, -0.0462646484375, 0.09765625, 0.2415771484375, 0.385498046875, 0.5294189453125, 0.67333984375, 0.8172607421875, 0.961181640625, 1.1051025390625, 1.2490234375, 1.3929443359375, 1.536865234375, 1.6807861328125, 1.82470703125, 1.9686279296875, 2.112548828125, 2.2564697265625, 2.400390625, 2.5443115234375, 2.688232421875, 2.8321533203125, 2.97607421875, 3.1199951171875, 3.263916015625, 3.4078369140625, 3.5517578125, 3.6956787109375, 3.839599609375, 3.9835205078125, 4.12744140625, 4.2713623046875, 4.415283203125, 4.5592041015625, 4.703125]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 8.0, 16.0, 25.0, 27.0, 45.0, 66.0, 109.0, 155.0, 221.0, 340.0, 514.0, 798.0, 1220.0, 1931.0, 2817.0, 4399.0, 6983.0, 10900.0, 16688.0, 26005.0, 42043.0, 71067.0, 123548.0, 228950.0, 215311.0, 116715.0, 67490.0, 39912.0, 25046.0, 16214.0, 10247.0, 6624.0, 4256.0, 2783.0, 1713.0, 1172.0, 742.0, 509.0, 312.0, 206.0, 155.0, 88.0, 57.0, 40.0, 24.0, 24.0, 16.0, 13.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.039093017578125, -0.03786945343017578, -0.03664588928222656, -0.035422325134277344, -0.034198760986328125, -0.032975196838378906, -0.03175163269042969, -0.03052806854248047, -0.02930450439453125, -0.02808094024658203, -0.026857376098632812, -0.025633811950683594, -0.024410247802734375, -0.023186683654785156, -0.021963119506835938, -0.02073955535888672, -0.0195159912109375, -0.01829242706298828, -0.017068862915039062, -0.015845298767089844, -0.014621734619140625, -0.013398170471191406, -0.012174606323242188, -0.010951042175292969, -0.00972747802734375, -0.008503913879394531, -0.0072803497314453125, -0.006056785583496094, -0.004833221435546875, -0.0036096572875976562, -0.0023860931396484375, -0.0011625289916992188, 6.103515625e-05, 0.0012845993041992188, 0.0025081634521484375, 0.0037317276000976562, 0.004955291748046875, 0.006178855895996094, 0.0074024200439453125, 0.008625984191894531, 0.00984954833984375, 0.011073112487792969, 0.012296676635742188, 0.013520240783691406, 0.014743804931640625, 0.015967369079589844, 0.017190933227539062, 0.01841449737548828, 0.0196380615234375, 0.02086162567138672, 0.022085189819335938, 0.023308753967285156, 0.024532318115234375, 0.025755882263183594, 0.026979446411132812, 0.02820301055908203, 0.02942657470703125, 0.03065013885498047, 0.03187370300292969, 0.033097267150878906, 0.034320831298828125, 0.035544395446777344, 0.03676795959472656, 0.03799152374267578, 0.039215087890625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 7.0, 11.0, 11.0, 10.0, 16.0, 25.0, 18.0, 26.0, 31.0, 40.0, 40.0, 27.0, 49.0, 54.0, 41.0, 55.0, 1073.0, 47.0, 47.0, 48.0, 51.0, 39.0, 42.0, 35.0, 21.0, 33.0, 27.0, 18.0, 21.0, 14.0, 14.0, 9.0, 2.0, 9.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8125, -3.68292236328125, -3.5533447265625, -3.42376708984375, -3.294189453125, -3.16461181640625, -3.0350341796875, -2.90545654296875, -2.77587890625, -2.64630126953125, -2.5167236328125, -2.38714599609375, -2.257568359375, -2.12799072265625, -1.9984130859375, -1.86883544921875, -1.7392578125, -1.60968017578125, -1.4801025390625, -1.35052490234375, -1.220947265625, -1.09136962890625, -0.9617919921875, -0.83221435546875, -0.70263671875, -0.57305908203125, -0.4434814453125, -0.31390380859375, -0.184326171875, -0.05474853515625, 0.0748291015625, 0.20440673828125, 0.333984375, 0.46356201171875, 0.5931396484375, 0.72271728515625, 0.852294921875, 0.98187255859375, 1.1114501953125, 1.24102783203125, 1.37060546875, 1.50018310546875, 1.6297607421875, 1.75933837890625, 1.888916015625, 2.01849365234375, 2.1480712890625, 2.27764892578125, 2.4072265625, 2.53680419921875, 2.6663818359375, 2.79595947265625, 2.925537109375, 3.05511474609375, 3.1846923828125, 3.31427001953125, 3.44384765625, 3.57342529296875, 3.7030029296875, 3.83258056640625, 3.962158203125, 4.09173583984375, 4.2213134765625, 4.35089111328125, 4.48046875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 7.0, 15.0, 20.0, 26.0, 47.0, 58.0, 81.0, 117.0, 200.0, 317.0, 470.0, 651.0, 1062.0, 1704.0, 2637.0, 4221.0, 6925.0, 11275.0, 18662.0, 31243.0, 53491.0, 93087.0, 171965.0, 1303113.0, 169600.0, 93388.0, 53159.0, 30965.0, 18692.0, 11332.0, 6931.0, 4172.0, 2703.0, 1675.0, 1055.0, 709.0, 474.0, 286.0, 178.0, 136.0, 92.0, 55.0, 47.0, 15.0, 22.0, 13.0, 16.0, 9.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0142669677734375, -0.013799190521240234, -0.013331413269042969, -0.012863636016845703, -0.012395858764648438, -0.011928081512451172, -0.011460304260253906, -0.01099252700805664, -0.010524749755859375, -0.01005697250366211, -0.009589195251464844, -0.009121417999267578, -0.008653640747070312, -0.008185863494873047, -0.007718086242675781, -0.007250308990478516, -0.00678253173828125, -0.006314754486083984, -0.005846977233886719, -0.005379199981689453, -0.0049114227294921875, -0.004443645477294922, -0.003975868225097656, -0.0035080909729003906, -0.003040313720703125, -0.0025725364685058594, -0.0021047592163085938, -0.0016369819641113281, -0.0011692047119140625, -0.0007014274597167969, -0.00023365020751953125, 0.00023412704467773438, 0.000701904296875, 0.0011696815490722656, 0.0016374588012695312, 0.002105236053466797, 0.0025730133056640625, 0.003040790557861328, 0.0035085678100585938, 0.003976345062255859, 0.004444122314453125, 0.004911899566650391, 0.005379676818847656, 0.005847454071044922, 0.0063152313232421875, 0.006783008575439453, 0.007250785827636719, 0.007718563079833984, 0.00818634033203125, 0.008654117584228516, 0.009121894836425781, 0.009589672088623047, 0.010057449340820312, 0.010525226593017578, 0.010993003845214844, 0.01146078109741211, 0.011928558349609375, 0.01239633560180664, 0.012864112854003906, 0.013331890106201172, 0.013799667358398438, 0.014267444610595703, 0.014735221862792969, 0.015202999114990234, 0.0156707763671875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 7.0, 12.0, 0.0, 16.0, 25.0, 37.0, 48.0, 0.0, 65.0, 89.0, 121.0, 141.0, 0.0, 123.0, 88.0, 72.0, 52.0, 0.0, 28.0, 28.0, 20.0, 8.0, 0.0, 7.0, 8.0, 1.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6093254089355469e-06, -1.5618279576301575e-06, -1.514330506324768e-06, -1.4668330550193787e-06, -1.4193356037139893e-06, -1.3718381524085999e-06, -1.3243407011032104e-06, -1.276843249797821e-06, -1.2293457984924316e-06, -1.1818483471870422e-06, -1.1343508958816528e-06, -1.0868534445762634e-06, -1.039355993270874e-06, -9.918585419654846e-07, -9.443610906600952e-07, -8.968636393547058e-07, -8.493661880493164e-07, -8.01868736743927e-07, -7.543712854385376e-07, -7.068738341331482e-07, -6.593763828277588e-07, -6.118789315223694e-07, -5.6438148021698e-07, -5.168840289115906e-07, -4.6938657760620117e-07, -4.2188912630081177e-07, -3.7439167499542236e-07, -3.2689422369003296e-07, -2.7939677238464355e-07, -2.3189932107925415e-07, -1.8440186977386475e-07, -1.3690441846847534e-07, -8.940696716308594e-08, -4.190951585769653e-08, 5.587935447692871e-09, 5.3085386753082275e-08, 1.0058283805847168e-07, 1.4808028936386108e-07, 1.955777406692505e-07, 2.430751919746399e-07, 2.905726432800293e-07, 3.380700945854187e-07, 3.855675458908081e-07, 4.330649971961975e-07, 4.805624485015869e-07, 5.280598998069763e-07, 5.755573511123657e-07, 6.230548024177551e-07, 6.705522537231445e-07, 7.180497050285339e-07, 7.655471563339233e-07, 8.130446076393127e-07, 8.605420589447021e-07, 9.080395102500916e-07, 9.55536961555481e-07, 1.0030344128608704e-06, 1.0505318641662598e-06, 1.0980293154716492e-06, 1.1455267667770386e-06, 1.193024218082428e-06, 1.2405216693878174e-06, 1.2880191206932068e-06, 1.3355165719985962e-06, 1.3830140233039856e-06, 1.430511474609375e-06]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 4.0, 2.0, 5.0, 4.0, 4.0, 7.0, 10.0, 8.0, 14.0, 14.0, 28.0, 23.0, 61.0, 58.0, 70.0, 125.0, 273.0, 590.0, 2436.0, 9894.0, 73665.0, 703596.0, 227558.0, 23214.0, 4693.0, 1298.0, 387.0, 179.0, 83.0, 69.0, 49.0, 28.0, 24.0, 18.0, 18.0, 12.0, 10.0, 4.0, 7.0, 4.0, 5.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8596649169921875e-05, -1.797173172235489e-05, -1.7346814274787903e-05, -1.6721896827220917e-05, -1.609697937965393e-05, -1.5472061932086945e-05, -1.4847144484519958e-05, -1.4222227036952972e-05, -1.3597309589385986e-05, -1.2972392141819e-05, -1.2347474694252014e-05, -1.1722557246685028e-05, -1.1097639799118042e-05, -1.0472722351551056e-05, -9.84780490398407e-06, -9.222887456417084e-06, -8.597970008850098e-06, -7.973052561283112e-06, -7.3481351137161255e-06, -6.723217666149139e-06, -6.098300218582153e-06, -5.473382771015167e-06, -4.848465323448181e-06, -4.223547875881195e-06, -3.598630428314209e-06, -2.973712980747223e-06, -2.348795533180237e-06, -1.7238780856132507e-06, -1.0989606380462646e-06, -4.7404319047927856e-07, 1.5087425708770752e-07, 7.757917046546936e-07, 1.4007091522216797e-06, 2.0256265997886658e-06, 2.650544047355652e-06, 3.275461494922638e-06, 3.900378942489624e-06, 4.52529639005661e-06, 5.150213837623596e-06, 5.775131285190582e-06, 6.400048732757568e-06, 7.0249661803245544e-06, 7.64988362789154e-06, 8.274801075458527e-06, 8.899718523025513e-06, 9.524635970592499e-06, 1.0149553418159485e-05, 1.0774470865726471e-05, 1.1399388313293457e-05, 1.2024305760860443e-05, 1.264922320842743e-05, 1.3274140655994415e-05, 1.3899058103561401e-05, 1.4523975551128387e-05, 1.5148892998695374e-05, 1.577381044626236e-05, 1.6398727893829346e-05, 1.7023645341396332e-05, 1.7648562788963318e-05, 1.8273480236530304e-05, 1.889839768409729e-05, 1.9523315131664276e-05, 2.0148232579231262e-05, 2.0773150026798248e-05, 2.1398067474365234e-05]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 14.0, 39.0, 88.0, 229.0, 358.0, 170.0, 64.0, 28.0, 11.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.162233825714793e-06, -8.003089533303864e-06, -7.843946150387637e-06, -7.684801857976709e-06, -7.525658475060482e-06, -7.366514182649553e-06, -7.207370344985975e-06, -7.048226507322397e-06, -6.889082669658819e-06, -6.729938831995241e-06, -6.5707949943316635e-06, -6.411651156668086e-06, -6.252506864257157e-06, -6.093363026593579e-06, -5.934219188930001e-06, -5.775075351266423e-06, -5.615931513602845e-06, -5.4567876759392675e-06, -5.29764383827569e-06, -5.138500000612112e-06, -4.979356162948534e-06, -4.820211870537605e-06, -4.661068032874027e-06, -4.501924195210449e-06, -4.3427803575468715e-06, -4.183636519883294e-06, -4.024492682219716e-06, -3.865348844556138e-06, -3.7062047795188846e-06, -3.5470609418553067e-06, -3.3879168768180534e-06, -3.2287730391544756e-06, -3.0696289741172222e-06, -2.9104851364536444e-06, -2.751341071416391e-06, -2.592197233752813e-06, -2.4330533960892353e-06, -2.2739095584256575e-06, -2.1147657207620796e-06, -1.9556216557248263e-06, -1.7964778180612484e-06, -1.6373339803976705e-06, -1.478190029047255e-06, -1.3190460776968393e-06, -1.1599022400332615e-06, -1.0007584023696836e-06, -8.41614451019268e-07, -6.824704996688524e-07, -5.233266620052746e-07, -3.641827674982778e-07, -2.050388729912811e-07, -4.5894978484284366e-08, 1.1324891602271236e-07, 2.723928105297091e-07, 4.315367050367058e-07, 5.906806563871214e-07, 7.498244940506993e-07, 9.08968388557696e-07, 1.0681122830646927e-06, 1.2272562344151083e-06, 1.3864000720786862e-06, 1.545543909742264e-06, 1.7046878610926797e-06, 1.8638318124430953e-06, 2.022975650106673e-06]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 12.0, 0.0, 0.0, 13.0, 0.0, 0.0, 23.0, 0.0, 0.0, 47.0, 0.0, 0.0, 63.0, 0.0, 0.0, 72.0, 0.0, 0.0, 109.0, 0.0, 0.0, 117.0, 0.0, 0.0, 119.0, 0.0, 0.0, 119.0, 0.0, 0.0, 103.0, 0.0, 0.0, 72.0, 0.0, 0.0, 59.0, 0.0, 0.0, 40.0, 0.0, 0.0, 18.0, 0.0, 0.0, 16.0, 0.0, 0.0, 10.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0], "bins": [-6.556510925292969e-07, -6.360933184623718e-07, -6.165355443954468e-07, -5.969777703285217e-07, -5.774199962615967e-07, -5.578622221946716e-07, -5.383044481277466e-07, -5.187466740608215e-07, -4.991888999938965e-07, -4.796311259269714e-07, -4.600733518600464e-07, -4.4051557779312134e-07, -4.209578037261963e-07, -4.0140002965927124e-07, -3.818422555923462e-07, -3.6228448152542114e-07, -3.427267074584961e-07, -3.2316893339157104e-07, -3.03611159324646e-07, -2.8405338525772095e-07, -2.644956111907959e-07, -2.4493783712387085e-07, -2.253800630569458e-07, -2.0582228899002075e-07, -1.862645149230957e-07, -1.6670674085617065e-07, -1.471489667892456e-07, -1.2759119272232056e-07, -1.0803341865539551e-07, -8.847564458847046e-08, -6.891787052154541e-08, -4.936009645462036e-08, -2.9802322387695312e-08, -1.0244548320770264e-08, 9.313225746154785e-09, 2.8870999813079834e-08, 4.842877388000488e-08, 6.798654794692993e-08, 8.754432201385498e-08, 1.0710209608078003e-07, 1.2665987014770508e-07, 1.4621764421463013e-07, 1.6577541828155518e-07, 1.8533319234848022e-07, 2.0489096641540527e-07, 2.2444874048233032e-07, 2.4400651454925537e-07, 2.635642886161804e-07, 2.8312206268310547e-07, 3.026798367500305e-07, 3.2223761081695557e-07, 3.417953848838806e-07, 3.6135315895080566e-07, 3.809109330177307e-07, 4.0046870708465576e-07, 4.200264811515808e-07, 4.3958425521850586e-07, 4.591420292854309e-07, 4.78699803352356e-07, 4.98257577419281e-07, 5.178153514862061e-07, 5.373731255531311e-07, 5.569308996200562e-07, 5.764886736869812e-07, 5.960464477539062e-07]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 7.0, 8.0, 4.0, 5.0, 16.0, 17.0, 13.0, 19.0, 14.0, 30.0, 38.0, 30.0, 30.0, 38.0, 32.0, 48.0, 35.0, 47.0, 44.0, 51.0, 58.0, 35.0, 31.0, 55.0, 32.0, 30.0, 37.0, 30.0, 26.0, 28.0, 17.0, 18.0, 22.0, 17.0, 9.0, 10.0, 4.0, 6.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5078125, -4.3638916015625, -4.219970703125, -4.0760498046875, -3.93212890625, -3.7882080078125, -3.644287109375, -3.5003662109375, -3.3564453125, -3.2125244140625, -3.068603515625, -2.9246826171875, -2.78076171875, -2.6368408203125, -2.492919921875, -2.3489990234375, -2.205078125, -2.0611572265625, -1.917236328125, -1.7733154296875, -1.62939453125, -1.4854736328125, -1.341552734375, -1.1976318359375, -1.0537109375, -0.9097900390625, -0.765869140625, -0.6219482421875, -0.47802734375, -0.3341064453125, -0.190185546875, -0.0462646484375, 0.09765625, 0.2415771484375, 0.385498046875, 0.5294189453125, 0.67333984375, 0.8172607421875, 0.961181640625, 1.1051025390625, 1.2490234375, 1.3929443359375, 1.536865234375, 1.6807861328125, 1.82470703125, 1.9686279296875, 2.112548828125, 2.2564697265625, 2.400390625, 2.5443115234375, 2.688232421875, 2.8321533203125, 2.97607421875, 3.1199951171875, 3.263916015625, 3.4078369140625, 3.5517578125, 3.6956787109375, 3.839599609375, 3.9835205078125, 4.12744140625, 4.2713623046875, 4.415283203125, 4.5592041015625, 4.703125]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 7.0, 5.0, 7.0, 13.0, 15.0, 10.0, 20.0, 37.0, 47.0, 62.0, 117.0, 259.0, 398.0, 715.0, 1421.0, 2816.0, 5787.0, 12820.0, 32617.0, 100479.0, 311801.0, 376171.0, 131219.0, 42131.0, 15696.0, 6855.0, 3318.0, 1749.0, 828.0, 461.0, 258.0, 149.0, 71.0, 64.0, 39.0, 26.0, 26.0, 8.0, 9.0, 9.0, 8.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9453125, -4.786376953125, -4.62744140625, -4.468505859375, -4.3095703125, -4.150634765625, -3.99169921875, -3.832763671875, -3.673828125, -3.514892578125, -3.35595703125, -3.197021484375, -3.0380859375, -2.879150390625, -2.72021484375, -2.561279296875, -2.40234375, -2.243408203125, -2.08447265625, -1.925537109375, -1.7666015625, -1.607666015625, -1.44873046875, -1.289794921875, -1.130859375, -0.971923828125, -0.81298828125, -0.654052734375, -0.4951171875, -0.336181640625, -0.17724609375, -0.018310546875, 0.140625, 0.299560546875, 0.45849609375, 0.617431640625, 0.7763671875, 0.935302734375, 1.09423828125, 1.253173828125, 1.412109375, 1.571044921875, 1.72998046875, 1.888916015625, 2.0478515625, 2.206787109375, 2.36572265625, 2.524658203125, 2.68359375, 2.842529296875, 3.00146484375, 3.160400390625, 3.3193359375, 3.478271484375, 3.63720703125, 3.796142578125, 3.955078125, 4.114013671875, 4.27294921875, 4.431884765625, 4.5908203125, 4.749755859375, 4.90869140625, 5.067626953125, 5.2265625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 14.0, 14.0, 14.0, 18.0, 21.0, 24.0, 39.0, 38.0, 41.0, 59.0, 83.0, 126.0, 281.0, 1595.0, 198.0, 106.0, 67.0, 47.0, 65.0, 39.0, 32.0, 28.0, 22.0, 17.0, 18.0, 13.0, 10.0, 2.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.84375, -16.392822265625, -15.94189453125, -15.490966796875, -15.0400390625, -14.589111328125, -14.13818359375, -13.687255859375, -13.236328125, -12.785400390625, -12.33447265625, -11.883544921875, -11.4326171875, -10.981689453125, -10.53076171875, -10.079833984375, -9.62890625, -9.177978515625, -8.72705078125, -8.276123046875, -7.8251953125, -7.374267578125, -6.92333984375, -6.472412109375, -6.021484375, -5.570556640625, -5.11962890625, -4.668701171875, -4.2177734375, -3.766845703125, -3.31591796875, -2.864990234375, -2.4140625, -1.963134765625, -1.51220703125, -1.061279296875, -0.6103515625, -0.159423828125, 0.29150390625, 0.742431640625, 1.193359375, 1.644287109375, 2.09521484375, 2.546142578125, 2.9970703125, 3.447998046875, 3.89892578125, 4.349853515625, 4.80078125, 5.251708984375, 5.70263671875, 6.153564453125, 6.6044921875, 7.055419921875, 7.50634765625, 7.957275390625, 8.408203125, 8.859130859375, 9.31005859375, 9.760986328125, 10.2119140625, 10.662841796875, 11.11376953125, 11.564697265625, 12.015625]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 8.0, 7.0, 5.0, 15.0, 12.0, 20.0, 30.0, 45.0, 63.0, 69.0, 105.0, 158.0, 272.0, 560.0, 2842.0, 66301.0, 3049824.0, 22439.0, 1809.0, 434.0, 200.0, 137.0, 102.0, 46.0, 62.0, 43.0, 24.0, 21.0, 11.0, 8.0, 19.0, 6.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.140625, -16.490966796875, -15.84130859375, -15.191650390625, -14.5419921875, -13.892333984375, -13.24267578125, -12.593017578125, -11.943359375, -11.293701171875, -10.64404296875, -9.994384765625, -9.3447265625, -8.695068359375, -8.04541015625, -7.395751953125, -6.74609375, -6.096435546875, -5.44677734375, -4.797119140625, -4.1474609375, -3.497802734375, -2.84814453125, -2.198486328125, -1.548828125, -0.899169921875, -0.24951171875, 0.400146484375, 1.0498046875, 1.699462890625, 2.34912109375, 2.998779296875, 3.6484375, 4.298095703125, 4.94775390625, 5.597412109375, 6.2470703125, 6.896728515625, 7.54638671875, 8.196044921875, 8.845703125, 9.495361328125, 10.14501953125, 10.794677734375, 11.4443359375, 12.093994140625, 12.74365234375, 13.393310546875, 14.04296875, 14.692626953125, 15.34228515625, 15.991943359375, 16.6416015625, 17.291259765625, 17.94091796875, 18.590576171875, 19.240234375, 19.889892578125, 20.53955078125, 21.189208984375, 21.8388671875, 22.488525390625, 23.13818359375, 23.787841796875, 24.4375]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 18.0, 153.0, 471.0, 316.0, 49.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.64859771728516, -63.4387092590332, -60.228816986083984, -57.01892852783203, -53.80903625488281, -50.59914779663086, -47.389259338378906, -44.17936706542969, -40.969478607177734, -37.75959014892578, -34.54969787597656, -31.33980941772461, -28.129919052124023, -24.920028686523438, -21.710140228271484, -18.5002498626709, -15.290359497070312, -12.080469131469727, -8.870579719543457, -5.6606903076171875, -2.4507999420166016, 0.7590904235839844, 3.9689788818359375, 7.178869247436523, 10.38875961303711, 13.598649978637695, 16.80854034423828, 20.018428802490234, 23.22831916809082, 26.438209533691406, 29.64809799194336, 32.85798645019531, 36.06787109375, 39.27775955200195, 42.48765182495117, 45.697540283203125, 48.907432556152344, 52.1173210144043, 55.32720947265625, 58.53710174560547, 61.74699020385742, 64.95687866210938, 68.1667709350586, 71.37666320800781, 74.5865478515625, 77.79644012451172, 81.00633239746094, 84.21621704101562, 87.42610931396484, 90.63600158691406, 93.84588623046875, 97.05577850341797, 100.26567077636719, 103.47555541992188, 106.6854476928711, 109.89533996582031, 113.105224609375, 116.31511688232422, 119.5250015258789, 122.73489379882812, 125.94478607177734, 129.15467834472656, 132.36456298828125, 135.57444763183594, 138.7843475341797]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 7.0, 3.0, 3.0, 9.0, 9.0, 13.0, 11.0, 12.0, 11.0, 19.0, 19.0, 24.0, 23.0, 24.0, 25.0, 27.0, 44.0, 39.0, 36.0, 49.0, 52.0, 35.0, 43.0, 43.0, 47.0, 28.0, 38.0, 41.0, 29.0, 34.0, 34.0, 24.0, 16.0, 13.0, 11.0, 26.0, 12.0, 16.0, 10.0, 12.0, 2.0, 8.0, 9.0, 6.0, 1.0, 7.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-29.55046844482422, -28.6372127532959, -27.723957061767578, -26.81070327758789, -25.89744758605957, -24.98419189453125, -24.07093620300293, -23.15768051147461, -22.24442481994629, -21.33116912841797, -20.41791343688965, -19.504657745361328, -18.59140396118164, -17.67814826965332, -16.764892578125, -15.85163688659668, -14.938382148742676, -14.025126457214355, -13.111871719360352, -12.198616027832031, -11.285360336303711, -10.37210464477539, -9.458849906921387, -8.545594215393066, -7.632339000701904, -6.719083786010742, -5.805828094482422, -4.89257287979126, -3.9793174266815186, -3.0660619735717773, -2.1528067588806152, -1.239551067352295, -0.3262958526611328, 0.5869595408439636, 1.50021493434906, 2.4134702682495117, 3.326725721359253, 4.239981174468994, 5.153236389160156, 6.066492080688477, 6.979747295379639, 7.893002510070801, 8.806258201599121, 9.719512939453125, 10.632768630981445, 11.546024322509766, 12.459280014038086, 13.372535705566406, 14.28579044342041, 15.19904613494873, 16.112300872802734, 17.025556564331055, 17.938812255859375, 18.852067947387695, 19.765323638916016, 20.678577423095703, 21.591833114624023, 22.505088806152344, 23.418344497680664, 24.331600189208984, 25.244853973388672, 26.158109664916992, 27.071365356445312, 27.984621047973633, 28.897876739501953]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 8.0, 5.0, 13.0, 7.0, 14.0, 20.0, 14.0, 15.0, 33.0, 23.0, 28.0, 29.0, 32.0, 35.0, 32.0, 47.0, 45.0, 46.0, 53.0, 47.0, 56.0, 38.0, 43.0, 36.0, 37.0, 30.0, 36.0, 35.0, 22.0, 28.0, 18.0, 13.0, 22.0, 8.0, 11.0, 7.0, 4.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.61328125, -4.45977783203125, -4.3062744140625, -4.15277099609375, -3.999267578125, -3.84576416015625, -3.6922607421875, -3.53875732421875, -3.38525390625, -3.23175048828125, -3.0782470703125, -2.92474365234375, -2.771240234375, -2.61773681640625, -2.4642333984375, -2.31072998046875, -2.1572265625, -2.00372314453125, -1.8502197265625, -1.69671630859375, -1.543212890625, -1.38970947265625, -1.2362060546875, -1.08270263671875, -0.92919921875, -0.77569580078125, -0.6221923828125, -0.46868896484375, -0.315185546875, -0.16168212890625, -0.0081787109375, 0.14532470703125, 0.298828125, 0.45233154296875, 0.6058349609375, 0.75933837890625, 0.912841796875, 1.06634521484375, 1.2198486328125, 1.37335205078125, 1.52685546875, 1.68035888671875, 1.8338623046875, 1.98736572265625, 2.140869140625, 2.29437255859375, 2.4478759765625, 2.60137939453125, 2.7548828125, 2.90838623046875, 3.0618896484375, 3.21539306640625, 3.368896484375, 3.52239990234375, 3.6759033203125, 3.82940673828125, 3.98291015625, 4.13641357421875, 4.2899169921875, 4.44342041015625, 4.596923828125, 4.75042724609375, 4.9039306640625, 5.05743408203125, 5.2109375]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 7.0, 13.0, 12.0, 25.0, 28.0, 46.0, 58.0, 62.0, 105.0, 133.0, 156.0, 200.0, 310.0, 419.0, 608.0, 1053.0, 2207.0, 7007.0, 40785.0, 456043.0, 3256467.0, 379664.0, 36889.0, 6758.0, 2089.0, 1019.0, 597.0, 370.0, 301.0, 209.0, 174.0, 112.0, 88.0, 64.0, 57.0, 53.0, 25.0, 23.0, 11.0, 14.0, 8.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-25.1875, -24.36083984375, -23.5341796875, -22.70751953125, -21.880859375, -21.05419921875, -20.2275390625, -19.40087890625, -18.57421875, -17.74755859375, -16.9208984375, -16.09423828125, -15.267578125, -14.44091796875, -13.6142578125, -12.78759765625, -11.9609375, -11.13427734375, -10.3076171875, -9.48095703125, -8.654296875, -7.82763671875, -7.0009765625, -6.17431640625, -5.34765625, -4.52099609375, -3.6943359375, -2.86767578125, -2.041015625, -1.21435546875, -0.3876953125, 0.43896484375, 1.265625, 2.09228515625, 2.9189453125, 3.74560546875, 4.572265625, 5.39892578125, 6.2255859375, 7.05224609375, 7.87890625, 8.70556640625, 9.5322265625, 10.35888671875, 11.185546875, 12.01220703125, 12.8388671875, 13.66552734375, 14.4921875, 15.31884765625, 16.1455078125, 16.97216796875, 17.798828125, 18.62548828125, 19.4521484375, 20.27880859375, 21.10546875, 21.93212890625, 22.7587890625, 23.58544921875, 24.412109375, 25.23876953125, 26.0654296875, 26.89208984375, 27.71875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 5.0, 4.0, 7.0, 11.0, 13.0, 4.0, 7.0, 15.0, 19.0, 23.0, 30.0, 52.0, 62.0, 76.0, 102.0, 122.0, 138.0, 150.0, 216.0, 229.0, 295.0, 327.0, 320.0, 322.0, 265.0, 229.0, 185.0, 176.0, 116.0, 108.0, 87.0, 73.0, 60.0, 47.0, 39.0, 36.0, 25.0, 16.0, 12.0, 15.0, 6.0, 12.0, 6.0, 4.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-8.6796875, -8.42718505859375, -8.1746826171875, -7.92218017578125, -7.669677734375, -7.41717529296875, -7.1646728515625, -6.91217041015625, -6.65966796875, -6.40716552734375, -6.1546630859375, -5.90216064453125, -5.649658203125, -5.39715576171875, -5.1446533203125, -4.89215087890625, -4.6396484375, -4.38714599609375, -4.1346435546875, -3.88214111328125, -3.629638671875, -3.37713623046875, -3.1246337890625, -2.87213134765625, -2.61962890625, -2.36712646484375, -2.1146240234375, -1.86212158203125, -1.609619140625, -1.35711669921875, -1.1046142578125, -0.85211181640625, -0.599609375, -0.34710693359375, -0.0946044921875, 0.15789794921875, 0.410400390625, 0.66290283203125, 0.9154052734375, 1.16790771484375, 1.42041015625, 1.67291259765625, 1.9254150390625, 2.17791748046875, 2.430419921875, 2.68292236328125, 2.9354248046875, 3.18792724609375, 3.4404296875, 3.69293212890625, 3.9454345703125, 4.19793701171875, 4.450439453125, 4.70294189453125, 4.9554443359375, 5.20794677734375, 5.46044921875, 5.71295166015625, 5.9654541015625, 6.21795654296875, 6.470458984375, 6.72296142578125, 6.9754638671875, 7.22796630859375, 7.48046875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 8.0, 4.0, 3.0, 8.0, 17.0, 13.0, 20.0, 25.0, 28.0, 76.0, 80.0, 132.0, 198.0, 317.0, 604.0, 1188.0, 2807.0, 7981.0, 24980.0, 94661.0, 419560.0, 1923423.0, 1347639.0, 276983.0, 65304.0, 17897.0, 5835.0, 2194.0, 944.0, 494.0, 287.0, 184.0, 121.0, 85.0, 59.0, 37.0, 26.0, 17.0, 16.0, 10.0, 8.0, 6.0, 5.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.546875, -11.1468505859375, -10.746826171875, -10.3468017578125, -9.94677734375, -9.5467529296875, -9.146728515625, -8.7467041015625, -8.3466796875, -7.9466552734375, -7.546630859375, -7.1466064453125, -6.74658203125, -6.3465576171875, -5.946533203125, -5.5465087890625, -5.146484375, -4.7464599609375, -4.346435546875, -3.9464111328125, -3.54638671875, -3.1463623046875, -2.746337890625, -2.3463134765625, -1.9462890625, -1.5462646484375, -1.146240234375, -0.7462158203125, -0.34619140625, 0.0538330078125, 0.453857421875, 0.8538818359375, 1.25390625, 1.6539306640625, 2.053955078125, 2.4539794921875, 2.85400390625, 3.2540283203125, 3.654052734375, 4.0540771484375, 4.4541015625, 4.8541259765625, 5.254150390625, 5.6541748046875, 6.05419921875, 6.4542236328125, 6.854248046875, 7.2542724609375, 7.654296875, 8.0543212890625, 8.454345703125, 8.8543701171875, 9.25439453125, 9.6544189453125, 10.054443359375, 10.4544677734375, 10.8544921875, 11.2545166015625, 11.654541015625, 12.0545654296875, 12.45458984375, 12.8546142578125, 13.254638671875, 13.6546630859375, 14.0546875]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 9.0, 7.0, 4.0, 14.0, 22.0, 32.0, 36.0, 58.0, 76.0, 72.0, 87.0, 100.0, 92.0, 88.0, 83.0, 66.0, 39.0, 35.0, 32.0, 18.0, 17.0, 5.0, 9.0, 4.0, 0.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.0766830444336, -71.915283203125, -68.75387573242188, -65.59247589111328, -62.43107604980469, -59.269676208496094, -56.108272552490234, -52.946868896484375, -49.78546905517578, -46.62406921386719, -43.46266555786133, -40.30126190185547, -37.139862060546875, -33.97846221923828, -30.817058563232422, -27.655656814575195, -24.49425506591797, -21.332853317260742, -18.171451568603516, -15.010049819946289, -11.848648071289062, -8.687246322631836, -5.525844573974609, -2.364442825317383, 0.7969589233398438, 3.9583606719970703, 7.119762420654297, 10.281164169311523, 13.44256591796875, 16.603967666625977, 19.765369415283203, 22.92677116394043, 26.088165283203125, 29.24956703186035, 32.41096878051758, 35.57237243652344, 38.73377227783203, 41.895172119140625, 45.056575775146484, 48.217979431152344, 51.37937927246094, 54.54077911376953, 57.70218276977539, 60.86358642578125, 64.02498626708984, 67.18638610839844, 70.34779357910156, 73.50919342041016, 76.67059326171875, 79.83199310302734, 82.99339294433594, 86.15480041503906, 89.31620025634766, 92.47760009765625, 95.63900756835938, 98.80040740966797, 101.96180725097656, 105.12320709228516, 108.28460693359375, 111.44601440429688, 114.60741424560547, 117.76881408691406, 120.93022155761719, 124.09162139892578, 127.25302124023438]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 8.0, 8.0, 10.0, 15.0, 13.0, 8.0, 19.0, 21.0, 28.0, 27.0, 24.0, 30.0, 36.0, 28.0, 39.0, 45.0, 41.0, 47.0, 41.0, 50.0, 39.0, 50.0, 45.0, 31.0, 34.0, 34.0, 39.0, 23.0, 27.0, 27.0, 24.0, 16.0, 13.0, 10.0, 16.0, 9.0, 8.0, 2.0, 2.0, 4.0, 5.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.72960662841797, -56.040584564208984, -54.351566314697266, -52.66254425048828, -50.97352600097656, -49.28450393676758, -47.595481872558594, -45.906463623046875, -44.217445373535156, -42.52842330932617, -40.83940505981445, -39.15038299560547, -37.46136474609375, -35.772342681884766, -34.08332061767578, -32.39430236816406, -30.705280303955078, -29.016260147094727, -27.327239990234375, -25.63821792602539, -23.949199676513672, -22.260177612304688, -20.571157455444336, -18.882137298583984, -17.193117141723633, -15.504096984863281, -13.81507682800293, -12.126055717468262, -10.43703556060791, -8.748015403747559, -7.058994293212891, -5.369974136352539, -3.680950164794922, -1.9919297695159912, -0.30290937423706055, 1.3861112594604492, 3.075131416320801, 4.764151573181152, 6.45317268371582, 8.142192840576172, 9.831212997436523, 11.520233154296875, 13.209253311157227, 14.898274421691895, 16.587295532226562, 18.27631378173828, 19.965335845947266, 21.654356002807617, 23.34337615966797, 25.03239631652832, 26.721416473388672, 28.410438537597656, 30.099456787109375, 31.78847885131836, 33.477500915527344, 35.16651916503906, 36.85553741455078, 38.544559478759766, 40.233577728271484, 41.92259979248047, 43.61161804199219, 45.30064010620117, 46.989662170410156, 48.678680419921875, 50.36770248413086]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 5.0, 9.0, 8.0, 8.0, 16.0, 11.0, 13.0, 26.0, 30.0, 10.0, 24.0, 25.0, 29.0, 27.0, 33.0, 34.0, 31.0, 29.0, 35.0, 48.0, 50.0, 53.0, 49.0, 40.0, 36.0, 32.0, 26.0, 31.0, 29.0, 27.0, 19.0, 23.0, 19.0, 19.0, 10.0, 8.0, 17.0, 12.0, 3.0, 7.0, 4.0, 6.0, 8.0, 5.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-106.125, -103.0478515625, -99.970703125, -96.8935546875, -93.81640625, -90.7392578125, -87.662109375, -84.5849609375, -81.5078125, -78.4306640625, -75.353515625, -72.2763671875, -69.19921875, -66.1220703125, -63.044921875, -59.9677734375, -56.890625, -53.8134765625, -50.736328125, -47.6591796875, -44.58203125, -41.5048828125, -38.427734375, -35.3505859375, -32.2734375, -29.1962890625, -26.119140625, -23.0419921875, -19.96484375, -16.8876953125, -13.810546875, -10.7333984375, -7.65625, -4.5791015625, -1.501953125, 1.5751953125, 4.65234375, 7.7294921875, 10.806640625, 13.8837890625, 16.9609375, 20.0380859375, 23.115234375, 26.1923828125, 29.26953125, 32.3466796875, 35.423828125, 38.5009765625, 41.578125, 44.6552734375, 47.732421875, 50.8095703125, 53.88671875, 56.9638671875, 60.041015625, 63.1181640625, 66.1953125, 69.2724609375, 72.349609375, 75.4267578125, 78.50390625, 81.5810546875, 84.658203125, 87.7353515625, 90.8125]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 15.0, 30.0, 24.0, 51.0, 82.0, 128.0, 177.0, 269.0, 386.0, 589.0, 901.0, 1329.0, 1982.0, 2930.0, 4662.0, 7123.0, 10850.0, 17072.0, 27874.0, 45557.0, 79389.0, 147418.0, 273679.0, 185027.0, 96785.0, 54991.0, 32703.0, 20158.0, 12701.0, 8074.0, 5243.0, 3413.0, 2326.0, 1513.0, 1037.0, 698.0, 492.0, 290.0, 217.0, 136.0, 80.0, 47.0, 35.0, 16.0, 20.0, 10.0, 11.0, 10.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.86279296875, -0.8379058837890625, -0.813018798828125, -0.7881317138671875, -0.76324462890625, -0.7383575439453125, -0.713470458984375, -0.6885833740234375, -0.6636962890625, -0.6388092041015625, -0.613922119140625, -0.5890350341796875, -0.56414794921875, -0.5392608642578125, -0.514373779296875, -0.4894866943359375, -0.464599609375, -0.4397125244140625, -0.414825439453125, -0.3899383544921875, -0.36505126953125, -0.3401641845703125, -0.315277099609375, -0.2903900146484375, -0.2655029296875, -0.2406158447265625, -0.215728759765625, -0.1908416748046875, -0.16595458984375, -0.1410675048828125, -0.116180419921875, -0.0912933349609375, -0.06640625, -0.0415191650390625, -0.016632080078125, 0.0082550048828125, 0.03314208984375, 0.0580291748046875, 0.082916259765625, 0.1078033447265625, 0.1326904296875, 0.1575775146484375, 0.182464599609375, 0.2073516845703125, 0.23223876953125, 0.2571258544921875, 0.282012939453125, 0.3069000244140625, 0.331787109375, 0.3566741943359375, 0.381561279296875, 0.4064483642578125, 0.43133544921875, 0.4562225341796875, 0.481109619140625, 0.5059967041015625, 0.5308837890625, 0.5557708740234375, 0.580657958984375, 0.6055450439453125, 0.63043212890625, 0.6553192138671875, 0.680206298828125, 0.7050933837890625, 0.72998046875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 6.0, 3.0, 1.0, 2.0, 7.0, 4.0, 6.0, 5.0, 5.0, 7.0, 5.0, 12.0, 13.0, 15.0, 16.0, 17.0, 25.0, 20.0, 19.0, 25.0, 25.0, 25.0, 39.0, 39.0, 41.0, 38.0, 35.0, 30.0, 1071.0, 39.0, 34.0, 34.0, 57.0, 36.0, 39.0, 26.0, 25.0, 20.0, 28.0, 17.0, 17.0, 17.0, 13.0, 11.0, 10.0, 12.0, 11.0, 6.0, 5.0, 6.0, 9.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-77.8125, -75.3857421875, -72.958984375, -70.5322265625, -68.10546875, -65.6787109375, -63.251953125, -60.8251953125, -58.3984375, -55.9716796875, -53.544921875, -51.1181640625, -48.69140625, -46.2646484375, -43.837890625, -41.4111328125, -38.984375, -36.5576171875, -34.130859375, -31.7041015625, -29.27734375, -26.8505859375, -24.423828125, -21.9970703125, -19.5703125, -17.1435546875, -14.716796875, -12.2900390625, -9.86328125, -7.4365234375, -5.009765625, -2.5830078125, -0.15625, 2.2705078125, 4.697265625, 7.1240234375, 9.55078125, 11.9775390625, 14.404296875, 16.8310546875, 19.2578125, 21.6845703125, 24.111328125, 26.5380859375, 28.96484375, 31.3916015625, 33.818359375, 36.2451171875, 38.671875, 41.0986328125, 43.525390625, 45.9521484375, 48.37890625, 50.8056640625, 53.232421875, 55.6591796875, 58.0859375, 60.5126953125, 62.939453125, 65.3662109375, 67.79296875, 70.2197265625, 72.646484375, 75.0732421875, 77.5]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 6.0, 8.0, 6.0, 19.0, 14.0, 35.0, 32.0, 53.0, 73.0, 105.0, 137.0, 209.0, 308.0, 431.0, 650.0, 864.0, 1328.0, 1807.0, 2683.0, 3904.0, 5834.0, 8495.0, 12922.0, 19395.0, 29934.0, 46309.0, 74722.0, 123994.0, 1248216.0, 193282.0, 118305.0, 71673.0, 44827.0, 29048.0, 18859.0, 12301.0, 8484.0, 5582.0, 3898.0, 2517.0, 1716.0, 1219.0, 846.0, 645.0, 456.0, 302.0, 200.0, 159.0, 116.0, 65.0, 45.0, 32.0, 18.0, 18.0, 21.0, 9.0, 6.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.298095703125, -0.2884674072265625, -0.278839111328125, -0.2692108154296875, -0.25958251953125, -0.2499542236328125, -0.240325927734375, -0.2306976318359375, -0.2210693359375, -0.2114410400390625, -0.201812744140625, -0.1921844482421875, -0.18255615234375, -0.1729278564453125, -0.163299560546875, -0.1536712646484375, -0.14404296875, -0.1344146728515625, -0.124786376953125, -0.1151580810546875, -0.10552978515625, -0.0959014892578125, -0.086273193359375, -0.0766448974609375, -0.0670166015625, -0.0573883056640625, -0.047760009765625, -0.0381317138671875, -0.02850341796875, -0.0188751220703125, -0.009246826171875, 0.0003814697265625, 0.010009765625, 0.0196380615234375, 0.029266357421875, 0.0388946533203125, 0.04852294921875, 0.0581512451171875, 0.067779541015625, 0.0774078369140625, 0.0870361328125, 0.0966644287109375, 0.106292724609375, 0.1159210205078125, 0.12554931640625, 0.1351776123046875, 0.144805908203125, 0.1544342041015625, 0.1640625, 0.1736907958984375, 0.183319091796875, 0.1929473876953125, 0.20257568359375, 0.2122039794921875, 0.221832275390625, 0.2314605712890625, 0.2410888671875, 0.2507171630859375, 0.260345458984375, 0.2699737548828125, 0.27960205078125, 0.2892303466796875, 0.298858642578125, 0.3084869384765625, 0.318115234375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 6.0, 5.0, 7.0, 6.0, 7.0, 9.0, 8.0, 10.0, 15.0, 26.0, 41.0, 32.0, 58.0, 100.0, 143.0, 134.0, 119.0, 66.0, 54.0, 34.0, 28.0, 23.0, 11.0, 12.0, 9.0, 6.0, 7.0, 5.0, 5.0, 7.0, 0.0, 3.0, 2.0, 1.0, 7.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.796815872192383e-05, -3.645848482847214e-05, -3.494881093502045e-05, -3.3439137041568756e-05, -3.1929463148117065e-05, -3.0419789254665375e-05, -2.8910115361213684e-05, -2.7400441467761993e-05, -2.5890767574310303e-05, -2.4381093680858612e-05, -2.287141978740692e-05, -2.136174589395523e-05, -1.985207200050354e-05, -1.834239810705185e-05, -1.683272421360016e-05, -1.5323050320148468e-05, -1.3813376426696777e-05, -1.2303702533245087e-05, -1.0794028639793396e-05, -9.284354746341705e-06, -7.774680852890015e-06, -6.265006959438324e-06, -4.755333065986633e-06, -3.2456591725349426e-06, -1.735985279083252e-06, -2.2631138563156128e-07, 1.2833625078201294e-06, 2.79303640127182e-06, 4.302710294723511e-06, 5.812384188175201e-06, 7.322058081626892e-06, 8.831731975078583e-06, 1.0341405868530273e-05, 1.1851079761981964e-05, 1.3360753655433655e-05, 1.4870427548885345e-05, 1.6380101442337036e-05, 1.7889775335788727e-05, 1.9399449229240417e-05, 2.0909123122692108e-05, 2.24187970161438e-05, 2.392847090959549e-05, 2.543814480304718e-05, 2.694781869649887e-05, 2.845749258995056e-05, 2.9967166483402252e-05, 3.147684037685394e-05, 3.2986514270305634e-05, 3.4496188163757324e-05, 3.6005862057209015e-05, 3.7515535950660706e-05, 3.9025209844112396e-05, 4.053488373756409e-05, 4.204455763101578e-05, 4.355423152446747e-05, 4.506390541791916e-05, 4.657357931137085e-05, 4.808325320482254e-05, 4.959292709827423e-05, 5.110260099172592e-05, 5.261227488517761e-05, 5.41219487786293e-05, 5.5631622672080994e-05, 5.7141296565532684e-05, 5.8650970458984375e-05]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 3.0, 6.0, 11.0, 11.0, 19.0, 22.0, 46.0, 48.0, 66.0, 112.0, 189.0, 290.0, 500.0, 924.0, 1772.0, 3345.0, 6469.0, 13784.0, 31265.0, 77119.0, 242696.0, 435466.0, 141036.0, 51176.0, 21837.0, 9830.0, 4858.0, 2459.0, 1337.0, 737.0, 396.0, 248.0, 159.0, 97.0, 71.0, 44.0, 38.0, 19.0, 13.0, 6.0, 10.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00021970272064208984, -0.00021310150623321533, -0.00020650029182434082, -0.0001998990774154663, -0.0001932978630065918, -0.00018669664859771729, -0.00018009543418884277, -0.00017349421977996826, -0.00016689300537109375, -0.00016029179096221924, -0.00015369057655334473, -0.00014708936214447021, -0.0001404881477355957, -0.0001338869333267212, -0.00012728571891784668, -0.00012068450450897217, -0.00011408329010009766, -0.00010748207569122314, -0.00010088086128234863, -9.427964687347412e-05, -8.767843246459961e-05, -8.10772180557251e-05, -7.447600364685059e-05, -6.787478923797607e-05, -6.127357482910156e-05, -5.467236042022705e-05, -4.807114601135254e-05, -4.146993160247803e-05, -3.4868717193603516e-05, -2.8267502784729004e-05, -2.1666288375854492e-05, -1.506507396697998e-05, -8.463859558105469e-06, -1.862645149230957e-06, 4.738569259643555e-06, 1.1339783668518066e-05, 1.7940998077392578e-05, 2.454221248626709e-05, 3.11434268951416e-05, 3.774464130401611e-05, 4.4345855712890625e-05, 5.094707012176514e-05, 5.754828453063965e-05, 6.414949893951416e-05, 7.075071334838867e-05, 7.735192775726318e-05, 8.39531421661377e-05, 9.055435657501221e-05, 9.715557098388672e-05, 0.00010375678539276123, 0.00011035799980163574, 0.00011695921421051025, 0.00012356042861938477, 0.00013016164302825928, 0.0001367628574371338, 0.0001433640718460083, 0.0001499652862548828, 0.00015656650066375732, 0.00016316771507263184, 0.00016976892948150635, 0.00017637014389038086, 0.00018297135829925537, 0.00018957257270812988, 0.0001961737871170044, 0.0002027750015258789]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 12.0, 8.0, 12.0, 20.0, 32.0, 56.0, 90.0, 109.0, 127.0, 132.0, 98.0, 91.0, 46.0, 54.0, 32.0, 27.0, 14.0, 13.0, 7.0, 10.0, 1.0, 6.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5547399824718013e-05, -5.274198701954447e-05, -4.9936570576392114e-05, -4.713115777121857e-05, -4.432574496604502e-05, -4.1520332160871476e-05, -3.871491935569793e-05, -3.590950291254558e-05, -3.310409010737203e-05, -3.0298677302198485e-05, -2.7493262678035535e-05, -2.4687848053872585e-05, -2.188243524869904e-05, -1.9077022443525493e-05, -1.6271607819362544e-05, -1.3466193195199594e-05, -1.0660780390026048e-05, -7.8553666753578e-06, -5.049952960689552e-06, -2.2445392460213043e-06, 5.608744686469436e-07, 3.3662881833151914e-06, 6.171701897983439e-06, 8.977116522146389e-06, 1.1782529327319935e-05, 1.4587943041988183e-05, 1.739335675665643e-05, 2.019877138081938e-05, 2.3004184185992926e-05, 2.5809596991166472e-05, 2.8615011615329422e-05, 3.142042623949237e-05, 3.4225842682644725e-05, 3.703125548781827e-05, 3.983666829299182e-05, 4.264208473614417e-05, 4.5447497541317716e-05, 4.825291034649126e-05, 5.1058326789643615e-05, 5.386373959481716e-05, 5.666915239999071e-05, 5.9474565205164254e-05, 6.22799780103378e-05, 6.508539081551135e-05, 6.78908108966425e-05, 7.069622370181605e-05, 7.35016365069896e-05, 7.630704931216314e-05, 7.911246211733669e-05, 8.191787492251024e-05, 8.472328772768378e-05, 8.752870053285733e-05, 9.033411333803087e-05, 9.313953341916203e-05, 9.594494622433558e-05, 9.875035902950913e-05, 0.00010155577183468267, 0.00010436118463985622, 0.00010716659744502977, 0.00010997201025020331, 0.00011277743033133447, 0.00011558284313650802, 0.00011838825594168156, 0.00012119366874685511, 0.00012399908155202866]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 7.0, 8.0, 10.0, 5.0, 13.0, 9.0, 9.0, 22.0, 14.0, 17.0, 34.0, 17.0, 26.0, 39.0, 27.0, 43.0, 33.0, 40.0, 36.0, 28.0, 33.0, 41.0, 34.0, 41.0, 29.0, 29.0, 35.0, 27.0, 33.0, 31.0, 32.0, 29.0, 21.0, 21.0, 16.0, 18.0, 12.0, 13.0, 13.0, 8.0, 5.0, 6.0, 4.0, 4.0, 8.0, 11.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-2.4020671844482422e-05, -2.329424023628235e-05, -2.2567808628082275e-05, -2.1841377019882202e-05, -2.111494541168213e-05, -2.0388513803482056e-05, -1.9662082195281982e-05, -1.893565058708191e-05, -1.8209218978881836e-05, -1.7482787370681763e-05, -1.675635576248169e-05, -1.6029924154281616e-05, -1.5303492546081543e-05, -1.457706093788147e-05, -1.3850629329681396e-05, -1.3124197721481323e-05, -1.239776611328125e-05, -1.1671334505081177e-05, -1.0944902896881104e-05, -1.021847128868103e-05, -9.492039680480957e-06, -8.765608072280884e-06, -8.03917646408081e-06, -7.312744855880737e-06, -6.586313247680664e-06, -5.859881639480591e-06, -5.133450031280518e-06, -4.407018423080444e-06, -3.680586814880371e-06, -2.954155206680298e-06, -2.2277235984802246e-06, -1.5012919902801514e-06, -7.748603820800781e-07, -4.842877388000488e-08, 6.780028343200684e-07, 1.4044344425201416e-06, 2.130866050720215e-06, 2.857297658920288e-06, 3.5837292671203613e-06, 4.3101608753204346e-06, 5.036592483520508e-06, 5.763024091720581e-06, 6.489455699920654e-06, 7.2158873081207275e-06, 7.9423189163208e-06, 8.668750524520874e-06, 9.395182132720947e-06, 1.012161374092102e-05, 1.0848045349121094e-05, 1.1574476957321167e-05, 1.230090856552124e-05, 1.3027340173721313e-05, 1.3753771781921387e-05, 1.448020339012146e-05, 1.5206634998321533e-05, 1.5933066606521606e-05, 1.665949821472168e-05, 1.7385929822921753e-05, 1.8112361431121826e-05, 1.88387930393219e-05, 1.9565224647521973e-05, 2.0291656255722046e-05, 2.101808786392212e-05, 2.1744519472122192e-05, 2.2470951080322266e-05]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 5.0, 9.0, 8.0, 8.0, 16.0, 11.0, 13.0, 26.0, 30.0, 10.0, 24.0, 25.0, 29.0, 27.0, 33.0, 34.0, 31.0, 29.0, 35.0, 48.0, 50.0, 53.0, 49.0, 40.0, 36.0, 32.0, 26.0, 31.0, 29.0, 27.0, 19.0, 23.0, 19.0, 19.0, 10.0, 8.0, 17.0, 12.0, 3.0, 7.0, 4.0, 6.0, 8.0, 5.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-106.125, -103.0478515625, -99.970703125, -96.8935546875, -93.81640625, -90.7392578125, -87.662109375, -84.5849609375, -81.5078125, -78.4306640625, -75.353515625, -72.2763671875, -69.19921875, -66.1220703125, -63.044921875, -59.9677734375, -56.890625, -53.8134765625, -50.736328125, -47.6591796875, -44.58203125, -41.5048828125, -38.427734375, -35.3505859375, -32.2734375, -29.1962890625, -26.119140625, -23.0419921875, -19.96484375, -16.8876953125, -13.810546875, -10.7333984375, -7.65625, -4.5791015625, -1.501953125, 1.5751953125, 4.65234375, 7.7294921875, 10.806640625, 13.8837890625, 16.9609375, 20.0380859375, 23.115234375, 26.1923828125, 29.26953125, 32.3466796875, 35.423828125, 38.5009765625, 41.578125, 44.6552734375, 47.732421875, 50.8095703125, 53.88671875, 56.9638671875, 60.041015625, 63.1181640625, 66.1953125, 69.2724609375, 72.349609375, 75.4267578125, 78.50390625, 81.5810546875, 84.658203125, 87.7353515625, 90.8125]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 4.0, 3.0, 8.0, 9.0, 7.0, 11.0, 15.0, 14.0, 31.0, 33.0, 40.0, 31.0, 42.0, 57.0, 87.0, 158.0, 295.0, 571.0, 1509.0, 8218.0, 79967.0, 574036.0, 342415.0, 34497.0, 4308.0, 1037.0, 418.0, 221.0, 143.0, 90.0, 63.0, 41.0, 30.0, 29.0, 24.0, 14.0, 13.0, 10.0, 12.0, 7.0, 3.0, 5.0, 8.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-19.078125, -18.5302734375, -17.982421875, -17.4345703125, -16.88671875, -16.3388671875, -15.791015625, -15.2431640625, -14.6953125, -14.1474609375, -13.599609375, -13.0517578125, -12.50390625, -11.9560546875, -11.408203125, -10.8603515625, -10.3125, -9.7646484375, -9.216796875, -8.6689453125, -8.12109375, -7.5732421875, -7.025390625, -6.4775390625, -5.9296875, -5.3818359375, -4.833984375, -4.2861328125, -3.73828125, -3.1904296875, -2.642578125, -2.0947265625, -1.546875, -0.9990234375, -0.451171875, 0.0966796875, 0.64453125, 1.1923828125, 1.740234375, 2.2880859375, 2.8359375, 3.3837890625, 3.931640625, 4.4794921875, 5.02734375, 5.5751953125, 6.123046875, 6.6708984375, 7.21875, 7.7666015625, 8.314453125, 8.8623046875, 9.41015625, 9.9580078125, 10.505859375, 11.0537109375, 11.6015625, 12.1494140625, 12.697265625, 13.2451171875, 13.79296875, 14.3408203125, 14.888671875, 15.4365234375, 15.984375]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 4.0, 4.0, 11.0, 10.0, 10.0, 17.0, 19.0, 22.0, 24.0, 33.0, 37.0, 37.0, 34.0, 54.0, 44.0, 44.0, 46.0, 55.0, 2092.0, 45.0, 45.0, 47.0, 31.0, 39.0, 34.0, 45.0, 28.0, 21.0, 25.0, 17.0, 14.0, 12.0, 8.0, 11.0, 7.0, 9.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-171.5, -166.658203125, -161.81640625, -156.974609375, -152.1328125, -147.291015625, -142.44921875, -137.607421875, -132.765625, -127.923828125, -123.08203125, -118.240234375, -113.3984375, -108.556640625, -103.71484375, -98.873046875, -94.03125, -89.189453125, -84.34765625, -79.505859375, -74.6640625, -69.822265625, -64.98046875, -60.138671875, -55.296875, -50.455078125, -45.61328125, -40.771484375, -35.9296875, -31.087890625, -26.24609375, -21.404296875, -16.5625, -11.720703125, -6.87890625, -2.037109375, 2.8046875, 7.646484375, 12.48828125, 17.330078125, 22.171875, 27.013671875, 31.85546875, 36.697265625, 41.5390625, 46.380859375, 51.22265625, 56.064453125, 60.90625, 65.748046875, 70.58984375, 75.431640625, 80.2734375, 85.115234375, 89.95703125, 94.798828125, 99.640625, 104.482421875, 109.32421875, 114.166015625, 119.0078125, 123.849609375, 128.69140625, 133.533203125, 138.375]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 7.0, 10.0, 7.0, 15.0, 16.0, 32.0, 73.0, 99.0, 188.0, 371.0, 757.0, 1908.0, 9557.0, 184799.0, 2894731.0, 46445.0, 4298.0, 1197.0, 562.0, 272.0, 152.0, 82.0, 49.0, 29.0, 17.0, 17.0, 6.0, 7.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5234375, -14.8843994140625, -14.245361328125, -13.6063232421875, -12.96728515625, -12.3282470703125, -11.689208984375, -11.0501708984375, -10.4111328125, -9.7720947265625, -9.133056640625, -8.4940185546875, -7.85498046875, -7.2159423828125, -6.576904296875, -5.9378662109375, -5.298828125, -4.6597900390625, -4.020751953125, -3.3817138671875, -2.74267578125, -2.1036376953125, -1.464599609375, -0.8255615234375, -0.1865234375, 0.4525146484375, 1.091552734375, 1.7305908203125, 2.36962890625, 3.0086669921875, 3.647705078125, 4.2867431640625, 4.92578125, 5.5648193359375, 6.203857421875, 6.8428955078125, 7.48193359375, 8.1209716796875, 8.760009765625, 9.3990478515625, 10.0380859375, 10.6771240234375, 11.316162109375, 11.9552001953125, 12.59423828125, 13.2332763671875, 13.872314453125, 14.5113525390625, 15.150390625, 15.7894287109375, 16.428466796875, 17.0675048828125, 17.70654296875, 18.3455810546875, 18.984619140625, 19.6236572265625, 20.2626953125, 20.9017333984375, 21.540771484375, 22.1798095703125, 22.81884765625, 23.4578857421875, 24.096923828125, 24.7359619140625, 25.375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 9.0, 12.0, 11.0, 22.0, 45.0, 93.0, 115.0, 163.0, 166.0, 142.0, 90.0, 56.0, 27.0, 16.0, 12.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-231.48439025878906, -220.6607666015625, -209.837158203125, -199.01353454589844, -188.18991088867188, -177.3662872314453, -166.54266357421875, -155.71905517578125, -144.8954315185547, -134.07180786132812, -123.2481918334961, -112.42457580566406, -101.6009521484375, -90.77732849121094, -79.9537124633789, -69.13009643554688, -58.30647277832031, -47.482852935791016, -36.65923309326172, -25.835613250732422, -15.011993408203125, -4.188373565673828, 6.635246276855469, 17.4588623046875, 28.282485961914062, 39.10610580444336, 49.929725646972656, 60.75334548950195, 71.57696533203125, 82.40058898925781, 93.22420501708984, 104.04782104492188, 114.87142944335938, 125.69505310058594, 136.5186767578125, 147.34228515625, 158.16590881347656, 168.98953247070312, 179.81314086914062, 190.6367645263672, 201.46038818359375, 212.2840118408203, 223.10763549804688, 233.93124389648438, 244.75486755371094, 255.5784912109375, 266.402099609375, 277.2257080078125, 288.0493469238281, 298.8729553222656, 309.69659423828125, 320.52020263671875, 331.34381103515625, 342.1674499511719, 352.9910583496094, 363.814697265625, 374.6383056640625, 385.4619140625, 396.2855529785156, 407.1091613769531, 417.93280029296875, 428.75640869140625, 439.58001708984375, 450.40362548828125, 461.2272644042969]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 9.0, 6.0, 12.0, 13.0, 12.0, 16.0, 13.0, 12.0, 18.0, 19.0, 21.0, 29.0, 30.0, 30.0, 25.0, 30.0, 45.0, 42.0, 37.0, 41.0, 41.0, 42.0, 33.0, 36.0, 43.0, 30.0, 30.0, 39.0, 27.0, 29.0, 24.0, 16.0, 28.0, 24.0, 13.0, 10.0, 9.0, 13.0, 9.0, 10.0, 9.0, 6.0, 4.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-218.80093383789062, -211.5113983154297, -204.2218780517578, -196.93234252929688, -189.642822265625, -182.35328674316406, -175.06375122070312, -167.77423095703125, -160.48471069335938, -153.19517517089844, -145.90565490722656, -138.61611938476562, -131.32659912109375, -124.03706359863281, -116.7475357055664, -109.4580078125, -102.16847229003906, -94.87894439697266, -87.58941650390625, -80.29988098144531, -73.01036071777344, -65.7208251953125, -58.431297302246094, -51.14176940917969, -43.85224151611328, -36.562713623046875, -29.273183822631836, -21.983654022216797, -14.69412612915039, -7.404598236083984, -0.1150665283203125, 7.174461364746094, 14.464004516601562, 21.75353240966797, 29.043062210083008, 36.33259201049805, 43.62211990356445, 50.91164779663086, 58.20117950439453, 65.49070739746094, 72.78023529052734, 80.06976318359375, 87.35929107666016, 94.64881896972656, 101.9383544921875, 109.22787475585938, 116.51741027832031, 123.80693817138672, 131.09646606445312, 138.38600158691406, 145.67552185058594, 152.96505737304688, 160.25457763671875, 167.5441131591797, 174.83364868164062, 182.1231689453125, 189.41268920898438, 196.7022247314453, 203.9917449951172, 211.28128051757812, 218.57080078125, 225.86033630371094, 233.14987182617188, 240.43939208984375, 247.7289276123047]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 15.0, 7.0, 21.0, 20.0, 33.0, 31.0, 55.0, 64.0, 99.0, 120.0, 159.0, 224.0, 233.0, 335.0, 441.0, 519.0, 686.0, 1079.0, 1040564.0, 938.0, 632.0, 524.0, 402.0, 329.0, 252.0, 210.0, 132.0, 97.0, 86.0, 62.0, 60.0, 49.0, 21.0, 12.0, 16.0, 5.0, 12.0, 5.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.50636672973633, -58.374576568603516, -56.2427864074707, -54.11099624633789, -51.97920608520508, -49.847415924072266, -47.71562957763672, -45.583839416503906, -43.452049255371094, -41.32025909423828, -39.18846893310547, -37.056678771972656, -34.924888610839844, -32.79309844970703, -30.66131019592285, -28.52952003479004, -26.397727966308594, -24.26593780517578, -22.13414764404297, -20.002357482910156, -17.870567321777344, -15.738778114318848, -13.606988906860352, -11.475198745727539, -9.343408584594727, -7.211618423461914, -5.07982873916626, -2.9480390548706055, -0.816248893737793, 1.3155412673950195, 3.4473304748535156, 5.579120635986328, 7.710906982421875, 9.842697143554688, 11.9744873046875, 14.106276512145996, 16.238067626953125, 18.369857788085938, 20.501646041870117, 22.63343620300293, 24.765226364135742, 26.897016525268555, 29.028806686401367, 31.160594940185547, 33.29238510131836, 35.42417526245117, 37.555965423583984, 39.6877555847168, 41.81954574584961, 43.95133590698242, 46.083126068115234, 48.21491622924805, 50.34670639038086, 52.47849655151367, 54.61028289794922, 56.74207305908203, 58.873863220214844, 61.005653381347656, 63.13744354248047, 65.26923370361328, 67.4010238647461, 69.5328140258789, 71.66460418701172, 73.79639434814453, 75.92818450927734]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 12.0, 3.0, 9.0, 6.0, 11.0, 25.0, 50.0, 73.0, 115.0, 187.0, 1657.0, 51435812.0, 24197.0, 674.0, 141.0, 72.0, 40.0, 18.0, 14.0, 9.0, 4.0, 9.0, 5.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1009.6558837890625, -973.3961181640625, -937.1363525390625, -900.8765869140625, -864.6168212890625, -828.3570556640625, -792.0973510742188, -755.8375854492188, -719.5778198242188, -683.3180541992188, -647.0582885742188, -610.7985229492188, -574.538818359375, -538.279052734375, -502.019287109375, -465.759521484375, -429.499755859375, -393.239990234375, -356.980224609375, -320.7204895019531, -284.4607238769531, -248.20095825195312, -211.9412078857422, -175.68145751953125, -139.42169189453125, -103.16193389892578, -66.90217590332031, -30.642417907714844, 5.617340087890625, 41.877105712890625, 78.13685607910156, 114.3966064453125, 150.6563720703125, 186.9161376953125, 223.17588806152344, 259.4356384277344, 295.6954040527344, 331.9551696777344, 368.21490478515625, 404.47467041015625, 440.73443603515625, 476.99420166015625, 513.2539672851562, 549.5137329101562, 585.7734375, 622.033203125, 658.29296875, 694.552734375, 730.8125, 767.072265625, 803.33203125, 839.591796875, 875.8515625, 912.111328125, 948.3710327148438, 984.6307983398438, 1020.8905639648438, 1057.1502685546875, 1093.4100341796875, 1129.6697998046875, 1165.9295654296875, 1202.1893310546875, 1238.4490966796875, 1274.7088623046875, 1310.9686279296875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 9.0, 12.0, 23.0, 32.0, 35.0, 62.0, 94.0, 160.0, 254.0, 395.0, 531.0, 845.0, 1320.0, 1960.0, 3012.0, 4577.0, 6914.0, 10934.0, 16889.0, 26845.0, 42673.0, 69498.0, 114709.0, 191176.0, 327152.0, 531196.0, 3783744.0, 460198.0, 275487.0, 162428.0, 97433.0, 59325.0, 36633.0, 23232.0, 14458.0, 9534.0, 6095.0, 3905.0, 2718.0, 1718.0, 1061.0, 676.0, 497.0, 313.0, 202.0, 166.0, 112.0, 74.0, 32.0, 30.0, 24.0, 8.0, 11.0, 7.0, 10.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1298828125, -0.1254558563232422, -0.12102890014648438, -0.11660194396972656, -0.11217498779296875, -0.10774803161621094, -0.10332107543945312, -0.09889411926269531, -0.0944671630859375, -0.09004020690917969, -0.08561325073242188, -0.08118629455566406, -0.07675933837890625, -0.07233238220214844, -0.06790542602539062, -0.06347846984863281, -0.059051513671875, -0.05462455749511719, -0.050197601318359375, -0.04577064514160156, -0.04134368896484375, -0.03691673278808594, -0.032489776611328125, -0.028062820434570312, -0.0236358642578125, -0.019208908081054688, -0.014781951904296875, -0.010354995727539062, -0.00592803955078125, -0.0015010833740234375, 0.002925872802734375, 0.0073528289794921875, 0.01177978515625, 0.016206741333007812, 0.020633697509765625, 0.025060653686523438, 0.02948760986328125, 0.03391456604003906, 0.038341522216796875, 0.04276847839355469, 0.0471954345703125, 0.05162239074707031, 0.056049346923828125, 0.06047630310058594, 0.06490325927734375, 0.06933021545410156, 0.07375717163085938, 0.07818412780761719, 0.082611083984375, 0.08703804016113281, 0.09146499633789062, 0.09589195251464844, 0.10031890869140625, 0.10474586486816406, 0.10917282104492188, 0.11359977722167969, 0.1180267333984375, 0.12245368957519531, 0.12688064575195312, 0.13130760192871094, 0.13573455810546875, 0.14016151428222656, 0.14458847045898438, 0.1490154266357422, 0.1534423828125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 9.0, 7.0, 6.0, 6.0, 12.0, 13.0, 17.0, 23.0, 20.0, 22.0, 22.0, 32.0, 30.0, 24.0, 34.0, 30.0, 26.0, 36.0, 50.0, 37.0, 109.0, 996.0, 44.0, 42.0, 29.0, 22.0, 39.0, 31.0, 38.0, 30.0, 20.0, 24.0, 20.0, 17.0, 23.0, 10.0, 11.0, 18.0, 5.0, 6.0, 7.0, 9.0, 6.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-48.5625, -47.17578125, -45.7890625, -44.40234375, -43.015625, -41.62890625, -40.2421875, -38.85546875, -37.46875, -36.08203125, -34.6953125, -33.30859375, -31.921875, -30.53515625, -29.1484375, -27.76171875, -26.375, -24.98828125, -23.6015625, -22.21484375, -20.828125, -19.44140625, -18.0546875, -16.66796875, -15.28125, -13.89453125, -12.5078125, -11.12109375, -9.734375, -8.34765625, -6.9609375, -5.57421875, -4.1875, -2.80078125, -1.4140625, -0.02734375, 1.359375, 2.74609375, 4.1328125, 5.51953125, 6.90625, 8.29296875, 9.6796875, 11.06640625, 12.453125, 13.83984375, 15.2265625, 16.61328125, 18.0, 19.38671875, 20.7734375, 22.16015625, 23.546875, 24.93359375, 26.3203125, 27.70703125, 29.09375, 30.48046875, 31.8671875, 33.25390625, 34.640625, 36.02734375, 37.4140625, 38.80078125, 40.1875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [6.0, 5.0, 8.0, 11.0, 16.0, 19.0, 26.0, 32.0, 52.0, 77.0, 110.0, 174.0, 243.0, 365.0, 476.0, 734.0, 1050.0, 1617.0, 2465.0, 3703.0, 5842.0, 8940.0, 14045.0, 21850.0, 35297.0, 57644.0, 93337.0, 152964.0, 256885.0, 426407.0, 3758659.0, 551751.0, 351975.0, 210411.0, 126797.0, 77120.0, 47843.0, 30044.0, 18838.0, 11667.0, 7451.0, 4948.0, 3072.0, 2103.0, 1434.0, 967.0, 630.0, 425.0, 263.0, 202.0, 140.0, 97.0, 73.0, 44.0, 38.0, 25.0, 10.0, 10.0, 8.0, 3.0, 0.0, 3.0, 2.0, 3.0], "bins": [-0.12384033203125, -0.11982059478759766, -0.11580085754394531, -0.11178112030029297, -0.10776138305664062, -0.10374164581298828, -0.09972190856933594, -0.0957021713256836, -0.09168243408203125, -0.0876626968383789, -0.08364295959472656, -0.07962322235107422, -0.07560348510742188, -0.07158374786376953, -0.06756401062011719, -0.06354427337646484, -0.0595245361328125, -0.055504798889160156, -0.05148506164550781, -0.04746532440185547, -0.043445587158203125, -0.03942584991455078, -0.03540611267089844, -0.031386375427246094, -0.02736663818359375, -0.023346900939941406, -0.019327163696289062, -0.015307426452636719, -0.011287689208984375, -0.007267951965332031, -0.0032482147216796875, 0.0007715225219726562, 0.004791259765625, 0.008810997009277344, 0.012830734252929688, 0.01685047149658203, 0.020870208740234375, 0.02488994598388672, 0.028909683227539062, 0.032929420471191406, 0.03694915771484375, 0.040968894958496094, 0.04498863220214844, 0.04900836944580078, 0.053028106689453125, 0.05704784393310547, 0.06106758117675781, 0.06508731842041016, 0.0691070556640625, 0.07312679290771484, 0.07714653015136719, 0.08116626739501953, 0.08518600463867188, 0.08920574188232422, 0.09322547912597656, 0.0972452163696289, 0.10126495361328125, 0.1052846908569336, 0.10930442810058594, 0.11332416534423828, 0.11734390258789062, 0.12136363983154297, 0.1253833770751953, 0.12940311431884766, 0.1334228515625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 2.0, 3.0, 5.0, 11.0, 9.0, 9.0, 18.0, 15.0, 17.0, 21.0, 20.0, 31.0, 29.0, 40.0, 29.0, 47.0, 39.0, 51.0, 42.0, 27.0, 1068.0, 49.0, 38.0, 35.0, 40.0, 35.0, 38.0, 33.0, 27.0, 36.0, 20.0, 31.0, 19.0, 20.0, 10.0, 14.0, 13.0, 7.0, 7.0, 7.0, 1.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-41.40625, -40.05029296875, -38.6943359375, -37.33837890625, -35.982421875, -34.62646484375, -33.2705078125, -31.91455078125, -30.55859375, -29.20263671875, -27.8466796875, -26.49072265625, -25.134765625, -23.77880859375, -22.4228515625, -21.06689453125, -19.7109375, -18.35498046875, -16.9990234375, -15.64306640625, -14.287109375, -12.93115234375, -11.5751953125, -10.21923828125, -8.86328125, -7.50732421875, -6.1513671875, -4.79541015625, -3.439453125, -2.08349609375, -0.7275390625, 0.62841796875, 1.984375, 3.34033203125, 4.6962890625, 6.05224609375, 7.408203125, 8.76416015625, 10.1201171875, 11.47607421875, 12.83203125, 14.18798828125, 15.5439453125, 16.89990234375, 18.255859375, 19.61181640625, 20.9677734375, 22.32373046875, 23.6796875, 25.03564453125, 26.3916015625, 27.74755859375, 29.103515625, 30.45947265625, 31.8154296875, 33.17138671875, 34.52734375, 35.88330078125, 37.2392578125, 38.59521484375, 39.951171875, 41.30712890625, 42.6630859375, 44.01904296875, 45.375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 5.0, 7.0, 15.0, 12.0, 19.0, 16.0, 30.0, 33.0, 55.0, 79.0, 81.0, 84.0, 123.0, 112.0, 220.0, 302.0, 494.0, 906.0, 2835.0, 14666.0, 103144.0, 6078680.0, 73373.0, 11474.0, 2382.0, 822.0, 425.0, 264.0, 176.0, 131.0, 114.0, 80.0, 61.0, 38.0, 47.0, 39.0, 26.0, 22.0, 10.0, 14.0, 7.0, 7.0, 4.0, 2.0, 0.0, 3.0], "bins": [-1.408203125, -1.3724822998046875, -1.336761474609375, -1.3010406494140625, -1.26531982421875, -1.2295989990234375, -1.193878173828125, -1.1581573486328125, -1.1224365234375, -1.0867156982421875, -1.050994873046875, -1.0152740478515625, -0.97955322265625, -0.9438323974609375, -0.908111572265625, -0.8723907470703125, -0.836669921875, -0.8009490966796875, -0.765228271484375, -0.7295074462890625, -0.69378662109375, -0.6580657958984375, -0.622344970703125, -0.5866241455078125, -0.5509033203125, -0.5151824951171875, -0.479461669921875, -0.4437408447265625, -0.40802001953125, -0.3722991943359375, -0.336578369140625, -0.3008575439453125, -0.26513671875, -0.2294158935546875, -0.193695068359375, -0.1579742431640625, -0.12225341796875, -0.0865325927734375, -0.050811767578125, -0.0150909423828125, 0.0206298828125, 0.0563507080078125, 0.092071533203125, 0.1277923583984375, 0.16351318359375, 0.1992340087890625, 0.234954833984375, 0.2706756591796875, 0.306396484375, 0.3421173095703125, 0.377838134765625, 0.4135589599609375, 0.44927978515625, 0.4850006103515625, 0.520721435546875, 0.5564422607421875, 0.5921630859375, 0.6278839111328125, 0.663604736328125, 0.6993255615234375, 0.73504638671875, 0.7707672119140625, 0.806488037109375, 0.8422088623046875, 0.8779296875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 5.0, 5.0, 7.0, 9.0, 17.0, 23.0, 20.0, 24.0, 32.0, 28.0, 27.0, 38.0, 41.0, 34.0, 57.0, 51.0, 47.0, 67.0, 1047.0, 59.0, 48.0, 37.0, 41.0, 36.0, 41.0, 21.0, 34.0, 26.0, 18.0, 17.0, 17.0, 12.0, 9.0, 13.0, 5.0, 4.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.96875, -40.864990234375, -39.76123046875, -38.657470703125, -37.5537109375, -36.449951171875, -35.34619140625, -34.242431640625, -33.138671875, -32.034912109375, -30.93115234375, -29.827392578125, -28.7236328125, -27.619873046875, -26.51611328125, -25.412353515625, -24.30859375, -23.204833984375, -22.10107421875, -20.997314453125, -19.8935546875, -18.789794921875, -17.68603515625, -16.582275390625, -15.478515625, -14.374755859375, -13.27099609375, -12.167236328125, -11.0634765625, -9.959716796875, -8.85595703125, -7.752197265625, -6.6484375, -5.544677734375, -4.44091796875, -3.337158203125, -2.2333984375, -1.129638671875, -0.02587890625, 1.077880859375, 2.181640625, 3.285400390625, 4.38916015625, 5.492919921875, 6.5966796875, 7.700439453125, 8.80419921875, 9.907958984375, 11.01171875, 12.115478515625, 13.21923828125, 14.322998046875, 15.4267578125, 16.530517578125, 17.63427734375, 18.738037109375, 19.841796875, 20.945556640625, 22.04931640625, 23.153076171875, 24.2568359375, 25.360595703125, 26.46435546875, 27.568115234375, 28.671875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [4.0, 6.0, 865.0, 130.0, 10.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.044088363647461, -7.142311096191406, -3.2405333518981934, 0.6612443923950195, 4.563021659851074, 8.464799880981445, 12.3665771484375, 16.268354415893555, 20.17013168334961, 24.071908950805664, 27.97368621826172, 31.875465393066406, 35.77724075317383, 39.679019927978516, 43.58079528808594, 47.482574462890625, 51.38435363769531, 55.2861328125, 59.18790817260742, 63.08968734741211, 66.99146270751953, 70.89324188232422, 74.7950210571289, 78.69679260253906, 82.59857177734375, 86.50035095214844, 90.40213012695312, 94.30390167236328, 98.20568084716797, 102.10746002197266, 106.00923919677734, 109.9110107421875, 113.81279754638672, 117.7145767211914, 121.6163558959961, 125.51812744140625, 129.41990661621094, 133.32168579101562, 137.2234649658203, 141.125244140625, 145.0270233154297, 148.92880249023438, 152.83058166503906, 156.73236083984375, 160.63414001464844, 164.53591918945312, 168.43768310546875, 172.33946228027344, 176.24124145507812, 180.1430206298828, 184.0447998046875, 187.9465789794922, 191.84835815429688, 195.7501220703125, 199.6519012451172, 203.55368041992188, 207.45545959472656, 211.35723876953125, 215.25901794433594, 219.16079711914062, 223.0625762939453, 226.96435546875, 230.86611938476562, 234.7678985595703, 238.669677734375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 5.0, 3.0, 4.0, 4.0, 5.0, 13.0, 5.0, 16.0, 9.0, 6.0, 26.0, 19.0, 18.0, 26.0, 25.0, 30.0, 25.0, 34.0, 21.0, 49.0, 41.0, 37.0, 47.0, 35.0, 37.0, 54.0, 41.0, 34.0, 41.0, 34.0, 32.0, 32.0, 33.0, 26.0, 20.0, 17.0, 15.0, 13.0, 10.0, 26.0, 3.0, 10.0, 7.0, 0.0, 2.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-44.79846954345703, -43.307960510253906, -41.81745529174805, -40.32694625854492, -38.83644104003906, -37.34593200683594, -35.85542297363281, -34.36491775512695, -32.87440872192383, -31.383901596069336, -29.893394470214844, -28.40288543701172, -26.912378311157227, -25.421871185302734, -23.931364059448242, -22.44085693359375, -20.950349807739258, -19.459842681884766, -17.969335556030273, -16.47882843017578, -14.988319396972656, -13.497812271118164, -12.007305145263672, -10.516797065734863, -9.026289939880371, -7.535782337188721, -6.04527473449707, -4.554767608642578, -3.0642600059509277, -1.5737524032592773, -0.08324527740478516, 1.4072628021240234, 2.8977699279785156, 4.388277530670166, 5.878785133361816, 7.369292259216309, 8.859800338745117, 10.35030746459961, 11.840814590454102, 13.33132266998291, 14.821829795837402, 16.31233787536621, 17.802845001220703, 19.293352127075195, 20.783859252929688, 22.274368286132812, 23.764873504638672, 25.255382537841797, 26.74588966369629, 28.23639678955078, 29.726903915405273, 31.217411041259766, 32.70792007446289, 34.19842529296875, 35.688934326171875, 37.179443359375, 38.66994857788086, 40.160457611083984, 41.650962829589844, 43.14147186279297, 44.63197708129883, 46.12248611450195, 47.61299133300781, 49.10350036621094, 50.59400939941406]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 4.0, 3.0, 6.0, 1.0, 13.0, 10.0, 3.0, 2.0, 12.0, 6.0, 13.0, 10.0, 19.0, 15.0, 18.0, 32.0, 33.0, 46.0, 59.0, 113.0, 146.0, 239.0, 949.0, 5480.0, 40906.0, 4125321.0, 14530.0, 4733.0, 843.0, 359.0, 89.0, 68.0, 42.0, 40.0, 21.0, 17.0, 18.0, 25.0, 7.0, 3.0, 6.0, 6.0, 9.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 6.0], "bins": [-0.05975341796875, -0.0581507682800293, -0.056548118591308594, -0.05494546890258789, -0.05334281921386719, -0.051740169525146484, -0.05013751983642578, -0.04853487014770508, -0.046932220458984375, -0.04532957077026367, -0.04372692108154297, -0.042124271392822266, -0.04052162170410156, -0.03891897201538086, -0.037316322326660156, -0.03571367263793945, -0.03411102294921875, -0.03250837326049805, -0.030905723571777344, -0.02930307388305664, -0.027700424194335938, -0.026097774505615234, -0.02449512481689453, -0.022892475128173828, -0.021289825439453125, -0.019687175750732422, -0.01808452606201172, -0.016481876373291016, -0.014879226684570312, -0.01327657699584961, -0.011673927307128906, -0.010071277618408203, -0.0084686279296875, -0.006865978240966797, -0.005263328552246094, -0.0036606788635253906, -0.0020580291748046875, -0.0004553794860839844, 0.0011472702026367188, 0.002749919891357422, 0.004352569580078125, 0.005955219268798828, 0.007557868957519531, 0.009160518646240234, 0.010763168334960938, 0.01236581802368164, 0.013968467712402344, 0.015571117401123047, 0.01717376708984375, 0.018776416778564453, 0.020379066467285156, 0.02198171615600586, 0.023584365844726562, 0.025187015533447266, 0.02678966522216797, 0.028392314910888672, 0.029994964599609375, 0.03159761428833008, 0.03320026397705078, 0.034802913665771484, 0.03640556335449219, 0.03800821304321289, 0.039610862731933594, 0.0412135124206543, 0.042816162109375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 4.0, 3.0, 6.0, 14.0, 5.0, 11.0, 14.0, 22.0, 784.0, 30.0, 16.0, 14.0, 11.0, 2.0, 11.0, 7.0, 4.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.039825439453125, -0.03876519203186035, -0.0377049446105957, -0.036644697189331055, -0.035584449768066406, -0.03452420234680176, -0.03346395492553711, -0.03240370750427246, -0.03134346008300781, -0.030283212661743164, -0.029222965240478516, -0.028162717819213867, -0.02710247039794922, -0.02604222297668457, -0.024981975555419922, -0.023921728134155273, -0.022861480712890625, -0.021801233291625977, -0.020740985870361328, -0.01968073844909668, -0.01862049102783203, -0.017560243606567383, -0.016499996185302734, -0.015439748764038086, -0.014379501342773438, -0.013319253921508789, -0.01225900650024414, -0.011198759078979492, -0.010138511657714844, -0.009078264236450195, -0.008018016815185547, -0.0069577693939208984, -0.00589752197265625, -0.0048372745513916016, -0.003777027130126953, -0.0027167797088623047, -0.0016565322875976562, -0.0005962848663330078, 0.0004639625549316406, 0.001524209976196289, 0.0025844573974609375, 0.003644704818725586, 0.004704952239990234, 0.005765199661254883, 0.006825447082519531, 0.00788569450378418, 0.008945941925048828, 0.010006189346313477, 0.011066436767578125, 0.012126684188842773, 0.013186931610107422, 0.01424717903137207, 0.015307426452636719, 0.016367673873901367, 0.017427921295166016, 0.018488168716430664, 0.019548416137695312, 0.02060866355895996, 0.02166891098022461, 0.022729158401489258, 0.023789405822753906, 0.024849653244018555, 0.025909900665283203, 0.02697014808654785, 0.0280303955078125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 2.0, 6.0, 7.0, 5.0, 17.0, 17.0, 20.0, 57.0, 125.0, 493.0, 3425.0, 4135649.0, 52308.0, 1633.0, 287.0, 92.0, 43.0, 32.0, 15.0, 8.0, 7.0, 5.0, 12.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.206298828125, -0.2000255584716797, -0.19375228881835938, -0.18747901916503906, -0.18120574951171875, -0.17493247985839844, -0.16865921020507812, -0.1623859405517578, -0.1561126708984375, -0.1498394012451172, -0.14356613159179688, -0.13729286193847656, -0.13101959228515625, -0.12474632263183594, -0.11847305297851562, -0.11219978332519531, -0.105926513671875, -0.09965324401855469, -0.09337997436523438, -0.08710670471191406, -0.08083343505859375, -0.07456016540527344, -0.06828689575195312, -0.06201362609863281, -0.0557403564453125, -0.04946708679199219, -0.043193817138671875, -0.03692054748535156, -0.03064727783203125, -0.024374008178710938, -0.018100738525390625, -0.011827468872070312, -0.00555419921875, 0.0007190704345703125, 0.006992340087890625, 0.013265609741210938, 0.01953887939453125, 0.025812149047851562, 0.032085418701171875, 0.03835868835449219, 0.0446319580078125, 0.05090522766113281, 0.057178497314453125, 0.06345176696777344, 0.06972503662109375, 0.07599830627441406, 0.08227157592773438, 0.08854484558105469, 0.094818115234375, 0.10109138488769531, 0.10736465454101562, 0.11363792419433594, 0.11991119384765625, 0.12618446350097656, 0.13245773315429688, 0.1387310028076172, 0.1450042724609375, 0.1512775421142578, 0.15755081176757812, 0.16382408142089844, 0.17009735107421875, 0.17637062072753906, 0.18264389038085938, 0.1889171600341797, 0.1951904296875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 8.0, 9.0, 6.0, 7.0, 16.0, 23.0, 117.0, 2959.0, 783.0, 76.0, 17.0, 7.0, 11.0, 10.0, 3.0, 1.0, 4.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0738525390625, -0.07160663604736328, -0.06936073303222656, -0.06711483001708984, -0.06486892700195312, -0.0626230239868164, -0.06037712097167969, -0.05813121795654297, -0.05588531494140625, -0.05363941192626953, -0.05139350891113281, -0.049147605895996094, -0.046901702880859375, -0.044655799865722656, -0.04240989685058594, -0.04016399383544922, -0.0379180908203125, -0.03567218780517578, -0.03342628479003906, -0.031180381774902344, -0.028934478759765625, -0.026688575744628906, -0.024442672729492188, -0.02219676971435547, -0.01995086669921875, -0.01770496368408203, -0.015459060668945312, -0.013213157653808594, -0.010967254638671875, -0.008721351623535156, -0.0064754486083984375, -0.004229545593261719, -0.001983642578125, 0.00026226043701171875, 0.0025081634521484375, 0.004754066467285156, 0.006999969482421875, 0.009245872497558594, 0.011491775512695312, 0.013737678527832031, 0.01598358154296875, 0.01822948455810547, 0.020475387573242188, 0.022721290588378906, 0.024967193603515625, 0.027213096618652344, 0.029458999633789062, 0.03170490264892578, 0.0339508056640625, 0.03619670867919922, 0.03844261169433594, 0.040688514709472656, 0.042934417724609375, 0.045180320739746094, 0.04742622375488281, 0.04967212677001953, 0.05191802978515625, 0.05416393280029297, 0.05640983581542969, 0.058655738830566406, 0.060901641845703125, 0.06314754486083984, 0.06539344787597656, 0.06763935089111328, 0.06988525390625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 199.0, 813.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10257516801357269, -0.08216091245412827, -0.06174665316939354, -0.041332393884658813, -0.020918138325214386, -0.0005038827657699585, 0.019910380244255066, 0.040324628353118896, 0.06073889136314392, 0.08115314692258835, 0.10156740248203278, 0.1219816654920578, 0.14239591360092163, 0.16281017661094666, 0.18322443962097168, 0.2036386877298355, 0.22405295073986053, 0.24446721374988556, 0.2648814618587494, 0.2852957248687744, 0.30570998787879944, 0.32612425088882446, 0.3465384840965271, 0.3669527471065521, 0.38736701011657715, 0.4077812731266022, 0.4281955361366272, 0.44860976934432983, 0.46902403235435486, 0.4894382953643799, 0.5098525285720825, 0.5302668213844299, 0.5506810545921326, 0.5710952877998352, 0.5915095806121826, 0.6119238138198853, 0.6323381066322327, 0.6527523398399353, 0.6731666326522827, 0.6935808658599854, 0.713995099067688, 0.7344093322753906, 0.754823625087738, 0.7752378582954407, 0.7956521511077881, 0.8160663843154907, 0.8364806175231934, 0.8568949103355408, 0.8773092031478882, 0.8977234363555908, 0.9181377291679382, 0.9385519623756409, 0.9589662551879883, 0.9793804883956909, 0.9997947216033936, 1.0202089548110962, 1.0406231880187988, 1.0610374212265015, 1.081451654434204, 1.1018660068511963, 1.122280240058899, 1.1426944732666016, 1.1631087064743042, 1.1835229396820068, 1.203937292098999]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 3.0, 3.0, 7.0, 7.0, 12.0, 14.0, 13.0, 27.0, 28.0, 45.0, 61.0, 73.0, 98.0, 96.0, 107.0, 77.0, 70.0, 51.0, 54.0, 27.0, 20.0, 19.0, 12.0, 12.0, 5.0, 3.0, 4.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1507476568222046, -0.14573675394058228, -0.14072585105895996, -0.13571494817733765, -0.13070404529571533, -0.12569314241409302, -0.1206822395324707, -0.11567133665084839, -0.11066043376922607, -0.10564953088760376, -0.10063862800598145, -0.09562772512435913, -0.09061682224273682, -0.0856059193611145, -0.08059501647949219, -0.07558411359786987, -0.07057321071624756, -0.06556230783462524, -0.06055140495300293, -0.055540502071380615, -0.0505295991897583, -0.045518696308135986, -0.04050779342651367, -0.03549689054489136, -0.030485987663269043, -0.02547508478164673, -0.020464181900024414, -0.0154532790184021, -0.010442376136779785, -0.005431473255157471, -0.00042057037353515625, 0.004590332508087158, 0.009601235389709473, 0.014612138271331787, 0.0196230411529541, 0.024633944034576416, 0.02964484691619873, 0.034655749797821045, 0.03966665267944336, 0.044677555561065674, 0.04968845844268799, 0.0546993613243103, 0.05971026420593262, 0.06472116708755493, 0.06973206996917725, 0.07474297285079956, 0.07975387573242188, 0.08476477861404419, 0.0897756814956665, 0.09478658437728882, 0.09979748725891113, 0.10480839014053345, 0.10981929302215576, 0.11483019590377808, 0.11984109878540039, 0.1248520016670227, 0.12986290454864502, 0.13487380743026733, 0.13988471031188965, 0.14489561319351196, 0.14990651607513428, 0.1549174189567566, 0.1599283218383789, 0.16493922472000122, 0.16995012760162354]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 7.0, 6.0, 12.0, 22.0, 28.0, 44.0, 41.0, 80.0, 93.0, 167.0, 255.0, 349.0, 504.0, 732.0, 1141.0, 1669.0, 2501.0, 4071.0, 7484.0, 16762.0, 82994.0, 887604.0, 20237.0, 8670.0, 4663.0, 2757.0, 1921.0, 1223.0, 806.0, 532.0, 360.0, 281.0, 171.0, 113.0, 76.0, 63.0, 29.0, 30.0, 20.0, 5.0, 11.0, 6.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052642822265625, -0.05100297927856445, -0.049363136291503906, -0.04772329330444336, -0.04608345031738281, -0.044443607330322266, -0.04280376434326172, -0.04116392135620117, -0.039524078369140625, -0.03788423538208008, -0.03624439239501953, -0.034604549407958984, -0.03296470642089844, -0.03132486343383789, -0.029685020446777344, -0.028045177459716797, -0.02640533447265625, -0.024765491485595703, -0.023125648498535156, -0.02148580551147461, -0.019845962524414062, -0.018206119537353516, -0.01656627655029297, -0.014926433563232422, -0.013286590576171875, -0.011646747589111328, -0.010006904602050781, -0.008367061614990234, -0.0067272186279296875, -0.005087375640869141, -0.0034475326538085938, -0.0018076896667480469, -0.0001678466796875, 0.0014719963073730469, 0.0031118392944335938, 0.004751682281494141, 0.0063915252685546875, 0.008031368255615234, 0.009671211242675781, 0.011311054229736328, 0.012950897216796875, 0.014590740203857422, 0.01623058319091797, 0.017870426177978516, 0.019510269165039062, 0.02115011215209961, 0.022789955139160156, 0.024429798126220703, 0.02606964111328125, 0.027709484100341797, 0.029349327087402344, 0.03098917007446289, 0.03262901306152344, 0.034268856048583984, 0.03590869903564453, 0.03754854202270508, 0.039188385009765625, 0.04082822799682617, 0.04246807098388672, 0.044107913970947266, 0.04574775695800781, 0.04738759994506836, 0.049027442932128906, 0.05066728591918945, 0.05230712890625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 8.0, 12.0, 6.0, 12.0, 14.0, 21.0, 777.0, 34.0, 19.0, 9.0, 16.0, 4.0, 10.0, 5.0, 5.0, 4.0, 3.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.039459228515625, -0.03840994834899902, -0.03736066818237305, -0.03631138801574707, -0.035262107849121094, -0.03421282768249512, -0.03316354751586914, -0.032114267349243164, -0.031064987182617188, -0.03001570701599121, -0.028966426849365234, -0.027917146682739258, -0.02686786651611328, -0.025818586349487305, -0.024769306182861328, -0.02372002601623535, -0.022670745849609375, -0.0216214656829834, -0.020572185516357422, -0.019522905349731445, -0.01847362518310547, -0.017424345016479492, -0.016375064849853516, -0.015325784683227539, -0.014276504516601562, -0.013227224349975586, -0.01217794418334961, -0.011128664016723633, -0.010079383850097656, -0.00903010368347168, -0.007980823516845703, -0.0069315433502197266, -0.00588226318359375, -0.0048329830169677734, -0.003783702850341797, -0.0027344226837158203, -0.0016851425170898438, -0.0006358623504638672, 0.0004134178161621094, 0.001462697982788086, 0.0025119781494140625, 0.003561258316040039, 0.004610538482666016, 0.005659818649291992, 0.006709098815917969, 0.007758378982543945, 0.008807659149169922, 0.009856939315795898, 0.010906219482421875, 0.011955499649047852, 0.013004779815673828, 0.014054059982299805, 0.015103340148925781, 0.016152620315551758, 0.017201900482177734, 0.01825118064880371, 0.019300460815429688, 0.020349740982055664, 0.02139902114868164, 0.022448301315307617, 0.023497581481933594, 0.02454686164855957, 0.025596141815185547, 0.026645421981811523, 0.0276947021484375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 3.0, 5.0, 2.0, 9.0, 12.0, 10.0, 17.0, 21.0, 21.0, 22.0, 24.0, 41.0, 46.0, 77.0, 89.0, 98.0, 137.0, 209.0, 353.0, 725.0, 1782.0, 6859.0, 49689.0, 875778.0, 97874.0, 10133.0, 2392.0, 808.0, 392.0, 242.0, 150.0, 118.0, 81.0, 73.0, 55.0, 35.0, 28.0, 29.0, 19.0, 24.0, 19.0, 6.0, 12.0, 12.0, 1.0, 5.0, 5.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.08428955078125, -0.08162403106689453, -0.07895851135253906, -0.0762929916381836, -0.07362747192382812, -0.07096195220947266, -0.06829643249511719, -0.06563091278076172, -0.06296539306640625, -0.06029987335205078, -0.05763435363769531, -0.054968833923339844, -0.052303314208984375, -0.049637794494628906, -0.04697227478027344, -0.04430675506591797, -0.0416412353515625, -0.03897571563720703, -0.03631019592285156, -0.033644676208496094, -0.030979156494140625, -0.028313636779785156, -0.025648117065429688, -0.02298259735107422, -0.02031707763671875, -0.01765155792236328, -0.014986038208007812, -0.012320518493652344, -0.009654998779296875, -0.006989479064941406, -0.0043239593505859375, -0.0016584396362304688, 0.001007080078125, 0.0036725997924804688, 0.0063381195068359375, 0.009003639221191406, 0.011669158935546875, 0.014334678649902344, 0.017000198364257812, 0.01966571807861328, 0.02233123779296875, 0.02499675750732422, 0.027662277221679688, 0.030327796936035156, 0.032993316650390625, 0.035658836364746094, 0.03832435607910156, 0.04098987579345703, 0.0436553955078125, 0.04632091522216797, 0.04898643493652344, 0.051651954650878906, 0.054317474365234375, 0.056982994079589844, 0.05964851379394531, 0.06231403350830078, 0.06497955322265625, 0.06764507293701172, 0.07031059265136719, 0.07297611236572266, 0.07564163208007812, 0.0783071517944336, 0.08097267150878906, 0.08363819122314453, 0.0863037109375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 3.0, 5.0, 2.0, 8.0, 10.0, 8.0, 11.0, 14.0, 14.0, 12.0, 13.0, 20.0, 21.0, 28.0, 28.0, 28.0, 23.0, 28.0, 33.0, 41.0, 30.0, 37.0, 45.0, 43.0, 39.0, 39.0, 36.0, 24.0, 31.0, 32.0, 37.0, 39.0, 23.0, 31.0, 27.0, 15.0, 14.0, 17.0, 11.0, 17.0, 15.0, 5.0, 10.0, 12.0, 1.0, 5.0, 5.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.11431884765625, -0.1107034683227539, -0.10708808898925781, -0.10347270965576172, -0.09985733032226562, -0.09624195098876953, -0.09262657165527344, -0.08901119232177734, -0.08539581298828125, -0.08178043365478516, -0.07816505432128906, -0.07454967498779297, -0.07093429565429688, -0.06731891632080078, -0.06370353698730469, -0.060088157653808594, -0.0564727783203125, -0.052857398986816406, -0.04924201965332031, -0.04562664031982422, -0.042011260986328125, -0.03839588165283203, -0.03478050231933594, -0.031165122985839844, -0.02754974365234375, -0.023934364318847656, -0.020318984985351562, -0.01670360565185547, -0.013088226318359375, -0.009472846984863281, -0.0058574676513671875, -0.0022420883178710938, 0.001373291015625, 0.004988670349121094, 0.008604049682617188, 0.012219429016113281, 0.015834808349609375, 0.01945018768310547, 0.023065567016601562, 0.026680946350097656, 0.03029632568359375, 0.033911705017089844, 0.03752708435058594, 0.04114246368408203, 0.044757843017578125, 0.04837322235107422, 0.05198860168457031, 0.055603981018066406, 0.0592193603515625, 0.0628347396850586, 0.06645011901855469, 0.07006549835205078, 0.07368087768554688, 0.07729625701904297, 0.08091163635253906, 0.08452701568603516, 0.08814239501953125, 0.09175777435302734, 0.09537315368652344, 0.09898853302001953, 0.10260391235351562, 0.10621929168701172, 0.10983467102050781, 0.1134500503540039, 0.1170654296875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 7.0, 8.0, 11.0, 18.0, 23.0, 38.0, 45.0, 88.0, 128.0, 212.0, 397.0, 657.0, 1463.0, 3299.0, 10731.0, 61425.0, 857913.0, 92147.0, 12658.0, 3900.0, 1633.0, 733.0, 399.0, 215.0, 149.0, 79.0, 48.0, 44.0, 21.0, 16.0, 15.0, 6.0, 4.0, 9.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.100271224975586e-05, -7.865950465202332e-05, -7.631629705429077e-05, -7.397308945655823e-05, -7.162988185882568e-05, -6.928667426109314e-05, -6.69434666633606e-05, -6.460025906562805e-05, -6.225705146789551e-05, -5.9913843870162964e-05, -5.757063627243042e-05, -5.5227428674697876e-05, -5.288422107696533e-05, -5.054101347923279e-05, -4.8197805881500244e-05, -4.58545982837677e-05, -4.3511390686035156e-05, -4.116818308830261e-05, -3.882497549057007e-05, -3.6481767892837524e-05, -3.413856029510498e-05, -3.1795352697372437e-05, -2.9452145099639893e-05, -2.710893750190735e-05, -2.4765729904174805e-05, -2.242252230644226e-05, -2.0079314708709717e-05, -1.7736107110977173e-05, -1.539289951324463e-05, -1.3049691915512085e-05, -1.0706484317779541e-05, -8.363276720046997e-06, -6.020069122314453e-06, -3.676861524581909e-06, -1.3336539268493652e-06, 1.0095536708831787e-06, 3.3527612686157227e-06, 5.695968866348267e-06, 8.03917646408081e-06, 1.0382384061813354e-05, 1.2725591659545898e-05, 1.5068799257278442e-05, 1.7412006855010986e-05, 1.975521445274353e-05, 2.2098422050476074e-05, 2.4441629648208618e-05, 2.6784837245941162e-05, 2.9128044843673706e-05, 3.147125244140625e-05, 3.3814460039138794e-05, 3.615766763687134e-05, 3.850087523460388e-05, 4.0844082832336426e-05, 4.318729043006897e-05, 4.5530498027801514e-05, 4.787370562553406e-05, 5.02169132232666e-05, 5.2560120820999146e-05, 5.490332841873169e-05, 5.7246536016464233e-05, 5.958974361419678e-05, 6.193295121192932e-05, 6.427615880966187e-05, 6.661936640739441e-05, 6.896257400512695e-05]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 9.0, 4.0, 2.0, 5.0, 3.0, 11.0, 11.0, 9.0, 9.0, 13.0, 12.0, 38.0, 15.0, 27.0, 19.0, 19.0, 55.0, 29.0, 22.0, 31.0, 34.0, 86.0, 40.0, 34.0, 38.0, 28.0, 19.0, 63.0, 27.0, 32.0, 33.0, 29.0, 53.0, 14.0, 15.0, 20.0, 19.0, 18.0, 9.0, 8.0, 6.0, 7.0, 4.0, 12.0, 3.0, 8.0, 1.0, 2.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.0265579223632812e-06, -1.955777406692505e-06, -1.8849968910217285e-06, -1.8142163753509521e-06, -1.7434358596801758e-06, -1.6726553440093994e-06, -1.601874828338623e-06, -1.5310943126678467e-06, -1.4603137969970703e-06, -1.389533281326294e-06, -1.3187527656555176e-06, -1.2479722499847412e-06, -1.1771917343139648e-06, -1.1064112186431885e-06, -1.0356307029724121e-06, -9.648501873016357e-07, -8.940696716308594e-07, -8.23289155960083e-07, -7.525086402893066e-07, -6.817281246185303e-07, -6.109476089477539e-07, -5.401670932769775e-07, -4.6938657760620117e-07, -3.986060619354248e-07, -3.2782554626464844e-07, -2.5704503059387207e-07, -1.862645149230957e-07, -1.1548399925231934e-07, -4.470348358154297e-08, 2.60770320892334e-08, 9.685754776000977e-08, 1.6763806343078613e-07, 2.384185791015625e-07, 3.0919909477233887e-07, 3.7997961044311523e-07, 4.507601261138916e-07, 5.21540641784668e-07, 5.923211574554443e-07, 6.631016731262207e-07, 7.338821887969971e-07, 8.046627044677734e-07, 8.754432201385498e-07, 9.462237358093262e-07, 1.0170042514801025e-06, 1.087784767150879e-06, 1.1585652828216553e-06, 1.2293457984924316e-06, 1.300126314163208e-06, 1.3709068298339844e-06, 1.4416873455047607e-06, 1.5124678611755371e-06, 1.5832483768463135e-06, 1.6540288925170898e-06, 1.7248094081878662e-06, 1.7955899238586426e-06, 1.866370439529419e-06, 1.9371509552001953e-06, 2.0079314708709717e-06, 2.078711986541748e-06, 2.1494925022125244e-06, 2.2202730178833008e-06, 2.291053533554077e-06, 2.3618340492248535e-06, 2.43261456489563e-06, 2.5033950805664062e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 10.0, 14.0, 17.0, 15.0, 36.0, 36.0, 60.0, 120.0, 197.0, 340.0, 971.0, 3924.0, 81564.0, 944430.0, 13864.0, 1800.0, 493.0, 238.0, 150.0, 73.0, 58.0, 38.0, 34.0, 16.0, 13.0, 5.0, 7.0, 6.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.967782974243164e-05, -6.721261888742447e-05, -6.47474080324173e-05, -6.228219717741013e-05, -5.9816986322402954e-05, -5.735177546739578e-05, -5.488656461238861e-05, -5.242135375738144e-05, -4.995614290237427e-05, -4.7490932047367096e-05, -4.5025721192359924e-05, -4.256051033735275e-05, -4.009529948234558e-05, -3.763008862733841e-05, -3.516487777233124e-05, -3.2699666917324066e-05, -3.0234456062316895e-05, -2.7769245207309723e-05, -2.530403435230255e-05, -2.283882349729538e-05, -2.0373612642288208e-05, -1.7908401787281036e-05, -1.5443190932273865e-05, -1.2977980077266693e-05, -1.0512769222259521e-05, -8.04755836725235e-06, -5.582347512245178e-06, -3.1171366572380066e-06, -6.51925802230835e-07, 1.8132850527763367e-06, 4.278495907783508e-06, 6.74370676279068e-06, 9.208917617797852e-06, 1.1674128472805023e-05, 1.4139339327812195e-05, 1.6604550182819366e-05, 1.9069761037826538e-05, 2.153497189283371e-05, 2.400018274784088e-05, 2.6465393602848053e-05, 2.8930604457855225e-05, 3.1395815312862396e-05, 3.386102616786957e-05, 3.632623702287674e-05, 3.879144787788391e-05, 4.125665873289108e-05, 4.3721869587898254e-05, 4.6187080442905426e-05, 4.86522912979126e-05, 5.111750215291977e-05, 5.358271300792694e-05, 5.604792386293411e-05, 5.8513134717941284e-05, 6.0978345572948456e-05, 6.344355642795563e-05, 6.59087672829628e-05, 6.837397813796997e-05, 7.083918899297714e-05, 7.330439984798431e-05, 7.576961070299149e-05, 7.823482155799866e-05, 8.070003241300583e-05, 8.3165243268013e-05, 8.563045412302017e-05, 8.809566497802734e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 5.0, 9.0, 11.0, 9.0, 25.0, 18.0, 22.0, 46.0, 42.0, 54.0, 69.0, 76.0, 83.0, 74.0, 69.0, 81.0, 49.0, 45.0, 63.0, 27.0, 31.0, 20.0, 25.0, 9.0, 13.0, 4.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.429454803466797e-05, -9.09566879272461e-05, -8.761882781982422e-05, -8.428096771240234e-05, -8.094310760498047e-05, -7.76052474975586e-05, -7.426738739013672e-05, -7.092952728271484e-05, -6.759166717529297e-05, -6.42538070678711e-05, -6.091594696044922e-05, -5.7578086853027344e-05, -5.424022674560547e-05, -5.0902366638183594e-05, -4.756450653076172e-05, -4.4226646423339844e-05, -4.088878631591797e-05, -3.7550926208496094e-05, -3.421306610107422e-05, -3.0875205993652344e-05, -2.753734588623047e-05, -2.4199485778808594e-05, -2.086162567138672e-05, -1.7523765563964844e-05, -1.4185905456542969e-05, -1.0848045349121094e-05, -7.510185241699219e-06, -4.172325134277344e-06, -8.344650268554688e-07, 2.5033950805664062e-06, 5.841255187988281e-06, 9.179115295410156e-06, 1.2516975402832031e-05, 1.5854835510253906e-05, 1.919269561767578e-05, 2.2530555725097656e-05, 2.586841583251953e-05, 2.9206275939941406e-05, 3.254413604736328e-05, 3.5881996154785156e-05, 3.921985626220703e-05, 4.2557716369628906e-05, 4.589557647705078e-05, 4.9233436584472656e-05, 5.257129669189453e-05, 5.5909156799316406e-05, 5.924701690673828e-05, 6.258487701416016e-05, 6.592273712158203e-05, 6.92605972290039e-05, 7.259845733642578e-05, 7.593631744384766e-05, 7.927417755126953e-05, 8.26120376586914e-05, 8.594989776611328e-05, 8.928775787353516e-05, 9.262561798095703e-05, 9.59634780883789e-05, 9.930133819580078e-05, 0.00010263919830322266, 0.00010597705841064453, 0.0001093149185180664, 0.00011265277862548828, 0.00011599063873291016, 0.00011932849884033203]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 9.0, 992.0, 17.0, 2.0, 1.0], "bins": [-11.061187744140625, -10.87851619720459, -10.695844650268555, -10.51317310333252, -10.330501556396484, -10.147829055786133, -9.965157508850098, -9.782485961914062, -9.599814414978027, -9.417142868041992, -9.234471321105957, -9.051799774169922, -8.869128227233887, -8.686455726623535, -8.5037841796875, -8.321112632751465, -8.13844108581543, -7.9557695388793945, -7.773097991943359, -7.590425968170166, -7.407754421234131, -7.225082874298096, -7.0424113273620605, -6.859739303588867, -6.67706823348999, -6.494396686553955, -6.31172513961792, -6.129053115844727, -5.946381568908691, -5.763710021972656, -5.581038475036621, -5.398366928100586, -5.215694904327393, -5.033023357391357, -4.850351810455322, -4.667679786682129, -4.485008239746094, -4.302336692810059, -4.119665145874023, -3.936993360519409, -3.754321813583374, -3.571650266647339, -3.3889784812927246, -3.2063069343566895, -3.023635149002075, -2.84096360206604, -2.658291816711426, -2.4756202697753906, -2.2929487228393555, -2.1102771759033203, -1.927605390548706, -1.744933843612671, -1.5622620582580566, -1.3795905113220215, -1.1969188451766968, -1.014247179031372, -0.8315754532814026, -0.6489037871360779, -0.46623215079307556, -0.28356051445007324, -0.10088884830474854, 0.08178281784057617, 0.2644544243812561, 0.4471260905265808, 0.6297977566719055]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 6.0, 6.0, 5.0, 2.0, 7.0, 8.0, 15.0, 9.0, 29.0, 40.0, 59.0, 101.0, 146.0, 190.0, 134.0, 69.0, 48.0, 39.0, 13.0, 4.0, 14.0, 7.0, 5.0, 4.0, 4.0, 11.0, 4.0, 4.0, 4.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9148207902908325, -1.8361753225326538, -1.757529854774475, -1.6788843870162964, -1.6002390384674072, -1.5215935707092285, -1.4429481029510498, -1.364302635192871, -1.2856571674346924, -1.2070116996765137, -1.128366231918335, -1.0497207641601562, -0.9710753560066223, -0.8924298882484436, -0.8137844800949097, -0.735139012336731, -0.6564935445785522, -0.5778480768203735, -0.4992026388645172, -0.4205572009086609, -0.3419117331504822, -0.26326626539230347, -0.18462082743644714, -0.10597538948059082, -0.02732992172241211, 0.05131553113460541, 0.12996098399162292, 0.20860643684864044, 0.28725188970565796, 0.36589735746383667, 0.444542795419693, 0.5231882333755493, 0.6018338203430176, 0.6804792881011963, 0.759124755859375, 0.8377701640129089, 0.9164156317710876, 0.9950610995292664, 1.0737065076828003, 1.152351975440979, 1.2309974431991577, 1.3096429109573364, 1.3882883787155151, 1.4669338464736938, 1.545579195022583, 1.6242246627807617, 1.7028701305389404, 1.7815155982971191, 1.8601610660552979, 1.9388065338134766, 2.0174520015716553, 2.096097469329834, 2.1747429370880127, 2.2533884048461914, 2.33203387260437, 2.410679340362549, 2.4893245697021484, 2.567970037460327, 2.646615505218506, 2.7252609729766846, 2.8039064407348633, 2.882551908493042, 2.9611973762512207, 3.0398426055908203, 3.118488311767578]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 6.0, 9.0, 14.0, 16.0, 32.0, 62.0, 130.0, 387.0, 1254.0, 5322.0, 4175431.0, 9771.0, 1300.0, 306.0, 101.0, 41.0, 23.0, 14.0, 14.0, 6.0, 6.0, 4.0, 5.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.61669921875, -0.5998649597167969, -0.5830307006835938, -0.5661964416503906, -0.5493621826171875, -0.5325279235839844, -0.5156936645507812, -0.4988594055175781, -0.482025146484375, -0.4651908874511719, -0.44835662841796875, -0.4315223693847656, -0.4146881103515625, -0.3978538513183594, -0.38101959228515625, -0.3641853332519531, -0.34735107421875, -0.3305168151855469, -0.31368255615234375, -0.2968482971191406, -0.2800140380859375, -0.2631797790527344, -0.24634552001953125, -0.22951126098632812, -0.212677001953125, -0.19584274291992188, -0.17900848388671875, -0.16217422485351562, -0.1453399658203125, -0.12850570678710938, -0.11167144775390625, -0.09483718872070312, -0.0780029296875, -0.061168670654296875, -0.04433441162109375, -0.027500152587890625, -0.0106658935546875, 0.006168365478515625, 0.02300262451171875, 0.039836883544921875, 0.056671142578125, 0.07350540161132812, 0.09033966064453125, 0.10717391967773438, 0.1240081787109375, 0.14084243774414062, 0.15767669677734375, 0.17451095581054688, 0.19134521484375, 0.20817947387695312, 0.22501373291015625, 0.24184799194335938, 0.2586822509765625, 0.2755165100097656, 0.29235076904296875, 0.3091850280761719, 0.326019287109375, 0.3428535461425781, 0.35968780517578125, 0.3765220642089844, 0.3933563232421875, 0.4101905822753906, 0.42702484130859375, 0.4438591003417969, 0.460693359375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 2.0, 4.0, 5.0, 3.0, 6.0, 11.0, 17.0, 11.0, 15.0, 15.0, 649.0, 151.0, 18.0, 10.0, 13.0, 10.0, 5.0, 6.0, 8.0, 7.0, 3.0, 3.0, 5.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0313720703125, -0.030516386032104492, -0.029660701751708984, -0.028805017471313477, -0.02794933319091797, -0.02709364891052246, -0.026237964630126953, -0.025382280349731445, -0.024526596069335938, -0.02367091178894043, -0.022815227508544922, -0.021959543228149414, -0.021103858947753906, -0.0202481746673584, -0.01939249038696289, -0.018536806106567383, -0.017681121826171875, -0.016825437545776367, -0.01596975326538086, -0.015114068984985352, -0.014258384704589844, -0.013402700424194336, -0.012547016143798828, -0.01169133186340332, -0.010835647583007812, -0.009979963302612305, -0.009124279022216797, -0.008268594741821289, -0.007412910461425781, -0.0065572261810302734, -0.005701541900634766, -0.004845857620239258, -0.00399017333984375, -0.003134489059448242, -0.0022788047790527344, -0.0014231204986572266, -0.0005674362182617188, 0.00028824806213378906, 0.0011439323425292969, 0.0019996166229248047, 0.0028553009033203125, 0.0037109851837158203, 0.004566669464111328, 0.005422353744506836, 0.006278038024902344, 0.0071337223052978516, 0.00798940658569336, 0.008845090866088867, 0.009700775146484375, 0.010556459426879883, 0.01141214370727539, 0.012267827987670898, 0.013123512268066406, 0.013979196548461914, 0.014834880828857422, 0.01569056510925293, 0.016546249389648438, 0.017401933670043945, 0.018257617950439453, 0.01911330223083496, 0.01996898651123047, 0.020824670791625977, 0.021680355072021484, 0.022536039352416992, 0.0233917236328125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 3.0, 6.0, 4.0, 6.0, 8.0, 12.0, 16.0, 10.0, 15.0, 24.0, 26.0, 45.0, 40.0, 72.0, 123.0, 246.0, 635.0, 2255.0, 14783.0, 4102724.0, 65823.0, 5350.0, 1143.0, 372.0, 181.0, 96.0, 57.0, 36.0, 35.0, 23.0, 26.0, 19.0, 12.0, 7.0, 9.0, 7.0, 3.0, 8.0, 5.0, 2.0, 3.0, 2.0, 0.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.265869140625, -0.25722503662109375, -0.2485809326171875, -0.23993682861328125, -0.231292724609375, -0.22264862060546875, -0.2140045166015625, -0.20536041259765625, -0.19671630859375, -0.18807220458984375, -0.1794281005859375, -0.17078399658203125, -0.162139892578125, -0.15349578857421875, -0.1448516845703125, -0.13620758056640625, -0.1275634765625, -0.11891937255859375, -0.1102752685546875, -0.10163116455078125, -0.092987060546875, -0.08434295654296875, -0.0756988525390625, -0.06705474853515625, -0.05841064453125, -0.04976654052734375, -0.0411224365234375, -0.03247833251953125, -0.023834228515625, -0.01519012451171875, -0.0065460205078125, 0.00209808349609375, 0.0107421875, 0.01938629150390625, 0.0280303955078125, 0.03667449951171875, 0.045318603515625, 0.05396270751953125, 0.0626068115234375, 0.07125091552734375, 0.07989501953125, 0.08853912353515625, 0.0971832275390625, 0.10582733154296875, 0.114471435546875, 0.12311553955078125, 0.1317596435546875, 0.14040374755859375, 0.1490478515625, 0.15769195556640625, 0.1663360595703125, 0.17498016357421875, 0.183624267578125, 0.19226837158203125, 0.2009124755859375, 0.20955657958984375, 0.21820068359375, 0.22684478759765625, 0.2354888916015625, 0.24413299560546875, 0.252777099609375, 0.26142120361328125, 0.2700653076171875, 0.27870941162109375, 0.287353515625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 6.0, 2.0, 3.0, 6.0, 7.0, 8.0, 5.0, 9.0, 11.0, 9.0, 11.0, 10.0, 11.0, 13.0, 19.0, 21.0, 28.0, 33.0, 3615.0, 40.0, 21.0, 30.0, 22.0, 21.0, 14.0, 8.0, 15.0, 11.0, 8.0, 15.0, 8.0, 7.0, 4.0, 2.0, 7.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.039306640625, -0.038028717041015625, -0.03675079345703125, -0.035472869873046875, -0.0341949462890625, -0.032917022705078125, -0.03163909912109375, -0.030361175537109375, -0.029083251953125, -0.027805328369140625, -0.02652740478515625, -0.025249481201171875, -0.0239715576171875, -0.022693634033203125, -0.02141571044921875, -0.020137786865234375, -0.01885986328125, -0.017581939697265625, -0.01630401611328125, -0.015026092529296875, -0.0137481689453125, -0.012470245361328125, -0.01119232177734375, -0.009914398193359375, -0.008636474609375, -0.007358551025390625, -0.00608062744140625, -0.004802703857421875, -0.0035247802734375, -0.002246856689453125, -0.00096893310546875, 0.000308990478515625, 0.0015869140625, 0.002864837646484375, 0.00414276123046875, 0.005420684814453125, 0.0066986083984375, 0.007976531982421875, 0.00925445556640625, 0.010532379150390625, 0.011810302734375, 0.013088226318359375, 0.01436614990234375, 0.015644073486328125, 0.0169219970703125, 0.018199920654296875, 0.01947784423828125, 0.020755767822265625, 0.02203369140625, 0.023311614990234375, 0.02458953857421875, 0.025867462158203125, 0.0271453857421875, 0.028423309326171875, 0.02970123291015625, 0.030979156494140625, 0.032257080078125, 0.033535003662109375, 0.03481292724609375, 0.036090850830078125, 0.0373687744140625, 0.038646697998046875, 0.03992462158203125, 0.041202545166015625, 0.04248046875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 25.0, 901.0, 79.0, 10.0, 3.0], "bins": [-0.5195388793945312, -0.5109933018684387, -0.5024476647377014, -0.4939020872116089, -0.48535650968551636, -0.47681090235710144, -0.4682652950286865, -0.459719717502594, -0.4511741101741791, -0.44262850284576416, -0.43408292531967163, -0.4255373179912567, -0.4169917106628418, -0.40844613313674927, -0.39990052580833435, -0.3913549482822418, -0.3828093409538269, -0.374263733625412, -0.36571815609931946, -0.35717254877090454, -0.348626971244812, -0.3400813639163971, -0.3315357565879822, -0.32299017906188965, -0.31444457173347473, -0.3058989644050598, -0.2973533868789673, -0.28880777955055237, -0.28026217222213745, -0.2717165946960449, -0.26317098736763, -0.2546254098415375, -0.24607977271080017, -0.23753418028354645, -0.22898858785629272, -0.2204429805278778, -0.21189738810062408, -0.20335179567337036, -0.19480618834495544, -0.18626059591770172, -0.177715003490448, -0.16916941106319427, -0.16062381863594055, -0.15207821130752563, -0.1435326188802719, -0.1349870264530182, -0.12644141912460327, -0.11789582669734955, -0.10935023427009583, -0.1008046418428421, -0.09225904196500778, -0.08371344208717346, -0.07516784965991974, -0.06662225723266602, -0.058076657354831696, -0.049531061202287674, -0.04098546504974365, -0.03243986889719963, -0.02389427274465561, -0.015348676592111588, -0.006803080439567566, 0.0017425157129764557, 0.010288111865520477, 0.0188337080180645, 0.02737930417060852]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 2.0, 4.0, 1.0, 3.0, 8.0, 7.0, 6.0, 24.0, 20.0, 24.0, 59.0, 107.0, 146.0, 167.0, 157.0, 95.0, 59.0, 28.0, 20.0, 8.0, 10.0, 6.0, 5.0, 5.0, 6.0, 5.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2094680666923523, -0.20156686007976532, -0.19366565346717834, -0.18576443195343018, -0.1778632253408432, -0.16996201872825623, -0.16206081211566925, -0.15415960550308228, -0.1462583839893341, -0.13835717737674713, -0.13045597076416016, -0.12255475670099258, -0.11465354263782501, -0.10675233602523804, -0.09885112941265106, -0.09094992280006409, -0.08304871618747711, -0.07514750957489014, -0.06724629551172256, -0.05934508889913559, -0.051443878561258316, -0.04354266822338104, -0.03564146161079407, -0.027740251272916794, -0.01983904093503952, -0.011937831528484821, -0.004036622121930122, 0.003864586353302002, 0.011765796691179276, 0.01966700702905655, 0.027568213641643524, 0.0354694239795208, 0.04337063431739807, 0.051271844655275345, 0.05917305499315262, 0.0670742616057396, 0.07497547566890717, 0.08287668228149414, 0.09077788889408112, 0.09867909550666809, 0.10658030956983566, 0.11448151618242264, 0.12238273024559021, 0.13028393685817719, 0.13818514347076416, 0.14608636498451233, 0.1539875566959381, 0.16188877820968628, 0.16978998482227325, 0.17769119143486023, 0.1855923980474472, 0.19349360466003418, 0.20139482617378235, 0.20929603278636932, 0.2171972393989563, 0.22509844601154327, 0.23299965262413025, 0.24090085923671722, 0.2488020658493042, 0.25670328736305237, 0.26460447907447815, 0.2725057005882263, 0.2804068922996521, 0.28830811381340027, 0.29620933532714844]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 11.0, 8.0, 17.0, 10.0, 21.0, 28.0, 53.0, 55.0, 71.0, 102.0, 163.0, 222.0, 321.0, 427.0, 633.0, 920.0, 1329.0, 1959.0, 3185.0, 5099.0, 9826.0, 22235.0, 806959.0, 152364.0, 19653.0, 8843.0, 4976.0, 2878.0, 1910.0, 1322.0, 855.0, 638.0, 412.0, 293.0, 211.0, 151.0, 103.0, 72.0, 46.0, 47.0, 36.0, 25.0, 17.0, 13.0, 11.0, 11.0, 6.0, 2.0, 4.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.07537841796875, -0.07294178009033203, -0.07050514221191406, -0.0680685043334961, -0.06563186645507812, -0.06319522857666016, -0.06075859069824219, -0.05832195281982422, -0.05588531494140625, -0.05344867706298828, -0.05101203918457031, -0.048575401306152344, -0.046138763427734375, -0.043702125549316406, -0.04126548767089844, -0.03882884979248047, -0.0363922119140625, -0.03395557403564453, -0.03151893615722656, -0.029082298278808594, -0.026645660400390625, -0.024209022521972656, -0.021772384643554688, -0.01933574676513672, -0.01689910888671875, -0.014462471008300781, -0.012025833129882812, -0.009589195251464844, -0.007152557373046875, -0.004715919494628906, -0.0022792816162109375, 0.00015735626220703125, 0.002593994140625, 0.005030632019042969, 0.0074672698974609375, 0.009903907775878906, 0.012340545654296875, 0.014777183532714844, 0.017213821411132812, 0.01965045928955078, 0.02208709716796875, 0.02452373504638672, 0.026960372924804688, 0.029397010803222656, 0.031833648681640625, 0.034270286560058594, 0.03670692443847656, 0.03914356231689453, 0.0415802001953125, 0.04401683807373047, 0.04645347595214844, 0.048890113830566406, 0.051326751708984375, 0.053763389587402344, 0.05620002746582031, 0.05863666534423828, 0.06107330322265625, 0.06350994110107422, 0.06594657897949219, 0.06838321685791016, 0.07081985473632812, 0.0732564926147461, 0.07569313049316406, 0.07812976837158203, 0.08056640625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 5.0, 11.0, 15.0, 16.0, 11.0, 13.0, 112.0, 674.0, 29.0, 17.0, 6.0, 11.0, 6.0, 4.0, 11.0, 8.0, 5.0, 2.0, 6.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0281524658203125, -0.027372121810913086, -0.026591777801513672, -0.025811433792114258, -0.025031089782714844, -0.02425074577331543, -0.023470401763916016, -0.0226900577545166, -0.021909713745117188, -0.021129369735717773, -0.02034902572631836, -0.019568681716918945, -0.01878833770751953, -0.018007993698120117, -0.017227649688720703, -0.01644730567932129, -0.015666961669921875, -0.014886617660522461, -0.014106273651123047, -0.013325929641723633, -0.012545585632324219, -0.011765241622924805, -0.01098489761352539, -0.010204553604125977, -0.009424209594726562, -0.008643865585327148, -0.007863521575927734, -0.00708317756652832, -0.006302833557128906, -0.005522489547729492, -0.004742145538330078, -0.003961801528930664, -0.00318145751953125, -0.002401113510131836, -0.0016207695007324219, -0.0008404254913330078, -6.008148193359375e-05, 0.0007202625274658203, 0.0015006065368652344, 0.0022809505462646484, 0.0030612945556640625, 0.0038416385650634766, 0.004621982574462891, 0.005402326583862305, 0.006182670593261719, 0.006963014602661133, 0.007743358612060547, 0.008523702621459961, 0.009304046630859375, 0.010084390640258789, 0.010864734649658203, 0.011645078659057617, 0.012425422668457031, 0.013205766677856445, 0.01398611068725586, 0.014766454696655273, 0.015546798706054688, 0.0163271427154541, 0.017107486724853516, 0.01788783073425293, 0.018668174743652344, 0.019448518753051758, 0.020228862762451172, 0.021009206771850586, 0.02178955078125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 4.0, 4.0, 3.0, 6.0, 9.0, 14.0, 16.0, 29.0, 18.0, 37.0, 34.0, 39.0, 54.0, 79.0, 87.0, 111.0, 155.0, 170.0, 285.0, 633.0, 2936.0, 147910.0, 887293.0, 6462.0, 888.0, 334.0, 230.0, 152.0, 108.0, 93.0, 90.0, 55.0, 47.0, 43.0, 30.0, 18.0, 24.0, 12.0, 15.0, 8.0, 6.0, 4.0, 2.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.18115234375, -0.17584991455078125, -0.1705474853515625, -0.16524505615234375, -0.159942626953125, -0.15464019775390625, -0.1493377685546875, -0.14403533935546875, -0.13873291015625, -0.13343048095703125, -0.1281280517578125, -0.12282562255859375, -0.117523193359375, -0.11222076416015625, -0.1069183349609375, -0.10161590576171875, -0.0963134765625, -0.09101104736328125, -0.0857086181640625, -0.08040618896484375, -0.075103759765625, -0.06980133056640625, -0.0644989013671875, -0.05919647216796875, -0.05389404296875, -0.04859161376953125, -0.0432891845703125, -0.03798675537109375, -0.032684326171875, -0.02738189697265625, -0.0220794677734375, -0.01677703857421875, -0.011474609375, -0.00617218017578125, -0.0008697509765625, 0.00443267822265625, 0.009735107421875, 0.01503753662109375, 0.0203399658203125, 0.02564239501953125, 0.03094482421875, 0.03624725341796875, 0.0415496826171875, 0.04685211181640625, 0.052154541015625, 0.05745697021484375, 0.0627593994140625, 0.06806182861328125, 0.0733642578125, 0.07866668701171875, 0.0839691162109375, 0.08927154541015625, 0.094573974609375, 0.09987640380859375, 0.1051788330078125, 0.11048126220703125, 0.11578369140625, 0.12108612060546875, 0.1263885498046875, 0.13169097900390625, 0.136993408203125, 0.14229583740234375, 0.1475982666015625, 0.15290069580078125, 0.158203125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 0.0, 4.0, 4.0, 2.0, 4.0, 8.0, 14.0, 10.0, 20.0, 15.0, 25.0, 21.0, 21.0, 20.0, 28.0, 27.0, 30.0, 40.0, 31.0, 45.0, 40.0, 53.0, 50.0, 43.0, 40.0, 49.0, 44.0, 45.0, 33.0, 32.0, 21.0, 37.0, 18.0, 22.0, 17.0, 17.0, 15.0, 16.0, 9.0, 10.0, 7.0, 5.0, 4.0, 0.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.08526611328125, -0.08277225494384766, -0.08027839660644531, -0.07778453826904297, -0.07529067993164062, -0.07279682159423828, -0.07030296325683594, -0.0678091049194336, -0.06531524658203125, -0.0628213882446289, -0.06032752990722656, -0.05783367156982422, -0.055339813232421875, -0.05284595489501953, -0.05035209655761719, -0.047858238220214844, -0.0453643798828125, -0.042870521545410156, -0.04037666320800781, -0.03788280487060547, -0.035388946533203125, -0.03289508819580078, -0.030401229858398438, -0.027907371520996094, -0.02541351318359375, -0.022919654846191406, -0.020425796508789062, -0.01793193817138672, -0.015438079833984375, -0.012944221496582031, -0.010450363159179688, -0.007956504821777344, -0.005462646484375, -0.0029687881469726562, -0.0004749298095703125, 0.0020189285278320312, 0.004512786865234375, 0.007006645202636719, 0.009500503540039062, 0.011994361877441406, 0.01448822021484375, 0.016982078552246094, 0.019475936889648438, 0.02196979522705078, 0.024463653564453125, 0.02695751190185547, 0.029451370239257812, 0.031945228576660156, 0.0344390869140625, 0.036932945251464844, 0.03942680358886719, 0.04192066192626953, 0.044414520263671875, 0.04690837860107422, 0.04940223693847656, 0.051896095275878906, 0.05438995361328125, 0.056883811950683594, 0.05937767028808594, 0.06187152862548828, 0.06436538696289062, 0.06685924530029297, 0.06935310363769531, 0.07184696197509766, 0.0743408203125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 3.0, 5.0, 6.0, 11.0, 24.0, 23.0, 42.0, 64.0, 119.0, 260.0, 495.0, 1342.0, 5193.0, 63765.0, 953984.0, 18498.0, 2913.0, 986.0, 383.0, 183.0, 97.0, 67.0, 40.0, 18.0, 11.0, 2.0, 7.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002181529998779297, -0.00021095573902130127, -0.00020375847816467285, -0.00019656121730804443, -0.00018936395645141602, -0.0001821666955947876, -0.00017496943473815918, -0.00016777217388153076, -0.00016057491302490234, -0.00015337765216827393, -0.0001461803913116455, -0.0001389831304550171, -0.00013178586959838867, -0.00012458860874176025, -0.00011739134788513184, -0.00011019408702850342, -0.000102996826171875, -9.579956531524658e-05, -8.860230445861816e-05, -8.140504360198975e-05, -7.420778274536133e-05, -6.701052188873291e-05, -5.981326103210449e-05, -5.2616000175476074e-05, -4.5418739318847656e-05, -3.822147846221924e-05, -3.102421760559082e-05, -2.3826956748962402e-05, -1.6629695892333984e-05, -9.432435035705566e-06, -2.2351741790771484e-06, 4.9620866775512695e-06, 1.2159347534179688e-05, 1.9356608390808105e-05, 2.6553869247436523e-05, 3.375113010406494e-05, 4.094839096069336e-05, 4.814565181732178e-05, 5.5342912673950195e-05, 6.254017353057861e-05, 6.973743438720703e-05, 7.693469524383545e-05, 8.413195610046387e-05, 9.132921695709229e-05, 9.85264778137207e-05, 0.00010572373867034912, 0.00011292099952697754, 0.00012011826038360596, 0.00012731552124023438, 0.0001345127820968628, 0.0001417100429534912, 0.00014890730381011963, 0.00015610456466674805, 0.00016330182552337646, 0.00017049908638000488, 0.0001776963472366333, 0.00018489360809326172, 0.00019209086894989014, 0.00019928812980651855, 0.00020648539066314697, 0.0002136826515197754, 0.0002208799123764038, 0.00022807717323303223, 0.00023527443408966064, 0.00024247169494628906]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 7.0, 3.0, 16.0, 25.0, 37.0, 52.0, 71.0, 105.0, 92.0, 131.0, 91.0, 114.0, 55.0, 67.0, 36.0, 45.0, 24.0, 16.0, 10.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.331371307373047e-06, -7.119961082935333e-06, -6.90855085849762e-06, -6.697140634059906e-06, -6.485730409622192e-06, -6.274320185184479e-06, -6.062909960746765e-06, -5.8514997363090515e-06, -5.640089511871338e-06, -5.428679287433624e-06, -5.217269062995911e-06, -5.005858838558197e-06, -4.794448614120483e-06, -4.58303838968277e-06, -4.371628165245056e-06, -4.1602179408073425e-06, -3.948807716369629e-06, -3.7373974919319153e-06, -3.5259872674942017e-06, -3.314577043056488e-06, -3.1031668186187744e-06, -2.891756594181061e-06, -2.680346369743347e-06, -2.4689361453056335e-06, -2.25752592086792e-06, -2.0461156964302063e-06, -1.8347054719924927e-06, -1.623295247554779e-06, -1.4118850231170654e-06, -1.2004747986793518e-06, -9.890645742416382e-07, -7.776543498039246e-07, -5.662441253662109e-07, -3.548339009284973e-07, -1.434236764907837e-07, 6.798654794692993e-08, 2.7939677238464355e-07, 4.908069968223572e-07, 7.022172212600708e-07, 9.136274456977844e-07, 1.125037670135498e-06, 1.3364478945732117e-06, 1.5478581190109253e-06, 1.759268343448639e-06, 1.9706785678863525e-06, 2.182088792324066e-06, 2.3934990167617798e-06, 2.6049092411994934e-06, 2.816319465637207e-06, 3.0277296900749207e-06, 3.2391399145126343e-06, 3.450550138950348e-06, 3.6619603633880615e-06, 3.873370587825775e-06, 4.084780812263489e-06, 4.296191036701202e-06, 4.507601261138916e-06, 4.71901148557663e-06, 4.930421710014343e-06, 5.141831934452057e-06, 5.3532421588897705e-06, 5.564652383327484e-06, 5.776062607765198e-06, 5.987472832202911e-06, 6.198883056640625e-06]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 4.0, 5.0, 9.0, 14.0, 19.0, 17.0, 23.0, 39.0, 41.0, 84.0, 102.0, 173.0, 285.0, 627.0, 4735.0, 1010626.0, 29736.0, 1038.0, 350.0, 191.0, 131.0, 85.0, 64.0, 40.0, 43.0, 18.0, 10.0, 15.0, 8.0, 8.0, 3.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001894235610961914, -0.00018282420933246613, -0.00017622485756874084, -0.00016962550580501556, -0.00016302615404129028, -0.000156426802277565, -0.00014982745051383972, -0.00014322809875011444, -0.00013662874698638916, -0.00013002939522266388, -0.0001234300434589386, -0.00011683069169521332, -0.00011023133993148804, -0.00010363198816776276, -9.703263640403748e-05, -9.04332846403122e-05, -8.383393287658691e-05, -7.723458111286163e-05, -7.063522934913635e-05, -6.403587758541107e-05, -5.743652582168579e-05, -5.083717405796051e-05, -4.423782229423523e-05, -3.763847053050995e-05, -3.103911876678467e-05, -2.4439767003059387e-05, -1.7840415239334106e-05, -1.1241063475608826e-05, -4.641711711883545e-06, 1.957640051841736e-06, 8.556991815567017e-06, 1.5156343579292297e-05, 2.1755695343017578e-05, 2.835504710674286e-05, 3.495439887046814e-05, 4.155375063419342e-05, 4.81531023979187e-05, 5.475245416164398e-05, 6.135180592536926e-05, 6.795115768909454e-05, 7.455050945281982e-05, 8.11498612165451e-05, 8.774921298027039e-05, 9.434856474399567e-05, 0.00010094791650772095, 0.00010754726827144623, 0.00011414662003517151, 0.00012074597179889679, 0.00012734532356262207, 0.00013394467532634735, 0.00014054402709007263, 0.0001471433788537979, 0.0001537427306175232, 0.00016034208238124847, 0.00016694143414497375, 0.00017354078590869904, 0.00018014013767242432, 0.0001867394894361496, 0.00019333884119987488, 0.00019993819296360016, 0.00020653754472732544, 0.00021313689649105072, 0.000219736248254776, 0.00022633560001850128, 0.00023293495178222656]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 4.0, 3.0, 4.0, 7.0, 10.0, 14.0, 11.0, 11.0, 19.0, 22.0, 32.0, 45.0, 53.0, 63.0, 82.0, 68.0, 83.0, 86.0, 63.0, 74.0, 51.0, 41.0, 41.0, 34.0, 14.0, 26.0, 11.0, 6.0, 9.0, 6.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.916854858398438e-05, -8.606258779764175e-05, -8.295662701129913e-05, -7.985066622495651e-05, -7.674470543861389e-05, -7.363874465227127e-05, -7.053278386592865e-05, -6.742682307958603e-05, -6.432086229324341e-05, -6.121490150690079e-05, -5.8108940720558167e-05, -5.5002979934215546e-05, -5.1897019147872925e-05, -4.8791058361530304e-05, -4.568509757518768e-05, -4.257913678884506e-05, -3.947317600250244e-05, -3.636721521615982e-05, -3.32612544298172e-05, -3.015529364347458e-05, -2.7049332857131958e-05, -2.3943372070789337e-05, -2.0837411284446716e-05, -1.7731450498104095e-05, -1.4625489711761475e-05, -1.1519528925418854e-05, -8.413568139076233e-06, -5.307607352733612e-06, -2.201646566390991e-06, 9.043142199516296e-07, 4.0102750062942505e-06, 7.116235792636871e-06, 1.0222196578979492e-05, 1.3328157365322113e-05, 1.6434118151664734e-05, 1.9540078938007355e-05, 2.2646039724349976e-05, 2.5752000510692596e-05, 2.8857961297035217e-05, 3.196392208337784e-05, 3.506988286972046e-05, 3.817584365606308e-05, 4.12818044424057e-05, 4.438776522874832e-05, 4.749372601509094e-05, 5.059968680143356e-05, 5.3705647587776184e-05, 5.6811608374118805e-05, 5.9917569160461426e-05, 6.302352994680405e-05, 6.612949073314667e-05, 6.923545151948929e-05, 7.234141230583191e-05, 7.544737309217453e-05, 7.855333387851715e-05, 8.165929466485977e-05, 8.476525545120239e-05, 8.787121623754501e-05, 9.097717702388763e-05, 9.408313781023026e-05, 9.718909859657288e-05, 0.0001002950593829155, 0.00010340102016925812, 0.00010650698095560074, 0.00010961294174194336]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 36.0, 967.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22593055665493011, -0.1744968444108963, -0.12306312471628189, -0.07162940502166748, -0.020195692777633667, 0.03123803436756134, 0.08267174661159515, 0.13410545885562897, 0.18553917109966278, 0.2369728833436966, 0.2884066104888916, 0.3398403227329254, 0.39127403497695923, 0.44270777702331543, 0.49414145946502686, 0.5455752015113831, 0.5970088839530945, 0.6484426259994507, 0.6998763084411621, 0.7513100504875183, 0.8027437329292297, 0.8541774749755859, 0.9056111574172974, 0.9570448994636536, 1.0084786415100098, 1.0599123239517212, 1.1113461256027222, 1.1627798080444336, 1.214213490486145, 1.2656471729278564, 1.3170809745788574, 1.3685146570205688, 1.4199484586715698, 1.4713821411132812, 1.5228159427642822, 1.5742496252059937, 1.625683307647705, 1.677117109298706, 1.7285507917404175, 1.779984474182129, 1.8314181566238403, 1.8828518390655518, 1.9342856407165527, 1.9857193231582642, 2.0371530055999756, 2.0885868072509766, 2.1400203704833984, 2.1914541721343994, 2.2428879737854004, 2.2943217754364014, 2.3457553386688232, 2.397189140319824, 2.448622941970825, 2.500056505203247, 2.551490306854248, 2.60292387008667, 2.654357671737671, 2.705791473388672, 2.7572250366210938, 2.8086588382720947, 2.8600926399230957, 2.9115262031555176, 2.9629600048065186, 3.0143938064575195, 3.0658273696899414]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 0.0, 0.0, 6.0, 13.0, 12.0, 6.0, 8.0, 15.0, 22.0, 32.0, 33.0, 53.0, 56.0, 60.0, 78.0, 70.0, 83.0, 71.0, 55.0, 70.0, 50.0, 53.0, 36.0, 33.0, 12.0, 12.0, 12.0, 4.0, 6.0, 6.0, 2.0, 1.0, 5.0, 2.0, 0.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.7773054242134094, -0.7545614838600159, -0.7318175435066223, -0.7090736031532288, -0.6863296031951904, -0.6635856628417969, -0.6408417224884033, -0.6180977821350098, -0.5953538417816162, -0.5726099014282227, -0.5498659610748291, -0.5271220207214355, -0.504378080368042, -0.48163411021232605, -0.4588901400566101, -0.43614619970321655, -0.413402259349823, -0.39065831899642944, -0.3679143786430359, -0.34517040848731995, -0.3224264681339264, -0.29968252778053284, -0.2769385576248169, -0.25419461727142334, -0.23145067691802979, -0.20870673656463623, -0.18596278131008148, -0.16321882605552673, -0.14047488570213318, -0.11773093789815903, -0.09498699009418488, -0.07224303483963013, -0.0494990348815918, -0.026755087077617645, -0.004011139273643494, 0.018732808530330658, 0.04147675633430481, 0.06422070413827896, 0.08696465194225311, 0.10970860719680786, 0.13245254755020142, 0.15519648790359497, 0.17794044315814972, 0.20068439841270447, 0.22342833876609802, 0.24617227911949158, 0.2689162492752075, 0.2916601896286011, 0.31440412998199463, 0.3371480703353882, 0.35989201068878174, 0.3826359808444977, 0.40537992119789124, 0.4281238615512848, 0.45086783170700073, 0.4736117720603943, 0.49635571241378784, 0.5190996527671814, 0.541843593120575, 0.5645875334739685, 0.5873315334320068, 0.6100754737854004, 0.632819414138794, 0.6555633544921875, 0.678307294845581]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 5.0, 3.0, 7.0, 14.0, 11.0, 15.0, 31.0, 34.0, 63.0, 84.0, 139.0, 228.0, 397.0, 669.0, 1349.0, 2939.0, 8716.0, 4119184.0, 51205.0, 5617.0, 1867.0, 794.0, 389.0, 213.0, 103.0, 70.0, 51.0, 18.0, 20.0, 9.0, 10.0, 6.0, 5.0, 1.0, 4.0, 0.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.264404296875, -0.25702667236328125, -0.2496490478515625, -0.24227142333984375, -0.234893798828125, -0.22751617431640625, -0.2201385498046875, -0.21276092529296875, -0.20538330078125, -0.19800567626953125, -0.1906280517578125, -0.18325042724609375, -0.175872802734375, -0.16849517822265625, -0.1611175537109375, -0.15373992919921875, -0.1463623046875, -0.13898468017578125, -0.1316070556640625, -0.12422943115234375, -0.116851806640625, -0.10947418212890625, -0.1020965576171875, -0.09471893310546875, -0.08734130859375, -0.07996368408203125, -0.0725860595703125, -0.06520843505859375, -0.057830810546875, -0.05045318603515625, -0.0430755615234375, -0.03569793701171875, -0.0283203125, -0.02094268798828125, -0.0135650634765625, -0.00618743896484375, 0.001190185546875, 0.00856781005859375, 0.0159454345703125, 0.02332305908203125, 0.03070068359375, 0.03807830810546875, 0.0454559326171875, 0.05283355712890625, 0.060211181640625, 0.06758880615234375, 0.0749664306640625, 0.08234405517578125, 0.0897216796875, 0.09709930419921875, 0.1044769287109375, 0.11185455322265625, 0.119232177734375, 0.12660980224609375, 0.1339874267578125, 0.14136505126953125, 0.14874267578125, 0.15612030029296875, 0.1634979248046875, 0.17087554931640625, 0.178253173828125, 0.18563079833984375, 0.1930084228515625, 0.20038604736328125, 0.207763671875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 3.0, 2.0, 3.0, 6.0, 10.0, 17.0, 14.0, 16.0, 9.0, 272.0, 509.0, 29.0, 18.0, 9.0, 12.0, 4.0, 9.0, 8.0, 9.0, 2.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0264892578125, -0.02575230598449707, -0.02501535415649414, -0.02427840232849121, -0.02354145050048828, -0.02280449867248535, -0.022067546844482422, -0.021330595016479492, -0.020593643188476562, -0.019856691360473633, -0.019119739532470703, -0.018382787704467773, -0.017645835876464844, -0.016908884048461914, -0.016171932220458984, -0.015434980392456055, -0.014698028564453125, -0.013961076736450195, -0.013224124908447266, -0.012487173080444336, -0.011750221252441406, -0.011013269424438477, -0.010276317596435547, -0.009539365768432617, -0.008802413940429688, -0.008065462112426758, -0.007328510284423828, -0.0065915584564208984, -0.005854606628417969, -0.005117654800415039, -0.004380702972412109, -0.0036437511444091797, -0.00290679931640625, -0.0021698474884033203, -0.0014328956604003906, -0.0006959438323974609, 4.100799560546875e-05, 0.0007779598236083984, 0.0015149116516113281, 0.002251863479614258, 0.0029888153076171875, 0.003725767135620117, 0.004462718963623047, 0.0051996707916259766, 0.005936622619628906, 0.006673574447631836, 0.007410526275634766, 0.008147478103637695, 0.008884429931640625, 0.009621381759643555, 0.010358333587646484, 0.011095285415649414, 0.011832237243652344, 0.012569189071655273, 0.013306140899658203, 0.014043092727661133, 0.014780044555664062, 0.015516996383666992, 0.016253948211669922, 0.01699090003967285, 0.01772785186767578, 0.01846480369567871, 0.01920175552368164, 0.01993870735168457, 0.0206756591796875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 14.0, 10.0, 7.0, 18.0, 38.0, 54.0, 86.0, 123.0, 324.0, 1283.0, 115543.0, 4074336.0, 1686.0, 372.0, 127.0, 90.0, 62.0, 29.0, 22.0, 14.0, 11.0, 7.0, 6.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.65576171875, -0.6365127563476562, -0.6172637939453125, -0.5980148315429688, -0.578765869140625, -0.5595169067382812, -0.5402679443359375, -0.5210189819335938, -0.50177001953125, -0.48252105712890625, -0.4632720947265625, -0.44402313232421875, -0.424774169921875, -0.40552520751953125, -0.3862762451171875, -0.36702728271484375, -0.3477783203125, -0.32852935791015625, -0.3092803955078125, -0.29003143310546875, -0.270782470703125, -0.25153350830078125, -0.2322845458984375, -0.21303558349609375, -0.19378662109375, -0.17453765869140625, -0.1552886962890625, -0.13603973388671875, -0.116790771484375, -0.09754180908203125, -0.0782928466796875, -0.05904388427734375, -0.039794921875, -0.02054595947265625, -0.0012969970703125, 0.01795196533203125, 0.037200927734375, 0.05644989013671875, 0.0756988525390625, 0.09494781494140625, 0.11419677734375, 0.13344573974609375, 0.1526947021484375, 0.17194366455078125, 0.191192626953125, 0.21044158935546875, 0.2296905517578125, 0.24893951416015625, 0.2681884765625, 0.28743743896484375, 0.3066864013671875, 0.32593536376953125, 0.345184326171875, 0.36443328857421875, 0.3836822509765625, 0.40293121337890625, 0.42218017578125, 0.44142913818359375, 0.4606781005859375, 0.47992706298828125, 0.499176025390625, 0.5184249877929688, 0.5376739501953125, 0.5569229125976562, 0.576171875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 3.0, 7.0, 9.0, 17.0, 23.0, 23.0, 21.0, 51.0, 85.0, 132.0, 3050.0, 316.0, 101.0, 65.0, 37.0, 37.0, 25.0, 17.0, 8.0, 12.0, 8.0, 4.0, 2.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.10040283203125, -0.09794187545776367, -0.09548091888427734, -0.09301996231079102, -0.09055900573730469, -0.08809804916381836, -0.08563709259033203, -0.0831761360168457, -0.08071517944335938, -0.07825422286987305, -0.07579326629638672, -0.07333230972290039, -0.07087135314941406, -0.06841039657592773, -0.0659494400024414, -0.06348848342895508, -0.06102752685546875, -0.05856657028198242, -0.056105613708496094, -0.053644657135009766, -0.05118370056152344, -0.04872274398803711, -0.04626178741455078, -0.04380083084106445, -0.041339874267578125, -0.0388789176940918, -0.03641796112060547, -0.03395700454711914, -0.03149604797363281, -0.029035091400146484, -0.026574134826660156, -0.024113178253173828, -0.0216522216796875, -0.019191265106201172, -0.016730308532714844, -0.014269351959228516, -0.011808395385742188, -0.00934743881225586, -0.006886482238769531, -0.004425525665283203, -0.001964569091796875, 0.0004963874816894531, 0.0029573440551757812, 0.005418300628662109, 0.007879257202148438, 0.010340213775634766, 0.012801170349121094, 0.015262126922607422, 0.01772308349609375, 0.020184040069580078, 0.022644996643066406, 0.025105953216552734, 0.027566909790039062, 0.03002786636352539, 0.03248882293701172, 0.03494977951049805, 0.037410736083984375, 0.0398716926574707, 0.04233264923095703, 0.04479360580444336, 0.04725456237792969, 0.049715518951416016, 0.052176475524902344, 0.05463743209838867, 0.057098388671875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 5.0, 6.0, 29.0, 90.0, 610.0, 205.0, 36.0, 12.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1501970887184143, -0.14717577397823334, -0.14415445923805237, -0.1411331295967102, -0.13811181485652924, -0.13509050011634827, -0.1320691853761673, -0.12904787063598633, -0.12602655589580536, -0.12300524115562439, -0.11998391896486282, -0.11696260422468185, -0.11394128948450089, -0.11091996729373932, -0.10789865255355835, -0.10487733781337738, -0.10185600817203522, -0.09883469343185425, -0.09581337124109268, -0.09279205650091171, -0.08977074176073074, -0.08674941956996918, -0.08372810482978821, -0.08070679008960724, -0.07768547534942627, -0.0746641606092453, -0.07164283841848373, -0.06862152367830276, -0.0656002089381218, -0.06257888674736023, -0.05955757200717926, -0.05653625354170799, -0.053514935076236725, -0.05049361661076546, -0.04747230187058449, -0.04445098340511322, -0.04142966493964195, -0.038408346474170685, -0.035387031733989716, -0.03236571326851845, -0.02934439666569233, -0.02632308006286621, -0.023301761597394943, -0.020280444994568825, -0.017259128391742706, -0.014237809926271439, -0.01121649332344532, -0.008195174857974052, -0.005173858255147934, -0.0021525409538298845, 0.0008687763474881649, 0.0038900934159755707, 0.006911410950124264, 0.009932728484272957, 0.012954045087099075, 0.015975363552570343, 0.01899668015539646, 0.02201799675822258, 0.025039315223693848, 0.028060631826519966, 0.031081948429346085, 0.03410326689481735, 0.03712458163499832, 0.04014590382575989, 0.04316721856594086]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 2.0, 4.0, 4.0, 2.0, 4.0, 5.0, 7.0, 9.0, 21.0, 35.0, 43.0, 81.0, 83.0, 112.0, 112.0, 113.0, 84.0, 81.0, 68.0, 38.0, 29.0, 18.0, 7.0, 7.0, 7.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.28254222869873047, -0.2722442150115967, -0.2619462013244629, -0.2516481876373291, -0.2413501888513565, -0.23105217516422272, -0.22075417637825012, -0.21045616269111633, -0.20015814900398254, -0.18986013531684875, -0.17956212162971497, -0.16926412284374237, -0.15896610915660858, -0.1486680954694748, -0.1383700966835022, -0.1280720829963684, -0.11777406930923462, -0.10747605562210083, -0.09717804938554764, -0.08688004314899445, -0.07658202946186066, -0.06628401577472687, -0.055986009538173676, -0.04568800330162048, -0.035389989614486694, -0.025091979652643204, -0.014793969690799713, -0.0044959597289562225, 0.005802050232887268, 0.01610006019473076, 0.02639807015657425, 0.03669607639312744, 0.04699409008026123, 0.05729210004210472, 0.06759011000394821, 0.0778881162405014, 0.08818612992763519, 0.09848414361476898, 0.10878214985132217, 0.11908015608787537, 0.12937816977500916, 0.13967618346214294, 0.14997419714927673, 0.16027219593524933, 0.17057020962238312, 0.1808682233095169, 0.1911662220954895, 0.2014642357826233, 0.21176224946975708, 0.22206026315689087, 0.23235827684402466, 0.24265627562999725, 0.25295430421829224, 0.26325228810310364, 0.2735503017902374, 0.2838483154773712, 0.294146329164505, 0.3044443428516388, 0.3147423565387726, 0.32504037022590637, 0.3353383541107178, 0.34563636779785156, 0.35593438148498535, 0.36623239517211914, 0.37653040885925293]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 8.0, 3.0, 15.0, 12.0, 10.0, 23.0, 25.0, 27.0, 34.0, 54.0, 63.0, 84.0, 104.0, 141.0, 151.0, 228.0, 292.0, 381.0, 537.0, 742.0, 1141.0, 1592.0, 2605.0, 4664.0, 8837.0, 20527.0, 805958.0, 162476.0, 18022.0, 7606.0, 4170.0, 2543.0, 1638.0, 1072.0, 762.0, 506.0, 369.0, 279.0, 226.0, 148.0, 122.0, 76.0, 70.0, 63.0, 39.0, 29.0, 16.0, 13.0, 12.0, 15.0, 5.0, 10.0, 6.0, 5.0, 4.0, 4.0, 0.0, 2.0], "bins": [-0.06182861328125, -0.059950828552246094, -0.05807304382324219, -0.05619525909423828, -0.054317474365234375, -0.05243968963623047, -0.05056190490722656, -0.048684120178222656, -0.04680633544921875, -0.044928550720214844, -0.04305076599121094, -0.04117298126220703, -0.039295196533203125, -0.03741741180419922, -0.03553962707519531, -0.033661842346191406, -0.0317840576171875, -0.029906272888183594, -0.028028488159179688, -0.02615070343017578, -0.024272918701171875, -0.02239513397216797, -0.020517349243164062, -0.018639564514160156, -0.01676177978515625, -0.014883995056152344, -0.013006210327148438, -0.011128425598144531, -0.009250640869140625, -0.007372856140136719, -0.0054950714111328125, -0.0036172866821289062, -0.001739501953125, 0.00013828277587890625, 0.0020160675048828125, 0.0038938522338867188, 0.005771636962890625, 0.007649421691894531, 0.009527206420898438, 0.011404991149902344, 0.01328277587890625, 0.015160560607910156, 0.017038345336914062, 0.01891613006591797, 0.020793914794921875, 0.02267169952392578, 0.024549484252929688, 0.026427268981933594, 0.0283050537109375, 0.030182838439941406, 0.03206062316894531, 0.03393840789794922, 0.035816192626953125, 0.03769397735595703, 0.03957176208496094, 0.041449546813964844, 0.04332733154296875, 0.045205116271972656, 0.04708290100097656, 0.04896068572998047, 0.050838470458984375, 0.05271625518798828, 0.05459403991699219, 0.056471824645996094, 0.058349609375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 4.0, 4.0, 2.0, 4.0, 2.0, 7.0, 10.0, 16.0, 14.0, 13.0, 7.0, 103.0, 620.0, 82.0, 24.0, 13.0, 8.0, 8.0, 4.0, 12.0, 7.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0231781005859375, -0.022502422332763672, -0.021826744079589844, -0.021151065826416016, -0.020475387573242188, -0.01979970932006836, -0.01912403106689453, -0.018448352813720703, -0.017772674560546875, -0.017096996307373047, -0.01642131805419922, -0.01574563980102539, -0.015069961547851562, -0.014394283294677734, -0.013718605041503906, -0.013042926788330078, -0.01236724853515625, -0.011691570281982422, -0.011015892028808594, -0.010340213775634766, -0.009664535522460938, -0.00898885726928711, -0.008313179016113281, -0.007637500762939453, -0.006961822509765625, -0.006286144256591797, -0.005610466003417969, -0.004934787750244141, -0.0042591094970703125, -0.0035834312438964844, -0.0029077529907226562, -0.002232074737548828, -0.001556396484375, -0.0008807182312011719, -0.00020503997802734375, 0.0004706382751464844, 0.0011463165283203125, 0.0018219947814941406, 0.0024976730346679688, 0.003173351287841797, 0.003849029541015625, 0.004524707794189453, 0.005200386047363281, 0.005876064300537109, 0.0065517425537109375, 0.007227420806884766, 0.007903099060058594, 0.008578777313232422, 0.00925445556640625, 0.009930133819580078, 0.010605812072753906, 0.011281490325927734, 0.011957168579101562, 0.01263284683227539, 0.013308525085449219, 0.013984203338623047, 0.014659881591796875, 0.015335559844970703, 0.01601123809814453, 0.01668691635131836, 0.017362594604492188, 0.018038272857666016, 0.018713951110839844, 0.019389629364013672, 0.0200653076171875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 5.0, 5.0, 9.0, 12.0, 16.0, 24.0, 22.0, 36.0, 40.0, 42.0, 60.0, 81.0, 86.0, 110.0, 125.0, 188.0, 234.0, 516.0, 2499.0, 256256.0, 782890.0, 3481.0, 593.0, 296.0, 208.0, 140.0, 114.0, 89.0, 86.0, 54.0, 50.0, 36.0, 33.0, 27.0, 18.0, 11.0, 19.0, 9.0, 13.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16162109375, -0.15586090087890625, -0.1501007080078125, -0.14434051513671875, -0.138580322265625, -0.13282012939453125, -0.1270599365234375, -0.12129974365234375, -0.11553955078125, -0.10977935791015625, -0.1040191650390625, -0.09825897216796875, -0.092498779296875, -0.08673858642578125, -0.0809783935546875, -0.07521820068359375, -0.0694580078125, -0.06369781494140625, -0.0579376220703125, -0.05217742919921875, -0.046417236328125, -0.04065704345703125, -0.0348968505859375, -0.02913665771484375, -0.02337646484375, -0.01761627197265625, -0.0118560791015625, -0.00609588623046875, -0.000335693359375, 0.00542449951171875, 0.0111846923828125, 0.01694488525390625, 0.022705078125, 0.02846527099609375, 0.0342254638671875, 0.03998565673828125, 0.045745849609375, 0.05150604248046875, 0.0572662353515625, 0.06302642822265625, 0.06878662109375, 0.07454681396484375, 0.0803070068359375, 0.08606719970703125, 0.091827392578125, 0.09758758544921875, 0.1033477783203125, 0.10910797119140625, 0.1148681640625, 0.12062835693359375, 0.1263885498046875, 0.13214874267578125, 0.137908935546875, 0.14366912841796875, 0.1494293212890625, 0.15518951416015625, 0.16094970703125, 0.16670989990234375, 0.1724700927734375, 0.17823028564453125, 0.183990478515625, 0.18975067138671875, 0.1955108642578125, 0.20127105712890625, 0.20703125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 3.0, 4.0, 3.0, 9.0, 11.0, 16.0, 10.0, 19.0, 25.0, 14.0, 26.0, 29.0, 27.0, 37.0, 29.0, 36.0, 34.0, 55.0, 43.0, 52.0, 39.0, 43.0, 46.0, 43.0, 50.0, 42.0, 42.0, 34.0, 30.0, 20.0, 18.0, 17.0, 19.0, 16.0, 9.0, 5.0, 13.0, 6.0, 10.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0538330078125, -0.05191230773925781, -0.049991607666015625, -0.04807090759277344, -0.04615020751953125, -0.04422950744628906, -0.042308807373046875, -0.04038810729980469, -0.0384674072265625, -0.03654670715332031, -0.034626007080078125, -0.03270530700683594, -0.03078460693359375, -0.028863906860351562, -0.026943206787109375, -0.025022506713867188, -0.023101806640625, -0.021181106567382812, -0.019260406494140625, -0.017339706420898438, -0.01541900634765625, -0.013498306274414062, -0.011577606201171875, -0.009656906127929688, -0.0077362060546875, -0.0058155059814453125, -0.003894805908203125, -0.0019741058349609375, -5.340576171875e-05, 0.0018672943115234375, 0.003787994384765625, 0.0057086944580078125, 0.00762939453125, 0.009550094604492188, 0.011470794677734375, 0.013391494750976562, 0.01531219482421875, 0.017232894897460938, 0.019153594970703125, 0.021074295043945312, 0.0229949951171875, 0.024915695190429688, 0.026836395263671875, 0.028757095336914062, 0.03067779541015625, 0.03259849548339844, 0.034519195556640625, 0.03643989562988281, 0.038360595703125, 0.04028129577636719, 0.042201995849609375, 0.04412269592285156, 0.04604339599609375, 0.04796409606933594, 0.049884796142578125, 0.05180549621582031, 0.0537261962890625, 0.05564689636230469, 0.057567596435546875, 0.05948829650878906, 0.06140899658203125, 0.06332969665527344, 0.06525039672851562, 0.06717109680175781, 0.069091796875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 4.0, 8.0, 22.0, 21.0, 40.0, 61.0, 74.0, 159.0, 262.0, 446.0, 986.0, 2383.0, 10972.0, 313018.0, 701596.0, 13679.0, 2581.0, 1025.0, 511.0, 262.0, 159.0, 107.0, 54.0, 44.0, 25.0, 11.0, 16.0, 4.0, 7.0, 0.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002498626708984375, -0.00024273432791233063, -0.00023560598492622375, -0.00022847764194011688, -0.00022134929895401, -0.00021422095596790314, -0.00020709261298179626, -0.0001999642699956894, -0.00019283592700958252, -0.00018570758402347565, -0.00017857924103736877, -0.0001714508980512619, -0.00016432255506515503, -0.00015719421207904816, -0.00015006586909294128, -0.0001429375261068344, -0.00013580918312072754, -0.00012868084013462067, -0.0001215524971485138, -0.00011442415416240692, -0.00010729581117630005, -0.00010016746819019318, -9.30391252040863e-05, -8.591078221797943e-05, -7.878243923187256e-05, -7.165409624576569e-05, -6.452575325965881e-05, -5.739741027355194e-05, -5.026906728744507e-05, -4.3140724301338196e-05, -3.601238131523132e-05, -2.888403832912445e-05, -2.1755695343017578e-05, -1.4627352356910706e-05, -7.499009370803833e-06, -3.7066638469696045e-07, 6.757676601409912e-06, 1.3886019587516785e-05, 2.1014362573623657e-05, 2.814270555973053e-05, 3.52710485458374e-05, 4.2399391531944275e-05, 4.952773451805115e-05, 5.665607750415802e-05, 6.378442049026489e-05, 7.091276347637177e-05, 7.804110646247864e-05, 8.516944944858551e-05, 9.229779243469238e-05, 9.942613542079926e-05, 0.00010655447840690613, 0.000113682821393013, 0.00012081116437911987, 0.00012793950736522675, 0.00013506785035133362, 0.0001421961933374405, 0.00014932453632354736, 0.00015645287930965424, 0.0001635812222957611, 0.00017070956528186798, 0.00017783790826797485, 0.00018496625125408173, 0.0001920945942401886, 0.00019922293722629547, 0.00020635128021240234]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 8.0, 4.0, 6.0, 4.0, 11.0, 8.0, 22.0, 18.0, 22.0, 40.0, 38.0, 62.0, 51.0, 75.0, 93.0, 78.0, 70.0, 80.0, 80.0, 46.0, 47.0, 28.0, 23.0, 27.0, 13.0, 18.0, 11.0, 7.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.092952728271484e-06, -6.86105340719223e-06, -6.629154086112976e-06, -6.397254765033722e-06, -6.165355443954468e-06, -5.933456122875214e-06, -5.7015568017959595e-06, -5.469657480716705e-06, -5.237758159637451e-06, -5.005858838558197e-06, -4.773959517478943e-06, -4.542060196399689e-06, -4.3101608753204346e-06, -4.07826155424118e-06, -3.846362233161926e-06, -3.614462912082672e-06, -3.382563591003418e-06, -3.150664269924164e-06, -2.9187649488449097e-06, -2.6868656277656555e-06, -2.4549663066864014e-06, -2.2230669856071472e-06, -1.991167664527893e-06, -1.759268343448639e-06, -1.5273690223693848e-06, -1.2954697012901306e-06, -1.0635703802108765e-06, -8.316710591316223e-07, -5.997717380523682e-07, -3.67872416973114e-07, -1.3597309589385986e-07, 9.592622518539429e-08, 3.2782554626464844e-07, 5.597248673439026e-07, 7.916241884231567e-07, 1.0235235095024109e-06, 1.255422830581665e-06, 1.4873221516609192e-06, 1.7192214727401733e-06, 1.9511207938194275e-06, 2.1830201148986816e-06, 2.414919435977936e-06, 2.64681875705719e-06, 2.878718078136444e-06, 3.1106173992156982e-06, 3.3425167202949524e-06, 3.5744160413742065e-06, 3.8063153624534607e-06, 4.038214683532715e-06, 4.270114004611969e-06, 4.502013325691223e-06, 4.733912646770477e-06, 4.9658119678497314e-06, 5.197711288928986e-06, 5.42961061000824e-06, 5.661509931087494e-06, 5.893409252166748e-06, 6.125308573246002e-06, 6.357207894325256e-06, 6.5891072154045105e-06, 6.821006536483765e-06, 7.052905857563019e-06, 7.284805178642273e-06, 7.516704499721527e-06, 7.748603820800781e-06]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 13.0, 10.0, 11.0, 17.0, 24.0, 34.0, 40.0, 76.0, 92.0, 134.0, 212.0, 372.0, 1125.0, 69410.0, 973671.0, 2114.0, 449.0, 244.0, 139.0, 99.0, 61.0, 51.0, 33.0, 30.0, 13.0, 20.0, 12.0, 8.0, 7.0, 3.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0004417896270751953, -0.00042956694960594177, -0.00041734427213668823, -0.0004051215946674347, -0.00039289891719818115, -0.0003806762397289276, -0.00036845356225967407, -0.00035623088479042053, -0.000344008207321167, -0.00033178552985191345, -0.0003195628523826599, -0.00030734017491340637, -0.00029511749744415283, -0.0002828948199748993, -0.00027067214250564575, -0.0002584494650363922, -0.00024622678756713867, -0.00023400411009788513, -0.0002217814326286316, -0.00020955875515937805, -0.0001973360776901245, -0.00018511340022087097, -0.00017289072275161743, -0.0001606680452823639, -0.00014844536781311035, -0.0001362226903438568, -0.00012400001287460327, -0.00011177733540534973, -9.955465793609619e-05, -8.733198046684265e-05, -7.510930299758911e-05, -6.288662552833557e-05, -5.066394805908203e-05, -3.844127058982849e-05, -2.621859312057495e-05, -1.3995915651321411e-05, -1.773238182067871e-06, 1.0449439287185669e-05, 2.267211675643921e-05, 3.489479422569275e-05, 4.711747169494629e-05, 5.934014916419983e-05, 7.156282663345337e-05, 8.378550410270691e-05, 9.600818157196045e-05, 0.00010823085904121399, 0.00012045353651046753, 0.00013267621397972107, 0.0001448988914489746, 0.00015712156891822815, 0.0001693442463874817, 0.00018156692385673523, 0.00019378960132598877, 0.0002060122787952423, 0.00021823495626449585, 0.0002304576337337494, 0.00024268031120300293, 0.00025490298867225647, 0.00026712566614151, 0.00027934834361076355, 0.0002915710210800171, 0.00030379369854927063, 0.00031601637601852417, 0.0003282390534877777, 0.00034046173095703125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 7.0, 4.0, 5.0, 14.0, 14.0, 16.0, 18.0, 34.0, 31.0, 55.0, 63.0, 60.0, 89.0, 80.0, 90.0, 85.0, 64.0, 64.0, 51.0, 36.0, 20.0, 19.0, 19.0, 17.0, 5.0, 13.0, 5.0, 6.0, 3.0, 0.0, 1.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00014710426330566406, -0.0001430325210094452, -0.00013896077871322632, -0.00013488903641700745, -0.00013081729412078857, -0.0001267455518245697, -0.00012267380952835083, -0.00011860206723213196, -0.00011453032493591309, -0.00011045858263969421, -0.00010638684034347534, -0.00010231509804725647, -9.82433557510376e-05, -9.417161345481873e-05, -9.009987115859985e-05, -8.602812886238098e-05, -8.195638656616211e-05, -7.788464426994324e-05, -7.381290197372437e-05, -6.974115967750549e-05, -6.566941738128662e-05, -6.159767508506775e-05, -5.752593278884888e-05, -5.3454190492630005e-05, -4.938244819641113e-05, -4.531070590019226e-05, -4.123896360397339e-05, -3.7167221307754517e-05, -3.3095479011535645e-05, -2.9023736715316772e-05, -2.49519944190979e-05, -2.088025212287903e-05, -1.6808509826660156e-05, -1.2736767530441284e-05, -8.665025234222412e-06, -4.59328293800354e-06, -5.21540641784668e-07, 3.550201654434204e-06, 7.621943950653076e-06, 1.1693686246871948e-05, 1.576542854309082e-05, 1.9837170839309692e-05, 2.3908913135528564e-05, 2.7980655431747437e-05, 3.205239772796631e-05, 3.612414002418518e-05, 4.019588232040405e-05, 4.4267624616622925e-05, 4.83393669128418e-05, 5.241110920906067e-05, 5.648285150527954e-05, 6.055459380149841e-05, 6.462633609771729e-05, 6.869807839393616e-05, 7.276982069015503e-05, 7.68415629863739e-05, 8.091330528259277e-05, 8.498504757881165e-05, 8.905678987503052e-05, 9.312853217124939e-05, 9.720027446746826e-05, 0.00010127201676368713, 0.000105343759059906, 0.00010941550135612488, 0.00011348724365234375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 226.0, 782.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6853296756744385, -1.6479500532150269, -1.6105704307556152, -1.5731908082962036, -1.535811185836792, -1.4984315633773804, -1.4610519409179688, -1.4236721992492676, -1.3862926959991455, -1.3489130735397339, -1.3115334510803223, -1.2741538286209106, -1.236774206161499, -1.1993945837020874, -1.1620149612426758, -1.1246352195739746, -1.087255597114563, -1.0498759746551514, -1.0124963521957397, -0.9751167297363281, -0.9377371072769165, -0.9003574848175049, -0.8629778027534485, -0.8255981802940369, -0.7882185578346252, -0.7508389353752136, -0.713459312915802, -0.6760796904563904, -0.638700008392334, -0.6013203859329224, -0.5639407634735107, -0.5265611410140991, -0.48918139934539795, -0.45180177688598633, -0.4144221544265747, -0.3770425021648407, -0.3396628797054291, -0.30228325724601746, -0.26490360498428345, -0.22752398252487183, -0.1901443600654602, -0.15276473760604858, -0.11538510024547577, -0.07800547033548355, -0.04062584042549133, -0.003246217966079712, 0.0341334193944931, 0.07151305675506592, 0.10889267921447754, 0.14627230167388916, 0.18365193903446198, 0.2210315763950348, 0.2584111988544464, 0.29579082131385803, 0.33317047357559204, 0.37055009603500366, 0.4079297184944153, 0.4453093409538269, 0.4826889634132385, 0.5200685858726501, 0.5574482679367065, 0.5948278903961182, 0.6322075128555298, 0.6695871353149414, 0.706966757774353]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 9.0, 12.0, 14.0, 15.0, 12.0, 27.0, 30.0, 33.0, 47.0, 40.0, 55.0, 61.0, 61.0, 67.0, 80.0, 60.0, 59.0, 46.0, 54.0, 38.0, 47.0, 32.0, 28.0, 13.0, 18.0, 9.0, 8.0, 11.0, 4.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6014357805252075, -0.5824732780456543, -0.5635108351707458, -0.5445483922958374, -0.5255858898162842, -0.506623387336731, -0.4876609444618225, -0.4686984717845917, -0.44973599910736084, -0.43077352643013, -0.41181105375289917, -0.39284858107566833, -0.3738861083984375, -0.35492363572120667, -0.33596116304397583, -0.316998690366745, -0.29803621768951416, -0.2790737450122833, -0.2601112723350525, -0.24114879965782166, -0.22218632698059082, -0.20322385430335999, -0.18426138162612915, -0.16529890894889832, -0.14633643627166748, -0.12737396359443665, -0.10841149091720581, -0.08944901823997498, -0.07048654556274414, -0.051524072885513306, -0.03256160020828247, -0.013599127531051636, 0.005363285541534424, 0.02432575821876526, 0.043288230895996094, 0.06225070357322693, 0.08121317625045776, 0.1001756489276886, 0.11913812160491943, 0.13810059428215027, 0.1570630669593811, 0.17602553963661194, 0.19498801231384277, 0.2139504849910736, 0.23291295766830444, 0.2518754303455353, 0.2708379030227661, 0.28980037569999695, 0.3087628483772278, 0.3277253210544586, 0.34668779373168945, 0.3656502664089203, 0.3846127390861511, 0.40357521176338196, 0.4225376844406128, 0.44150015711784363, 0.46046262979507446, 0.4794251024723053, 0.49838757514953613, 0.5173500776290894, 0.5363125205039978, 0.5552749633789062, 0.5742374658584595, 0.5931999683380127, 0.6121624112129211]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 0.0, 4.0, 7.0, 5.0, 3.0, 5.0, 14.0, 27.0, 51.0, 90.0, 190.0, 505.0, 1989.0, 4182162.0, 8010.0, 803.0, 221.0, 74.0, 32.0, 21.0, 16.0, 9.0, 7.0, 10.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38818359375, -0.3766822814941406, -0.36518096923828125, -0.3536796569824219, -0.3421783447265625, -0.3306770324707031, -0.31917572021484375, -0.3076744079589844, -0.296173095703125, -0.2846717834472656, -0.27317047119140625, -0.2616691589355469, -0.2501678466796875, -0.23866653442382812, -0.22716522216796875, -0.21566390991210938, -0.20416259765625, -0.19266128540039062, -0.18115997314453125, -0.16965866088867188, -0.1581573486328125, -0.14665603637695312, -0.13515472412109375, -0.12365341186523438, -0.112152099609375, -0.10065078735351562, -0.08914947509765625, -0.07764816284179688, -0.0661468505859375, -0.054645538330078125, -0.04314422607421875, -0.031642913818359375, -0.0201416015625, -0.008640289306640625, 0.00286102294921875, 0.014362335205078125, 0.0258636474609375, 0.037364959716796875, 0.04886627197265625, 0.060367584228515625, 0.071868896484375, 0.08337020874023438, 0.09487152099609375, 0.10637283325195312, 0.1178741455078125, 0.12937545776367188, 0.14087677001953125, 0.15237808227539062, 0.16387939453125, 0.17538070678710938, 0.18688201904296875, 0.19838333129882812, 0.2098846435546875, 0.22138595581054688, 0.23288726806640625, 0.24438858032226562, 0.255889892578125, 0.2673912048339844, 0.27889251708984375, 0.2903938293457031, 0.3018951416015625, 0.3133964538574219, 0.32489776611328125, 0.3363990783691406, 0.347900390625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 0.0, 3.0, 6.0, 2.0, 2.0, 2.0, 4.0, 6.0, 15.0, 19.0, 11.0, 15.0, 27.0, 420.0, 335.0, 34.0, 20.0, 8.0, 9.0, 7.0, 8.0, 8.0, 6.0, 9.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0225830078125, -0.021914243698120117, -0.021245479583740234, -0.02057671546936035, -0.01990795135498047, -0.019239187240600586, -0.018570423126220703, -0.01790165901184082, -0.017232894897460938, -0.016564130783081055, -0.015895366668701172, -0.015226602554321289, -0.014557838439941406, -0.013889074325561523, -0.01322031021118164, -0.012551546096801758, -0.011882781982421875, -0.011214017868041992, -0.01054525375366211, -0.009876489639282227, -0.009207725524902344, -0.008538961410522461, -0.007870197296142578, -0.007201433181762695, -0.0065326690673828125, -0.00586390495300293, -0.005195140838623047, -0.004526376724243164, -0.0038576126098632812, -0.0031888484954833984, -0.0025200843811035156, -0.0018513202667236328, -0.00118255615234375, -0.0005137920379638672, 0.00015497207641601562, 0.0008237361907958984, 0.0014925003051757812, 0.002161264419555664, 0.002830028533935547, 0.0034987926483154297, 0.0041675567626953125, 0.004836320877075195, 0.005505084991455078, 0.006173849105834961, 0.006842613220214844, 0.0075113773345947266, 0.00818014144897461, 0.008848905563354492, 0.009517669677734375, 0.010186433792114258, 0.01085519790649414, 0.011523962020874023, 0.012192726135253906, 0.012861490249633789, 0.013530254364013672, 0.014199018478393555, 0.014867782592773438, 0.01553654670715332, 0.016205310821533203, 0.016874074935913086, 0.01754283905029297, 0.01821160316467285, 0.018880367279052734, 0.019549131393432617, 0.0202178955078125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 5.0, 2.0, 7.0, 12.0, 9.0, 8.0, 16.0, 25.0, 19.0, 47.0, 39.0, 69.0, 113.0, 204.0, 427.0, 2190.0, 4039359.0, 148879.0, 1856.0, 429.0, 189.0, 107.0, 59.0, 40.0, 36.0, 16.0, 28.0, 15.0, 8.0, 11.0, 13.0, 8.0, 3.0, 6.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.23388671875, -0.22699928283691406, -0.22011184692382812, -0.2132244110107422, -0.20633697509765625, -0.1994495391845703, -0.19256210327148438, -0.18567466735839844, -0.1787872314453125, -0.17189979553222656, -0.16501235961914062, -0.1581249237060547, -0.15123748779296875, -0.1443500518798828, -0.13746261596679688, -0.13057518005371094, -0.123687744140625, -0.11680030822753906, -0.10991287231445312, -0.10302543640136719, -0.09613800048828125, -0.08925056457519531, -0.08236312866210938, -0.07547569274902344, -0.0685882568359375, -0.06170082092285156, -0.054813385009765625, -0.04792594909667969, -0.04103851318359375, -0.03415107727050781, -0.027263641357421875, -0.020376205444335938, -0.01348876953125, -0.0066013336181640625, 0.000286102294921875, 0.0071735382080078125, 0.01406097412109375, 0.020948410034179688, 0.027835845947265625, 0.03472328186035156, 0.0416107177734375, 0.04849815368652344, 0.055385589599609375, 0.06227302551269531, 0.06916046142578125, 0.07604789733886719, 0.08293533325195312, 0.08982276916503906, 0.096710205078125, 0.10359764099121094, 0.11048507690429688, 0.11737251281738281, 0.12425994873046875, 0.1311473846435547, 0.13803482055664062, 0.14492225646972656, 0.1518096923828125, 0.15869712829589844, 0.16558456420898438, 0.1724720001220703, 0.17935943603515625, 0.1862468719482422, 0.19313430786132812, 0.20002174377441406, 0.2069091796875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 2.0, 8.0, 6.0, 5.0, 14.0, 8.0, 16.0, 19.0, 19.0, 24.0, 70.0, 3139.0, 496.0, 66.0, 31.0, 22.0, 26.0, 19.0, 14.0, 8.0, 6.0, 12.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0377197265625, -0.03660869598388672, -0.03549766540527344, -0.034386634826660156, -0.033275604248046875, -0.032164573669433594, -0.031053543090820312, -0.02994251251220703, -0.02883148193359375, -0.02772045135498047, -0.026609420776367188, -0.025498390197753906, -0.024387359619140625, -0.023276329040527344, -0.022165298461914062, -0.02105426788330078, -0.0199432373046875, -0.01883220672607422, -0.017721176147460938, -0.016610145568847656, -0.015499114990234375, -0.014388084411621094, -0.013277053833007812, -0.012166023254394531, -0.01105499267578125, -0.009943962097167969, -0.008832931518554688, -0.007721900939941406, -0.006610870361328125, -0.005499839782714844, -0.0043888092041015625, -0.0032777786254882812, -0.002166748046875, -0.0010557174682617188, 5.53131103515625e-05, 0.0011663436889648438, 0.002277374267578125, 0.0033884048461914062, 0.0044994354248046875, 0.005610466003417969, 0.00672149658203125, 0.007832527160644531, 0.008943557739257812, 0.010054588317871094, 0.011165618896484375, 0.012276649475097656, 0.013387680053710938, 0.014498710632324219, 0.0156097412109375, 0.01672077178955078, 0.017831802368164062, 0.018942832946777344, 0.020053863525390625, 0.021164894104003906, 0.022275924682617188, 0.02338695526123047, 0.02449798583984375, 0.02560901641845703, 0.026720046997070312, 0.027831077575683594, 0.028942108154296875, 0.030053138732910156, 0.031164169311523438, 0.03227519989013672, 0.03338623046875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 107.0, 910.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9734079837799072, -0.9554080963134766, -0.9374082088470459, -0.9194082617759705, -0.9014083743095398, -0.8834084868431091, -0.8654085397720337, -0.847408652305603, -0.8294087648391724, -0.8114088773727417, -0.793408989906311, -0.7754090428352356, -0.7574091553688049, -0.7394092679023743, -0.7214093208312988, -0.7034094333648682, -0.6854095458984375, -0.6674096584320068, -0.6494097709655762, -0.6314098238945007, -0.6134099364280701, -0.5954100489616394, -0.577410101890564, -0.5594102144241333, -0.5414103269577026, -0.523410439491272, -0.5054105520248413, -0.48741060495376587, -0.4694107174873352, -0.45141083002090454, -0.4334109127521515, -0.41541099548339844, -0.3974111080169678, -0.3794112205505371, -0.36141130328178406, -0.343411386013031, -0.32541149854660034, -0.3074116110801697, -0.2894116938114166, -0.2714117765426636, -0.2534118890762329, -0.23541198670864105, -0.2174120843410492, -0.19941218197345734, -0.18141227960586548, -0.16341237723827362, -0.14541247487068176, -0.1274125725030899, -0.10941268503665924, -0.09141278266906738, -0.07341288030147552, -0.05541297793388367, -0.03741307556629181, -0.01941317319869995, -0.0014132708311080933, 0.016586631536483765, 0.03458653390407562, 0.05258643627166748, 0.07058633863925934, 0.0885862410068512, 0.10658614337444305, 0.12458604574203491, 0.14258594810962677, 0.16058585047721863, 0.17858575284481049]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 9.0, 9.0, 6.0, 16.0, 30.0, 21.0, 34.0, 42.0, 59.0, 57.0, 71.0, 78.0, 77.0, 78.0, 77.0, 76.0, 65.0, 46.0, 38.0, 31.0, 28.0, 10.0, 11.0, 8.0, 8.0, 1.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11659932136535645, -0.1123775988817215, -0.10815587639808655, -0.1039341539144516, -0.09971243143081665, -0.0954907089471817, -0.09126899391412735, -0.0870472714304924, -0.08282554894685745, -0.0786038264632225, -0.07438210397958755, -0.0701603814959526, -0.06593866646289825, -0.06171694025397301, -0.05749522149562836, -0.05327349901199341, -0.04905177652835846, -0.04483005404472351, -0.04060833156108856, -0.03638661280274391, -0.03216489031910896, -0.027943167835474014, -0.023721447214484215, -0.019499726593494415, -0.015278004109859467, -0.011056282557547092, -0.006834561005234718, -0.002612839452922344, 0.00160888209939003, 0.005830604583024979, 0.010052325204014778, 0.014274045825004578, 0.018495768308639526, 0.022717490792274475, 0.026939211413264275, 0.031160932034254074, 0.03538265451788902, 0.03960437700152397, 0.04382609575986862, 0.04804781824350357, 0.05226954072713852, 0.05649126321077347, 0.06071298569440842, 0.06493470817804337, 0.06915642321109772, 0.07337814569473267, 0.07759986817836761, 0.08182159066200256, 0.08604331314563751, 0.09026503562927246, 0.09448675811290741, 0.09870848059654236, 0.10293020308017731, 0.10715192556381226, 0.11137364059686661, 0.11559536308050156, 0.1198170855641365, 0.12403880804777145, 0.1282605230808258, 0.13248224556446075, 0.1367039680480957, 0.14092569053173065, 0.1451474130153656, 0.14936913549900055, 0.1535908579826355]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 11.0, 3.0, 5.0, 7.0, 17.0, 25.0, 27.0, 53.0, 60.0, 96.0, 122.0, 148.0, 245.0, 342.0, 550.0, 857.0, 1300.0, 2229.0, 3990.0, 8308.0, 22522.0, 883313.0, 93734.0, 15604.0, 6545.0, 3429.0, 1803.0, 1071.0, 709.0, 451.0, 278.0, 198.0, 138.0, 94.0, 80.0, 63.0, 33.0, 27.0, 11.0, 10.0, 14.0, 8.0, 11.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.054718017578125, -0.05294370651245117, -0.051169395446777344, -0.049395084381103516, -0.04762077331542969, -0.04584646224975586, -0.04407215118408203, -0.0422978401184082, -0.040523529052734375, -0.03874921798706055, -0.03697490692138672, -0.03520059585571289, -0.03342628479003906, -0.031651973724365234, -0.029877662658691406, -0.028103351593017578, -0.02632904052734375, -0.024554729461669922, -0.022780418395996094, -0.021006107330322266, -0.019231796264648438, -0.01745748519897461, -0.01568317413330078, -0.013908863067626953, -0.012134552001953125, -0.010360240936279297, -0.008585929870605469, -0.006811618804931641, -0.0050373077392578125, -0.0032629966735839844, -0.0014886856079101562, 0.0002856254577636719, 0.0020599365234375, 0.003834247589111328, 0.005608558654785156, 0.007382869720458984, 0.009157180786132812, 0.01093149185180664, 0.012705802917480469, 0.014480113983154297, 0.016254425048828125, 0.018028736114501953, 0.01980304718017578, 0.02157735824584961, 0.023351669311523438, 0.025125980377197266, 0.026900291442871094, 0.028674602508544922, 0.03044891357421875, 0.03222322463989258, 0.033997535705566406, 0.035771846771240234, 0.03754615783691406, 0.03932046890258789, 0.04109477996826172, 0.04286909103393555, 0.044643402099609375, 0.0464177131652832, 0.04819202423095703, 0.04996633529663086, 0.05174064636230469, 0.053514957427978516, 0.055289268493652344, 0.05706357955932617, 0.058837890625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 3.0, 4.0, 0.0, 3.0, 2.0, 5.0, 2.0, 2.0, 4.0, 5.0, 12.0, 15.0, 17.0, 9.0, 18.0, 164.0, 545.0, 87.0, 23.0, 12.0, 9.0, 5.0, 6.0, 13.0, 8.0, 6.0, 4.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0216827392578125, -0.02102971076965332, -0.02037668228149414, -0.01972365379333496, -0.01907062530517578, -0.0184175968170166, -0.017764568328857422, -0.017111539840698242, -0.016458511352539062, -0.015805482864379883, -0.015152454376220703, -0.014499425888061523, -0.013846397399902344, -0.013193368911743164, -0.012540340423583984, -0.011887311935424805, -0.011234283447265625, -0.010581254959106445, -0.009928226470947266, -0.009275197982788086, -0.008622169494628906, -0.007969141006469727, -0.007316112518310547, -0.006663084030151367, -0.0060100555419921875, -0.005357027053833008, -0.004703998565673828, -0.0040509700775146484, -0.0033979415893554688, -0.002744913101196289, -0.0020918846130371094, -0.0014388561248779297, -0.00078582763671875, -0.0001327991485595703, 0.0005202293395996094, 0.001173257827758789, 0.0018262863159179688, 0.0024793148040771484, 0.003132343292236328, 0.003785371780395508, 0.0044384002685546875, 0.005091428756713867, 0.005744457244873047, 0.0063974857330322266, 0.007050514221191406, 0.007703542709350586, 0.008356571197509766, 0.009009599685668945, 0.009662628173828125, 0.010315656661987305, 0.010968685150146484, 0.011621713638305664, 0.012274742126464844, 0.012927770614624023, 0.013580799102783203, 0.014233827590942383, 0.014886856079101562, 0.015539884567260742, 0.016192913055419922, 0.0168459415435791, 0.01749897003173828, 0.01815199851989746, 0.01880502700805664, 0.01945805549621582, 0.020111083984375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 7.0, 7.0, 13.0, 13.0, 24.0, 24.0, 21.0, 27.0, 33.0, 45.0, 38.0, 46.0, 60.0, 85.0, 102.0, 105.0, 119.0, 187.0, 228.0, 373.0, 795.0, 4118.0, 292039.0, 741435.0, 5957.0, 966.0, 448.0, 215.0, 166.0, 130.0, 118.0, 101.0, 99.0, 58.0, 55.0, 50.0, 46.0, 36.0, 23.0, 28.0, 23.0, 20.0, 15.0, 16.0, 6.0, 10.0, 7.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.1275634765625, -0.12358474731445312, -0.11960601806640625, -0.11562728881835938, -0.1116485595703125, -0.10766983032226562, -0.10369110107421875, -0.09971237182617188, -0.095733642578125, -0.09175491333007812, -0.08777618408203125, -0.08379745483398438, -0.0798187255859375, -0.07583999633789062, -0.07186126708984375, -0.06788253784179688, -0.06390380859375, -0.059925079345703125, -0.05594635009765625, -0.051967620849609375, -0.0479888916015625, -0.044010162353515625, -0.04003143310546875, -0.036052703857421875, -0.032073974609375, -0.028095245361328125, -0.02411651611328125, -0.020137786865234375, -0.0161590576171875, -0.012180328369140625, -0.00820159912109375, -0.004222869873046875, -0.000244140625, 0.003734588623046875, 0.00771331787109375, 0.011692047119140625, 0.0156707763671875, 0.019649505615234375, 0.02362823486328125, 0.027606964111328125, 0.031585693359375, 0.035564422607421875, 0.03954315185546875, 0.043521881103515625, 0.0475006103515625, 0.051479339599609375, 0.05545806884765625, 0.059436798095703125, 0.06341552734375, 0.06739425659179688, 0.07137298583984375, 0.07535171508789062, 0.0793304443359375, 0.08330917358398438, 0.08728790283203125, 0.09126663208007812, 0.095245361328125, 0.09922409057617188, 0.10320281982421875, 0.10718154907226562, 0.1111602783203125, 0.11513900756835938, 0.11911773681640625, 0.12309646606445312, 0.1270751953125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 4.0, 8.0, 6.0, 9.0, 7.0, 8.0, 9.0, 13.0, 7.0, 15.0, 17.0, 29.0, 24.0, 22.0, 41.0, 33.0, 36.0, 47.0, 35.0, 47.0, 54.0, 45.0, 46.0, 39.0, 53.0, 36.0, 29.0, 28.0, 24.0, 34.0, 28.0, 28.0, 27.0, 11.0, 23.0, 15.0, 16.0, 3.0, 9.0, 8.0, 13.0, 5.0, 3.0, 2.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.058685302734375, -0.05681800842285156, -0.054950714111328125, -0.05308341979980469, -0.05121612548828125, -0.04934883117675781, -0.047481536865234375, -0.04561424255371094, -0.0437469482421875, -0.04187965393066406, -0.040012359619140625, -0.03814506530761719, -0.03627777099609375, -0.03441047668457031, -0.032543182373046875, -0.030675888061523438, -0.02880859375, -0.026941299438476562, -0.025074005126953125, -0.023206710815429688, -0.02133941650390625, -0.019472122192382812, -0.017604827880859375, -0.015737533569335938, -0.0138702392578125, -0.012002944946289062, -0.010135650634765625, -0.008268356323242188, -0.00640106201171875, -0.0045337677001953125, -0.002666473388671875, -0.0007991790771484375, 0.001068115234375, 0.0029354095458984375, 0.004802703857421875, 0.0066699981689453125, 0.00853729248046875, 0.010404586791992188, 0.012271881103515625, 0.014139175415039062, 0.0160064697265625, 0.017873764038085938, 0.019741058349609375, 0.021608352661132812, 0.02347564697265625, 0.025342941284179688, 0.027210235595703125, 0.029077529907226562, 0.03094482421875, 0.03281211853027344, 0.034679412841796875, 0.03654670715332031, 0.03841400146484375, 0.04028129577636719, 0.042148590087890625, 0.04401588439941406, 0.0458831787109375, 0.04775047302246094, 0.049617767333984375, 0.05148506164550781, 0.05335235595703125, 0.05521965026855469, 0.057086944580078125, 0.05895423889160156, 0.060821533203125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 8.0, 7.0, 10.0, 11.0, 22.0, 23.0, 31.0, 47.0, 82.0, 115.0, 170.0, 266.0, 462.0, 804.0, 1541.0, 3549.0, 9687.0, 38324.0, 697813.0, 254614.0, 27134.0, 7634.0, 2960.0, 1349.0, 724.0, 395.0, 265.0, 144.0, 111.0, 70.0, 47.0, 31.0, 33.0, 6.0, 15.0, 15.0, 10.0, 5.0, 6.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00010824203491210938, -0.00010514073073863983, -0.00010203942656517029, -9.893812239170074e-05, -9.58368182182312e-05, -9.273551404476166e-05, -8.963420987129211e-05, -8.653290569782257e-05, -8.343160152435303e-05, -8.033029735088348e-05, -7.722899317741394e-05, -7.41276890039444e-05, -7.102638483047485e-05, -6.792508065700531e-05, -6.482377648353577e-05, -6.172247231006622e-05, -5.862116813659668e-05, -5.5519863963127136e-05, -5.241855978965759e-05, -4.931725561618805e-05, -4.6215951442718506e-05, -4.311464726924896e-05, -4.001334309577942e-05, -3.6912038922309875e-05, -3.381073474884033e-05, -3.070943057537079e-05, -2.7608126401901245e-05, -2.45068222284317e-05, -2.1405518054962158e-05, -1.8304213881492615e-05, -1.5202909708023071e-05, -1.2101605534553528e-05, -9.000301361083984e-06, -5.898997187614441e-06, -2.7976930141448975e-06, 3.03611159324646e-07, 3.4049153327941895e-06, 6.506219506263733e-06, 9.607523679733276e-06, 1.270882785320282e-05, 1.5810132026672363e-05, 1.8911436200141907e-05, 2.201274037361145e-05, 2.5114044547080994e-05, 2.8215348720550537e-05, 3.131665289402008e-05, 3.4417957067489624e-05, 3.751926124095917e-05, 4.062056541442871e-05, 4.3721869587898254e-05, 4.68231737613678e-05, 4.992447793483734e-05, 5.3025782108306885e-05, 5.612708628177643e-05, 5.922839045524597e-05, 6.232969462871552e-05, 6.543099880218506e-05, 6.85323029756546e-05, 7.163360714912415e-05, 7.473491132259369e-05, 7.783621549606323e-05, 8.093751966953278e-05, 8.403882384300232e-05, 8.714012801647186e-05, 9.02414321899414e-05]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 3.0, 2.0, 6.0, 8.0, 3.0, 7.0, 24.0, 18.0, 17.0, 27.0, 51.0, 47.0, 70.0, 68.0, 85.0, 65.0, 88.0, 78.0, 49.0, 56.0, 43.0, 38.0, 32.0, 32.0, 21.0, 19.0, 8.0, 8.0, 7.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.649162292480469e-06, -4.4871121644973755e-06, -4.325062036514282e-06, -4.163011908531189e-06, -4.000961780548096e-06, -3.8389116525650024e-06, -3.676861524581909e-06, -3.514811396598816e-06, -3.3527612686157227e-06, -3.1907111406326294e-06, -3.028661012649536e-06, -2.866610884666443e-06, -2.7045607566833496e-06, -2.5425106287002563e-06, -2.380460500717163e-06, -2.21841037273407e-06, -2.0563602447509766e-06, -1.8943101167678833e-06, -1.73225998878479e-06, -1.5702098608016968e-06, -1.4081597328186035e-06, -1.2461096048355103e-06, -1.084059476852417e-06, -9.220093488693237e-07, -7.599592208862305e-07, -5.979090929031372e-07, -4.3585896492004395e-07, -2.738088369369507e-07, -1.1175870895385742e-07, 5.029141902923584e-08, 2.123415470123291e-07, 3.7439167499542236e-07, 5.364418029785156e-07, 6.984919309616089e-07, 8.605420589447021e-07, 1.0225921869277954e-06, 1.1846423149108887e-06, 1.346692442893982e-06, 1.5087425708770752e-06, 1.6707926988601685e-06, 1.8328428268432617e-06, 1.994892954826355e-06, 2.1569430828094482e-06, 2.3189932107925415e-06, 2.4810433387756348e-06, 2.643093466758728e-06, 2.8051435947418213e-06, 2.9671937227249146e-06, 3.129243850708008e-06, 3.291293978691101e-06, 3.4533441066741943e-06, 3.6153942346572876e-06, 3.777444362640381e-06, 3.939494490623474e-06, 4.101544618606567e-06, 4.263594746589661e-06, 4.425644874572754e-06, 4.587695002555847e-06, 4.7497451305389404e-06, 4.911795258522034e-06, 5.073845386505127e-06, 5.23589551448822e-06, 5.3979456424713135e-06, 5.559995770454407e-06, 5.7220458984375e-06]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 12.0, 17.0, 21.0, 48.0, 66.0, 109.0, 207.0, 332.0, 1157.0, 846193.0, 198523.0, 1043.0, 321.0, 199.0, 111.0, 68.0, 46.0, 22.0, 19.0, 11.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003566741943359375, -0.0003455132246017456, -0.0003343522548675537, -0.0003231912851333618, -0.0003120303153991699, -0.00030086934566497803, -0.00028970837593078613, -0.00027854740619659424, -0.00026738643646240234, -0.00025622546672821045, -0.00024506449699401855, -0.00023390352725982666, -0.00022274255752563477, -0.00021158158779144287, -0.00020042061805725098, -0.00018925964832305908, -0.0001780986785888672, -0.0001669377088546753, -0.0001557767391204834, -0.0001446157693862915, -0.0001334547996520996, -0.00012229382991790771, -0.00011113286018371582, -9.997189044952393e-05, -8.881092071533203e-05, -7.764995098114014e-05, -6.648898124694824e-05, -5.532801151275635e-05, -4.416704177856445e-05, -3.300607204437256e-05, -2.1845102310180664e-05, -1.068413257598877e-05, 4.76837158203125e-07, 1.163780689239502e-05, 2.2798776626586914e-05, 3.395974636077881e-05, 4.51207160949707e-05, 5.62816858291626e-05, 6.744265556335449e-05, 7.860362529754639e-05, 8.976459503173828e-05, 0.00010092556476593018, 0.00011208653450012207, 0.00012324750423431396, 0.00013440847396850586, 0.00014556944370269775, 0.00015673041343688965, 0.00016789138317108154, 0.00017905235290527344, 0.00019021332263946533, 0.00020137429237365723, 0.00021253526210784912, 0.00022369623184204102, 0.0002348572015762329, 0.0002460181713104248, 0.0002571791410446167, 0.0002683401107788086, 0.0002795010805130005, 0.0002906620502471924, 0.0003018230199813843, 0.00031298398971557617, 0.00032414495944976807, 0.00033530592918395996, 0.00034646689891815186, 0.00035762786865234375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 9.0, 10.0, 15.0, 15.0, 38.0, 53.0, 58.0, 103.0, 122.0, 136.0, 126.0, 107.0, 54.0, 58.0, 33.0, 23.0, 17.0, 7.0, 8.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00017142295837402344, -0.00016671046614646912, -0.0001619979739189148, -0.00015728548169136047, -0.00015257298946380615, -0.00014786049723625183, -0.0001431480050086975, -0.0001384355127811432, -0.00013372302055358887, -0.00012901052832603455, -0.00012429803609848022, -0.0001195855438709259, -0.00011487305164337158, -0.00011016055941581726, -0.00010544806718826294, -0.00010073557496070862, -9.60230827331543e-05, -9.131059050559998e-05, -8.659809827804565e-05, -8.188560605049133e-05, -7.717311382293701e-05, -7.246062159538269e-05, -6.774812936782837e-05, -6.303563714027405e-05, -5.8323144912719727e-05, -5.3610652685165405e-05, -4.8898160457611084e-05, -4.418566823005676e-05, -3.947317600250244e-05, -3.476068377494812e-05, -3.00481915473938e-05, -2.5335699319839478e-05, -2.0623207092285156e-05, -1.5910714864730835e-05, -1.1198222637176514e-05, -6.485730409622192e-06, -1.773238182067871e-06, 2.93925404548645e-06, 7.651746273040771e-06, 1.2364238500595093e-05, 1.7076730728149414e-05, 2.1789222955703735e-05, 2.6501715183258057e-05, 3.121420741081238e-05, 3.59266996383667e-05, 4.063919186592102e-05, 4.535168409347534e-05, 5.006417632102966e-05, 5.4776668548583984e-05, 5.9489160776138306e-05, 6.420165300369263e-05, 6.891414523124695e-05, 7.362663745880127e-05, 7.833912968635559e-05, 8.305162191390991e-05, 8.776411414146423e-05, 9.247660636901855e-05, 9.718909859657288e-05, 0.0001019015908241272, 0.00010661408305168152, 0.00011132657527923584, 0.00011603906750679016, 0.00012075155973434448, 0.0001254640519618988, 0.00013017654418945312]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 37.0, 964.0, 16.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.892841100692749, -0.8576000928878784, -0.822359025478363, -0.7871179580688477, -0.751876950263977, -0.7166359424591064, -0.6813948750495911, -0.6461538076400757, -0.6109127998352051, -0.5756717920303345, -0.5404307246208191, -0.5051896572113037, -0.4699486494064331, -0.4347076117992401, -0.3994665741920471, -0.3642255365848541, -0.32898449897766113, -0.29374346137046814, -0.25850242376327515, -0.22326138615608215, -0.18802034854888916, -0.15277931094169617, -0.11753827333450317, -0.08229723572731018, -0.04705619812011719, -0.011815160512924194, 0.0234258770942688, 0.05866691470146179, 0.09390795230865479, 0.12914898991584778, 0.16439002752304077, 0.19963106513023376, 0.23487210273742676, 0.27011314034461975, 0.30535417795181274, 0.34059521555900574, 0.37583625316619873, 0.4110772907733917, 0.4463183283805847, 0.4815593659877777, 0.5168004035949707, 0.5520414113998413, 0.5872824788093567, 0.6225235462188721, 0.6577645540237427, 0.6930055618286133, 0.7282466292381287, 0.763487696647644, 0.7987287044525146, 0.8339697122573853, 0.8692107796669006, 0.904451847076416, 0.9396928548812866, 0.9749338626861572, 1.0101749897003174, 1.045415997505188, 1.0806570053100586, 1.1158980131149292, 1.1511390209197998, 1.18638014793396, 1.2216211557388306, 1.2568621635437012, 1.2921032905578613, 1.327344298362732, 1.3625853061676025]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 2.0, 6.0, 10.0, 9.0, 17.0, 23.0, 27.0, 26.0, 20.0, 25.0, 26.0, 41.0, 38.0, 45.0, 43.0, 58.0, 49.0, 54.0, 42.0, 45.0, 40.0, 44.0, 47.0, 49.0, 38.0, 35.0, 34.0, 24.0, 16.0, 18.0, 15.0, 13.0, 2.0, 5.0, 7.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.48736441135406494, -0.4729677438735962, -0.45857110619544983, -0.4441744387149811, -0.4297778010368347, -0.41538113355636597, -0.4009844660758972, -0.38658782839775085, -0.3721911907196045, -0.35779452323913574, -0.3433978855609894, -0.32900121808052063, -0.31460458040237427, -0.3002079129219055, -0.28581124544143677, -0.2714146077632904, -0.25701794028282166, -0.2426212877035141, -0.22822463512420654, -0.2138279676437378, -0.19943132996559143, -0.18503466248512268, -0.17063800990581512, -0.15624135732650757, -0.1418447047472, -0.12744805216789246, -0.1130513995885849, -0.09865473955869675, -0.08425808697938919, -0.06986143440008163, -0.05546477437019348, -0.041068121790885925, -0.02667146921157837, -0.012274814769625664, 0.0021218396723270416, 0.016518495976924896, 0.030915148556232452, 0.04531180113554001, 0.05970846116542816, 0.07410511374473572, 0.08850176632404327, 0.10289841890335083, 0.11729507148265839, 0.13169172406196594, 0.1460883915424347, 0.16048502922058105, 0.1748816967010498, 0.18927834928035736, 0.20367500185966492, 0.21807165443897247, 0.23246830701828003, 0.24686497449874878, 0.26126161217689514, 0.2756582796573639, 0.29005491733551025, 0.304451584815979, 0.31884825229644775, 0.3332449197769165, 0.34764155745506287, 0.3620382249355316, 0.376434862613678, 0.39083153009414673, 0.4052281975746155, 0.41962483525276184, 0.4340214729309082]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 6.0, 1.0, 4.0, 10.0, 13.0, 9.0, 12.0, 24.0, 24.0, 23.0, 34.0, 46.0, 62.0, 93.0, 131.0, 204.0, 297.0, 571.0, 2567.0, 4171887.0, 16358.0, 815.0, 401.0, 220.0, 128.0, 96.0, 69.0, 49.0, 26.0, 26.0, 16.0, 10.0, 12.0, 11.0, 3.0, 3.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1055908203125, -0.10236167907714844, -0.09913253784179688, -0.09590339660644531, -0.09267425537109375, -0.08944511413574219, -0.08621597290039062, -0.08298683166503906, -0.0797576904296875, -0.07652854919433594, -0.07329940795898438, -0.07007026672363281, -0.06684112548828125, -0.06361198425292969, -0.060382843017578125, -0.05715370178222656, -0.053924560546875, -0.05069541931152344, -0.047466278076171875, -0.04423713684082031, -0.04100799560546875, -0.03777885437011719, -0.034549713134765625, -0.03132057189941406, -0.0280914306640625, -0.024862289428710938, -0.021633148193359375, -0.018404006958007812, -0.01517486572265625, -0.011945724487304688, -0.008716583251953125, -0.0054874420166015625, -0.00225830078125, 0.0009708404541015625, 0.004199981689453125, 0.0074291229248046875, 0.01065826416015625, 0.013887405395507812, 0.017116546630859375, 0.020345687866210938, 0.0235748291015625, 0.026803970336914062, 0.030033111572265625, 0.03326225280761719, 0.03649139404296875, 0.03972053527832031, 0.042949676513671875, 0.04617881774902344, 0.049407958984375, 0.05263710021972656, 0.055866241455078125, 0.05909538269042969, 0.06232452392578125, 0.06555366516113281, 0.06878280639648438, 0.07201194763183594, 0.0752410888671875, 0.07847023010253906, 0.08169937133789062, 0.08492851257324219, 0.08815765380859375, 0.09138679504394531, 0.09461593627929688, 0.09784507751464844, 0.10107421875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 4.0, 4.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 1.0, 3.0, 8.0, 16.0, 17.0, 12.0, 11.0, 51.0, 374.0, 337.0, 57.0, 19.0, 7.0, 9.0, 5.0, 7.0, 12.0, 7.0, 8.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02099609375, -0.020355939865112305, -0.01971578598022461, -0.019075632095336914, -0.01843547821044922, -0.017795324325561523, -0.017155170440673828, -0.016515016555786133, -0.015874862670898438, -0.015234708786010742, -0.014594554901123047, -0.013954401016235352, -0.013314247131347656, -0.012674093246459961, -0.012033939361572266, -0.01139378547668457, -0.010753631591796875, -0.01011347770690918, -0.009473323822021484, -0.008833169937133789, -0.008193016052246094, -0.0075528621673583984, -0.006912708282470703, -0.006272554397583008, -0.0056324005126953125, -0.004992246627807617, -0.004352092742919922, -0.0037119388580322266, -0.0030717849731445312, -0.002431631088256836, -0.0017914772033691406, -0.0011513233184814453, -0.00051116943359375, 0.0001289844512939453, 0.0007691383361816406, 0.001409292221069336, 0.0020494461059570312, 0.0026895999908447266, 0.003329753875732422, 0.003969907760620117, 0.0046100616455078125, 0.005250215530395508, 0.005890369415283203, 0.0065305233001708984, 0.007170677185058594, 0.007810831069946289, 0.008450984954833984, 0.00909113883972168, 0.009731292724609375, 0.01037144660949707, 0.011011600494384766, 0.011651754379272461, 0.012291908264160156, 0.012932062149047852, 0.013572216033935547, 0.014212369918823242, 0.014852523803710938, 0.015492677688598633, 0.016132831573486328, 0.016772985458374023, 0.01741313934326172, 0.018053293228149414, 0.01869344711303711, 0.019333600997924805, 0.0199737548828125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 5.0, 3.0, 9.0, 7.0, 15.0, 9.0, 21.0, 29.0, 59.0, 70.0, 213.0, 1460.0, 4174301.0, 16951.0, 774.0, 160.0, 63.0, 38.0, 22.0, 16.0, 14.0, 12.0, 8.0, 4.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.191650390625, -0.18580245971679688, -0.17995452880859375, -0.17410659790039062, -0.1682586669921875, -0.16241073608398438, -0.15656280517578125, -0.15071487426757812, -0.144866943359375, -0.13901901245117188, -0.13317108154296875, -0.12732315063476562, -0.1214752197265625, -0.11562728881835938, -0.10977935791015625, -0.10393142700195312, -0.09808349609375, -0.09223556518554688, -0.08638763427734375, -0.08053970336914062, -0.0746917724609375, -0.06884384155273438, -0.06299591064453125, -0.057147979736328125, -0.051300048828125, -0.045452117919921875, -0.03960418701171875, -0.033756256103515625, -0.0279083251953125, -0.022060394287109375, -0.01621246337890625, -0.010364532470703125, -0.0045166015625, 0.001331329345703125, 0.00717926025390625, 0.013027191162109375, 0.0188751220703125, 0.024723052978515625, 0.03057098388671875, 0.036418914794921875, 0.042266845703125, 0.048114776611328125, 0.05396270751953125, 0.059810638427734375, 0.0656585693359375, 0.07150650024414062, 0.07735443115234375, 0.08320236206054688, 0.08905029296875, 0.09489822387695312, 0.10074615478515625, 0.10659408569335938, 0.1124420166015625, 0.11828994750976562, 0.12413787841796875, 0.12998580932617188, 0.135833740234375, 0.14168167114257812, 0.14752960205078125, 0.15337753295898438, 0.1592254638671875, 0.16507339477539062, 0.17092132568359375, 0.17676925659179688, 0.1826171875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 6.0, 4.0, 6.0, 12.0, 26.0, 76.0, 3651.0, 189.0, 42.0, 15.0, 9.0, 8.0, 3.0, 4.0, 2.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033660888671875, -0.03252983093261719, -0.031398773193359375, -0.030267715454101562, -0.02913665771484375, -0.028005599975585938, -0.026874542236328125, -0.025743484497070312, -0.0246124267578125, -0.023481369018554688, -0.022350311279296875, -0.021219253540039062, -0.02008819580078125, -0.018957138061523438, -0.017826080322265625, -0.016695022583007812, -0.01556396484375, -0.014432907104492188, -0.013301849365234375, -0.012170791625976562, -0.01103973388671875, -0.009908676147460938, -0.008777618408203125, -0.0076465606689453125, -0.0065155029296875, -0.0053844451904296875, -0.004253387451171875, -0.0031223297119140625, -0.00199127197265625, -0.0008602142333984375, 0.000270843505859375, 0.0014019012451171875, 0.002532958984375, 0.0036640167236328125, 0.004795074462890625, 0.0059261322021484375, 0.00705718994140625, 0.008188247680664062, 0.009319305419921875, 0.010450363159179688, 0.0115814208984375, 0.012712478637695312, 0.013843536376953125, 0.014974594116210938, 0.01610565185546875, 0.017236709594726562, 0.018367767333984375, 0.019498825073242188, 0.0206298828125, 0.021760940551757812, 0.022891998291015625, 0.024023056030273438, 0.02515411376953125, 0.026285171508789062, 0.027416229248046875, 0.028547286987304688, 0.0296783447265625, 0.030809402465820312, 0.031940460205078125, 0.03307151794433594, 0.03420257568359375, 0.03533363342285156, 0.036464691162109375, 0.03759574890136719, 0.038726806640625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1016.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8144657015800476, -0.800572395324707, -0.7866790294647217, -0.7727857232093811, -0.7588924169540405, -0.7449990510940552, -0.7311057448387146, -0.717212438583374, -0.7033190727233887, -0.6894257664680481, -0.6755324006080627, -0.6616390943527222, -0.6477457880973816, -0.6338524222373962, -0.6199591159820557, -0.6060658097267151, -0.5921725034713745, -0.5782791972160339, -0.5643858313560486, -0.550492525100708, -0.5365992188453674, -0.5227058529853821, -0.5088125467300415, -0.4949192404747009, -0.4810258746147156, -0.4671325385570526, -0.45323923230171204, -0.4393458962440491, -0.4254525601863861, -0.41155925393104553, -0.39766591787338257, -0.383772611618042, -0.3698793053627014, -0.35598596930503845, -0.3420926630496979, -0.3281993269920349, -0.31430599093437195, -0.30041268467903137, -0.2865193486213684, -0.27262604236602783, -0.2587326765060425, -0.2448393553495407, -0.23094601929187775, -0.21705269813537598, -0.2031593769788742, -0.18926605582237244, -0.17537271976470947, -0.1614793986082077, -0.14758607745170593, -0.13369275629520416, -0.1197994276881218, -0.10590609908103943, -0.09201277792453766, -0.07811944931745529, -0.06422612071037292, -0.050332799553871155, -0.03643947094678879, -0.02254614606499672, -0.008652819320559502, 0.005240507423877716, 0.019133832305669785, 0.03302715718746185, 0.04692048579454422, 0.06081380695104599, 0.07470713555812836]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 0.0, 4.0, 4.0, 4.0, 9.0, 9.0, 10.0, 9.0, 17.0, 13.0, 21.0, 16.0, 24.0, 24.0, 28.0, 36.0, 41.0, 41.0, 40.0, 40.0, 62.0, 50.0, 51.0, 41.0, 51.0, 38.0, 44.0, 25.0, 44.0, 27.0, 23.0, 26.0, 21.0, 15.0, 22.0, 20.0, 9.0, 13.0, 9.0, 4.0, 7.0, 2.0, 1.0, 5.0, 1.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.047602951526641846, -0.04605260118842125, -0.04450225085020065, -0.04295190051198006, -0.04140155017375946, -0.039851199835538864, -0.03830084949731827, -0.03675049915909767, -0.035200148820877075, -0.03364979848265648, -0.03209944814443588, -0.030549097806215286, -0.02899874746799469, -0.027448397129774094, -0.025898046791553497, -0.0243476964533329, -0.022797346115112305, -0.02124699577689171, -0.019696645438671112, -0.018146295100450516, -0.01659594476222992, -0.015045594424009323, -0.013495244085788727, -0.01194489374756813, -0.010394543409347534, -0.008844193071126938, -0.0072938427329063416, -0.005743492394685745, -0.004193142056465149, -0.0026427917182445526, -0.0010924413800239563, 0.00045790895819664, 0.0020082592964172363, 0.0035586096346378326, 0.005108959972858429, 0.006659310311079025, 0.008209660649299622, 0.009760010987520218, 0.011310361325740814, 0.01286071166396141, 0.014411062002182007, 0.015961412340402603, 0.0175117626786232, 0.019062113016843796, 0.020612463355064392, 0.02216281369328499, 0.023713164031505585, 0.02526351436972618, 0.026813864707946777, 0.028364215046167374, 0.02991456538438797, 0.031464915722608566, 0.03301526606082916, 0.03456561639904976, 0.036115966737270355, 0.03766631707549095, 0.03921666741371155, 0.040767017751932144, 0.04231736809015274, 0.04386771842837334, 0.04541806876659393, 0.04696841910481453, 0.048518769443035126, 0.05006911978125572, 0.05161947011947632]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 6.0, 6.0, 11.0, 9.0, 12.0, 35.0, 33.0, 52.0, 78.0, 86.0, 160.0, 190.0, 281.0, 457.0, 638.0, 989.0, 1592.0, 2614.0, 4363.0, 9258.0, 26853.0, 910672.0, 61795.0, 13669.0, 6075.0, 3111.0, 1932.0, 1077.0, 791.0, 509.0, 368.0, 252.0, 144.0, 104.0, 91.0, 65.0, 51.0, 29.0, 32.0, 21.0, 15.0, 5.0, 6.0, 5.0, 0.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03955078125, -0.038341522216796875, -0.03713226318359375, -0.035923004150390625, -0.0347137451171875, -0.033504486083984375, -0.03229522705078125, -0.031085968017578125, -0.029876708984375, -0.028667449951171875, -0.02745819091796875, -0.026248931884765625, -0.0250396728515625, -0.023830413818359375, -0.02262115478515625, -0.021411895751953125, -0.02020263671875, -0.018993377685546875, -0.01778411865234375, -0.016574859619140625, -0.0153656005859375, -0.014156341552734375, -0.01294708251953125, -0.011737823486328125, -0.010528564453125, -0.009319305419921875, -0.00811004638671875, -0.006900787353515625, -0.0056915283203125, -0.004482269287109375, -0.00327301025390625, -0.002063751220703125, -0.0008544921875, 0.000354766845703125, 0.00156402587890625, 0.002773284912109375, 0.0039825439453125, 0.005191802978515625, 0.00640106201171875, 0.007610321044921875, 0.008819580078125, 0.010028839111328125, 0.01123809814453125, 0.012447357177734375, 0.0136566162109375, 0.014865875244140625, 0.01607513427734375, 0.017284393310546875, 0.01849365234375, 0.019702911376953125, 0.02091217041015625, 0.022121429443359375, 0.0233306884765625, 0.024539947509765625, 0.02574920654296875, 0.026958465576171875, 0.028167724609375, 0.029376983642578125, 0.03058624267578125, 0.031795501708984375, 0.0330047607421875, 0.034214019775390625, 0.03542327880859375, 0.036632537841796875, 0.037841796875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 1.0, 3.0, 10.0, 15.0, 16.0, 12.0, 10.0, 61.0, 388.0, 315.0, 57.0, 17.0, 11.0, 5.0, 6.0, 8.0, 11.0, 7.0, 9.0, 1.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0208740234375, -0.020236492156982422, -0.019598960876464844, -0.018961429595947266, -0.018323898315429688, -0.01768636703491211, -0.01704883575439453, -0.016411304473876953, -0.015773773193359375, -0.015136241912841797, -0.014498710632324219, -0.01386117935180664, -0.013223648071289062, -0.012586116790771484, -0.011948585510253906, -0.011311054229736328, -0.01067352294921875, -0.010035991668701172, -0.009398460388183594, -0.008760929107666016, -0.008123397827148438, -0.007485866546630859, -0.006848335266113281, -0.006210803985595703, -0.005573272705078125, -0.004935741424560547, -0.004298210144042969, -0.0036606788635253906, -0.0030231475830078125, -0.0023856163024902344, -0.0017480850219726562, -0.0011105537414550781, -0.0004730224609375, 0.00016450881958007812, 0.0008020401000976562, 0.0014395713806152344, 0.0020771026611328125, 0.0027146339416503906, 0.0033521652221679688, 0.003989696502685547, 0.004627227783203125, 0.005264759063720703, 0.005902290344238281, 0.006539821624755859, 0.0071773529052734375, 0.007814884185791016, 0.008452415466308594, 0.009089946746826172, 0.00972747802734375, 0.010365009307861328, 0.011002540588378906, 0.011640071868896484, 0.012277603149414062, 0.01291513442993164, 0.013552665710449219, 0.014190196990966797, 0.014827728271484375, 0.015465259552001953, 0.01610279083251953, 0.01674032211303711, 0.017377853393554688, 0.018015384674072266, 0.018652915954589844, 0.019290447235107422, 0.019927978515625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 0.0, 2.0, 7.0, 8.0, 5.0, 9.0, 12.0, 11.0, 29.0, 39.0, 30.0, 43.0, 62.0, 66.0, 95.0, 100.0, 112.0, 184.0, 220.0, 350.0, 678.0, 1819.0, 25732.0, 997098.0, 18239.0, 1595.0, 658.0, 321.0, 226.0, 161.0, 140.0, 99.0, 70.0, 73.0, 67.0, 51.0, 31.0, 21.0, 24.0, 19.0, 18.0, 7.0, 9.0, 5.0, 3.0, 7.0, 3.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09442138671875, -0.09132194519042969, -0.08822250366210938, -0.08512306213378906, -0.08202362060546875, -0.07892417907714844, -0.07582473754882812, -0.07272529602050781, -0.0696258544921875, -0.06652641296386719, -0.06342697143554688, -0.06032752990722656, -0.05722808837890625, -0.05412864685058594, -0.051029205322265625, -0.04792976379394531, -0.044830322265625, -0.04173088073730469, -0.038631439208984375, -0.03553199768066406, -0.03243255615234375, -0.029333114624023438, -0.026233673095703125, -0.023134231567382812, -0.0200347900390625, -0.016935348510742188, -0.013835906982421875, -0.010736465454101562, -0.00763702392578125, -0.0045375823974609375, -0.001438140869140625, 0.0016613006591796875, 0.0047607421875, 0.007860183715820312, 0.010959625244140625, 0.014059066772460938, 0.01715850830078125, 0.020257949829101562, 0.023357391357421875, 0.026456832885742188, 0.0295562744140625, 0.03265571594238281, 0.035755157470703125, 0.03885459899902344, 0.04195404052734375, 0.04505348205566406, 0.048152923583984375, 0.05125236511230469, 0.054351806640625, 0.05745124816894531, 0.060550689697265625, 0.06365013122558594, 0.06674957275390625, 0.06984901428222656, 0.07294845581054688, 0.07604789733886719, 0.0791473388671875, 0.08224678039550781, 0.08534622192382812, 0.08844566345214844, 0.09154510498046875, 0.09464454650878906, 0.09774398803710938, 0.10084342956542969, 0.10394287109375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 7.0, 6.0, 10.0, 14.0, 16.0, 19.0, 22.0, 20.0, 24.0, 27.0, 32.0, 38.0, 33.0, 35.0, 55.0, 46.0, 46.0, 50.0, 55.0, 45.0, 51.0, 37.0, 43.0, 38.0, 28.0, 18.0, 18.0, 26.0, 22.0, 24.0, 23.0, 11.0, 9.0, 10.0, 15.0, 5.0, 3.0, 4.0, 3.0, 2.0, 5.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.055206298828125, -0.05335378646850586, -0.05150127410888672, -0.04964876174926758, -0.04779624938964844, -0.0459437370300293, -0.044091224670410156, -0.042238712310791016, -0.040386199951171875, -0.038533687591552734, -0.036681175231933594, -0.03482866287231445, -0.03297615051269531, -0.031123638153076172, -0.02927112579345703, -0.02741861343383789, -0.02556610107421875, -0.02371358871459961, -0.02186107635498047, -0.020008563995361328, -0.018156051635742188, -0.016303539276123047, -0.014451026916503906, -0.012598514556884766, -0.010746002197265625, -0.008893489837646484, -0.007040977478027344, -0.005188465118408203, -0.0033359527587890625, -0.0014834403991699219, 0.00036907196044921875, 0.0022215843200683594, 0.0040740966796875, 0.005926609039306641, 0.007779121398925781, 0.009631633758544922, 0.011484146118164062, 0.013336658477783203, 0.015189170837402344, 0.017041683197021484, 0.018894195556640625, 0.020746707916259766, 0.022599220275878906, 0.024451732635498047, 0.026304244995117188, 0.028156757354736328, 0.03000926971435547, 0.03186178207397461, 0.03371429443359375, 0.03556680679321289, 0.03741931915283203, 0.03927183151245117, 0.04112434387207031, 0.04297685623168945, 0.044829368591308594, 0.046681880950927734, 0.048534393310546875, 0.050386905670166016, 0.052239418029785156, 0.0540919303894043, 0.05594444274902344, 0.05779695510864258, 0.05964946746826172, 0.06150197982788086, 0.0633544921875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 7.0, 6.0, 5.0, 7.0, 7.0, 22.0, 36.0, 43.0, 84.0, 147.0, 310.0, 682.0, 1830.0, 6690.0, 50846.0, 926746.0, 50960.0, 7018.0, 1756.0, 727.0, 272.0, 144.0, 78.0, 42.0, 28.0, 18.0, 12.0, 9.0, 6.0, 9.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.499622344970703e-05, -8.229818195104599e-05, -7.960014045238495e-05, -7.690209895372391e-05, -7.420405745506287e-05, -7.150601595640182e-05, -6.880797445774078e-05, -6.610993295907974e-05, -6.34118914604187e-05, -6.071384996175766e-05, -5.801580846309662e-05, -5.531776696443558e-05, -5.2619725465774536e-05, -4.9921683967113495e-05, -4.7223642468452454e-05, -4.452560096979141e-05, -4.182755947113037e-05, -3.912951797246933e-05, -3.643147647380829e-05, -3.373343497514725e-05, -3.1035393476486206e-05, -2.8337351977825165e-05, -2.5639310479164124e-05, -2.2941268980503082e-05, -2.024322748184204e-05, -1.7545185983181e-05, -1.4847144484519958e-05, -1.2149102985858917e-05, -9.451061487197876e-06, -6.753019988536835e-06, -4.0549784898757935e-06, -1.3569369912147522e-06, 1.341104507446289e-06, 4.03914600610733e-06, 6.737187504768372e-06, 9.435229003429413e-06, 1.2133270502090454e-05, 1.4831312000751495e-05, 1.7529353499412537e-05, 2.0227394998073578e-05, 2.292543649673462e-05, 2.562347799539566e-05, 2.83215194940567e-05, 3.101956099271774e-05, 3.3717602491378784e-05, 3.6415643990039825e-05, 3.911368548870087e-05, 4.181172698736191e-05, 4.450976848602295e-05, 4.720780998468399e-05, 4.990585148334503e-05, 5.260389298200607e-05, 5.5301934480667114e-05, 5.7999975979328156e-05, 6.06980174779892e-05, 6.339605897665024e-05, 6.609410047531128e-05, 6.879214197397232e-05, 7.149018347263336e-05, 7.41882249712944e-05, 7.688626646995544e-05, 7.958430796861649e-05, 8.228234946727753e-05, 8.498039096593857e-05, 8.767843246459961e-05]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 4.0, 9.0, 9.0, 11.0, 9.0, 17.0, 15.0, 21.0, 25.0, 23.0, 48.0, 50.0, 37.0, 65.0, 33.0, 78.0, 46.0, 67.0, 66.0, 38.0, 50.0, 28.0, 50.0, 24.0, 31.0, 32.0, 18.0, 25.0, 11.0, 16.0, 8.0, 3.0, 7.0, 1.0, 7.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.76837158203125e-06, -4.614703357219696e-06, -4.461035132408142e-06, -4.307366907596588e-06, -4.153698682785034e-06, -4.00003045797348e-06, -3.846362233161926e-06, -3.6926940083503723e-06, -3.5390257835388184e-06, -3.3853575587272644e-06, -3.2316893339157104e-06, -3.0780211091041565e-06, -2.9243528842926025e-06, -2.7706846594810486e-06, -2.6170164346694946e-06, -2.4633482098579407e-06, -2.3096799850463867e-06, -2.1560117602348328e-06, -2.002343535423279e-06, -1.8486753106117249e-06, -1.695007085800171e-06, -1.541338860988617e-06, -1.387670636177063e-06, -1.234002411365509e-06, -1.080334186553955e-06, -9.266659617424011e-07, -7.729977369308472e-07, -6.193295121192932e-07, -4.6566128730773926e-07, -3.119930624961853e-07, -1.5832483768463135e-07, -4.6566128730773926e-09, 1.4901161193847656e-07, 3.026798367500305e-07, 4.5634806156158447e-07, 6.100162863731384e-07, 7.636845111846924e-07, 9.173527359962463e-07, 1.0710209608078003e-06, 1.2246891856193542e-06, 1.3783574104309082e-06, 1.5320256352424622e-06, 1.6856938600540161e-06, 1.83936208486557e-06, 1.993030309677124e-06, 2.146698534488678e-06, 2.300366759300232e-06, 2.454034984111786e-06, 2.60770320892334e-06, 2.761371433734894e-06, 2.9150396585464478e-06, 3.0687078833580017e-06, 3.2223761081695557e-06, 3.3760443329811096e-06, 3.5297125577926636e-06, 3.6833807826042175e-06, 3.8370490074157715e-06, 3.9907172322273254e-06, 4.144385457038879e-06, 4.298053681850433e-06, 4.451721906661987e-06, 4.605390131473541e-06, 4.759058356285095e-06, 4.912726581096649e-06, 5.066394805908203e-06]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 5.0, 2.0, 8.0, 12.0, 23.0, 16.0, 21.0, 49.0, 74.0, 101.0, 151.0, 313.0, 673.0, 3927.0, 1029759.0, 11608.0, 902.0, 361.0, 206.0, 105.0, 79.0, 48.0, 35.0, 16.0, 17.0, 10.0, 7.0, 7.0, 3.0, 4.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001697540283203125, -0.0001647062599658966, -0.0001596584916114807, -0.00015461072325706482, -0.00014956295490264893, -0.00014451518654823303, -0.00013946741819381714, -0.00013441964983940125, -0.00012937188148498535, -0.00012432411313056946, -0.00011927634477615356, -0.00011422857642173767, -0.00010918080806732178, -0.00010413303971290588, -9.908527135848999e-05, -9.40375030040741e-05, -8.89897346496582e-05, -8.394196629524231e-05, -7.889419794082642e-05, -7.384642958641052e-05, -6.879866123199463e-05, -6.375089287757874e-05, -5.870312452316284e-05, -5.365535616874695e-05, -4.8607587814331055e-05, -4.355981945991516e-05, -3.851205110549927e-05, -3.3464282751083374e-05, -2.841651439666748e-05, -2.3368746042251587e-05, -1.8320977687835693e-05, -1.32732093334198e-05, -8.225440979003906e-06, -3.1776726245880127e-06, 1.8700957298278809e-06, 6.917864084243774e-06, 1.1965632438659668e-05, 1.701340079307556e-05, 2.2061169147491455e-05, 2.710893750190735e-05, 3.215670585632324e-05, 3.7204474210739136e-05, 4.225224256515503e-05, 4.730001091957092e-05, 5.2347779273986816e-05, 5.739554762840271e-05, 6.24433159828186e-05, 6.74910843372345e-05, 7.253885269165039e-05, 7.758662104606628e-05, 8.263438940048218e-05, 8.768215775489807e-05, 9.272992610931396e-05, 9.777769446372986e-05, 0.00010282546281814575, 0.00010787323117256165, 0.00011292099952697754, 0.00011796876788139343, 0.00012301653623580933, 0.00012806430459022522, 0.0001331120729446411, 0.000138159841299057, 0.0001432076096534729, 0.0001482553780078888, 0.0001533031463623047]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 7.0, 9.0, 8.0, 8.0, 18.0, 18.0, 24.0, 31.0, 36.0, 58.0, 71.0, 111.0, 115.0, 115.0, 87.0, 76.0, 56.0, 51.0, 23.0, 28.0, 18.0, 12.0, 6.0, 2.0, 2.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00010448694229125977, -0.00010173581540584564, -9.898468852043152e-05, -9.62335616350174e-05, -9.348243474960327e-05, -9.073130786418915e-05, -8.798018097877502e-05, -8.52290540933609e-05, -8.247792720794678e-05, -7.972680032253265e-05, -7.697567343711853e-05, -7.42245465517044e-05, -7.147341966629028e-05, -6.872229278087616e-05, -6.597116589546204e-05, -6.322003901004791e-05, -6.046891212463379e-05, -5.7717785239219666e-05, -5.496665835380554e-05, -5.221553146839142e-05, -4.9464404582977295e-05, -4.671327769756317e-05, -4.396215081214905e-05, -4.1211023926734924e-05, -3.84598970413208e-05, -3.570877015590668e-05, -3.2957643270492554e-05, -3.020651638507843e-05, -2.7455389499664307e-05, -2.4704262614250183e-05, -2.195313572883606e-05, -1.9202008843421936e-05, -1.6450881958007812e-05, -1.3699755072593689e-05, -1.0948628187179565e-05, -8.197501301765442e-06, -5.446374416351318e-06, -2.695247530937195e-06, 5.587935447692871e-08, 2.8070062398910522e-06, 5.558133125305176e-06, 8.3092600107193e-06, 1.1060386896133423e-05, 1.3811513781547546e-05, 1.656264066696167e-05, 1.9313767552375793e-05, 2.2064894437789917e-05, 2.481602132320404e-05, 2.7567148208618164e-05, 3.0318275094032288e-05, 3.306940197944641e-05, 3.5820528864860535e-05, 3.857165575027466e-05, 4.132278263568878e-05, 4.4073909521102905e-05, 4.682503640651703e-05, 4.957616329193115e-05, 5.2327290177345276e-05, 5.50784170627594e-05, 5.782954394817352e-05, 6.0580670833587646e-05, 6.333179771900177e-05, 6.60829246044159e-05, 6.883405148983002e-05, 7.158517837524414e-05]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 9.0, 58.0, 748.0, 173.0, 21.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.49996310472488403, -0.4876924157142639, -0.4754217565059662, -0.46315106749534607, -0.45088037848472595, -0.43860968947410583, -0.4263390302658081, -0.414068341255188, -0.40179765224456787, -0.38952696323394775, -0.37725630402565, -0.3649856150150299, -0.3527149260044098, -0.3404442369937897, -0.32817357778549194, -0.3159028887748718, -0.3036321997642517, -0.2913615107536316, -0.27909085154533386, -0.26682016253471375, -0.25454947352409363, -0.2422787994146347, -0.23000812530517578, -0.21773743629455566, -0.20546677708625793, -0.193196102976799, -0.1809254139661789, -0.16865473985671997, -0.15638405084609985, -0.14411337673664093, -0.131842702627182, -0.11957201361656189, -0.10730132460594177, -0.09503064304590225, -0.08275996148586273, -0.07048928737640381, -0.05821860209107399, -0.04594792053103447, -0.03367724269628525, -0.021406561136245728, -0.009135879576206207, 0.0031348010525107384, 0.015405481681227684, 0.027676161378622055, 0.039946842938661575, 0.052217524498701096, 0.06448820233345032, 0.07675888389348984, 0.08902956545352936, 0.10130024701356888, 0.1135709285736084, 0.12584160268306732, 0.13811229169368744, 0.15038296580314636, 0.16265365481376648, 0.1749243289232254, 0.18719500303268433, 0.19946567714214325, 0.21173636615276337, 0.2240070402622223, 0.2362777292728424, 0.24854840338230133, 0.26081907749176025, 0.27308976650238037, 0.2853604555130005]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 10.0, 10.0, 18.0, 19.0, 21.0, 26.0, 13.0, 39.0, 30.0, 36.0, 54.0, 42.0, 49.0, 46.0, 71.0, 65.0, 67.0, 51.0, 48.0, 43.0, 48.0, 29.0, 37.0, 25.0, 24.0, 16.0, 16.0, 21.0, 3.0, 7.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3970259428024292, -0.3834264278411865, -0.36982694268226624, -0.35622742772102356, -0.34262794256210327, -0.3290284276008606, -0.3154289126396179, -0.30182939767837524, -0.28822991251945496, -0.2746303975582123, -0.261030912399292, -0.24743139743804932, -0.23383189737796783, -0.22023239731788635, -0.20663288235664368, -0.1930333822965622, -0.1794338822364807, -0.16583438217639923, -0.15223488211631775, -0.13863536715507507, -0.1250358670949936, -0.11143636703491211, -0.09783685952425003, -0.08423735201358795, -0.07063785195350647, -0.05703834816813469, -0.04343884438276291, -0.02983934059739113, -0.016239836812019348, -0.002640336751937866, 0.010959170758724213, 0.02455867826938629, 0.03815817832946777, 0.051757682114839554, 0.06535718590021133, 0.07895669341087341, 0.0925561934709549, 0.10615569353103638, 0.11975520104169846, 0.13335470855236053, 0.14695420861244202, 0.1605537086725235, 0.17415320873260498, 0.18775272369384766, 0.20135222375392914, 0.21495172381401062, 0.2285512387752533, 0.24215073883533478, 0.25575023889541626, 0.26934975385665894, 0.2829492390155792, 0.2965487539768219, 0.3101482391357422, 0.32374775409698486, 0.33734726905822754, 0.3509467840194702, 0.3645462691783905, 0.3781457841396332, 0.39174526929855347, 0.40534478425979614, 0.4189442992210388, 0.4325437843799591, 0.4461432993412018, 0.45974278450012207, 0.47334229946136475]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 4.0, 6.0, 3.0, 5.0, 8.0, 8.0, 23.0, 18.0, 15.0, 18.0, 31.0, 46.0, 56.0, 84.0, 106.0, 221.0, 3370.0, 4188287.0, 1400.0, 171.0, 113.0, 71.0, 56.0, 41.0, 26.0, 21.0, 17.0, 11.0, 12.0, 6.0, 2.0, 7.0, 1.0, 2.0, 3.0, 5.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1282958984375, -0.12432861328125, -0.120361328125, -0.11639404296875, -0.1124267578125, -0.10845947265625, -0.1044921875, -0.10052490234375, -0.0965576171875, -0.09259033203125, -0.088623046875, -0.08465576171875, -0.0806884765625, -0.07672119140625, -0.07275390625, -0.06878662109375, -0.0648193359375, -0.06085205078125, -0.056884765625, -0.05291748046875, -0.0489501953125, -0.04498291015625, -0.041015625, -0.03704833984375, -0.0330810546875, -0.02911376953125, -0.025146484375, -0.02117919921875, -0.0172119140625, -0.01324462890625, -0.00927734375, -0.00531005859375, -0.0013427734375, 0.00262451171875, 0.006591796875, 0.01055908203125, 0.0145263671875, 0.01849365234375, 0.0224609375, 0.02642822265625, 0.0303955078125, 0.03436279296875, 0.038330078125, 0.04229736328125, 0.0462646484375, 0.05023193359375, 0.05419921875, 0.05816650390625, 0.0621337890625, 0.06610107421875, 0.070068359375, 0.07403564453125, 0.0780029296875, 0.08197021484375, 0.0859375, 0.08990478515625, 0.0938720703125, 0.09783935546875, 0.101806640625, 0.10577392578125, 0.1097412109375, 0.11370849609375, 0.11767578125, 0.12164306640625, 0.1256103515625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 3.0, 1.0, 3.0, 2.0, 6.0, 1.0, 3.0, 1.0, 4.0, 10.0, 15.0, 22.0, 7.0, 19.0, 138.0, 455.0, 183.0, 40.0, 13.0, 8.0, 8.0, 6.0, 10.0, 11.0, 7.0, 3.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0204925537109375, -0.01986098289489746, -0.019229412078857422, -0.018597841262817383, -0.017966270446777344, -0.017334699630737305, -0.016703128814697266, -0.016071557998657227, -0.015439987182617188, -0.014808416366577148, -0.01417684555053711, -0.01354527473449707, -0.012913703918457031, -0.012282133102416992, -0.011650562286376953, -0.011018991470336914, -0.010387420654296875, -0.009755849838256836, -0.009124279022216797, -0.008492708206176758, -0.007861137390136719, -0.00722956657409668, -0.006597995758056641, -0.0059664249420166016, -0.0053348541259765625, -0.0047032833099365234, -0.004071712493896484, -0.0034401416778564453, -0.0028085708618164062, -0.002177000045776367, -0.0015454292297363281, -0.0009138584136962891, -0.00028228759765625, 0.00034928321838378906, 0.0009808540344238281, 0.0016124248504638672, 0.0022439956665039062, 0.0028755664825439453, 0.0035071372985839844, 0.0041387081146240234, 0.0047702789306640625, 0.0054018497467041016, 0.006033420562744141, 0.00666499137878418, 0.007296562194824219, 0.007928133010864258, 0.008559703826904297, 0.009191274642944336, 0.009822845458984375, 0.010454416275024414, 0.011085987091064453, 0.011717557907104492, 0.012349128723144531, 0.01298069953918457, 0.01361227035522461, 0.014243841171264648, 0.014875411987304688, 0.015506982803344727, 0.016138553619384766, 0.016770124435424805, 0.017401695251464844, 0.018033266067504883, 0.018664836883544922, 0.01929640769958496, 0.019927978515625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 7.0, 21.0, 17.0, 38.0, 148.0, 527.0, 3281.0, 4187496.0, 2404.0, 193.0, 76.0, 30.0, 11.0, 12.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08441162109375, -0.0813302993774414, -0.07824897766113281, -0.07516765594482422, -0.07208633422851562, -0.06900501251220703, -0.06592369079589844, -0.06284236907958984, -0.05976104736328125, -0.056679725646972656, -0.05359840393066406, -0.05051708221435547, -0.047435760498046875, -0.04435443878173828, -0.04127311706542969, -0.038191795349121094, -0.0351104736328125, -0.032029151916503906, -0.028947830200195312, -0.02586650848388672, -0.022785186767578125, -0.01970386505126953, -0.016622543334960938, -0.013541221618652344, -0.01045989990234375, -0.007378578186035156, -0.0042972564697265625, -0.0012159347534179688, 0.001865386962890625, 0.004946708679199219, 0.008028030395507812, 0.011109352111816406, 0.014190673828125, 0.017271995544433594, 0.020353317260742188, 0.02343463897705078, 0.026515960693359375, 0.02959728240966797, 0.03267860412597656, 0.035759925842285156, 0.03884124755859375, 0.041922569274902344, 0.04500389099121094, 0.04808521270751953, 0.051166534423828125, 0.05424785614013672, 0.05732917785644531, 0.060410499572753906, 0.0634918212890625, 0.0665731430053711, 0.06965446472167969, 0.07273578643798828, 0.07581710815429688, 0.07889842987060547, 0.08197975158691406, 0.08506107330322266, 0.08814239501953125, 0.09122371673583984, 0.09430503845214844, 0.09738636016845703, 0.10046768188476562, 0.10354900360107422, 0.10663032531738281, 0.1097116470336914, 0.11279296875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 7.0, 4.0, 23.0, 64.0, 3755.0, 159.0, 32.0, 10.0, 7.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0250091552734375, -0.024379968643188477, -0.023750782012939453, -0.02312159538269043, -0.022492408752441406, -0.021863222122192383, -0.02123403549194336, -0.020604848861694336, -0.019975662231445312, -0.01934647560119629, -0.018717288970947266, -0.018088102340698242, -0.01745891571044922, -0.016829729080200195, -0.016200542449951172, -0.015571355819702148, -0.014942169189453125, -0.014312982559204102, -0.013683795928955078, -0.013054609298706055, -0.012425422668457031, -0.011796236038208008, -0.011167049407958984, -0.010537862777709961, -0.009908676147460938, -0.009279489517211914, -0.00865030288696289, -0.008021116256713867, -0.007391929626464844, -0.00676274299621582, -0.006133556365966797, -0.0055043697357177734, -0.00487518310546875, -0.0042459964752197266, -0.003616809844970703, -0.0029876232147216797, -0.0023584365844726562, -0.0017292499542236328, -0.0011000633239746094, -0.00047087669372558594, 0.0001583099365234375, 0.0007874965667724609, 0.0014166831970214844, 0.002045869827270508, 0.0026750564575195312, 0.0033042430877685547, 0.003933429718017578, 0.0045626163482666016, 0.005191802978515625, 0.0058209896087646484, 0.006450176239013672, 0.007079362869262695, 0.007708549499511719, 0.008337736129760742, 0.008966922760009766, 0.009596109390258789, 0.010225296020507812, 0.010854482650756836, 0.01148366928100586, 0.012112855911254883, 0.012742042541503906, 0.01337122917175293, 0.014000415802001953, 0.014629602432250977, 0.0152587890625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 998.0, 21.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5493103265762329, -0.5399830937385559, -0.5306558012962341, -0.5213285684585571, -0.5120012760162354, -0.5026740431785583, -0.49334678053855896, -0.48401951789855957, -0.4746922552585602, -0.4653649926185608, -0.4560377299785614, -0.446710467338562, -0.437383234500885, -0.4280559718608856, -0.41872870922088623, -0.40940144658088684, -0.40007418394088745, -0.39074692130088806, -0.38141965866088867, -0.3720923960208893, -0.3627651333808899, -0.3534379005432129, -0.3441106379032135, -0.3347833752632141, -0.3254561126232147, -0.31612884998321533, -0.30680158734321594, -0.29747432470321655, -0.28814709186553955, -0.27881982922554016, -0.26949256658554077, -0.2601653039455414, -0.250838041305542, -0.2415107786655426, -0.2321835160255432, -0.22285626828670502, -0.21352900564670563, -0.20420174300670624, -0.19487449526786804, -0.18554723262786865, -0.17621998488903046, -0.16689272224903107, -0.15756547451019287, -0.14823821187019348, -0.1389109492301941, -0.1295836865901947, -0.12025643140077591, -0.11092917621135712, -0.10160191357135773, -0.09227465093135834, -0.08294739574193954, -0.07362014055252075, -0.06429287791252136, -0.05496561899781227, -0.04563836008310318, -0.03631110489368439, -0.026983842253684998, -0.017656583338975906, -0.008329324424266815, 0.000997934490442276, 0.010325193405151367, 0.01965245231986046, 0.02897971123456955, 0.03830696642398834, 0.04763422906398773]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 12.0, 5.0, 17.0, 16.0, 26.0, 26.0, 31.0, 44.0, 45.0, 40.0, 54.0, 66.0, 64.0, 76.0, 66.0, 52.0, 57.0, 60.0, 41.0, 40.0, 33.0, 32.0, 32.0, 19.0, 11.0, 10.0, 7.0, 4.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023692727088928223, -0.022679012268781662, -0.021665295585989952, -0.020651578903198242, -0.01963786408305168, -0.01862414926290512, -0.01761043258011341, -0.0165967158973217, -0.01558300107717514, -0.014569285325706005, -0.01355556957423687, -0.012541853822767735, -0.0115281380712986, -0.010514422319829464, -0.009500706568360329, -0.008486990816891193, -0.007473275065422058, -0.006459559313952923, -0.0054458435624837875, -0.004432127811014652, -0.003418412059545517, -0.0024046963080763817, -0.0013909805566072464, -0.0003772648051381111, 0.0006364509463310242, 0.0016501666978001595, 0.0026638824492692947, 0.00367759820073843, 0.004691313952207565, 0.005705029703676701, 0.006718745455145836, 0.007732461206614971, 0.008746176958084106, 0.009759892709553242, 0.010773608461022377, 0.011787324212491512, 0.012801039963960648, 0.013814755715429783, 0.014828471466898918, 0.015842188149690628, 0.01685590296983719, 0.01786961778998375, 0.01888333447277546, 0.01989705115556717, 0.02091076597571373, 0.02192448079586029, 0.022938197478652, 0.02395191416144371, 0.02496562898159027, 0.02597934380173683, 0.02699306048452854, 0.02800677716732025, 0.029020491987466812, 0.030034206807613373, 0.031047923490405083, 0.03206164017319679, 0.03307535499334335, 0.034089069813489914, 0.035102784633636475, 0.036116503179073334, 0.037130217999219894, 0.038143932819366455, 0.039157651364803314, 0.040171366184949875, 0.041185081005096436]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 4.0, 4.0, 5.0, 8.0, 5.0, 5.0, 12.0, 10.0, 9.0, 13.0, 19.0, 31.0, 46.0, 53.0, 67.0, 97.0, 127.0, 155.0, 217.0, 307.0, 438.0, 631.0, 943.0, 1452.0, 2341.0, 4026.0, 7524.0, 18436.0, 261692.0, 709523.0, 20707.0, 8350.0, 4068.0, 2336.0, 1469.0, 1019.0, 677.0, 493.0, 333.0, 234.0, 167.0, 124.0, 110.0, 63.0, 56.0, 48.0, 31.0, 19.0, 13.0, 13.0, 6.0, 6.0, 7.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.0235137939453125, -0.02277994155883789, -0.02204608917236328, -0.021312236785888672, -0.020578384399414062, -0.019844532012939453, -0.019110679626464844, -0.018376827239990234, -0.017642974853515625, -0.016909122467041016, -0.016175270080566406, -0.015441417694091797, -0.014707565307617188, -0.013973712921142578, -0.013239860534667969, -0.01250600814819336, -0.01177215576171875, -0.01103830337524414, -0.010304450988769531, -0.009570598602294922, -0.008836746215820312, -0.008102893829345703, -0.007369041442871094, -0.006635189056396484, -0.005901336669921875, -0.005167484283447266, -0.004433631896972656, -0.003699779510498047, -0.0029659271240234375, -0.002232074737548828, -0.0014982223510742188, -0.0007643699645996094, -3.0517578125e-05, 0.0007033348083496094, 0.0014371871948242188, 0.002171039581298828, 0.0029048919677734375, 0.003638744354248047, 0.004372596740722656, 0.005106449127197266, 0.005840301513671875, 0.006574153900146484, 0.007308006286621094, 0.008041858673095703, 0.008775711059570312, 0.009509563446044922, 0.010243415832519531, 0.01097726821899414, 0.01171112060546875, 0.01244497299194336, 0.013178825378417969, 0.013912677764892578, 0.014646530151367188, 0.015380382537841797, 0.016114234924316406, 0.016848087310791016, 0.017581939697265625, 0.018315792083740234, 0.019049644470214844, 0.019783496856689453, 0.020517349243164062, 0.021251201629638672, 0.02198505401611328, 0.02271890640258789, 0.0234527587890625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 3.0, 2.0, 3.0, 2.0, 6.0, 1.0, 3.0, 1.0, 4.0, 10.0, 15.0, 22.0, 7.0, 17.0, 127.0, 458.0, 191.0, 40.0, 14.0, 9.0, 8.0, 6.0, 10.0, 10.0, 5.0, 6.0, 4.0, 4.0, 0.0, 4.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0204925537109375, -0.019861459732055664, -0.019230365753173828, -0.018599271774291992, -0.017968177795410156, -0.01733708381652832, -0.016705989837646484, -0.01607489585876465, -0.015443801879882812, -0.014812707901000977, -0.01418161392211914, -0.013550519943237305, -0.012919425964355469, -0.012288331985473633, -0.011657238006591797, -0.011026144027709961, -0.010395050048828125, -0.009763956069946289, -0.009132862091064453, -0.008501768112182617, -0.007870674133300781, -0.007239580154418945, -0.006608486175537109, -0.0059773921966552734, -0.0053462982177734375, -0.0047152042388916016, -0.004084110260009766, -0.0034530162811279297, -0.0028219223022460938, -0.002190828323364258, -0.0015597343444824219, -0.0009286403656005859, -0.00029754638671875, 0.00033354759216308594, 0.0009646415710449219, 0.0015957355499267578, 0.0022268295288085938, 0.0028579235076904297, 0.0034890174865722656, 0.0041201114654541016, 0.0047512054443359375, 0.0053822994232177734, 0.006013393402099609, 0.006644487380981445, 0.007275581359863281, 0.007906675338745117, 0.008537769317626953, 0.009168863296508789, 0.009799957275390625, 0.010431051254272461, 0.011062145233154297, 0.011693239212036133, 0.012324333190917969, 0.012955427169799805, 0.01358652114868164, 0.014217615127563477, 0.014848709106445312, 0.015479803085327148, 0.016110897064208984, 0.01674199104309082, 0.017373085021972656, 0.018004179000854492, 0.018635272979736328, 0.019266366958618164, 0.0198974609375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 6.0, 4.0, 2.0, 4.0, 7.0, 9.0, 12.0, 23.0, 15.0, 17.0, 27.0, 20.0, 26.0, 35.0, 50.0, 53.0, 62.0, 97.0, 110.0, 188.0, 249.0, 409.0, 688.0, 1462.0, 8608.0, 899537.0, 130456.0, 3513.0, 1117.0, 530.0, 318.0, 206.0, 128.0, 113.0, 88.0, 76.0, 67.0, 41.0, 35.0, 39.0, 15.0, 30.0, 15.0, 12.0, 9.0, 11.0, 3.0, 9.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.06378173828125, -0.06164264678955078, -0.05950355529785156, -0.057364463806152344, -0.055225372314453125, -0.053086280822753906, -0.05094718933105469, -0.04880809783935547, -0.04666900634765625, -0.04452991485595703, -0.04239082336425781, -0.040251731872558594, -0.038112640380859375, -0.035973548889160156, -0.03383445739746094, -0.03169536590576172, -0.0295562744140625, -0.02741718292236328, -0.025278091430664062, -0.023138999938964844, -0.020999908447265625, -0.018860816955566406, -0.016721725463867188, -0.014582633972167969, -0.01244354248046875, -0.010304450988769531, -0.008165359497070312, -0.006026268005371094, -0.003887176513671875, -0.0017480850219726562, 0.0003910064697265625, 0.0025300979614257812, 0.004669189453125, 0.006808280944824219, 0.008947372436523438, 0.011086463928222656, 0.013225555419921875, 0.015364646911621094, 0.017503738403320312, 0.01964282989501953, 0.02178192138671875, 0.02392101287841797, 0.026060104370117188, 0.028199195861816406, 0.030338287353515625, 0.032477378845214844, 0.03461647033691406, 0.03675556182861328, 0.0388946533203125, 0.04103374481201172, 0.04317283630371094, 0.045311927795410156, 0.047451019287109375, 0.049590110778808594, 0.05172920227050781, 0.05386829376220703, 0.05600738525390625, 0.05814647674560547, 0.06028556823730469, 0.062424659729003906, 0.06456375122070312, 0.06670284271240234, 0.06884193420410156, 0.07098102569580078, 0.0731201171875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 0.0, 8.0, 3.0, 4.0, 9.0, 15.0, 8.0, 19.0, 11.0, 8.0, 18.0, 14.0, 22.0, 23.0, 25.0, 28.0, 34.0, 39.0, 35.0, 38.0, 51.0, 27.0, 50.0, 43.0, 40.0, 41.0, 48.0, 39.0, 37.0, 32.0, 39.0, 25.0, 34.0, 25.0, 22.0, 16.0, 15.0, 12.0, 4.0, 9.0, 4.0, 6.0, 7.0, 5.0, 1.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.045745849609375, -0.04419136047363281, -0.042636871337890625, -0.04108238220214844, -0.03952789306640625, -0.03797340393066406, -0.036418914794921875, -0.03486442565917969, -0.0333099365234375, -0.03175544738769531, -0.030200958251953125, -0.028646469116210938, -0.02709197998046875, -0.025537490844726562, -0.023983001708984375, -0.022428512573242188, -0.0208740234375, -0.019319534301757812, -0.017765045166015625, -0.016210556030273438, -0.01465606689453125, -0.013101577758789062, -0.011547088623046875, -0.009992599487304688, -0.0084381103515625, -0.0068836212158203125, -0.005329132080078125, -0.0037746429443359375, -0.00222015380859375, -0.0006656646728515625, 0.000888824462890625, 0.0024433135986328125, 0.003997802734375, 0.0055522918701171875, 0.007106781005859375, 0.008661270141601562, 0.01021575927734375, 0.011770248413085938, 0.013324737548828125, 0.014879226684570312, 0.0164337158203125, 0.017988204956054688, 0.019542694091796875, 0.021097183227539062, 0.02265167236328125, 0.024206161499023438, 0.025760650634765625, 0.027315139770507812, 0.02886962890625, 0.030424118041992188, 0.031978607177734375, 0.03353309631347656, 0.03508758544921875, 0.03664207458496094, 0.038196563720703125, 0.03975105285644531, 0.0413055419921875, 0.04286003112792969, 0.044414520263671875, 0.04596900939941406, 0.04752349853515625, 0.04907798767089844, 0.050632476806640625, 0.05218696594238281, 0.053741455078125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 10.0, 3.0, 12.0, 17.0, 18.0, 33.0, 51.0, 66.0, 137.0, 277.0, 714.0, 2829.0, 19488.0, 960456.0, 57580.0, 4869.0, 1195.0, 370.0, 163.0, 99.0, 55.0, 30.0, 18.0, 17.0, 17.0, 3.0, 6.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.16312026977539e-05, -5.878787487745285e-05, -5.5944547057151794e-05, -5.310121923685074e-05, -5.025789141654968e-05, -4.741456359624863e-05, -4.457123577594757e-05, -4.1727907955646515e-05, -3.888458013534546e-05, -3.60412523150444e-05, -3.319792449474335e-05, -3.035459667444229e-05, -2.7511268854141235e-05, -2.466794103384018e-05, -2.1824613213539124e-05, -1.8981285393238068e-05, -1.6137957572937012e-05, -1.3294629752635956e-05, -1.04513019323349e-05, -7.607974112033844e-06, -4.764646291732788e-06, -1.921318471431732e-06, 9.220093488693237e-07, 3.7653371691703796e-06, 6.6086649894714355e-06, 9.451992809772491e-06, 1.2295320630073547e-05, 1.5138648450374603e-05, 1.798197627067566e-05, 2.0825304090976715e-05, 2.366863191127777e-05, 2.6511959731578827e-05, 2.9355287551879883e-05, 3.219861537218094e-05, 3.5041943192481995e-05, 3.788527101278305e-05, 4.0728598833084106e-05, 4.357192665338516e-05, 4.641525447368622e-05, 4.9258582293987274e-05, 5.210191011428833e-05, 5.4945237934589386e-05, 5.778856575489044e-05, 6.06318935751915e-05, 6.347522139549255e-05, 6.631854921579361e-05, 6.916187703609467e-05, 7.200520485639572e-05, 7.484853267669678e-05, 7.769186049699783e-05, 8.053518831729889e-05, 8.337851613759995e-05, 8.6221843957901e-05, 8.906517177820206e-05, 9.190849959850311e-05, 9.475182741880417e-05, 9.759515523910522e-05, 0.00010043848305940628, 0.00010328181087970734, 0.00010612513870000839, 0.00010896846652030945, 0.0001118117943406105, 0.00011465512216091156, 0.00011749844998121262, 0.00012034177780151367]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 8.0, 2.0, 11.0, 13.0, 14.0, 20.0, 26.0, 31.0, 32.0, 54.0, 35.0, 35.0, 90.0, 40.0, 75.0, 52.0, 71.0, 56.0, 60.0, 42.0, 40.0, 36.0, 27.0, 29.0, 11.0, 20.0, 8.0, 8.0, 9.0, 4.0, 6.0, 7.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.066394805908203e-06, -4.9211084842681885e-06, -4.775822162628174e-06, -4.630535840988159e-06, -4.4852495193481445e-06, -4.33996319770813e-06, -4.194676876068115e-06, -4.049390554428101e-06, -3.904104232788086e-06, -3.7588179111480713e-06, -3.6135315895080566e-06, -3.468245267868042e-06, -3.3229589462280273e-06, -3.1776726245880127e-06, -3.032386302947998e-06, -2.8870999813079834e-06, -2.7418136596679688e-06, -2.596527338027954e-06, -2.4512410163879395e-06, -2.305954694747925e-06, -2.16066837310791e-06, -2.0153820514678955e-06, -1.8700957298278809e-06, -1.7248094081878662e-06, -1.5795230865478516e-06, -1.434236764907837e-06, -1.2889504432678223e-06, -1.1436641216278076e-06, -9.98377799987793e-07, -8.530914783477783e-07, -7.078051567077637e-07, -5.62518835067749e-07, -4.172325134277344e-07, -2.7194619178771973e-07, -1.2665987014770508e-07, 1.862645149230957e-08, 1.6391277313232422e-07, 3.0919909477233887e-07, 4.544854164123535e-07, 5.997717380523682e-07, 7.450580596923828e-07, 8.903443813323975e-07, 1.0356307029724121e-06, 1.1809170246124268e-06, 1.3262033462524414e-06, 1.471489667892456e-06, 1.6167759895324707e-06, 1.7620623111724854e-06, 1.9073486328125e-06, 2.0526349544525146e-06, 2.1979212760925293e-06, 2.343207597732544e-06, 2.4884939193725586e-06, 2.6337802410125732e-06, 2.779066562652588e-06, 2.9243528842926025e-06, 3.069639205932617e-06, 3.214925527572632e-06, 3.3602118492126465e-06, 3.505498170852661e-06, 3.6507844924926758e-06, 3.7960708141326904e-06, 3.941357135772705e-06, 4.08664345741272e-06, 4.231929779052734e-06]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 8.0, 7.0, 7.0, 10.0, 19.0, 17.0, 13.0, 21.0, 18.0, 45.0, 28.0, 47.0, 71.0, 89.0, 182.0, 254.0, 521.0, 1303.0, 16911.0, 1012063.0, 14229.0, 1312.0, 515.0, 276.0, 174.0, 106.0, 66.0, 48.0, 33.0, 18.0, 31.0, 24.0, 8.0, 10.0, 10.0, 15.0, 12.0, 8.0, 3.0, 4.0, 2.0, 7.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.949901580810547e-05, -6.722006946802139e-05, -6.494112312793732e-05, -6.266217678785324e-05, -6.0383230447769165e-05, -5.810428410768509e-05, -5.582533776760101e-05, -5.354639142751694e-05, -5.126744508743286e-05, -4.8988498747348785e-05, -4.670955240726471e-05, -4.4430606067180634e-05, -4.215165972709656e-05, -3.987271338701248e-05, -3.7593767046928406e-05, -3.531482070684433e-05, -3.3035874366760254e-05, -3.075692802667618e-05, -2.8477981686592102e-05, -2.6199035346508026e-05, -2.392008900642395e-05, -2.1641142666339874e-05, -1.93621963262558e-05, -1.7083249986171722e-05, -1.4804303646087646e-05, -1.252535730600357e-05, -1.0246410965919495e-05, -7.967464625835419e-06, -5.688518285751343e-06, -3.409571945667267e-06, -1.130625605583191e-06, 1.148320734500885e-06, 3.427267074584961e-06, 5.706213414669037e-06, 7.985159754753113e-06, 1.0264106094837189e-05, 1.2543052434921265e-05, 1.482199877500534e-05, 1.7100945115089417e-05, 1.9379891455173492e-05, 2.165883779525757e-05, 2.3937784135341644e-05, 2.621673047542572e-05, 2.8495676815509796e-05, 3.077462315559387e-05, 3.305356949567795e-05, 3.5332515835762024e-05, 3.76114621758461e-05, 3.9890408515930176e-05, 4.216935485601425e-05, 4.444830119609833e-05, 4.6727247536182404e-05, 4.900619387626648e-05, 5.1285140216350555e-05, 5.356408655643463e-05, 5.584303289651871e-05, 5.812197923660278e-05, 6.040092557668686e-05, 6.267987191677094e-05, 6.495881825685501e-05, 6.723776459693909e-05, 6.951671093702316e-05, 7.179565727710724e-05, 7.407460361719131e-05, 7.635354995727539e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 3.0, 5.0, 5.0, 6.0, 5.0, 10.0, 4.0, 5.0, 12.0, 21.0, 14.0, 18.0, 36.0, 39.0, 65.0, 85.0, 99.0, 94.0, 79.0, 97.0, 65.0, 44.0, 40.0, 31.0, 15.0, 13.0, 12.0, 8.0, 12.0, 12.0, 4.0, 4.0, 3.0, 11.0, 7.0, 7.0, 1.0, 4.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.161762237548828e-05, -4.9930065870285034e-05, -4.824250936508179e-05, -4.655495285987854e-05, -4.486739635467529e-05, -4.3179839849472046e-05, -4.14922833442688e-05, -3.980472683906555e-05, -3.8117170333862305e-05, -3.642961382865906e-05, -3.474205732345581e-05, -3.3054500818252563e-05, -3.1366944313049316e-05, -2.967938780784607e-05, -2.7991831302642822e-05, -2.6304274797439575e-05, -2.4616718292236328e-05, -2.292916178703308e-05, -2.1241605281829834e-05, -1.9554048776626587e-05, -1.786649227142334e-05, -1.6178935766220093e-05, -1.4491379261016846e-05, -1.2803822755813599e-05, -1.1116266250610352e-05, -9.428709745407104e-06, -7.741153240203857e-06, -6.05359673500061e-06, -4.366040229797363e-06, -2.678483724594116e-06, -9.909272193908691e-07, 6.966292858123779e-07, 2.384185791015625e-06, 4.071742296218872e-06, 5.759298801422119e-06, 7.446855306625366e-06, 9.134411811828613e-06, 1.082196831703186e-05, 1.2509524822235107e-05, 1.4197081327438354e-05, 1.58846378326416e-05, 1.757219433784485e-05, 1.9259750843048096e-05, 2.0947307348251343e-05, 2.263486385345459e-05, 2.4322420358657837e-05, 2.6009976863861084e-05, 2.769753336906433e-05, 2.9385089874267578e-05, 3.1072646379470825e-05, 3.276020288467407e-05, 3.444775938987732e-05, 3.6135315895080566e-05, 3.7822872400283813e-05, 3.951042890548706e-05, 4.119798541069031e-05, 4.2885541915893555e-05, 4.45730984210968e-05, 4.626065492630005e-05, 4.7948211431503296e-05, 4.963576793670654e-05, 5.132332444190979e-05, 5.301088094711304e-05, 5.4698437452316284e-05, 5.638599395751953e-05]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 48.0, 914.0, 46.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21399924159049988, -0.1953517198562622, -0.17670419812202454, -0.15805667638778687, -0.1394091546535492, -0.12076162546873093, -0.10211409628391266, -0.08346657454967499, -0.06481905281543732, -0.046171531081199646, -0.027524005621671677, -0.008876480162143707, 0.009771041572093964, 0.028418563306331635, 0.0470660924911499, 0.06571361422538757, 0.08436113595962524, 0.10300865769386292, 0.12165617942810059, 0.14030370116233826, 0.15895122289657593, 0.1775987446308136, 0.19624628126621246, 0.21489380300045013, 0.2335413247346878, 0.25218886137008667, 0.27083638310432434, 0.289483904838562, 0.3081314265727997, 0.32677894830703735, 0.345426470041275, 0.3640739917755127, 0.382721483707428, 0.40136900544166565, 0.4200165271759033, 0.438664048910141, 0.45731157064437866, 0.47595909237861633, 0.494606614112854, 0.5132541656494141, 0.5319016575813293, 0.5505492091178894, 0.5691967010498047, 0.5878442525863647, 0.60649174451828, 0.6251392960548401, 0.6437867879867554, 0.6624343395233154, 0.6810818910598755, 0.6997294425964355, 0.7183769345283508, 0.7370244860649109, 0.7556719779968262, 0.7743195295333862, 0.7929670214653015, 0.8116145730018616, 0.8302620649337769, 0.8489096164703369, 0.8675571084022522, 0.8862046599388123, 0.9048521518707275, 0.9234997034072876, 0.9421471953392029, 0.9607947468757629, 0.9794422388076782]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 7.0, 9.0, 12.0, 11.0, 31.0, 38.0, 36.0, 54.0, 69.0, 82.0, 106.0, 82.0, 98.0, 77.0, 65.0, 56.0, 47.0, 35.0, 24.0, 11.0, 15.0, 10.0, 6.0, 9.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4558250308036804, -0.43731236457824707, -0.4187996983528137, -0.40028703212738037, -0.3817743957042694, -0.36326172947883606, -0.3447490632534027, -0.32623642683029175, -0.3077237606048584, -0.28921109437942505, -0.2706984281539917, -0.25218576192855835, -0.2336731255054474, -0.21516045928001404, -0.1966477930545807, -0.17813514173030853, -0.159622460603714, -0.14110979437828064, -0.12259714305400848, -0.10408447682857513, -0.08557181805372238, -0.06705915927886963, -0.04854649305343628, -0.030033841729164124, -0.011521175503730774, 0.006991485133767128, 0.02550414577126503, 0.04401680827140808, 0.06252946704626083, 0.08104212582111359, 0.09955479204654694, 0.11806744337081909, 0.13658010959625244, 0.1550927758216858, 0.17360542714595795, 0.1921180933713913, 0.21063074469566345, 0.2291434109210968, 0.24765607714653015, 0.2661687135696411, 0.28468137979507446, 0.3031940460205078, 0.32170671224594116, 0.3402193784713745, 0.3587320148944855, 0.3772446811199188, 0.3957573473453522, 0.41426998376846313, 0.43278267979621887, 0.4512953460216522, 0.46980801224708557, 0.48832064867019653, 0.5068333148956299, 0.5253459811210632, 0.5438586473464966, 0.5623713135719299, 0.5808839797973633, 0.5993966460227966, 0.61790931224823, 0.6364219784736633, 0.6549346446990967, 0.6734472513198853, 0.6919599771499634, 0.710472583770752, 0.7289852499961853]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 6.0, 10.0, 10.0, 12.0, 7.0, 10.0, 15.0, 21.0, 24.0, 39.0, 46.0, 56.0, 55.0, 108.0, 185.0, 352.0, 4836.0, 4091495.0, 91885.0, 4352.0, 228.0, 158.0, 123.0, 62.0, 42.0, 39.0, 26.0, 24.0, 10.0, 15.0, 4.0, 9.0, 3.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062744140625, -0.060776710510253906, -0.05880928039550781, -0.05684185028076172, -0.054874420166015625, -0.05290699005126953, -0.05093955993652344, -0.048972129821777344, -0.04700469970703125, -0.045037269592285156, -0.04306983947753906, -0.04110240936279297, -0.039134979248046875, -0.03716754913330078, -0.03520011901855469, -0.033232688903808594, -0.0312652587890625, -0.029297828674316406, -0.027330398559570312, -0.02536296844482422, -0.023395538330078125, -0.02142810821533203, -0.019460678100585938, -0.017493247985839844, -0.01552581787109375, -0.013558387756347656, -0.011590957641601562, -0.009623527526855469, -0.007656097412109375, -0.005688667297363281, -0.0037212371826171875, -0.0017538070678710938, 0.000213623046875, 0.0021810531616210938, 0.0041484832763671875, 0.006115913391113281, 0.008083343505859375, 0.010050773620605469, 0.012018203735351562, 0.013985633850097656, 0.01595306396484375, 0.017920494079589844, 0.019887924194335938, 0.02185535430908203, 0.023822784423828125, 0.02579021453857422, 0.027757644653320312, 0.029725074768066406, 0.0316925048828125, 0.033659934997558594, 0.03562736511230469, 0.03759479522705078, 0.039562225341796875, 0.04152965545654297, 0.04349708557128906, 0.045464515686035156, 0.04743194580078125, 0.049399375915527344, 0.05136680603027344, 0.05333423614501953, 0.055301666259765625, 0.05726909637451172, 0.05923652648925781, 0.061203956604003906, 0.06317138671875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 5.0, 9.0, 21.0, 18.0, 8.0, 24.0, 189.0, 442.0, 148.0, 27.0, 15.0, 11.0, 6.0, 7.0, 10.0, 12.0, 4.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020233154296875, -0.019606351852416992, -0.018979549407958984, -0.018352746963500977, -0.01772594451904297, -0.01709914207458496, -0.016472339630126953, -0.015845537185668945, -0.015218734741210938, -0.01459193229675293, -0.013965129852294922, -0.013338327407836914, -0.012711524963378906, -0.012084722518920898, -0.01145792007446289, -0.010831117630004883, -0.010204315185546875, -0.009577512741088867, -0.00895071029663086, -0.008323907852172852, -0.007697105407714844, -0.007070302963256836, -0.006443500518798828, -0.00581669807434082, -0.0051898956298828125, -0.004563093185424805, -0.003936290740966797, -0.003309488296508789, -0.0026826858520507812, -0.0020558834075927734, -0.0014290809631347656, -0.0008022785186767578, -0.00017547607421875, 0.0004513263702392578, 0.0010781288146972656, 0.0017049312591552734, 0.0023317337036132812, 0.002958536148071289, 0.003585338592529297, 0.004212141036987305, 0.0048389434814453125, 0.00546574592590332, 0.006092548370361328, 0.006719350814819336, 0.007346153259277344, 0.007972955703735352, 0.00859975814819336, 0.009226560592651367, 0.009853363037109375, 0.010480165481567383, 0.01110696792602539, 0.011733770370483398, 0.012360572814941406, 0.012987375259399414, 0.013614177703857422, 0.01424098014831543, 0.014867782592773438, 0.015494585037231445, 0.016121387481689453, 0.01674818992614746, 0.01737499237060547, 0.018001794815063477, 0.018628597259521484, 0.019255399703979492, 0.0198822021484375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 2.0, 0.0, 3.0, 1.0, 11.0, 14.0, 14.0, 33.0, 36.0, 89.0, 251.0, 1214.0, 28606.0, 4160928.0, 2345.0, 456.0, 116.0, 45.0, 41.0, 22.0, 18.0, 7.0, 8.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.085693359375, -0.08318614959716797, -0.08067893981933594, -0.0781717300415039, -0.07566452026367188, -0.07315731048583984, -0.07065010070800781, -0.06814289093017578, -0.06563568115234375, -0.06312847137451172, -0.06062126159667969, -0.058114051818847656, -0.055606842041015625, -0.053099632263183594, -0.05059242248535156, -0.04808521270751953, -0.0455780029296875, -0.04307079315185547, -0.04056358337402344, -0.038056373596191406, -0.035549163818359375, -0.033041954040527344, -0.030534744262695312, -0.02802753448486328, -0.02552032470703125, -0.02301311492919922, -0.020505905151367188, -0.017998695373535156, -0.015491485595703125, -0.012984275817871094, -0.010477066040039062, -0.007969856262207031, -0.005462646484375, -0.0029554367065429688, -0.0004482269287109375, 0.0020589828491210938, 0.004566192626953125, 0.007073402404785156, 0.009580612182617188, 0.012087821960449219, 0.01459503173828125, 0.01710224151611328, 0.019609451293945312, 0.022116661071777344, 0.024623870849609375, 0.027131080627441406, 0.029638290405273438, 0.03214550018310547, 0.0346527099609375, 0.03715991973876953, 0.03966712951660156, 0.042174339294433594, 0.044681549072265625, 0.047188758850097656, 0.04969596862792969, 0.05220317840576172, 0.05471038818359375, 0.05721759796142578, 0.05972480773925781, 0.062232017517089844, 0.06473922729492188, 0.0672464370727539, 0.06975364685058594, 0.07226085662841797, 0.07476806640625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 6.0, 11.0, 17.0, 41.0, 166.0, 2793.0, 850.0, 110.0, 38.0, 16.0, 6.0, 3.0, 4.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0249786376953125, -0.02411341667175293, -0.02324819564819336, -0.02238297462463379, -0.02151775360107422, -0.02065253257751465, -0.019787311553955078, -0.018922090530395508, -0.018056869506835938, -0.017191648483276367, -0.016326427459716797, -0.015461206436157227, -0.014595985412597656, -0.013730764389038086, -0.012865543365478516, -0.012000322341918945, -0.011135101318359375, -0.010269880294799805, -0.009404659271240234, -0.008539438247680664, -0.007674217224121094, -0.0068089962005615234, -0.005943775177001953, -0.005078554153442383, -0.0042133331298828125, -0.003348112106323242, -0.002482891082763672, -0.0016176700592041016, -0.0007524490356445312, 0.00011277198791503906, 0.0009779930114746094, 0.0018432140350341797, 0.00270843505859375, 0.0035736560821533203, 0.004438877105712891, 0.005304098129272461, 0.006169319152832031, 0.0070345401763916016, 0.007899761199951172, 0.008764982223510742, 0.009630203247070312, 0.010495424270629883, 0.011360645294189453, 0.012225866317749023, 0.013091087341308594, 0.013956308364868164, 0.014821529388427734, 0.015686750411987305, 0.016551971435546875, 0.017417192459106445, 0.018282413482666016, 0.019147634506225586, 0.020012855529785156, 0.020878076553344727, 0.021743297576904297, 0.022608518600463867, 0.023473739624023438, 0.024338960647583008, 0.025204181671142578, 0.02606940269470215, 0.02693462371826172, 0.02779984474182129, 0.02866506576538086, 0.02953028678894043, 0.0303955078125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 28.0, 983.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3283839225769043, -0.3226533532142639, -0.31692278385162354, -0.31119221448898315, -0.3054616451263428, -0.2997310757637024, -0.294000506401062, -0.28826993703842163, -0.28253936767578125, -0.27680879831314087, -0.2710782289505005, -0.2653476595878601, -0.2596170902252197, -0.25388652086257935, -0.24815595149993896, -0.24242539703845978, -0.2366948425769806, -0.2309642732143402, -0.22523370385169983, -0.21950313448905945, -0.21377256512641907, -0.2080419957637787, -0.2023114264011383, -0.19658087193965912, -0.19085028767585754, -0.18511971831321716, -0.17938914895057678, -0.1736585795879364, -0.16792801022529602, -0.16219744086265564, -0.15646687150001526, -0.15073631703853607, -0.14500576257705688, -0.1392751932144165, -0.13354462385177612, -0.12781405448913574, -0.12208349257707596, -0.11635292321443558, -0.1106223538517952, -0.10489179193973541, -0.09916120767593384, -0.09343063831329346, -0.08770006895065308, -0.0819694995880127, -0.07623893767595291, -0.07050836831331253, -0.06477779895067215, -0.05904723331332207, -0.053316667675971985, -0.047586098313331604, -0.04185553267598152, -0.03612496331334114, -0.03039439581334591, -0.024663828313350677, -0.018933258950710297, -0.013202693313360214, -0.007472123950719833, -0.0017415559850633144, 0.0039890119805932045, 0.00971958041191101, 0.015450147911906242, 0.021180715411901474, 0.026911284774541855, 0.03264185041189194, 0.03837241977453232]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 12.0, 7.0, 9.0, 12.0, 16.0, 17.0, 25.0, 34.0, 54.0, 48.0, 50.0, 69.0, 69.0, 72.0, 76.0, 65.0, 55.0, 58.0, 47.0, 50.0, 27.0, 36.0, 24.0, 21.0, 23.0, 7.0, 5.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06458860635757446, -0.06287883967161179, -0.061169080436229706, -0.05945931375026703, -0.05774955078959465, -0.05603978782892227, -0.054330021142959595, -0.052620258182287216, -0.05091049522161484, -0.04920073226094246, -0.04749096930027008, -0.045781202614307404, -0.044071439653635025, -0.042361676692962646, -0.04065191000699997, -0.03894214704632759, -0.03723238408565521, -0.035522621124982834, -0.033812858164310455, -0.03210309147834778, -0.0303933285176754, -0.02868356555700302, -0.026973800733685493, -0.025264035910367966, -0.023554272949695587, -0.02184450998902321, -0.02013474516570568, -0.018424980342388153, -0.016715217381715775, -0.015005453489720821, -0.013295689597725868, -0.011585925705730915, -0.009876161813735962, -0.008166397921741009, -0.006456634029746056, -0.0047468701377511024, -0.0030371062457561493, -0.0013273423537611961, 0.000382421538233757, 0.00209218543022871, 0.0038019493222236633, 0.0055117132142186165, 0.00722147710621357, 0.008931240998208523, 0.010641004890203476, 0.012350768782198429, 0.014060532674193382, 0.01577029749751091, 0.01748006045818329, 0.019189823418855667, 0.020899588242173195, 0.022609353065490723, 0.0243191160261631, 0.02602887898683548, 0.027738643810153008, 0.029448408633470535, 0.031158171594142914, 0.03286793455481529, 0.03457769751548767, 0.03628746420145035, 0.037997227162122726, 0.039706990122795105, 0.04141675680875778, 0.04312651976943016, 0.04483628273010254]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 0.0, 5.0, 5.0, 5.0, 9.0, 14.0, 22.0, 20.0, 31.0, 33.0, 55.0, 72.0, 102.0, 133.0, 179.0, 264.0, 337.0, 505.0, 729.0, 1086.0, 1550.0, 2321.0, 3967.0, 7346.0, 15966.0, 80262.0, 878518.0, 29435.0, 10862.0, 5255.0, 3143.0, 2021.0, 1295.0, 833.0, 599.0, 432.0, 309.0, 215.0, 157.0, 116.0, 84.0, 73.0, 50.0, 32.0, 28.0, 18.0, 12.0, 9.0, 9.0, 8.0, 8.0, 9.0, 2.0, 6.0, 2.0, 1.0, 2.0, 3.0], "bins": [-0.0200958251953125, -0.01947307586669922, -0.018850326538085938, -0.018227577209472656, -0.017604827880859375, -0.016982078552246094, -0.016359329223632812, -0.01573657989501953, -0.01511383056640625, -0.014491081237792969, -0.013868331909179688, -0.013245582580566406, -0.012622833251953125, -0.012000083923339844, -0.011377334594726562, -0.010754585266113281, -0.0101318359375, -0.009509086608886719, -0.008886337280273438, -0.008263587951660156, -0.007640838623046875, -0.007018089294433594, -0.0063953399658203125, -0.005772590637207031, -0.00514984130859375, -0.004527091979980469, -0.0039043426513671875, -0.0032815933227539062, -0.002658843994140625, -0.0020360946655273438, -0.0014133453369140625, -0.0007905960083007812, -0.0001678466796875, 0.00045490264892578125, 0.0010776519775390625, 0.0017004013061523438, 0.002323150634765625, 0.0029458999633789062, 0.0035686492919921875, 0.004191398620605469, 0.00481414794921875, 0.005436897277832031, 0.0060596466064453125, 0.006682395935058594, 0.007305145263671875, 0.007927894592285156, 0.008550643920898438, 0.009173393249511719, 0.009796142578125, 0.010418891906738281, 0.011041641235351562, 0.011664390563964844, 0.012287139892578125, 0.012909889221191406, 0.013532638549804688, 0.014155387878417969, 0.01477813720703125, 0.015400886535644531, 0.016023635864257812, 0.016646385192871094, 0.017269134521484375, 0.017891883850097656, 0.018514633178710938, 0.01913738250732422, 0.0197601318359375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 5.0, 9.0, 19.0, 19.0, 8.0, 21.0, 180.0, 452.0, 153.0, 25.0, 15.0, 11.0, 5.0, 7.0, 11.0, 12.0, 4.0, 3.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0202484130859375, -0.019621610641479492, -0.018994808197021484, -0.018368005752563477, -0.01774120330810547, -0.01711440086364746, -0.016487598419189453, -0.015860795974731445, -0.015233993530273438, -0.01460719108581543, -0.013980388641357422, -0.013353586196899414, -0.012726783752441406, -0.012099981307983398, -0.01147317886352539, -0.010846376419067383, -0.010219573974609375, -0.009592771530151367, -0.00896596908569336, -0.008339166641235352, -0.007712364196777344, -0.007085561752319336, -0.006458759307861328, -0.00583195686340332, -0.0052051544189453125, -0.004578351974487305, -0.003951549530029297, -0.003324747085571289, -0.0026979446411132812, -0.0020711421966552734, -0.0014443397521972656, -0.0008175373077392578, -0.00019073486328125, 0.0004360675811767578, 0.0010628700256347656, 0.0016896724700927734, 0.0023164749145507812, 0.002943277359008789, 0.003570079803466797, 0.004196882247924805, 0.0048236846923828125, 0.00545048713684082, 0.006077289581298828, 0.006704092025756836, 0.007330894470214844, 0.007957696914672852, 0.00858449935913086, 0.009211301803588867, 0.009838104248046875, 0.010464906692504883, 0.01109170913696289, 0.011718511581420898, 0.012345314025878906, 0.012972116470336914, 0.013598918914794922, 0.01422572135925293, 0.014852523803710938, 0.015479326248168945, 0.016106128692626953, 0.01673293113708496, 0.01735973358154297, 0.017986536026000977, 0.018613338470458984, 0.019240140914916992, 0.019866943359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 10.0, 6.0, 11.0, 8.0, 21.0, 20.0, 35.0, 38.0, 32.0, 37.0, 71.0, 79.0, 93.0, 106.0, 157.0, 209.0, 306.0, 493.0, 1115.0, 6020.0, 877122.0, 156931.0, 3177.0, 867.0, 449.0, 248.0, 194.0, 139.0, 119.0, 67.0, 79.0, 58.0, 45.0, 33.0, 40.0, 29.0, 25.0, 12.0, 13.0, 6.0, 7.0, 10.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.06329345703125, -0.06130695343017578, -0.05932044982910156, -0.057333946228027344, -0.055347442626953125, -0.053360939025878906, -0.05137443542480469, -0.04938793182373047, -0.04740142822265625, -0.04541492462158203, -0.04342842102050781, -0.041441917419433594, -0.039455413818359375, -0.037468910217285156, -0.03548240661621094, -0.03349590301513672, -0.0315093994140625, -0.02952289581298828, -0.027536392211914062, -0.025549888610839844, -0.023563385009765625, -0.021576881408691406, -0.019590377807617188, -0.01760387420654297, -0.01561737060546875, -0.013630867004394531, -0.011644363403320312, -0.009657859802246094, -0.007671356201171875, -0.005684852600097656, -0.0036983489990234375, -0.0017118453979492188, 0.000274658203125, 0.0022611618041992188, 0.0042476654052734375, 0.006234169006347656, 0.008220672607421875, 0.010207176208496094, 0.012193679809570312, 0.014180183410644531, 0.01616668701171875, 0.01815319061279297, 0.020139694213867188, 0.022126197814941406, 0.024112701416015625, 0.026099205017089844, 0.028085708618164062, 0.03007221221923828, 0.0320587158203125, 0.03404521942138672, 0.03603172302246094, 0.038018226623535156, 0.040004730224609375, 0.041991233825683594, 0.04397773742675781, 0.04596424102783203, 0.04795074462890625, 0.04993724822998047, 0.05192375183105469, 0.053910255432128906, 0.055896759033203125, 0.057883262634277344, 0.05986976623535156, 0.06185626983642578, 0.0638427734375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 3.0, 6.0, 4.0, 13.0, 4.0, 15.0, 18.0, 20.0, 15.0, 30.0, 20.0, 22.0, 37.0, 40.0, 37.0, 39.0, 38.0, 42.0, 47.0, 41.0, 58.0, 39.0, 42.0, 40.0, 38.0, 34.0, 31.0, 30.0, 32.0, 26.0, 29.0, 20.0, 14.0, 11.0, 17.0, 20.0, 6.0, 7.0, 4.0, 0.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0517578125, -0.05009174346923828, -0.04842567443847656, -0.046759605407714844, -0.045093536376953125, -0.043427467346191406, -0.04176139831542969, -0.04009532928466797, -0.03842926025390625, -0.03676319122314453, -0.03509712219238281, -0.033431053161621094, -0.031764984130859375, -0.030098915100097656, -0.028432846069335938, -0.02676677703857422, -0.0251007080078125, -0.02343463897705078, -0.021768569946289062, -0.020102500915527344, -0.018436431884765625, -0.016770362854003906, -0.015104293823242188, -0.013438224792480469, -0.01177215576171875, -0.010106086730957031, -0.008440017700195312, -0.006773948669433594, -0.005107879638671875, -0.0034418106079101562, -0.0017757415771484375, -0.00010967254638671875, 0.001556396484375, 0.0032224655151367188, 0.0048885345458984375, 0.006554603576660156, 0.008220672607421875, 0.009886741638183594, 0.011552810668945312, 0.013218879699707031, 0.01488494873046875, 0.01655101776123047, 0.018217086791992188, 0.019883155822753906, 0.021549224853515625, 0.023215293884277344, 0.024881362915039062, 0.02654743194580078, 0.0282135009765625, 0.02987957000732422, 0.03154563903808594, 0.033211708068847656, 0.034877777099609375, 0.036543846130371094, 0.03820991516113281, 0.03987598419189453, 0.04154205322265625, 0.04320812225341797, 0.04487419128417969, 0.046540260314941406, 0.048206329345703125, 0.049872398376464844, 0.05153846740722656, 0.05320453643798828, 0.05487060546875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 9.0, 6.0, 12.0, 19.0, 31.0, 31.0, 50.0, 59.0, 111.0, 165.0, 271.0, 535.0, 1030.0, 2296.0, 5325.0, 17407.0, 137635.0, 833159.0, 35474.0, 8436.0, 3419.0, 1389.0, 668.0, 379.0, 221.0, 136.0, 97.0, 71.0, 41.0, 22.0, 13.0, 9.0, 10.0, 6.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2961368560791016e-05, -3.187078982591629e-05, -3.0780211091041565e-05, -2.968963235616684e-05, -2.8599053621292114e-05, -2.750847488641739e-05, -2.6417896151542664e-05, -2.5327317416667938e-05, -2.4236738681793213e-05, -2.3146159946918488e-05, -2.2055581212043762e-05, -2.0965002477169037e-05, -1.987442374229431e-05, -1.8783845007419586e-05, -1.769326627254486e-05, -1.6602687537670135e-05, -1.551210880279541e-05, -1.4421530067920685e-05, -1.333095133304596e-05, -1.2240372598171234e-05, -1.1149793863296509e-05, -1.0059215128421783e-05, -8.968636393547058e-06, -7.878057658672333e-06, -6.787478923797607e-06, -5.696900188922882e-06, -4.606321454048157e-06, -3.5157427191734314e-06, -2.425163984298706e-06, -1.3345852494239807e-06, -2.4400651454925537e-07, 8.4657222032547e-07, 1.9371509552001953e-06, 3.0277296900749207e-06, 4.118308424949646e-06, 5.208887159824371e-06, 6.299465894699097e-06, 7.390044629573822e-06, 8.480623364448547e-06, 9.571202099323273e-06, 1.0661780834197998e-05, 1.1752359569072723e-05, 1.2842938303947449e-05, 1.3933517038822174e-05, 1.50240957736969e-05, 1.6114674508571625e-05, 1.720525324344635e-05, 1.8295831978321075e-05, 1.93864107131958e-05, 2.0476989448070526e-05, 2.156756818294525e-05, 2.2658146917819977e-05, 2.3748725652694702e-05, 2.4839304387569427e-05, 2.5929883122444153e-05, 2.7020461857318878e-05, 2.8111040592193604e-05, 2.920161932706833e-05, 3.0292198061943054e-05, 3.138277679681778e-05, 3.2473355531692505e-05, 3.356393426656723e-05, 3.4654513001441956e-05, 3.574509173631668e-05, 3.6835670471191406e-05]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 8.0, 5.0, 8.0, 8.0, 13.0, 21.0, 16.0, 35.0, 24.0, 38.0, 38.0, 61.0, 67.0, 48.0, 81.0, 59.0, 78.0, 43.0, 81.0, 59.0, 34.0, 46.0, 24.0, 23.0, 17.0, 16.0, 18.0, 9.0, 9.0, 4.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.4836273193359375e-06, -5.3299590945243835e-06, -5.17629086971283e-06, -5.022622644901276e-06, -4.868954420089722e-06, -4.715286195278168e-06, -4.561617970466614e-06, -4.40794974565506e-06, -4.254281520843506e-06, -4.100613296031952e-06, -3.946945071220398e-06, -3.793276846408844e-06, -3.63960862159729e-06, -3.485940396785736e-06, -3.332272171974182e-06, -3.178603947162628e-06, -3.0249357223510742e-06, -2.8712674975395203e-06, -2.7175992727279663e-06, -2.5639310479164124e-06, -2.4102628231048584e-06, -2.2565945982933044e-06, -2.1029263734817505e-06, -1.9492581486701965e-06, -1.7955899238586426e-06, -1.6419216990470886e-06, -1.4882534742355347e-06, -1.3345852494239807e-06, -1.1809170246124268e-06, -1.0272487998008728e-06, -8.735805749893188e-07, -7.199123501777649e-07, -5.662441253662109e-07, -4.12575900554657e-07, -2.5890767574310303e-07, -1.0523945093154907e-07, 4.842877388000488e-08, 2.0209699869155884e-07, 3.557652235031128e-07, 5.094334483146667e-07, 6.631016731262207e-07, 8.167698979377747e-07, 9.704381227493286e-07, 1.1241063475608826e-06, 1.2777745723724365e-06, 1.4314427971839905e-06, 1.5851110219955444e-06, 1.7387792468070984e-06, 1.8924474716186523e-06, 2.0461156964302063e-06, 2.1997839212417603e-06, 2.353452146053314e-06, 2.507120370864868e-06, 2.660788595676422e-06, 2.814456820487976e-06, 2.96812504529953e-06, 3.121793270111084e-06, 3.275461494922638e-06, 3.429129719734192e-06, 3.582797944545746e-06, 3.7364661693573e-06, 3.890134394168854e-06, 4.043802618980408e-06, 4.197470843791962e-06, 4.351139068603516e-06]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 4.0, 6.0, 2.0, 9.0, 11.0, 11.0, 13.0, 24.0, 38.0, 50.0, 59.0, 107.0, 188.0, 366.0, 1085.0, 26327.0, 1016132.0, 2882.0, 572.0, 252.0, 142.0, 77.0, 44.0, 43.0, 33.0, 15.0, 12.0, 11.0, 13.0, 4.0, 5.0, 4.0, 5.0, 1.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.796287536621094e-05, -7.554329931735992e-05, -7.312372326850891e-05, -7.07041472196579e-05, -6.828457117080688e-05, -6.586499512195587e-05, -6.344541907310486e-05, -6.1025843024253845e-05, -5.860626697540283e-05, -5.618669092655182e-05, -5.3767114877700806e-05, -5.134753882884979e-05, -4.892796277999878e-05, -4.6508386731147766e-05, -4.408881068229675e-05, -4.166923463344574e-05, -3.9249658584594727e-05, -3.683008253574371e-05, -3.44105064868927e-05, -3.199093043804169e-05, -2.9571354389190674e-05, -2.715177834033966e-05, -2.4732202291488647e-05, -2.2312626242637634e-05, -1.989305019378662e-05, -1.7473474144935608e-05, -1.5053898096084595e-05, -1.2634322047233582e-05, -1.0214745998382568e-05, -7.795169949531555e-06, -5.375593900680542e-06, -2.956017851829529e-06, -5.364418029785156e-07, 1.8831342458724976e-06, 4.302710294723511e-06, 6.722286343574524e-06, 9.141862392425537e-06, 1.156143844127655e-05, 1.3981014490127563e-05, 1.6400590538978577e-05, 1.882016658782959e-05, 2.1239742636680603e-05, 2.3659318685531616e-05, 2.607889473438263e-05, 2.8498470783233643e-05, 3.0918046832084656e-05, 3.333762288093567e-05, 3.575719892978668e-05, 3.8176774978637695e-05, 4.059635102748871e-05, 4.301592707633972e-05, 4.5435503125190735e-05, 4.785507917404175e-05, 5.027465522289276e-05, 5.2694231271743774e-05, 5.511380732059479e-05, 5.75333833694458e-05, 5.9952959418296814e-05, 6.237253546714783e-05, 6.479211151599884e-05, 6.721168756484985e-05, 6.963126361370087e-05, 7.205083966255188e-05, 7.447041571140289e-05, 7.68899917602539e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 11.0, 9.0, 19.0, 10.0, 24.0, 41.0, 48.0, 82.0, 86.0, 132.0, 135.0, 93.0, 82.0, 61.0, 51.0, 18.0, 16.0, 16.0, 14.0, 11.0, 5.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.747245788574219e-05, -6.5607950091362e-05, -6.374344229698181e-05, -6.187893450260162e-05, -6.0014426708221436e-05, -5.814991891384125e-05, -5.628541111946106e-05, -5.442090332508087e-05, -5.2556395530700684e-05, -5.0691887736320496e-05, -4.882737994194031e-05, -4.696287214756012e-05, -4.509836435317993e-05, -4.3233856558799744e-05, -4.1369348764419556e-05, -3.950484097003937e-05, -3.764033317565918e-05, -3.577582538127899e-05, -3.3911317586898804e-05, -3.2046809792518616e-05, -3.0182301998138428e-05, -2.831779420375824e-05, -2.6453286409378052e-05, -2.4588778614997864e-05, -2.2724270820617676e-05, -2.0859763026237488e-05, -1.89952552318573e-05, -1.7130747437477112e-05, -1.5266239643096924e-05, -1.3401731848716736e-05, -1.1537224054336548e-05, -9.67271625995636e-06, -7.808208465576172e-06, -5.943700671195984e-06, -4.079192876815796e-06, -2.214685082435608e-06, -3.501772880554199e-07, 1.514330506324768e-06, 3.378838300704956e-06, 5.243346095085144e-06, 7.107853889465332e-06, 8.97236168384552e-06, 1.0836869478225708e-05, 1.2701377272605896e-05, 1.4565885066986084e-05, 1.6430392861366272e-05, 1.829490065574646e-05, 2.0159408450126648e-05, 2.2023916244506836e-05, 2.3888424038887024e-05, 2.5752931833267212e-05, 2.76174396276474e-05, 2.9481947422027588e-05, 3.1346455216407776e-05, 3.3210963010787964e-05, 3.507547080516815e-05, 3.693997859954834e-05, 3.880448639392853e-05, 4.0668994188308716e-05, 4.2533501982688904e-05, 4.439800977706909e-05, 4.626251757144928e-05, 4.812702536582947e-05, 4.9991533160209656e-05, 5.1856040954589844e-05]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 18.0, 779.0, 203.0, 12.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18240585923194885, -0.1655949056148529, -0.14878395199775696, -0.1319730132818222, -0.11516205966472626, -0.09835110604763031, -0.08154015988111496, -0.06472921371459961, -0.04791826009750366, -0.031107310205698013, -0.014296360313892365, 0.0025145895779132843, 0.019325539469718933, 0.03613649308681488, 0.05294743925333023, 0.06975838541984558, 0.08656933903694153, 0.10338029265403748, 0.12019123882055283, 0.13700218498706818, 0.15381313860416412, 0.17062409222126007, 0.18743503093719482, 0.20424598455429077, 0.22105693817138672, 0.23786789178848267, 0.2546788454055786, 0.27148979902267456, 0.2883007526397705, 0.30511170625686646, 0.32192263007164, 0.33873358368873596, 0.3555445671081543, 0.37235552072525024, 0.3891664743423462, 0.40597742795944214, 0.4227883815765381, 0.43959933519363403, 0.4564102590084076, 0.47322121262550354, 0.4900321662425995, 0.506843090057373, 0.523654043674469, 0.5404649972915649, 0.5572759509086609, 0.5740869045257568, 0.5908978581428528, 0.6077088117599487, 0.6245197653770447, 0.6413307189941406, 0.6581416726112366, 0.6749526262283325, 0.6917635798454285, 0.7085745334625244, 0.7253854870796204, 0.7421964406967163, 0.7590073347091675, 0.7758182883262634, 0.7926292419433594, 0.8094401955604553, 0.8262511491775513, 0.8430621027946472, 0.8598730564117432, 0.8766839504241943, 0.8934949636459351]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 12.0, 16.0, 11.0, 19.0, 25.0, 33.0, 36.0, 44.0, 56.0, 51.0, 65.0, 77.0, 76.0, 77.0, 42.0, 56.0, 54.0, 47.0, 37.0, 44.0, 28.0, 24.0, 15.0, 15.0, 16.0, 12.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4224570393562317, -0.4082862138748169, -0.3941153883934021, -0.3799445629119873, -0.3657737374305725, -0.3516029119491577, -0.3374320864677429, -0.3232612609863281, -0.30909043550491333, -0.29491961002349854, -0.28074878454208374, -0.26657795906066895, -0.25240713357925415, -0.23823630809783936, -0.22406549751758575, -0.20989467203617096, -0.19572386145591736, -0.18155303597450256, -0.16738221049308777, -0.15321138501167297, -0.13904055953025818, -0.12486974149942398, -0.11069892346858978, -0.09652809798717499, -0.08235727250576019, -0.0681864470243454, -0.0540156252682209, -0.039844803512096405, -0.02567397803068161, -0.011503152549266815, 0.002667665481567383, 0.016838490962982178, 0.031009316444396973, 0.04518014192581177, 0.059350963681936264, 0.07352178543806076, 0.08769261091947556, 0.10186343640089035, 0.11603425443172455, 0.13020507991313934, 0.14437590539455414, 0.15854673087596893, 0.17271755635738373, 0.18688836693763733, 0.20105919241905212, 0.21523001790046692, 0.2294008433818817, 0.2435716688632965, 0.2577424943447113, 0.2719133198261261, 0.2860841453075409, 0.3002549707889557, 0.3144257962703705, 0.3285966217517853, 0.3427674174308777, 0.3569382429122925, 0.3711090683937073, 0.38527989387512207, 0.39945071935653687, 0.41362154483795166, 0.42779237031936646, 0.44196319580078125, 0.45613402128219604, 0.47030484676361084, 0.48447567224502563]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 5.0, 3.0, 3.0, 5.0, 4.0, 6.0, 9.0, 16.0, 12.0, 27.0, 41.0, 53.0, 69.0, 353.0, 10782.0, 4180510.0, 2067.0, 106.0, 61.0, 43.0, 21.0, 16.0, 15.0, 15.0, 9.0, 4.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.065185546875, -0.06315994262695312, -0.06113433837890625, -0.059108734130859375, -0.0570831298828125, -0.055057525634765625, -0.05303192138671875, -0.051006317138671875, -0.048980712890625, -0.046955108642578125, -0.04492950439453125, -0.042903900146484375, -0.0408782958984375, -0.038852691650390625, -0.03682708740234375, -0.034801483154296875, -0.03277587890625, -0.030750274658203125, -0.02872467041015625, -0.026699066162109375, -0.0246734619140625, -0.022647857666015625, -0.02062225341796875, -0.018596649169921875, -0.016571044921875, -0.014545440673828125, -0.01251983642578125, -0.010494232177734375, -0.0084686279296875, -0.006443023681640625, -0.00441741943359375, -0.002391815185546875, -0.0003662109375, 0.001659393310546875, 0.00368499755859375, 0.005710601806640625, 0.0077362060546875, 0.009761810302734375, 0.01178741455078125, 0.013813018798828125, 0.015838623046875, 0.017864227294921875, 0.01988983154296875, 0.021915435791015625, 0.0239410400390625, 0.025966644287109375, 0.02799224853515625, 0.030017852783203125, 0.03204345703125, 0.034069061279296875, 0.03609466552734375, 0.038120269775390625, 0.0401458740234375, 0.042171478271484375, 0.04419708251953125, 0.046222686767578125, 0.048248291015625, 0.050273895263671875, 0.05229949951171875, 0.054325103759765625, 0.0563507080078125, 0.058376312255859375, 0.06040191650390625, 0.062427520751953125, 0.064453125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 2.0, 1.0, 4.0, 4.0, 1.0, 2.0, 4.0, 5.0, 11.0, 17.0, 17.0, 10.0, 28.0, 218.0, 439.0, 120.0, 23.0, 16.0, 12.0, 4.0, 8.0, 11.0, 12.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0199737548828125, -0.019353151321411133, -0.018732547760009766, -0.0181119441986084, -0.01749134063720703, -0.016870737075805664, -0.016250133514404297, -0.01562952995300293, -0.015008926391601562, -0.014388322830200195, -0.013767719268798828, -0.013147115707397461, -0.012526512145996094, -0.011905908584594727, -0.01128530502319336, -0.010664701461791992, -0.010044097900390625, -0.009423494338989258, -0.00880289077758789, -0.008182287216186523, -0.007561683654785156, -0.006941080093383789, -0.006320476531982422, -0.005699872970581055, -0.0050792694091796875, -0.00445866584777832, -0.003838062286376953, -0.003217458724975586, -0.0025968551635742188, -0.0019762516021728516, -0.0013556480407714844, -0.0007350444793701172, -0.00011444091796875, 0.0005061626434326172, 0.0011267662048339844, 0.0017473697662353516, 0.0023679733276367188, 0.002988576889038086, 0.003609180450439453, 0.00422978401184082, 0.0048503875732421875, 0.005470991134643555, 0.006091594696044922, 0.006712198257446289, 0.007332801818847656, 0.007953405380249023, 0.00857400894165039, 0.009194612503051758, 0.009815216064453125, 0.010435819625854492, 0.01105642318725586, 0.011677026748657227, 0.012297630310058594, 0.012918233871459961, 0.013538837432861328, 0.014159440994262695, 0.014780044555664062, 0.01540064811706543, 0.016021251678466797, 0.016641855239868164, 0.01726245880126953, 0.0178830623626709, 0.018503665924072266, 0.019124269485473633, 0.019744873046875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 14.0, 14.0, 13.0, 54.0, 178.0, 543.0, 2682.0, 4185692.0, 4169.0, 622.0, 194.0, 42.0, 18.0, 18.0, 8.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04180908203125, -0.04034709930419922, -0.03888511657714844, -0.037423133850097656, -0.035961151123046875, -0.034499168395996094, -0.03303718566894531, -0.03157520294189453, -0.03011322021484375, -0.02865123748779297, -0.027189254760742188, -0.025727272033691406, -0.024265289306640625, -0.022803306579589844, -0.021341323852539062, -0.01987934112548828, -0.0184173583984375, -0.01695537567138672, -0.015493392944335938, -0.014031410217285156, -0.012569427490234375, -0.011107444763183594, -0.009645462036132812, -0.008183479309082031, -0.00672149658203125, -0.005259513854980469, -0.0037975311279296875, -0.0023355484008789062, -0.000873565673828125, 0.0005884170532226562, 0.0020503997802734375, 0.0035123825073242188, 0.004974365234375, 0.006436347961425781, 0.007898330688476562, 0.009360313415527344, 0.010822296142578125, 0.012284278869628906, 0.013746261596679688, 0.015208244323730469, 0.01667022705078125, 0.01813220977783203, 0.019594192504882812, 0.021056175231933594, 0.022518157958984375, 0.023980140686035156, 0.025442123413085938, 0.02690410614013672, 0.0283660888671875, 0.02982807159423828, 0.03129005432128906, 0.032752037048339844, 0.034214019775390625, 0.035676002502441406, 0.03713798522949219, 0.03859996795654297, 0.04006195068359375, 0.04152393341064453, 0.04298591613769531, 0.044447898864746094, 0.045909881591796875, 0.047371864318847656, 0.04883384704589844, 0.05029582977294922, 0.0517578125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 16.0, 35.0, 2938.0, 1014.0, 49.0, 14.0, 7.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0174407958984375, -0.016942381858825684, -0.016443967819213867, -0.01594555377960205, -0.015447139739990234, -0.014948725700378418, -0.014450311660766602, -0.013951897621154785, -0.013453483581542969, -0.012955069541931152, -0.012456655502319336, -0.01195824146270752, -0.011459827423095703, -0.010961413383483887, -0.01046299934387207, -0.009964585304260254, -0.009466171264648438, -0.008967757225036621, -0.008469343185424805, -0.007970929145812988, -0.007472515106201172, -0.0069741010665893555, -0.006475687026977539, -0.005977272987365723, -0.005478858947753906, -0.00498044490814209, -0.0044820308685302734, -0.003983616828918457, -0.0034852027893066406, -0.0029867887496948242, -0.002488374710083008, -0.0019899606704711914, -0.001491546630859375, -0.0009931325912475586, -0.0004947185516357422, 3.6954879760742188e-06, 0.0005021095275878906, 0.001000523567199707, 0.0014989376068115234, 0.00199735164642334, 0.0024957656860351562, 0.0029941797256469727, 0.003492593765258789, 0.0039910078048706055, 0.004489421844482422, 0.004987835884094238, 0.005486249923706055, 0.005984663963317871, 0.0064830780029296875, 0.006981492042541504, 0.00747990608215332, 0.007978320121765137, 0.008476734161376953, 0.00897514820098877, 0.009473562240600586, 0.009971976280212402, 0.010470390319824219, 0.010968804359436035, 0.011467218399047852, 0.011965632438659668, 0.012464046478271484, 0.0129624605178833, 0.013460874557495117, 0.013959288597106934, 0.01445770263671875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 1007.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05711958557367325, -0.0536467619240284, -0.050173938274383545, -0.04670111835002899, -0.04322829470038414, -0.03975547105073929, -0.036282651126384735, -0.03280982747673988, -0.029337003827095032, -0.02586418017745018, -0.022391358390450478, -0.018918536603450775, -0.015445712953805923, -0.011972889304161072, -0.00850006751716137, -0.005027245730161667, -0.0015544220805168152, 0.0019184006378054619, 0.005391223356127739, 0.008864046074450016, 0.012336868792772293, 0.015809692442417145, 0.019282514229416847, 0.02275533601641655, 0.0262281596660614, 0.029700983315706253, 0.033173806965351105, 0.03664662688970566, 0.04011945053935051, 0.04359227418899536, 0.047065094113349915, 0.050537917762994766, 0.05401073396205902, 0.05748355761170387, 0.060956381261348724, 0.06442920118570328, 0.06790202856063843, 0.07137484848499298, 0.07484766840934753, 0.07832048833370209, 0.08179331570863724, 0.08526613563299179, 0.08873896300792694, 0.0922117829322815, 0.09568460285663605, 0.0991574302315712, 0.10263025015592575, 0.1061030775308609, 0.10957589745521545, 0.11304871737957001, 0.11652154475450516, 0.11999436467885971, 0.12346719205379486, 0.12694001197814941, 0.13041283190250397, 0.13388565182685852, 0.13735848665237427, 0.14083130657672882, 0.14430412650108337, 0.14777696132659912, 0.15124978125095367, 0.15472260117530823, 0.15819542109966278, 0.16166824102401733, 0.1651410609483719]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 5.0, 15.0, 22.0, 34.0, 56.0, 73.0, 88.0, 116.0, 124.0, 117.0, 95.0, 76.0, 69.0, 54.0, 30.0, 9.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036485135555267334, -0.035463348031044006, -0.03444156050682068, -0.03341977670788765, -0.03239798918366432, -0.031376201659440994, -0.030354415997862816, -0.029332630336284637, -0.02831084281206131, -0.027289055287837982, -0.026267269626259804, -0.025245483964681625, -0.024223696440458298, -0.02320190891623497, -0.02218012325465679, -0.021158337593078613, -0.020136550068855286, -0.019114762544631958, -0.01809297688305378, -0.0170711912214756, -0.016049403697252274, -0.01502761710435152, -0.014005830511450768, -0.012984043918550014, -0.011962257325649261, -0.010940470732748508, -0.009918684139847755, -0.008896897546947002, -0.00787511095404625, -0.006853324361145496, -0.005831537768244743, -0.00480975117534399, -0.0037879645824432373, -0.0027661779895424843, -0.0017443913966417313, -0.0007226048037409782, 0.0002991817891597748, 0.0013209683820605278, 0.002342754974961281, 0.003364541567862034, 0.004386328160762787, 0.00540811475366354, 0.006429901346564293, 0.007451687939465046, 0.008473474532365799, 0.009495261125266552, 0.010517047718167305, 0.011538834311068058, 0.012560620903968811, 0.013582407496869564, 0.014604194089770317, 0.015625979751348495, 0.016647767275571823, 0.01766955479979515, 0.01869134046137333, 0.019713126122951508, 0.020734913647174835, 0.021756701171398163, 0.02277848683297634, 0.02380027249455452, 0.024822060018777847, 0.025843847543001175, 0.026865633204579353, 0.027887418866157532, 0.02890920639038086]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 3.0, 4.0, 6.0, 7.0, 10.0, 16.0, 11.0, 28.0, 27.0, 35.0, 46.0, 80.0, 84.0, 143.0, 181.0, 285.0, 486.0, 821.0, 1368.0, 2555.0, 5288.0, 14076.0, 98180.0, 888218.0, 21535.0, 7287.0, 3433.0, 1722.0, 912.0, 566.0, 343.0, 191.0, 151.0, 103.0, 92.0, 58.0, 46.0, 31.0, 27.0, 18.0, 20.0, 18.0, 2.0, 10.0, 10.0, 3.0, 5.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0230255126953125, -0.02230978012084961, -0.02159404754638672, -0.020878314971923828, -0.020162582397460938, -0.019446849822998047, -0.018731117248535156, -0.018015384674072266, -0.017299652099609375, -0.016583919525146484, -0.015868186950683594, -0.015152454376220703, -0.014436721801757812, -0.013720989227294922, -0.013005256652832031, -0.01228952407836914, -0.01157379150390625, -0.01085805892944336, -0.010142326354980469, -0.009426593780517578, -0.008710861206054688, -0.007995128631591797, -0.007279396057128906, -0.006563663482666016, -0.005847930908203125, -0.005132198333740234, -0.004416465759277344, -0.003700733184814453, -0.0029850006103515625, -0.002269268035888672, -0.0015535354614257812, -0.0008378028869628906, -0.0001220703125, 0.0005936622619628906, 0.0013093948364257812, 0.002025127410888672, 0.0027408599853515625, 0.003456592559814453, 0.004172325134277344, 0.004888057708740234, 0.005603790283203125, 0.006319522857666016, 0.007035255432128906, 0.007750988006591797, 0.008466720581054688, 0.009182453155517578, 0.009898185729980469, 0.01061391830444336, 0.01132965087890625, 0.01204538345336914, 0.012761116027832031, 0.013476848602294922, 0.014192581176757812, 0.014908313751220703, 0.015624046325683594, 0.016339778900146484, 0.017055511474609375, 0.017771244049072266, 0.018486976623535156, 0.019202709197998047, 0.019918441772460938, 0.020634174346923828, 0.02134990692138672, 0.02206563949584961, 0.0227813720703125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 2.0, 1.0, 4.0, 4.0, 1.0, 2.0, 4.0, 4.0, 12.0, 17.0, 17.0, 11.0, 27.0, 217.0, 439.0, 121.0, 23.0, 16.0, 12.0, 5.0, 7.0, 11.0, 12.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0199737548828125, -0.019353151321411133, -0.018732547760009766, -0.0181119441986084, -0.01749134063720703, -0.016870737075805664, -0.016250133514404297, -0.01562952995300293, -0.015008926391601562, -0.014388322830200195, -0.013767719268798828, -0.013147115707397461, -0.012526512145996094, -0.011905908584594727, -0.01128530502319336, -0.010664701461791992, -0.010044097900390625, -0.009423494338989258, -0.00880289077758789, -0.008182287216186523, -0.007561683654785156, -0.006941080093383789, -0.006320476531982422, -0.005699872970581055, -0.0050792694091796875, -0.00445866584777832, -0.003838062286376953, -0.003217458724975586, -0.0025968551635742188, -0.0019762516021728516, -0.0013556480407714844, -0.0007350444793701172, -0.00011444091796875, 0.0005061626434326172, 0.0011267662048339844, 0.0017473697662353516, 0.0023679733276367188, 0.002988576889038086, 0.003609180450439453, 0.00422978401184082, 0.0048503875732421875, 0.005470991134643555, 0.006091594696044922, 0.006712198257446289, 0.007332801818847656, 0.007953405380249023, 0.00857400894165039, 0.009194612503051758, 0.009815216064453125, 0.010435819625854492, 0.01105642318725586, 0.011677026748657227, 0.012297630310058594, 0.012918233871459961, 0.013538837432861328, 0.014159440994262695, 0.014780044555664062, 0.01540064811706543, 0.016021251678466797, 0.016641855239868164, 0.01726245880126953, 0.0178830623626709, 0.018503665924072266, 0.019124269485473633, 0.019744873046875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 5.0, 9.0, 6.0, 8.0, 11.0, 15.0, 24.0, 22.0, 34.0, 29.0, 45.0, 58.0, 59.0, 76.0, 119.0, 127.0, 164.0, 241.0, 429.0, 792.0, 1904.0, 39491.0, 995941.0, 5814.0, 1219.0, 644.0, 339.0, 218.0, 134.0, 93.0, 91.0, 69.0, 64.0, 57.0, 45.0, 34.0, 34.0, 22.0, 17.0, 15.0, 10.0, 13.0, 6.0, 2.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05609130859375, -0.05423927307128906, -0.052387237548828125, -0.05053520202636719, -0.04868316650390625, -0.04683113098144531, -0.044979095458984375, -0.04312705993652344, -0.0412750244140625, -0.03942298889160156, -0.037570953369140625, -0.03571891784667969, -0.03386688232421875, -0.03201484680175781, -0.030162811279296875, -0.028310775756835938, -0.026458740234375, -0.024606704711914062, -0.022754669189453125, -0.020902633666992188, -0.01905059814453125, -0.017198562622070312, -0.015346527099609375, -0.013494491577148438, -0.0116424560546875, -0.009790420532226562, -0.007938385009765625, -0.0060863494873046875, -0.00423431396484375, -0.0023822784423828125, -0.000530242919921875, 0.0013217926025390625, 0.003173828125, 0.0050258636474609375, 0.006877899169921875, 0.008729934692382812, 0.01058197021484375, 0.012434005737304688, 0.014286041259765625, 0.016138076782226562, 0.0179901123046875, 0.019842147827148438, 0.021694183349609375, 0.023546218872070312, 0.02539825439453125, 0.027250289916992188, 0.029102325439453125, 0.030954360961914062, 0.032806396484375, 0.03465843200683594, 0.036510467529296875, 0.03836250305175781, 0.04021453857421875, 0.04206657409667969, 0.043918609619140625, 0.04577064514160156, 0.0476226806640625, 0.04947471618652344, 0.051326751708984375, 0.05317878723144531, 0.05503082275390625, 0.05688285827636719, 0.058734893798828125, 0.06058692932128906, 0.06243896484375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 4.0, 3.0, 5.0, 4.0, 5.0, 6.0, 4.0, 12.0, 16.0, 10.0, 13.0, 14.0, 22.0, 16.0, 19.0, 22.0, 37.0, 36.0, 28.0, 32.0, 50.0, 52.0, 37.0, 44.0, 36.0, 34.0, 49.0, 52.0, 41.0, 38.0, 28.0, 24.0, 29.0, 38.0, 25.0, 15.0, 28.0, 20.0, 12.0, 9.0, 10.0, 9.0, 8.0, 3.0, 6.0, 3.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041778564453125, -0.04031705856323242, -0.038855552673339844, -0.037394046783447266, -0.03593254089355469, -0.03447103500366211, -0.03300952911376953, -0.03154802322387695, -0.030086517333984375, -0.028625011444091797, -0.02716350555419922, -0.02570199966430664, -0.024240493774414062, -0.022778987884521484, -0.021317481994628906, -0.019855976104736328, -0.01839447021484375, -0.016932964324951172, -0.015471458435058594, -0.014009952545166016, -0.012548446655273438, -0.01108694076538086, -0.009625434875488281, -0.008163928985595703, -0.006702423095703125, -0.005240917205810547, -0.0037794113159179688, -0.0023179054260253906, -0.0008563995361328125, 0.0006051063537597656, 0.0020666122436523438, 0.003528118133544922, 0.0049896240234375, 0.006451129913330078, 0.007912635803222656, 0.009374141693115234, 0.010835647583007812, 0.01229715347290039, 0.013758659362792969, 0.015220165252685547, 0.016681671142578125, 0.018143177032470703, 0.01960468292236328, 0.02106618881225586, 0.022527694702148438, 0.023989200592041016, 0.025450706481933594, 0.026912212371826172, 0.02837371826171875, 0.029835224151611328, 0.031296730041503906, 0.032758235931396484, 0.03421974182128906, 0.03568124771118164, 0.03714275360107422, 0.0386042594909668, 0.040065765380859375, 0.04152727127075195, 0.04298877716064453, 0.04445028305053711, 0.04591178894042969, 0.047373294830322266, 0.048834800720214844, 0.05029630661010742, 0.0517578125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 13.0, 4.0, 8.0, 8.0, 6.0, 18.0, 25.0, 30.0, 48.0, 60.0, 121.0, 117.0, 262.0, 388.0, 656.0, 1190.0, 2205.0, 5419.0, 12114.0, 43437.0, 245706.0, 649762.0, 56669.0, 17889.0, 6072.0, 2995.0, 1321.0, 806.0, 406.0, 280.0, 153.0, 113.0, 73.0, 50.0, 38.0, 30.0, 11.0, 14.0, 9.0, 10.0, 6.0, 3.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.09808349609375e-05, -2.0415522158145905e-05, -1.985020935535431e-05, -1.9284896552562714e-05, -1.8719583749771118e-05, -1.8154270946979523e-05, -1.7588958144187927e-05, -1.7023645341396332e-05, -1.6458332538604736e-05, -1.589301973581314e-05, -1.5327706933021545e-05, -1.476239413022995e-05, -1.4197081327438354e-05, -1.3631768524646759e-05, -1.3066455721855164e-05, -1.2501142919063568e-05, -1.1935830116271973e-05, -1.1370517313480377e-05, -1.0805204510688782e-05, -1.0239891707897186e-05, -9.67457890510559e-06, -9.109266102313995e-06, -8.5439532995224e-06, -7.978640496730804e-06, -7.413327693939209e-06, -6.8480148911476135e-06, -6.282702088356018e-06, -5.717389285564423e-06, -5.152076482772827e-06, -4.586763679981232e-06, -4.021450877189636e-06, -3.4561380743980408e-06, -2.8908252716064453e-06, -2.32551246881485e-06, -1.7601996660232544e-06, -1.194886863231659e-06, -6.295740604400635e-07, -6.426125764846802e-08, 5.010515451431274e-07, 1.066364347934723e-06, 1.6316771507263184e-06, 2.196989953517914e-06, 2.7623027563095093e-06, 3.3276155591011047e-06, 3.8929283618927e-06, 4.458241164684296e-06, 5.023553967475891e-06, 5.5888667702674866e-06, 6.154179573059082e-06, 6.7194923758506775e-06, 7.284805178642273e-06, 7.850117981433868e-06, 8.415430784225464e-06, 8.98074358701706e-06, 9.546056389808655e-06, 1.011136919260025e-05, 1.0676681995391846e-05, 1.1241994798183441e-05, 1.1807307600975037e-05, 1.2372620403766632e-05, 1.2937933206558228e-05, 1.3503246009349823e-05, 1.4068558812141418e-05, 1.4633871614933014e-05, 1.519918441772461e-05]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 7.0, 3.0, 8.0, 8.0, 16.0, 22.0, 20.0, 36.0, 29.0, 58.0, 55.0, 84.0, 67.0, 83.0, 94.0, 77.0, 78.0, 50.0, 52.0, 26.0, 36.0, 24.0, 16.0, 19.0, 9.0, 13.0, 3.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.616115570068359e-06, -6.411224603652954e-06, -6.206333637237549e-06, -6.0014426708221436e-06, -5.796551704406738e-06, -5.591660737991333e-06, -5.386769771575928e-06, -5.1818788051605225e-06, -4.976987838745117e-06, -4.772096872329712e-06, -4.567205905914307e-06, -4.362314939498901e-06, -4.157423973083496e-06, -3.952533006668091e-06, -3.7476420402526855e-06, -3.5427510738372803e-06, -3.337860107421875e-06, -3.1329691410064697e-06, -2.9280781745910645e-06, -2.723187208175659e-06, -2.518296241760254e-06, -2.3134052753448486e-06, -2.1085143089294434e-06, -1.903623342514038e-06, -1.6987323760986328e-06, -1.4938414096832275e-06, -1.2889504432678223e-06, -1.084059476852417e-06, -8.791685104370117e-07, -6.742775440216064e-07, -4.6938657760620117e-07, -2.644956111907959e-07, -5.960464477539063e-08, 1.4528632164001465e-07, 3.501772880554199e-07, 5.550682544708252e-07, 7.599592208862305e-07, 9.648501873016357e-07, 1.169741153717041e-06, 1.3746321201324463e-06, 1.5795230865478516e-06, 1.7844140529632568e-06, 1.989305019378662e-06, 2.1941959857940674e-06, 2.3990869522094727e-06, 2.603977918624878e-06, 2.808868885040283e-06, 3.0137598514556885e-06, 3.2186508178710938e-06, 3.423541784286499e-06, 3.6284327507019043e-06, 3.8333237171173096e-06, 4.038214683532715e-06, 4.24310564994812e-06, 4.447996616363525e-06, 4.652887582778931e-06, 4.857778549194336e-06, 5.062669515609741e-06, 5.2675604820251465e-06, 5.472451448440552e-06, 5.677342414855957e-06, 5.882233381271362e-06, 6.087124347686768e-06, 6.292015314102173e-06, 6.496906280517578e-06]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 9.0, 8.0, 16.0, 21.0, 28.0, 43.0, 75.0, 139.0, 258.0, 475.0, 1948.0, 1034484.0, 9509.0, 790.0, 313.0, 155.0, 112.0, 55.0, 33.0, 26.0, 19.0, 14.0, 5.0, 5.0, 2.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.112192153930664e-05, -7.871631532907486e-05, -7.631070911884308e-05, -7.39051029086113e-05, -7.149949669837952e-05, -6.909389048814774e-05, -6.668828427791595e-05, -6.428267806768417e-05, -6.187707185745239e-05, -5.947146564722061e-05, -5.706585943698883e-05, -5.466025322675705e-05, -5.225464701652527e-05, -4.984904080629349e-05, -4.7443434596061707e-05, -4.5037828385829926e-05, -4.2632222175598145e-05, -4.0226615965366364e-05, -3.782100975513458e-05, -3.54154035449028e-05, -3.300979733467102e-05, -3.060419112443924e-05, -2.819858491420746e-05, -2.5792978703975677e-05, -2.3387372493743896e-05, -2.0981766283512115e-05, -1.8576160073280334e-05, -1.6170553863048553e-05, -1.3764947652816772e-05, -1.1359341442584991e-05, -8.95373523235321e-06, -6.5481290221214294e-06, -4.1425228118896484e-06, -1.7369166016578674e-06, 6.686896085739136e-07, 3.0742958188056946e-06, 5.479902029037476e-06, 7.885508239269257e-06, 1.0291114449501038e-05, 1.2696720659732819e-05, 1.51023268699646e-05, 1.750793308019638e-05, 1.991353929042816e-05, 2.2319145500659943e-05, 2.4724751710891724e-05, 2.7130357921123505e-05, 2.9535964131355286e-05, 3.194157034158707e-05, 3.434717655181885e-05, 3.675278276205063e-05, 3.915838897228241e-05, 4.156399518251419e-05, 4.396960139274597e-05, 4.637520760297775e-05, 4.8780813813209534e-05, 5.1186420023441315e-05, 5.3592026233673096e-05, 5.599763244390488e-05, 5.840323865413666e-05, 6.080884486436844e-05, 6.321445107460022e-05, 6.5620057284832e-05, 6.802566349506378e-05, 7.043126970529556e-05, 7.283687591552734e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 7.0, 6.0, 13.0, 18.0, 22.0, 31.0, 43.0, 57.0, 76.0, 137.0, 142.0, 109.0, 91.0, 62.0, 50.0, 44.0, 38.0, 13.0, 7.0, 10.0, 8.0, 7.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.711483001708984e-05, -6.532948464155197e-05, -6.35441392660141e-05, -6.175879389047623e-05, -5.9973448514938354e-05, -5.818810313940048e-05, -5.640275776386261e-05, -5.461741238832474e-05, -5.2832067012786865e-05, -5.104672163724899e-05, -4.926137626171112e-05, -4.747603088617325e-05, -4.5690685510635376e-05, -4.3905340135097504e-05, -4.211999475955963e-05, -4.033464938402176e-05, -3.854930400848389e-05, -3.6763958632946014e-05, -3.497861325740814e-05, -3.319326788187027e-05, -3.14079225063324e-05, -2.9622577130794525e-05, -2.7837231755256653e-05, -2.605188637971878e-05, -2.4266541004180908e-05, -2.2481195628643036e-05, -2.0695850253105164e-05, -1.891050487756729e-05, -1.712515950202942e-05, -1.5339814126491547e-05, -1.3554468750953674e-05, -1.1769123375415802e-05, -9.98377799987793e-06, -8.198432624340057e-06, -6.413087248802185e-06, -4.627741873264313e-06, -2.8423964977264404e-06, -1.0570511221885681e-06, 7.282942533493042e-07, 2.5136396288871765e-06, 4.298985004425049e-06, 6.084330379962921e-06, 7.869675755500793e-06, 9.655021131038666e-06, 1.1440366506576538e-05, 1.322571188211441e-05, 1.5011057257652283e-05, 1.6796402633190155e-05, 1.8581748008728027e-05, 2.03670933842659e-05, 2.2152438759803772e-05, 2.3937784135341644e-05, 2.5723129510879517e-05, 2.750847488641739e-05, 2.929382026195526e-05, 3.1079165637493134e-05, 3.2864511013031006e-05, 3.464985638856888e-05, 3.643520176410675e-05, 3.822054713964462e-05, 4.0005892515182495e-05, 4.179123789072037e-05, 4.357658326625824e-05, 4.536192864179611e-05, 4.7147274017333984e-05]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 11.0, 52.0, 716.0, 201.0, 24.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4307551980018616, -0.4211329221725464, -0.4115106761455536, -0.4018884301185608, -0.3922661542892456, -0.3826438784599304, -0.3730216324329376, -0.3633993864059448, -0.35377711057662964, -0.34415483474731445, -0.33453258872032166, -0.32491034269332886, -0.31528806686401367, -0.3056657910346985, -0.2960435450077057, -0.2864212989807129, -0.2767990231513977, -0.2671767473220825, -0.2575545012950897, -0.24793224036693573, -0.23830997943878174, -0.22868771851062775, -0.21906545758247375, -0.20944319665431976, -0.19982093572616577, -0.19019867479801178, -0.1805764138698578, -0.1709541529417038, -0.1613318920135498, -0.1517096310853958, -0.14208737015724182, -0.13246510922908783, -0.12284283339977264, -0.11322057247161865, -0.10359831154346466, -0.09397605061531067, -0.08435378968715668, -0.07473152875900269, -0.0651092678308487, -0.0554870069026947, -0.04586474597454071, -0.03624248504638672, -0.026620224118232727, -0.016997963190078735, -0.007375702261924744, 0.002246558666229248, 0.01186881959438324, 0.02149108052253723, 0.031113341450691223, 0.040735602378845215, 0.05035786330699921, 0.0599801242351532, 0.06960238516330719, 0.07922464609146118, 0.08884690701961517, 0.09846916794776917, 0.10809142887592316, 0.11771368980407715, 0.12733595073223114, 0.13695821166038513, 0.14658047258853912, 0.15620273351669312, 0.1658249944448471, 0.1754472553730011, 0.1850695163011551]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 9.0, 9.0, 9.0, 17.0, 23.0, 25.0, 21.0, 25.0, 34.0, 23.0, 33.0, 41.0, 34.0, 41.0, 53.0, 57.0, 54.0, 49.0, 36.0, 52.0, 52.0, 28.0, 34.0, 33.0, 31.0, 24.0, 23.0, 11.0, 21.0, 23.0, 12.0, 21.0, 10.0, 15.0, 9.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23304694890975952, -0.223457932472229, -0.21386893093585968, -0.20427991449832916, -0.19469091296195984, -0.18510189652442932, -0.1755128800868988, -0.16592387855052948, -0.15633487701416016, -0.14674586057662964, -0.13715685904026031, -0.1275678426027298, -0.11797884106636047, -0.10838982462882996, -0.09880081564188004, -0.08921180665493011, -0.0796227902173996, -0.07003378123044968, -0.060444772243499756, -0.05085575953125954, -0.041266750544309616, -0.031677741557359695, -0.022088728845119476, -0.012499719858169556, -0.002910710871219635, 0.00667829904705286, 0.016267308965325356, 0.025856319814920425, 0.035445328801870346, 0.04503433778882027, 0.054623350501060486, 0.0642123594880104, 0.07380136847496033, 0.08339037746191025, 0.09297938644886017, 0.10256840288639069, 0.11215740442276001, 0.12174642086029053, 0.13133543729782104, 0.14092443883419037, 0.1505134403705597, 0.1601024568080902, 0.16969145834445953, 0.17928047478199005, 0.18886947631835938, 0.1984584927558899, 0.2080475091934204, 0.21763651072978973, 0.22722552716732025, 0.23681454360485077, 0.2464035451412201, 0.2559925615787506, 0.26558157801628113, 0.27517056465148926, 0.2847595810890198, 0.2943485975265503, 0.3039376139640808, 0.31352663040161133, 0.32311564683914185, 0.33270463347435, 0.3422936499118805, 0.351882666349411, 0.36147168278694153, 0.37106066942214966, 0.3806496858596802]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 4.0, 6.0, 7.0, 6.0, 4.0, 8.0, 6.0, 5.0, 9.0, 4.0, 15.0, 19.0, 41.0, 49.0, 49.0, 1063.0, 4180859.0, 11200.0, 711.0, 55.0, 28.0, 17.0, 19.0, 19.0, 16.0, 12.0, 9.0, 8.0, 5.0, 4.0, 7.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07177734375, -0.0695199966430664, -0.06726264953613281, -0.06500530242919922, -0.06274795532226562, -0.06049060821533203, -0.05823326110839844, -0.055975914001464844, -0.05371856689453125, -0.051461219787597656, -0.04920387268066406, -0.04694652557373047, -0.044689178466796875, -0.04243183135986328, -0.04017448425292969, -0.037917137145996094, -0.0356597900390625, -0.033402442932128906, -0.031145095825195312, -0.02888774871826172, -0.026630401611328125, -0.02437305450439453, -0.022115707397460938, -0.019858360290527344, -0.01760101318359375, -0.015343666076660156, -0.013086318969726562, -0.010828971862792969, -0.008571624755859375, -0.006314277648925781, -0.0040569305419921875, -0.0017995834350585938, 0.000457763671875, 0.0027151107788085938, 0.0049724578857421875, 0.007229804992675781, 0.009487152099609375, 0.011744499206542969, 0.014001846313476562, 0.016259193420410156, 0.01851654052734375, 0.020773887634277344, 0.023031234741210938, 0.02528858184814453, 0.027545928955078125, 0.02980327606201172, 0.03206062316894531, 0.034317970275878906, 0.0365753173828125, 0.038832664489746094, 0.04109001159667969, 0.04334735870361328, 0.045604705810546875, 0.04786205291748047, 0.05011940002441406, 0.052376747131347656, 0.05463409423828125, 0.056891441345214844, 0.05914878845214844, 0.06140613555908203, 0.06366348266601562, 0.06592082977294922, 0.06817817687988281, 0.0704355239868164, 0.07269287109375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 1.0, 1.0, 2.0, 6.0, 1.0, 3.0, 3.0, 6.0, 12.0, 17.0, 16.0, 10.0, 46.0, 250.0, 405.0, 105.0, 21.0, 18.0, 10.0, 5.0, 9.0, 11.0, 10.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019866943359375, -0.019247770309448242, -0.018628597259521484, -0.018009424209594727, -0.01739025115966797, -0.01677107810974121, -0.016151905059814453, -0.015532732009887695, -0.014913558959960938, -0.01429438591003418, -0.013675212860107422, -0.013056039810180664, -0.012436866760253906, -0.011817693710327148, -0.01119852066040039, -0.010579347610473633, -0.009960174560546875, -0.009341001510620117, -0.00872182846069336, -0.008102655410766602, -0.007483482360839844, -0.006864309310913086, -0.006245136260986328, -0.00562596321105957, -0.0050067901611328125, -0.004387617111206055, -0.003768444061279297, -0.003149271011352539, -0.0025300979614257812, -0.0019109249114990234, -0.0012917518615722656, -0.0006725788116455078, -5.340576171875e-05, 0.0005657672882080078, 0.0011849403381347656, 0.0018041133880615234, 0.0024232864379882812, 0.003042459487915039, 0.003661632537841797, 0.004280805587768555, 0.0048999786376953125, 0.00551915168762207, 0.006138324737548828, 0.006757497787475586, 0.007376670837402344, 0.007995843887329102, 0.00861501693725586, 0.009234189987182617, 0.009853363037109375, 0.010472536087036133, 0.01109170913696289, 0.011710882186889648, 0.012330055236816406, 0.012949228286743164, 0.013568401336669922, 0.01418757438659668, 0.014806747436523438, 0.015425920486450195, 0.016045093536376953, 0.01666426658630371, 0.01728343963623047, 0.017902612686157227, 0.018521785736083984, 0.019140958786010742, 0.0197601318359375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 6.0, 9.0, 20.0, 45.0, 95.0, 300.0, 1008.0, 4574.0, 4170601.0, 15512.0, 1431.0, 414.0, 132.0, 59.0, 30.0, 14.0, 6.0, 3.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0222015380859375, -0.021561384201049805, -0.02092123031616211, -0.020281076431274414, -0.01964092254638672, -0.019000768661499023, -0.018360614776611328, -0.017720460891723633, -0.017080307006835938, -0.016440153121948242, -0.015799999237060547, -0.015159845352172852, -0.014519691467285156, -0.013879537582397461, -0.013239383697509766, -0.01259922981262207, -0.011959075927734375, -0.01131892204284668, -0.010678768157958984, -0.010038614273071289, -0.009398460388183594, -0.008758306503295898, -0.008118152618408203, -0.007477998733520508, -0.0068378448486328125, -0.006197690963745117, -0.005557537078857422, -0.0049173831939697266, -0.004277229309082031, -0.003637075424194336, -0.0029969215393066406, -0.0023567676544189453, -0.00171661376953125, -0.0010764598846435547, -0.0004363059997558594, 0.00020384788513183594, 0.0008440017700195312, 0.0014841556549072266, 0.002124309539794922, 0.002764463424682617, 0.0034046173095703125, 0.004044771194458008, 0.004684925079345703, 0.0053250789642333984, 0.005965232849121094, 0.006605386734008789, 0.007245540618896484, 0.00788569450378418, 0.008525848388671875, 0.00916600227355957, 0.009806156158447266, 0.010446310043334961, 0.011086463928222656, 0.011726617813110352, 0.012366771697998047, 0.013006925582885742, 0.013647079467773438, 0.014287233352661133, 0.014927387237548828, 0.015567541122436523, 0.01620769500732422, 0.016847848892211914, 0.01748800277709961, 0.018128156661987305, 0.018768310546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 10.0, 15.0, 26.0, 64.0, 493.0, 3278.0, 119.0, 30.0, 21.0, 7.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00795745849609375, -0.007684588432312012, -0.0074117183685302734, -0.007138848304748535, -0.006865978240966797, -0.006593108177185059, -0.00632023811340332, -0.006047368049621582, -0.005774497985839844, -0.0055016279220581055, -0.005228757858276367, -0.004955887794494629, -0.004683017730712891, -0.004410147666931152, -0.004137277603149414, -0.0038644075393676758, -0.0035915374755859375, -0.0033186674118041992, -0.003045797348022461, -0.0027729272842407227, -0.0025000572204589844, -0.002227187156677246, -0.001954317092895508, -0.0016814470291137695, -0.0014085769653320312, -0.001135706901550293, -0.0008628368377685547, -0.0005899667739868164, -0.0003170967102050781, -4.4226646423339844e-05, 0.00022864341735839844, 0.0005015134811401367, 0.000774383544921875, 0.0010472536087036133, 0.0013201236724853516, 0.0015929937362670898, 0.0018658638000488281, 0.0021387338638305664, 0.0024116039276123047, 0.002684473991394043, 0.0029573440551757812, 0.0032302141189575195, 0.003503084182739258, 0.003775954246520996, 0.004048824310302734, 0.004321694374084473, 0.004594564437866211, 0.004867434501647949, 0.0051403045654296875, 0.005413174629211426, 0.005686044692993164, 0.005958914756774902, 0.006231784820556641, 0.006504654884338379, 0.006777524948120117, 0.0070503950119018555, 0.007323265075683594, 0.007596135139465332, 0.00786900520324707, 0.008141875267028809, 0.008414745330810547, 0.008687615394592285, 0.008960485458374023, 0.009233355522155762, 0.0095062255859375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1013.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016311002895236015, -0.006879863329231739, 0.0025512762367725372, 0.011982416734099388, 0.02141355536878109, 0.03084469400346279, 0.04027583450078964, 0.049706973135471344, 0.059138111770153046, 0.06856925040483475, 0.07800038903951645, 0.08743153512477875, 0.09686267375946045, 0.10629381239414215, 0.11572495102882385, 0.12515608966350555, 0.13458722829818726, 0.14401836693286896, 0.15344950556755066, 0.16288064420223236, 0.17231178283691406, 0.18174292147159576, 0.19117406010627747, 0.20060521364212036, 0.21003635227680206, 0.21946749091148376, 0.22889862954616547, 0.23832976818084717, 0.24776090681552887, 0.25719204545021057, 0.26662319898605347, 0.276054322719574, 0.28548547625541687, 0.29491662979125977, 0.3043477535247803, 0.31377890706062317, 0.3232100307941437, 0.3326411843299866, 0.3420723080635071, 0.35150346159935, 0.3609345853328705, 0.3703657388687134, 0.3797968626022339, 0.3892280161380768, 0.3986591398715973, 0.4080902934074402, 0.4175214171409607, 0.4269525706768036, 0.4363837242126465, 0.4458148777484894, 0.4552460014820099, 0.4646771550178528, 0.4741082787513733, 0.4835394322872162, 0.4929705560207367, 0.5024017095565796, 0.5118328332901001, 0.5212639570236206, 0.5306951403617859, 0.5401262640953064, 0.5495573878288269, 0.5589885115623474, 0.5684196949005127, 0.5778508186340332, 0.5872819423675537]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 0.0, 9.0, 6.0, 9.0, 15.0, 15.0, 22.0, 27.0, 37.0, 41.0, 33.0, 38.0, 65.0, 84.0, 81.0, 70.0, 72.0, 79.0, 50.0, 60.0, 42.0, 41.0, 34.0, 24.0, 21.0, 9.0, 8.0, 7.0, 6.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015378296375274658, -0.014831936918199062, -0.014285577461123466, -0.01373921800404787, -0.013192858546972275, -0.012646499089896679, -0.012100139632821083, -0.011553780175745487, -0.011007420718669891, -0.010461061261594296, -0.0099147018045187, -0.009368342347443104, -0.008821982890367508, -0.008275623433291912, -0.007729263976216316, -0.00718290451914072, -0.0066365450620651245, -0.006090185604989529, -0.005543826147913933, -0.004997466690838337, -0.004451107233762741, -0.0039047477766871452, -0.0033583883196115494, -0.0028120288625359535, -0.0022656694054603577, -0.0017193099483847618, -0.001172950491309166, -0.0006265910342335701, -8.023157715797424e-05, 0.0004661278799176216, 0.0010124873369932175, 0.0015588467940688133, 0.002105206251144409, 0.002651565708220005, 0.003197925165295601, 0.0037442846223711967, 0.004290644079446793, 0.0048370035365223885, 0.005383362993597984, 0.00592972245067358, 0.006476081907749176, 0.007022441364824772, 0.007568800821900368, 0.008115160278975964, 0.00866151973605156, 0.009207879193127155, 0.009754238650202751, 0.010300598107278347, 0.010846957564353943, 0.011393317021429539, 0.011939676478505135, 0.01248603593558073, 0.013032395392656326, 0.013578754849731922, 0.014125114306807518, 0.014671473763883114, 0.01521783322095871, 0.01576419174671173, 0.0163105521351099, 0.016856912523508072, 0.017403271049261093, 0.017949629575014114, 0.018495989963412285, 0.019042350351810455, 0.019588708877563477]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 8.0, 11.0, 4.0, 9.0, 14.0, 17.0, 20.0, 37.0, 42.0, 72.0, 87.0, 129.0, 187.0, 304.0, 547.0, 999.0, 1862.0, 4038.0, 11348.0, 96464.0, 904549.0, 17091.0, 5511.0, 2271.0, 1171.0, 652.0, 377.0, 234.0, 149.0, 94.0, 73.0, 45.0, 45.0, 22.0, 17.0, 12.0, 7.0, 10.0, 5.0, 3.0, 8.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019744873046875, -0.019130706787109375, -0.01851654052734375, -0.017902374267578125, -0.0172882080078125, -0.016674041748046875, -0.01605987548828125, -0.015445709228515625, -0.01483154296875, -0.014217376708984375, -0.01360321044921875, -0.012989044189453125, -0.0123748779296875, -0.011760711669921875, -0.01114654541015625, -0.010532379150390625, -0.009918212890625, -0.009304046630859375, -0.00868988037109375, -0.008075714111328125, -0.0074615478515625, -0.006847381591796875, -0.00623321533203125, -0.005619049072265625, -0.0050048828125, -0.004390716552734375, -0.00377655029296875, -0.003162384033203125, -0.0025482177734375, -0.001934051513671875, -0.00131988525390625, -0.000705718994140625, -9.1552734375e-05, 0.000522613525390625, 0.00113677978515625, 0.001750946044921875, 0.0023651123046875, 0.002979278564453125, 0.00359344482421875, 0.004207611083984375, 0.00482177734375, 0.005435943603515625, 0.00605010986328125, 0.006664276123046875, 0.0072784423828125, 0.007892608642578125, 0.00850677490234375, 0.009120941162109375, 0.009735107421875, 0.010349273681640625, 0.01096343994140625, 0.011577606201171875, 0.0121917724609375, 0.012805938720703125, 0.01342010498046875, 0.014034271240234375, 0.0146484375, 0.015262603759765625, 0.01587677001953125, 0.016490936279296875, 0.0171051025390625, 0.017719268798828125, 0.01833343505859375, 0.018947601318359375, 0.019561767578125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 1.0, 1.0, 2.0, 6.0, 1.0, 3.0, 3.0, 6.0, 12.0, 17.0, 16.0, 10.0, 46.0, 251.0, 404.0, 105.0, 21.0, 18.0, 10.0, 5.0, 9.0, 11.0, 10.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019866943359375, -0.019247770309448242, -0.018628597259521484, -0.018009424209594727, -0.01739025115966797, -0.01677107810974121, -0.016151905059814453, -0.015532732009887695, -0.014913558959960938, -0.01429438591003418, -0.013675212860107422, -0.013056039810180664, -0.012436866760253906, -0.011817693710327148, -0.01119852066040039, -0.010579347610473633, -0.009960174560546875, -0.009341001510620117, -0.00872182846069336, -0.008102655410766602, -0.007483482360839844, -0.006864309310913086, -0.006245136260986328, -0.00562596321105957, -0.0050067901611328125, -0.004387617111206055, -0.003768444061279297, -0.003149271011352539, -0.0025300979614257812, -0.0019109249114990234, -0.0012917518615722656, -0.0006725788116455078, -5.340576171875e-05, 0.0005657672882080078, 0.0011849403381347656, 0.0018041133880615234, 0.0024232864379882812, 0.003042459487915039, 0.003661632537841797, 0.004280805587768555, 0.0048999786376953125, 0.00551915168762207, 0.006138324737548828, 0.006757497787475586, 0.007376670837402344, 0.007995843887329102, 0.00861501693725586, 0.009234189987182617, 0.009853363037109375, 0.010472536087036133, 0.01109170913696289, 0.011710882186889648, 0.012330055236816406, 0.012949228286743164, 0.013568401336669922, 0.01418757438659668, 0.014806747436523438, 0.015425920486450195, 0.016045093536376953, 0.01666426658630371, 0.01728343963623047, 0.017902612686157227, 0.018521785736083984, 0.019140958786010742, 0.0197601318359375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 3.0, 5.0, 7.0, 3.0, 12.0, 15.0, 26.0, 16.0, 21.0, 32.0, 50.0, 55.0, 83.0, 89.0, 114.0, 134.0, 194.0, 315.0, 593.0, 1426.0, 25646.0, 1004707.0, 12175.0, 1152.0, 543.0, 308.0, 212.0, 145.0, 78.0, 87.0, 73.0, 39.0, 29.0, 36.0, 30.0, 18.0, 16.0, 18.0, 11.0, 10.0, 3.0, 6.0, 11.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.031524658203125, -0.030521392822265625, -0.02951812744140625, -0.028514862060546875, -0.0275115966796875, -0.026508331298828125, -0.02550506591796875, -0.024501800537109375, -0.02349853515625, -0.022495269775390625, -0.02149200439453125, -0.020488739013671875, -0.0194854736328125, -0.018482208251953125, -0.01747894287109375, -0.016475677490234375, -0.015472412109375, -0.014469146728515625, -0.01346588134765625, -0.012462615966796875, -0.0114593505859375, -0.010456085205078125, -0.00945281982421875, -0.008449554443359375, -0.0074462890625, -0.006443023681640625, -0.00543975830078125, -0.004436492919921875, -0.0034332275390625, -0.002429962158203125, -0.00142669677734375, -0.000423431396484375, 0.000579833984375, 0.001583099365234375, 0.00258636474609375, 0.003589630126953125, 0.0045928955078125, 0.005596160888671875, 0.00659942626953125, 0.007602691650390625, 0.00860595703125, 0.009609222412109375, 0.01061248779296875, 0.011615753173828125, 0.0126190185546875, 0.013622283935546875, 0.01462554931640625, 0.015628814697265625, 0.016632080078125, 0.017635345458984375, 0.01863861083984375, 0.019641876220703125, 0.0206451416015625, 0.021648406982421875, 0.02265167236328125, 0.023654937744140625, 0.024658203125, 0.025661468505859375, 0.02666473388671875, 0.027667999267578125, 0.0286712646484375, 0.029674530029296875, 0.03067779541015625, 0.031681060791015625, 0.032684326171875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 3.0, 5.0, 5.0, 2.0, 8.0, 12.0, 21.0, 12.0, 10.0, 15.0, 29.0, 30.0, 33.0, 35.0, 42.0, 39.0, 36.0, 37.0, 29.0, 43.0, 39.0, 35.0, 34.0, 35.0, 37.0, 47.0, 42.0, 33.0, 34.0, 27.0, 33.0, 19.0, 15.0, 21.0, 20.0, 15.0, 12.0, 14.0, 9.0, 6.0, 5.0, 5.0, 11.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.039886474609375, -0.038616180419921875, -0.03734588623046875, -0.036075592041015625, -0.0348052978515625, -0.033535003662109375, -0.03226470947265625, -0.030994415283203125, -0.02972412109375, -0.028453826904296875, -0.02718353271484375, -0.025913238525390625, -0.0246429443359375, -0.023372650146484375, -0.02210235595703125, -0.020832061767578125, -0.019561767578125, -0.018291473388671875, -0.01702117919921875, -0.015750885009765625, -0.0144805908203125, -0.013210296630859375, -0.01194000244140625, -0.010669708251953125, -0.0093994140625, -0.008129119873046875, -0.00685882568359375, -0.005588531494140625, -0.0043182373046875, -0.003047943115234375, -0.00177764892578125, -0.000507354736328125, 0.000762939453125, 0.002033233642578125, 0.00330352783203125, 0.004573822021484375, 0.0058441162109375, 0.007114410400390625, 0.00838470458984375, 0.009654998779296875, 0.01092529296875, 0.012195587158203125, 0.01346588134765625, 0.014736175537109375, 0.0160064697265625, 0.017276763916015625, 0.01854705810546875, 0.019817352294921875, 0.021087646484375, 0.022357940673828125, 0.02362823486328125, 0.024898529052734375, 0.0261688232421875, 0.027439117431640625, 0.02870941162109375, 0.029979705810546875, 0.03125, 0.032520294189453125, 0.03379058837890625, 0.035060882568359375, 0.0363311767578125, 0.037601470947265625, 0.03887176513671875, 0.040142059326171875, 0.041412353515625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 10.0, 5.0, 17.0, 21.0, 30.0, 49.0, 79.0, 113.0, 208.0, 425.0, 816.0, 1961.0, 7426.0, 47921.0, 930445.0, 48914.0, 6379.0, 2061.0, 741.0, 392.0, 216.0, 117.0, 67.0, 44.0, 26.0, 23.0, 13.0, 9.0, 7.0, 4.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1278858184814453e-05, -2.0602717995643616e-05, -1.992657780647278e-05, -1.925043761730194e-05, -1.8574297428131104e-05, -1.7898157238960266e-05, -1.722201704978943e-05, -1.654587686061859e-05, -1.5869736671447754e-05, -1.5193596482276917e-05, -1.4517456293106079e-05, -1.3841316103935242e-05, -1.3165175914764404e-05, -1.2489035725593567e-05, -1.181289553642273e-05, -1.1136755347251892e-05, -1.0460615158081055e-05, -9.784474968910217e-06, -9.10833477973938e-06, -8.432194590568542e-06, -7.756054401397705e-06, -7.079914212226868e-06, -6.40377402305603e-06, -5.727633833885193e-06, -5.0514936447143555e-06, -4.375353455543518e-06, -3.6992132663726807e-06, -3.0230730772018433e-06, -2.346932888031006e-06, -1.6707926988601685e-06, -9.94652509689331e-07, -3.1851232051849365e-07, 3.5762786865234375e-07, 1.0337680578231812e-06, 1.7099082469940186e-06, 2.386048436164856e-06, 3.0621886253356934e-06, 3.7383288145065308e-06, 4.414469003677368e-06, 5.0906091928482056e-06, 5.766749382019043e-06, 6.44288957118988e-06, 7.119029760360718e-06, 7.795169949531555e-06, 8.471310138702393e-06, 9.14745032787323e-06, 9.823590517044067e-06, 1.0499730706214905e-05, 1.1175870895385742e-05, 1.185201108455658e-05, 1.2528151273727417e-05, 1.3204291462898254e-05, 1.3880431652069092e-05, 1.455657184123993e-05, 1.5232712030410767e-05, 1.5908852219581604e-05, 1.658499240875244e-05, 1.726113259792328e-05, 1.7937272787094116e-05, 1.8613412976264954e-05, 1.928955316543579e-05, 1.996569335460663e-05, 2.0641833543777466e-05, 2.1317973732948303e-05, 2.199411392211914e-05]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 5.0, 3.0, 4.0, 5.0, 2.0, 2.0, 5.0, 4.0, 9.0, 13.0, 17.0, 23.0, 33.0, 46.0, 30.0, 71.0, 67.0, 75.0, 62.0, 71.0, 76.0, 79.0, 31.0, 63.0, 38.0, 29.0, 48.0, 28.0, 14.0, 6.0, 13.0, 7.0, 5.0, 1.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.470348358154297e-06, -4.307366907596588e-06, -4.144385457038879e-06, -3.981404006481171e-06, -3.818422555923462e-06, -3.655441105365753e-06, -3.4924596548080444e-06, -3.3294782042503357e-06, -3.166496753692627e-06, -3.0035153031349182e-06, -2.8405338525772095e-06, -2.6775524020195007e-06, -2.514570951461792e-06, -2.3515895009040833e-06, -2.1886080503463745e-06, -2.0256265997886658e-06, -1.862645149230957e-06, -1.6996636986732483e-06, -1.5366822481155396e-06, -1.3737007975578308e-06, -1.210719347000122e-06, -1.0477378964424133e-06, -8.847564458847046e-07, -7.217749953269958e-07, -5.587935447692871e-07, -3.9581209421157837e-07, -2.3283064365386963e-07, -6.984919309616089e-08, 9.313225746154785e-08, 2.561137080192566e-07, 4.1909515857696533e-07, 5.820766091346741e-07, 7.450580596923828e-07, 9.080395102500916e-07, 1.0710209608078003e-06, 1.234002411365509e-06, 1.3969838619232178e-06, 1.5599653124809265e-06, 1.7229467630386353e-06, 1.885928213596344e-06, 2.0489096641540527e-06, 2.2118911147117615e-06, 2.3748725652694702e-06, 2.537854015827179e-06, 2.7008354663848877e-06, 2.8638169169425964e-06, 3.026798367500305e-06, 3.189779818058014e-06, 3.3527612686157227e-06, 3.5157427191734314e-06, 3.67872416973114e-06, 3.841705620288849e-06, 4.004687070846558e-06, 4.167668521404266e-06, 4.330649971961975e-06, 4.493631422519684e-06, 4.656612873077393e-06, 4.819594323635101e-06, 4.98257577419281e-06, 5.145557224750519e-06, 5.3085386753082275e-06, 5.471520125865936e-06, 5.634501576423645e-06, 5.797483026981354e-06, 5.9604644775390625e-06]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 5.0, 10.0, 14.0, 21.0, 22.0, 47.0, 111.0, 315.0, 1516.0, 1042033.0, 3786.0, 393.0, 126.0, 53.0, 27.0, 33.0, 20.0, 6.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.589557647705078e-05, -4.395097494125366e-05, -4.200637340545654e-05, -4.0061771869659424e-05, -3.8117170333862305e-05, -3.6172568798065186e-05, -3.4227967262268066e-05, -3.228336572647095e-05, -3.0338764190673828e-05, -2.839416265487671e-05, -2.644956111907959e-05, -2.450495958328247e-05, -2.256035804748535e-05, -2.0615756511688232e-05, -1.8671154975891113e-05, -1.6726553440093994e-05, -1.4781951904296875e-05, -1.2837350368499756e-05, -1.0892748832702637e-05, -8.948147296905518e-06, -7.0035457611083984e-06, -5.058944225311279e-06, -3.11434268951416e-06, -1.169741153717041e-06, 7.748603820800781e-07, 2.7194619178771973e-06, 4.664063453674316e-06, 6.6086649894714355e-06, 8.553266525268555e-06, 1.0497868061065674e-05, 1.2442469596862793e-05, 1.4387071132659912e-05, 1.633167266845703e-05, 1.827627420425415e-05, 2.022087574005127e-05, 2.216547727584839e-05, 2.4110078811645508e-05, 2.6054680347442627e-05, 2.7999281883239746e-05, 2.9943883419036865e-05, 3.1888484954833984e-05, 3.3833086490631104e-05, 3.577768802642822e-05, 3.772228956222534e-05, 3.966689109802246e-05, 4.161149263381958e-05, 4.35560941696167e-05, 4.550069570541382e-05, 4.744529724121094e-05, 4.938989877700806e-05, 5.1334500312805176e-05, 5.3279101848602295e-05, 5.5223703384399414e-05, 5.716830492019653e-05, 5.911290645599365e-05, 6.105750799179077e-05, 6.300210952758789e-05, 6.494671106338501e-05, 6.689131259918213e-05, 6.883591413497925e-05, 7.078051567077637e-05, 7.272511720657349e-05, 7.46697187423706e-05, 7.661432027816772e-05, 7.855892181396484e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 6.0, 4.0, 4.0, 3.0, 3.0, 7.0, 5.0, 13.0, 12.0, 26.0, 45.0, 75.0, 104.0, 243.0, 203.0, 87.0, 63.0, 41.0, 20.0, 12.0, 10.0, 10.0, 4.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.319978713989258e-05, -3.1109899282455444e-05, -2.902001142501831e-05, -2.6930123567581177e-05, -2.4840235710144043e-05, -2.275034785270691e-05, -2.0660459995269775e-05, -1.857057213783264e-05, -1.6480684280395508e-05, -1.4390796422958374e-05, -1.230090856552124e-05, -1.0211020708084106e-05, -8.121132850646973e-06, -6.031244993209839e-06, -3.941357135772705e-06, -1.8514692783355713e-06, 2.384185791015625e-07, 2.3283064365386963e-06, 4.41819429397583e-06, 6.508082151412964e-06, 8.597970008850098e-06, 1.0687857866287231e-05, 1.2777745723724365e-05, 1.4867633581161499e-05, 1.6957521438598633e-05, 1.9047409296035767e-05, 2.11372971534729e-05, 2.3227185010910034e-05, 2.5317072868347168e-05, 2.7406960725784302e-05, 2.9496848583221436e-05, 3.158673644065857e-05, 3.36766242980957e-05, 3.576651215553284e-05, 3.785640001296997e-05, 3.9946287870407104e-05, 4.203617572784424e-05, 4.412606358528137e-05, 4.6215951442718506e-05, 4.830583930015564e-05, 5.0395727157592773e-05, 5.248561501502991e-05, 5.457550287246704e-05, 5.6665390729904175e-05, 5.875527858734131e-05, 6.084516644477844e-05, 6.293505430221558e-05, 6.502494215965271e-05, 6.711483001708984e-05, 6.920471787452698e-05, 7.129460573196411e-05, 7.338449358940125e-05, 7.547438144683838e-05, 7.756426930427551e-05, 7.965415716171265e-05, 8.174404501914978e-05, 8.383393287658691e-05, 8.592382073402405e-05, 8.801370859146118e-05, 9.010359644889832e-05, 9.219348430633545e-05, 9.428337216377258e-05, 9.637326002120972e-05, 9.846314787864685e-05, 0.00010055303573608398]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 44.0, 921.0, 45.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12164964526891708, -0.1073518842458725, -0.09305412322282791, -0.07875636219978333, -0.06445860862731934, -0.05016084760427475, -0.035863086581230164, -0.021565325558185577, -0.007267564535140991, 0.00703019555658102, 0.021327955648303032, 0.03562571480870247, 0.049923475831747055, 0.06422123312950134, 0.07851899415254593, 0.09281675517559052, 0.1071145161986351, 0.12141227722167969, 0.13571003079414368, 0.15000779926776886, 0.16430555284023285, 0.17860332131385803, 0.19290107488632202, 0.207198828458786, 0.2214965969324112, 0.23579435050487518, 0.25009211897850037, 0.26438987255096436, 0.27868762612342834, 0.29298537969589233, 0.3072831630706787, 0.3215809166431427, 0.3358787000179291, 0.35017645359039307, 0.36447420716285706, 0.37877199053764343, 0.3930697441101074, 0.4073674976825714, 0.4216652512550354, 0.4359630346298218, 0.45026078820228577, 0.46455854177474976, 0.47885629534721375, 0.4931540787220001, 0.5074518322944641, 0.5217496156692505, 0.5360473394393921, 0.5503451228141785, 0.5646428465843201, 0.5789406299591064, 0.593238353729248, 0.6075361371040344, 0.621833860874176, 0.6361316442489624, 0.6504294276237488, 0.6647271513938904, 0.6790249347686768, 0.6933227181434631, 0.7076204419136047, 0.7219182252883911, 0.7362159490585327, 0.7505137324333191, 0.7648115158081055, 0.7791092395782471, 0.7934070229530334]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 5.0, 0.0, 6.0, 7.0, 10.0, 15.0, 8.0, 16.0, 22.0, 23.0, 27.0, 27.0, 41.0, 38.0, 52.0, 50.0, 45.0, 59.0, 46.0, 58.0, 45.0, 57.0, 60.0, 40.0, 30.0, 35.0, 38.0, 24.0, 23.0, 26.0, 18.0, 11.0, 12.0, 12.0, 5.0, 4.0, 7.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.28734254837036133, -0.27920255064964294, -0.27106255292892456, -0.2629225552082062, -0.2547825574874878, -0.24664254486560822, -0.23850254714488983, -0.23036254942417145, -0.22222253680229187, -0.2140825390815735, -0.2059425413608551, -0.19780254364013672, -0.18966253101825714, -0.18152253329753876, -0.17338253557682037, -0.165242537856102, -0.1571025401353836, -0.14896254241466522, -0.14082254469394684, -0.13268253207206726, -0.12454253435134888, -0.1164025366306305, -0.10826253890991211, -0.10012254118919373, -0.09198253601789474, -0.08384253829717636, -0.07570253312587738, -0.067562535405159, -0.059422533959150314, -0.05128253251314163, -0.04314253479242325, -0.035002533346414566, -0.026862531900405884, -0.0187225304543972, -0.010582530871033669, -0.0024425312876701355, 0.005697470158338547, 0.013837471604347229, 0.021977469325065613, 0.030117470771074295, 0.03825747221708298, 0.04639747366309166, 0.05453747510910034, 0.06267747282981873, 0.07081747055053711, 0.07895747572183609, 0.08709747344255447, 0.09523747861385345, 0.10337747633457184, 0.11151747405529022, 0.1196574792265892, 0.12779748439788818, 0.13593748211860657, 0.14407747983932495, 0.15221747756004333, 0.16035747528076172, 0.1684974730014801, 0.1766374707221985, 0.18477746844291687, 0.19291746616363525, 0.20105747878551483, 0.20919747650623322, 0.2173374742269516, 0.22547747194766998, 0.23361748456954956]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 5.0, 1.0, 1.0, 4.0, 7.0, 3.0, 4.0, 6.0, 12.0, 23.0, 23.0, 25.0, 30.0, 111.0, 4189373.0, 4375.0, 112.0, 48.0, 29.0, 16.0, 7.0, 15.0, 12.0, 10.0, 4.0, 5.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.202392578125, -0.19605064392089844, -0.18970870971679688, -0.1833667755126953, -0.17702484130859375, -0.1706829071044922, -0.16434097290039062, -0.15799903869628906, -0.1516571044921875, -0.14531517028808594, -0.13897323608398438, -0.1326313018798828, -0.12628936767578125, -0.11994743347167969, -0.11360549926757812, -0.10726356506347656, -0.100921630859375, -0.09457969665527344, -0.08823776245117188, -0.08189582824707031, -0.07555389404296875, -0.06921195983886719, -0.06287002563476562, -0.05652809143066406, -0.0501861572265625, -0.04384422302246094, -0.037502288818359375, -0.031160354614257812, -0.02481842041015625, -0.018476486206054688, -0.012134552001953125, -0.0057926177978515625, 0.00054931640625, 0.0068912506103515625, 0.013233184814453125, 0.019575119018554688, 0.02591705322265625, 0.03225898742675781, 0.038600921630859375, 0.04494285583496094, 0.0512847900390625, 0.05762672424316406, 0.06396865844726562, 0.07031059265136719, 0.07665252685546875, 0.08299446105957031, 0.08933639526367188, 0.09567832946777344, 0.102020263671875, 0.10836219787597656, 0.11470413208007812, 0.12104606628417969, 0.12738800048828125, 0.1337299346923828, 0.14007186889648438, 0.14641380310058594, 0.1527557373046875, 0.15909767150878906, 0.16543960571289062, 0.1717815399169922, 0.17812347412109375, 0.1844654083251953, 0.19080734252929688, 0.19714927673339844, 0.2034912109375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 3.0, 5.0, 13.0, 19.0, 16.0, 10.0, 58.0, 290.0, 369.0, 91.0, 20.0, 17.0, 9.0, 4.0, 10.0, 11.0, 10.0, 3.0, 4.0, 5.0, 1.0, 4.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019775390625, -0.019156932830810547, -0.018538475036621094, -0.01792001724243164, -0.017301559448242188, -0.016683101654052734, -0.01606464385986328, -0.015446186065673828, -0.014827728271484375, -0.014209270477294922, -0.013590812683105469, -0.012972354888916016, -0.012353897094726562, -0.01173543930053711, -0.011116981506347656, -0.010498523712158203, -0.00988006591796875, -0.009261608123779297, -0.008643150329589844, -0.00802469253540039, -0.0074062347412109375, -0.006787776947021484, -0.006169319152832031, -0.005550861358642578, -0.004932403564453125, -0.004313945770263672, -0.0036954879760742188, -0.0030770301818847656, -0.0024585723876953125, -0.0018401145935058594, -0.0012216567993164062, -0.0006031990051269531, 1.52587890625e-05, 0.0006337165832519531, 0.0012521743774414062, 0.0018706321716308594, 0.0024890899658203125, 0.0031075477600097656, 0.0037260055541992188, 0.004344463348388672, 0.004962921142578125, 0.005581378936767578, 0.006199836730957031, 0.006818294525146484, 0.0074367523193359375, 0.00805521011352539, 0.008673667907714844, 0.009292125701904297, 0.00991058349609375, 0.010529041290283203, 0.011147499084472656, 0.01176595687866211, 0.012384414672851562, 0.013002872467041016, 0.013621330261230469, 0.014239788055419922, 0.014858245849609375, 0.015476703643798828, 0.01609516143798828, 0.016713619232177734, 0.017332077026367188, 0.01795053482055664, 0.018568992614746094, 0.019187450408935547, 0.019805908203125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 9.0, 21.0, 65.0, 226.0, 638.0, 12560.0, 4179228.0, 1078.0, 307.0, 98.0, 29.0, 11.0, 8.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0267791748046875, -0.025891542434692383, -0.025003910064697266, -0.02411627769470215, -0.02322864532470703, -0.022341012954711914, -0.021453380584716797, -0.02056574821472168, -0.019678115844726562, -0.018790483474731445, -0.017902851104736328, -0.01701521873474121, -0.016127586364746094, -0.015239953994750977, -0.01435232162475586, -0.013464689254760742, -0.012577056884765625, -0.011689424514770508, -0.01080179214477539, -0.009914159774780273, -0.009026527404785156, -0.008138895034790039, -0.007251262664794922, -0.006363630294799805, -0.0054759979248046875, -0.00458836555480957, -0.003700733184814453, -0.002813100814819336, -0.0019254684448242188, -0.0010378360748291016, -0.00015020370483398438, 0.0007374286651611328, 0.00162506103515625, 0.002512693405151367, 0.0034003257751464844, 0.0042879581451416016, 0.005175590515136719, 0.006063222885131836, 0.006950855255126953, 0.00783848762512207, 0.008726119995117188, 0.009613752365112305, 0.010501384735107422, 0.011389017105102539, 0.012276649475097656, 0.013164281845092773, 0.01405191421508789, 0.014939546585083008, 0.015827178955078125, 0.016714811325073242, 0.01760244369506836, 0.018490076065063477, 0.019377708435058594, 0.02026534080505371, 0.021152973175048828, 0.022040605545043945, 0.022928237915039062, 0.02381587028503418, 0.024703502655029297, 0.025591135025024414, 0.02647876739501953, 0.02736639976501465, 0.028254032135009766, 0.029141664505004883, 0.030029296875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 8.0, 8.0, 24.0, 448.0, 3553.0, 21.0, 13.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00959014892578125, -0.009308338165283203, -0.009026527404785156, -0.00874471664428711, -0.008462905883789062, -0.008181095123291016, -0.007899284362792969, -0.007617473602294922, -0.007335662841796875, -0.007053852081298828, -0.006772041320800781, -0.006490230560302734, -0.0062084197998046875, -0.005926609039306641, -0.005644798278808594, -0.005362987518310547, -0.0050811767578125, -0.004799365997314453, -0.004517555236816406, -0.004235744476318359, -0.0039539337158203125, -0.0036721229553222656, -0.0033903121948242188, -0.003108501434326172, -0.002826690673828125, -0.002544879913330078, -0.0022630691528320312, -0.0019812583923339844, -0.0016994476318359375, -0.0014176368713378906, -0.0011358261108398438, -0.0008540153503417969, -0.00057220458984375, -0.0002903938293457031, -8.58306884765625e-06, 0.0002732276916503906, 0.0005550384521484375, 0.0008368492126464844, 0.0011186599731445312, 0.0014004707336425781, 0.001682281494140625, 0.001964092254638672, 0.0022459030151367188, 0.0025277137756347656, 0.0028095245361328125, 0.0030913352966308594, 0.0033731460571289062, 0.003654956817626953, 0.003936767578125, 0.004218578338623047, 0.004500389099121094, 0.004782199859619141, 0.0050640106201171875, 0.005345821380615234, 0.005627632141113281, 0.005909442901611328, 0.006191253662109375, 0.006473064422607422, 0.006754875183105469, 0.007036685943603516, 0.0073184967041015625, 0.007600307464599609, 0.007882118225097656, 0.008163928985595703, 0.00844573974609375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 869.0, 147.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04307457059621811, -0.0419674776494503, -0.040860384702682495, -0.03975329548120499, -0.03864620253443718, -0.03753910958766937, -0.036432020366191864, -0.03532492741942406, -0.03421783447265625, -0.03311074152588844, -0.032003648579120636, -0.030896559357643127, -0.02978946641087532, -0.028682373464107513, -0.027575282379984856, -0.026468191295862198, -0.02536109834909439, -0.024254005402326584, -0.023146914318203926, -0.02203982323408127, -0.02093273028731346, -0.019825637340545654, -0.018718546256422997, -0.01761145517230034, -0.016504362225532532, -0.0153972702100873, -0.014290178194642067, -0.013183086179196835, -0.012075994163751602, -0.01096890214830637, -0.009861810132861137, -0.008754718117415905, -0.007647629827260971, -0.006540537811815739, -0.005433445796370506, -0.004326353780925274, -0.0032192617654800415, -0.002112169750034809, -0.0010050777345895767, 0.00010201428085565567, 0.001209106296300888, 0.0023161983117461205, 0.003423290327191353, 0.004530382342636585, 0.005637474358081818, 0.00674456637352705, 0.007851658388972282, 0.008958750404417515, 0.010065842419862747, 0.01117293443530798, 0.012280026450753212, 0.013387118466198444, 0.014494210481643677, 0.01560130249708891, 0.01670839451253414, 0.0178154855966568, 0.018922578543424606, 0.020029671490192413, 0.02113676257431507, 0.02224385365843773, 0.023350946605205536, 0.024458039551973343, 0.025565130636096, 0.02667222172021866, 0.027779314666986465]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 3.0, 6.0, 10.0, 8.0, 10.0, 13.0, 19.0, 18.0, 22.0, 20.0, 21.0, 32.0, 29.0, 42.0, 37.0, 40.0, 58.0, 46.0, 48.0, 38.0, 44.0, 38.0, 46.0, 47.0, 41.0, 41.0, 35.0, 27.0, 41.0, 19.0, 16.0, 15.0, 22.0, 8.0, 12.0, 9.0, 5.0, 9.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006440162658691406, -0.006217312067747116, -0.005994461476802826, -0.005771610885858536, -0.005548760294914246, -0.0053259097039699554, -0.005103059113025665, -0.004880208522081375, -0.004657357931137085, -0.004434507340192795, -0.004211656749248505, -0.0039888061583042145, -0.0037659555673599243, -0.003543104976415634, -0.003320254385471344, -0.003097403794527054, -0.0028745532035827637, -0.0026517026126384735, -0.0024288520216941833, -0.002206001430749893, -0.001983150839805603, -0.0017603002488613129, -0.0015374496579170227, -0.0013145990669727325, -0.0010917484760284424, -0.0008688978850841522, -0.0006460472941398621, -0.0004231967031955719, -0.00020034611225128174, 2.2504478693008423e-05, 0.0002453550696372986, 0.00046820566058158875, 0.0006910562515258789, 0.0009139068424701691, 0.0011367574334144592, 0.0013596080243587494, 0.0015824586153030396, 0.0018053092062473297, 0.00202815979719162, 0.00225101038813591, 0.0024738609790802, 0.0026967115700244904, 0.0029195621609687805, 0.0031424127519130707, 0.003365263342857361, 0.003588113933801651, 0.003810964524745941, 0.004033815115690231, 0.0042566657066345215, 0.004479516297578812, 0.004702366888523102, 0.004925217479467392, 0.005148068070411682, 0.005370918661355972, 0.0055937692523002625, 0.005816619843244553, 0.006039470434188843, 0.006262321025133133, 0.006485171616077423, 0.006708022207021713, 0.006930872797966003, 0.007153723388910294, 0.007376573979854584, 0.007599424570798874, 0.007822275161743164]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 2.0, 2.0, 10.0, 15.0, 6.0, 22.0, 28.0, 35.0, 52.0, 47.0, 78.0, 109.0, 146.0, 233.0, 339.0, 494.0, 721.0, 1142.0, 1999.0, 3581.0, 7202.0, 19055.0, 725012.0, 255535.0, 17310.0, 6669.0, 3318.0, 1896.0, 1136.0, 744.0, 498.0, 326.0, 215.0, 166.0, 102.0, 81.0, 60.0, 50.0, 28.0, 25.0, 21.0, 6.0, 11.0, 8.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0147705078125, -0.014308333396911621, -0.013846158981323242, -0.013383984565734863, -0.012921810150146484, -0.012459635734558105, -0.011997461318969727, -0.011535286903381348, -0.011073112487792969, -0.01061093807220459, -0.010148763656616211, -0.009686589241027832, -0.009224414825439453, -0.008762240409851074, -0.008300065994262695, -0.007837891578674316, -0.0073757171630859375, -0.006913542747497559, -0.00645136833190918, -0.005989193916320801, -0.005527019500732422, -0.005064845085144043, -0.004602670669555664, -0.004140496253967285, -0.0036783218383789062, -0.0032161474227905273, -0.0027539730072021484, -0.0022917985916137695, -0.0018296241760253906, -0.0013674497604370117, -0.0009052753448486328, -0.0004431009292602539, 1.9073486328125e-05, 0.0004812479019165039, 0.0009434223175048828, 0.0014055967330932617, 0.0018677711486816406, 0.0023299455642700195, 0.0027921199798583984, 0.0032542943954467773, 0.0037164688110351562, 0.004178643226623535, 0.004640817642211914, 0.005102992057800293, 0.005565166473388672, 0.006027340888977051, 0.00648951530456543, 0.006951689720153809, 0.0074138641357421875, 0.007876038551330566, 0.008338212966918945, 0.008800387382507324, 0.009262561798095703, 0.009724736213684082, 0.010186910629272461, 0.01064908504486084, 0.011111259460449219, 0.011573433876037598, 0.012035608291625977, 0.012497782707214355, 0.012959957122802734, 0.013422131538391113, 0.013884305953979492, 0.014346480369567871, 0.01480865478515625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 3.0, 5.0, 13.0, 19.0, 16.0, 10.0, 57.0, 291.0, 369.0, 91.0, 20.0, 17.0, 9.0, 4.0, 10.0, 11.0, 10.0, 3.0, 4.0, 5.0, 1.0, 4.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019775390625, -0.019156932830810547, -0.018538475036621094, -0.01792001724243164, -0.017301559448242188, -0.016683101654052734, -0.01606464385986328, -0.015446186065673828, -0.014827728271484375, -0.014209270477294922, -0.013590812683105469, -0.012972354888916016, -0.012353897094726562, -0.01173543930053711, -0.011116981506347656, -0.010498523712158203, -0.00988006591796875, -0.009261608123779297, -0.008643150329589844, -0.00802469253540039, -0.0074062347412109375, -0.006787776947021484, -0.006169319152832031, -0.005550861358642578, -0.004932403564453125, -0.004313945770263672, -0.0036954879760742188, -0.0030770301818847656, -0.0024585723876953125, -0.0018401145935058594, -0.0012216567993164062, -0.0006031990051269531, 1.52587890625e-05, 0.0006337165832519531, 0.0012521743774414062, 0.0018706321716308594, 0.0024890899658203125, 0.0031075477600097656, 0.0037260055541992188, 0.004344463348388672, 0.004962921142578125, 0.005581378936767578, 0.006199836730957031, 0.006818294525146484, 0.0074367523193359375, 0.00805521011352539, 0.008673667907714844, 0.009292125701904297, 0.00991058349609375, 0.010529041290283203, 0.011147499084472656, 0.01176595687866211, 0.012384414672851562, 0.013002872467041016, 0.013621330261230469, 0.014239788055419922, 0.014858245849609375, 0.015476703643798828, 0.01609516143798828, 0.016713619232177734, 0.017332077026367188, 0.01795053482055664, 0.018568992614746094, 0.019187450408935547, 0.019805908203125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 7.0, 8.0, 12.0, 10.0, 14.0, 21.0, 17.0, 25.0, 27.0, 41.0, 43.0, 46.0, 62.0, 59.0, 103.0, 131.0, 194.0, 319.0, 533.0, 1348.0, 11500.0, 929446.0, 99249.0, 3129.0, 830.0, 437.0, 227.0, 167.0, 109.0, 75.0, 64.0, 57.0, 46.0, 34.0, 33.0, 30.0, 23.0, 22.0, 17.0, 7.0, 7.0, 5.0, 7.0, 8.0, 4.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0274810791015625, -0.02661585807800293, -0.02575063705444336, -0.02488541603088379, -0.02402019500732422, -0.02315497398376465, -0.022289752960205078, -0.021424531936645508, -0.020559310913085938, -0.019694089889526367, -0.018828868865966797, -0.017963647842407227, -0.017098426818847656, -0.016233205795288086, -0.015367984771728516, -0.014502763748168945, -0.013637542724609375, -0.012772321701049805, -0.011907100677490234, -0.011041879653930664, -0.010176658630371094, -0.009311437606811523, -0.008446216583251953, -0.007580995559692383, -0.0067157745361328125, -0.005850553512573242, -0.004985332489013672, -0.0041201114654541016, -0.0032548904418945312, -0.002389669418334961, -0.0015244483947753906, -0.0006592273712158203, 0.00020599365234375, 0.0010712146759033203, 0.0019364356994628906, 0.002801656723022461, 0.0036668777465820312, 0.0045320987701416016, 0.005397319793701172, 0.006262540817260742, 0.0071277618408203125, 0.007992982864379883, 0.008858203887939453, 0.009723424911499023, 0.010588645935058594, 0.011453866958618164, 0.012319087982177734, 0.013184309005737305, 0.014049530029296875, 0.014914751052856445, 0.015779972076416016, 0.016645193099975586, 0.017510414123535156, 0.018375635147094727, 0.019240856170654297, 0.020106077194213867, 0.020971298217773438, 0.021836519241333008, 0.022701740264892578, 0.02356696128845215, 0.02443218231201172, 0.02529740333557129, 0.02616262435913086, 0.02702784538269043, 0.02789306640625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 6.0, 5.0, 10.0, 8.0, 12.0, 11.0, 11.0, 18.0, 16.0, 22.0, 23.0, 25.0, 23.0, 29.0, 34.0, 34.0, 44.0, 46.0, 39.0, 40.0, 38.0, 26.0, 45.0, 42.0, 49.0, 38.0, 27.0, 33.0, 26.0, 33.0, 23.0, 25.0, 22.0, 19.0, 16.0, 16.0, 13.0, 13.0, 17.0, 4.0, 6.0, 3.0, 5.0, 5.0, 5.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.03948974609375, -0.03824615478515625, -0.0370025634765625, -0.03575897216796875, -0.034515380859375, -0.03327178955078125, -0.0320281982421875, -0.03078460693359375, -0.029541015625, -0.02829742431640625, -0.0270538330078125, -0.02581024169921875, -0.024566650390625, -0.02332305908203125, -0.0220794677734375, -0.02083587646484375, -0.01959228515625, -0.01834869384765625, -0.0171051025390625, -0.01586151123046875, -0.014617919921875, -0.01337432861328125, -0.0121307373046875, -0.01088714599609375, -0.0096435546875, -0.00839996337890625, -0.0071563720703125, -0.00591278076171875, -0.004669189453125, -0.00342559814453125, -0.0021820068359375, -0.00093841552734375, 0.00030517578125, 0.00154876708984375, 0.0027923583984375, 0.00403594970703125, 0.005279541015625, 0.00652313232421875, 0.0077667236328125, 0.00901031494140625, 0.01025390625, 0.01149749755859375, 0.0127410888671875, 0.01398468017578125, 0.015228271484375, 0.01647186279296875, 0.0177154541015625, 0.01895904541015625, 0.02020263671875, 0.02144622802734375, 0.0226898193359375, 0.02393341064453125, 0.025177001953125, 0.02642059326171875, 0.0276641845703125, 0.02890777587890625, 0.0301513671875, 0.03139495849609375, 0.0326385498046875, 0.03388214111328125, 0.035125732421875, 0.03636932373046875, 0.0376129150390625, 0.03885650634765625, 0.04010009765625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 12.0, 10.0, 9.0, 9.0, 24.0, 34.0, 38.0, 52.0, 80.0, 156.0, 178.0, 271.0, 360.0, 670.0, 879.0, 1958.0, 2916.0, 7614.0, 15639.0, 88125.0, 810682.0, 80499.0, 22760.0, 6638.0, 4147.0, 1736.0, 1168.0, 580.0, 470.0, 227.0, 212.0, 133.0, 66.0, 62.0, 34.0, 41.0, 12.0, 12.0, 8.0, 11.0, 4.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.821487426757812e-06, -8.550472557544708e-06, -8.279457688331604e-06, -8.0084428191185e-06, -7.737427949905396e-06, -7.466413080692291e-06, -7.195398211479187e-06, -6.924383342266083e-06, -6.6533684730529785e-06, -6.382353603839874e-06, -6.11133873462677e-06, -5.840323865413666e-06, -5.5693089962005615e-06, -5.298294126987457e-06, -5.027279257774353e-06, -4.756264388561249e-06, -4.4852495193481445e-06, -4.21423465013504e-06, -3.943219780921936e-06, -3.6722049117088318e-06, -3.4011900424957275e-06, -3.1301751732826233e-06, -2.859160304069519e-06, -2.588145434856415e-06, -2.3171305656433105e-06, -2.0461156964302063e-06, -1.775100827217102e-06, -1.5040859580039978e-06, -1.2330710887908936e-06, -9.620562195777893e-07, -6.910413503646851e-07, -4.200264811515808e-07, -1.4901161193847656e-07, 1.2200325727462769e-07, 3.9301812648773193e-07, 6.640329957008362e-07, 9.350478649139404e-07, 1.2060627341270447e-06, 1.477077603340149e-06, 1.7480924725532532e-06, 2.0191073417663574e-06, 2.2901222109794617e-06, 2.561137080192566e-06, 2.83215194940567e-06, 3.1031668186187744e-06, 3.3741816878318787e-06, 3.645196557044983e-06, 3.916211426258087e-06, 4.187226295471191e-06, 4.458241164684296e-06, 4.7292560338974e-06, 5.000270903110504e-06, 5.271285772323608e-06, 5.542300641536713e-06, 5.813315510749817e-06, 6.084330379962921e-06, 6.355345249176025e-06, 6.62636011838913e-06, 6.897374987602234e-06, 7.168389856815338e-06, 7.439404726028442e-06, 7.710419595241547e-06, 7.981434464454651e-06, 8.252449333667755e-06, 8.52346420288086e-06]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 5.0, 7.0, 18.0, 15.0, 20.0, 27.0, 36.0, 39.0, 77.0, 46.0, 85.0, 77.0, 102.0, 58.0, 92.0, 62.0, 73.0, 45.0, 39.0, 14.0, 15.0, 12.0, 11.0, 5.0, 5.0, 4.0, 4.0, 1.0, 4.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.066394805908203e-06, -4.9173831939697266e-06, -4.76837158203125e-06, -4.6193599700927734e-06, -4.470348358154297e-06, -4.32133674621582e-06, -4.172325134277344e-06, -4.023313522338867e-06, -3.874301910400391e-06, -3.725290298461914e-06, -3.5762786865234375e-06, -3.427267074584961e-06, -3.2782554626464844e-06, -3.129243850708008e-06, -2.9802322387695312e-06, -2.8312206268310547e-06, -2.682209014892578e-06, -2.5331974029541016e-06, -2.384185791015625e-06, -2.2351741790771484e-06, -2.086162567138672e-06, -1.9371509552001953e-06, -1.7881393432617188e-06, -1.6391277313232422e-06, -1.4901161193847656e-06, -1.341104507446289e-06, -1.1920928955078125e-06, -1.043081283569336e-06, -8.940696716308594e-07, -7.450580596923828e-07, -5.960464477539062e-07, -4.470348358154297e-07, -2.980232238769531e-07, -1.4901161193847656e-07, 0.0, 1.4901161193847656e-07, 2.980232238769531e-07, 4.470348358154297e-07, 5.960464477539062e-07, 7.450580596923828e-07, 8.940696716308594e-07, 1.043081283569336e-06, 1.1920928955078125e-06, 1.341104507446289e-06, 1.4901161193847656e-06, 1.6391277313232422e-06, 1.7881393432617188e-06, 1.9371509552001953e-06, 2.086162567138672e-06, 2.2351741790771484e-06, 2.384185791015625e-06, 2.5331974029541016e-06, 2.682209014892578e-06, 2.8312206268310547e-06, 2.9802322387695312e-06, 3.129243850708008e-06, 3.2782554626464844e-06, 3.427267074584961e-06, 3.5762786865234375e-06, 3.725290298461914e-06, 3.874301910400391e-06, 4.023313522338867e-06, 4.172325134277344e-06, 4.32133674621582e-06, 4.470348358154297e-06]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 2.0, 7.0, 0.0, 9.0, 8.0, 8.0, 18.0, 28.0, 37.0, 64.0, 111.0, 215.0, 736.0, 11247.0, 1032216.0, 3011.0, 411.0, 175.0, 89.0, 62.0, 34.0, 21.0, 14.0, 10.0, 5.0, 2.0, 5.0, 7.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.0471553802490234e-05, -3.935769200325012e-05, -3.824383020401001e-05, -3.71299684047699e-05, -3.6016106605529785e-05, -3.490224480628967e-05, -3.378838300704956e-05, -3.267452120780945e-05, -3.1560659408569336e-05, -3.0446797609329224e-05, -2.933293581008911e-05, -2.8219074010849e-05, -2.7105212211608887e-05, -2.5991350412368774e-05, -2.4877488613128662e-05, -2.376362681388855e-05, -2.2649765014648438e-05, -2.1535903215408325e-05, -2.0422041416168213e-05, -1.93081796169281e-05, -1.8194317817687988e-05, -1.7080456018447876e-05, -1.5966594219207764e-05, -1.4852732419967651e-05, -1.3738870620727539e-05, -1.2625008821487427e-05, -1.1511147022247314e-05, -1.0397285223007202e-05, -9.28342342376709e-06, -8.169561624526978e-06, -7.055699825286865e-06, -5.941838026046753e-06, -4.827976226806641e-06, -3.7141144275665283e-06, -2.600252628326416e-06, -1.4863908290863037e-06, -3.725290298461914e-07, 7.413327693939209e-07, 1.8551945686340332e-06, 2.9690563678741455e-06, 4.082918167114258e-06, 5.19677996635437e-06, 6.310641765594482e-06, 7.424503564834595e-06, 8.538365364074707e-06, 9.65222716331482e-06, 1.0766088962554932e-05, 1.1879950761795044e-05, 1.2993812561035156e-05, 1.4107674360275269e-05, 1.5221536159515381e-05, 1.6335397958755493e-05, 1.7449259757995605e-05, 1.8563121557235718e-05, 1.967698335647583e-05, 2.0790845155715942e-05, 2.1904706954956055e-05, 2.3018568754196167e-05, 2.413243055343628e-05, 2.524629235267639e-05, 2.6360154151916504e-05, 2.7474015951156616e-05, 2.858787775039673e-05, 2.970173954963684e-05, 3.081560134887695e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 6.0, 3.0, 7.0, 9.0, 16.0, 16.0, 22.0, 28.0, 48.0, 71.0, 114.0, 238.0, 133.0, 87.0, 60.0, 39.0, 37.0, 21.0, 19.0, 7.0, 7.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.823373794555664e-05, -5.6692399084568024e-05, -5.515106022357941e-05, -5.360972136259079e-05, -5.206838250160217e-05, -5.0527043640613556e-05, -4.898570477962494e-05, -4.744436591863632e-05, -4.5903027057647705e-05, -4.436168819665909e-05, -4.282034933567047e-05, -4.1279010474681854e-05, -3.973767161369324e-05, -3.819633275270462e-05, -3.6654993891716003e-05, -3.5113655030727386e-05, -3.357231616973877e-05, -3.203097730875015e-05, -3.0489638447761536e-05, -2.894829958677292e-05, -2.7406960725784302e-05, -2.5865621864795685e-05, -2.4324283003807068e-05, -2.278294414281845e-05, -2.1241605281829834e-05, -1.9700266420841217e-05, -1.81589275598526e-05, -1.6617588698863983e-05, -1.5076249837875366e-05, -1.353491097688675e-05, -1.1993572115898132e-05, -1.0452233254909515e-05, -8.910894393920898e-06, -7.3695555329322815e-06, -5.8282166719436646e-06, -4.286877810955048e-06, -2.7455389499664307e-06, -1.2042000889778137e-06, 3.371387720108032e-07, 1.8784776329994202e-06, 3.419816493988037e-06, 4.961155354976654e-06, 6.502494215965271e-06, 8.043833076953888e-06, 9.585171937942505e-06, 1.1126510798931122e-05, 1.2667849659919739e-05, 1.4209188520908356e-05, 1.5750527381896973e-05, 1.729186624288559e-05, 1.8833205103874207e-05, 2.0374543964862823e-05, 2.191588282585144e-05, 2.3457221686840057e-05, 2.4998560547828674e-05, 2.653989940881729e-05, 2.8081238269805908e-05, 2.9622577130794525e-05, 3.116391599178314e-05, 3.270525485277176e-05, 3.4246593713760376e-05, 3.578793257474899e-05, 3.732927143573761e-05, 3.887061029672623e-05, 4.0411949157714844e-05]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 15.0, 77.0, 756.0, 146.0, 15.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07345671206712723, -0.06657340377569199, -0.059690095484256744, -0.0528067909181118, -0.04592348262667656, -0.03904017433524132, -0.032156869769096375, -0.025273561477661133, -0.01839025318622589, -0.011506945826113224, -0.004623638466000557, 0.0022596679627895355, 0.009142976254224777, 0.01602628454566002, 0.022909589111804962, 0.029792897403240204, 0.036676205694675446, 0.04355951398611069, 0.05044282227754593, 0.05732612684369087, 0.06420943140983582, 0.07109273970127106, 0.0779760479927063, 0.08485935628414154, 0.09174266457557678, 0.09862597286701202, 0.10550928115844727, 0.11239258944988251, 0.11927589774131775, 0.126159206032753, 0.13304251432418823, 0.13992580771446228, 0.14680913090705872, 0.15369243919849396, 0.1605757474899292, 0.16745905578136444, 0.17434236407279968, 0.18122567236423492, 0.18810898065567017, 0.1949922740459442, 0.20187559723854065, 0.2087589055299759, 0.21564221382141113, 0.22252552211284637, 0.22940883040428162, 0.23629213869571686, 0.2431754469871521, 0.25005874037742615, 0.2569420337677002, 0.26382532715797424, 0.2707086503505707, 0.2775919437408447, 0.28447526693344116, 0.2913585603237152, 0.29824188351631165, 0.3051251769065857, 0.31200850009918213, 0.3188917934894562, 0.3257751166820526, 0.33265841007232666, 0.3395417332649231, 0.34642502665519714, 0.3533083498477936, 0.3601916432380676, 0.36707496643066406]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 7.0, 8.0, 12.0, 20.0, 24.0, 9.0, 17.0, 23.0, 28.0, 30.0, 31.0, 31.0, 43.0, 35.0, 42.0, 52.0, 47.0, 48.0, 58.0, 60.0, 42.0, 51.0, 41.0, 35.0, 26.0, 24.0, 18.0, 17.0, 12.0, 18.0, 16.0, 14.0, 10.0, 8.0, 6.0, 5.0, 5.0, 7.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.17874622344970703, -0.1722867786884308, -0.16582733392715454, -0.1593678891658783, -0.15290844440460205, -0.1464489996433258, -0.13998955488204956, -0.13353011012077332, -0.12707066535949707, -0.12061122059822083, -0.11415177583694458, -0.10769233107566833, -0.10123288631439209, -0.09477344155311584, -0.088313989341259, -0.08185454457998276, -0.07539509236812592, -0.06893564760684967, -0.062476202845573425, -0.05601675435900688, -0.04955730959773064, -0.04309786483645439, -0.03663841634988785, -0.030178971588611603, -0.023719526827335358, -0.017260082066059113, -0.010800635442137718, -0.004341188818216324, 0.0021182559430599213, 0.008577700704336166, 0.01503714919090271, 0.021496593952178955, 0.0279560387134552, 0.034415483474731445, 0.04087492823600769, 0.047334376722574234, 0.05379382148385048, 0.060253266245126724, 0.06671271473169327, 0.07317215949296951, 0.07963160425424576, 0.086091049015522, 0.09255049377679825, 0.09900994598865509, 0.10546939074993134, 0.11192883551120758, 0.11838828027248383, 0.12484772503376007, 0.13130716979503632, 0.13776661455631256, 0.1442260593175888, 0.15068550407886505, 0.1571449488401413, 0.16360439360141754, 0.17006385326385498, 0.17652329802513123, 0.18298274278640747, 0.18944218754768372, 0.19590163230895996, 0.2023610770702362, 0.20882052183151245, 0.2152799665927887, 0.22173941135406494, 0.2281988561153412, 0.23465830087661743]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 6.0, 0.0, 1.0, 2.0, 6.0, 2.0, 3.0, 2.0, 7.0, 14.0, 19.0, 21.0, 21.0, 143.0, 4193415.0, 429.0, 88.0, 23.0, 11.0, 9.0, 2.0, 13.0, 9.0, 9.0, 3.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45068359375, -0.43648529052734375, -0.4222869873046875, -0.40808868408203125, -0.393890380859375, -0.37969207763671875, -0.3654937744140625, -0.35129547119140625, -0.33709716796875, -0.32289886474609375, -0.3087005615234375, -0.29450225830078125, -0.280303955078125, -0.26610565185546875, -0.2519073486328125, -0.23770904541015625, -0.2235107421875, -0.20931243896484375, -0.1951141357421875, -0.18091583251953125, -0.166717529296875, -0.15251922607421875, -0.1383209228515625, -0.12412261962890625, -0.10992431640625, -0.09572601318359375, -0.0815277099609375, -0.06732940673828125, -0.053131103515625, -0.03893280029296875, -0.0247344970703125, -0.01053619384765625, 0.003662109375, 0.01786041259765625, 0.0320587158203125, 0.04625701904296875, 0.060455322265625, 0.07465362548828125, 0.0888519287109375, 0.10305023193359375, 0.11724853515625, 0.13144683837890625, 0.1456451416015625, 0.15984344482421875, 0.174041748046875, 0.18824005126953125, 0.2024383544921875, 0.21663665771484375, 0.2308349609375, 0.24503326416015625, 0.2592315673828125, 0.27342987060546875, 0.287628173828125, 0.30182647705078125, 0.3160247802734375, 0.33022308349609375, 0.34442138671875, 0.35861968994140625, 0.3728179931640625, 0.38701629638671875, 0.401214599609375, 0.41541290283203125, 0.4296112060546875, 0.44380950927734375, 0.4580078125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 3.0, 7.0, 13.0, 20.0, 15.0, 13.0, 85.0, 342.0, 307.0, 75.0, 21.0, 12.0, 10.0, 2.0, 12.0, 8.0, 10.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0196075439453125, -0.018990755081176758, -0.018373966217041016, -0.017757177352905273, -0.01714038848876953, -0.01652359962463379, -0.015906810760498047, -0.015290021896362305, -0.014673233032226562, -0.01405644416809082, -0.013439655303955078, -0.012822866439819336, -0.012206077575683594, -0.011589288711547852, -0.01097249984741211, -0.010355710983276367, -0.009738922119140625, -0.009122133255004883, -0.00850534439086914, -0.007888555526733398, -0.007271766662597656, -0.006654977798461914, -0.006038188934326172, -0.00542140007019043, -0.0048046112060546875, -0.004187822341918945, -0.003571033477783203, -0.002954244613647461, -0.0023374557495117188, -0.0017206668853759766, -0.0011038780212402344, -0.0004870891571044922, 0.00012969970703125, 0.0007464885711669922, 0.0013632774353027344, 0.0019800662994384766, 0.0025968551635742188, 0.003213644027709961, 0.003830432891845703, 0.004447221755981445, 0.0050640106201171875, 0.00568079948425293, 0.006297588348388672, 0.006914377212524414, 0.007531166076660156, 0.008147954940795898, 0.00876474380493164, 0.009381532669067383, 0.009998321533203125, 0.010615110397338867, 0.01123189926147461, 0.011848688125610352, 0.012465476989746094, 0.013082265853881836, 0.013699054718017578, 0.01431584358215332, 0.014932632446289062, 0.015549421310424805, 0.016166210174560547, 0.01678299903869629, 0.01739978790283203, 0.018016576766967773, 0.018633365631103516, 0.019250154495239258, 0.019866943359375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 9.0, 57.0, 134.0, 229.0, 4188416.0, 5108.0, 175.0, 118.0, 41.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10382080078125, -0.10076045989990234, -0.09770011901855469, -0.09463977813720703, -0.09157943725585938, -0.08851909637451172, -0.08545875549316406, -0.0823984146118164, -0.07933807373046875, -0.0762777328491211, -0.07321739196777344, -0.07015705108642578, -0.06709671020507812, -0.06403636932373047, -0.06097602844238281, -0.057915687561035156, -0.0548553466796875, -0.051795005798339844, -0.04873466491699219, -0.04567432403564453, -0.042613983154296875, -0.03955364227294922, -0.03649330139160156, -0.033432960510253906, -0.03037261962890625, -0.027312278747558594, -0.024251937866210938, -0.02119159698486328, -0.018131256103515625, -0.015070915222167969, -0.012010574340820312, -0.008950233459472656, -0.005889892578125, -0.0028295516967773438, 0.0002307891845703125, 0.0032911300659179688, 0.006351470947265625, 0.009411811828613281, 0.012472152709960938, 0.015532493591308594, 0.01859283447265625, 0.021653175354003906, 0.024713516235351562, 0.02777385711669922, 0.030834197998046875, 0.03389453887939453, 0.03695487976074219, 0.040015220642089844, 0.0430755615234375, 0.046135902404785156, 0.04919624328613281, 0.05225658416748047, 0.055316925048828125, 0.05837726593017578, 0.06143760681152344, 0.0644979476928711, 0.06755828857421875, 0.0706186294555664, 0.07367897033691406, 0.07673931121826172, 0.07979965209960938, 0.08285999298095703, 0.08592033386230469, 0.08898067474365234, 0.092041015625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 40.0, 4023.0, 15.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.02752685546875, -0.02705511450767517, -0.026583373546600342, -0.026111632585525513, -0.025639891624450684, -0.025168150663375854, -0.024696409702301025, -0.024224668741226196, -0.023752927780151367, -0.023281186819076538, -0.02280944585800171, -0.02233770489692688, -0.02186596393585205, -0.02139422297477722, -0.020922482013702393, -0.020450741052627563, -0.019979000091552734, -0.019507259130477905, -0.019035518169403076, -0.018563777208328247, -0.018092036247253418, -0.01762029528617859, -0.01714855432510376, -0.01667681336402893, -0.0162050724029541, -0.015733331441879272, -0.015261590480804443, -0.014789849519729614, -0.014318108558654785, -0.013846367597579956, -0.013374626636505127, -0.012902885675430298, -0.012431144714355469, -0.01195940375328064, -0.01148766279220581, -0.011015921831130981, -0.010544180870056152, -0.010072439908981323, -0.009600698947906494, -0.009128957986831665, -0.008657217025756836, -0.008185476064682007, -0.007713735103607178, -0.007241994142532349, -0.0067702531814575195, -0.00629851222038269, -0.005826771259307861, -0.005355030298233032, -0.004883289337158203, -0.004411548376083374, -0.003939807415008545, -0.003468066453933716, -0.0029963254928588867, -0.0025245845317840576, -0.0020528435707092285, -0.0015811026096343994, -0.0011093616485595703, -0.0006376206874847412, -0.0001658797264099121, 0.000305861234664917, 0.0007776021957397461, 0.0012493431568145752, 0.0017210841178894043, 0.0021928250789642334, 0.0026645660400390625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1010.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.264337956905365, -0.2596517503261566, -0.25496554374694824, -0.25027933716773987, -0.2455931305885315, -0.24090690910816193, -0.23622070252895355, -0.23153449594974518, -0.2268482893705368, -0.22216208279132843, -0.21747587621212006, -0.21278966963291168, -0.20810344815254211, -0.20341724157333374, -0.19873103499412537, -0.194044828414917, -0.18935862183570862, -0.18467241525650024, -0.17998620867729187, -0.1753000020980835, -0.17061379551887512, -0.16592757403850555, -0.16124136745929718, -0.1565551608800888, -0.15186895430088043, -0.14718274772167206, -0.14249654114246368, -0.1378103345632553, -0.13312411308288574, -0.12843790650367737, -0.123751699924469, -0.11906549334526062, -0.11437928676605225, -0.10969308018684387, -0.1050068736076355, -0.10032065957784653, -0.09563445299863815, -0.09094824641942978, -0.08626203238964081, -0.08157582581043243, -0.07688961923122406, -0.07220341265201569, -0.06751720607280731, -0.06283099204301834, -0.05814478546380997, -0.05345857888460159, -0.04877236858010292, -0.04408615827560425, -0.039399951696395874, -0.0347137451171875, -0.030027534812688828, -0.025341326370835304, -0.02065511792898178, -0.015968909487128258, -0.011282701045274734, -0.006596490740776062, -0.001910284161567688, 0.0027759242802858353, 0.0074621327221393585, 0.012148341163992882, 0.016834549605846405, 0.02152075804769993, 0.02620696648955345, 0.030893176794052124, 0.0355793833732605]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 6.0, 2.0, 2.0, 4.0, 5.0, 7.0, 8.0, 13.0, 8.0, 15.0, 8.0, 23.0, 21.0, 28.0, 17.0, 39.0, 39.0, 40.0, 32.0, 39.0, 49.0, 39.0, 38.0, 47.0, 50.0, 41.0, 36.0, 33.0, 29.0, 36.0, 41.0, 28.0, 29.0, 18.0, 24.0, 21.0, 14.0, 13.0, 26.0, 10.0, 10.0, 5.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011171936988830566, -0.01081587839871645, -0.010459819808602333, -0.010103761218488216, -0.0097477026283741, -0.009391644038259983, -0.009035585448145866, -0.00867952685803175, -0.008323468267917633, -0.007967409677803516, -0.0076113510876894, -0.007255292497575283, -0.006899233907461166, -0.00654317531734705, -0.006187116727232933, -0.005831058137118816, -0.0054749995470047, -0.005118940956890583, -0.004762882366776466, -0.00440682377666235, -0.004050765186548233, -0.0036947065964341164, -0.0033386480063199997, -0.002982589416205883, -0.0026265308260917664, -0.0022704722359776497, -0.001914413645863533, -0.0015583550557494164, -0.0012022964656352997, -0.000846237875521183, -0.0004901792854070663, -0.00013412069529294968, 0.000221937894821167, 0.0005779964849352837, 0.0009340550750494003, 0.001290113665163517, 0.0016461722552776337, 0.0020022308453917503, 0.002358289435505867, 0.0027143480256199837, 0.0030704066157341003, 0.003426465205848217, 0.0037825237959623337, 0.00413858238607645, 0.004494640976190567, 0.004850699566304684, 0.0052067581564188, 0.005562816746532917, 0.005918875336647034, 0.00627493392676115, 0.006630992516875267, 0.006987051106989384, 0.0073431096971035, 0.007699168287217617, 0.008055226877331734, 0.00841128546744585, 0.008767344057559967, 0.009123402647674084, 0.0094794612377882, 0.009835519827902317, 0.010191578418016434, 0.01054763700813055, 0.010903695598244667, 0.011259754188358784, 0.0116158127784729]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 5.0, 11.0, 9.0, 13.0, 22.0, 54.0, 51.0, 82.0, 109.0, 133.0, 233.0, 338.0, 629.0, 890.0, 1554.0, 2896.0, 5653.0, 14042.0, 93113.0, 889195.0, 22922.0, 7657.0, 3739.0, 1982.0, 1178.0, 704.0, 453.0, 267.0, 195.0, 121.0, 92.0, 51.0, 40.0, 34.0, 18.0, 14.0, 16.0, 4.0, 10.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.028778076171875, -0.027884244918823242, -0.026990413665771484, -0.026096582412719727, -0.02520275115966797, -0.02430891990661621, -0.023415088653564453, -0.022521257400512695, -0.021627426147460938, -0.02073359489440918, -0.019839763641357422, -0.018945932388305664, -0.018052101135253906, -0.01715826988220215, -0.01626443862915039, -0.015370607376098633, -0.014476776123046875, -0.013582944869995117, -0.01268911361694336, -0.011795282363891602, -0.010901451110839844, -0.010007619857788086, -0.009113788604736328, -0.00821995735168457, -0.0073261260986328125, -0.006432294845581055, -0.005538463592529297, -0.004644632339477539, -0.0037508010864257812, -0.0028569698333740234, -0.0019631385803222656, -0.0010693073272705078, -0.00017547607421875, 0.0007183551788330078, 0.0016121864318847656, 0.0025060176849365234, 0.0033998489379882812, 0.004293680191040039, 0.005187511444091797, 0.006081342697143555, 0.0069751739501953125, 0.00786900520324707, 0.008762836456298828, 0.009656667709350586, 0.010550498962402344, 0.011444330215454102, 0.01233816146850586, 0.013231992721557617, 0.014125823974609375, 0.015019655227661133, 0.01591348648071289, 0.01680731773376465, 0.017701148986816406, 0.018594980239868164, 0.019488811492919922, 0.02038264274597168, 0.021276473999023438, 0.022170305252075195, 0.023064136505126953, 0.02395796775817871, 0.02485179901123047, 0.025745630264282227, 0.026639461517333984, 0.027533292770385742, 0.0284271240234375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 3.0, 7.0, 13.0, 20.0, 14.0, 14.0, 82.0, 342.0, 309.0, 76.0, 21.0, 12.0, 10.0, 2.0, 12.0, 8.0, 10.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0196075439453125, -0.01899099349975586, -0.01837444305419922, -0.017757892608642578, -0.017141342163085938, -0.016524791717529297, -0.015908241271972656, -0.015291690826416016, -0.014675140380859375, -0.014058589935302734, -0.013442039489746094, -0.012825489044189453, -0.012208938598632812, -0.011592388153076172, -0.010975837707519531, -0.01035928726196289, -0.00974273681640625, -0.00912618637084961, -0.008509635925292969, -0.007893085479736328, -0.0072765350341796875, -0.006659984588623047, -0.006043434143066406, -0.005426883697509766, -0.004810333251953125, -0.004193782806396484, -0.0035772323608398438, -0.002960681915283203, -0.0023441314697265625, -0.0017275810241699219, -0.0011110305786132812, -0.0004944801330566406, 0.0001220703125, 0.0007386207580566406, 0.0013551712036132812, 0.001971721649169922, 0.0025882720947265625, 0.003204822540283203, 0.0038213729858398438, 0.004437923431396484, 0.005054473876953125, 0.005671024322509766, 0.006287574768066406, 0.006904125213623047, 0.0075206756591796875, 0.008137226104736328, 0.008753776550292969, 0.00937032699584961, 0.00998687744140625, 0.01060342788696289, 0.011219978332519531, 0.011836528778076172, 0.012453079223632812, 0.013069629669189453, 0.013686180114746094, 0.014302730560302734, 0.014919281005859375, 0.015535831451416016, 0.016152381896972656, 0.016768932342529297, 0.017385482788085938, 0.018002033233642578, 0.01861858367919922, 0.01923513412475586, 0.0198516845703125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 8.0, 5.0, 4.0, 6.0, 7.0, 10.0, 9.0, 11.0, 11.0, 23.0, 25.0, 36.0, 49.0, 46.0, 68.0, 115.0, 154.0, 219.0, 341.0, 744.0, 1436.0, 14241.0, 1017728.0, 10064.0, 1381.0, 698.0, 351.0, 220.0, 145.0, 80.0, 69.0, 38.0, 51.0, 34.0, 21.0, 23.0, 21.0, 24.0, 9.0, 5.0, 8.0, 1.0, 9.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.051849365234375, -0.050201416015625, -0.048553466796875, -0.046905517578125, -0.045257568359375, -0.043609619140625, -0.041961669921875, -0.040313720703125, -0.038665771484375, -0.037017822265625, -0.035369873046875, -0.033721923828125, -0.032073974609375, -0.030426025390625, -0.028778076171875, -0.027130126953125, -0.025482177734375, -0.023834228515625, -0.022186279296875, -0.020538330078125, -0.018890380859375, -0.017242431640625, -0.015594482421875, -0.013946533203125, -0.012298583984375, -0.010650634765625, -0.009002685546875, -0.007354736328125, -0.005706787109375, -0.004058837890625, -0.002410888671875, -0.000762939453125, 0.000885009765625, 0.002532958984375, 0.004180908203125, 0.005828857421875, 0.007476806640625, 0.009124755859375, 0.010772705078125, 0.012420654296875, 0.014068603515625, 0.015716552734375, 0.017364501953125, 0.019012451171875, 0.020660400390625, 0.022308349609375, 0.023956298828125, 0.025604248046875, 0.027252197265625, 0.028900146484375, 0.030548095703125, 0.032196044921875, 0.033843994140625, 0.035491943359375, 0.037139892578125, 0.038787841796875, 0.040435791015625, 0.042083740234375, 0.043731689453125, 0.045379638671875, 0.047027587890625, 0.048675537109375, 0.050323486328125, 0.051971435546875, 0.053619384765625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 8.0, 4.0, 4.0, 6.0, 7.0, 10.0, 7.0, 11.0, 10.0, 20.0, 21.0, 22.0, 31.0, 23.0, 27.0, 41.0, 38.0, 39.0, 40.0, 42.0, 37.0, 36.0, 50.0, 41.0, 42.0, 45.0, 33.0, 34.0, 46.0, 23.0, 28.0, 14.0, 31.0, 20.0, 16.0, 18.0, 19.0, 21.0, 7.0, 5.0, 8.0, 1.0, 10.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.040008544921875, -0.03873395919799805, -0.037459373474121094, -0.03618478775024414, -0.03491020202636719, -0.033635616302490234, -0.03236103057861328, -0.031086444854736328, -0.029811859130859375, -0.028537273406982422, -0.02726268768310547, -0.025988101959228516, -0.024713516235351562, -0.02343893051147461, -0.022164344787597656, -0.020889759063720703, -0.01961517333984375, -0.018340587615966797, -0.017066001892089844, -0.01579141616821289, -0.014516830444335938, -0.013242244720458984, -0.011967658996582031, -0.010693073272705078, -0.009418487548828125, -0.008143901824951172, -0.006869316101074219, -0.005594730377197266, -0.0043201446533203125, -0.0030455589294433594, -0.0017709732055664062, -0.0004963874816894531, 0.0007781982421875, 0.002052783966064453, 0.0033273696899414062, 0.004601955413818359, 0.0058765411376953125, 0.007151126861572266, 0.008425712585449219, 0.009700298309326172, 0.010974884033203125, 0.012249469757080078, 0.013524055480957031, 0.014798641204833984, 0.016073226928710938, 0.01734781265258789, 0.018622398376464844, 0.019896984100341797, 0.02117156982421875, 0.022446155548095703, 0.023720741271972656, 0.02499532699584961, 0.026269912719726562, 0.027544498443603516, 0.02881908416748047, 0.030093669891357422, 0.031368255615234375, 0.03264284133911133, 0.03391742706298828, 0.035192012786865234, 0.03646659851074219, 0.03774118423461914, 0.039015769958496094, 0.04029035568237305, 0.04156494140625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 8.0, 13.0, 12.0, 18.0, 33.0, 31.0, 37.0, 64.0, 100.0, 129.0, 228.0, 391.0, 599.0, 1127.0, 2405.0, 4700.0, 11556.0, 37895.0, 348190.0, 574449.0, 43084.0, 12945.0, 5185.0, 2345.0, 1177.0, 673.0, 386.0, 294.0, 137.0, 96.0, 68.0, 52.0, 32.0, 18.0, 18.0, 16.0, 15.0, 3.0, 10.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.9848346710205078e-05, -1.9188039004802704e-05, -1.852773129940033e-05, -1.7867423593997955e-05, -1.720711588859558e-05, -1.6546808183193207e-05, -1.5886500477790833e-05, -1.5226192772388458e-05, -1.4565885066986084e-05, -1.390557736158371e-05, -1.3245269656181335e-05, -1.2584961950778961e-05, -1.1924654245376587e-05, -1.1264346539974213e-05, -1.0604038834571838e-05, -9.943731129169464e-06, -9.28342342376709e-06, -8.623115718364716e-06, -7.962808012962341e-06, -7.302500307559967e-06, -6.642192602157593e-06, -5.9818848967552185e-06, -5.321577191352844e-06, -4.66126948595047e-06, -4.000961780548096e-06, -3.3406540751457214e-06, -2.680346369743347e-06, -2.020038664340973e-06, -1.3597309589385986e-06, -6.994232535362244e-07, -3.91155481338501e-08, 6.211921572685242e-07, 1.2814998626708984e-06, 1.9418075680732727e-06, 2.602115273475647e-06, 3.2624229788780212e-06, 3.9227306842803955e-06, 4.58303838968277e-06, 5.243346095085144e-06, 5.903653800487518e-06, 6.563961505889893e-06, 7.224269211292267e-06, 7.884576916694641e-06, 8.544884622097015e-06, 9.20519232749939e-06, 9.865500032901764e-06, 1.0525807738304138e-05, 1.1186115443706512e-05, 1.1846423149108887e-05, 1.2506730854511261e-05, 1.3167038559913635e-05, 1.382734626531601e-05, 1.4487653970718384e-05, 1.5147961676120758e-05, 1.5808269381523132e-05, 1.6468577086925507e-05, 1.712888479232788e-05, 1.7789192497730255e-05, 1.844950020313263e-05, 1.9109807908535004e-05, 1.9770115613937378e-05, 2.0430423319339752e-05, 2.1090731024742126e-05, 2.17510387301445e-05, 2.2411346435546875e-05]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 9.0, 11.0, 19.0, 37.0, 33.0, 53.0, 86.0, 127.0, 176.0, 131.0, 109.0, 61.0, 52.0, 39.0, 21.0, 13.0, 9.0, 4.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.531839370727539e-05, -1.4865770936012268e-05, -1.4413148164749146e-05, -1.3960525393486023e-05, -1.35079026222229e-05, -1.3055279850959778e-05, -1.2602657079696655e-05, -1.2150034308433533e-05, -1.169741153717041e-05, -1.1244788765907288e-05, -1.0792165994644165e-05, -1.0339543223381042e-05, -9.88692045211792e-06, -9.434297680854797e-06, -8.981674909591675e-06, -8.529052138328552e-06, -8.07642936706543e-06, -7.623806595802307e-06, -7.1711838245391846e-06, -6.718561053276062e-06, -6.2659382820129395e-06, -5.813315510749817e-06, -5.360692739486694e-06, -4.908069968223572e-06, -4.455447196960449e-06, -4.002824425697327e-06, -3.550201654434204e-06, -3.0975788831710815e-06, -2.644956111907959e-06, -2.1923333406448364e-06, -1.7397105693817139e-06, -1.2870877981185913e-06, -8.344650268554688e-07, -3.818422555923462e-07, 7.078051567077637e-08, 5.234032869338989e-07, 9.760260581970215e-07, 1.428648829460144e-06, 1.8812716007232666e-06, 2.333894371986389e-06, 2.7865171432495117e-06, 3.2391399145126343e-06, 3.691762685775757e-06, 4.144385457038879e-06, 4.597008228302002e-06, 5.0496309995651245e-06, 5.502253770828247e-06, 5.95487654209137e-06, 6.407499313354492e-06, 6.860122084617615e-06, 7.312744855880737e-06, 7.76536762714386e-06, 8.217990398406982e-06, 8.670613169670105e-06, 9.123235940933228e-06, 9.57585871219635e-06, 1.0028481483459473e-05, 1.0481104254722595e-05, 1.0933727025985718e-05, 1.138634979724884e-05, 1.1838972568511963e-05, 1.2291595339775085e-05, 1.2744218111038208e-05, 1.319684088230133e-05, 1.3649463653564453e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 1.0, 4.0, 14.0, 17.0, 19.0, 29.0, 55.0, 78.0, 155.0, 392.0, 1531.0, 1034680.0, 10369.0, 714.0, 233.0, 102.0, 54.0, 30.0, 27.0, 19.0, 6.0, 11.0, 7.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.751319885253906e-05, -9.453482925891876e-05, -9.155645966529846e-05, -8.857809007167816e-05, -8.559972047805786e-05, -8.262135088443756e-05, -7.964298129081726e-05, -7.666461169719696e-05, -7.368624210357666e-05, -7.070787250995636e-05, -6.772950291633606e-05, -6.475113332271576e-05, -6.177276372909546e-05, -5.879439413547516e-05, -5.581602454185486e-05, -5.283765494823456e-05, -4.985928535461426e-05, -4.688091576099396e-05, -4.390254616737366e-05, -4.092417657375336e-05, -3.794580698013306e-05, -3.4967437386512756e-05, -3.1989067792892456e-05, -2.9010698199272156e-05, -2.6032328605651855e-05, -2.3053959012031555e-05, -2.0075589418411255e-05, -1.7097219824790955e-05, -1.4118850231170654e-05, -1.1140480637550354e-05, -8.162111043930054e-06, -5.183741450309753e-06, -2.205371856689453e-06, 7.729977369308472e-07, 3.7513673305511475e-06, 6.729736924171448e-06, 9.708106517791748e-06, 1.2686476111412048e-05, 1.566484570503235e-05, 1.864321529865265e-05, 2.162158489227295e-05, 2.459995448589325e-05, 2.757832407951355e-05, 3.055669367313385e-05, 3.353506326675415e-05, 3.651343286037445e-05, 3.949180245399475e-05, 4.247017204761505e-05, 4.544854164123535e-05, 4.842691123485565e-05, 5.140528082847595e-05, 5.438365042209625e-05, 5.736202001571655e-05, 6.034038960933685e-05, 6.331875920295715e-05, 6.629712879657745e-05, 6.927549839019775e-05, 7.225386798381805e-05, 7.523223757743835e-05, 7.821060717105865e-05, 8.118897676467896e-05, 8.416734635829926e-05, 8.714571595191956e-05, 9.012408554553986e-05, 9.310245513916016e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 12.0, 13.0, 10.0, 14.0, 27.0, 33.0, 39.0, 69.0, 102.0, 160.0, 207.0, 108.0, 60.0, 42.0, 24.0, 19.0, 13.0, 17.0, 10.0, 10.0, 7.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.539987564086914e-05, -7.31172040104866e-05, -7.083453238010406e-05, -6.855186074972153e-05, -6.626918911933899e-05, -6.398651748895645e-05, -6.170384585857391e-05, -5.9421174228191376e-05, -5.713850259780884e-05, -5.48558309674263e-05, -5.257315933704376e-05, -5.0290487706661224e-05, -4.8007816076278687e-05, -4.572514444589615e-05, -4.344247281551361e-05, -4.115980118513107e-05, -3.8877129554748535e-05, -3.6594457924366e-05, -3.431178629398346e-05, -3.202911466360092e-05, -2.9746443033218384e-05, -2.7463771402835846e-05, -2.5181099772453308e-05, -2.289842814207077e-05, -2.0615756511688232e-05, -1.8333084881305695e-05, -1.6050413250923157e-05, -1.3767741620540619e-05, -1.1485069990158081e-05, -9.202398359775543e-06, -6.919726729393005e-06, -4.6370550990104675e-06, -2.3543834686279297e-06, -7.171183824539185e-08, 2.210959792137146e-06, 4.493631422519684e-06, 6.776303052902222e-06, 9.05897468328476e-06, 1.1341646313667297e-05, 1.3624317944049835e-05, 1.5906989574432373e-05, 1.818966120481491e-05, 2.047233283519745e-05, 2.2755004465579987e-05, 2.5037676095962524e-05, 2.7320347726345062e-05, 2.96030193567276e-05, 3.188569098711014e-05, 3.4168362617492676e-05, 3.6451034247875214e-05, 3.873370587825775e-05, 4.101637750864029e-05, 4.329904913902283e-05, 4.5581720769405365e-05, 4.78643923997879e-05, 5.014706403017044e-05, 5.242973566055298e-05, 5.4712407290935516e-05, 5.6995078921318054e-05, 5.927775055170059e-05, 6.156042218208313e-05, 6.384309381246567e-05, 6.61257654428482e-05, 6.840843707323074e-05, 7.069110870361328e-05]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 44.0, 356.0, 570.0, 38.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3561144471168518, -0.3476490080356598, -0.3391835689544678, -0.33071815967559814, -0.32225272059440613, -0.3137872815132141, -0.3053218722343445, -0.29685643315315247, -0.28839099407196045, -0.27992555499076843, -0.2714601159095764, -0.2629947066307068, -0.25452926754951477, -0.24606382846832275, -0.23759840428829193, -0.2291329801082611, -0.2206675410270691, -0.21220210194587708, -0.20373667776584625, -0.19527125358581543, -0.1868058145046234, -0.1783403754234314, -0.16987495124340057, -0.16140952706336975, -0.15294408798217773, -0.14447864890098572, -0.1360132247209549, -0.12754780054092407, -0.11908236145973206, -0.11061692982912064, -0.10215149819850922, -0.0936860665678978, -0.08522063493728638, -0.07675520330667496, -0.06828977167606354, -0.05982434004545212, -0.0513589084148407, -0.04289347678422928, -0.03442804515361786, -0.02596261352300644, -0.01749718189239502, -0.0090317502617836, -0.0005663186311721802, 0.00789911299943924, 0.01636454463005066, 0.02482997626066208, 0.0332954078912735, 0.04176083952188492, 0.05022627115249634, 0.05869170278310776, 0.06715713441371918, 0.0756225660443306, 0.08408799767494202, 0.09255342930555344, 0.10101886093616486, 0.10948429256677628, 0.1179497241973877, 0.1264151632785797, 0.13488058745861053, 0.14334601163864136, 0.15181145071983337, 0.1602768898010254, 0.1687423139810562, 0.17720773816108704, 0.18567317724227905]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 5.0, 5.0, 8.0, 9.0, 8.0, 10.0, 11.0, 23.0, 24.0, 21.0, 27.0, 36.0, 24.0, 43.0, 31.0, 42.0, 41.0, 48.0, 36.0, 45.0, 43.0, 54.0, 44.0, 46.0, 41.0, 33.0, 29.0, 30.0, 31.0, 31.0, 27.0, 17.0, 12.0, 17.0, 9.0, 9.0, 4.0, 7.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.20078426599502563, -0.1936047375202179, -0.18642519414424896, -0.17924565076828003, -0.1720661222934723, -0.16488659381866455, -0.15770705044269562, -0.15052750706672668, -0.14334797859191895, -0.1361684501171112, -0.12898890674114227, -0.12180937081575394, -0.1146298348903656, -0.10745029896497726, -0.10027076303958893, -0.09309122711420059, -0.08591169118881226, -0.07873215526342392, -0.07155261933803558, -0.06437308341264725, -0.05719354748725891, -0.050014011561870575, -0.04283447563648224, -0.0356549397110939, -0.028475403785705566, -0.02129586786031723, -0.014116331934928894, -0.006936796009540558, 0.00024273991584777832, 0.0074222758412361145, 0.01460181176662445, 0.021781347692012787, 0.028960883617401123, 0.03614041954278946, 0.043319955468177795, 0.05049949139356613, 0.05767902731895447, 0.0648585632443428, 0.07203809916973114, 0.07921763509511948, 0.08639717102050781, 0.09357670694589615, 0.10075624287128448, 0.10793577879667282, 0.11511531472206116, 0.1222948506474495, 0.12947438657283783, 0.13665392994880676, 0.1438334584236145, 0.15101298689842224, 0.15819253027439117, 0.1653720736503601, 0.17255160212516785, 0.17973113059997559, 0.18691067397594452, 0.19409021735191345, 0.2012697458267212, 0.20844927430152893, 0.21562881767749786, 0.2228083610534668, 0.22998788952827454, 0.23716741800308228, 0.2443469613790512, 0.25152650475502014, 0.2587060332298279]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 6.0, 0.0, 4.0, 5.0, 3.0, 6.0, 4.0, 9.0, 8.0, 10.0, 5.0, 9.0, 9.0, 20.0, 28.0, 37.0, 47.0, 220.0, 2282.0, 4184046.0, 6318.0, 983.0, 62.0, 29.0, 26.0, 24.0, 19.0, 15.0, 14.0, 9.0, 9.0, 4.0, 6.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04644775390625, -0.044981956481933594, -0.04351615905761719, -0.04205036163330078, -0.040584564208984375, -0.03911876678466797, -0.03765296936035156, -0.036187171936035156, -0.03472137451171875, -0.033255577087402344, -0.03178977966308594, -0.03032398223876953, -0.028858184814453125, -0.02739238739013672, -0.025926589965820312, -0.024460792541503906, -0.0229949951171875, -0.021529197692871094, -0.020063400268554688, -0.01859760284423828, -0.017131805419921875, -0.01566600799560547, -0.014200210571289062, -0.012734413146972656, -0.01126861572265625, -0.009802818298339844, -0.008337020874023438, -0.006871223449707031, -0.005405426025390625, -0.003939628601074219, -0.0024738311767578125, -0.0010080337524414062, 0.000457763671875, 0.0019235610961914062, 0.0033893585205078125, 0.004855155944824219, 0.006320953369140625, 0.007786750793457031, 0.009252548217773438, 0.010718345642089844, 0.01218414306640625, 0.013649940490722656, 0.015115737915039062, 0.01658153533935547, 0.018047332763671875, 0.01951313018798828, 0.020978927612304688, 0.022444725036621094, 0.0239105224609375, 0.025376319885253906, 0.026842117309570312, 0.02830791473388672, 0.029773712158203125, 0.03123950958251953, 0.03270530700683594, 0.034171104431152344, 0.03563690185546875, 0.037102699279785156, 0.03856849670410156, 0.04003429412841797, 0.041500091552734375, 0.04296588897705078, 0.04443168640136719, 0.045897483825683594, 0.04736328125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 3.0, 6.0, 0.0, 2.0, 1.0, 6.0, 2.0, 3.0, 3.0, 11.0, 14.0, 18.0, 12.0, 19.0, 118.0, 411.0, 226.0, 49.0, 24.0, 9.0, 8.0, 3.0, 13.0, 9.0, 8.0, 3.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0193328857421875, -0.018720626831054688, -0.018108367919921875, -0.017496109008789062, -0.01688385009765625, -0.016271591186523438, -0.015659332275390625, -0.015047073364257812, -0.014434814453125, -0.013822555541992188, -0.013210296630859375, -0.012598037719726562, -0.01198577880859375, -0.011373519897460938, -0.010761260986328125, -0.010149002075195312, -0.0095367431640625, -0.008924484252929688, -0.008312225341796875, -0.0076999664306640625, -0.00708770751953125, -0.0064754486083984375, -0.005863189697265625, -0.0052509307861328125, -0.004638671875, -0.0040264129638671875, -0.003414154052734375, -0.0028018951416015625, -0.00218963623046875, -0.0015773773193359375, -0.000965118408203125, -0.0003528594970703125, 0.0002593994140625, 0.0008716583251953125, 0.001483917236328125, 0.0020961761474609375, 0.00270843505859375, 0.0033206939697265625, 0.003932952880859375, 0.0045452117919921875, 0.005157470703125, 0.0057697296142578125, 0.006381988525390625, 0.0069942474365234375, 0.00760650634765625, 0.008218765258789062, 0.008831024169921875, 0.009443283081054688, 0.0100555419921875, 0.010667800903320312, 0.011280059814453125, 0.011892318725585938, 0.01250457763671875, 0.013116836547851562, 0.013729095458984375, 0.014341354370117188, 0.01495361328125, 0.015565872192382812, 0.016178131103515625, 0.016790390014648438, 0.01740264892578125, 0.018014907836914062, 0.018627166748046875, 0.019239425659179688, 0.0198516845703125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 20.0, 53.0, 111.0, 179.0, 1071.0, 4186533.0, 5646.0, 424.0, 136.0, 64.0, 27.0, 11.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042266845703125, -0.04111671447753906, -0.039966583251953125, -0.03881645202636719, -0.03766632080078125, -0.03651618957519531, -0.035366058349609375, -0.03421592712402344, -0.0330657958984375, -0.03191566467285156, -0.030765533447265625, -0.029615402221679688, -0.02846527099609375, -0.027315139770507812, -0.026165008544921875, -0.025014877319335938, -0.02386474609375, -0.022714614868164062, -0.021564483642578125, -0.020414352416992188, -0.01926422119140625, -0.018114089965820312, -0.016963958740234375, -0.015813827514648438, -0.0146636962890625, -0.013513565063476562, -0.012363433837890625, -0.011213302612304688, -0.01006317138671875, -0.008913040161132812, -0.007762908935546875, -0.0066127777099609375, -0.005462646484375, -0.0043125152587890625, -0.003162384033203125, -0.0020122528076171875, -0.00086212158203125, 0.0002880096435546875, 0.001438140869140625, 0.0025882720947265625, 0.0037384033203125, 0.0048885345458984375, 0.006038665771484375, 0.0071887969970703125, 0.00833892822265625, 0.009489059448242188, 0.010639190673828125, 0.011789321899414062, 0.012939453125, 0.014089584350585938, 0.015239715576171875, 0.016389846801757812, 0.01753997802734375, 0.018690109252929688, 0.019840240478515625, 0.020990371704101562, 0.0221405029296875, 0.023290634155273438, 0.024440765380859375, 0.025590896606445312, 0.02674102783203125, 0.027891159057617188, 0.029041290283203125, 0.030191421508789062, 0.031341552734375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 18.0, 106.0, 3903.0, 32.0, 10.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0060882568359375, -0.005753874778747559, -0.005419492721557617, -0.005085110664367676, -0.004750728607177734, -0.004416346549987793, -0.0040819644927978516, -0.00374758243560791, -0.0034132003784179688, -0.0030788183212280273, -0.002744436264038086, -0.0024100542068481445, -0.002075672149658203, -0.0017412900924682617, -0.0014069080352783203, -0.001072525978088379, -0.0007381439208984375, -0.0004037618637084961, -6.937980651855469e-05, 0.0002650022506713867, 0.0005993843078613281, 0.0009337663650512695, 0.001268148422241211, 0.0016025304794311523, 0.0019369125366210938, 0.002271294593811035, 0.0026056766510009766, 0.002940058708190918, 0.0032744407653808594, 0.0036088228225708008, 0.003943204879760742, 0.004277586936950684, 0.004611968994140625, 0.004946351051330566, 0.005280733108520508, 0.005615115165710449, 0.005949497222900391, 0.006283879280090332, 0.0066182613372802734, 0.006952643394470215, 0.007287025451660156, 0.007621407508850098, 0.007955789566040039, 0.00829017162322998, 0.008624553680419922, 0.008958935737609863, 0.009293317794799805, 0.009627699851989746, 0.009962081909179688, 0.010296463966369629, 0.01063084602355957, 0.010965228080749512, 0.011299610137939453, 0.011633992195129395, 0.011968374252319336, 0.012302756309509277, 0.012637138366699219, 0.01297152042388916, 0.013305902481079102, 0.013640284538269043, 0.013974666595458984, 0.014309048652648926, 0.014643430709838867, 0.014977812767028809, 0.01531219482421875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 937.0, 79.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16899053752422333, -0.16585859656333923, -0.16272667050361633, -0.15959472954273224, -0.15646280348300934, -0.15333086252212524, -0.15019893646240234, -0.14706699550151825, -0.14393505454063416, -0.14080311357975006, -0.13767118752002716, -0.13453924655914307, -0.13140732049942017, -0.12827537953853607, -0.12514345347881317, -0.12201151251792908, -0.11887958645820618, -0.11574765294790268, -0.11261571943759918, -0.10948378592729568, -0.10635185241699219, -0.1032199114561081, -0.1000879779458046, -0.0969560444355011, -0.0938241109251976, -0.0906921774148941, -0.0875602439045906, -0.08442831039428711, -0.08129636943340302, -0.07816444337368011, -0.07503250241279602, -0.07190056890249252, -0.06876863539218903, -0.06563670188188553, -0.06250476837158203, -0.059372831135988235, -0.05624089762568474, -0.05310896411538124, -0.049977026879787445, -0.04684509336948395, -0.04371316358447075, -0.04058123007416725, -0.037449292838573456, -0.03431735932826996, -0.03118542581796646, -0.028053492307662964, -0.024921556934714317, -0.02178962156176567, -0.018657688051462173, -0.015525753609836102, -0.01239381916821003, -0.009261884726583958, -0.006129950284957886, -0.0029980167746543884, 0.00013391859829425812, 0.0032658539712429047, 0.006397787481546402, 0.009529721923172474, 0.012661656364798546, 0.015793591737747192, 0.01892552524805069, 0.022057458758354187, 0.025189394131302834, 0.02832132950425148, 0.03145326301455498]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 16.0, 28.0, 32.0, 53.0, 77.0, 83.0, 114.0, 107.0, 78.0, 102.0, 82.0, 61.0, 48.0, 39.0, 31.0, 15.0, 8.0, 6.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.018790721893310547, -0.01829395815730095, -0.01779719442129135, -0.017300430685281754, -0.016803666949272156, -0.016306903213262558, -0.01581013947725296, -0.015313375741243362, -0.014816612005233765, -0.014319848269224167, -0.013823084533214569, -0.013326320797204971, -0.012829557061195374, -0.012332793325185776, -0.011836029589176178, -0.01133926585316658, -0.010842502117156982, -0.010345738381147385, -0.009848974645137787, -0.009352210909128189, -0.008855447173118591, -0.008358683437108994, -0.007861919701099396, -0.007365155965089798, -0.0068683922290802, -0.006371628493070602, -0.005874864757061005, -0.005378101021051407, -0.004881337285041809, -0.004384573549032211, -0.0038878098130226135, -0.0033910460770130157, -0.002894282341003418, -0.00239751860499382, -0.0019007548689842224, -0.0014039911329746246, -0.0009072273969650269, -0.0004104636609554291, 8.63000750541687e-05, 0.0005830638110637665, 0.0010798275470733643, 0.001576591283082962, 0.00207335501909256, 0.0025701187551021576, 0.0030668824911117554, 0.003563646227121353, 0.004060409963130951, 0.004557173699140549, 0.0050539374351501465, 0.005550701171159744, 0.006047464907169342, 0.00654422864317894, 0.007040992379188538, 0.007537756115198135, 0.008034519851207733, 0.008531283587217331, 0.009028047323226929, 0.009524811059236526, 0.010021574795246124, 0.010518338531255722, 0.01101510226726532, 0.011511866003274918, 0.012008629739284515, 0.012505393475294113, 0.013002157211303711]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 10.0, 4.0, 15.0, 7.0, 14.0, 22.0, 37.0, 36.0, 69.0, 83.0, 133.0, 188.0, 350.0, 599.0, 1126.0, 2374.0, 6567.0, 31552.0, 967019.0, 27037.0, 6153.0, 2499.0, 1126.0, 585.0, 343.0, 191.0, 105.0, 80.0, 63.0, 44.0, 29.0, 13.0, 18.0, 6.0, 15.0, 7.0, 5.0, 8.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.02655029296875, -0.02573251724243164, -0.02491474151611328, -0.024096965789794922, -0.023279190063476562, -0.022461414337158203, -0.021643638610839844, -0.020825862884521484, -0.020008087158203125, -0.019190311431884766, -0.018372535705566406, -0.017554759979248047, -0.016736984252929688, -0.015919208526611328, -0.015101432800292969, -0.01428365707397461, -0.01346588134765625, -0.01264810562133789, -0.011830329895019531, -0.011012554168701172, -0.010194778442382812, -0.009377002716064453, -0.008559226989746094, -0.007741451263427734, -0.006923675537109375, -0.006105899810791016, -0.005288124084472656, -0.004470348358154297, -0.0036525726318359375, -0.002834796905517578, -0.0020170211791992188, -0.0011992454528808594, -0.0003814697265625, 0.0004363059997558594, 0.0012540817260742188, 0.002071857452392578, 0.0028896331787109375, 0.003707408905029297, 0.004525184631347656, 0.005342960357666016, 0.006160736083984375, 0.006978511810302734, 0.007796287536621094, 0.008614063262939453, 0.009431838989257812, 0.010249614715576172, 0.011067390441894531, 0.01188516616821289, 0.01270294189453125, 0.01352071762084961, 0.014338493347167969, 0.015156269073486328, 0.015974044799804688, 0.016791820526123047, 0.017609596252441406, 0.018427371978759766, 0.019245147705078125, 0.020062923431396484, 0.020880699157714844, 0.021698474884033203, 0.022516250610351562, 0.023334026336669922, 0.02415180206298828, 0.02496957778930664, 0.025787353515625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 3.0, 6.0, 0.0, 2.0, 1.0, 6.0, 2.0, 3.0, 3.0, 11.0, 14.0, 18.0, 13.0, 18.0, 118.0, 417.0, 223.0, 46.0, 24.0, 10.0, 7.0, 3.0, 13.0, 9.0, 8.0, 3.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0193328857421875, -0.018720388412475586, -0.018107891082763672, -0.017495393753051758, -0.016882896423339844, -0.01627039909362793, -0.015657901763916016, -0.015045404434204102, -0.014432907104492188, -0.013820409774780273, -0.01320791244506836, -0.012595415115356445, -0.011982917785644531, -0.011370420455932617, -0.010757923126220703, -0.010145425796508789, -0.009532928466796875, -0.008920431137084961, -0.008307933807373047, -0.007695436477661133, -0.007082939147949219, -0.006470441818237305, -0.005857944488525391, -0.0052454471588134766, -0.0046329498291015625, -0.0040204524993896484, -0.0034079551696777344, -0.0027954578399658203, -0.0021829605102539062, -0.0015704631805419922, -0.0009579658508300781, -0.00034546852111816406, 0.00026702880859375, 0.0008795261383056641, 0.0014920234680175781, 0.002104520797729492, 0.0027170181274414062, 0.0033295154571533203, 0.003942012786865234, 0.0045545101165771484, 0.0051670074462890625, 0.0057795047760009766, 0.006392002105712891, 0.007004499435424805, 0.007616996765136719, 0.008229494094848633, 0.008841991424560547, 0.009454488754272461, 0.010066986083984375, 0.010679483413696289, 0.011291980743408203, 0.011904478073120117, 0.012516975402832031, 0.013129472732543945, 0.01374197006225586, 0.014354467391967773, 0.014966964721679688, 0.015579462051391602, 0.016191959381103516, 0.01680445671081543, 0.017416954040527344, 0.018029451370239258, 0.018641948699951172, 0.019254446029663086, 0.019866943359375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 7.0, 5.0, 5.0, 9.0, 6.0, 9.0, 13.0, 15.0, 19.0, 33.0, 31.0, 32.0, 57.0, 50.0, 91.0, 110.0, 201.0, 436.0, 1162.0, 8989.0, 1025580.0, 9389.0, 1156.0, 438.0, 211.0, 124.0, 73.0, 55.0, 47.0, 37.0, 28.0, 22.0, 19.0, 18.0, 22.0, 13.0, 6.0, 8.0, 7.0, 5.0, 8.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.04315185546875, -0.04186391830444336, -0.04057598114013672, -0.03928804397583008, -0.03800010681152344, -0.0367121696472168, -0.035424232482910156, -0.034136295318603516, -0.032848358154296875, -0.031560420989990234, -0.030272483825683594, -0.028984546661376953, -0.027696609497070312, -0.026408672332763672, -0.02512073516845703, -0.02383279800415039, -0.02254486083984375, -0.02125692367553711, -0.01996898651123047, -0.018681049346923828, -0.017393112182617188, -0.016105175018310547, -0.014817237854003906, -0.013529300689697266, -0.012241363525390625, -0.010953426361083984, -0.009665489196777344, -0.008377552032470703, -0.0070896148681640625, -0.005801677703857422, -0.004513740539550781, -0.0032258033752441406, -0.0019378662109375, -0.0006499290466308594, 0.0006380081176757812, 0.0019259452819824219, 0.0032138824462890625, 0.004501819610595703, 0.005789756774902344, 0.007077693939208984, 0.008365631103515625, 0.009653568267822266, 0.010941505432128906, 0.012229442596435547, 0.013517379760742188, 0.014805316925048828, 0.01609325408935547, 0.01738119125366211, 0.01866912841796875, 0.01995706558227539, 0.02124500274658203, 0.022532939910888672, 0.023820877075195312, 0.025108814239501953, 0.026396751403808594, 0.027684688568115234, 0.028972625732421875, 0.030260562896728516, 0.031548500061035156, 0.0328364372253418, 0.03412437438964844, 0.03541231155395508, 0.03670024871826172, 0.03798818588256836, 0.039276123046875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 8.0, 4.0, 5.0, 9.0, 6.0, 10.0, 11.0, 13.0, 18.0, 30.0, 27.0, 22.0, 40.0, 24.0, 39.0, 36.0, 35.0, 50.0, 45.0, 36.0, 51.0, 51.0, 52.0, 36.0, 35.0, 39.0, 30.0, 37.0, 28.0, 27.0, 23.0, 17.0, 16.0, 18.0, 19.0, 13.0, 6.0, 8.0, 7.0, 5.0, 8.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.043975830078125, -0.042662620544433594, -0.04134941101074219, -0.04003620147705078, -0.038722991943359375, -0.03740978240966797, -0.03609657287597656, -0.034783363342285156, -0.03347015380859375, -0.032156944274902344, -0.030843734741210938, -0.02953052520751953, -0.028217315673828125, -0.02690410614013672, -0.025590896606445312, -0.024277687072753906, -0.0229644775390625, -0.021651268005371094, -0.020338058471679688, -0.01902484893798828, -0.017711639404296875, -0.01639842987060547, -0.015085220336914062, -0.013772010803222656, -0.01245880126953125, -0.011145591735839844, -0.009832382202148438, -0.008519172668457031, -0.007205963134765625, -0.005892753601074219, -0.0045795440673828125, -0.0032663345336914062, -0.001953125, -0.0006399154663085938, 0.0006732940673828125, 0.0019865036010742188, 0.003299713134765625, 0.004612922668457031, 0.0059261322021484375, 0.007239341735839844, 0.00855255126953125, 0.009865760803222656, 0.011178970336914062, 0.012492179870605469, 0.013805389404296875, 0.015118598937988281, 0.016431808471679688, 0.017745018005371094, 0.0190582275390625, 0.020371437072753906, 0.021684646606445312, 0.02299785614013672, 0.024311065673828125, 0.02562427520751953, 0.026937484741210938, 0.028250694274902344, 0.02956390380859375, 0.030877113342285156, 0.03219032287597656, 0.03350353240966797, 0.034816741943359375, 0.03612995147705078, 0.03744316101074219, 0.038756370544433594, 0.040069580078125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 6.0, 3.0, 8.0, 8.0, 19.0, 18.0, 32.0, 54.0, 78.0, 100.0, 184.0, 364.0, 522.0, 945.0, 1872.0, 4954.0, 12847.0, 49882.0, 798504.0, 140544.0, 23669.0, 7484.0, 3309.0, 1336.0, 745.0, 408.0, 240.0, 138.0, 90.0, 68.0, 35.0, 37.0, 15.0, 8.0, 9.0, 10.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6689300537109375e-05, -1.6194768249988556e-05, -1.5700235962867737e-05, -1.5205703675746918e-05, -1.4711171388626099e-05, -1.421663910150528e-05, -1.372210681438446e-05, -1.3227574527263641e-05, -1.2733042240142822e-05, -1.2238509953022003e-05, -1.1743977665901184e-05, -1.1249445378780365e-05, -1.0754913091659546e-05, -1.0260380804538727e-05, -9.765848517417908e-06, -9.271316230297089e-06, -8.77678394317627e-06, -8.28225165605545e-06, -7.787719368934631e-06, -7.293187081813812e-06, -6.798654794692993e-06, -6.304122507572174e-06, -5.809590220451355e-06, -5.315057933330536e-06, -4.820525646209717e-06, -4.325993359088898e-06, -3.831461071968079e-06, -3.3369287848472595e-06, -2.8423964977264404e-06, -2.3478642106056213e-06, -1.8533319234848022e-06, -1.3587996363639832e-06, -8.642673492431641e-07, -3.6973506212234497e-07, 1.2479722499847412e-07, 6.193295121192932e-07, 1.1138617992401123e-06, 1.6083940863609314e-06, 2.1029263734817505e-06, 2.5974586606025696e-06, 3.0919909477233887e-06, 3.5865232348442078e-06, 4.081055521965027e-06, 4.575587809085846e-06, 5.070120096206665e-06, 5.564652383327484e-06, 6.059184670448303e-06, 6.553716957569122e-06, 7.048249244689941e-06, 7.5427815318107605e-06, 8.03731381893158e-06, 8.531846106052399e-06, 9.026378393173218e-06, 9.520910680294037e-06, 1.0015442967414856e-05, 1.0509975254535675e-05, 1.1004507541656494e-05, 1.1499039828777313e-05, 1.1993572115898132e-05, 1.2488104403018951e-05, 1.298263669013977e-05, 1.347716897726059e-05, 1.3971701264381409e-05, 1.4466233551502228e-05, 1.4960765838623047e-05]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 5.0, 7.0, 12.0, 8.0, 24.0, 18.0, 30.0, 22.0, 52.0, 78.0, 48.0, 89.0, 55.0, 93.0, 59.0, 76.0, 50.0, 52.0, 45.0, 21.0, 39.0, 22.0, 21.0, 16.0, 11.0, 16.0, 4.0, 6.0, 2.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.351139068603516e-06, -4.198402166366577e-06, -4.045665264129639e-06, -3.8929283618927e-06, -3.7401914596557617e-06, -3.5874545574188232e-06, -3.4347176551818848e-06, -3.2819807529449463e-06, -3.129243850708008e-06, -2.9765069484710693e-06, -2.823770046234131e-06, -2.6710331439971924e-06, -2.518296241760254e-06, -2.3655593395233154e-06, -2.212822437286377e-06, -2.0600855350494385e-06, -1.9073486328125e-06, -1.7546117305755615e-06, -1.601874828338623e-06, -1.4491379261016846e-06, -1.296401023864746e-06, -1.1436641216278076e-06, -9.909272193908691e-07, -8.381903171539307e-07, -6.854534149169922e-07, -5.327165126800537e-07, -3.7997961044311523e-07, -2.2724270820617676e-07, -7.450580596923828e-08, 7.82310962677002e-08, 2.3096799850463867e-07, 3.8370490074157715e-07, 5.364418029785156e-07, 6.891787052154541e-07, 8.419156074523926e-07, 9.94652509689331e-07, 1.1473894119262695e-06, 1.300126314163208e-06, 1.4528632164001465e-06, 1.605600118637085e-06, 1.7583370208740234e-06, 1.911073923110962e-06, 2.0638108253479004e-06, 2.216547727584839e-06, 2.3692846298217773e-06, 2.522021532058716e-06, 2.6747584342956543e-06, 2.8274953365325928e-06, 2.9802322387695312e-06, 3.1329691410064697e-06, 3.285706043243408e-06, 3.4384429454803467e-06, 3.591179847717285e-06, 3.7439167499542236e-06, 3.896653652191162e-06, 4.049390554428101e-06, 4.202127456665039e-06, 4.3548643589019775e-06, 4.507601261138916e-06, 4.6603381633758545e-06, 4.813075065612793e-06, 4.9658119678497314e-06, 5.11854887008667e-06, 5.271285772323608e-06, 5.424022674560547e-06]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 11.0, 4.0, 8.0, 17.0, 18.0, 22.0, 23.0, 36.0, 46.0, 90.0, 159.0, 361.0, 1570.0, 999818.0, 44801.0, 899.0, 288.0, 123.0, 83.0, 40.0, 35.0, 30.0, 12.0, 18.0, 9.0, 9.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.1140785217285156e-05, -4.963018000125885e-05, -4.8119574785232544e-05, -4.660896956920624e-05, -4.509836435317993e-05, -4.3587759137153625e-05, -4.207715392112732e-05, -4.056654870510101e-05, -3.905594348907471e-05, -3.75453382730484e-05, -3.6034733057022095e-05, -3.452412784099579e-05, -3.301352262496948e-05, -3.1502917408943176e-05, -2.999231219291687e-05, -2.8481706976890564e-05, -2.6971101760864258e-05, -2.546049654483795e-05, -2.3949891328811646e-05, -2.243928611278534e-05, -2.0928680896759033e-05, -1.9418075680732727e-05, -1.790747046470642e-05, -1.6396865248680115e-05, -1.4886260032653809e-05, -1.3375654816627502e-05, -1.1865049600601196e-05, -1.035444438457489e-05, -8.843839168548584e-06, -7.333233952522278e-06, -5.822628736495972e-06, -4.3120235204696655e-06, -2.8014183044433594e-06, -1.2908130884170532e-06, 2.1979212760925293e-07, 1.730397343635559e-06, 3.2410025596618652e-06, 4.751607775688171e-06, 6.2622129917144775e-06, 7.772818207740784e-06, 9.28342342376709e-06, 1.0794028639793396e-05, 1.2304633855819702e-05, 1.3815239071846008e-05, 1.5325844287872314e-05, 1.683644950389862e-05, 1.8347054719924927e-05, 1.9857659935951233e-05, 2.136826515197754e-05, 2.2878870368003845e-05, 2.438947558403015e-05, 2.5900080800056458e-05, 2.7410686016082764e-05, 2.892129123210907e-05, 3.0431896448135376e-05, 3.194250166416168e-05, 3.345310688018799e-05, 3.4963712096214294e-05, 3.64743173122406e-05, 3.798492252826691e-05, 3.949552774429321e-05, 4.100613296031952e-05, 4.2516738176345825e-05, 4.402734339237213e-05, 4.553794860839844e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 10.0, 1.0, 9.0, 18.0, 15.0, 16.0, 18.0, 27.0, 24.0, 44.0, 50.0, 65.0, 89.0, 149.0, 114.0, 83.0, 60.0, 44.0, 30.0, 26.0, 23.0, 22.0, 11.0, 14.0, 11.0, 7.0, 4.0, 3.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.227327346801758e-05, -5.072541534900665e-05, -4.917755722999573e-05, -4.76296991109848e-05, -4.608184099197388e-05, -4.453398287296295e-05, -4.2986124753952026e-05, -4.14382666349411e-05, -3.9890408515930176e-05, -3.834255039691925e-05, -3.6794692277908325e-05, -3.52468341588974e-05, -3.3698976039886475e-05, -3.215111792087555e-05, -3.0603259801864624e-05, -2.90554016828537e-05, -2.7507543563842773e-05, -2.5959685444831848e-05, -2.4411827325820923e-05, -2.2863969206809998e-05, -2.1316111087799072e-05, -1.9768252968788147e-05, -1.822039484977722e-05, -1.6672536730766296e-05, -1.5124678611755371e-05, -1.3576820492744446e-05, -1.202896237373352e-05, -1.0481104254722595e-05, -8.93324613571167e-06, -7.385388016700745e-06, -5.837529897689819e-06, -4.289671778678894e-06, -2.7418136596679688e-06, -1.1939555406570435e-06, 3.5390257835388184e-07, 1.9017606973648071e-06, 3.4496188163757324e-06, 4.997476935386658e-06, 6.545335054397583e-06, 8.093193173408508e-06, 9.641051292419434e-06, 1.1188909411430359e-05, 1.2736767530441284e-05, 1.428462564945221e-05, 1.5832483768463135e-05, 1.738034188747406e-05, 1.8928200006484985e-05, 2.047605812549591e-05, 2.2023916244506836e-05, 2.357177436351776e-05, 2.5119632482528687e-05, 2.6667490601539612e-05, 2.8215348720550537e-05, 2.9763206839561462e-05, 3.131106495857239e-05, 3.285892307758331e-05, 3.440678119659424e-05, 3.5954639315605164e-05, 3.750249743461609e-05, 3.9050355553627014e-05, 4.059821367263794e-05, 4.2146071791648865e-05, 4.369392991065979e-05, 4.5241788029670715e-05, 4.678964614868164e-05]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 962.0, 55.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1434638798236847, -0.10585266351699829, -0.06824144721031189, -0.03063023090362549, 0.006980985403060913, 0.044592201709747314, 0.08220341801643372, 0.11981463432312012, 0.15742585062980652, 0.19503706693649292, 0.23264828324317932, 0.2702594995498657, 0.3078707158565521, 0.3454819321632385, 0.3830931484699249, 0.42070436477661133, 0.45831558108329773, 0.49592679738998413, 0.5335379838943481, 0.5711492300033569, 0.6087604761123657, 0.6463716626167297, 0.6839828491210938, 0.7215940952301025, 0.7592053413391113, 0.7968165874481201, 0.8344277739524841, 0.8720389604568481, 0.9096502065658569, 0.9472614526748657, 0.9848726391792297, 1.0224838256835938, 1.0600950717926025, 1.0977063179016113, 1.1353175640106201, 1.1729286909103394, 1.2105399370193481, 1.248151183128357, 1.2857623100280762, 1.323373556137085, 1.3609848022460938, 1.3985960483551025, 1.4362072944641113, 1.4738184213638306, 1.5114296674728394, 1.5490409135818481, 1.5866520404815674, 1.6242632865905762, 1.661874532699585, 1.6994857788085938, 1.7370970249176025, 1.7747081518173218, 1.8123193979263306, 1.8499306440353394, 1.8875417709350586, 1.9251530170440674, 1.9627642631530762, 2.000375509262085, 2.0379867553710938, 2.0755980014801025, 2.1132092475891113, 2.150820255279541, 2.18843150138855, 2.2260427474975586, 2.2636539936065674]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 6.0, 8.0, 6.0, 17.0, 20.0, 10.0, 11.0, 16.0, 21.0, 22.0, 21.0, 24.0, 31.0, 31.0, 42.0, 37.0, 38.0, 44.0, 42.0, 54.0, 34.0, 41.0, 47.0, 45.0, 35.0, 34.0, 24.0, 35.0, 32.0, 30.0, 16.0, 19.0, 20.0, 13.0, 14.0, 7.0, 9.0, 5.0, 8.0, 4.0, 4.0, 0.0, 4.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18014496564865112, -0.17396490275859833, -0.16778483986854553, -0.16160479187965393, -0.15542472898960114, -0.14924466609954834, -0.14306460320949554, -0.13688454031944275, -0.13070449233055115, -0.12452442944049835, -0.11834437400102615, -0.11216431111097336, -0.10598425567150116, -0.09980419278144836, -0.09362412989139557, -0.08744406700134277, -0.08126400411128998, -0.07508394122123718, -0.06890388578176498, -0.06272382289171219, -0.05654376372694969, -0.050363704562187195, -0.0441836416721344, -0.0380035825073719, -0.031823523342609406, -0.02564346417784691, -0.019463403150439262, -0.013283342123031616, -0.007103282958269119, -0.0009232237935066223, 0.005256839096546173, 0.01143689826130867, 0.017616957426071167, 0.023797016590833664, 0.02997707761824131, 0.036157138645648956, 0.04233719781041145, 0.04851725697517395, 0.054697319865226746, 0.06087737902998924, 0.06705743819475174, 0.07323750108480453, 0.07941755652427673, 0.08559761941432953, 0.09177768230438232, 0.09795773774385452, 0.10413780063390732, 0.11031785607337952, 0.11649791896343231, 0.12267798185348511, 0.1288580447435379, 0.1350381076335907, 0.1412181556224823, 0.1473982185125351, 0.1535782814025879, 0.15975834429264069, 0.16593840718269348, 0.17211847007274628, 0.17829853296279907, 0.18447858095169067, 0.19065864384174347, 0.19683870673179626, 0.20301876962184906, 0.20919883251190186, 0.21537888050079346]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 7.0, 4.0, 3.0, 7.0, 7.0, 10.0, 10.0, 9.0, 10.0, 24.0, 106.0, 4193696.0, 247.0, 44.0, 14.0, 15.0, 10.0, 13.0, 5.0, 4.0, 4.0, 4.0, 3.0, 2.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.00033211708068847656, -0.0003213733434677124, -0.00031062960624694824, -0.0002998858690261841, -0.0002891421318054199, -0.00027839839458465576, -0.0002676546573638916, -0.00025691092014312744, -0.0002461671829223633, -0.00023542344570159912, -0.00022467970848083496, -0.0002139359712600708, -0.00020319223403930664, -0.00019244849681854248, -0.00018170475959777832, -0.00017096102237701416, -0.00016021728515625, -0.00014947354793548584, -0.00013872981071472168, -0.00012798607349395752, -0.00011724233627319336, -0.0001064985990524292, -9.575486183166504e-05, -8.501112461090088e-05, -7.426738739013672e-05, -6.352365016937256e-05, -5.27799129486084e-05, -4.203617572784424e-05, -3.129243850708008e-05, -2.0548701286315918e-05, -9.804964065551758e-06, 9.387731552124023e-07, 1.1682510375976562e-05, 2.2426247596740723e-05, 3.316998481750488e-05, 4.391372203826904e-05, 5.46574592590332e-05, 6.540119647979736e-05, 7.614493370056152e-05, 8.688867092132568e-05, 9.763240814208984e-05, 0.000108376145362854, 0.00011911988258361816, 0.00012986361980438232, 0.00014060735702514648, 0.00015135109424591064, 0.0001620948314666748, 0.00017283856868743896, 0.00018358230590820312, 0.00019432604312896729, 0.00020506978034973145, 0.0002158135175704956, 0.00022655725479125977, 0.00023730099201202393, 0.0002480447292327881, 0.00025878846645355225, 0.0002695322036743164, 0.00028027594089508057, 0.0002910196781158447, 0.0003017634153366089, 0.00031250715255737305, 0.0003232508897781372, 0.00033399462699890137, 0.00034473836421966553, 0.0003554821014404297]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 4.0, 9.0, 15.0, 17.0, 15.0, 18.0, 119.0, 400.0, 239.0, 47.0, 23.0, 9.0, 8.0, 5.0, 12.0, 9.0, 7.0, 3.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0193634033203125, -0.01875019073486328, -0.018136978149414062, -0.017523765563964844, -0.016910552978515625, -0.016297340393066406, -0.015684127807617188, -0.015070915222167969, -0.01445770263671875, -0.013844490051269531, -0.013231277465820312, -0.012618064880371094, -0.012004852294921875, -0.011391639709472656, -0.010778427124023438, -0.010165214538574219, -0.009552001953125, -0.008938789367675781, -0.008325576782226562, -0.007712364196777344, -0.007099151611328125, -0.006485939025878906, -0.0058727264404296875, -0.005259513854980469, -0.00464630126953125, -0.004033088684082031, -0.0034198760986328125, -0.0028066635131835938, -0.002193450927734375, -0.0015802383422851562, -0.0009670257568359375, -0.00035381317138671875, 0.0002593994140625, 0.0008726119995117188, 0.0014858245849609375, 0.0020990371704101562, 0.002712249755859375, 0.0033254623413085938, 0.0039386749267578125, 0.004551887512207031, 0.00516510009765625, 0.005778312683105469, 0.0063915252685546875, 0.007004737854003906, 0.007617950439453125, 0.008231163024902344, 0.008844375610351562, 0.009457588195800781, 0.01007080078125, 0.010684013366699219, 0.011297225952148438, 0.011910438537597656, 0.012523651123046875, 0.013136863708496094, 0.013750076293945312, 0.014363288879394531, 0.01497650146484375, 0.015589714050292969, 0.016202926635742188, 0.016816139221191406, 0.017429351806640625, 0.018042564392089844, 0.018655776977539062, 0.01926898956298828, 0.0198822021484375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 22.0, 15.0, 34.0, 69.0, 84.0, 84.0, 90.0, 4193364.0, 87.0, 92.0, 112.0, 92.0, 64.0, 35.0, 32.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015115737915039062, -0.0014669299125671387, -0.001422286033630371, -0.0013776421546936035, -0.001332998275756836, -0.0012883543968200684, -0.0012437105178833008, -0.0011990666389465332, -0.0011544227600097656, -0.001109778881072998, -0.0010651350021362305, -0.0010204911231994629, -0.0009758472442626953, -0.0009312033653259277, -0.0008865594863891602, -0.0008419156074523926, -0.000797271728515625, -0.0007526278495788574, -0.0007079839706420898, -0.0006633400917053223, -0.0006186962127685547, -0.0005740523338317871, -0.0005294084548950195, -0.00048476457595825195, -0.0004401206970214844, -0.0003954768180847168, -0.0003508329391479492, -0.00030618906021118164, -0.00026154518127441406, -0.00021690130233764648, -0.0001722574234008789, -0.00012761354446411133, -8.296966552734375e-05, -3.832578659057617e-05, 6.318092346191406e-06, 5.0961971282958984e-05, 9.560585021972656e-05, 0.00014024972915649414, 0.00018489360809326172, 0.0002295374870300293, 0.0002741813659667969, 0.00031882524490356445, 0.00036346912384033203, 0.0004081130027770996, 0.0004527568817138672, 0.0004974007606506348, 0.0005420446395874023, 0.0005866885185241699, 0.0006313323974609375, 0.0006759762763977051, 0.0007206201553344727, 0.0007652640342712402, 0.0008099079132080078, 0.0008545517921447754, 0.000899195671081543, 0.0009438395500183105, 0.0009884834289550781, 0.0010331273078918457, 0.0010777711868286133, 0.0011224150657653809, 0.0011670589447021484, 0.001211702823638916, 0.0012563467025756836, 0.0013009905815124512, 0.0013456344604492188]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4095.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [0.0, 7.059425115585327e-06, 1.4118850231170654e-05, 2.117827534675598e-05, 2.823770046234131e-05, 3.5297125577926636e-05, 4.235655069351196e-05, 4.941597580909729e-05, 5.647540092468262e-05, 6.353482604026794e-05, 7.059425115585327e-05, 7.76536762714386e-05, 8.471310138702393e-05, 9.177252650260925e-05, 9.883195161819458e-05, 0.00010589137673377991, 0.00011295080184936523, 0.00012001022696495056, 0.0001270696520805359, 0.00013412907719612122, 0.00014118850231170654, 0.00014824792742729187, 0.0001553073525428772, 0.00016236677765846252, 0.00016942620277404785, 0.00017648562788963318, 0.0001835450530052185, 0.00019060447812080383, 0.00019766390323638916, 0.0002047233283519745, 0.00021178275346755981, 0.00021884217858314514, 0.00022590160369873047, 0.0002329610288143158, 0.00024002045392990112, 0.00024707987904548645, 0.0002541393041610718, 0.0002611987292766571, 0.00026825815439224243, 0.00027531757950782776, 0.0002823770046234131, 0.0002894364297389984, 0.00029649585485458374, 0.00030355527997016907, 0.0003106147050857544, 0.0003176741302013397, 0.00032473355531692505, 0.0003317929804325104, 0.0003388524055480957, 0.00034591183066368103, 0.00035297125577926636, 0.0003600306808948517, 0.000367090106010437, 0.00037414953112602234, 0.00038120895624160767, 0.000388268381357193, 0.0003953278064727783, 0.00040238723158836365, 0.000409446656703949, 0.0004165060818195343, 0.00042356550693511963, 0.00043062493205070496, 0.0004376843571662903, 0.0004447437822818756, 0.00045180320739746094]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1011.0, 7.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024557714350521564, -0.002335949568077922, -0.0022161277011036873, -0.0020963058341294527, -0.001976483967155218, -0.0018566621001809835, -0.001736840233206749, -0.0016170183662325144, -0.0014971964992582798, -0.0013773746322840452, -0.0012575527653098106, -0.001137730898335576, -0.0010179090313613415, -0.000898087106179446, -0.0007782652392052114, -0.0006584433722309768, -0.0005386214470490813, -0.00041879958007484674, -0.00029897771310061216, -0.00017915581702254713, -5.9333950048312545e-05, 6.048794602975249e-05, 0.00018030981300398707, 0.00030013167997822165, 0.00041995354695245624, 0.0005397754139266908, 0.0006595972809009254, 0.0007794192060828209, 0.0008992410730570555, 0.00101906294003129, 0.0011388848070055246, 0.0012587066739797592, 0.0013785285409539938, 0.0014983504079282284, 0.001618172274902463, 0.0017379941418766975, 0.0018578160088509321, 0.0019776378758251667, 0.0020974597427994013, 0.002217281609773636, 0.0023371034767478704, 0.002456925343722105, 0.0025767472106963396, 0.002696569077670574, 0.0028163909446448088, 0.0029362128116190434, 0.003056034678593278, 0.0031758565455675125, 0.0032956786453723907, 0.0034155005123466253, 0.00353532237932086, 0.0036551442462950945, 0.003774966113269329, 0.0038947879802435637, 0.004014609847217798, 0.0041344319470226765, 0.004254253581166267, 0.004374075680971146, 0.0044938973151147366, 0.004613719414919615, 0.004733541049063206, 0.004853363148868084, 0.004973184783011675, 0.005093006882816553, 0.005212828516960144]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 12.0, 16.0, 36.0, 86.0, 129.0, 210.0, 164.0, 136.0, 98.0, 53.0, 26.0, 16.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00039565563201904297, -0.0003751404583454132, -0.00035462528467178345, -0.0003341101109981537, -0.0003135949373245239, -0.00029307976365089417, -0.0002725645899772644, -0.00025204941630363464, -0.00023153424263000488, -0.00021101906895637512, -0.00019050389528274536, -0.0001699887216091156, -0.00014947354793548584, -0.00012895837426185608, -0.00010844320058822632, -8.792802691459656e-05, -6.74128532409668e-05, -4.6897679567337036e-05, -2.6382505893707275e-05, -5.867332220077515e-06, 1.4647841453552246e-05, 3.516301512718201e-05, 5.567818880081177e-05, 7.619336247444153e-05, 9.670853614807129e-05, 0.00011722370982170105, 0.0001377388834953308, 0.00015825405716896057, 0.00017876923084259033, 0.0001992844045162201, 0.00021979957818984985, 0.00024031475186347961, 0.0002608299255371094, 0.00028134509921073914, 0.0003018602728843689, 0.00032237544655799866, 0.0003428906202316284, 0.0003634057939052582, 0.00038392096757888794, 0.0004044361412525177, 0.00042495131492614746, 0.0004454664885997772, 0.000465981662273407, 0.00048649683594703674, 0.0005070120096206665, 0.0005275271832942963, 0.000548042356967926, 0.0005685575306415558, 0.0005890727043151855, 0.0006095878779888153, 0.0006301030516624451, 0.0006506182253360748, 0.0006711333990097046, 0.0006916485726833344, 0.0007121637463569641, 0.0007326789200305939, 0.0007531940937042236, 0.0007737092673778534, 0.0007942244410514832, 0.0008147396147251129, 0.0008352547883987427, 0.0008557699620723724, 0.0008762851357460022, 0.000896800309419632, 0.0009173154830932617]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 0.0, 4.0, 0.0, 4.0, 8.0, 3.0, 9.0, 11.0, 16.0, 19.0, 30.0, 26.0, 46.0, 67.0, 108.0, 136.0, 227.0, 368.0, 644.0, 1066.0, 2036.0, 5016.0, 20546.0, 964614.0, 40333.0, 7310.0, 2663.0, 1276.0, 728.0, 404.0, 242.0, 161.0, 110.0, 81.0, 55.0, 56.0, 23.0, 30.0, 15.0, 14.0, 16.0, 3.0, 6.0, 9.0, 1.0, 2.0, 7.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0295562744140625, -0.02862238883972168, -0.02768850326538086, -0.02675461769104004, -0.02582073211669922, -0.0248868465423584, -0.023952960968017578, -0.023019075393676758, -0.022085189819335938, -0.021151304244995117, -0.020217418670654297, -0.019283533096313477, -0.018349647521972656, -0.017415761947631836, -0.016481876373291016, -0.015547990798950195, -0.014614105224609375, -0.013680219650268555, -0.012746334075927734, -0.011812448501586914, -0.010878562927246094, -0.009944677352905273, -0.009010791778564453, -0.008076906204223633, -0.0071430206298828125, -0.006209135055541992, -0.005275249481201172, -0.0043413639068603516, -0.0034074783325195312, -0.002473592758178711, -0.0015397071838378906, -0.0006058216094970703, 0.00032806396484375, 0.0012619495391845703, 0.0021958351135253906, 0.003129720687866211, 0.004063606262207031, 0.0049974918365478516, 0.005931377410888672, 0.006865262985229492, 0.0077991485595703125, 0.008733034133911133, 0.009666919708251953, 0.010600805282592773, 0.011534690856933594, 0.012468576431274414, 0.013402462005615234, 0.014336347579956055, 0.015270233154296875, 0.016204118728637695, 0.017138004302978516, 0.018071889877319336, 0.019005775451660156, 0.019939661026000977, 0.020873546600341797, 0.021807432174682617, 0.022741317749023438, 0.023675203323364258, 0.024609088897705078, 0.0255429744720459, 0.02647686004638672, 0.02741074562072754, 0.02834463119506836, 0.02927851676940918, 0.03021240234375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 4.0, 9.0, 15.0, 17.0, 15.0, 18.0, 119.0, 400.0, 239.0, 47.0, 23.0, 9.0, 8.0, 5.0, 12.0, 9.0, 7.0, 3.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0193634033203125, -0.01875019073486328, -0.018136978149414062, -0.017523765563964844, -0.016910552978515625, -0.016297340393066406, -0.015684127807617188, -0.015070915222167969, -0.01445770263671875, -0.013844490051269531, -0.013231277465820312, -0.012618064880371094, -0.012004852294921875, -0.011391639709472656, -0.010778427124023438, -0.010165214538574219, -0.009552001953125, -0.008938789367675781, -0.008325576782226562, -0.007712364196777344, -0.007099151611328125, -0.006485939025878906, -0.0058727264404296875, -0.005259513854980469, -0.00464630126953125, -0.004033088684082031, -0.0034198760986328125, -0.0028066635131835938, -0.002193450927734375, -0.0015802383422851562, -0.0009670257568359375, -0.00035381317138671875, 0.0002593994140625, 0.0008726119995117188, 0.0014858245849609375, 0.0020990371704101562, 0.002712249755859375, 0.0033254623413085938, 0.0039386749267578125, 0.004551887512207031, 0.00516510009765625, 0.005778312683105469, 0.0063915252685546875, 0.007004737854003906, 0.007617950439453125, 0.008231163024902344, 0.008844375610351562, 0.009457588195800781, 0.01007080078125, 0.010684013366699219, 0.011297225952148438, 0.011910438537597656, 0.012523651123046875, 0.013136863708496094, 0.013750076293945312, 0.014363288879394531, 0.01497650146484375, 0.015589714050292969, 0.016202926635742188, 0.016816139221191406, 0.017429351806640625, 0.018042564392089844, 0.018655776977539062, 0.01926898956298828, 0.0198822021484375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 2.0, 6.0, 4.0, 8.0, 4.0, 8.0, 11.0, 12.0, 13.0, 17.0, 17.0, 20.0, 21.0, 35.0, 31.0, 41.0, 78.0, 75.0, 110.0, 140.0, 236.0, 423.0, 908.0, 2732.0, 916797.0, 122973.0, 1913.0, 727.0, 384.0, 197.0, 129.0, 91.0, 84.0, 54.0, 53.0, 39.0, 32.0, 20.0, 19.0, 10.0, 13.0, 15.0, 13.0, 11.0, 7.0, 3.0, 3.0, 5.0, 5.0, 1.0, 4.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03192138671875, -0.030776500701904297, -0.029631614685058594, -0.02848672866821289, -0.027341842651367188, -0.026196956634521484, -0.02505207061767578, -0.023907184600830078, -0.022762298583984375, -0.021617412567138672, -0.02047252655029297, -0.019327640533447266, -0.018182754516601562, -0.01703786849975586, -0.015892982482910156, -0.014748096466064453, -0.01360321044921875, -0.012458324432373047, -0.011313438415527344, -0.01016855239868164, -0.009023666381835938, -0.007878780364990234, -0.006733894348144531, -0.005589008331298828, -0.004444122314453125, -0.003299236297607422, -0.0021543502807617188, -0.0010094642639160156, 0.0001354217529296875, 0.0012803077697753906, 0.0024251937866210938, 0.003570079803466797, 0.0047149658203125, 0.005859851837158203, 0.007004737854003906, 0.00814962387084961, 0.009294509887695312, 0.010439395904541016, 0.011584281921386719, 0.012729167938232422, 0.013874053955078125, 0.015018939971923828, 0.01616382598876953, 0.017308712005615234, 0.018453598022460938, 0.01959848403930664, 0.020743370056152344, 0.021888256072998047, 0.02303314208984375, 0.024178028106689453, 0.025322914123535156, 0.02646780014038086, 0.027612686157226562, 0.028757572174072266, 0.02990245819091797, 0.031047344207763672, 0.032192230224609375, 0.03333711624145508, 0.03448200225830078, 0.035626888275146484, 0.03677177429199219, 0.03791666030883789, 0.039061546325683594, 0.0402064323425293, 0.041351318359375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 2.0, 5.0, 4.0, 8.0, 4.0, 9.0, 11.0, 8.0, 12.0, 19.0, 13.0, 16.0, 15.0, 20.0, 21.0, 20.0, 42.0, 24.0, 32.0, 41.0, 35.0, 24.0, 45.0, 40.0, 36.0, 29.0, 35.0, 33.0, 36.0, 33.0, 32.0, 31.0, 36.0, 19.0, 35.0, 26.0, 24.0, 18.0, 18.0, 9.0, 13.0, 16.0, 13.0, 12.0, 7.0, 3.0, 3.0, 5.0, 4.0, 2.0, 4.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03009033203125, -0.02901458740234375, -0.0279388427734375, -0.02686309814453125, -0.025787353515625, -0.02471160888671875, -0.0236358642578125, -0.02256011962890625, -0.021484375, -0.02040863037109375, -0.0193328857421875, -0.01825714111328125, -0.017181396484375, -0.01610565185546875, -0.0150299072265625, -0.01395416259765625, -0.01287841796875, -0.01180267333984375, -0.0107269287109375, -0.00965118408203125, -0.008575439453125, -0.00749969482421875, -0.0064239501953125, -0.00534820556640625, -0.0042724609375, -0.00319671630859375, -0.0021209716796875, -0.00104522705078125, 3.0517578125e-05, 0.00110626220703125, 0.0021820068359375, 0.00325775146484375, 0.00433349609375, 0.00540924072265625, 0.0064849853515625, 0.00756072998046875, 0.008636474609375, 0.00971221923828125, 0.0107879638671875, 0.01186370849609375, 0.012939453125, 0.01401519775390625, 0.0150909423828125, 0.01616668701171875, 0.017242431640625, 0.01831817626953125, 0.0193939208984375, 0.02046966552734375, 0.02154541015625, 0.02262115478515625, 0.0236968994140625, 0.02477264404296875, 0.025848388671875, 0.02692413330078125, 0.0279998779296875, 0.02907562255859375, 0.0301513671875, 0.03122711181640625, 0.0323028564453125, 0.03337860107421875, 0.034454345703125, 0.03553009033203125, 0.0366058349609375, 0.03768157958984375, 0.03875732421875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 8.0, 3.0, 3.0, 13.0, 12.0, 25.0, 32.0, 58.0, 92.0, 153.0, 337.0, 529.0, 984.0, 2886.0, 7178.0, 41365.0, 685606.0, 269217.0, 29712.0, 5947.0, 2469.0, 862.0, 440.0, 250.0, 118.0, 78.0, 60.0, 39.0, 31.0, 12.0, 16.0, 9.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-1.1861324310302734e-05, -1.1540018022060394e-05, -1.1218711733818054e-05, -1.0897405445575714e-05, -1.0576099157333374e-05, -1.0254792869091034e-05, -9.933486580848694e-06, -9.612180292606354e-06, -9.290874004364014e-06, -8.969567716121674e-06, -8.648261427879333e-06, -8.326955139636993e-06, -8.005648851394653e-06, -7.684342563152313e-06, -7.363036274909973e-06, -7.041729986667633e-06, -6.720423698425293e-06, -6.399117410182953e-06, -6.077811121940613e-06, -5.756504833698273e-06, -5.435198545455933e-06, -5.1138922572135925e-06, -4.7925859689712524e-06, -4.471279680728912e-06, -4.149973392486572e-06, -3.828667104244232e-06, -3.507360816001892e-06, -3.186054527759552e-06, -2.864748239517212e-06, -2.543441951274872e-06, -2.2221356630325317e-06, -1.9008293747901917e-06, -1.5795230865478516e-06, -1.2582167983055115e-06, -9.369105100631714e-07, -6.156042218208313e-07, -2.942979335784912e-07, 2.7008354663848877e-08, 3.4831464290618896e-07, 6.69620931148529e-07, 9.909272193908691e-07, 1.3122335076332092e-06, 1.6335397958755493e-06, 1.9548460841178894e-06, 2.2761523723602295e-06, 2.5974586606025696e-06, 2.9187649488449097e-06, 3.2400712370872498e-06, 3.56137752532959e-06, 3.88268381357193e-06, 4.20399010181427e-06, 4.52529639005661e-06, 4.84660267829895e-06, 5.16790896654129e-06, 5.48921525478363e-06, 5.8105215430259705e-06, 6.1318278312683105e-06, 6.453134119510651e-06, 6.774440407752991e-06, 7.095746695995331e-06, 7.417052984237671e-06, 7.738359272480011e-06, 8.059665560722351e-06, 8.380971848964691e-06, 8.702278137207031e-06]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 6.0, 6.0, 11.0, 19.0, 25.0, 34.0, 57.0, 78.0, 64.0, 128.0, 124.0, 88.0, 113.0, 55.0, 39.0, 39.0, 17.0, 22.0, 8.0, 8.0, 10.0, 9.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.68899917602539e-06, -7.472001016139984e-06, -7.255002856254578e-06, -7.038004696369171e-06, -6.821006536483765e-06, -6.604008376598358e-06, -6.387010216712952e-06, -6.170012056827545e-06, -5.953013896942139e-06, -5.736015737056732e-06, -5.519017577171326e-06, -5.302019417285919e-06, -5.085021257400513e-06, -4.868023097515106e-06, -4.6510249376297e-06, -4.434026777744293e-06, -4.217028617858887e-06, -4.00003045797348e-06, -3.7830322980880737e-06, -3.5660341382026672e-06, -3.3490359783172607e-06, -3.1320378184318542e-06, -2.9150396585464478e-06, -2.6980414986610413e-06, -2.4810433387756348e-06, -2.2640451788902283e-06, -2.0470470190048218e-06, -1.8300488591194153e-06, -1.6130506992340088e-06, -1.3960525393486023e-06, -1.1790543794631958e-06, -9.620562195777893e-07, -7.450580596923828e-07, -5.280598998069763e-07, -3.110617399215698e-07, -9.406358003616333e-08, 1.2293457984924316e-07, 3.3993273973464966e-07, 5.569308996200562e-07, 7.739290595054626e-07, 9.909272193908691e-07, 1.2079253792762756e-06, 1.4249235391616821e-06, 1.6419216990470886e-06, 1.8589198589324951e-06, 2.0759180188179016e-06, 2.292916178703308e-06, 2.5099143385887146e-06, 2.726912498474121e-06, 2.9439106583595276e-06, 3.160908818244934e-06, 3.3779069781303406e-06, 3.594905138015747e-06, 3.8119032979011536e-06, 4.02890145778656e-06, 4.2458996176719666e-06, 4.462897777557373e-06, 4.6798959374427795e-06, 4.896894097328186e-06, 5.1138922572135925e-06, 5.330890417098999e-06, 5.5478885769844055e-06, 5.764886736869812e-06, 5.9818848967552185e-06, 6.198883056640625e-06]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 9.0, 4.0, 8.0, 4.0, 12.0, 11.0, 20.0, 16.0, 32.0, 43.0, 64.0, 99.0, 181.0, 422.0, 1451.0, 977116.0, 67314.0, 905.0, 362.0, 152.0, 100.0, 61.0, 42.0, 32.0, 26.0, 20.0, 10.0, 8.0, 7.0, 5.0, 2.0, 7.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.49879264831543e-05, -3.406405448913574e-05, -3.314018249511719e-05, -3.221631050109863e-05, -3.129243850708008e-05, -3.0368566513061523e-05, -2.944469451904297e-05, -2.8520822525024414e-05, -2.759695053100586e-05, -2.6673078536987305e-05, -2.574920654296875e-05, -2.4825334548950195e-05, -2.390146255493164e-05, -2.2977590560913086e-05, -2.205371856689453e-05, -2.1129846572875977e-05, -2.0205974578857422e-05, -1.9282102584838867e-05, -1.8358230590820312e-05, -1.7434358596801758e-05, -1.6510486602783203e-05, -1.558661460876465e-05, -1.4662742614746094e-05, -1.3738870620727539e-05, -1.2814998626708984e-05, -1.189112663269043e-05, -1.0967254638671875e-05, -1.004338264465332e-05, -9.119510650634766e-06, -8.195638656616211e-06, -7.271766662597656e-06, -6.3478946685791016e-06, -5.424022674560547e-06, -4.500150680541992e-06, -3.5762786865234375e-06, -2.652406692504883e-06, -1.7285346984863281e-06, -8.046627044677734e-07, 1.1920928955078125e-07, 1.043081283569336e-06, 1.9669532775878906e-06, 2.8908252716064453e-06, 3.814697265625e-06, 4.738569259643555e-06, 5.662441253662109e-06, 6.586313247680664e-06, 7.510185241699219e-06, 8.434057235717773e-06, 9.357929229736328e-06, 1.0281801223754883e-05, 1.1205673217773438e-05, 1.2129545211791992e-05, 1.3053417205810547e-05, 1.3977289199829102e-05, 1.4901161193847656e-05, 1.582503318786621e-05, 1.6748905181884766e-05, 1.767277717590332e-05, 1.8596649169921875e-05, 1.952052116394043e-05, 2.0444393157958984e-05, 2.136826515197754e-05, 2.2292137145996094e-05, 2.321600914001465e-05, 2.4139881134033203e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 9.0, 5.0, 8.0, 7.0, 7.0, 12.0, 11.0, 15.0, 17.0, 30.0, 34.0, 34.0, 44.0, 66.0, 96.0, 132.0, 107.0, 76.0, 67.0, 43.0, 46.0, 20.0, 18.0, 19.0, 23.0, 14.0, 9.0, 6.0, 6.0, 5.0, 2.0, 5.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.266334533691406e-05, -3.17990779876709e-05, -3.0934810638427734e-05, -3.007054328918457e-05, -2.9206275939941406e-05, -2.8342008590698242e-05, -2.7477741241455078e-05, -2.6613473892211914e-05, -2.574920654296875e-05, -2.4884939193725586e-05, -2.4020671844482422e-05, -2.3156404495239258e-05, -2.2292137145996094e-05, -2.142786979675293e-05, -2.0563602447509766e-05, -1.96993350982666e-05, -1.8835067749023438e-05, -1.7970800399780273e-05, -1.710653305053711e-05, -1.6242265701293945e-05, -1.537799835205078e-05, -1.4513731002807617e-05, -1.3649463653564453e-05, -1.2785196304321289e-05, -1.1920928955078125e-05, -1.1056661605834961e-05, -1.0192394256591797e-05, -9.328126907348633e-06, -8.463859558105469e-06, -7.599592208862305e-06, -6.735324859619141e-06, -5.8710575103759766e-06, -5.0067901611328125e-06, -4.1425228118896484e-06, -3.2782554626464844e-06, -2.4139881134033203e-06, -1.5497207641601562e-06, -6.854534149169922e-07, 1.7881393432617188e-07, 1.043081283569336e-06, 1.9073486328125e-06, 2.771615982055664e-06, 3.635883331298828e-06, 4.500150680541992e-06, 5.364418029785156e-06, 6.22868537902832e-06, 7.092952728271484e-06, 7.957220077514648e-06, 8.821487426757812e-06, 9.685754776000977e-06, 1.055002212524414e-05, 1.1414289474487305e-05, 1.2278556823730469e-05, 1.3142824172973633e-05, 1.4007091522216797e-05, 1.4871358871459961e-05, 1.5735626220703125e-05, 1.659989356994629e-05, 1.7464160919189453e-05, 1.8328428268432617e-05, 1.919269561767578e-05, 2.0056962966918945e-05, 2.092123031616211e-05, 2.1785497665405273e-05, 2.2649765014648438e-05]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 27.0, 871.0, 115.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5965543985366821, -0.5840434432029724, -0.5715325474739075, -0.5590215921401978, -0.546510636806488, -0.5339996814727783, -0.5214887857437134, -0.5089778304100037, -0.49646687507629395, -0.4839559495449066, -0.4714449942111969, -0.45893406867980957, -0.44642311334609985, -0.4339121878147125, -0.4214012324810028, -0.4088903069496155, -0.39637935161590576, -0.38386842608451843, -0.3713574707508087, -0.3588465452194214, -0.34633558988571167, -0.33382466435432434, -0.3213137090206146, -0.3088027834892273, -0.29629185795783997, -0.28378093242645264, -0.2712699770927429, -0.2587590515613556, -0.24624809622764587, -0.23373717069625854, -0.22122621536254883, -0.2087152898311615, -0.19620433449745178, -0.18369339406490326, -0.17118245363235474, -0.1586715131998062, -0.1461605727672577, -0.13364964723587036, -0.12113869935274124, -0.10862775892019272, -0.0961168184876442, -0.08360587805509567, -0.07109493762254715, -0.058584000915288925, -0.0460730604827404, -0.03356212377548218, -0.021051183342933655, -0.008540242910385132, 0.003970697522163391, 0.016481637954711914, 0.028992576524615288, 0.04150351509451866, 0.054014455527067184, 0.06652539223432541, 0.07903633266687393, 0.09154727309942245, 0.10405821353197098, 0.1165691539645195, 0.12908008694648743, 0.14159102737903595, 0.15410196781158447, 0.166612908244133, 0.17912384867668152, 0.19163478910923004, 0.20414572954177856]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 7.0, 3.0, 3.0, 10.0, 8.0, 12.0, 11.0, 13.0, 22.0, 25.0, 33.0, 35.0, 45.0, 33.0, 45.0, 49.0, 47.0, 68.0, 69.0, 55.0, 46.0, 53.0, 39.0, 38.0, 30.0, 27.0, 23.0, 35.0, 23.0, 18.0, 14.0, 19.0, 12.0, 11.0, 4.0, 2.0, 4.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.25194251537323, -0.2448427826166153, -0.2377430647611618, -0.23064333200454712, -0.22354361414909363, -0.21644388139247894, -0.20934414863586426, -0.20224443078041077, -0.19514471292495728, -0.1880449801683426, -0.1809452623128891, -0.17384552955627441, -0.16674581170082092, -0.15964607894420624, -0.15254634618759155, -0.14544662833213806, -0.13834689557552338, -0.1312471628189087, -0.1241474449634552, -0.11704771220684052, -0.10994799435138702, -0.10284826159477234, -0.09574853628873825, -0.08864881098270416, -0.08154908567667007, -0.07444936037063599, -0.0673496350646019, -0.06024990603327751, -0.05315018072724342, -0.046050455421209335, -0.03895072638988495, -0.03185100108385086, -0.024751275777816772, -0.017651550471782684, -0.010551823303103447, -0.0034520961344242096, 0.0036476291716098785, 0.010747354477643967, 0.017847083508968353, 0.02494680881500244, 0.03204653412103653, 0.03914625942707062, 0.046245984733104706, 0.05334571376442909, 0.06044543907046318, 0.06754516065120697, 0.07464489340782166, 0.08174461871385574, 0.08884434401988983, 0.09594406932592392, 0.10304379463195801, 0.11014352738857269, 0.11724324524402618, 0.12434297800064087, 0.13144269585609436, 0.13854242861270905, 0.14564216136932373, 0.15274189412593842, 0.1598416119813919, 0.1669413447380066, 0.17404106259346008, 0.18114079535007477, 0.18824052810668945, 0.19534024596214294, 0.20243996381759644]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 4.0, 6.0, 10.0, 12.0, 4.0, 8.0, 10.0, 24.0, 53.0, 264.0, 4193670.0, 100.0, 14.0, 19.0, 16.0, 14.0, 8.0, 3.0, 2.0, 3.0, 5.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0033054351806640625, -0.003203153610229492, -0.003100872039794922, -0.0029985904693603516, -0.0028963088989257812, -0.002794027328491211, -0.0026917457580566406, -0.0025894641876220703, -0.0024871826171875, -0.0023849010467529297, -0.0022826194763183594, -0.002180337905883789, -0.0020780563354492188, -0.0019757747650146484, -0.0018734931945800781, -0.0017712116241455078, -0.0016689300537109375, -0.0015666484832763672, -0.0014643669128417969, -0.0013620853424072266, -0.0012598037719726562, -0.001157522201538086, -0.0010552406311035156, -0.0009529590606689453, -0.000850677490234375, -0.0007483959197998047, -0.0006461143493652344, -0.0005438327789306641, -0.00044155120849609375, -0.00033926963806152344, -0.00023698806762695312, -0.0001347064971923828, -3.24249267578125e-05, 6.985664367675781e-05, 0.00017213821411132812, 0.00027441978454589844, 0.00037670135498046875, 0.00047898292541503906, 0.0005812644958496094, 0.0006835460662841797, 0.00078582763671875, 0.0008881092071533203, 0.0009903907775878906, 0.001092672348022461, 0.0011949539184570312, 0.0012972354888916016, 0.0013995170593261719, 0.0015017986297607422, 0.0016040802001953125, 0.0017063617706298828, 0.0018086433410644531, 0.0019109249114990234, 0.0020132064819335938, 0.002115488052368164, 0.0022177696228027344, 0.0023200511932373047, 0.002422332763671875, 0.0025246143341064453, 0.0026268959045410156, 0.002729177474975586, 0.0028314590454101562, 0.0029337406158447266, 0.003036022186279297, 0.003138303756713867, 0.0032405853271484375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 4.0, 9.0, 15.0, 15.0, 17.0, 18.0, 116.0, 419.0, 225.0, 46.0, 22.0, 9.0, 8.0, 5.0, 12.0, 10.0, 6.0, 3.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0193634033203125, -0.01875019073486328, -0.018136978149414062, -0.017523765563964844, -0.016910552978515625, -0.016297340393066406, -0.015684127807617188, -0.015070915222167969, -0.01445770263671875, -0.013844490051269531, -0.013231277465820312, -0.012618064880371094, -0.012004852294921875, -0.011391639709472656, -0.010778427124023438, -0.010165214538574219, -0.009552001953125, -0.008938789367675781, -0.008325576782226562, -0.007712364196777344, -0.007099151611328125, -0.006485939025878906, -0.0058727264404296875, -0.005259513854980469, -0.00464630126953125, -0.004033088684082031, -0.0034198760986328125, -0.0028066635131835938, -0.002193450927734375, -0.0015802383422851562, -0.0009670257568359375, -0.00035381317138671875, 0.0002593994140625, 0.0008726119995117188, 0.0014858245849609375, 0.0020990371704101562, 0.002712249755859375, 0.0033254623413085938, 0.0039386749267578125, 0.004551887512207031, 0.00516510009765625, 0.005778312683105469, 0.0063915252685546875, 0.007004737854003906, 0.007617950439453125, 0.008231163024902344, 0.008844375610351562, 0.009457588195800781, 0.01007080078125, 0.010684013366699219, 0.011297225952148438, 0.011910438537597656, 0.012523651123046875, 0.013136863708496094, 0.013750076293945312, 0.014363288879394531, 0.01497650146484375, 0.015589714050292969, 0.016202926635742188, 0.016816139221191406, 0.017429351806640625, 0.018042564392089844, 0.018655776977539062, 0.01926898956298828, 0.0198822021484375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 8.0, 7.0, 33.0, 60.0, 99.0, 157.0, 282.0, 420.0, 4192347.0, 349.0, 231.0, 107.0, 93.0, 51.0, 24.0, 5.0, 12.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003685951232910156, -0.0003584921360015869, -0.0003483891487121582, -0.0003382861614227295, -0.0003281831741333008, -0.00031808018684387207, -0.00030797719955444336, -0.00029787421226501465, -0.00028777122497558594, -0.0002776682376861572, -0.0002675652503967285, -0.0002574622631072998, -0.0002473592758178711, -0.00023725628852844238, -0.00022715330123901367, -0.00021705031394958496, -0.00020694732666015625, -0.00019684433937072754, -0.00018674135208129883, -0.00017663836479187012, -0.0001665353775024414, -0.0001564323902130127, -0.00014632940292358398, -0.00013622641563415527, -0.00012612342834472656, -0.00011602044105529785, -0.00010591745376586914, -9.581446647644043e-05, -8.571147918701172e-05, -7.560849189758301e-05, -6.55055046081543e-05, -5.5402517318725586e-05, -4.5299530029296875e-05, -3.5196542739868164e-05, -2.5093555450439453e-05, -1.4990568161010742e-05, -4.887580871582031e-06, 5.21540641784668e-06, 1.531839370727539e-05, 2.54213809967041e-05, 3.552436828613281e-05, 4.5627355575561523e-05, 5.5730342864990234e-05, 6.583333015441895e-05, 7.593631744384766e-05, 8.603930473327637e-05, 9.614229202270508e-05, 0.00010624527931213379, 0.0001163482666015625, 0.0001264512538909912, 0.00013655424118041992, 0.00014665722846984863, 0.00015676021575927734, 0.00016686320304870605, 0.00017696619033813477, 0.00018706917762756348, 0.0001971721649169922, 0.0002072751522064209, 0.0002173781394958496, 0.00022748112678527832, 0.00023758411407470703, 0.00024768710136413574, 0.00025779008865356445, 0.00026789307594299316, 0.0002779960632324219]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4088.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.834766387939453e-06, -7.948838174343109e-06, -6.062909960746765e-06, -4.176981747150421e-06, -2.291053533554077e-06, -4.0512531995773315e-07, 1.4808028936386108e-06, 3.366731107234955e-06, 5.252659320831299e-06, 7.138587534427643e-06, 9.024515748023987e-06, 1.091044396162033e-05, 1.2796372175216675e-05, 1.4682300388813019e-05, 1.6568228602409363e-05, 1.8454156816005707e-05, 2.034008502960205e-05, 2.2226013243198395e-05, 2.411194145679474e-05, 2.5997869670391083e-05, 2.7883797883987427e-05, 2.976972609758377e-05, 3.1655654311180115e-05, 3.354158252477646e-05, 3.54275107383728e-05, 3.731343895196915e-05, 3.919936716556549e-05, 4.1085295379161835e-05, 4.297122359275818e-05, 4.485715180635452e-05, 4.674308001995087e-05, 4.862900823354721e-05, 5.0514936447143555e-05, 5.24008646607399e-05, 5.428679287433624e-05, 5.617272108793259e-05, 5.805864930152893e-05, 5.9944577515125275e-05, 6.183050572872162e-05, 6.371643394231796e-05, 6.56023621559143e-05, 6.748829036951065e-05, 6.9374218583107e-05, 7.126014679670334e-05, 7.314607501029968e-05, 7.503200322389603e-05, 7.691793143749237e-05, 7.880385965108871e-05, 8.068978786468506e-05, 8.25757160782814e-05, 8.446164429187775e-05, 8.634757250547409e-05, 8.823350071907043e-05, 9.011942893266678e-05, 9.200535714626312e-05, 9.389128535985947e-05, 9.577721357345581e-05, 9.766314178705215e-05, 9.95490700006485e-05, 0.00010143499821424484, 0.00010332092642784119, 0.00010520685464143753, 0.00010709278285503387, 0.00010897871106863022, 0.00011086463928222656]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 30.0, 977.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00040220562368631363, -0.0003933222615160048, -0.00038443889934569597, -0.0003755555080715567, -0.00036667214590124786, -0.00035778878373093903, -0.0003489054215606302, -0.0003400220593903214, -0.0003311386681161821, -0.00032225530594587326, -0.00031337194377556443, -0.00030448855250142515, -0.0002956051903311163, -0.0002867218281608075, -0.00027783846599049866, -0.00026895510382018983, -0.000260071741649881, -0.0002511883794795722, -0.00024230500275734812, -0.0002334216405870393, -0.00022453826386481524, -0.0002156549016945064, -0.00020677153952419758, -0.00019788817735388875, -0.0001890048006316647, -0.00018012143846135587, -0.0001712380617391318, -0.00016235469956882298, -0.00015347133739851415, -0.0001445879606762901, -0.00013570459850598127, -0.0001268212217837572, -0.00011793785961344838, -0.00010905449016718194, -0.0001001711207209155, -9.128775855060667e-05, -8.240438910434023e-05, -7.352101965807378e-05, -6.463765748776495e-05, -5.575428804149851e-05, -4.687091859523207e-05, -3.798754914896563e-05, -2.910418334067799e-05, -2.0220815713400953e-05, -1.1337448086123914e-05, -2.454078639857471e-06, 6.4292871684301645e-06, 1.53126529767178e-05, 2.4196022422984242e-05, 3.3079391869250685e-05, 4.196275767753832e-05, 5.0846123485825956e-05, 5.97294929320924e-05, 6.861286237835884e-05, 7.749622454866767e-05, 8.637959399493411e-05, 9.526296344120055e-05, 0.000104146332887467, 0.00011302970233373344, 0.00012191306450404227, 0.0001307964266743511, 0.00013967980339657515, 0.00014856316556688398, 0.00015744654228910804, 0.00016632990445941687]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 13.0, 14.0, 59.0, 111.0, 134.0, 160.0, 175.0, 137.0, 95.0, 41.0, 25.0, 15.0, 8.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010627508163452148, -0.00010160170495510101, -9.692832827568054e-05, -9.225495159626007e-05, -8.75815749168396e-05, -8.290819823741913e-05, -7.823482155799866e-05, -7.356144487857819e-05, -6.888806819915771e-05, -6.421469151973724e-05, -5.954131484031677e-05, -5.48679381608963e-05, -5.019456148147583e-05, -4.552118480205536e-05, -4.084780812263489e-05, -3.6174431443214417e-05, -3.1501054763793945e-05, -2.6827678084373474e-05, -2.2154301404953003e-05, -1.7480924725532532e-05, -1.280754804611206e-05, -8.13417136669159e-06, -3.460794687271118e-06, 1.212581992149353e-06, 5.885958671569824e-06, 1.0559335350990295e-05, 1.5232712030410767e-05, 1.9906088709831238e-05, 2.457946538925171e-05, 2.925284206867218e-05, 3.392621874809265e-05, 3.859959542751312e-05, 4.3272972106933594e-05, 4.7946348786354065e-05, 5.2619725465774536e-05, 5.729310214519501e-05, 6.196647882461548e-05, 6.663985550403595e-05, 7.131323218345642e-05, 7.598660886287689e-05, 8.065998554229736e-05, 8.533336222171783e-05, 9.00067389011383e-05, 9.468011558055878e-05, 9.935349225997925e-05, 0.00010402686893939972, 0.00010870024561882019, 0.00011337362229824066, 0.00011804699897766113, 0.0001227203756570816, 0.00012739375233650208, 0.00013206712901592255, 0.00013674050569534302, 0.0001414138823747635, 0.00014608725905418396, 0.00015076063573360443, 0.0001554340124130249, 0.00016010738909244537, 0.00016478076577186584, 0.00016945414245128632, 0.0001741275191307068, 0.00017880089581012726, 0.00018347427248954773, 0.0001881476491689682, 0.00019282102584838867]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 0.0, 0.0, 4.0, 7.0, 3.0, 0.0, 2.0, 6.0, 7.0, 5.0, 15.0, 12.0, 24.0, 24.0, 27.0, 59.0, 56.0, 79.0, 94.0, 143.0, 186.0, 312.0, 474.0, 699.0, 1198.0, 2262.0, 4935.0, 14597.0, 613614.0, 384787.0, 14249.0, 4947.0, 2429.0, 1228.0, 651.0, 389.0, 297.0, 181.0, 134.0, 81.0, 66.0, 54.0, 56.0, 30.0, 40.0, 25.0, 14.0, 12.0, 8.0, 5.0, 11.0, 2.0, 5.0, 8.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.0285797119140625, -0.027686357498168945, -0.02679300308227539, -0.025899648666381836, -0.02500629425048828, -0.024112939834594727, -0.023219585418701172, -0.022326231002807617, -0.021432876586914062, -0.020539522171020508, -0.019646167755126953, -0.0187528133392334, -0.017859458923339844, -0.01696610450744629, -0.016072750091552734, -0.01517939567565918, -0.014286041259765625, -0.01339268684387207, -0.012499332427978516, -0.011605978012084961, -0.010712623596191406, -0.009819269180297852, -0.008925914764404297, -0.008032560348510742, -0.0071392059326171875, -0.006245851516723633, -0.005352497100830078, -0.0044591426849365234, -0.0035657882690429688, -0.002672433853149414, -0.0017790794372558594, -0.0008857250213623047, 7.62939453125e-06, 0.0009009838104248047, 0.0017943382263183594, 0.002687692642211914, 0.0035810470581054688, 0.0044744014739990234, 0.005367755889892578, 0.006261110305786133, 0.0071544647216796875, 0.008047819137573242, 0.008941173553466797, 0.009834527969360352, 0.010727882385253906, 0.011621236801147461, 0.012514591217041016, 0.01340794563293457, 0.014301300048828125, 0.01519465446472168, 0.016088008880615234, 0.01698136329650879, 0.017874717712402344, 0.0187680721282959, 0.019661426544189453, 0.020554780960083008, 0.021448135375976562, 0.022341489791870117, 0.023234844207763672, 0.024128198623657227, 0.02502155303955078, 0.025914907455444336, 0.02680826187133789, 0.027701616287231445, 0.028594970703125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 4.0, 9.0, 15.0, 15.0, 17.0, 18.0, 116.0, 419.0, 225.0, 46.0, 22.0, 9.0, 8.0, 5.0, 12.0, 10.0, 6.0, 3.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0193634033203125, -0.01875019073486328, -0.018136978149414062, -0.017523765563964844, -0.016910552978515625, -0.016297340393066406, -0.015684127807617188, -0.015070915222167969, -0.01445770263671875, -0.013844490051269531, -0.013231277465820312, -0.012618064880371094, -0.012004852294921875, -0.011391639709472656, -0.010778427124023438, -0.010165214538574219, -0.009552001953125, -0.008938789367675781, -0.008325576782226562, -0.007712364196777344, -0.007099151611328125, -0.006485939025878906, -0.0058727264404296875, -0.005259513854980469, -0.00464630126953125, -0.004033088684082031, -0.0034198760986328125, -0.0028066635131835938, -0.002193450927734375, -0.0015802383422851562, -0.0009670257568359375, -0.00035381317138671875, 0.0002593994140625, 0.0008726119995117188, 0.0014858245849609375, 0.0020990371704101562, 0.002712249755859375, 0.0033254623413085938, 0.0039386749267578125, 0.004551887512207031, 0.00516510009765625, 0.005778312683105469, 0.0063915252685546875, 0.007004737854003906, 0.007617950439453125, 0.008231163024902344, 0.008844375610351562, 0.009457588195800781, 0.01007080078125, 0.010684013366699219, 0.011297225952148438, 0.011910438537597656, 0.012523651123046875, 0.013136863708496094, 0.013750076293945312, 0.014363288879394531, 0.01497650146484375, 0.015589714050292969, 0.016202926635742188, 0.016816139221191406, 0.017429351806640625, 0.018042564392089844, 0.018655776977539062, 0.01926898956298828, 0.0198822021484375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 5.0, 8.0, 10.0, 7.0, 12.0, 13.0, 11.0, 16.0, 19.0, 20.0, 27.0, 38.0, 45.0, 57.0, 98.0, 189.0, 405.0, 837.0, 2175.0, 123505.0, 916249.0, 2768.0, 943.0, 413.0, 190.0, 123.0, 80.0, 52.0, 43.0, 28.0, 30.0, 32.0, 15.0, 17.0, 13.0, 12.0, 10.0, 4.0, 13.0, 2.0, 3.0, 6.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04583740234375, -0.04436302185058594, -0.042888641357421875, -0.04141426086425781, -0.03993988037109375, -0.03846549987792969, -0.036991119384765625, -0.03551673889160156, -0.0340423583984375, -0.03256797790527344, -0.031093597412109375, -0.029619216918945312, -0.02814483642578125, -0.026670455932617188, -0.025196075439453125, -0.023721694946289062, -0.022247314453125, -0.020772933959960938, -0.019298553466796875, -0.017824172973632812, -0.01634979248046875, -0.014875411987304688, -0.013401031494140625, -0.011926651000976562, -0.0104522705078125, -0.008977890014648438, -0.007503509521484375, -0.0060291290283203125, -0.00455474853515625, -0.0030803680419921875, -0.001605987548828125, -0.0001316070556640625, 0.0013427734375, 0.0028171539306640625, 0.004291534423828125, 0.0057659149169921875, 0.00724029541015625, 0.008714675903320312, 0.010189056396484375, 0.011663436889648438, 0.0131378173828125, 0.014612197875976562, 0.016086578369140625, 0.017560958862304688, 0.01903533935546875, 0.020509719848632812, 0.021984100341796875, 0.023458480834960938, 0.024932861328125, 0.026407241821289062, 0.027881622314453125, 0.029356002807617188, 0.03083038330078125, 0.03230476379394531, 0.033779144287109375, 0.03525352478027344, 0.0367279052734375, 0.03820228576660156, 0.039676666259765625, 0.04115104675292969, 0.04262542724609375, 0.04409980773925781, 0.045574188232421875, 0.04704856872558594, 0.04852294921875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 8.0, 4.0, 8.0, 7.0, 11.0, 10.0, 15.0, 11.0, 16.0, 17.0, 19.0, 28.0, 31.0, 34.0, 30.0, 27.0, 42.0, 36.0, 38.0, 44.0, 46.0, 47.0, 51.0, 40.0, 36.0, 24.0, 34.0, 38.0, 34.0, 34.0, 25.0, 27.0, 29.0, 18.0, 17.0, 12.0, 12.0, 10.0, 5.0, 10.0, 5.0, 3.0, 6.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036407470703125, -0.035237789154052734, -0.03406810760498047, -0.0328984260559082, -0.03172874450683594, -0.030559062957763672, -0.029389381408691406, -0.02821969985961914, -0.027050018310546875, -0.02588033676147461, -0.024710655212402344, -0.023540973663330078, -0.022371292114257812, -0.021201610565185547, -0.02003192901611328, -0.018862247467041016, -0.01769256591796875, -0.016522884368896484, -0.015353202819824219, -0.014183521270751953, -0.013013839721679688, -0.011844158172607422, -0.010674476623535156, -0.00950479507446289, -0.008335113525390625, -0.007165431976318359, -0.005995750427246094, -0.004826068878173828, -0.0036563873291015625, -0.002486705780029297, -0.0013170242309570312, -0.00014734268188476562, 0.0010223388671875, 0.0021920204162597656, 0.0033617019653320312, 0.004531383514404297, 0.0057010650634765625, 0.006870746612548828, 0.008040428161621094, 0.00921010971069336, 0.010379791259765625, 0.01154947280883789, 0.012719154357910156, 0.013888835906982422, 0.015058517456054688, 0.016228199005126953, 0.01739788055419922, 0.018567562103271484, 0.01973724365234375, 0.020906925201416016, 0.02207660675048828, 0.023246288299560547, 0.024415969848632812, 0.025585651397705078, 0.026755332946777344, 0.02792501449584961, 0.029094696044921875, 0.03026437759399414, 0.031434059143066406, 0.03260374069213867, 0.03377342224121094, 0.0349431037902832, 0.03611278533935547, 0.037282466888427734, 0.0384521484375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 6.0, 0.0, 9.0, 5.0, 10.0, 9.0, 12.0, 22.0, 24.0, 34.0, 61.0, 87.0, 124.0, 203.0, 345.0, 645.0, 1607.0, 3932.0, 11807.0, 59239.0, 828121.0, 115763.0, 17397.0, 5036.0, 1948.0, 926.0, 434.0, 265.0, 178.0, 93.0, 50.0, 48.0, 43.0, 29.0, 16.0, 10.0, 6.0, 5.0, 2.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0], "bins": [-1.5437602996826172e-05, -1.5016645193099976e-05, -1.459568738937378e-05, -1.4174729585647583e-05, -1.3753771781921387e-05, -1.333281397819519e-05, -1.2911856174468994e-05, -1.2490898370742798e-05, -1.2069940567016602e-05, -1.1648982763290405e-05, -1.1228024959564209e-05, -1.0807067155838013e-05, -1.0386109352111816e-05, -9.96515154838562e-06, -9.544193744659424e-06, -9.123235940933228e-06, -8.702278137207031e-06, -8.281320333480835e-06, -7.860362529754639e-06, -7.439404726028442e-06, -7.018446922302246e-06, -6.59748911857605e-06, -6.1765313148498535e-06, -5.755573511123657e-06, -5.334615707397461e-06, -4.913657903671265e-06, -4.492700099945068e-06, -4.071742296218872e-06, -3.6507844924926758e-06, -3.2298266887664795e-06, -2.808868885040283e-06, -2.387911081314087e-06, -1.9669532775878906e-06, -1.5459954738616943e-06, -1.125037670135498e-06, -7.040798664093018e-07, -2.8312206268310547e-07, 1.3783574104309082e-07, 5.587935447692871e-07, 9.797513484954834e-07, 1.4007091522216797e-06, 1.821666955947876e-06, 2.2426247596740723e-06, 2.6635825634002686e-06, 3.084540367126465e-06, 3.505498170852661e-06, 3.926455974578857e-06, 4.347413778305054e-06, 4.76837158203125e-06, 5.189329385757446e-06, 5.610287189483643e-06, 6.031244993209839e-06, 6.452202796936035e-06, 6.8731606006622314e-06, 7.294118404388428e-06, 7.715076208114624e-06, 8.13603401184082e-06, 8.556991815567017e-06, 8.977949619293213e-06, 9.39890742301941e-06, 9.819865226745605e-06, 1.0240823030471802e-05, 1.0661780834197998e-05, 1.1082738637924194e-05, 1.150369644165039e-05]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 8.0, 7.0, 10.0, 16.0, 17.0, 17.0, 16.0, 36.0, 38.0, 52.0, 75.0, 84.0, 82.0, 93.0, 65.0, 106.0, 74.0, 53.0, 36.0, 26.0, 24.0, 14.0, 6.0, 6.0, 11.0, 9.0, 6.0, 7.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.794929504394531e-06, -6.61797821521759e-06, -6.441026926040649e-06, -6.2640756368637085e-06, -6.087124347686768e-06, -5.910173058509827e-06, -5.733221769332886e-06, -5.556270480155945e-06, -5.379319190979004e-06, -5.202367901802063e-06, -5.025416612625122e-06, -4.848465323448181e-06, -4.67151403427124e-06, -4.494562745094299e-06, -4.317611455917358e-06, -4.1406601667404175e-06, -3.9637088775634766e-06, -3.7867575883865356e-06, -3.6098062992095947e-06, -3.432855010032654e-06, -3.255903720855713e-06, -3.078952431678772e-06, -2.902001142501831e-06, -2.72504985332489e-06, -2.5480985641479492e-06, -2.3711472749710083e-06, -2.1941959857940674e-06, -2.0172446966171265e-06, -1.8402934074401855e-06, -1.6633421182632446e-06, -1.4863908290863037e-06, -1.3094395399093628e-06, -1.1324882507324219e-06, -9.55536961555481e-07, -7.7858567237854e-07, -6.016343832015991e-07, -4.246830940246582e-07, -2.477318048477173e-07, -7.078051567077637e-08, 1.0617077350616455e-07, 2.8312206268310547e-07, 4.600733518600464e-07, 6.370246410369873e-07, 8.139759302139282e-07, 9.909272193908691e-07, 1.16787850856781e-06, 1.344829797744751e-06, 1.521781086921692e-06, 1.6987323760986328e-06, 1.8756836652755737e-06, 2.0526349544525146e-06, 2.2295862436294556e-06, 2.4065375328063965e-06, 2.5834888219833374e-06, 2.7604401111602783e-06, 2.9373914003372192e-06, 3.11434268951416e-06, 3.291293978691101e-06, 3.468245267868042e-06, 3.645196557044983e-06, 3.822147846221924e-06, 3.999099135398865e-06, 4.176050424575806e-06, 4.353001713752747e-06, 4.5299530029296875e-06]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 4.0, 2.0, 2.0, 7.0, 8.0, 9.0, 14.0, 25.0, 37.0, 51.0, 78.0, 180.0, 603.0, 3417.0, 1040397.0, 2800.0, 491.0, 168.0, 86.0, 54.0, 36.0, 30.0, 24.0, 15.0, 10.0, 6.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.994340896606445e-05, -8.766446262598038e-05, -8.53855162858963e-05, -8.310656994581223e-05, -8.082762360572815e-05, -7.854867726564407e-05, -7.626973092556e-05, -7.399078458547592e-05, -7.171183824539185e-05, -6.943289190530777e-05, -6.71539455652237e-05, -6.487499922513962e-05, -6.259605288505554e-05, -6.0317106544971466e-05, -5.803816020488739e-05, -5.5759213864803314e-05, -5.348026752471924e-05, -5.120132118463516e-05, -4.8922374844551086e-05, -4.664342850446701e-05, -4.4364482164382935e-05, -4.208553582429886e-05, -3.980658948421478e-05, -3.752764314413071e-05, -3.524869680404663e-05, -3.2969750463962555e-05, -3.069080412387848e-05, -2.8411857783794403e-05, -2.6132911443710327e-05, -2.385396510362625e-05, -2.1575018763542175e-05, -1.92960724234581e-05, -1.7017126083374023e-05, -1.4738179743289948e-05, -1.2459233403205872e-05, -1.0180287063121796e-05, -7.90134072303772e-06, -5.622394382953644e-06, -3.343448042869568e-06, -1.064501702785492e-06, 1.214444637298584e-06, 3.49339097738266e-06, 5.772337317466736e-06, 8.051283657550812e-06, 1.0330229997634888e-05, 1.2609176337718964e-05, 1.488812267780304e-05, 1.7167069017887115e-05, 1.944601535797119e-05, 2.1724961698055267e-05, 2.4003908038139343e-05, 2.628285437822342e-05, 2.8561800718307495e-05, 3.084074705839157e-05, 3.311969339847565e-05, 3.539863973855972e-05, 3.76775860786438e-05, 3.9956532418727875e-05, 4.223547875881195e-05, 4.4514425098896027e-05, 4.67933714389801e-05, 4.907231777906418e-05, 5.1351264119148254e-05, 5.363021045923233e-05, 5.5909156799316406e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 0.0, 7.0, 4.0, 14.0, 8.0, 23.0, 30.0, 36.0, 48.0, 50.0, 75.0, 85.0, 161.0, 116.0, 61.0, 68.0, 49.0, 51.0, 29.0, 30.0, 19.0, 17.0, 10.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.265806198120117e-05, -7.082521915435791e-05, -6.899237632751465e-05, -6.715953350067139e-05, -6.532669067382812e-05, -6.349384784698486e-05, -6.16610050201416e-05, -5.982816219329834e-05, -5.799531936645508e-05, -5.6162476539611816e-05, -5.4329633712768555e-05, -5.249679088592529e-05, -5.066394805908203e-05, -4.883110523223877e-05, -4.699826240539551e-05, -4.5165419578552246e-05, -4.3332576751708984e-05, -4.149973392486572e-05, -3.966689109802246e-05, -3.78340482711792e-05, -3.600120544433594e-05, -3.4168362617492676e-05, -3.2335519790649414e-05, -3.0502676963806152e-05, -2.866983413696289e-05, -2.683699131011963e-05, -2.5004148483276367e-05, -2.3171305656433105e-05, -2.1338462829589844e-05, -1.9505620002746582e-05, -1.767277717590332e-05, -1.583993434906006e-05, -1.4007091522216797e-05, -1.2174248695373535e-05, -1.0341405868530273e-05, -8.508563041687012e-06, -6.67572021484375e-06, -4.842877388000488e-06, -3.0100345611572266e-06, -1.1771917343139648e-06, 6.556510925292969e-07, 2.4884939193725586e-06, 4.32133674621582e-06, 6.154179573059082e-06, 7.987022399902344e-06, 9.819865226745605e-06, 1.1652708053588867e-05, 1.3485550880432129e-05, 1.531839370727539e-05, 1.7151236534118652e-05, 1.8984079360961914e-05, 2.0816922187805176e-05, 2.2649765014648438e-05, 2.44826078414917e-05, 2.631545066833496e-05, 2.8148293495178223e-05, 2.9981136322021484e-05, 3.1813979148864746e-05, 3.364682197570801e-05, 3.547966480255127e-05, 3.731250762939453e-05, 3.914535045623779e-05, 4.0978193283081055e-05, 4.2811036109924316e-05, 4.464387893676758e-05]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 731.0, 274.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13766838610172272, -0.12499868124723434, -0.11232897639274597, -0.0996592789888382, -0.08698957413434982, -0.07431986927986145, -0.061650171875953674, -0.0489804670214653, -0.03631076216697693, -0.023641059175133705, -0.010971356183290482, 0.0016983449459075928, 0.014368049800395966, 0.02703775465488434, 0.039707452058792114, 0.05237715691328049, 0.06504686176776886, 0.07771656662225723, 0.0903862714767456, 0.10305596888065338, 0.11572567373514175, 0.12839537858963013, 0.1410650759935379, 0.15373477339744568, 0.16640448570251465, 0.17907418310642242, 0.1917438954114914, 0.20441359281539917, 0.21708330512046814, 0.22975300252437592, 0.2424226999282837, 0.25509241223335266, 0.26776212453842163, 0.2804318368434906, 0.2931015193462372, 0.30577123165130615, 0.3184409439563751, 0.3311106562614441, 0.3437803387641907, 0.35645005106925964, 0.3691197633743286, 0.3817894756793976, 0.39445915818214417, 0.40712887048721313, 0.4197985827922821, 0.4324682950973511, 0.44513797760009766, 0.4578076899051666, 0.4704773724079132, 0.4831470847129822, 0.49581676721572876, 0.5084865093231201, 0.5211561918258667, 0.5338258743286133, 0.5464955568313599, 0.5591652989387512, 0.5718349814414978, 0.5845046639442444, 0.5971744060516357, 0.6098440885543823, 0.6225137710571289, 0.6351835131645203, 0.6478531956672668, 0.6605228781700134, 0.6731926202774048]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 5.0, 4.0, 3.0, 8.0, 11.0, 11.0, 10.0, 22.0, 17.0, 19.0, 31.0, 29.0, 37.0, 45.0, 36.0, 50.0, 44.0, 48.0, 52.0, 48.0, 57.0, 62.0, 44.0, 28.0, 48.0, 38.0, 22.0, 42.0, 18.0, 20.0, 25.0, 12.0, 10.0, 7.0, 11.0, 3.0, 7.0, 3.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2037792205810547, -0.1968652904033661, -0.1899513602256775, -0.1830374300479889, -0.1761235147714615, -0.1692095845937729, -0.1622956544160843, -0.1553817242383957, -0.1484678089618683, -0.1415538787841797, -0.1346399486064911, -0.1277260184288025, -0.12081210315227509, -0.11389817297458649, -0.10698424279689789, -0.10007031261920929, -0.09315638244152069, -0.08624245226383209, -0.07932852953672409, -0.07241459935903549, -0.06550067663192749, -0.05858674645423889, -0.05167281627655029, -0.04475888982415199, -0.03784496337175369, -0.030931036919355392, -0.024017108604311943, -0.017103180289268494, -0.010189253836870193, -0.0032753273844718933, 0.0036386027932167053, 0.010552529245615005, 0.017466455698013306, 0.024380382150411606, 0.031294308602809906, 0.038208238780498505, 0.045122165232896805, 0.052036091685295105, 0.058950021862983704, 0.0658639520406723, 0.0727778747677803, 0.0796918049454689, 0.0866057276725769, 0.0935196578502655, 0.1004335880279541, 0.1073475107550621, 0.1142614409327507, 0.1211753636598587, 0.1280892938375473, 0.1350032240152359, 0.1419171541929245, 0.1488310694694519, 0.1557449996471405, 0.1626589298248291, 0.1695728600025177, 0.1764867901802063, 0.1834007203578949, 0.1903146505355835, 0.1972285807132721, 0.2041425108909607, 0.2110564261674881, 0.2179703563451767, 0.2248842865228653, 0.2317982167005539, 0.2387121319770813]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 8.0, 0.0, 9.0, 11.0, 7.0, 7.0, 9.0, 11.0, 20.0, 90.0, 512.0, 4193382.0, 103.0, 23.0, 14.0, 18.0, 13.0, 6.0, 2.0, 3.0, 4.0, 4.0, 1.0, 1.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0006060600280761719, -0.0005877837538719177, -0.0005695074796676636, -0.0005512312054634094, -0.0005329549312591553, -0.0005146786570549011, -0.000496402382850647, -0.0004781261086463928, -0.00045984983444213867, -0.0004415735602378845, -0.00042329728603363037, -0.0004050210118293762, -0.00038674473762512207, -0.0003684684634208679, -0.00035019218921661377, -0.0003319159150123596, -0.00031363964080810547, -0.0002953633666038513, -0.00027708709239959717, -0.000258810818195343, -0.00024053454399108887, -0.00022225826978683472, -0.00020398199558258057, -0.00018570572137832642, -0.00016742944717407227, -0.00014915317296981812, -0.00013087689876556396, -0.00011260062456130981, -9.432435035705566e-05, -7.604807615280151e-05, -5.777180194854736e-05, -3.949552774429321e-05, -2.1219253540039062e-05, -2.942979335784912e-06, 1.5333294868469238e-05, 3.360956907272339e-05, 5.188584327697754e-05, 7.016211748123169e-05, 8.843839168548584e-05, 0.00010671466588973999, 0.00012499094009399414, 0.0001432672142982483, 0.00016154348850250244, 0.0001798197627067566, 0.00019809603691101074, 0.0002163723111152649, 0.00023464858531951904, 0.0002529248595237732, 0.00027120113372802734, 0.0002894774079322815, 0.00030775368213653564, 0.0003260299563407898, 0.00034430623054504395, 0.0003625825047492981, 0.00038085877895355225, 0.0003991350531578064, 0.00041741132736206055, 0.0004356876015663147, 0.00045396387577056885, 0.000472240149974823, 0.0004905164241790771, 0.0005087926983833313, 0.0005270689725875854, 0.0005453452467918396, 0.0005636215209960938]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 5.0, 3.0, 2.0, 4.0, 8.0, 15.0, 15.0, 17.0, 19.0, 116.0, 413.0, 231.0, 46.0, 23.0, 9.0, 7.0, 7.0, 11.0, 10.0, 5.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0193634033203125, -0.01875019073486328, -0.018136978149414062, -0.017523765563964844, -0.016910552978515625, -0.016297340393066406, -0.015684127807617188, -0.015070915222167969, -0.01445770263671875, -0.013844490051269531, -0.013231277465820312, -0.012618064880371094, -0.012004852294921875, -0.011391639709472656, -0.010778427124023438, -0.010165214538574219, -0.009552001953125, -0.008938789367675781, -0.008325576782226562, -0.007712364196777344, -0.007099151611328125, -0.006485939025878906, -0.0058727264404296875, -0.005259513854980469, -0.00464630126953125, -0.004033088684082031, -0.0034198760986328125, -0.0028066635131835938, -0.002193450927734375, -0.0015802383422851562, -0.0009670257568359375, -0.00035381317138671875, 0.0002593994140625, 0.0008726119995117188, 0.0014858245849609375, 0.0020990371704101562, 0.002712249755859375, 0.0033254623413085938, 0.0039386749267578125, 0.004551887512207031, 0.00516510009765625, 0.005778312683105469, 0.0063915252685546875, 0.007004737854003906, 0.007617950439453125, 0.008231163024902344, 0.008844375610351562, 0.009457588195800781, 0.01007080078125, 0.010684013366699219, 0.011297225952148438, 0.011910438537597656, 0.012523651123046875, 0.013136863708496094, 0.013750076293945312, 0.014363288879394531, 0.01497650146484375, 0.015589714050292969, 0.016202926635742188, 0.016816139221191406, 0.017429351806640625, 0.018042564392089844, 0.018655776977539062, 0.01926898956298828, 0.0198822021484375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 6.0, 12.0, 27.0, 43.0, 85.0, 138.0, 222.0, 305.0, 4191970.0, 788.0, 244.0, 190.0, 100.0, 67.0, 42.0, 18.0, 11.0, 10.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00016355514526367188, -0.00015944987535476685, -0.00015534460544586182, -0.0001512393355369568, -0.00014713406562805176, -0.00014302879571914673, -0.0001389235258102417, -0.00013481825590133667, -0.00013071298599243164, -0.0001266077160835266, -0.00012250244617462158, -0.00011839717626571655, -0.00011429190635681152, -0.0001101866364479065, -0.00010608136653900146, -0.00010197609663009644, -9.78708267211914e-05, -9.376555681228638e-05, -8.966028690338135e-05, -8.555501699447632e-05, -8.144974708557129e-05, -7.734447717666626e-05, -7.323920726776123e-05, -6.91339373588562e-05, -6.502866744995117e-05, -6.092339754104614e-05, -5.681812763214111e-05, -5.2712857723236084e-05, -4.8607587814331055e-05, -4.4502317905426025e-05, -4.0397047996520996e-05, -3.629177808761597e-05, -3.218650817871094e-05, -2.8081238269805908e-05, -2.397596836090088e-05, -1.987069845199585e-05, -1.576542854309082e-05, -1.1660158634185791e-05, -7.554888725280762e-06, -3.4496188163757324e-06, 6.556510925292969e-07, 4.760921001434326e-06, 8.866190910339355e-06, 1.2971460819244385e-05, 1.7076730728149414e-05, 2.1182000637054443e-05, 2.5287270545959473e-05, 2.9392540454864502e-05, 3.349781036376953e-05, 3.760308027267456e-05, 4.170835018157959e-05, 4.581362009048462e-05, 4.991888999938965e-05, 5.402415990829468e-05, 5.812942981719971e-05, 6.223469972610474e-05, 6.633996963500977e-05, 7.04452395439148e-05, 7.455050945281982e-05, 7.865577936172485e-05, 8.276104927062988e-05, 8.686631917953491e-05, 9.097158908843994e-05, 9.507685899734497e-05, 9.918212890625e-05]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4088.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.245208740234375e-06, -4.484318196773529e-06, -3.723427653312683e-06, -2.962537109851837e-06, -2.201646566390991e-06, -1.4407560229301453e-06, -6.798654794692993e-07, 8.102506399154663e-08, 8.419156074523926e-07, 1.6028061509132385e-06, 2.3636966943740845e-06, 3.1245872378349304e-06, 3.885477781295776e-06, 4.646368324756622e-06, 5.407258868217468e-06, 6.168149411678314e-06, 6.92903995513916e-06, 7.689930498600006e-06, 8.450821042060852e-06, 9.211711585521698e-06, 9.972602128982544e-06, 1.073349267244339e-05, 1.1494383215904236e-05, 1.2255273759365082e-05, 1.3016164302825928e-05, 1.3777054846286774e-05, 1.453794538974762e-05, 1.5298835933208466e-05, 1.605972647666931e-05, 1.6820617020130157e-05, 1.7581507563591003e-05, 1.834239810705185e-05, 1.9103288650512695e-05, 1.986417919397354e-05, 2.0625069737434387e-05, 2.1385960280895233e-05, 2.214685082435608e-05, 2.2907741367816925e-05, 2.366863191127777e-05, 2.4429522454738617e-05, 2.5190412998199463e-05, 2.595130354166031e-05, 2.6712194085121155e-05, 2.7473084628582e-05, 2.8233975172042847e-05, 2.8994865715503693e-05, 2.975575625896454e-05, 3.0516646802425385e-05, 3.127753734588623e-05, 3.2038427889347076e-05, 3.279931843280792e-05, 3.356020897626877e-05, 3.4321099519729614e-05, 3.508199006319046e-05, 3.5842880606651306e-05, 3.660377115011215e-05, 3.7364661693573e-05, 3.8125552237033844e-05, 3.888644278049469e-05, 3.9647333323955536e-05, 4.040822386741638e-05, 4.116911441087723e-05, 4.1930004954338074e-05, 4.269089549779892e-05, 4.3451786041259766e-05]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 28.0, 972.0, 9.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013577780919149518, -0.0001312948443228379, -0.00012681189400609583, -0.00012232892913743854, -0.00011784596426878124, -0.00011336300667608157, -0.00010888004908338189, -0.0001043970842147246, -9.991412662202492e-05, -9.543116902932525e-05, -9.094820416066796e-05, -8.646524656796828e-05, -8.19822889752686e-05, -7.749932410661131e-05, -7.301636651391163e-05, -6.853340892121196e-05, -6.405044405255467e-05, -5.956748282187618e-05, -5.50845215911977e-05, -5.060156399849802e-05, -4.611860276781954e-05, -4.1635641537141055e-05, -3.715268394444138e-05, -3.2669722713762894e-05, -2.818676148308441e-05, -2.3703800252405927e-05, -1.9220840840716846e-05, -1.4737880519533064e-05, -1.0254920198349282e-05, -5.771958967670798e-06, -1.288999555981718e-06, 3.1939598557073623e-06, 7.676921086385846e-06, 1.2159881407569628e-05, 1.664284172875341e-05, 2.112580114044249e-05, 2.5608762371120974e-05, 3.0091723601799458e-05, 3.4574681194499135e-05, 3.905764242517762e-05, 4.35406036558561e-05, 4.8023564886534587e-05, 5.250652611721307e-05, 5.698948370991275e-05, 6.147244130261242e-05, 6.595540617126971e-05, 7.043836376396939e-05, 7.492132135666907e-05, 7.940428622532636e-05, 8.388724381802604e-05, 8.837020868668333e-05, 9.2853166279383e-05, 9.73361311480403e-05, 0.00010181908874073997, 0.00010630204633343965, 0.00011078501120209694, 0.00011526796879479662, 0.00011975092638749629, 0.00012423389125615358, 0.00012871685612481087, 0.00013319980644155294, 0.00013768277131021023, 0.00014216573617886752, 0.00014664868649560958, 0.00015113165136426687]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 6.0, 14.0, 19.0, 62.0, 151.0, 134.0, 132.0, 149.0, 142.0, 126.0, 29.0, 17.0, 13.0, 5.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7610530853271484e-05, -3.56016680598259e-05, -3.359280526638031e-05, -3.158394247293472e-05, -2.9575079679489136e-05, -2.756621688604355e-05, -2.555735409259796e-05, -2.3548491299152374e-05, -2.1539628505706787e-05, -1.95307657122612e-05, -1.7521902918815613e-05, -1.5513040125370026e-05, -1.3504177331924438e-05, -1.1495314538478851e-05, -9.486451745033264e-06, -7.477588951587677e-06, -5.46872615814209e-06, -3.4598633646965027e-06, -1.4510005712509155e-06, 5.578622221946716e-07, 2.566725015640259e-06, 4.575587809085846e-06, 6.584450602531433e-06, 8.59331339597702e-06, 1.0602176189422607e-05, 1.2611038982868195e-05, 1.4619901776313782e-05, 1.662876456975937e-05, 1.8637627363204956e-05, 2.0646490156650543e-05, 2.265535295009613e-05, 2.4664215743541718e-05, 2.6673078536987305e-05, 2.8681941330432892e-05, 3.069080412387848e-05, 3.2699666917324066e-05, 3.470852971076965e-05, 3.671739250421524e-05, 3.872625529766083e-05, 4.0735118091106415e-05, 4.2743980884552e-05, 4.475284367799759e-05, 4.6761706471443176e-05, 4.8770569264888763e-05, 5.077943205833435e-05, 5.278829485177994e-05, 5.4797157645225525e-05, 5.680602043867111e-05, 5.88148832321167e-05, 6.0823746025562286e-05, 6.283260881900787e-05, 6.484147161245346e-05, 6.685033440589905e-05, 6.885919719934464e-05, 7.086805999279022e-05, 7.287692278623581e-05, 7.48857855796814e-05, 7.689464837312698e-05, 7.890351116657257e-05, 8.091237396001816e-05, 8.292123675346375e-05, 8.493009954690933e-05, 8.693896234035492e-05, 8.89478251338005e-05, 9.09566879272461e-05]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 3.0, 6.0, 9.0, 13.0, 16.0, 31.0, 39.0, 56.0, 146.0, 292.0, 810.0, 2787.0, 18170.0, 1005833.0, 16279.0, 2530.0, 833.0, 345.0, 151.0, 78.0, 41.0, 28.0, 9.0, 11.0, 4.0, 3.0, 1.0, 4.0, 5.0, 6.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0684814453125, -0.06637287139892578, -0.06426429748535156, -0.062155723571777344, -0.060047149658203125, -0.057938575744628906, -0.05583000183105469, -0.05372142791748047, -0.05161285400390625, -0.04950428009033203, -0.04739570617675781, -0.045287132263183594, -0.043178558349609375, -0.041069984436035156, -0.03896141052246094, -0.03685283660888672, -0.0347442626953125, -0.03263568878173828, -0.030527114868164062, -0.028418540954589844, -0.026309967041015625, -0.024201393127441406, -0.022092819213867188, -0.01998424530029297, -0.01787567138671875, -0.01576709747314453, -0.013658523559570312, -0.011549949645996094, -0.009441375732421875, -0.007332801818847656, -0.0052242279052734375, -0.0031156539916992188, -0.001007080078125, 0.0011014938354492188, 0.0032100677490234375, 0.005318641662597656, 0.007427215576171875, 0.009535789489746094, 0.011644363403320312, 0.013752937316894531, 0.01586151123046875, 0.01797008514404297, 0.020078659057617188, 0.022187232971191406, 0.024295806884765625, 0.026404380798339844, 0.028512954711914062, 0.03062152862548828, 0.0327301025390625, 0.03483867645263672, 0.03694725036621094, 0.039055824279785156, 0.041164398193359375, 0.043272972106933594, 0.04538154602050781, 0.04749011993408203, 0.04959869384765625, 0.05170726776123047, 0.05381584167480469, 0.055924415588378906, 0.058032989501953125, 0.060141563415527344, 0.06225013732910156, 0.06435871124267578, 0.06646728515625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 5.0, 3.0, 2.0, 4.0, 8.0, 15.0, 15.0, 17.0, 19.0, 116.0, 413.0, 231.0, 46.0, 23.0, 9.0, 7.0, 7.0, 11.0, 10.0, 5.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0193634033203125, -0.01875019073486328, -0.018136978149414062, -0.017523765563964844, -0.016910552978515625, -0.016297340393066406, -0.015684127807617188, -0.015070915222167969, -0.01445770263671875, -0.013844490051269531, -0.013231277465820312, -0.012618064880371094, -0.012004852294921875, -0.011391639709472656, -0.010778427124023438, -0.010165214538574219, -0.009552001953125, -0.008938789367675781, -0.008325576782226562, -0.007712364196777344, -0.007099151611328125, -0.006485939025878906, -0.0058727264404296875, -0.005259513854980469, -0.00464630126953125, -0.004033088684082031, -0.0034198760986328125, -0.0028066635131835938, -0.002193450927734375, -0.0015802383422851562, -0.0009670257568359375, -0.00035381317138671875, 0.0002593994140625, 0.0008726119995117188, 0.0014858245849609375, 0.0020990371704101562, 0.002712249755859375, 0.0033254623413085938, 0.0039386749267578125, 0.004551887512207031, 0.00516510009765625, 0.005778312683105469, 0.0063915252685546875, 0.007004737854003906, 0.007617950439453125, 0.008231163024902344, 0.008844375610351562, 0.009457588195800781, 0.01007080078125, 0.010684013366699219, 0.011297225952148438, 0.011910438537597656, 0.012523651123046875, 0.013136863708496094, 0.013750076293945312, 0.014363288879394531, 0.01497650146484375, 0.015589714050292969, 0.016202926635742188, 0.016816139221191406, 0.017429351806640625, 0.018042564392089844, 0.018655776977539062, 0.01926898956298828, 0.0198822021484375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 4.0, 6.0, 5.0, 4.0, 5.0, 7.0, 4.0, 11.0, 13.0, 14.0, 18.0, 30.0, 27.0, 25.0, 35.0, 59.0, 79.0, 136.0, 292.0, 632.0, 1699.0, 114936.0, 926830.0, 2095.0, 758.0, 307.0, 158.0, 84.0, 54.0, 38.0, 29.0, 24.0, 20.0, 23.0, 21.0, 20.0, 8.0, 8.0, 6.0, 8.0, 3.0, 5.0, 9.0, 4.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049468994140625, -0.0479273796081543, -0.046385765075683594, -0.04484415054321289, -0.04330253601074219, -0.041760921478271484, -0.04021930694580078, -0.03867769241333008, -0.037136077880859375, -0.03559446334838867, -0.03405284881591797, -0.032511234283447266, -0.030969619750976562, -0.02942800521850586, -0.027886390686035156, -0.026344776153564453, -0.02480316162109375, -0.023261547088623047, -0.021719932556152344, -0.02017831802368164, -0.018636703491210938, -0.017095088958740234, -0.015553474426269531, -0.014011859893798828, -0.012470245361328125, -0.010928630828857422, -0.009387016296386719, -0.007845401763916016, -0.0063037872314453125, -0.004762172698974609, -0.0032205581665039062, -0.0016789436340332031, -0.0001373291015625, 0.0014042854309082031, 0.0029458999633789062, 0.004487514495849609, 0.0060291290283203125, 0.007570743560791016, 0.009112358093261719, 0.010653972625732422, 0.012195587158203125, 0.013737201690673828, 0.015278816223144531, 0.016820430755615234, 0.018362045288085938, 0.01990365982055664, 0.021445274353027344, 0.022986888885498047, 0.02452850341796875, 0.026070117950439453, 0.027611732482910156, 0.02915334701538086, 0.030694961547851562, 0.032236576080322266, 0.03377819061279297, 0.03531980514526367, 0.036861419677734375, 0.03840303421020508, 0.03994464874267578, 0.041486263275146484, 0.04302787780761719, 0.04456949234008789, 0.046111106872558594, 0.0476527214050293, 0.0491943359375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 4.0, 6.0, 5.0, 4.0, 5.0, 6.0, 5.0, 11.0, 13.0, 14.0, 20.0, 26.0, 29.0, 24.0, 34.0, 37.0, 33.0, 34.0, 31.0, 65.0, 46.0, 48.0, 55.0, 43.0, 42.0, 38.0, 38.0, 37.0, 32.0, 30.0, 28.0, 23.0, 19.0, 24.0, 21.0, 21.0, 6.0, 9.0, 5.0, 9.0, 3.0, 5.0, 9.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0382080078125, -0.037016868591308594, -0.03582572937011719, -0.03463459014892578, -0.033443450927734375, -0.03225231170654297, -0.031061172485351562, -0.029870033264160156, -0.02867889404296875, -0.027487754821777344, -0.026296615600585938, -0.02510547637939453, -0.023914337158203125, -0.02272319793701172, -0.021532058715820312, -0.020340919494628906, -0.0191497802734375, -0.017958641052246094, -0.016767501831054688, -0.015576362609863281, -0.014385223388671875, -0.013194084167480469, -0.012002944946289062, -0.010811805725097656, -0.00962066650390625, -0.008429527282714844, -0.0072383880615234375, -0.006047248840332031, -0.004856109619140625, -0.0036649703979492188, -0.0024738311767578125, -0.0012826919555664062, -9.1552734375e-05, 0.0010995864868164062, 0.0022907257080078125, 0.0034818649291992188, 0.004673004150390625, 0.005864143371582031, 0.0070552825927734375, 0.008246421813964844, 0.00943756103515625, 0.010628700256347656, 0.011819839477539062, 0.013010978698730469, 0.014202117919921875, 0.015393257141113281, 0.016584396362304688, 0.017775535583496094, 0.0189666748046875, 0.020157814025878906, 0.021348953247070312, 0.02254009246826172, 0.023731231689453125, 0.02492237091064453, 0.026113510131835938, 0.027304649353027344, 0.02849578857421875, 0.029686927795410156, 0.030878067016601562, 0.03206920623779297, 0.033260345458984375, 0.03445148468017578, 0.03564262390136719, 0.036833763122558594, 0.03802490234375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 13.0, 13.0, 21.0, 38.0, 69.0, 102.0, 175.0, 441.0, 1280.0, 5927.0, 194587.0, 835830.0, 7460.0, 1557.0, 525.0, 201.0, 129.0, 65.0, 30.0, 36.0, 17.0, 12.0, 7.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.066394805908203e-05, -4.9297697842121124e-05, -4.793144762516022e-05, -4.656519740819931e-05, -4.51989471912384e-05, -4.3832696974277496e-05, -4.246644675731659e-05, -4.110019654035568e-05, -3.9733946323394775e-05, -3.836769610643387e-05, -3.700144588947296e-05, -3.5635195672512054e-05, -3.426894545555115e-05, -3.290269523859024e-05, -3.1536445021629333e-05, -3.0170194804668427e-05, -2.880394458770752e-05, -2.7437694370746613e-05, -2.6071444153785706e-05, -2.47051939368248e-05, -2.333894371986389e-05, -2.1972693502902985e-05, -2.0606443285942078e-05, -1.924019306898117e-05, -1.7873942852020264e-05, -1.6507692635059357e-05, -1.514144241809845e-05, -1.3775192201137543e-05, -1.2408941984176636e-05, -1.1042691767215729e-05, -9.676441550254822e-06, -8.310191333293915e-06, -6.943941116333008e-06, -5.577690899372101e-06, -4.211440682411194e-06, -2.845190465450287e-06, -1.4789402484893799e-06, -1.126900315284729e-07, 1.253560185432434e-06, 2.619810402393341e-06, 3.986060619354248e-06, 5.352310836315155e-06, 6.718561053276062e-06, 8.084811270236969e-06, 9.451061487197876e-06, 1.0817311704158783e-05, 1.218356192111969e-05, 1.3549812138080597e-05, 1.4916062355041504e-05, 1.628231257200241e-05, 1.7648562788963318e-05, 1.9014813005924225e-05, 2.0381063222885132e-05, 2.174731343984604e-05, 2.3113563656806946e-05, 2.4479813873767853e-05, 2.584606409072876e-05, 2.7212314307689667e-05, 2.8578564524650574e-05, 2.994481474161148e-05, 3.131106495857239e-05, 3.2677315175533295e-05, 3.40435653924942e-05, 3.540981560945511e-05, 3.6776065826416016e-05]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1.0, 0.0, 5.0, 3.0, 5.0, 12.0, 7.0, 15.0, 17.0, 20.0, 19.0, 32.0, 53.0, 33.0, 62.0, 41.0, 81.0, 64.0, 48.0, 81.0, 49.0, 59.0, 47.0, 44.0, 39.0, 19.0, 36.0, 30.0, 25.0, 20.0, 12.0, 11.0, 7.0, 2.0, 3.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.139278411865234e-06, -5.984678864479065e-06, -5.8300793170928955e-06, -5.675479769706726e-06, -5.520880222320557e-06, -5.366280674934387e-06, -5.211681127548218e-06, -5.057081580162048e-06, -4.902482032775879e-06, -4.7478824853897095e-06, -4.59328293800354e-06, -4.438683390617371e-06, -4.284083843231201e-06, -4.129484295845032e-06, -3.974884748458862e-06, -3.820285201072693e-06, -3.6656856536865234e-06, -3.511086106300354e-06, -3.3564865589141846e-06, -3.201887011528015e-06, -3.0472874641418457e-06, -2.8926879167556763e-06, -2.738088369369507e-06, -2.5834888219833374e-06, -2.428889274597168e-06, -2.2742897272109985e-06, -2.119690179824829e-06, -1.9650906324386597e-06, -1.8104910850524902e-06, -1.6558915376663208e-06, -1.5012919902801514e-06, -1.346692442893982e-06, -1.1920928955078125e-06, -1.037493348121643e-06, -8.828938007354736e-07, -7.282942533493042e-07, -5.736947059631348e-07, -4.1909515857696533e-07, -2.644956111907959e-07, -1.0989606380462646e-07, 4.470348358154297e-08, 1.993030309677124e-07, 3.5390257835388184e-07, 5.085021257400513e-07, 6.631016731262207e-07, 8.177012205123901e-07, 9.723007678985596e-07, 1.126900315284729e-06, 1.2814998626708984e-06, 1.4360994100570679e-06, 1.5906989574432373e-06, 1.7452985048294067e-06, 1.8998980522155762e-06, 2.0544975996017456e-06, 2.209097146987915e-06, 2.3636966943740845e-06, 2.518296241760254e-06, 2.6728957891464233e-06, 2.8274953365325928e-06, 2.982094883918762e-06, 3.1366944313049316e-06, 3.291293978691101e-06, 3.4458935260772705e-06, 3.60049307346344e-06, 3.7550926208496094e-06]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 8.0, 3.0, 10.0, 12.0, 13.0, 11.0, 26.0, 63.0, 131.0, 343.0, 1993.0, 1043547.0, 1793.0, 314.0, 140.0, 52.0, 22.0, 11.0, 14.0, 17.0, 4.0, 11.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012612342834472656, -0.00012292899191379547, -0.00011973455548286438, -0.00011654011905193329, -0.0001133456826210022, -0.0001101512461900711, -0.00010695680975914001, -0.00010376237332820892, -0.00010056793689727783, -9.737350046634674e-05, -9.417906403541565e-05, -9.098462760448456e-05, -8.779019117355347e-05, -8.459575474262238e-05, -8.140131831169128e-05, -7.820688188076019e-05, -7.50124454498291e-05, -7.181800901889801e-05, -6.862357258796692e-05, -6.542913615703583e-05, -6.223469972610474e-05, -5.9040263295173645e-05, -5.5845826864242554e-05, -5.265139043331146e-05, -4.945695400238037e-05, -4.626251757144928e-05, -4.306808114051819e-05, -3.98736447095871e-05, -3.6679208278656006e-05, -3.3484771847724915e-05, -3.0290335416793823e-05, -2.7095898985862732e-05, -2.390146255493164e-05, -2.070702612400055e-05, -1.7512589693069458e-05, -1.4318153262138367e-05, -1.1123716831207275e-05, -7.929280400276184e-06, -4.734843969345093e-06, -1.5404075384140015e-06, 1.6540288925170898e-06, 4.848465323448181e-06, 8.042901754379272e-06, 1.1237338185310364e-05, 1.4431774616241455e-05, 1.7626211047172546e-05, 2.0820647478103638e-05, 2.401508390903473e-05, 2.720952033996582e-05, 3.040395677089691e-05, 3.3598393201828e-05, 3.6792829632759094e-05, 3.9987266063690186e-05, 4.318170249462128e-05, 4.637613892555237e-05, 4.957057535648346e-05, 5.276501178741455e-05, 5.595944821834564e-05, 5.9153884649276733e-05, 6.234832108020782e-05, 6.554275751113892e-05, 6.873719394207001e-05, 7.19316303730011e-05, 7.512606680393219e-05, 7.832050323486328e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 8.0, 2.0, 10.0, 12.0, 10.0, 9.0, 16.0, 28.0, 54.0, 63.0, 124.0, 308.0, 127.0, 76.0, 48.0, 28.0, 16.0, 6.0, 11.0, 15.0, 5.0, 11.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.810924530029297e-05, -9.562913328409195e-05, -9.314902126789093e-05, -9.066890925168991e-05, -8.818879723548889e-05, -8.570868521928787e-05, -8.322857320308685e-05, -8.074846118688583e-05, -7.826834917068481e-05, -7.57882371544838e-05, -7.330812513828278e-05, -7.082801312208176e-05, -6.834790110588074e-05, -6.586778908967972e-05, -6.33876770734787e-05, -6.090756505727768e-05, -5.842745304107666e-05, -5.594734102487564e-05, -5.346722900867462e-05, -5.09871169924736e-05, -4.850700497627258e-05, -4.6026892960071564e-05, -4.3546780943870544e-05, -4.1066668927669525e-05, -3.8586556911468506e-05, -3.6106444895267487e-05, -3.362633287906647e-05, -3.114622086286545e-05, -2.866610884666443e-05, -2.618599683046341e-05, -2.370588481426239e-05, -2.122577279806137e-05, -1.874566078186035e-05, -1.6265548765659332e-05, -1.3785436749458313e-05, -1.1305324733257294e-05, -8.825212717056274e-06, -6.345100700855255e-06, -3.864988684654236e-06, -1.3848766684532166e-06, 1.0952353477478027e-06, 3.575347363948822e-06, 6.055459380149841e-06, 8.53557139635086e-06, 1.101568341255188e-05, 1.34957954287529e-05, 1.597590744495392e-05, 1.8456019461154938e-05, 2.0936131477355957e-05, 2.3416243493556976e-05, 2.5896355509757996e-05, 2.8376467525959015e-05, 3.0856579542160034e-05, 3.3336691558361053e-05, 3.581680357456207e-05, 3.829691559076309e-05, 4.077702760696411e-05, 4.325713962316513e-05, 4.573725163936615e-05, 4.821736365556717e-05, 5.069747567176819e-05, 5.317758768796921e-05, 5.565769970417023e-05, 5.8137811720371246e-05, 6.0617923736572266e-05]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 849.0, 155.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15546324849128723, -0.1422867476940155, -0.12911024689674377, -0.11593374609947205, -0.10275724530220032, -0.08958074450492859, -0.07640424370765686, -0.06322774291038513, -0.0500512421131134, -0.036874741315841675, -0.023698240518569946, -0.010521739721298218, 0.0026547610759735107, 0.01583126187324524, 0.029007762670516968, 0.042184263467788696, 0.055360764265060425, 0.06853726506233215, 0.08171376585960388, 0.09489026665687561, 0.10806676745414734, 0.12124326825141907, 0.1344197690486908, 0.14759626984596252, 0.16077277064323425, 0.17394927144050598, 0.1871257722377777, 0.20030227303504944, 0.21347877383232117, 0.2266552746295929, 0.23983177542686462, 0.25300827622413635, 0.26618480682373047, 0.2793613076210022, 0.2925378084182739, 0.30571430921554565, 0.3188908100128174, 0.3320673108100891, 0.34524381160736084, 0.35842031240463257, 0.3715968132019043, 0.384773313999176, 0.39794981479644775, 0.4111263155937195, 0.4243028163909912, 0.43747931718826294, 0.45065581798553467, 0.4638323187828064, 0.4770088195800781, 0.49018532037734985, 0.5033618211746216, 0.5165383219718933, 0.529714822769165, 0.5428913235664368, 0.5560678243637085, 0.5692443251609802, 0.582420825958252, 0.5955973267555237, 0.6087738275527954, 0.6219503283500671, 0.6351268291473389, 0.6483033299446106, 0.6614798307418823, 0.674656331539154, 0.6878328323364258]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 14.0, 15.0, 12.0, 18.0, 20.0, 32.0, 34.0, 37.0, 49.0, 56.0, 55.0, 68.0, 76.0, 64.0, 69.0, 64.0, 61.0, 38.0, 37.0, 40.0, 37.0, 17.0, 17.0, 17.0, 20.0, 13.0, 2.0, 2.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24812549352645874, -0.2404186725616455, -0.23271186649799347, -0.22500504553318024, -0.2172982394695282, -0.20959141850471497, -0.20188459753990173, -0.1941777765750885, -0.18647097051143646, -0.17876414954662323, -0.1710573434829712, -0.16335052251815796, -0.15564370155334473, -0.1479368954896927, -0.14023007452487946, -0.13252326846122742, -0.12481644749641418, -0.11710963398218155, -0.10940282046794891, -0.10169599950313568, -0.09398918598890305, -0.08628237247467041, -0.07857555150985718, -0.07086873799562454, -0.0631619244813919, -0.05545511096715927, -0.04774829372763634, -0.0400414764881134, -0.03233466297388077, -0.024627849459648132, -0.0169210322201252, -0.009214214980602264, -0.001507401466369629, 0.006199413910508156, 0.01390622928738594, 0.021613044664263725, 0.02931986004114151, 0.037026673555374146, 0.04473349079489708, 0.05244030803442001, 0.06014712154865265, 0.06785393506288528, 0.07556074857711792, 0.08326756954193115, 0.09097438305616379, 0.09868119657039642, 0.10638801753520966, 0.11409483104944229, 0.12180164456367493, 0.12950846552848816, 0.1372152715921402, 0.14492209255695343, 0.15262889862060547, 0.1603357195854187, 0.16804254055023193, 0.17574936151504517, 0.1834561675786972, 0.19116298854351044, 0.19886979460716248, 0.2065766155719757, 0.21428343653678894, 0.22199024260044098, 0.2296970635652542, 0.23740386962890625, 0.24511069059371948]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 4.0, 5.0, 11.0, 9.0, 12.0, 14.0, 15.0, 25.0, 41.0, 31.0, 29.0, 53.0, 104.0, 214.0, 964.0, 4191612.0, 619.0, 121.0, 98.0, 69.0, 53.0, 31.0, 22.0, 10.0, 10.0, 15.0, 3.0, 10.0, 10.0, 11.0, 12.0, 12.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0], "bins": [-0.0033283233642578125, -0.003225773572921753, -0.0031232237815856934, -0.003020673990249634, -0.0029181241989135742, -0.0028155744075775146, -0.002713024616241455, -0.0026104748249053955, -0.002507925033569336, -0.0024053752422332764, -0.002302825450897217, -0.0022002756595611572, -0.0020977258682250977, -0.001995176076889038, -0.0018926262855529785, -0.001790076494216919, -0.0016875267028808594, -0.0015849769115447998, -0.0014824271202087402, -0.0013798773288726807, -0.001277327537536621, -0.0011747777462005615, -0.001072227954864502, -0.0009696781635284424, -0.0008671283721923828, -0.0007645785808563232, -0.0006620287895202637, -0.0005594789981842041, -0.00045692920684814453, -0.00035437941551208496, -0.0002518296241760254, -0.00014927983283996582, -4.673004150390625e-05, 5.581974983215332e-05, 0.0001583695411682129, 0.00026091933250427246, 0.00036346912384033203, 0.0004660189151763916, 0.0005685687065124512, 0.0006711184978485107, 0.0007736682891845703, 0.0008762180805206299, 0.0009787678718566895, 0.001081317663192749, 0.0011838674545288086, 0.0012864172458648682, 0.0013889670372009277, 0.0014915168285369873, 0.0015940666198730469, 0.0016966164112091064, 0.001799166202545166, 0.0019017159938812256, 0.002004265785217285, 0.0021068155765533447, 0.0022093653678894043, 0.002311915159225464, 0.0024144649505615234, 0.002517014741897583, 0.0026195645332336426, 0.002722114324569702, 0.0028246641159057617, 0.0029272139072418213, 0.003029763698577881, 0.0031323134899139404, 0.00323486328125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 5.0, 3.0, 2.0, 4.0, 8.0, 15.0, 15.0, 19.0, 21.0, 114.0, 413.0, 229.0, 46.0, 22.0, 9.0, 9.0, 5.0, 12.0, 10.0, 5.0, 5.0, 5.0, 2.0, 2.0, 4.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0193634033203125, -0.01875019073486328, -0.018136978149414062, -0.017523765563964844, -0.016910552978515625, -0.016297340393066406, -0.015684127807617188, -0.015070915222167969, -0.01445770263671875, -0.013844490051269531, -0.013231277465820312, -0.012618064880371094, -0.012004852294921875, -0.011391639709472656, -0.010778427124023438, -0.010165214538574219, -0.009552001953125, -0.008938789367675781, -0.008325576782226562, -0.007712364196777344, -0.007099151611328125, -0.006485939025878906, -0.0058727264404296875, -0.005259513854980469, -0.00464630126953125, -0.004033088684082031, -0.0034198760986328125, -0.0028066635131835938, -0.002193450927734375, -0.0015802383422851562, -0.0009670257568359375, -0.00035381317138671875, 0.0002593994140625, 0.0008726119995117188, 0.0014858245849609375, 0.0020990371704101562, 0.002712249755859375, 0.0033254623413085938, 0.0039386749267578125, 0.004551887512207031, 0.00516510009765625, 0.005778312683105469, 0.0063915252685546875, 0.007004737854003906, 0.007617950439453125, 0.008231163024902344, 0.008844375610351562, 0.009457588195800781, 0.01007080078125, 0.010684013366699219, 0.011297225952148438, 0.011910438537597656, 0.012523651123046875, 0.013136863708496094, 0.013750076293945312, 0.014363288879394531, 0.01497650146484375, 0.015589714050292969, 0.016202926635742188, 0.016816139221191406, 0.017429351806640625, 0.018042564392089844, 0.018655776977539062, 0.01926898956298828, 0.0198822021484375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 9.0, 45.0, 96.0, 221.0, 552.0, 1247.0, 3936.0, 4182354.0, 3698.0, 1182.0, 552.0, 226.0, 102.0, 52.0, 8.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0008339881896972656, -0.0008074939250946045, -0.0007809996604919434, -0.0007545053958892822, -0.0007280111312866211, -0.00070151686668396, -0.0006750226020812988, -0.0006485283374786377, -0.0006220340728759766, -0.0005955398082733154, -0.0005690455436706543, -0.0005425512790679932, -0.000516057014465332, -0.0004895627498626709, -0.00046306848526000977, -0.00043657422065734863, -0.0004100799560546875, -0.00038358569145202637, -0.00035709142684936523, -0.0003305971622467041, -0.00030410289764404297, -0.00027760863304138184, -0.0002511143684387207, -0.00022462010383605957, -0.00019812583923339844, -0.0001716315746307373, -0.00014513731002807617, -0.00011864304542541504, -9.21487808227539e-05, -6.565451622009277e-05, -3.916025161743164e-05, -1.2665987014770508e-05, 1.3828277587890625e-05, 4.032254219055176e-05, 6.681680679321289e-05, 9.331107139587402e-05, 0.00011980533599853516, 0.0001462996006011963, 0.00017279386520385742, 0.00019928812980651855, 0.0002257823944091797, 0.0002522766590118408, 0.00027877092361450195, 0.0003052651882171631, 0.0003317594528198242, 0.00035825371742248535, 0.0003847479820251465, 0.0004112422466278076, 0.00043773651123046875, 0.0004642307758331299, 0.000490725040435791, 0.0005172193050384521, 0.0005437135696411133, 0.0005702078342437744, 0.0005967020988464355, 0.0006231963634490967, 0.0006496906280517578, 0.0006761848926544189, 0.0007026791572570801, 0.0007291734218597412, 0.0007556676864624023, 0.0007821619510650635, 0.0008086562156677246, 0.0008351504802703857, 0.0008616447448730469]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4031.0, 34.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00035858154296875, -0.00034769997000694275, -0.0003368183970451355, -0.00032593682408332825, -0.000315055251121521, -0.00030417367815971375, -0.0002932921051979065, -0.00028241053223609924, -0.000271528959274292, -0.00026064738631248474, -0.0002497658133506775, -0.00023888424038887024, -0.000228002667427063, -0.00021712109446525574, -0.00020623952150344849, -0.00019535794854164124, -0.00018447637557983398, -0.00017359480261802673, -0.00016271322965621948, -0.00015183165669441223, -0.00014095008373260498, -0.00013006851077079773, -0.00011918693780899048, -0.00010830536484718323, -9.742379188537598e-05, -8.654221892356873e-05, -7.566064596176147e-05, -6.477907299995422e-05, -5.389750003814697e-05, -4.301592707633972e-05, -3.213435411453247e-05, -2.125278115272522e-05, -1.0371208190917969e-05, 5.103647708892822e-07, 1.1391937732696533e-05, 2.2273510694503784e-05, 3.3155083656311035e-05, 4.4036656618118286e-05, 5.491822957992554e-05, 6.579980254173279e-05, 7.668137550354004e-05, 8.756294846534729e-05, 9.844452142715454e-05, 0.00010932609438896179, 0.00012020766735076904, 0.0001310892403125763, 0.00014197081327438354, 0.0001528523862361908, 0.00016373395919799805, 0.0001746155321598053, 0.00018549710512161255, 0.0001963786780834198, 0.00020726025104522705, 0.0002181418240070343, 0.00022902339696884155, 0.0002399049699306488, 0.00025078654289245605, 0.0002616681158542633, 0.00027254968881607056, 0.0002834312617778778, 0.00029431283473968506, 0.0003051944077014923, 0.00031607598066329956, 0.0003269575536251068, 0.00033783912658691406]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 15.0, 703.0, 280.0, 12.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005295274313539267, -0.0004999681259505451, -0.0004704088205471635, -0.0004408495151437819, -0.0004112902097404003, -0.00038173090433701873, -0.0003521716280374676, -0.000322612322634086, -0.0002930530172307044, -0.00026349371182732284, -0.00023393440642394125, -0.0002043751155724749, -0.0001748158101690933, -0.00014525650476571172, -0.00011569721391424537, -8.613790851086378e-05, -5.6578603107482195e-05, -2.7019301342079416e-05, 2.540000423323363e-06, 3.2099298550747335e-05, 6.165860395412892e-05, 9.121790935751051e-05, 0.00012077720020897686, 0.00015033650561235845, 0.00017989581101574004, 0.00020945511641912162, 0.0002390144218225032, 0.00026857369812205434, 0.0002981330035254359, 0.0003276923089288175, 0.0003572516143321991, 0.0003868109197355807, 0.00041637022513896227, 0.00044592953054234385, 0.00047548883594572544, 0.000505048141349107, 0.0005346074467524886, 0.0005641667521558702, 0.0005937260575592518, 0.0006232853047549725, 0.000652844668366015, 0.0006824039737693965, 0.0007119632791727781, 0.0007415225845761597, 0.0007710818899795413, 0.0008006411953829229, 0.0008302005007863045, 0.0008597597479820251, 0.0008893190533854067, 0.0009188783587887883, 0.0009484376641921699, 0.0009779969695955515, 0.0010075562167912722, 0.0010371155804023147, 0.0010666748275980353, 0.0010962341912090778, 0.0011257934384047985, 0.0011553526856005192, 0.0011849120492115617, 0.0012144712964072824, 0.0012440306600183249, 0.0012735899072140455, 0.001303149270825088, 0.0013327085180208087, 0.0013622678816318512]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 5.0, 10.0, 26.0, 25.0, 25.0, 40.0, 51.0, 85.0, 93.0, 119.0, 114.0, 93.0, 77.0, 74.0, 53.0, 39.0, 28.0, 19.0, 8.0, 8.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000954747200012207, -0.0009284215047955513, -0.0009020958095788956, -0.0008757701143622398, -0.0008494444191455841, -0.0008231187239289284, -0.0007967930287122726, -0.0007704673334956169, -0.0007441416382789612, -0.0007178159430623055, -0.0006914902478456497, -0.000665164552628994, -0.0006388388574123383, -0.0006125131621956825, -0.0005861874669790268, -0.0005598617717623711, -0.0005335360765457153, -0.0005072103813290596, -0.00048088468611240387, -0.00045455899089574814, -0.0004282332956790924, -0.0004019076004624367, -0.00037558190524578094, -0.0003492562100291252, -0.0003229305148124695, -0.00029660481959581375, -0.000270279124379158, -0.0002439534291625023, -0.00021762773394584656, -0.00019130203872919083, -0.0001649763435125351, -0.00013865064829587936, -0.00011232495307922363, -8.59992578625679e-05, -5.967356264591217e-05, -3.334786742925644e-05, -7.022172212600708e-06, 1.9303523004055023e-05, 4.5629218220710754e-05, 7.195491343736649e-05, 9.828060865402222e-05, 0.00012460630387067795, 0.00015093199908733368, 0.0001772576943039894, 0.00020358338952064514, 0.00022990908473730087, 0.0002562347799539566, 0.00028256047517061234, 0.00030888617038726807, 0.0003352118656039238, 0.00036153756082057953, 0.00038786325603723526, 0.000414188951253891, 0.0004405146464705467, 0.00046684034168720245, 0.0004931660369038582, 0.0005194917321205139, 0.0005458174273371696, 0.0005721431225538254, 0.0005984688177704811, 0.0006247945129871368, 0.0006511202082037926, 0.0006774459034204483, 0.000703771598637104, 0.0007300972938537598]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 4.0, 7.0, 10.0, 5.0, 15.0, 11.0, 16.0, 17.0, 43.0, 44.0, 78.0, 128.0, 232.0, 546.0, 1262.0, 3896.0, 18872.0, 991451.0, 24983.0, 4271.0, 1389.0, 539.0, 271.0, 163.0, 92.0, 58.0, 53.0, 27.0, 15.0, 13.0, 8.0, 14.0, 1.0, 5.0, 10.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053009033203125, -0.05132913589477539, -0.04964923858642578, -0.04796934127807617, -0.04628944396972656, -0.04460954666137695, -0.042929649353027344, -0.041249752044677734, -0.039569854736328125, -0.037889957427978516, -0.036210060119628906, -0.0345301628112793, -0.03285026550292969, -0.031170368194580078, -0.02949047088623047, -0.02781057357788086, -0.02613067626953125, -0.02445077896118164, -0.02277088165283203, -0.021090984344482422, -0.019411087036132812, -0.017731189727783203, -0.016051292419433594, -0.014371395111083984, -0.012691497802734375, -0.011011600494384766, -0.009331703186035156, -0.007651805877685547, -0.0059719085693359375, -0.004292011260986328, -0.0026121139526367188, -0.0009322166442871094, 0.0007476806640625, 0.0024275779724121094, 0.004107475280761719, 0.005787372589111328, 0.0074672698974609375, 0.009147167205810547, 0.010827064514160156, 0.012506961822509766, 0.014186859130859375, 0.015866756439208984, 0.017546653747558594, 0.019226551055908203, 0.020906448364257812, 0.022586345672607422, 0.02426624298095703, 0.02594614028930664, 0.02762603759765625, 0.02930593490600586, 0.03098583221435547, 0.03266572952270508, 0.03434562683105469, 0.0360255241394043, 0.037705421447753906, 0.039385318756103516, 0.041065216064453125, 0.042745113372802734, 0.044425010681152344, 0.04610490798950195, 0.04778480529785156, 0.04946470260620117, 0.05114459991455078, 0.05282449722290039, 0.05450439453125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 5.0, 3.0, 2.0, 4.0, 8.0, 15.0, 15.0, 19.0, 21.0, 114.0, 413.0, 229.0, 46.0, 22.0, 9.0, 9.0, 5.0, 12.0, 10.0, 5.0, 5.0, 5.0, 2.0, 2.0, 4.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0193634033203125, -0.01875019073486328, -0.018136978149414062, -0.017523765563964844, -0.016910552978515625, -0.016297340393066406, -0.015684127807617188, -0.015070915222167969, -0.01445770263671875, -0.013844490051269531, -0.013231277465820312, -0.012618064880371094, -0.012004852294921875, -0.011391639709472656, -0.010778427124023438, -0.010165214538574219, -0.009552001953125, -0.008938789367675781, -0.008325576782226562, -0.007712364196777344, -0.007099151611328125, -0.006485939025878906, -0.0058727264404296875, -0.005259513854980469, -0.00464630126953125, -0.004033088684082031, -0.0034198760986328125, -0.0028066635131835938, -0.002193450927734375, -0.0015802383422851562, -0.0009670257568359375, -0.00035381317138671875, 0.0002593994140625, 0.0008726119995117188, 0.0014858245849609375, 0.0020990371704101562, 0.002712249755859375, 0.0033254623413085938, 0.0039386749267578125, 0.004551887512207031, 0.00516510009765625, 0.005778312683105469, 0.0063915252685546875, 0.007004737854003906, 0.007617950439453125, 0.008231163024902344, 0.008844375610351562, 0.009457588195800781, 0.01007080078125, 0.010684013366699219, 0.011297225952148438, 0.011910438537597656, 0.012523651123046875, 0.013136863708496094, 0.013750076293945312, 0.014363288879394531, 0.01497650146484375, 0.015589714050292969, 0.016202926635742188, 0.016816139221191406, 0.017429351806640625, 0.018042564392089844, 0.018655776977539062, 0.01926898956298828, 0.0198822021484375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 8.0, 6.0, 5.0, 5.0, 12.0, 10.0, 24.0, 12.0, 10.0, 17.0, 21.0, 27.0, 37.0, 27.0, 29.0, 59.0, 104.0, 187.0, 357.0, 823.0, 3203.0, 998589.0, 42075.0, 1538.0, 579.0, 280.0, 140.0, 68.0, 42.0, 35.0, 27.0, 20.0, 34.0, 23.0, 17.0, 17.0, 13.0, 20.0, 12.0, 10.0, 5.0, 4.0, 5.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.053497314453125, -0.051914215087890625, -0.05033111572265625, -0.048748016357421875, -0.0471649169921875, -0.045581817626953125, -0.04399871826171875, -0.042415618896484375, -0.04083251953125, -0.039249420166015625, -0.03766632080078125, -0.036083221435546875, -0.0345001220703125, -0.032917022705078125, -0.03133392333984375, -0.029750823974609375, -0.028167724609375, -0.026584625244140625, -0.02500152587890625, -0.023418426513671875, -0.0218353271484375, -0.020252227783203125, -0.01866912841796875, -0.017086029052734375, -0.0155029296875, -0.013919830322265625, -0.01233673095703125, -0.010753631591796875, -0.0091705322265625, -0.007587432861328125, -0.00600433349609375, -0.004421234130859375, -0.002838134765625, -0.001255035400390625, 0.00032806396484375, 0.001911163330078125, 0.0034942626953125, 0.005077362060546875, 0.00666046142578125, 0.008243560791015625, 0.00982666015625, 0.011409759521484375, 0.01299285888671875, 0.014575958251953125, 0.0161590576171875, 0.017742156982421875, 0.01932525634765625, 0.020908355712890625, 0.022491455078125, 0.024074554443359375, 0.02565765380859375, 0.027240753173828125, 0.0288238525390625, 0.030406951904296875, 0.03199005126953125, 0.033573150634765625, 0.03515625, 0.036739349365234375, 0.03832244873046875, 0.039905548095703125, 0.0414886474609375, 0.043071746826171875, 0.04465484619140625, 0.046237945556640625, 0.047821044921875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 8.0, 6.0, 5.0, 5.0, 13.0, 10.0, 22.0, 14.0, 9.0, 17.0, 21.0, 28.0, 38.0, 24.0, 23.0, 33.0, 41.0, 30.0, 31.0, 41.0, 40.0, 39.0, 35.0, 38.0, 41.0, 35.0, 46.0, 24.0, 30.0, 29.0, 29.0, 19.0, 35.0, 22.0, 16.0, 19.0, 11.0, 21.0, 12.0, 9.0, 6.0, 4.0, 5.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.03387451171875, -0.03287172317504883, -0.031868934631347656, -0.030866146087646484, -0.029863357543945312, -0.02886056900024414, -0.02785778045654297, -0.026854991912841797, -0.025852203369140625, -0.024849414825439453, -0.02384662628173828, -0.02284383773803711, -0.021841049194335938, -0.020838260650634766, -0.019835472106933594, -0.018832683563232422, -0.01782989501953125, -0.016827106475830078, -0.015824317932128906, -0.014821529388427734, -0.013818740844726562, -0.01281595230102539, -0.011813163757324219, -0.010810375213623047, -0.009807586669921875, -0.008804798126220703, -0.007802009582519531, -0.006799221038818359, -0.0057964324951171875, -0.004793643951416016, -0.0037908554077148438, -0.002788066864013672, -0.0017852783203125, -0.0007824897766113281, 0.00022029876708984375, 0.0012230873107910156, 0.0022258758544921875, 0.0032286643981933594, 0.004231452941894531, 0.005234241485595703, 0.006237030029296875, 0.007239818572998047, 0.008242607116699219, 0.00924539566040039, 0.010248184204101562, 0.011250972747802734, 0.012253761291503906, 0.013256549835205078, 0.01425933837890625, 0.015262126922607422, 0.016264915466308594, 0.017267704010009766, 0.018270492553710938, 0.01927328109741211, 0.02027606964111328, 0.021278858184814453, 0.022281646728515625, 0.023284435272216797, 0.02428722381591797, 0.02529001235961914, 0.026292800903320312, 0.027295589447021484, 0.028298377990722656, 0.029301166534423828, 0.030303955078125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 7.0, 8.0, 9.0, 13.0, 12.0, 16.0, 37.0, 37.0, 59.0, 87.0, 122.0, 203.0, 342.0, 609.0, 1686.0, 4201.0, 17952.0, 911409.0, 96681.0, 9688.0, 2832.0, 1227.0, 510.0, 257.0, 176.0, 126.0, 75.0, 39.0, 24.0, 32.0, 19.0, 21.0, 11.0, 3.0, 4.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0], "bins": [-2.2709369659423828e-05, -2.2037886083126068e-05, -2.1366402506828308e-05, -2.0694918930530548e-05, -2.0023435354232788e-05, -1.9351951777935028e-05, -1.8680468201637268e-05, -1.8008984625339508e-05, -1.7337501049041748e-05, -1.6666017472743988e-05, -1.5994533896446228e-05, -1.5323050320148468e-05, -1.4651566743850708e-05, -1.3980083167552948e-05, -1.3308599591255188e-05, -1.2637116014957428e-05, -1.1965632438659668e-05, -1.1294148862361908e-05, -1.0622665286064148e-05, -9.951181709766388e-06, -9.279698133468628e-06, -8.608214557170868e-06, -7.936730980873108e-06, -7.265247404575348e-06, -6.593763828277588e-06, -5.922280251979828e-06, -5.250796675682068e-06, -4.579313099384308e-06, -3.907829523086548e-06, -3.236345946788788e-06, -2.564862370491028e-06, -1.8933787941932678e-06, -1.2218952178955078e-06, -5.504116415977478e-07, 1.210719347000122e-07, 7.925555109977722e-07, 1.4640390872955322e-06, 2.1355226635932922e-06, 2.8070062398910522e-06, 3.4784898161888123e-06, 4.149973392486572e-06, 4.821456968784332e-06, 5.492940545082092e-06, 6.164424121379852e-06, 6.835907697677612e-06, 7.507391273975372e-06, 8.178874850273132e-06, 8.850358426570892e-06, 9.521842002868652e-06, 1.0193325579166412e-05, 1.0864809155464172e-05, 1.1536292731761932e-05, 1.2207776308059692e-05, 1.2879259884357452e-05, 1.3550743460655212e-05, 1.4222227036952972e-05, 1.4893710613250732e-05, 1.5565194189548492e-05, 1.6236677765846252e-05, 1.6908161342144012e-05, 1.7579644918441772e-05, 1.8251128494739532e-05, 1.8922612071037292e-05, 1.9594095647335052e-05, 2.0265579223632812e-05]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 2.0, 9.0, 10.0, 6.0, 10.0, 18.0, 15.0, 19.0, 15.0, 28.0, 44.0, 37.0, 40.0, 54.0, 48.0, 50.0, 49.0, 105.0, 60.0, 41.0, 55.0, 54.0, 33.0, 39.0, 25.0, 29.0, 15.0, 16.0, 13.0, 14.0, 6.0, 5.0, 7.0, 7.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.291534423828125e-06, -4.157423973083496e-06, -4.023313522338867e-06, -3.889203071594238e-06, -3.7550926208496094e-06, -3.6209821701049805e-06, -3.4868717193603516e-06, -3.3527612686157227e-06, -3.2186508178710938e-06, -3.084540367126465e-06, -2.950429916381836e-06, -2.816319465637207e-06, -2.682209014892578e-06, -2.5480985641479492e-06, -2.4139881134033203e-06, -2.2798776626586914e-06, -2.1457672119140625e-06, -2.0116567611694336e-06, -1.8775463104248047e-06, -1.7434358596801758e-06, -1.6093254089355469e-06, -1.475214958190918e-06, -1.341104507446289e-06, -1.2069940567016602e-06, -1.0728836059570312e-06, -9.387731552124023e-07, -8.046627044677734e-07, -6.705522537231445e-07, -5.364418029785156e-07, -4.023313522338867e-07, -2.682209014892578e-07, -1.341104507446289e-07, 0.0, 1.341104507446289e-07, 2.682209014892578e-07, 4.023313522338867e-07, 5.364418029785156e-07, 6.705522537231445e-07, 8.046627044677734e-07, 9.387731552124023e-07, 1.0728836059570312e-06, 1.2069940567016602e-06, 1.341104507446289e-06, 1.475214958190918e-06, 1.6093254089355469e-06, 1.7434358596801758e-06, 1.8775463104248047e-06, 2.0116567611694336e-06, 2.1457672119140625e-06, 2.2798776626586914e-06, 2.4139881134033203e-06, 2.5480985641479492e-06, 2.682209014892578e-06, 2.816319465637207e-06, 2.950429916381836e-06, 3.084540367126465e-06, 3.2186508178710938e-06, 3.3527612686157227e-06, 3.4868717193603516e-06, 3.6209821701049805e-06, 3.7550926208496094e-06, 3.889203071594238e-06, 4.023313522338867e-06, 4.157423973083496e-06, 4.291534423828125e-06]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 5.0, 8.0, 4.0, 4.0, 20.0, 16.0, 27.0, 41.0, 67.0, 90.0, 178.0, 569.0, 5291.0, 1038816.0, 2540.0, 412.0, 165.0, 91.0, 53.0, 40.0, 18.0, 17.0, 11.0, 13.0, 7.0, 7.0, 3.0, 3.0, 6.0, 9.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.0558319091796875e-05, -5.868915468454361e-05, -5.6819990277290344e-05, -5.495082587003708e-05, -5.3081661462783813e-05, -5.121249705553055e-05, -4.934333264827728e-05, -4.747416824102402e-05, -4.560500383377075e-05, -4.3735839426517487e-05, -4.186667501926422e-05, -3.9997510612010956e-05, -3.812834620475769e-05, -3.6259181797504425e-05, -3.439001739025116e-05, -3.2520852982997894e-05, -3.065168857574463e-05, -2.8782524168491364e-05, -2.6913359761238098e-05, -2.5044195353984833e-05, -2.3175030946731567e-05, -2.1305866539478302e-05, -1.9436702132225037e-05, -1.756753772497177e-05, -1.5698373317718506e-05, -1.382920891046524e-05, -1.1960044503211975e-05, -1.009088009595871e-05, -8.221715688705444e-06, -6.352551281452179e-06, -4.4833868741989136e-06, -2.614222466945648e-06, -7.450580596923828e-07, 1.1241063475608826e-06, 2.993270754814148e-06, 4.862435162067413e-06, 6.731599569320679e-06, 8.600763976573944e-06, 1.046992838382721e-05, 1.2339092791080475e-05, 1.420825719833374e-05, 1.6077421605587006e-05, 1.794658601284027e-05, 1.9815750420093536e-05, 2.1684914827346802e-05, 2.3554079234600067e-05, 2.5423243641853333e-05, 2.7292408049106598e-05, 2.9161572456359863e-05, 3.103073686361313e-05, 3.2899901270866394e-05, 3.476906567811966e-05, 3.6638230085372925e-05, 3.850739449262619e-05, 4.0376558899879456e-05, 4.224572330713272e-05, 4.4114887714385986e-05, 4.598405212163925e-05, 4.785321652889252e-05, 4.972238093614578e-05, 5.159154534339905e-05, 5.346070975065231e-05, 5.532987415790558e-05, 5.7199038565158844e-05, 5.906820297241211e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 5.0, 3.0, 4.0, 8.0, 5.0, 3.0, 21.0, 14.0, 23.0, 25.0, 36.0, 33.0, 47.0, 79.0, 104.0, 197.0, 95.0, 67.0, 45.0, 39.0, 22.0, 26.0, 11.0, 17.0, 11.0, 11.0, 7.0, 8.0, 5.0, 3.0, 5.0, 7.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.838539123535156e-05, -3.719702363014221e-05, -3.600865602493286e-05, -3.482028841972351e-05, -3.363192081451416e-05, -3.244355320930481e-05, -3.125518560409546e-05, -3.006681799888611e-05, -2.8878450393676758e-05, -2.7690082788467407e-05, -2.6501715183258057e-05, -2.5313347578048706e-05, -2.4124979972839355e-05, -2.2936612367630005e-05, -2.1748244762420654e-05, -2.0559877157211304e-05, -1.9371509552001953e-05, -1.8183141946792603e-05, -1.6994774341583252e-05, -1.58064067363739e-05, -1.461803913116455e-05, -1.34296715259552e-05, -1.224130392074585e-05, -1.1052936315536499e-05, -9.864568710327148e-06, -8.676201105117798e-06, -7.487833499908447e-06, -6.299465894699097e-06, -5.111098289489746e-06, -3.9227306842803955e-06, -2.734363079071045e-06, -1.5459954738616943e-06, -3.5762786865234375e-07, 8.307397365570068e-07, 2.0191073417663574e-06, 3.207474946975708e-06, 4.395842552185059e-06, 5.584210157394409e-06, 6.77257776260376e-06, 7.96094536781311e-06, 9.149312973022461e-06, 1.0337680578231812e-05, 1.1526048183441162e-05, 1.2714415788650513e-05, 1.3902783393859863e-05, 1.5091150999069214e-05, 1.6279518604278564e-05, 1.7467886209487915e-05, 1.8656253814697266e-05, 1.9844621419906616e-05, 2.1032989025115967e-05, 2.2221356630325317e-05, 2.3409724235534668e-05, 2.459809184074402e-05, 2.578645944595337e-05, 2.697482705116272e-05, 2.816319465637207e-05, 2.935156226158142e-05, 3.053992986679077e-05, 3.172829747200012e-05, 3.291666507720947e-05, 3.410503268241882e-05, 3.5293400287628174e-05, 3.6481767892837524e-05, 3.7670135498046875e-05]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 18.0, 851.0, 142.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08945082128047943, -0.07633531838655472, -0.06321981549263, -0.050104305148124695, -0.03698880225419998, -0.02387329936027527, -0.010757789015769958, 0.0023577138781547546, 0.015473216772079468, 0.02858872152864933, 0.04170422628521919, 0.054819732904434204, 0.06793523579835892, 0.08105073869228363, 0.09416624903678894, 0.10728175193071365, 0.12039725482463837, 0.13351276516914368, 0.1466282606124878, 0.1597437709569931, 0.1728592813014984, 0.18597477674484253, 0.19909028708934784, 0.21220579743385315, 0.22532129287719727, 0.23843680322170258, 0.2515523135662079, 0.264667809009552, 0.2777833044528961, 0.29089879989624023, 0.30401432514190674, 0.31712982058525085, 0.33024531602859497, 0.3433608114719391, 0.3564763367176056, 0.3695918321609497, 0.3827073276042938, 0.39582282304763794, 0.40893834829330444, 0.42205384373664856, 0.4351693391799927, 0.4482848346233368, 0.4614003598690033, 0.4745158553123474, 0.48763135075569153, 0.5007468461990356, 0.5138623714447021, 0.5269778966903687, 0.5400934219360352, 0.5532089471817017, 0.5663244128227234, 0.5794399380683899, 0.5925554633140564, 0.6056709289550781, 0.6187864542007446, 0.6319019794464111, 0.6450174450874329, 0.6581329703330994, 0.6712484359741211, 0.6843639612197876, 0.6974794864654541, 0.7105949521064758, 0.7237104773521423, 0.7368260025978088, 0.7499414682388306]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 8.0, 5.0, 8.0, 7.0, 18.0, 15.0, 11.0, 26.0, 21.0, 35.0, 31.0, 52.0, 50.0, 48.0, 61.0, 72.0, 68.0, 60.0, 69.0, 52.0, 53.0, 33.0, 42.0, 32.0, 27.0, 18.0, 18.0, 8.0, 15.0, 9.0, 7.0, 8.0, 9.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17363351583480835, -0.16735723614692688, -0.1610809564590454, -0.15480467677116394, -0.14852839708328247, -0.142252117395401, -0.13597583770751953, -0.12969955801963806, -0.12342328578233719, -0.11714700609445572, -0.11087072640657425, -0.10459445416927338, -0.0983181744813919, -0.09204189479351044, -0.08576561510562897, -0.0794893354177475, -0.07321305572986603, -0.06693677604198456, -0.06066049635410309, -0.05438422039151192, -0.04810794070363045, -0.04183166101574898, -0.035555385053157806, -0.029279105365276337, -0.023002825677394867, -0.016726545989513397, -0.010450268164277077, -0.004173990339040756, 0.0021022893488407135, 0.008378569036722183, 0.014654844999313354, 0.020931124687194824, 0.027207404375076294, 0.033483684062957764, 0.03975996375083923, 0.046036239713430405, 0.052312519401311874, 0.058588799089193344, 0.06486507505178452, 0.07114135473966599, 0.07741763442754745, 0.08369391411542892, 0.0899701938033104, 0.09624646604061127, 0.10252274572849274, 0.1087990254163742, 0.11507530510425568, 0.12135158479213715, 0.12762786448001862, 0.13390414416790009, 0.14018042385578156, 0.14645670354366302, 0.1527329832315445, 0.15900926291942596, 0.16528552770614624, 0.1715618073940277, 0.17783808708190918, 0.18411436676979065, 0.19039064645767212, 0.1966669261455536, 0.20294320583343506, 0.20921948552131653, 0.215495765209198, 0.22177204489707947, 0.22804832458496094]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 0.0, 4.0, 4.0, 4.0, 1.0, 8.0, 4.0, 1.0, 8.0, 11.0, 10.0, 25.0, 26.0, 31.0, 23.0, 19.0, 36.0, 54.0, 84.0, 111.0, 202.0, 309.0, 650.0, 2545.0, 4185075.0, 3494.0, 646.0, 329.0, 139.0, 125.0, 82.0, 68.0, 35.0, 27.0, 23.0, 15.0, 11.0, 15.0, 14.0, 4.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.348388671875, -0.3373374938964844, -0.32628631591796875, -0.3152351379394531, -0.3041839599609375, -0.2931327819824219, -0.28208160400390625, -0.2710304260253906, -0.259979248046875, -0.24892807006835938, -0.23787689208984375, -0.22682571411132812, -0.2157745361328125, -0.20472335815429688, -0.19367218017578125, -0.18262100219726562, -0.17156982421875, -0.16051864624023438, -0.14946746826171875, -0.13841629028320312, -0.1273651123046875, -0.11631393432617188, -0.10526275634765625, -0.09421157836914062, -0.083160400390625, -0.07210922241210938, -0.06105804443359375, -0.050006866455078125, -0.0389556884765625, -0.027904510498046875, -0.01685333251953125, -0.005802154541015625, 0.0052490234375, 0.016300201416015625, 0.02735137939453125, 0.038402557373046875, 0.0494537353515625, 0.060504913330078125, 0.07155609130859375, 0.08260726928710938, 0.093658447265625, 0.10470962524414062, 0.11576080322265625, 0.12681198120117188, 0.1378631591796875, 0.14891433715820312, 0.15996551513671875, 0.17101669311523438, 0.18206787109375, 0.19311904907226562, 0.20417022705078125, 0.21522140502929688, 0.2262725830078125, 0.23732376098632812, 0.24837493896484375, 0.2594261169433594, 0.270477294921875, 0.2815284729003906, 0.29257965087890625, 0.3036308288574219, 0.3146820068359375, 0.3257331848144531, 0.33678436279296875, 0.3478355407714844, 0.35888671875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 4.0, 3.0, 4.0, 3.0, 6.0, 16.0, 17.0, 17.0, 19.0, 118.0, 407.0, 233.0, 47.0, 22.0, 10.0, 8.0, 5.0, 14.0, 8.0, 5.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0193634033203125, -0.01875019073486328, -0.018136978149414062, -0.017523765563964844, -0.016910552978515625, -0.016297340393066406, -0.015684127807617188, -0.015070915222167969, -0.01445770263671875, -0.013844490051269531, -0.013231277465820312, -0.012618064880371094, -0.012004852294921875, -0.011391639709472656, -0.010778427124023438, -0.010165214538574219, -0.009552001953125, -0.008938789367675781, -0.008325576782226562, -0.007712364196777344, -0.007099151611328125, -0.006485939025878906, -0.0058727264404296875, -0.005259513854980469, -0.00464630126953125, -0.004033088684082031, -0.0034198760986328125, -0.0028066635131835938, -0.002193450927734375, -0.0015802383422851562, -0.0009670257568359375, -0.00035381317138671875, 0.0002593994140625, 0.0008726119995117188, 0.0014858245849609375, 0.0020990371704101562, 0.002712249755859375, 0.0033254623413085938, 0.0039386749267578125, 0.004551887512207031, 0.00516510009765625, 0.005778312683105469, 0.0063915252685546875, 0.007004737854003906, 0.007617950439453125, 0.008231163024902344, 0.008844375610351562, 0.009457588195800781, 0.01007080078125, 0.010684013366699219, 0.011297225952148438, 0.011910438537597656, 0.012523651123046875, 0.013136863708496094, 0.013750076293945312, 0.014363288879394531, 0.01497650146484375, 0.015589714050292969, 0.016202926635742188, 0.016816139221191406, 0.017429351806640625, 0.018042564392089844, 0.018655776977539062, 0.01926898956298828, 0.0198822021484375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 5.0, 8.0, 7.0, 5.0, 11.0, 11.0, 20.0, 17.0, 26.0, 29.0, 53.0, 91.0, 365.0, 6899.0, 4177356.0, 8592.0, 409.0, 126.0, 57.0, 48.0, 31.0, 16.0, 17.0, 16.0, 13.0, 11.0, 6.0, 7.0, 5.0, 1.0, 3.0, 2.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07476806640625, -0.07194995880126953, -0.06913185119628906, -0.0663137435913086, -0.06349563598632812, -0.060677528381347656, -0.05785942077636719, -0.05504131317138672, -0.05222320556640625, -0.04940509796142578, -0.04658699035644531, -0.043768882751464844, -0.040950775146484375, -0.038132667541503906, -0.03531455993652344, -0.03249645233154297, -0.0296783447265625, -0.02686023712158203, -0.024042129516601562, -0.021224021911621094, -0.018405914306640625, -0.015587806701660156, -0.012769699096679688, -0.009951591491699219, -0.00713348388671875, -0.004315376281738281, -0.0014972686767578125, 0.0013208389282226562, 0.004138946533203125, 0.006957054138183594, 0.009775161743164062, 0.012593269348144531, 0.015411376953125, 0.01822948455810547, 0.021047592163085938, 0.023865699768066406, 0.026683807373046875, 0.029501914978027344, 0.03232002258300781, 0.03513813018798828, 0.03795623779296875, 0.04077434539794922, 0.04359245300292969, 0.046410560607910156, 0.049228668212890625, 0.052046775817871094, 0.05486488342285156, 0.05768299102783203, 0.0605010986328125, 0.06331920623779297, 0.06613731384277344, 0.0689554214477539, 0.07177352905273438, 0.07459163665771484, 0.07740974426269531, 0.08022785186767578, 0.08304595947265625, 0.08586406707763672, 0.08868217468261719, 0.09150028228759766, 0.09431838989257812, 0.0971364974975586, 0.09995460510253906, 0.10277271270751953, 0.1055908203125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 6.0, 4.0, 4.0, 5.0, 14.0, 16.0, 24.0, 56.0, 170.0, 2866.0, 730.0, 94.0, 19.0, 12.0, 8.0, 3.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.033447265625, -0.03256368637084961, -0.03168010711669922, -0.030796527862548828, -0.029912948608398438, -0.029029369354248047, -0.028145790100097656, -0.027262210845947266, -0.026378631591796875, -0.025495052337646484, -0.024611473083496094, -0.023727893829345703, -0.022844314575195312, -0.021960735321044922, -0.02107715606689453, -0.02019357681274414, -0.01930999755859375, -0.01842641830444336, -0.01754283905029297, -0.016659259796142578, -0.015775680541992188, -0.014892101287841797, -0.014008522033691406, -0.013124942779541016, -0.012241363525390625, -0.011357784271240234, -0.010474205017089844, -0.009590625762939453, -0.008707046508789062, -0.007823467254638672, -0.006939888000488281, -0.006056308746337891, -0.0051727294921875, -0.004289150238037109, -0.0034055709838867188, -0.002521991729736328, -0.0016384124755859375, -0.0007548332214355469, 0.00012874603271484375, 0.0010123252868652344, 0.001895904541015625, 0.0027794837951660156, 0.0036630630493164062, 0.004546642303466797, 0.0054302215576171875, 0.006313800811767578, 0.007197380065917969, 0.00808095932006836, 0.00896453857421875, 0.00984811782836914, 0.010731697082519531, 0.011615276336669922, 0.012498855590820312, 0.013382434844970703, 0.014266014099121094, 0.015149593353271484, 0.016033172607421875, 0.016916751861572266, 0.017800331115722656, 0.018683910369873047, 0.019567489624023438, 0.020451068878173828, 0.02133464813232422, 0.02221822738647461, 0.023101806640625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 20.0, 998.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7024952173233032, -0.6819820404052734, -0.6614688038825989, -0.6409556269645691, -0.6204423904418945, -0.5999292135238647, -0.579416036605835, -0.5589028596878052, -0.5383896231651306, -0.5178764462471008, -0.49736320972442627, -0.4768500328063965, -0.4563368260860443, -0.43582361936569214, -0.41531044244766235, -0.3947972357273102, -0.374284029006958, -0.35377082228660583, -0.33325761556625366, -0.3127444386482239, -0.2922312319278717, -0.27171802520751953, -0.25120484828948975, -0.23069164156913757, -0.2101784348487854, -0.18966522812843323, -0.16915203630924225, -0.14863884449005127, -0.1281256377696991, -0.10761243849992752, -0.08709923923015594, -0.06658604741096497, -0.04607284069061279, -0.025559641420841217, -0.005046442151069641, 0.015466757118701935, 0.03597995638847351, 0.05649315565824509, 0.07700635492801666, 0.09751954674720764, 0.11803275346755981, 0.138545960187912, 0.15905915200710297, 0.17957234382629395, 0.20008555054664612, 0.2205987572669983, 0.24111194908618927, 0.26162514090538025, 0.2821383476257324, 0.3026515543460846, 0.32316476106643677, 0.34367793798446655, 0.3641911447048187, 0.3847043514251709, 0.4052175283432007, 0.42573073506355286, 0.44624394178390503, 0.4667571485042572, 0.4872703552246094, 0.5077835321426392, 0.528296709060669, 0.5488099455833435, 0.5693231225013733, 0.5898363590240479, 0.6103495359420776]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 6.0, 7.0, 13.0, 16.0, 13.0, 21.0, 33.0, 33.0, 37.0, 48.0, 60.0, 56.0, 46.0, 52.0, 58.0, 44.0, 50.0, 51.0, 62.0, 37.0, 51.0, 39.0, 35.0, 40.0, 22.0, 15.0, 13.0, 13.0, 9.0, 14.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09828883409500122, -0.09575214236974716, -0.0932154506444931, -0.09067875891923904, -0.08814206719398499, -0.08560537546873093, -0.08306868374347687, -0.08053199201822281, -0.07799530029296875, -0.07545860856771469, -0.07292191684246063, -0.07038522511720657, -0.06784853339195251, -0.06531184166669846, -0.0627751499414444, -0.06023845821619034, -0.05770176649093628, -0.05516507476568222, -0.05262838304042816, -0.0500916913151741, -0.047554999589920044, -0.045018307864665985, -0.042481616139411926, -0.03994492441415787, -0.03740823268890381, -0.03487154096364975, -0.03233484923839569, -0.029798157513141632, -0.027261465787887573, -0.024724774062633514, -0.022188082337379456, -0.019651390612125397, -0.017114698886871338, -0.014578007161617279, -0.01204131543636322, -0.009504623711109161, -0.0069679319858551025, -0.004431240260601044, -0.0018945485353469849, 0.000642143189907074, 0.003178834915161133, 0.005715526640415192, 0.00825221836566925, 0.01078891009092331, 0.013325601816177368, 0.015862293541431427, 0.018398985266685486, 0.020935676991939545, 0.023472368717193604, 0.026009060442447662, 0.02854575216770172, 0.03108244389295578, 0.03361913561820984, 0.0361558273434639, 0.03869251906871796, 0.041229210793972015, 0.043765902519226074, 0.04630259424448013, 0.04883928596973419, 0.05137597769498825, 0.05391266942024231, 0.05644936114549637, 0.05898605287075043, 0.061522744596004486, 0.06405943632125854]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 2.0, 6.0, 9.0, 9.0, 24.0, 19.0, 42.0, 33.0, 55.0, 68.0, 88.0, 118.0, 205.0, 255.0, 358.0, 507.0, 796.0, 1260.0, 2400.0, 5875.0, 27352.0, 977527.0, 20531.0, 4996.0, 2244.0, 1304.0, 815.0, 527.0, 314.0, 235.0, 156.0, 126.0, 60.0, 60.0, 42.0, 30.0, 25.0, 27.0, 10.0, 11.0, 11.0, 6.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0], "bins": [-0.1270751953125, -0.12315750122070312, -0.11923980712890625, -0.11532211303710938, -0.1114044189453125, -0.10748672485351562, -0.10356903076171875, -0.09965133666992188, -0.095733642578125, -0.09181594848632812, -0.08789825439453125, -0.08398056030273438, -0.0800628662109375, -0.07614517211914062, -0.07222747802734375, -0.06830978393554688, -0.06439208984375, -0.060474395751953125, -0.05655670166015625, -0.052639007568359375, -0.0487213134765625, -0.044803619384765625, -0.04088592529296875, -0.036968231201171875, -0.033050537109375, -0.029132843017578125, -0.02521514892578125, -0.021297454833984375, -0.0173797607421875, -0.013462066650390625, -0.00954437255859375, -0.005626678466796875, -0.001708984375, 0.002208709716796875, 0.00612640380859375, 0.010044097900390625, 0.0139617919921875, 0.017879486083984375, 0.02179718017578125, 0.025714874267578125, 0.029632568359375, 0.033550262451171875, 0.03746795654296875, 0.041385650634765625, 0.0453033447265625, 0.049221038818359375, 0.05313873291015625, 0.057056427001953125, 0.06097412109375, 0.06489181518554688, 0.06880950927734375, 0.07272720336914062, 0.0766448974609375, 0.08056259155273438, 0.08448028564453125, 0.08839797973632812, 0.092315673828125, 0.09623336791992188, 0.10015106201171875, 0.10406875610351562, 0.1079864501953125, 0.11190414428710938, 0.11582183837890625, 0.11973953247070312, 0.1236572265625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 16.0, 17.0, 16.0, 22.0, 122.0, 398.0, 238.0, 45.0, 23.0, 9.0, 8.0, 5.0, 14.0, 8.0, 5.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0193634033203125, -0.01875019073486328, -0.018136978149414062, -0.017523765563964844, -0.016910552978515625, -0.016297340393066406, -0.015684127807617188, -0.015070915222167969, -0.01445770263671875, -0.013844490051269531, -0.013231277465820312, -0.012618064880371094, -0.012004852294921875, -0.011391639709472656, -0.010778427124023438, -0.010165214538574219, -0.009552001953125, -0.008938789367675781, -0.008325576782226562, -0.007712364196777344, -0.007099151611328125, -0.006485939025878906, -0.0058727264404296875, -0.005259513854980469, -0.00464630126953125, -0.004033088684082031, -0.0034198760986328125, -0.0028066635131835938, -0.002193450927734375, -0.0015802383422851562, -0.0009670257568359375, -0.00035381317138671875, 0.0002593994140625, 0.0008726119995117188, 0.0014858245849609375, 0.0020990371704101562, 0.002712249755859375, 0.0033254623413085938, 0.0039386749267578125, 0.004551887512207031, 0.00516510009765625, 0.005778312683105469, 0.0063915252685546875, 0.007004737854003906, 0.007617950439453125, 0.008231163024902344, 0.008844375610351562, 0.009457588195800781, 0.01007080078125, 0.010684013366699219, 0.011297225952148438, 0.011910438537597656, 0.012523651123046875, 0.013136863708496094, 0.013750076293945312, 0.014363288879394531, 0.01497650146484375, 0.015589714050292969, 0.016202926635742188, 0.016816139221191406, 0.017429351806640625, 0.018042564392089844, 0.018655776977539062, 0.01926898956298828, 0.0198822021484375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 6.0, 8.0, 4.0, 13.0, 10.0, 17.0, 21.0, 26.0, 32.0, 43.0, 61.0, 53.0, 78.0, 89.0, 127.0, 143.0, 221.0, 355.0, 611.0, 1575.0, 76466.0, 963147.0, 3219.0, 793.0, 415.0, 243.0, 155.0, 122.0, 94.0, 97.0, 62.0, 50.0, 42.0, 37.0, 28.0, 16.0, 22.0, 14.0, 8.0, 7.0, 8.0, 2.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.09222412109375, -0.08960151672363281, -0.08697891235351562, -0.08435630798339844, -0.08173370361328125, -0.07911109924316406, -0.07648849487304688, -0.07386589050292969, -0.0712432861328125, -0.06862068176269531, -0.06599807739257812, -0.06337547302246094, -0.06075286865234375, -0.05813026428222656, -0.055507659912109375, -0.05288505554199219, -0.050262451171875, -0.04763984680175781, -0.045017242431640625, -0.04239463806152344, -0.03977203369140625, -0.03714942932128906, -0.034526824951171875, -0.03190422058105469, -0.0292816162109375, -0.026659011840820312, -0.024036407470703125, -0.021413803100585938, -0.01879119873046875, -0.016168594360351562, -0.013545989990234375, -0.010923385620117188, -0.00830078125, -0.0056781768798828125, -0.003055572509765625, -0.0004329681396484375, 0.00218963623046875, 0.0048122406005859375, 0.007434844970703125, 0.010057449340820312, 0.0126800537109375, 0.015302658081054688, 0.017925262451171875, 0.020547866821289062, 0.02317047119140625, 0.025793075561523438, 0.028415679931640625, 0.031038284301757812, 0.033660888671875, 0.03628349304199219, 0.038906097412109375, 0.04152870178222656, 0.04415130615234375, 0.04677391052246094, 0.049396514892578125, 0.05201911926269531, 0.0546417236328125, 0.05726432800292969, 0.059886932373046875, 0.06250953674316406, 0.06513214111328125, 0.06775474548339844, 0.07037734985351562, 0.07299995422363281, 0.07562255859375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 2.0, 7.0, 3.0, 10.0, 7.0, 11.0, 12.0, 16.0, 18.0, 20.0, 35.0, 16.0, 27.0, 25.0, 27.0, 29.0, 40.0, 43.0, 51.0, 49.0, 44.0, 48.0, 61.0, 39.0, 42.0, 39.0, 33.0, 30.0, 30.0, 30.0, 29.0, 17.0, 21.0, 21.0, 14.0, 11.0, 12.0, 7.0, 5.0, 5.0, 3.0, 2.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-0.03851318359375, -0.03741884231567383, -0.036324501037597656, -0.035230159759521484, -0.03413581848144531, -0.03304147720336914, -0.03194713592529297, -0.030852794647216797, -0.029758453369140625, -0.028664112091064453, -0.02756977081298828, -0.02647542953491211, -0.025381088256835938, -0.024286746978759766, -0.023192405700683594, -0.022098064422607422, -0.02100372314453125, -0.019909381866455078, -0.018815040588378906, -0.017720699310302734, -0.016626358032226562, -0.01553201675415039, -0.014437675476074219, -0.013343334197998047, -0.012248992919921875, -0.011154651641845703, -0.010060310363769531, -0.00896596908569336, -0.007871627807617188, -0.006777286529541016, -0.005682945251464844, -0.004588603973388672, -0.0034942626953125, -0.002399921417236328, -0.0013055801391601562, -0.00021123886108398438, 0.0008831024169921875, 0.0019774436950683594, 0.0030717849731445312, 0.004166126251220703, 0.005260467529296875, 0.006354808807373047, 0.007449150085449219, 0.00854349136352539, 0.009637832641601562, 0.010732173919677734, 0.011826515197753906, 0.012920856475830078, 0.01401519775390625, 0.015109539031982422, 0.016203880310058594, 0.017298221588134766, 0.018392562866210938, 0.01948690414428711, 0.02058124542236328, 0.021675586700439453, 0.022769927978515625, 0.023864269256591797, 0.02495861053466797, 0.02605295181274414, 0.027147293090820312, 0.028241634368896484, 0.029335975646972656, 0.030430316925048828, 0.031524658203125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 12.0, 13.0, 18.0, 24.0, 28.0, 48.0, 69.0, 138.0, 271.0, 570.0, 1549.0, 6624.0, 185614.0, 843126.0, 7508.0, 1697.0, 566.0, 275.0, 130.0, 88.0, 62.0, 37.0, 26.0, 14.0, 11.0, 9.0, 8.0, 5.0, 4.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002390146255493164, -0.0002313125878572464, -0.0002236105501651764, -0.00021590851247310638, -0.00020820647478103638, -0.00020050443708896637, -0.00019280239939689636, -0.00018510036170482635, -0.00017739832401275635, -0.00016969628632068634, -0.00016199424862861633, -0.00015429221093654633, -0.00014659017324447632, -0.0001388881355524063, -0.0001311860978603363, -0.0001234840601682663, -0.00011578202247619629, -0.00010807998478412628, -0.00010037794709205627, -9.267590939998627e-05, -8.497387170791626e-05, -7.727183401584625e-05, -6.956979632377625e-05, -6.186775863170624e-05, -5.416572093963623e-05, -4.646368324756622e-05, -3.8761645555496216e-05, -3.105960786342621e-05, -2.33575701713562e-05, -1.5655532479286194e-05, -7.953494787216187e-06, -2.514570951461792e-07, 7.450580596923828e-06, 1.5152618288993835e-05, 2.2854655981063843e-05, 3.055669367313385e-05, 3.825873136520386e-05, 4.5960769057273865e-05, 5.366280674934387e-05, 6.136484444141388e-05, 6.906688213348389e-05, 7.67689198255539e-05, 8.44709575176239e-05, 9.217299520969391e-05, 9.987503290176392e-05, 0.00010757707059383392, 0.00011527910828590393, 0.00012298114597797394, 0.00013068318367004395, 0.00013838522136211395, 0.00014608725905418396, 0.00015378929674625397, 0.00016149133443832397, 0.00016919337213039398, 0.000176895409822464, 0.000184597447514534, 0.000192299485206604, 0.000200001522898674, 0.00020770356059074402, 0.00021540559828281403, 0.00022310763597488403, 0.00023080967366695404, 0.00023851171135902405, 0.00024621374905109406, 0.00025391578674316406]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 7.0, 5.0, 8.0, 8.0, 11.0, 9.0, 20.0, 14.0, 26.0, 27.0, 45.0, 38.0, 76.0, 66.0, 112.0, 93.0, 81.0, 71.0, 57.0, 49.0, 36.0, 29.0, 32.0, 21.0, 16.0, 15.0, 9.0, 4.0, 5.0, 7.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.569789886474609e-06, -7.242895662784576e-06, -6.9160014390945435e-06, -6.5891072154045105e-06, -6.2622129917144775e-06, -5.935318768024445e-06, -5.608424544334412e-06, -5.281530320644379e-06, -4.954636096954346e-06, -4.627741873264313e-06, -4.30084764957428e-06, -3.973953425884247e-06, -3.647059202194214e-06, -3.320164978504181e-06, -2.993270754814148e-06, -2.666376531124115e-06, -2.339482307434082e-06, -2.012588083744049e-06, -1.6856938600540161e-06, -1.3587996363639832e-06, -1.0319054126739502e-06, -7.050111889839172e-07, -3.781169652938843e-07, -5.122274160385132e-08, 2.7567148208618164e-07, 6.025657057762146e-07, 9.294599294662476e-07, 1.2563541531562805e-06, 1.5832483768463135e-06, 1.9101426005363464e-06, 2.2370368242263794e-06, 2.5639310479164124e-06, 2.8908252716064453e-06, 3.2177194952964783e-06, 3.5446137189865112e-06, 3.871507942676544e-06, 4.198402166366577e-06, 4.52529639005661e-06, 4.852190613746643e-06, 5.179084837436676e-06, 5.505979061126709e-06, 5.832873284816742e-06, 6.159767508506775e-06, 6.486661732196808e-06, 6.813555955886841e-06, 7.140450179576874e-06, 7.467344403266907e-06, 7.79423862695694e-06, 8.121132850646973e-06, 8.448027074337006e-06, 8.774921298027039e-06, 9.101815521717072e-06, 9.428709745407104e-06, 9.755603969097137e-06, 1.008249819278717e-05, 1.0409392416477203e-05, 1.0736286640167236e-05, 1.106318086385727e-05, 1.1390075087547302e-05, 1.1716969311237335e-05, 1.2043863534927368e-05, 1.2370757758617401e-05, 1.2697651982307434e-05, 1.3024546205997467e-05, 1.33514404296875e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 6.0, 11.0, 5.0, 9.0, 14.0, 19.0, 29.0, 27.0, 52.0, 85.0, 139.0, 391.0, 2235.0, 1038831.0, 5708.0, 469.0, 190.0, 103.0, 63.0, 39.0, 28.0, 10.0, 14.0, 15.0, 11.0, 4.0, 4.0, 6.0, 4.0, 7.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003311634063720703, -0.000321313738822937, -0.0003114640712738037, -0.0003016144037246704, -0.0002917647361755371, -0.0002819150686264038, -0.0002720654010772705, -0.0002622157335281372, -0.0002523660659790039, -0.0002425163984298706, -0.0002326667308807373, -0.000222817063331604, -0.0002129673957824707, -0.0002031177282333374, -0.0001932680606842041, -0.0001834183931350708, -0.0001735687255859375, -0.0001637190580368042, -0.0001538693904876709, -0.0001440197229385376, -0.0001341700553894043, -0.000124320387840271, -0.0001144707202911377, -0.0001046210527420044, -9.47713851928711e-05, -8.492171764373779e-05, -7.507205009460449e-05, -6.522238254547119e-05, -5.537271499633789e-05, -4.552304744720459e-05, -3.567337989807129e-05, -2.5823712348937988e-05, -1.5974044799804688e-05, -6.124377250671387e-06, 3.725290298461914e-06, 1.3574957847595215e-05, 2.3424625396728516e-05, 3.3274292945861816e-05, 4.312396049499512e-05, 5.297362804412842e-05, 6.282329559326172e-05, 7.267296314239502e-05, 8.252263069152832e-05, 9.237229824066162e-05, 0.00010222196578979492, 0.00011207163333892822, 0.00012192130088806152, 0.00013177096843719482, 0.00014162063598632812, 0.00015147030353546143, 0.00016131997108459473, 0.00017116963863372803, 0.00018101930618286133, 0.00019086897373199463, 0.00020071864128112793, 0.00021056830883026123, 0.00022041797637939453, 0.00023026764392852783, 0.00024011731147766113, 0.00024996697902679443, 0.00025981664657592773, 0.00026966631412506104, 0.00027951598167419434, 0.00028936564922332764, 0.00029921531677246094]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 8.0, 7.0, 10.0, 10.0, 12.0, 20.0, 40.0, 79.0, 127.0, 298.0, 160.0, 77.0, 45.0, 25.0, 16.0, 12.0, 8.0, 2.0, 8.0, 5.0, 5.0, 4.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001385211944580078, -0.00013440102338790894, -0.00013028085231781006, -0.00012616068124771118, -0.0001220405101776123, -0.00011792033910751343, -0.00011380016803741455, -0.00010967999696731567, -0.0001055598258972168, -0.00010143965482711792, -9.731948375701904e-05, -9.319931268692017e-05, -8.907914161682129e-05, -8.495897054672241e-05, -8.083879947662354e-05, -7.671862840652466e-05, -7.259845733642578e-05, -6.84782862663269e-05, -6.435811519622803e-05, -6.023794412612915e-05, -5.6117773056030273e-05, -5.1997601985931396e-05, -4.787743091583252e-05, -4.375725984573364e-05, -3.9637088775634766e-05, -3.551691770553589e-05, -3.139674663543701e-05, -2.7276575565338135e-05, -2.3156404495239258e-05, -1.903623342514038e-05, -1.4916062355041504e-05, -1.0795891284942627e-05, -6.67572021484375e-06, -2.555549144744873e-06, 1.564621925354004e-06, 5.684792995452881e-06, 9.804964065551758e-06, 1.3925135135650635e-05, 1.8045306205749512e-05, 2.216547727584839e-05, 2.6285648345947266e-05, 3.0405819416046143e-05, 3.452599048614502e-05, 3.8646161556243896e-05, 4.2766332626342773e-05, 4.688650369644165e-05, 5.100667476654053e-05, 5.5126845836639404e-05, 5.924701690673828e-05, 6.336718797683716e-05, 6.748735904693604e-05, 7.160753011703491e-05, 7.572770118713379e-05, 7.984787225723267e-05, 8.396804332733154e-05, 8.808821439743042e-05, 9.22083854675293e-05, 9.632855653762817e-05, 0.00010044872760772705, 0.00010456889867782593, 0.0001086890697479248, 0.00011280924081802368, 0.00011692941188812256, 0.00012104958295822144, 0.0001251697540283203]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 29.0, 970.0, 16.0], "bins": [-1.6110010147094727, -1.5852724313735962, -1.5595438480377197, -1.5338152647018433, -1.5080865621566772, -1.4823579788208008, -1.4566293954849243, -1.4309008121490479, -1.4051722288131714, -1.379443645477295, -1.3537150621414185, -1.327986478805542, -1.302257776260376, -1.2765291929244995, -1.250800609588623, -1.2250720262527466, -1.1993434429168701, -1.1736148595809937, -1.1478862762451172, -1.1221576929092407, -1.0964289903640747, -1.0707004070281982, -1.0449718236923218, -1.0192432403564453, -0.9935145974159241, -0.9677860140800476, -0.9420573711395264, -0.9163287878036499, -0.8906002044677734, -0.864871621131897, -0.8391429781913757, -0.8134143948554993, -0.7876858711242676, -0.7619572877883911, -0.7362286448478699, -0.7105000615119934, -0.6847714781761169, -0.6590428352355957, -0.6333142518997192, -0.6075856685638428, -0.5818570256233215, -0.5561284422874451, -0.5303997993469238, -0.5046712160110474, -0.4789426326751709, -0.45321401953697205, -0.4274854063987732, -0.40175682306289673, -0.37602823972702026, -0.3502996265888214, -0.32457104325294495, -0.2988424301147461, -0.27311384677886963, -0.24738523364067078, -0.22165663540363312, -0.19592803716659546, -0.1701994389295578, -0.14447084069252014, -0.11874224245548248, -0.09301363676786423, -0.06728503853082657, -0.04155643284320831, -0.015827834606170654, 0.009900763630867004, 0.03562936186790466]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 4.0, 5.0, 5.0, 6.0, 8.0, 12.0, 13.0, 13.0, 14.0, 26.0, 31.0, 29.0, 34.0, 50.0, 42.0, 51.0, 49.0, 59.0, 46.0, 51.0, 57.0, 50.0, 43.0, 42.0, 39.0, 39.0, 32.0, 23.0, 21.0, 20.0, 15.0, 14.0, 12.0, 12.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14257240295410156, -0.13748376071453094, -0.13239511847496033, -0.1273064762353897, -0.12221783399581909, -0.11712919175624847, -0.11204054951667786, -0.10695190727710724, -0.10186326503753662, -0.096774622797966, -0.09168598055839539, -0.08659733831882477, -0.08150869607925415, -0.07642005383968353, -0.07133141160011292, -0.0662427693605423, -0.06115412712097168, -0.05606548488140106, -0.050976842641830444, -0.04588820040225983, -0.04079955816268921, -0.03571091592311859, -0.030622273683547974, -0.025533631443977356, -0.02044498920440674, -0.01535634696483612, -0.010267704725265503, -0.005179062485694885, -9.042024612426758e-05, 0.00499822199344635, 0.010086864233016968, 0.015175506472587585, 0.020264148712158203, 0.02535279095172882, 0.03044143319129944, 0.035530075430870056, 0.040618717670440674, 0.04570735991001129, 0.05079600214958191, 0.05588464438915253, 0.060973286628723145, 0.06606192886829376, 0.07115057110786438, 0.076239213347435, 0.08132785558700562, 0.08641649782657623, 0.09150514006614685, 0.09659378230571747, 0.10168242454528809, 0.1067710667848587, 0.11185970902442932, 0.11694835126399994, 0.12203699350357056, 0.12712563574314117, 0.1322142779827118, 0.1373029202222824, 0.14239156246185303, 0.14748020470142365, 0.15256884694099426, 0.15765748918056488, 0.1627461314201355, 0.16783477365970612, 0.17292341589927673, 0.17801205813884735, 0.18310070037841797]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 4.0, 2.0, 5.0, 6.0, 11.0, 11.0, 7.0, 7.0, 13.0, 22.0, 28.0, 38.0, 66.0, 142.0, 1198.0, 4191849.0, 554.0, 102.0, 57.0, 31.0, 27.0, 22.0, 16.0, 13.0, 13.0, 5.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.85546875, -6.63677978515625, -6.4180908203125, -6.19940185546875, -5.980712890625, -5.76202392578125, -5.5433349609375, -5.32464599609375, -5.10595703125, -4.88726806640625, -4.6685791015625, -4.44989013671875, -4.231201171875, -4.01251220703125, -3.7938232421875, -3.57513427734375, -3.3564453125, -3.13775634765625, -2.9190673828125, -2.70037841796875, -2.481689453125, -2.26300048828125, -2.0443115234375, -1.82562255859375, -1.60693359375, -1.38824462890625, -1.1695556640625, -0.95086669921875, -0.732177734375, -0.51348876953125, -0.2947998046875, -0.07611083984375, 0.142578125, 0.36126708984375, 0.5799560546875, 0.79864501953125, 1.017333984375, 1.23602294921875, 1.4547119140625, 1.67340087890625, 1.89208984375, 2.11077880859375, 2.3294677734375, 2.54815673828125, 2.766845703125, 2.98553466796875, 3.2042236328125, 3.42291259765625, 3.6416015625, 3.86029052734375, 4.0789794921875, 4.29766845703125, 4.516357421875, 4.73504638671875, 4.9537353515625, 5.17242431640625, 5.39111328125, 5.60980224609375, 5.8284912109375, 6.04718017578125, 6.265869140625, 6.48455810546875, 6.7032470703125, 6.92193603515625, 7.140625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 16.0, 17.0, 15.0, 20.0, 122.0, 407.0, 234.0, 43.0, 23.0, 9.0, 8.0, 6.0, 13.0, 8.0, 5.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0193634033203125, -0.01875019073486328, -0.018136978149414062, -0.017523765563964844, -0.016910552978515625, -0.016297340393066406, -0.015684127807617188, -0.015070915222167969, -0.01445770263671875, -0.013844490051269531, -0.013231277465820312, -0.012618064880371094, -0.012004852294921875, -0.011391639709472656, -0.010778427124023438, -0.010165214538574219, -0.009552001953125, -0.008938789367675781, -0.008325576782226562, -0.007712364196777344, -0.007099151611328125, -0.006485939025878906, -0.0058727264404296875, -0.005259513854980469, -0.00464630126953125, -0.004033088684082031, -0.0034198760986328125, -0.0028066635131835938, -0.002193450927734375, -0.0015802383422851562, -0.0009670257568359375, -0.00035381317138671875, 0.0002593994140625, 0.0008726119995117188, 0.0014858245849609375, 0.0020990371704101562, 0.002712249755859375, 0.0033254623413085938, 0.0039386749267578125, 0.004551887512207031, 0.00516510009765625, 0.005778312683105469, 0.0063915252685546875, 0.007004737854003906, 0.007617950439453125, 0.008231163024902344, 0.008844375610351562, 0.009457588195800781, 0.01007080078125, 0.010684013366699219, 0.011297225952148438, 0.011910438537597656, 0.012523651123046875, 0.013136863708496094, 0.013750076293945312, 0.014363288879394531, 0.01497650146484375, 0.015589714050292969, 0.016202926635742188, 0.016816139221191406, 0.017429351806640625, 0.018042564392089844, 0.018655776977539062, 0.01926898956298828, 0.0198822021484375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 5.0, 8.0, 6.0, 8.0, 13.0, 26.0, 46.0, 77.0, 125.0, 308.0, 697.0, 2257.0, 14334.0, 4165774.0, 7808.0, 1713.0, 553.0, 237.0, 127.0, 57.0, 39.0, 24.0, 7.0, 10.0, 3.0, 8.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.123779296875, -0.11995601654052734, -0.11613273620605469, -0.11230945587158203, -0.10848617553710938, -0.10466289520263672, -0.10083961486816406, -0.0970163345336914, -0.09319305419921875, -0.0893697738647461, -0.08554649353027344, -0.08172321319580078, -0.07789993286132812, -0.07407665252685547, -0.07025337219238281, -0.06643009185791016, -0.0626068115234375, -0.058783531188964844, -0.05496025085449219, -0.05113697052001953, -0.047313690185546875, -0.04349040985107422, -0.03966712951660156, -0.035843849182128906, -0.03202056884765625, -0.028197288513183594, -0.024374008178710938, -0.02055072784423828, -0.016727447509765625, -0.012904167175292969, -0.009080886840820312, -0.005257606506347656, -0.001434326171875, 0.0023889541625976562, 0.0062122344970703125, 0.010035514831542969, 0.013858795166015625, 0.01768207550048828, 0.021505355834960938, 0.025328636169433594, 0.02915191650390625, 0.032975196838378906, 0.03679847717285156, 0.04062175750732422, 0.044445037841796875, 0.04826831817626953, 0.05209159851074219, 0.055914878845214844, 0.0597381591796875, 0.06356143951416016, 0.06738471984863281, 0.07120800018310547, 0.07503128051757812, 0.07885456085205078, 0.08267784118652344, 0.0865011215209961, 0.09032440185546875, 0.0941476821899414, 0.09797096252441406, 0.10179424285888672, 0.10561752319335938, 0.10944080352783203, 0.11326408386230469, 0.11708736419677734, 0.12091064453125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 8.0, 40.0, 759.0, 3171.0, 41.0, 15.0, 3.0, 6.0, 5.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03204345703125, -0.031073331832885742, -0.030103206634521484, -0.029133081436157227, -0.02816295623779297, -0.02719283103942871, -0.026222705841064453, -0.025252580642700195, -0.024282455444335938, -0.02331233024597168, -0.022342205047607422, -0.021372079849243164, -0.020401954650878906, -0.01943182945251465, -0.01846170425415039, -0.017491579055786133, -0.016521453857421875, -0.015551328659057617, -0.01458120346069336, -0.013611078262329102, -0.012640953063964844, -0.011670827865600586, -0.010700702667236328, -0.00973057746887207, -0.008760452270507812, -0.007790327072143555, -0.006820201873779297, -0.005850076675415039, -0.004879951477050781, -0.0039098262786865234, -0.0029397010803222656, -0.001969575881958008, -0.00099945068359375, -2.9325485229492188e-05, 0.0009407997131347656, 0.0019109249114990234, 0.0028810501098632812, 0.003851175308227539, 0.004821300506591797, 0.005791425704956055, 0.0067615509033203125, 0.00773167610168457, 0.008701801300048828, 0.009671926498413086, 0.010642051696777344, 0.011612176895141602, 0.01258230209350586, 0.013552427291870117, 0.014522552490234375, 0.015492677688598633, 0.01646280288696289, 0.01743292808532715, 0.018403053283691406, 0.019373178482055664, 0.020343303680419922, 0.02131342887878418, 0.022283554077148438, 0.023253679275512695, 0.024223804473876953, 0.02519392967224121, 0.02616405487060547, 0.027134180068969727, 0.028104305267333984, 0.029074430465698242, 0.0300445556640625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 9.0, 199.0, 550.0, 117.0, 57.0, 25.0, 15.0, 10.0, 8.0, 9.0, 6.0, 1.0, 6.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07240816950798035, -0.062193647027015686, -0.051979128271341324, -0.04176460951566696, -0.0315500870347023, -0.02133556455373764, -0.011121045798063278, -0.000906527042388916, 0.009307995438575745, 0.019522516056895256, 0.029737036675214767, 0.03995155543088913, 0.05016607791185379, 0.06038060039281845, 0.07059511542320251, 0.08080963790416718, 0.09102416038513184, 0.1012386828660965, 0.11145320534706116, 0.12166772037744522, 0.13188225030899048, 0.14209675788879395, 0.1523112803697586, 0.16252580285072327, 0.17274032533168793, 0.1829548478126526, 0.19316937029361725, 0.2033838927745819, 0.21359840035438538, 0.22381293773651123, 0.2340274453163147, 0.24424196779727936, 0.25445646047592163, 0.2646709680557251, 0.27488550543785095, 0.2851000130176544, 0.2953145503997803, 0.30552905797958374, 0.3157435953617096, 0.32595810294151306, 0.3361726403236389, 0.3463871479034424, 0.35660168528556824, 0.3668161928653717, 0.37703073024749756, 0.387245237827301, 0.3974597752094269, 0.40767428278923035, 0.4178887903690338, 0.4281032979488373, 0.43831783533096313, 0.4485323429107666, 0.45874688029289246, 0.4689613878726959, 0.4791759252548218, 0.48939043283462524, 0.4996049404144287, 0.5098194479942322, 0.5200339555740356, 0.5302485227584839, 0.5404630303382874, 0.5506775379180908, 0.5608920454978943, 0.5711065530776978, 0.581321120262146]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 5.0, 3.0, 3.0, 6.0, 6.0, 11.0, 7.0, 10.0, 17.0, 11.0, 21.0, 28.0, 40.0, 32.0, 28.0, 37.0, 48.0, 51.0, 60.0, 67.0, 70.0, 63.0, 49.0, 48.0, 53.0, 41.0, 32.0, 28.0, 24.0, 14.0, 27.0, 13.0, 11.0, 4.0, 9.0, 10.0, 4.0, 5.0, 1.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07161343097686768, -0.06956803798675537, -0.06752265244722366, -0.06547726690769196, -0.06343187391757965, -0.061386484652757645, -0.05934109538793564, -0.05729570612311363, -0.055250316858291626, -0.05320492759346962, -0.051159538328647614, -0.04911414906382561, -0.0470687597990036, -0.045023370534181595, -0.04297798126935959, -0.04093259200453758, -0.038887202739715576, -0.03684181347489357, -0.034796424210071564, -0.03275103494524956, -0.03070564568042755, -0.028660256415605545, -0.02661486715078354, -0.024569477885961533, -0.022524088621139526, -0.02047869935631752, -0.018433310091495514, -0.016387920826673508, -0.014342531561851501, -0.012297142297029495, -0.010251753032207489, -0.008206363767385483, -0.0061609745025634766, -0.00411558523774147, -0.002070195972919464, -2.4806708097457886e-05, 0.0020205825567245483, 0.0040659718215465546, 0.006111361086368561, 0.008156750351190567, 0.010202139616012573, 0.01224752888083458, 0.014292918145656586, 0.016338307410478592, 0.018383696675300598, 0.020429085940122604, 0.02247447520494461, 0.024519864469766617, 0.026565253734588623, 0.02861064299941063, 0.030656032264232635, 0.03270142152905464, 0.03474681079387665, 0.036792200058698654, 0.03883758932352066, 0.04088297858834267, 0.04292836785316467, 0.04497375711798668, 0.047019146382808685, 0.04906453564763069, 0.0511099249124527, 0.053155314177274704, 0.05520070344209671, 0.057246092706918716, 0.05929148197174072]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 5.0, 5.0, 2.0, 7.0, 7.0, 14.0, 19.0, 37.0, 76.0, 121.0, 258.0, 517.0, 1114.0, 3099.0, 13235.0, 972705.0, 48272.0, 5960.0, 1690.0, 673.0, 276.0, 176.0, 110.0, 52.0, 35.0, 27.0, 15.0, 17.0, 13.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1387939453125, -0.13442230224609375, -0.1300506591796875, -0.12567901611328125, -0.121307373046875, -0.11693572998046875, -0.1125640869140625, -0.10819244384765625, -0.10382080078125, -0.09944915771484375, -0.0950775146484375, -0.09070587158203125, -0.086334228515625, -0.08196258544921875, -0.0775909423828125, -0.07321929931640625, -0.06884765625, -0.06447601318359375, -0.0601043701171875, -0.05573272705078125, -0.051361083984375, -0.04698944091796875, -0.0426177978515625, -0.03824615478515625, -0.03387451171875, -0.02950286865234375, -0.0251312255859375, -0.02075958251953125, -0.016387939453125, -0.01201629638671875, -0.0076446533203125, -0.00327301025390625, 0.0010986328125, 0.00547027587890625, 0.0098419189453125, 0.01421356201171875, 0.018585205078125, 0.02295684814453125, 0.0273284912109375, 0.03170013427734375, 0.03607177734375, 0.04044342041015625, 0.0448150634765625, 0.04918670654296875, 0.053558349609375, 0.05792999267578125, 0.0623016357421875, 0.06667327880859375, 0.071044921875, 0.07541656494140625, 0.0797882080078125, 0.08415985107421875, 0.088531494140625, 0.09290313720703125, 0.0972747802734375, 0.10164642333984375, 0.10601806640625, 0.11038970947265625, 0.1147613525390625, 0.11913299560546875, 0.123504638671875, 0.12787628173828125, 0.1322479248046875, 0.13661956787109375, 0.1409912109375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 4.0, 4.0, 3.0, 2.0, 9.0, 12.0, 15.0, 17.0, 27.0, 109.0, 363.0, 248.0, 80.0, 22.0, 10.0, 7.0, 5.0, 12.0, 10.0, 7.0, 4.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019256591796875, -0.018648624420166016, -0.01804065704345703, -0.017432689666748047, -0.016824722290039062, -0.016216754913330078, -0.015608787536621094, -0.01500082015991211, -0.014392852783203125, -0.01378488540649414, -0.013176918029785156, -0.012568950653076172, -0.011960983276367188, -0.011353015899658203, -0.010745048522949219, -0.010137081146240234, -0.00952911376953125, -0.008921146392822266, -0.008313179016113281, -0.007705211639404297, -0.0070972442626953125, -0.006489276885986328, -0.005881309509277344, -0.005273342132568359, -0.004665374755859375, -0.004057407379150391, -0.0034494400024414062, -0.002841472625732422, -0.0022335052490234375, -0.0016255378723144531, -0.0010175704956054688, -0.0004096031188964844, 0.0001983642578125, 0.0008063316345214844, 0.0014142990112304688, 0.002022266387939453, 0.0026302337646484375, 0.003238201141357422, 0.0038461685180664062, 0.004454135894775391, 0.005062103271484375, 0.005670070648193359, 0.006278038024902344, 0.006886005401611328, 0.0074939727783203125, 0.008101940155029297, 0.008709907531738281, 0.009317874908447266, 0.00992584228515625, 0.010533809661865234, 0.011141777038574219, 0.011749744415283203, 0.012357711791992188, 0.012965679168701172, 0.013573646545410156, 0.01418161392211914, 0.014789581298828125, 0.01539754867553711, 0.016005516052246094, 0.016613483428955078, 0.017221450805664062, 0.017829418182373047, 0.01843738555908203, 0.019045352935791016, 0.0196533203125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 5.0, 5.0, 7.0, 4.0, 16.0, 22.0, 21.0, 21.0, 48.0, 60.0, 66.0, 90.0, 147.0, 222.0, 331.0, 556.0, 904.0, 1862.0, 4268.0, 12179.0, 50620.0, 604855.0, 316746.0, 38003.0, 9960.0, 3596.0, 1607.0, 841.0, 432.0, 310.0, 228.0, 147.0, 86.0, 66.0, 54.0, 53.0, 25.0, 24.0, 18.0, 8.0, 6.0, 12.0, 9.0, 4.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0], "bins": [-0.053375244140625, -0.05188894271850586, -0.05040264129638672, -0.04891633987426758, -0.04743003845214844, -0.0459437370300293, -0.044457435607910156, -0.042971134185791016, -0.041484832763671875, -0.039998531341552734, -0.038512229919433594, -0.03702592849731445, -0.03553962707519531, -0.03405332565307617, -0.03256702423095703, -0.03108072280883789, -0.02959442138671875, -0.02810811996459961, -0.02662181854248047, -0.025135517120361328, -0.023649215698242188, -0.022162914276123047, -0.020676612854003906, -0.019190311431884766, -0.017704010009765625, -0.016217708587646484, -0.014731407165527344, -0.013245105743408203, -0.011758804321289062, -0.010272502899169922, -0.008786201477050781, -0.007299900054931641, -0.0058135986328125, -0.004327297210693359, -0.0028409957885742188, -0.0013546943664550781, 0.0001316070556640625, 0.0016179084777832031, 0.0031042098999023438, 0.004590511322021484, 0.006076812744140625, 0.007563114166259766, 0.009049415588378906, 0.010535717010498047, 0.012022018432617188, 0.013508319854736328, 0.014994621276855469, 0.01648092269897461, 0.01796722412109375, 0.01945352554321289, 0.02093982696533203, 0.022426128387451172, 0.023912429809570312, 0.025398731231689453, 0.026885032653808594, 0.028371334075927734, 0.029857635498046875, 0.031343936920166016, 0.032830238342285156, 0.0343165397644043, 0.03580284118652344, 0.03728914260864258, 0.03877544403076172, 0.04026174545288086, 0.041748046875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 4.0, 7.0, 7.0, 10.0, 15.0, 10.0, 11.0, 17.0, 18.0, 25.0, 34.0, 24.0, 41.0, 42.0, 39.0, 46.0, 56.0, 48.0, 52.0, 52.0, 48.0, 35.0, 38.0, 38.0, 31.0, 33.0, 35.0, 31.0, 25.0, 22.0, 23.0, 14.0, 11.0, 7.0, 13.0, 9.0, 6.0, 3.0, 5.0, 2.0, 5.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.038726806640625, -0.03764986991882324, -0.036572933197021484, -0.03549599647521973, -0.03441905975341797, -0.03334212303161621, -0.03226518630981445, -0.031188249588012695, -0.030111312866210938, -0.02903437614440918, -0.027957439422607422, -0.026880502700805664, -0.025803565979003906, -0.02472662925720215, -0.02364969253540039, -0.022572755813598633, -0.021495819091796875, -0.020418882369995117, -0.01934194564819336, -0.0182650089263916, -0.017188072204589844, -0.016111135482788086, -0.015034198760986328, -0.01395726203918457, -0.012880325317382812, -0.011803388595581055, -0.010726451873779297, -0.009649515151977539, -0.008572578430175781, -0.0074956417083740234, -0.006418704986572266, -0.005341768264770508, -0.00426483154296875, -0.003187894821166992, -0.0021109580993652344, -0.0010340213775634766, 4.291534423828125e-05, 0.001119852066040039, 0.002196788787841797, 0.0032737255096435547, 0.0043506622314453125, 0.00542759895324707, 0.006504535675048828, 0.007581472396850586, 0.008658409118652344, 0.009735345840454102, 0.01081228256225586, 0.011889219284057617, 0.012966156005859375, 0.014043092727661133, 0.01512002944946289, 0.01619696617126465, 0.017273902893066406, 0.018350839614868164, 0.019427776336669922, 0.02050471305847168, 0.021581649780273438, 0.022658586502075195, 0.023735523223876953, 0.02481245994567871, 0.02588939666748047, 0.026966333389282227, 0.028043270111083984, 0.029120206832885742, 0.0301971435546875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 4.0, 4.0, 6.0, 4.0, 16.0, 19.0, 26.0, 39.0, 41.0, 50.0, 82.0, 118.0, 226.0, 392.0, 630.0, 1185.0, 2633.0, 6712.0, 41891.0, 965899.0, 19262.0, 4921.0, 2073.0, 1001.0, 454.0, 280.0, 172.0, 124.0, 83.0, 62.0, 35.0, 26.0, 18.0, 14.0, 15.0, 12.0, 9.0, 8.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01226806640625, -0.011835336685180664, -0.011402606964111328, -0.010969877243041992, -0.010537147521972656, -0.01010441780090332, -0.009671688079833984, -0.009238958358764648, -0.008806228637695312, -0.008373498916625977, -0.00794076919555664, -0.007508039474487305, -0.007075309753417969, -0.006642580032348633, -0.006209850311279297, -0.005777120590209961, -0.005344390869140625, -0.004911661148071289, -0.004478931427001953, -0.004046201705932617, -0.0036134719848632812, -0.0031807422637939453, -0.0027480125427246094, -0.0023152828216552734, -0.0018825531005859375, -0.0014498233795166016, -0.0010170936584472656, -0.0005843639373779297, -0.00015163421630859375, 0.0002810955047607422, 0.0007138252258300781, 0.001146554946899414, 0.00157928466796875, 0.002012014389038086, 0.002444744110107422, 0.002877473831176758, 0.0033102035522460938, 0.0037429332733154297, 0.004175662994384766, 0.0046083927154541016, 0.0050411224365234375, 0.0054738521575927734, 0.005906581878662109, 0.006339311599731445, 0.006772041320800781, 0.007204771041870117, 0.007637500762939453, 0.008070230484008789, 0.008502960205078125, 0.008935689926147461, 0.009368419647216797, 0.009801149368286133, 0.010233879089355469, 0.010666608810424805, 0.01109933853149414, 0.011532068252563477, 0.011964797973632812, 0.012397527694702148, 0.012830257415771484, 0.01326298713684082, 0.013695716857910156, 0.014128446578979492, 0.014561176300048828, 0.014993906021118164, 0.0154266357421875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 4.0, 2.0, 14.0, 24.0, 48.0, 65.0, 114.0, 147.0, 171.0, 138.0, 87.0, 83.0, 36.0, 15.0, 9.0, 6.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3053417205810547e-05, -1.2650154531002045e-05, -1.2246891856193542e-05, -1.184362918138504e-05, -1.1440366506576538e-05, -1.1037103831768036e-05, -1.0633841156959534e-05, -1.0230578482151031e-05, -9.82731580734253e-06, -9.424053132534027e-06, -9.020790457725525e-06, -8.617527782917023e-06, -8.21426510810852e-06, -7.811002433300018e-06, -7.407739758491516e-06, -7.004477083683014e-06, -6.601214408874512e-06, -6.1979517340660095e-06, -5.794689059257507e-06, -5.391426384449005e-06, -4.988163709640503e-06, -4.584901034832001e-06, -4.1816383600234985e-06, -3.7783756852149963e-06, -3.375113010406494e-06, -2.971850335597992e-06, -2.5685876607894897e-06, -2.1653249859809875e-06, -1.7620623111724854e-06, -1.3587996363639832e-06, -9.55536961555481e-07, -5.522742867469788e-07, -1.4901161193847656e-07, 2.5425106287002563e-07, 6.575137376785278e-07, 1.06077641248703e-06, 1.4640390872955322e-06, 1.8673017621040344e-06, 2.2705644369125366e-06, 2.673827111721039e-06, 3.077089786529541e-06, 3.4803524613380432e-06, 3.883615136146545e-06, 4.286877810955048e-06, 4.69014048576355e-06, 5.093403160572052e-06, 5.496665835380554e-06, 5.899928510189056e-06, 6.303191184997559e-06, 6.706453859806061e-06, 7.109716534614563e-06, 7.512979209423065e-06, 7.916241884231567e-06, 8.31950455904007e-06, 8.722767233848572e-06, 9.126029908657074e-06, 9.529292583465576e-06, 9.932555258274078e-06, 1.033581793308258e-05, 1.0739080607891083e-05, 1.1142343282699585e-05, 1.1545605957508087e-05, 1.194886863231659e-05, 1.2352131307125092e-05, 1.2755393981933594e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 9.0, 7.0, 10.0, 4.0, 21.0, 19.0, 25.0, 28.0, 48.0, 87.0, 124.0, 172.0, 288.0, 557.0, 1148.0, 2920.0, 10164.0, 86482.0, 907990.0, 28854.0, 5644.0, 1978.0, 867.0, 427.0, 230.0, 140.0, 88.0, 63.0, 51.0, 23.0, 20.0, 11.0, 12.0, 6.0, 10.0, 6.0, 5.0, 6.0, 1.0, 1.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00806427001953125, -0.007779240608215332, -0.007494211196899414, -0.007209181785583496, -0.006924152374267578, -0.00663912296295166, -0.006354093551635742, -0.006069064140319824, -0.005784034729003906, -0.005499005317687988, -0.00521397590637207, -0.004928946495056152, -0.004643917083740234, -0.004358887672424316, -0.0040738582611083984, -0.0037888288497924805, -0.0035037994384765625, -0.0032187700271606445, -0.0029337406158447266, -0.0026487112045288086, -0.0023636817932128906, -0.0020786523818969727, -0.0017936229705810547, -0.0015085935592651367, -0.0012235641479492188, -0.0009385347366333008, -0.0006535053253173828, -0.00036847591400146484, -8.344650268554688e-05, 0.0002015829086303711, 0.00048661231994628906, 0.000771641731262207, 0.001056671142578125, 0.001341700553894043, 0.001626729965209961, 0.001911759376525879, 0.002196788787841797, 0.002481818199157715, 0.002766847610473633, 0.0030518770217895508, 0.0033369064331054688, 0.0036219358444213867, 0.003906965255737305, 0.004191994667053223, 0.004477024078369141, 0.004762053489685059, 0.0050470829010009766, 0.0053321123123168945, 0.0056171417236328125, 0.0059021711349487305, 0.0061872005462646484, 0.006472229957580566, 0.006757259368896484, 0.007042288780212402, 0.00732731819152832, 0.007612347602844238, 0.007897377014160156, 0.008182406425476074, 0.008467435836791992, 0.00875246524810791, 0.009037494659423828, 0.009322524070739746, 0.009607553482055664, 0.009892582893371582, 0.0101776123046875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 2.0, 3.0, 4.0, 3.0, 5.0, 9.0, 17.0, 16.0, 15.0, 24.0, 27.0, 31.0, 59.0, 96.0, 146.0, 123.0, 103.0, 76.0, 61.0, 45.0, 27.0, 26.0, 18.0, 14.0, 11.0, 9.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00530242919921875, -0.005108952522277832, -0.004915475845336914, -0.004721999168395996, -0.004528522491455078, -0.00433504581451416, -0.004141569137573242, -0.003948092460632324, -0.0037546157836914062, -0.0035611391067504883, -0.0033676624298095703, -0.0031741857528686523, -0.0029807090759277344, -0.0027872323989868164, -0.0025937557220458984, -0.0024002790451049805, -0.0022068023681640625, -0.0020133256912231445, -0.0018198490142822266, -0.0016263723373413086, -0.0014328956604003906, -0.0012394189834594727, -0.0010459423065185547, -0.0008524656295776367, -0.0006589889526367188, -0.0004655122756958008, -0.0002720355987548828, -7.855892181396484e-05, 0.00011491775512695312, 0.0003083944320678711, 0.0005018711090087891, 0.000695347785949707, 0.000888824462890625, 0.001082301139831543, 0.001275777816772461, 0.001469254493713379, 0.0016627311706542969, 0.0018562078475952148, 0.002049684524536133, 0.0022431612014770508, 0.0024366378784179688, 0.0026301145553588867, 0.0028235912322998047, 0.0030170679092407227, 0.0032105445861816406, 0.0034040212631225586, 0.0035974979400634766, 0.0037909746170043945, 0.0039844512939453125, 0.0041779279708862305, 0.0043714046478271484, 0.004564881324768066, 0.004758358001708984, 0.004951834678649902, 0.00514531135559082, 0.005338788032531738, 0.005532264709472656, 0.005725741386413574, 0.005919218063354492, 0.00611269474029541, 0.006306171417236328, 0.006499648094177246, 0.006693124771118164, 0.006886601448059082, 0.007080078125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 10.0, 30.0, 67.0, 213.0, 397.0, 173.0, 51.0, 30.0, 8.0, 10.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5540460348129272, -0.5379233360290527, -0.5218006372451782, -0.5056779384613037, -0.4895552694797516, -0.47343260049819946, -0.45730990171432495, -0.44118720293045044, -0.4250645041465759, -0.4089418053627014, -0.3928191363811493, -0.3766964375972748, -0.36057373881340027, -0.34445106983184814, -0.32832837104797363, -0.3122056722640991, -0.296083003282547, -0.2799603044986725, -0.26383763551712036, -0.24771493673324585, -0.23159223794937134, -0.21546955406665802, -0.1993468701839447, -0.1832241714000702, -0.16710148751735687, -0.15097880363464355, -0.13485610485076904, -0.11873342096805573, -0.10261072963476181, -0.0864880383014679, -0.07036535441875458, -0.05424266308546066, -0.03811994194984436, -0.021997252479195595, -0.005874563008546829, 0.010248124599456787, 0.026370815932750702, 0.04249350726604462, 0.058616191148757935, 0.07473888248205185, 0.09086157381534576, 0.10698426514863968, 0.1231069564819336, 0.1392296403646469, 0.15535232424736023, 0.17147502303123474, 0.18759770691394806, 0.20372039079666138, 0.2198430895805359, 0.2359657734632492, 0.2520884573459625, 0.26821115612983704, 0.28433385491371155, 0.30045652389526367, 0.3165792226791382, 0.3327019214630127, 0.3488246202468872, 0.3649473190307617, 0.38106998801231384, 0.39719268679618835, 0.41331538558006287, 0.429438054561615, 0.4455607533454895, 0.461683452129364, 0.47780612111091614]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 13.0, 10.0, 20.0, 27.0, 21.0, 25.0, 19.0, 32.0, 35.0, 46.0, 63.0, 51.0, 74.0, 81.0, 82.0, 69.0, 51.0, 53.0, 44.0, 27.0, 39.0, 21.0, 22.0, 13.0, 19.0, 8.0, 8.0, 9.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2035682201385498, -0.1978914737701416, -0.1922147274017334, -0.1865379810333252, -0.1808612197637558, -0.1751844733953476, -0.1695077270269394, -0.1638309806585312, -0.1581542193889618, -0.1524774730205536, -0.14680072665214539, -0.14112398028373718, -0.13544721901416779, -0.12977047264575958, -0.12409372627735138, -0.11841697990894318, -0.11274023354053497, -0.10706348717212677, -0.10138673335313797, -0.09570998698472977, -0.09003323316574097, -0.08435648679733276, -0.07867974042892456, -0.07300299406051636, -0.06732624024152756, -0.061649490147829056, -0.055972740054130554, -0.05029599368572235, -0.04461924359202385, -0.03894249349832535, -0.033265747129917145, -0.027588997036218643, -0.02191224694252014, -0.01623549684882164, -0.010558748617768288, -0.004882000386714935, 0.0007947497069835663, 0.006471499800682068, 0.012148246169090271, 0.017824996262788773, 0.023501746356487274, 0.029178496450185776, 0.03485524654388428, 0.04053199291229248, 0.04620874300599098, 0.051885493099689484, 0.05756223946809769, 0.06323899328708649, 0.06891573965549469, 0.0745924860239029, 0.0802692398428917, 0.0859459862112999, 0.0916227400302887, 0.0972994863986969, 0.1029762327671051, 0.1086529791355133, 0.1143297329545021, 0.12000647932291031, 0.1256832331418991, 0.1313599795103073, 0.13703672587871552, 0.1427134871482849, 0.14839023351669312, 0.15406697988510132, 0.15974372625350952]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 3.0, 5.0, 8.0, 7.0, 8.0, 14.0, 21.0, 48.0, 79.0, 129.0, 437.0, 4192348.0, 775.0, 206.0, 74.0, 33.0, 22.0, 16.0, 11.0, 4.0, 5.0, 7.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5947265625, -0.5764846801757812, -0.5582427978515625, -0.5400009155273438, -0.521759033203125, -0.5035171508789062, -0.4852752685546875, -0.46703338623046875, -0.44879150390625, -0.43054962158203125, -0.4123077392578125, -0.39406585693359375, -0.375823974609375, -0.35758209228515625, -0.3393402099609375, -0.32109832763671875, -0.3028564453125, -0.28461456298828125, -0.2663726806640625, -0.24813079833984375, -0.229888916015625, -0.21164703369140625, -0.1934051513671875, -0.17516326904296875, -0.15692138671875, -0.13867950439453125, -0.1204376220703125, -0.10219573974609375, -0.083953857421875, -0.06571197509765625, -0.0474700927734375, -0.02922821044921875, -0.010986328125, 0.00725555419921875, 0.0254974365234375, 0.04373931884765625, 0.061981201171875, 0.08022308349609375, 0.0984649658203125, 0.11670684814453125, 0.13494873046875, 0.15319061279296875, 0.1714324951171875, 0.18967437744140625, 0.207916259765625, 0.22615814208984375, 0.2444000244140625, 0.26264190673828125, 0.2808837890625, 0.29912567138671875, 0.3173675537109375, 0.33560943603515625, 0.353851318359375, 0.37209320068359375, 0.3903350830078125, 0.40857696533203125, 0.42681884765625, 0.44506072998046875, 0.4633026123046875, 0.48154449462890625, 0.499786376953125, 0.5180282592773438, 0.5362701416015625, 0.5545120239257812, 0.57275390625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 0.0, 8.0, 4.0, 5.0, 3.0, 9.0, 10.0, 15.0, 29.0, 52.0, 152.0, 262.0, 240.0, 94.0, 35.0, 19.0, 10.0, 5.0, 12.0, 9.0, 6.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0191802978515625, -0.018573760986328125, -0.01796722412109375, -0.017360687255859375, -0.016754150390625, -0.016147613525390625, -0.01554107666015625, -0.014934539794921875, -0.0143280029296875, -0.013721466064453125, -0.01311492919921875, -0.012508392333984375, -0.01190185546875, -0.011295318603515625, -0.01068878173828125, -0.010082244873046875, -0.0094757080078125, -0.008869171142578125, -0.00826263427734375, -0.007656097412109375, -0.007049560546875, -0.006443023681640625, -0.00583648681640625, -0.005229949951171875, -0.0046234130859375, -0.004016876220703125, -0.00341033935546875, -0.002803802490234375, -0.002197265625, -0.001590728759765625, -0.00098419189453125, -0.000377655029296875, 0.0002288818359375, 0.000835418701171875, 0.00144195556640625, 0.002048492431640625, 0.002655029296875, 0.003261566162109375, 0.00386810302734375, 0.004474639892578125, 0.0050811767578125, 0.005687713623046875, 0.00629425048828125, 0.006900787353515625, 0.00750732421875, 0.008113861083984375, 0.00872039794921875, 0.009326934814453125, 0.0099334716796875, 0.010540008544921875, 0.01114654541015625, 0.011753082275390625, 0.012359619140625, 0.012966156005859375, 0.01357269287109375, 0.014179229736328125, 0.0147857666015625, 0.015392303466796875, 0.01599884033203125, 0.016605377197265625, 0.0172119140625, 0.017818450927734375, 0.01842498779296875, 0.019031524658203125, 0.0196380615234375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 9.0, 2.0, 6.0, 3.0, 10.0, 16.0, 30.0, 43.0, 49.0, 90.0, 147.0, 262.0, 445.0, 881.0, 1872.0, 5632.0, 34491.0, 3817566.0, 305870.0, 19430.0, 4409.0, 1510.0, 655.0, 322.0, 206.0, 113.0, 73.0, 43.0, 32.0, 28.0, 20.0, 5.0, 7.0, 5.0, 3.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0262603759765625, -0.025546789169311523, -0.024833202362060547, -0.02411961555480957, -0.023406028747558594, -0.022692441940307617, -0.02197885513305664, -0.021265268325805664, -0.020551681518554688, -0.01983809471130371, -0.019124507904052734, -0.018410921096801758, -0.01769733428955078, -0.016983747482299805, -0.016270160675048828, -0.015556573867797852, -0.014842987060546875, -0.014129400253295898, -0.013415813446044922, -0.012702226638793945, -0.011988639831542969, -0.011275053024291992, -0.010561466217041016, -0.009847879409790039, -0.009134292602539062, -0.008420705795288086, -0.007707118988037109, -0.006993532180786133, -0.006279945373535156, -0.00556635856628418, -0.004852771759033203, -0.0041391849517822266, -0.00342559814453125, -0.0027120113372802734, -0.001998424530029297, -0.0012848377227783203, -0.0005712509155273438, 0.0001423358917236328, 0.0008559226989746094, 0.001569509506225586, 0.0022830963134765625, 0.002996683120727539, 0.0037102699279785156, 0.004423856735229492, 0.005137443542480469, 0.005851030349731445, 0.006564617156982422, 0.0072782039642333984, 0.007991790771484375, 0.008705377578735352, 0.009418964385986328, 0.010132551193237305, 0.010846138000488281, 0.011559724807739258, 0.012273311614990234, 0.012986898422241211, 0.013700485229492188, 0.014414072036743164, 0.01512765884399414, 0.015841245651245117, 0.016554832458496094, 0.01726841926574707, 0.017982006072998047, 0.018695592880249023, 0.0194091796875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 4.0, 14.0, 14.0, 23.0, 34.0, 70.0, 188.0, 703.0, 1956.0, 629.0, 187.0, 74.0, 42.0, 31.0, 23.0, 17.0, 13.0, 12.0, 15.0, 7.0, 4.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0218658447265625, -0.021325230598449707, -0.020784616470336914, -0.02024400234222412, -0.019703388214111328, -0.019162774085998535, -0.018622159957885742, -0.01808154582977295, -0.017540931701660156, -0.017000317573547363, -0.01645970344543457, -0.015919089317321777, -0.015378475189208984, -0.014837861061096191, -0.014297246932983398, -0.013756632804870605, -0.013216018676757812, -0.01267540454864502, -0.012134790420532227, -0.011594176292419434, -0.01105356216430664, -0.010512948036193848, -0.009972333908081055, -0.009431719779968262, -0.008891105651855469, -0.008350491523742676, -0.007809877395629883, -0.00726926326751709, -0.006728649139404297, -0.006188035011291504, -0.005647420883178711, -0.005106806755065918, -0.004566192626953125, -0.004025578498840332, -0.003484964370727539, -0.002944350242614746, -0.002403736114501953, -0.0018631219863891602, -0.0013225078582763672, -0.0007818937301635742, -0.00024127960205078125, 0.0002993345260620117, 0.0008399486541748047, 0.0013805627822875977, 0.0019211769104003906, 0.0024617910385131836, 0.0030024051666259766, 0.0035430192947387695, 0.0040836334228515625, 0.0046242475509643555, 0.0051648616790771484, 0.005705475807189941, 0.006246089935302734, 0.006786704063415527, 0.00732731819152832, 0.007867932319641113, 0.008408546447753906, 0.0089491605758667, 0.009489774703979492, 0.010030388832092285, 0.010571002960205078, 0.011111617088317871, 0.011652231216430664, 0.012192845344543457, 0.01273345947265625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 15.0, 17.0, 43.0, 93.0, 159.0, 251.0, 167.0, 83.0, 59.0, 37.0, 23.0, 12.0, 4.0, 11.0, 6.0, 8.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07211392372846603, -0.06743697077035904, -0.06276002526283264, -0.05808307230472565, -0.05340611934661865, -0.04872916638851166, -0.04405221715569496, -0.039375267922878265, -0.03469831496477127, -0.030021363869309425, -0.02534441277384758, -0.020667461678385735, -0.01599051058292389, -0.011313559487462044, -0.006636608392000198, -0.001959659159183502, 0.0027172937989234924, 0.007394244894385338, 0.012071195989847183, 0.01674814708530903, 0.021425098180770874, 0.02610204927623272, 0.030779000371694565, 0.03545594960451126, 0.040132902562618256, 0.04480985552072525, 0.049486804753541946, 0.05416375398635864, 0.05884070694446564, 0.06351765990257263, 0.06819461286067963, 0.07287155836820602, 0.07754851877689362, 0.08222547173500061, 0.0869024246931076, 0.091579370200634, 0.096256323158741, 0.10093327611684799, 0.10561022162437439, 0.11028717458248138, 0.11496412754058838, 0.11964108049869537, 0.12431803345680237, 0.12899498641490936, 0.13367193937301636, 0.13834887742996216, 0.14302583038806915, 0.14770278334617615, 0.15237973630428314, 0.15705668926239014, 0.16173364222049713, 0.16641059517860413, 0.17108753323554993, 0.17576448619365692, 0.18044143915176392, 0.1851183921098709, 0.1897953450679779, 0.1944722980260849, 0.1991492509841919, 0.2038262039422989, 0.20850315690040588, 0.21318009495735168, 0.21785704791545868, 0.22253400087356567, 0.22721095383167267]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 7.0, 6.0, 8.0, 10.0, 12.0, 18.0, 18.0, 25.0, 18.0, 25.0, 25.0, 37.0, 47.0, 35.0, 54.0, 31.0, 53.0, 35.0, 41.0, 51.0, 48.0, 38.0, 45.0, 47.0, 29.0, 40.0, 22.0, 27.0, 20.0, 26.0, 14.0, 13.0, 15.0, 17.0, 10.0, 10.0, 11.0, 5.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.045414865016937256, -0.043896742165088654, -0.04237861931324005, -0.04086049273610115, -0.03934236988425255, -0.037824247032403946, -0.036306120455265045, -0.03478799760341644, -0.03326987475156784, -0.03175175189971924, -0.030233627185225487, -0.028715502470731735, -0.027197379618883133, -0.02567925676703453, -0.02416113205254078, -0.022643007338047028, -0.021124884486198425, -0.019606761634349823, -0.01808863691985607, -0.01657051220536232, -0.015052389353513718, -0.01353426557034254, -0.012016141787171364, -0.010498018004000187, -0.00897989422082901, -0.007461770437657833, -0.005943646654486656, -0.004425522871315479, -0.0029073990881443024, -0.0013892753049731255, 0.00012884847819805145, 0.0016469722613692284, 0.0031650960445404053, 0.004683219827711582, 0.006201343610882759, 0.007719467394053936, 0.009237591177225113, 0.01075571496039629, 0.012273838743567467, 0.013791962526738644, 0.01531008630990982, 0.016828209161758423, 0.018346333876252174, 0.019864458590745926, 0.021382581442594528, 0.02290070429444313, 0.024418829008936882, 0.025936953723430634, 0.027455076575279236, 0.028973199427127838, 0.03049132414162159, 0.03200944885611534, 0.033527571707963943, 0.035045694559812546, 0.03656382113695145, 0.03808194398880005, 0.03960006684064865, 0.04111818969249725, 0.042636312544345856, 0.044154439121484756, 0.04567256197333336, 0.04719068482518196, 0.04870881140232086, 0.050226934254169464, 0.051745057106018066]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 8.0, 18.0, 8.0, 20.0, 25.0, 41.0, 66.0, 104.0, 139.0, 199.0, 304.0, 554.0, 854.0, 1535.0, 3164.0, 7040.0, 20571.0, 139274.0, 778100.0, 70024.0, 14837.0, 5573.0, 2582.0, 1420.0, 731.0, 507.0, 295.0, 174.0, 131.0, 75.0, 41.0, 39.0, 31.0, 11.0, 19.0, 7.0, 10.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03240966796875, -0.03137636184692383, -0.030343055725097656, -0.029309749603271484, -0.028276443481445312, -0.02724313735961914, -0.02620983123779297, -0.025176525115966797, -0.024143218994140625, -0.023109912872314453, -0.02207660675048828, -0.02104330062866211, -0.020009994506835938, -0.018976688385009766, -0.017943382263183594, -0.016910076141357422, -0.01587677001953125, -0.014843463897705078, -0.013810157775878906, -0.012776851654052734, -0.011743545532226562, -0.01071023941040039, -0.009676933288574219, -0.008643627166748047, -0.007610321044921875, -0.006577014923095703, -0.005543708801269531, -0.004510402679443359, -0.0034770965576171875, -0.0024437904357910156, -0.0014104843139648438, -0.0003771781921386719, 0.0006561279296875, 0.0016894340515136719, 0.0027227401733398438, 0.0037560462951660156, 0.0047893524169921875, 0.005822658538818359, 0.006855964660644531, 0.007889270782470703, 0.008922576904296875, 0.009955883026123047, 0.010989189147949219, 0.01202249526977539, 0.013055801391601562, 0.014089107513427734, 0.015122413635253906, 0.016155719757080078, 0.01718902587890625, 0.018222332000732422, 0.019255638122558594, 0.020288944244384766, 0.021322250366210938, 0.02235555648803711, 0.02338886260986328, 0.024422168731689453, 0.025455474853515625, 0.026488780975341797, 0.02752208709716797, 0.02855539321899414, 0.029588699340820312, 0.030622005462646484, 0.031655311584472656, 0.03268861770629883, 0.033721923828125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 2.0, 2.0, 5.0, 4.0, 3.0, 4.0, 9.0, 11.0, 15.0, 31.0, 69.0, 178.0, 266.0, 199.0, 89.0, 37.0, 16.0, 11.0, 7.0, 12.0, 5.0, 8.0, 3.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01885986328125, -0.018260955810546875, -0.01766204833984375, -0.017063140869140625, -0.0164642333984375, -0.015865325927734375, -0.01526641845703125, -0.014667510986328125, -0.014068603515625, -0.013469696044921875, -0.01287078857421875, -0.012271881103515625, -0.0116729736328125, -0.011074066162109375, -0.01047515869140625, -0.009876251220703125, -0.00927734375, -0.008678436279296875, -0.00807952880859375, -0.007480621337890625, -0.0068817138671875, -0.006282806396484375, -0.00568389892578125, -0.005084991455078125, -0.004486083984375, -0.003887176513671875, -0.00328826904296875, -0.002689361572265625, -0.0020904541015625, -0.001491546630859375, -0.00089263916015625, -0.000293731689453125, 0.00030517578125, 0.000904083251953125, 0.00150299072265625, 0.002101898193359375, 0.0027008056640625, 0.003299713134765625, 0.00389862060546875, 0.004497528076171875, 0.005096435546875, 0.005695343017578125, 0.00629425048828125, 0.006893157958984375, 0.0074920654296875, 0.008090972900390625, 0.00868988037109375, 0.009288787841796875, 0.0098876953125, 0.010486602783203125, 0.01108551025390625, 0.011684417724609375, 0.0122833251953125, 0.012882232666015625, 0.01348114013671875, 0.014080047607421875, 0.014678955078125, 0.015277862548828125, 0.01587677001953125, 0.016475677490234375, 0.0170745849609375, 0.017673492431640625, 0.01827239990234375, 0.018871307373046875, 0.01947021484375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 4.0, 9.0, 7.0, 8.0, 5.0, 12.0, 28.0, 26.0, 31.0, 35.0, 58.0, 85.0, 121.0, 139.0, 247.0, 320.0, 533.0, 864.0, 1603.0, 3561.0, 9350.0, 32708.0, 178791.0, 665786.0, 116259.0, 23941.0, 7422.0, 2943.0, 1382.0, 752.0, 464.0, 295.0, 221.0, 152.0, 119.0, 68.0, 51.0, 44.0, 33.0, 20.0, 14.0, 16.0, 13.0, 9.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0257568359375, -0.024780750274658203, -0.023804664611816406, -0.02282857894897461, -0.021852493286132812, -0.020876407623291016, -0.01990032196044922, -0.018924236297607422, -0.017948150634765625, -0.016972064971923828, -0.01599597930908203, -0.015019893646240234, -0.014043807983398438, -0.01306772232055664, -0.012091636657714844, -0.011115550994873047, -0.01013946533203125, -0.009163379669189453, -0.008187294006347656, -0.007211208343505859, -0.0062351226806640625, -0.005259037017822266, -0.004282951354980469, -0.003306865692138672, -0.002330780029296875, -0.0013546943664550781, -0.00037860870361328125, 0.0005974769592285156, 0.0015735626220703125, 0.0025496482849121094, 0.0035257339477539062, 0.004501819610595703, 0.0054779052734375, 0.006453990936279297, 0.007430076599121094, 0.00840616226196289, 0.009382247924804688, 0.010358333587646484, 0.011334419250488281, 0.012310504913330078, 0.013286590576171875, 0.014262676239013672, 0.015238761901855469, 0.016214847564697266, 0.017190933227539062, 0.01816701889038086, 0.019143104553222656, 0.020119190216064453, 0.02109527587890625, 0.022071361541748047, 0.023047447204589844, 0.02402353286743164, 0.024999618530273438, 0.025975704193115234, 0.02695178985595703, 0.027927875518798828, 0.028903961181640625, 0.029880046844482422, 0.03085613250732422, 0.031832218170166016, 0.03280830383300781, 0.03378438949584961, 0.034760475158691406, 0.0357365608215332, 0.036712646484375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 4.0, 8.0, 3.0, 4.0, 8.0, 12.0, 10.0, 15.0, 19.0, 18.0, 16.0, 16.0, 33.0, 37.0, 30.0, 47.0, 27.0, 43.0, 48.0, 40.0, 51.0, 45.0, 56.0, 55.0, 37.0, 34.0, 26.0, 25.0, 33.0, 37.0, 26.0, 19.0, 22.0, 10.0, 12.0, 11.0, 7.0, 11.0, 10.0, 9.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 5.0, 3.0, 0.0, 1.0], "bins": [-0.033233642578125, -0.03226876258850098, -0.03130388259887695, -0.03033900260925293, -0.029374122619628906, -0.028409242630004883, -0.02744436264038086, -0.026479482650756836, -0.025514602661132812, -0.02454972267150879, -0.023584842681884766, -0.022619962692260742, -0.02165508270263672, -0.020690202713012695, -0.019725322723388672, -0.01876044273376465, -0.017795562744140625, -0.0168306827545166, -0.015865802764892578, -0.014900922775268555, -0.013936042785644531, -0.012971162796020508, -0.012006282806396484, -0.011041402816772461, -0.010076522827148438, -0.009111642837524414, -0.00814676284790039, -0.007181882858276367, -0.006217002868652344, -0.00525212287902832, -0.004287242889404297, -0.0033223628997802734, -0.00235748291015625, -0.0013926029205322266, -0.0004277229309082031, 0.0005371570587158203, 0.0015020370483398438, 0.002466917037963867, 0.0034317970275878906, 0.004396677017211914, 0.0053615570068359375, 0.006326436996459961, 0.007291316986083984, 0.008256196975708008, 0.009221076965332031, 0.010185956954956055, 0.011150836944580078, 0.012115716934204102, 0.013080596923828125, 0.014045476913452148, 0.015010356903076172, 0.015975236892700195, 0.01694011688232422, 0.017904996871948242, 0.018869876861572266, 0.01983475685119629, 0.020799636840820312, 0.021764516830444336, 0.02272939682006836, 0.023694276809692383, 0.024659156799316406, 0.02562403678894043, 0.026588916778564453, 0.027553796768188477, 0.0285186767578125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 4.0, 10.0, 11.0, 21.0, 22.0, 36.0, 73.0, 179.0, 325.0, 679.0, 1713.0, 5350.0, 47308.0, 971538.0, 15670.0, 3340.0, 1184.0, 537.0, 253.0, 118.0, 60.0, 45.0, 16.0, 15.0, 9.0, 12.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0304412841796875, -0.02952742576599121, -0.028613567352294922, -0.027699708938598633, -0.026785850524902344, -0.025871992111206055, -0.024958133697509766, -0.024044275283813477, -0.023130416870117188, -0.0222165584564209, -0.02130270004272461, -0.02038884162902832, -0.01947498321533203, -0.018561124801635742, -0.017647266387939453, -0.016733407974243164, -0.015819549560546875, -0.014905691146850586, -0.013991832733154297, -0.013077974319458008, -0.012164115905761719, -0.01125025749206543, -0.01033639907836914, -0.009422540664672852, -0.008508682250976562, -0.0075948238372802734, -0.006680965423583984, -0.005767107009887695, -0.004853248596191406, -0.003939390182495117, -0.003025531768798828, -0.002111673355102539, -0.00119781494140625, -0.00028395652770996094, 0.0006299018859863281, 0.0015437602996826172, 0.0024576187133789062, 0.0033714771270751953, 0.004285335540771484, 0.0051991939544677734, 0.0061130523681640625, 0.0070269107818603516, 0.00794076919555664, 0.00885462760925293, 0.009768486022949219, 0.010682344436645508, 0.011596202850341797, 0.012510061264038086, 0.013423919677734375, 0.014337778091430664, 0.015251636505126953, 0.016165494918823242, 0.01707935333251953, 0.01799321174621582, 0.01890707015991211, 0.0198209285736084, 0.020734786987304688, 0.021648645401000977, 0.022562503814697266, 0.023476362228393555, 0.024390220642089844, 0.025304079055786133, 0.026217937469482422, 0.02713179588317871, 0.028045654296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 8.0, 3.0, 9.0, 10.0, 12.0, 26.0, 13.0, 23.0, 27.0, 32.0, 26.0, 60.0, 57.0, 62.0, 70.0, 63.0, 57.0, 75.0, 57.0, 58.0, 52.0, 39.0, 28.0, 21.0, 16.0, 17.0, 17.0, 7.0, 13.0, 5.0, 3.0, 4.0, 3.0, 3.0, 3.0, 5.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.271766662597656e-06, -7.038004696369171e-06, -6.804242730140686e-06, -6.570480763912201e-06, -6.336718797683716e-06, -6.102956831455231e-06, -5.869194865226746e-06, -5.6354328989982605e-06, -5.401670932769775e-06, -5.16790896654129e-06, -4.934147000312805e-06, -4.70038503408432e-06, -4.466623067855835e-06, -4.23286110162735e-06, -3.999099135398865e-06, -3.7653371691703796e-06, -3.5315752029418945e-06, -3.2978132367134094e-06, -3.0640512704849243e-06, -2.830289304256439e-06, -2.596527338027954e-06, -2.362765371799469e-06, -2.129003405570984e-06, -1.8952414393424988e-06, -1.6614794731140137e-06, -1.4277175068855286e-06, -1.1939555406570435e-06, -9.601935744285583e-07, -7.264316082000732e-07, -4.926696419715881e-07, -2.5890767574310303e-07, -2.514570951461792e-08, 2.086162567138672e-07, 4.423782229423523e-07, 6.761401891708374e-07, 9.099021553993225e-07, 1.1436641216278076e-06, 1.3774260878562927e-06, 1.6111880540847778e-06, 1.844950020313263e-06, 2.078711986541748e-06, 2.312473952770233e-06, 2.5462359189987183e-06, 2.7799978852272034e-06, 3.0137598514556885e-06, 3.2475218176841736e-06, 3.4812837839126587e-06, 3.715045750141144e-06, 3.948807716369629e-06, 4.182569682598114e-06, 4.416331648826599e-06, 4.650093615055084e-06, 4.883855581283569e-06, 5.1176175475120544e-06, 5.3513795137405396e-06, 5.585141479969025e-06, 5.81890344619751e-06, 6.052665412425995e-06, 6.28642737865448e-06, 6.520189344882965e-06, 6.75395131111145e-06, 6.987713277339935e-06, 7.22147524356842e-06, 7.4552372097969055e-06, 7.68899917602539e-06]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 7.0, 5.0, 1.0, 4.0, 2.0, 10.0, 13.0, 15.0, 20.0, 25.0, 30.0, 51.0, 59.0, 103.0, 180.0, 289.0, 529.0, 945.0, 1971.0, 5002.0, 26676.0, 977926.0, 25490.0, 4857.0, 2008.0, 987.0, 539.0, 264.0, 167.0, 115.0, 61.0, 53.0, 39.0, 30.0, 19.0, 13.0, 10.0, 9.0, 19.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.031402587890625, -0.0305178165435791, -0.029633045196533203, -0.028748273849487305, -0.027863502502441406, -0.026978731155395508, -0.02609395980834961, -0.02520918846130371, -0.024324417114257812, -0.023439645767211914, -0.022554874420166016, -0.021670103073120117, -0.02078533172607422, -0.01990056037902832, -0.019015789031982422, -0.018131017684936523, -0.017246246337890625, -0.016361474990844727, -0.015476703643798828, -0.01459193229675293, -0.013707160949707031, -0.012822389602661133, -0.011937618255615234, -0.011052846908569336, -0.010168075561523438, -0.009283304214477539, -0.00839853286743164, -0.007513761520385742, -0.006628990173339844, -0.005744218826293945, -0.004859447479248047, -0.0039746761322021484, -0.00308990478515625, -0.0022051334381103516, -0.0013203620910644531, -0.0004355907440185547, 0.00044918060302734375, 0.0013339519500732422, 0.0022187232971191406, 0.003103494644165039, 0.0039882659912109375, 0.004873037338256836, 0.005757808685302734, 0.006642580032348633, 0.007527351379394531, 0.00841212272644043, 0.009296894073486328, 0.010181665420532227, 0.011066436767578125, 0.011951208114624023, 0.012835979461669922, 0.01372075080871582, 0.014605522155761719, 0.015490293502807617, 0.016375064849853516, 0.017259836196899414, 0.018144607543945312, 0.01902937889099121, 0.01991415023803711, 0.020798921585083008, 0.021683692932128906, 0.022568464279174805, 0.023453235626220703, 0.0243380069732666, 0.0252227783203125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 2.0, 3.0, 6.0, 6.0, 14.0, 16.0, 50.0, 83.0, 237.0, 306.0, 142.0, 56.0, 24.0, 13.0, 10.0, 6.0, 6.0, 3.0, 0.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02752685546875, -0.026698827743530273, -0.025870800018310547, -0.02504277229309082, -0.024214744567871094, -0.023386716842651367, -0.02255868911743164, -0.021730661392211914, -0.020902633666992188, -0.02007460594177246, -0.019246578216552734, -0.018418550491333008, -0.01759052276611328, -0.016762495040893555, -0.015934467315673828, -0.015106439590454102, -0.014278411865234375, -0.013450384140014648, -0.012622356414794922, -0.011794328689575195, -0.010966300964355469, -0.010138273239135742, -0.009310245513916016, -0.008482217788696289, -0.0076541900634765625, -0.006826162338256836, -0.005998134613037109, -0.005170106887817383, -0.004342079162597656, -0.0035140514373779297, -0.002686023712158203, -0.0018579959869384766, -0.00102996826171875, -0.00020194053649902344, 0.0006260871887207031, 0.0014541149139404297, 0.0022821426391601562, 0.003110170364379883, 0.003938198089599609, 0.004766225814819336, 0.0055942535400390625, 0.006422281265258789, 0.007250308990478516, 0.008078336715698242, 0.008906364440917969, 0.009734392166137695, 0.010562419891357422, 0.011390447616577148, 0.012218475341796875, 0.013046503067016602, 0.013874530792236328, 0.014702558517456055, 0.015530586242675781, 0.016358613967895508, 0.017186641693115234, 0.01801466941833496, 0.018842697143554688, 0.019670724868774414, 0.02049875259399414, 0.021326780319213867, 0.022154808044433594, 0.02298283576965332, 0.023810863494873047, 0.024638891220092773, 0.0254669189453125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 1.0, 4.0, 1.0, 4.0, 9.0, 33.0, 52.0, 178.0, 371.0, 208.0, 90.0, 20.0, 17.0, 7.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6343634724617004, -0.616607129573822, -0.5988508462905884, -0.58109450340271, -0.5633381605148315, -0.5455818176269531, -0.5278254747390747, -0.5100691914558411, -0.49231284856796265, -0.47455650568008423, -0.4568001925945282, -0.43904387950897217, -0.42128753662109375, -0.40353119373321533, -0.3857748806476593, -0.36801856756210327, -0.35026222467422485, -0.33250588178634644, -0.3147495687007904, -0.2969932556152344, -0.27923691272735596, -0.26148056983947754, -0.2437242567539215, -0.22596792876720428, -0.20821160078048706, -0.19045527279376984, -0.1726989448070526, -0.1549426168203354, -0.13718628883361816, -0.11942996084690094, -0.10167363286018372, -0.08391730487346649, -0.06616097688674927, -0.04840464890003204, -0.03064832091331482, -0.012891992926597595, 0.004864335060119629, 0.022620663046836853, 0.04037699103355408, 0.0581333190202713, 0.07588964700698853, 0.09364597499370575, 0.11140230298042297, 0.1291586309671402, 0.14691495895385742, 0.16467128694057465, 0.18242761492729187, 0.2001839429140091, 0.21794027090072632, 0.23569659888744354, 0.25345292687416077, 0.2712092399597168, 0.2889655828475952, 0.30672192573547363, 0.32447823882102966, 0.3422345519065857, 0.3599908947944641, 0.37774723768234253, 0.39550355076789856, 0.4132598638534546, 0.431016206741333, 0.4487725496292114, 0.46652886271476746, 0.4842851758003235, 0.5020415186882019]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 9.0, 5.0, 6.0, 10.0, 7.0, 5.0, 5.0, 17.0, 15.0, 13.0, 24.0, 20.0, 23.0, 28.0, 30.0, 26.0, 35.0, 39.0, 45.0, 61.0, 62.0, 61.0, 61.0, 48.0, 41.0, 34.0, 27.0, 33.0, 24.0, 25.0, 20.0, 24.0, 11.0, 21.0, 19.0, 14.0, 8.0, 12.0, 11.0, 10.0, 6.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13028067350387573, -0.12612950801849365, -0.12197835743427277, -0.11782719939947128, -0.1136760413646698, -0.10952488332986832, -0.10537372529506683, -0.10122256726026535, -0.09707140922546387, -0.09292025119066238, -0.0887690931558609, -0.08461793512105942, -0.08046677708625793, -0.07631561905145645, -0.07216446101665497, -0.06801330298185349, -0.063862144947052, -0.05971098691225052, -0.055559828877449036, -0.05140867084264755, -0.04725751280784607, -0.043106354773044586, -0.0389551967382431, -0.03480403870344162, -0.030652880668640137, -0.026501722633838654, -0.02235056459903717, -0.018199406564235687, -0.014048248529434204, -0.009897090494632721, -0.005745932459831238, -0.0015947744250297546, 0.0025563836097717285, 0.006707541644573212, 0.010858699679374695, 0.015009857714176178, 0.01916101574897766, 0.023312173783779144, 0.027463331818580627, 0.03161448985338211, 0.035765647888183594, 0.03991680592298508, 0.04406796395778656, 0.04821912199258804, 0.052370280027389526, 0.05652143806219101, 0.06067259609699249, 0.06482375413179398, 0.06897491216659546, 0.07312607020139694, 0.07727722823619843, 0.08142838627099991, 0.08557954430580139, 0.08973070234060287, 0.09388186037540436, 0.09803301841020584, 0.10218417644500732, 0.10633533447980881, 0.11048649251461029, 0.11463765054941177, 0.11878880858421326, 0.12293996661901474, 0.12709112465381622, 0.1312422752380371, 0.1353934407234192]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 9.0, 10.0, 16.0, 8.0, 13.0, 24.0, 30.0, 54.0, 96.0, 245.0, 1013.0, 60016.0, 4127823.0, 4147.0, 410.0, 159.0, 83.0, 45.0, 31.0, 14.0, 8.0, 8.0, 5.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07965087890625, -0.07756757736206055, -0.0754842758178711, -0.07340097427368164, -0.07131767272949219, -0.06923437118530273, -0.06715106964111328, -0.06506776809692383, -0.06298446655273438, -0.06090116500854492, -0.05881786346435547, -0.056734561920166016, -0.05465126037597656, -0.05256795883178711, -0.050484657287597656, -0.0484013557434082, -0.04631805419921875, -0.0442347526550293, -0.042151451110839844, -0.04006814956665039, -0.03798484802246094, -0.035901546478271484, -0.03381824493408203, -0.03173494338989258, -0.029651641845703125, -0.027568340301513672, -0.02548503875732422, -0.023401737213134766, -0.021318435668945312, -0.01923513412475586, -0.017151832580566406, -0.015068531036376953, -0.0129852294921875, -0.010901927947998047, -0.008818626403808594, -0.006735324859619141, -0.0046520233154296875, -0.0025687217712402344, -0.00048542022705078125, 0.0015978813171386719, 0.003681182861328125, 0.005764484405517578, 0.007847785949707031, 0.009931087493896484, 0.012014389038085938, 0.01409769058227539, 0.016180992126464844, 0.018264293670654297, 0.02034759521484375, 0.022430896759033203, 0.024514198303222656, 0.02659749984741211, 0.028680801391601562, 0.030764102935791016, 0.03284740447998047, 0.03493070602416992, 0.037014007568359375, 0.03909730911254883, 0.04118061065673828, 0.043263912200927734, 0.04534721374511719, 0.04743051528930664, 0.049513816833496094, 0.05159711837768555, 0.053680419921875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 3.0, 3.0, 7.0, 11.0, 20.0, 32.0, 57.0, 79.0, 150.0, 158.0, 171.0, 124.0, 71.0, 31.0, 22.0, 17.0, 10.0, 7.0, 7.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0189666748046875, -0.018368005752563477, -0.017769336700439453, -0.01717066764831543, -0.016571998596191406, -0.015973329544067383, -0.01537466049194336, -0.014775991439819336, -0.014177322387695312, -0.013578653335571289, -0.012979984283447266, -0.012381315231323242, -0.011782646179199219, -0.011183977127075195, -0.010585308074951172, -0.009986639022827148, -0.009387969970703125, -0.008789300918579102, -0.008190631866455078, -0.007591962814331055, -0.006993293762207031, -0.006394624710083008, -0.005795955657958984, -0.005197286605834961, -0.0045986175537109375, -0.003999948501586914, -0.0034012794494628906, -0.002802610397338867, -0.0022039413452148438, -0.0016052722930908203, -0.0010066032409667969, -0.00040793418884277344, 0.00019073486328125, 0.0007894039154052734, 0.0013880729675292969, 0.0019867420196533203, 0.0025854110717773438, 0.003184080123901367, 0.0037827491760253906, 0.004381418228149414, 0.0049800872802734375, 0.005578756332397461, 0.006177425384521484, 0.006776094436645508, 0.007374763488769531, 0.007973432540893555, 0.008572101593017578, 0.009170770645141602, 0.009769439697265625, 0.010368108749389648, 0.010966777801513672, 0.011565446853637695, 0.012164115905761719, 0.012762784957885742, 0.013361454010009766, 0.013960123062133789, 0.014558792114257812, 0.015157461166381836, 0.01575613021850586, 0.016354799270629883, 0.016953468322753906, 0.01755213737487793, 0.018150806427001953, 0.018749475479125977, 0.01934814453125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 15.0, 35.0, 59.0, 118.0, 184.0, 569.0, 4109.0, 143041.0, 4024358.0, 18324.0, 2196.0, 534.0, 259.0, 176.0, 109.0, 73.0, 38.0, 27.0, 11.0, 13.0, 4.0, 9.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.047393798828125, -0.04592275619506836, -0.04445171356201172, -0.04298067092895508, -0.04150962829589844, -0.0400385856628418, -0.038567543029785156, -0.037096500396728516, -0.035625457763671875, -0.034154415130615234, -0.032683372497558594, -0.031212329864501953, -0.029741287231445312, -0.028270244598388672, -0.02679920196533203, -0.02532815933227539, -0.02385711669921875, -0.02238607406616211, -0.02091503143310547, -0.019443988800048828, -0.017972946166992188, -0.016501903533935547, -0.015030860900878906, -0.013559818267822266, -0.012088775634765625, -0.010617733001708984, -0.009146690368652344, -0.007675647735595703, -0.0062046051025390625, -0.004733562469482422, -0.0032625198364257812, -0.0017914772033691406, -0.0003204345703125, 0.0011506080627441406, 0.0026216506958007812, 0.004092693328857422, 0.0055637359619140625, 0.007034778594970703, 0.008505821228027344, 0.009976863861083984, 0.011447906494140625, 0.012918949127197266, 0.014389991760253906, 0.015861034393310547, 0.017332077026367188, 0.018803119659423828, 0.02027416229248047, 0.02174520492553711, 0.02321624755859375, 0.02468729019165039, 0.02615833282470703, 0.027629375457763672, 0.029100418090820312, 0.030571460723876953, 0.032042503356933594, 0.033513545989990234, 0.034984588623046875, 0.036455631256103516, 0.037926673889160156, 0.0393977165222168, 0.04086875915527344, 0.04233980178833008, 0.04381084442138672, 0.04528188705444336, 0.0467529296875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 7.0, 20.0, 32.0, 78.0, 278.0, 1510.0, 1567.0, 302.0, 107.0, 61.0, 32.0, 20.0, 20.0, 8.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0128021240234375, -0.011816740036010742, -0.010831356048583984, -0.009845972061157227, -0.008860588073730469, -0.007875204086303711, -0.006889820098876953, -0.005904436111450195, -0.0049190521240234375, -0.00393366813659668, -0.002948284149169922, -0.001962900161743164, -0.0009775161743164062, 7.867813110351562e-06, 0.0009932518005371094, 0.001978635787963867, 0.002964019775390625, 0.003949403762817383, 0.004934787750244141, 0.0059201717376708984, 0.006905555725097656, 0.007890939712524414, 0.008876323699951172, 0.00986170768737793, 0.010847091674804688, 0.011832475662231445, 0.012817859649658203, 0.013803243637084961, 0.014788627624511719, 0.015774011611938477, 0.016759395599365234, 0.017744779586791992, 0.01873016357421875, 0.019715547561645508, 0.020700931549072266, 0.021686315536499023, 0.02267169952392578, 0.02365708351135254, 0.024642467498779297, 0.025627851486206055, 0.026613235473632812, 0.02759861946105957, 0.028584003448486328, 0.029569387435913086, 0.030554771423339844, 0.0315401554107666, 0.03252553939819336, 0.03351092338562012, 0.034496307373046875, 0.03548169136047363, 0.03646707534790039, 0.03745245933532715, 0.038437843322753906, 0.039423227310180664, 0.04040861129760742, 0.04139399528503418, 0.04237937927246094, 0.043364763259887695, 0.04435014724731445, 0.04533553123474121, 0.04632091522216797, 0.04730629920959473, 0.048291683197021484, 0.04927706718444824, 0.050262451171875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 6.0, 10.0, 17.0, 63.0, 213.0, 304.0, 188.0, 100.0, 46.0, 22.0, 14.0, 5.0, 5.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11292285472154617, -0.10438553988933563, -0.09584823250770569, -0.08731091767549515, -0.0787736028432846, -0.07023629546165466, -0.06169898062944412, -0.05316166952252388, -0.04462435841560364, -0.036087047308683395, -0.027549734339118004, -0.019012421369552612, -0.01047511026263237, -0.0019377991557121277, 0.006599515676498413, 0.015136826783418655, 0.023674137890338898, 0.03221144899725914, 0.04074876010417938, 0.04928607493638992, 0.057823386043310165, 0.06636069715023041, 0.07489801198244095, 0.08343532681465149, 0.09197263419628143, 0.10050994902849197, 0.10904725641012192, 0.11758457124233246, 0.1261218786239624, 0.13465920090675354, 0.14319650828838348, 0.15173381567001343, 0.16027113795280457, 0.1688084453344345, 0.17734576761722565, 0.1858830749988556, 0.19442038238048553, 0.20295768976211548, 0.21149501204490662, 0.22003231942653656, 0.2285696268081665, 0.23710693418979645, 0.24564425647258759, 0.25418156385421753, 0.26271888613700867, 0.2712561786174774, 0.27979350090026855, 0.2883308231830597, 0.29686814546585083, 0.30540546774864197, 0.3139427602291107, 0.32248008251190186, 0.331017404794693, 0.33955469727516174, 0.3480920195579529, 0.356629341840744, 0.36516663432121277, 0.3737039566040039, 0.38224124908447266, 0.3907785713672638, 0.39931589365005493, 0.4078531861305237, 0.4163905084133148, 0.42492783069610596, 0.4334651231765747]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 7.0, 5.0, 8.0, 14.0, 13.0, 26.0, 19.0, 18.0, 23.0, 36.0, 39.0, 49.0, 38.0, 49.0, 41.0, 37.0, 48.0, 54.0, 53.0, 30.0, 46.0, 40.0, 46.0, 23.0, 26.0, 28.0, 36.0, 30.0, 23.0, 9.0, 12.0, 8.0, 14.0, 9.0, 10.0, 6.0, 8.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.11703497171401978, -0.11370910704135895, -0.11038324236869812, -0.10705737769603729, -0.10373151302337646, -0.10040564835071564, -0.0970797911286354, -0.09375392645597458, -0.09042806178331375, -0.08710219711065292, -0.0837763324379921, -0.08045046776533127, -0.07712461054325104, -0.07379874587059021, -0.07047288119792938, -0.06714701652526855, -0.06382115185260773, -0.0604952871799469, -0.05716942250728607, -0.05384356155991554, -0.050517696887254715, -0.04719183221459389, -0.04386597126722336, -0.04054010659456253, -0.0372142419219017, -0.033888377249240875, -0.030562514439225197, -0.02723665162920952, -0.02391078695654869, -0.020584922283887863, -0.017259059473872185, -0.013933196663856506, -0.010607331991195679, -0.007281468249857426, -0.003955604508519173, -0.0006297407671809196, 0.0026961229741573334, 0.006021987646818161, 0.00934785045683384, 0.012673713266849518, 0.015999577939510345, 0.019325442612171173, 0.02265130542218685, 0.02597716823220253, 0.029303032904863358, 0.032628897577524185, 0.035954758524894714, 0.03928062319755554, 0.04260648787021637, 0.0459323525428772, 0.049258217215538025, 0.052584078162908554, 0.05590994283556938, 0.05923580750823021, 0.06256166845560074, 0.06588753312826157, 0.0692133978009224, 0.07253926247358322, 0.07586512714624405, 0.07919099181890488, 0.08251684904098511, 0.08584271371364594, 0.08916857838630676, 0.09249444305896759, 0.09582030773162842]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 7.0, 11.0, 11.0, 13.0, 16.0, 30.0, 38.0, 45.0, 74.0, 108.0, 160.0, 216.0, 354.0, 678.0, 1233.0, 2574.0, 6017.0, 17338.0, 68595.0, 425799.0, 427004.0, 69015.0, 17572.0, 6042.0, 2589.0, 1236.0, 662.0, 362.0, 235.0, 156.0, 91.0, 72.0, 47.0, 32.0, 23.0, 32.0, 22.0, 13.0, 8.0, 6.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0259246826171875, -0.025162220001220703, -0.024399757385253906, -0.02363729476928711, -0.022874832153320312, -0.022112369537353516, -0.02134990692138672, -0.020587444305419922, -0.019824981689453125, -0.019062519073486328, -0.01830005645751953, -0.017537593841552734, -0.016775131225585938, -0.01601266860961914, -0.015250205993652344, -0.014487743377685547, -0.01372528076171875, -0.012962818145751953, -0.012200355529785156, -0.01143789291381836, -0.010675430297851562, -0.009912967681884766, -0.009150505065917969, -0.008388042449951172, -0.007625579833984375, -0.006863117218017578, -0.006100654602050781, -0.005338191986083984, -0.0045757293701171875, -0.0038132667541503906, -0.0030508041381835938, -0.002288341522216797, -0.00152587890625, -0.0007634162902832031, -9.5367431640625e-07, 0.0007615089416503906, 0.0015239715576171875, 0.0022864341735839844, 0.0030488967895507812, 0.003811359405517578, 0.004573822021484375, 0.005336284637451172, 0.006098747253417969, 0.006861209869384766, 0.0076236724853515625, 0.00838613510131836, 0.009148597717285156, 0.009911060333251953, 0.01067352294921875, 0.011435985565185547, 0.012198448181152344, 0.01296091079711914, 0.013723373413085938, 0.014485836029052734, 0.015248298645019531, 0.016010761260986328, 0.016773223876953125, 0.017535686492919922, 0.01829814910888672, 0.019060611724853516, 0.019823074340820312, 0.02058553695678711, 0.021347999572753906, 0.022110462188720703, 0.0228729248046875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 2.0, 4.0, 7.0, 4.0, 6.0, 18.0, 26.0, 34.0, 57.0, 112.0, 112.0, 163.0, 153.0, 100.0, 84.0, 40.0, 22.0, 13.0, 20.0, 5.0, 7.0, 2.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0179595947265625, -0.01737236976623535, -0.016785144805908203, -0.016197919845581055, -0.015610694885253906, -0.015023469924926758, -0.01443624496459961, -0.013849020004272461, -0.013261795043945312, -0.012674570083618164, -0.012087345123291016, -0.011500120162963867, -0.010912895202636719, -0.01032567024230957, -0.009738445281982422, -0.009151220321655273, -0.008563995361328125, -0.007976770401000977, -0.007389545440673828, -0.00680232048034668, -0.006215095520019531, -0.005627870559692383, -0.005040645599365234, -0.004453420639038086, -0.0038661956787109375, -0.003278970718383789, -0.0026917457580566406, -0.002104520797729492, -0.0015172958374023438, -0.0009300708770751953, -0.0003428459167480469, 0.00024437904357910156, 0.00083160400390625, 0.0014188289642333984, 0.002006053924560547, 0.0025932788848876953, 0.0031805038452148438, 0.003767728805541992, 0.004354953765869141, 0.004942178726196289, 0.0055294036865234375, 0.006116628646850586, 0.006703853607177734, 0.007291078567504883, 0.007878303527832031, 0.00846552848815918, 0.009052753448486328, 0.009639978408813477, 0.010227203369140625, 0.010814428329467773, 0.011401653289794922, 0.01198887825012207, 0.012576103210449219, 0.013163328170776367, 0.013750553131103516, 0.014337778091430664, 0.014925003051757812, 0.015512228012084961, 0.01609945297241211, 0.016686677932739258, 0.017273902893066406, 0.017861127853393555, 0.018448352813720703, 0.01903557777404785, 0.019622802734375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 6.0, 2.0, 5.0, 17.0, 14.0, 20.0, 15.0, 22.0, 42.0, 58.0, 72.0, 125.0, 165.0, 258.0, 404.0, 707.0, 1359.0, 2813.0, 7144.0, 23138.0, 105072.0, 645026.0, 204729.0, 38597.0, 10685.0, 3975.0, 1765.0, 871.0, 492.0, 315.0, 192.0, 127.0, 81.0, 75.0, 42.0, 34.0, 25.0, 18.0, 14.0, 6.0, 9.0, 8.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0289764404296875, -0.028061866760253906, -0.027147293090820312, -0.02623271942138672, -0.025318145751953125, -0.02440357208251953, -0.023488998413085938, -0.022574424743652344, -0.02165985107421875, -0.020745277404785156, -0.019830703735351562, -0.01891613006591797, -0.018001556396484375, -0.01708698272705078, -0.016172409057617188, -0.015257835388183594, -0.01434326171875, -0.013428688049316406, -0.012514114379882812, -0.011599540710449219, -0.010684967041015625, -0.009770393371582031, -0.008855819702148438, -0.007941246032714844, -0.00702667236328125, -0.006112098693847656, -0.0051975250244140625, -0.004282951354980469, -0.003368377685546875, -0.0024538040161132812, -0.0015392303466796875, -0.0006246566772460938, 0.0002899169921875, 0.0012044906616210938, 0.0021190643310546875, 0.0030336380004882812, 0.003948211669921875, 0.004862785339355469, 0.0057773590087890625, 0.006691932678222656, 0.00760650634765625, 0.008521080017089844, 0.009435653686523438, 0.010350227355957031, 0.011264801025390625, 0.012179374694824219, 0.013093948364257812, 0.014008522033691406, 0.014923095703125, 0.015837669372558594, 0.016752243041992188, 0.01766681671142578, 0.018581390380859375, 0.01949596405029297, 0.020410537719726562, 0.021325111389160156, 0.02223968505859375, 0.023154258728027344, 0.024068832397460938, 0.02498340606689453, 0.025897979736328125, 0.02681255340576172, 0.027727127075195312, 0.028641700744628906, 0.0295562744140625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 12.0, 11.0, 11.0, 12.0, 15.0, 15.0, 18.0, 30.0, 36.0, 59.0, 59.0, 43.0, 44.0, 60.0, 67.0, 54.0, 54.0, 68.0, 56.0, 38.0, 47.0, 29.0, 39.0, 30.0, 19.0, 20.0, 12.0, 8.0, 12.0, 3.0, 6.0, 5.0, 3.0, 1.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.047210693359375, -0.045955657958984375, -0.04470062255859375, -0.043445587158203125, -0.0421905517578125, -0.040935516357421875, -0.03968048095703125, -0.038425445556640625, -0.03717041015625, -0.035915374755859375, -0.03466033935546875, -0.033405303955078125, -0.0321502685546875, -0.030895233154296875, -0.02964019775390625, -0.028385162353515625, -0.027130126953125, -0.025875091552734375, -0.02462005615234375, -0.023365020751953125, -0.0221099853515625, -0.020854949951171875, -0.01959991455078125, -0.018344879150390625, -0.01708984375, -0.015834808349609375, -0.01457977294921875, -0.013324737548828125, -0.0120697021484375, -0.010814666748046875, -0.00955963134765625, -0.008304595947265625, -0.007049560546875, -0.005794525146484375, -0.00453948974609375, -0.003284454345703125, -0.0020294189453125, -0.000774383544921875, 0.00048065185546875, 0.001735687255859375, 0.00299072265625, 0.004245758056640625, 0.00550079345703125, 0.006755828857421875, 0.0080108642578125, 0.009265899658203125, 0.01052093505859375, 0.011775970458984375, 0.013031005859375, 0.014286041259765625, 0.01554107666015625, 0.016796112060546875, 0.0180511474609375, 0.019306182861328125, 0.02056121826171875, 0.021816253662109375, 0.0230712890625, 0.024326324462890625, 0.02558135986328125, 0.026836395263671875, 0.0280914306640625, 0.029346466064453125, 0.03060150146484375, 0.031856536865234375, 0.033111572265625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 8.0, 5.0, 11.0, 11.0, 17.0, 24.0, 24.0, 33.0, 35.0, 55.0, 94.0, 136.0, 221.0, 419.0, 849.0, 2004.0, 6021.0, 27192.0, 357440.0, 611269.0, 31925.0, 6597.0, 2135.0, 909.0, 422.0, 243.0, 116.0, 102.0, 62.0, 35.0, 36.0, 24.0, 25.0, 15.0, 10.0, 3.0, 3.0, 3.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.01200103759765625, -0.011601567268371582, -0.011202096939086914, -0.010802626609802246, -0.010403156280517578, -0.01000368595123291, -0.009604215621948242, -0.009204745292663574, -0.008805274963378906, -0.008405804634094238, -0.00800633430480957, -0.007606863975524902, -0.007207393646240234, -0.006807923316955566, -0.0064084529876708984, -0.0060089826583862305, -0.0056095123291015625, -0.0052100419998168945, -0.0048105716705322266, -0.004411101341247559, -0.004011631011962891, -0.0036121606826782227, -0.0032126903533935547, -0.0028132200241088867, -0.0024137496948242188, -0.0020142793655395508, -0.0016148090362548828, -0.0012153387069702148, -0.0008158683776855469, -0.0004163980484008789, -1.6927719116210938e-05, 0.00038254261016845703, 0.000782012939453125, 0.001181483268737793, 0.001580953598022461, 0.001980423927307129, 0.002379894256591797, 0.002779364585876465, 0.003178834915161133, 0.0035783052444458008, 0.003977775573730469, 0.004377245903015137, 0.004776716232299805, 0.005176186561584473, 0.005575656890869141, 0.005975127220153809, 0.0063745975494384766, 0.0067740678787231445, 0.0071735382080078125, 0.0075730085372924805, 0.007972478866577148, 0.008371949195861816, 0.008771419525146484, 0.009170889854431152, 0.00957036018371582, 0.009969830513000488, 0.010369300842285156, 0.010768771171569824, 0.011168241500854492, 0.01156771183013916, 0.011967182159423828, 0.012366652488708496, 0.012766122817993164, 0.013165593147277832, 0.0135650634765625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 4.0, 4.0, 11.0, 9.0, 8.0, 20.0, 14.0, 18.0, 34.0, 40.0, 42.0, 51.0, 61.0, 71.0, 100.0, 56.0, 81.0, 74.0, 46.0, 60.0, 33.0, 41.0, 34.0, 24.0, 10.0, 2.0, 15.0, 10.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.556510925292969e-06, -6.3320621848106384e-06, -6.107613444328308e-06, -5.883164703845978e-06, -5.6587159633636475e-06, -5.434267222881317e-06, -5.209818482398987e-06, -4.9853697419166565e-06, -4.760921001434326e-06, -4.536472260951996e-06, -4.3120235204696655e-06, -4.087574779987335e-06, -3.863126039505005e-06, -3.6386772990226746e-06, -3.4142285585403442e-06, -3.189779818058014e-06, -2.9653310775756836e-06, -2.7408823370933533e-06, -2.516433596611023e-06, -2.2919848561286926e-06, -2.0675361156463623e-06, -1.843087375164032e-06, -1.6186386346817017e-06, -1.3941898941993713e-06, -1.169741153717041e-06, -9.452924132347107e-07, -7.208436727523804e-07, -4.9639493227005e-07, -2.7194619178771973e-07, -4.7497451305389404e-08, 1.7695128917694092e-07, 4.0140002965927124e-07, 6.258487701416016e-07, 8.502975106239319e-07, 1.0747462511062622e-06, 1.2991949915885925e-06, 1.5236437320709229e-06, 1.7480924725532532e-06, 1.9725412130355835e-06, 2.196989953517914e-06, 2.421438694000244e-06, 2.6458874344825745e-06, 2.8703361749649048e-06, 3.094784915447235e-06, 3.3192336559295654e-06, 3.5436823964118958e-06, 3.768131136894226e-06, 3.992579877376556e-06, 4.217028617858887e-06, 4.441477358341217e-06, 4.665926098823547e-06, 4.890374839305878e-06, 5.114823579788208e-06, 5.339272320270538e-06, 5.563721060752869e-06, 5.788169801235199e-06, 6.012618541717529e-06, 6.23706728219986e-06, 6.46151602268219e-06, 6.68596476316452e-06, 6.910413503646851e-06, 7.134862244129181e-06, 7.359310984611511e-06, 7.5837597250938416e-06, 7.808208465576172e-06]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 2.0, 11.0, 11.0, 7.0, 15.0, 19.0, 12.0, 24.0, 42.0, 62.0, 83.0, 141.0, 243.0, 333.0, 657.0, 1248.0, 2705.0, 6763.0, 26000.0, 354292.0, 612108.0, 30520.0, 7498.0, 2716.0, 1309.0, 682.0, 364.0, 221.0, 137.0, 86.0, 65.0, 60.0, 30.0, 19.0, 21.0, 11.0, 9.0, 8.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.012542724609375, -0.012095451354980469, -0.011648178100585938, -0.011200904846191406, -0.010753631591796875, -0.010306358337402344, -0.009859085083007812, -0.009411811828613281, -0.00896453857421875, -0.008517265319824219, -0.008069992065429688, -0.007622718811035156, -0.007175445556640625, -0.006728172302246094, -0.0062808990478515625, -0.005833625793457031, -0.0053863525390625, -0.004939079284667969, -0.0044918060302734375, -0.004044532775878906, -0.003597259521484375, -0.0031499862670898438, -0.0027027130126953125, -0.0022554397583007812, -0.00180816650390625, -0.0013608932495117188, -0.0009136199951171875, -0.00046634674072265625, -1.9073486328125e-05, 0.00042819976806640625, 0.0008754730224609375, 0.0013227462768554688, 0.00177001953125, 0.0022172927856445312, 0.0026645660400390625, 0.0031118392944335938, 0.003559112548828125, 0.004006385803222656, 0.0044536590576171875, 0.004900932312011719, 0.00534820556640625, 0.005795478820800781, 0.0062427520751953125, 0.006690025329589844, 0.007137298583984375, 0.007584571838378906, 0.008031845092773438, 0.008479118347167969, 0.0089263916015625, 0.009373664855957031, 0.009820938110351562, 0.010268211364746094, 0.010715484619140625, 0.011162757873535156, 0.011610031127929688, 0.012057304382324219, 0.01250457763671875, 0.012951850891113281, 0.013399124145507812, 0.013846397399902344, 0.014293670654296875, 0.014740943908691406, 0.015188217163085938, 0.01563549041748047, 0.016082763671875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 8.0, 5.0, 9.0, 13.0, 13.0, 19.0, 32.0, 27.0, 52.0, 78.0, 103.0, 116.0, 118.0, 107.0, 83.0, 55.0, 36.0, 25.0, 24.0, 24.0, 7.0, 8.0, 4.0, 7.0, 3.0, 5.0, 3.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01313018798828125, -0.012662768363952637, -0.012195348739624023, -0.01172792911529541, -0.011260509490966797, -0.010793089866638184, -0.01032567024230957, -0.009858250617980957, -0.009390830993652344, -0.00892341136932373, -0.008455991744995117, -0.007988572120666504, -0.007521152496337891, -0.007053732872009277, -0.006586313247680664, -0.006118893623352051, -0.0056514739990234375, -0.005184054374694824, -0.004716634750366211, -0.004249215126037598, -0.0037817955017089844, -0.003314375877380371, -0.002846956253051758, -0.0023795366287231445, -0.0019121170043945312, -0.001444697380065918, -0.0009772777557373047, -0.0005098581314086914, -4.2438507080078125e-05, 0.00042498111724853516, 0.0008924007415771484, 0.0013598203659057617, 0.001827239990234375, 0.0022946596145629883, 0.0027620792388916016, 0.003229498863220215, 0.003696918487548828, 0.004164338111877441, 0.004631757736206055, 0.005099177360534668, 0.005566596984863281, 0.0060340166091918945, 0.006501436233520508, 0.006968855857849121, 0.007436275482177734, 0.007903695106506348, 0.008371114730834961, 0.008838534355163574, 0.009305953979492188, 0.0097733736038208, 0.010240793228149414, 0.010708212852478027, 0.01117563247680664, 0.011643052101135254, 0.012110471725463867, 0.01257789134979248, 0.013045310974121094, 0.013512730598449707, 0.01398015022277832, 0.014447569847106934, 0.014914989471435547, 0.01538240909576416, 0.015849828720092773, 0.016317248344421387, 0.01678466796875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 7.0, 0.0, 5.0, 14.0, 25.0, 51.0, 86.0, 205.0, 317.0, 184.0, 62.0, 17.0, 11.0, 1.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4073047637939453, -0.39484289288520813, -0.38238105177879333, -0.36991918087005615, -0.35745733976364136, -0.3449954688549042, -0.332533597946167, -0.3200717568397522, -0.3076099157333374, -0.2951480448246002, -0.2826862037181854, -0.27022433280944824, -0.25776249170303345, -0.24530062079429626, -0.23283876478672028, -0.2203769087791443, -0.2079150378704071, -0.19545318186283112, -0.18299132585525513, -0.17052945494651794, -0.15806761384010315, -0.14560574293136597, -0.13314388692378998, -0.12068203091621399, -0.108220174908638, -0.09575831890106201, -0.08329646289348602, -0.07083459943532944, -0.05837274342775345, -0.04591088742017746, -0.033449023962020874, -0.020987167954444885, -0.008525311946868896, 0.0039365459233522415, 0.01639840379357338, 0.028860263526439667, 0.041322119534015656, 0.053783975541591644, 0.06624583899974823, 0.07870769500732422, 0.09116955101490021, 0.1036314070224762, 0.11609326303005219, 0.12855511903762817, 0.14101698994636536, 0.15347883105278015, 0.16594070196151733, 0.17840255796909332, 0.1908644139766693, 0.2033262699842453, 0.2157881259918213, 0.22824999690055847, 0.24071183800697327, 0.25317370891571045, 0.26563555002212524, 0.2780974209308624, 0.2905592918395996, 0.3030211627483368, 0.3154830038547516, 0.32794487476348877, 0.34040671586990356, 0.35286858677864075, 0.36533045768737793, 0.3777922987937927, 0.3902541399002075]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 2.0, 2.0, 5.0, 9.0, 8.0, 10.0, 8.0, 17.0, 18.0, 9.0, 15.0, 25.0, 37.0, 27.0, 25.0, 26.0, 40.0, 52.0, 72.0, 72.0, 95.0, 49.0, 51.0, 49.0, 34.0, 40.0, 27.0, 18.0, 29.0, 14.0, 22.0, 21.0, 11.0, 14.0, 8.0, 20.0, 5.0, 4.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.16855734586715698, -0.1632978916168213, -0.1580384373664856, -0.1527789831161499, -0.1475195437669754, -0.1422600895166397, -0.13700063526630402, -0.13174118101596832, -0.12648174166679382, -0.12122228741645813, -0.11596284061670303, -0.11070338636636734, -0.10544393956661224, -0.10018448531627655, -0.09492503106594086, -0.08966557681560516, -0.08440612256526947, -0.07914666831493378, -0.07388722151517868, -0.06862776726484299, -0.06336832046508789, -0.0581088662147522, -0.052849411964416504, -0.04758996143937111, -0.042330510914325714, -0.03707106038928032, -0.031811609864234924, -0.02655215561389923, -0.021292705088853836, -0.01603325456380844, -0.010773800313472748, -0.005514349788427353, -0.000254899263381958, 0.0050045521929860115, 0.010264003649353981, 0.015523456037044525, 0.02078290656208992, 0.026042357087135315, 0.03130181133747101, 0.0365612618625164, 0.0418207123875618, 0.04708016291260719, 0.05233961343765259, 0.05759906768798828, 0.06285852193832397, 0.06811796873807907, 0.07337742298841476, 0.07863686978816986, 0.08389632403850555, 0.08915577828884125, 0.09441522508859634, 0.09967467933893204, 0.10493412613868713, 0.11019358038902283, 0.11545303463935852, 0.12071248888969421, 0.1259719431400299, 0.1312313973903656, 0.1364908516407013, 0.141750305891037, 0.1470097452402115, 0.15226919949054718, 0.15752865374088287, 0.16278810799121857, 0.16804754734039307]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 11.0, 15.0, 13.0, 24.0, 43.0, 90.0, 209.0, 658.0, 6316.0, 4079828.0, 104362.0, 2052.0, 371.0, 144.0, 51.0, 41.0, 18.0, 18.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06793212890625, -0.06618022918701172, -0.06442832946777344, -0.06267642974853516, -0.060924530029296875, -0.059172630310058594, -0.05742073059082031, -0.05566883087158203, -0.05391693115234375, -0.05216503143310547, -0.05041313171386719, -0.048661231994628906, -0.046909332275390625, -0.045157432556152344, -0.04340553283691406, -0.04165363311767578, -0.0399017333984375, -0.03814983367919922, -0.03639793395996094, -0.034646034240722656, -0.032894134521484375, -0.031142234802246094, -0.029390335083007812, -0.02763843536376953, -0.02588653564453125, -0.02413463592529297, -0.022382736206054688, -0.020630836486816406, -0.018878936767578125, -0.017127037048339844, -0.015375137329101562, -0.013623237609863281, -0.011871337890625, -0.010119438171386719, -0.008367538452148438, -0.006615638732910156, -0.004863739013671875, -0.0031118392944335938, -0.0013599395751953125, 0.00039196014404296875, 0.00214385986328125, 0.0038957595825195312, 0.0056476593017578125, 0.007399559020996094, 0.009151458740234375, 0.010903358459472656, 0.012655258178710938, 0.014407157897949219, 0.0161590576171875, 0.01791095733642578, 0.019662857055664062, 0.021414756774902344, 0.023166656494140625, 0.024918556213378906, 0.026670455932617188, 0.02842235565185547, 0.03017425537109375, 0.03192615509033203, 0.03367805480957031, 0.035429954528808594, 0.037181854248046875, 0.038933753967285156, 0.04068565368652344, 0.04243755340576172, 0.044189453125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 4.0, 7.0, 8.0, 16.0, 32.0, 37.0, 60.0, 88.0, 92.0, 157.0, 157.0, 116.0, 69.0, 43.0, 41.0, 26.0, 16.0, 10.0, 11.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0182647705078125, -0.017673254013061523, -0.017081737518310547, -0.01649022102355957, -0.015898704528808594, -0.015307188034057617, -0.01471567153930664, -0.014124155044555664, -0.013532638549804688, -0.012941122055053711, -0.012349605560302734, -0.011758089065551758, -0.011166572570800781, -0.010575056076049805, -0.009983539581298828, -0.009392023086547852, -0.008800506591796875, -0.008208990097045898, -0.007617473602294922, -0.007025957107543945, -0.006434440612792969, -0.005842924118041992, -0.005251407623291016, -0.004659891128540039, -0.0040683746337890625, -0.003476858139038086, -0.0028853416442871094, -0.002293825149536133, -0.0017023086547851562, -0.0011107921600341797, -0.0005192756652832031, 7.224082946777344e-05, 0.00066375732421875, 0.0012552738189697266, 0.0018467903137207031, 0.0024383068084716797, 0.0030298233032226562, 0.003621339797973633, 0.004212856292724609, 0.004804372787475586, 0.0053958892822265625, 0.005987405776977539, 0.006578922271728516, 0.007170438766479492, 0.007761955261230469, 0.008353471755981445, 0.008944988250732422, 0.009536504745483398, 0.010128021240234375, 0.010719537734985352, 0.011311054229736328, 0.011902570724487305, 0.012494087219238281, 0.013085603713989258, 0.013677120208740234, 0.014268636703491211, 0.014860153198242188, 0.015451669692993164, 0.01604318618774414, 0.016634702682495117, 0.017226219177246094, 0.01781773567199707, 0.018409252166748047, 0.019000768661499023, 0.01959228515625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 8.0, 4.0, 7.0, 11.0, 26.0, 42.0, 49.0, 94.0, 173.0, 321.0, 619.0, 1822.0, 10694.0, 1665126.0, 2499586.0, 12409.0, 2045.0, 633.0, 292.0, 145.0, 87.0, 39.0, 24.0, 9.0, 7.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0386962890625, -0.03736257553100586, -0.03602886199951172, -0.03469514846801758, -0.03336143493652344, -0.0320277214050293, -0.030694007873535156, -0.029360294342041016, -0.028026580810546875, -0.026692867279052734, -0.025359153747558594, -0.024025440216064453, -0.022691726684570312, -0.021358013153076172, -0.02002429962158203, -0.01869058609008789, -0.01735687255859375, -0.01602315902709961, -0.014689445495605469, -0.013355731964111328, -0.012022018432617188, -0.010688304901123047, -0.009354591369628906, -0.008020877838134766, -0.006687164306640625, -0.005353450775146484, -0.004019737243652344, -0.002686023712158203, -0.0013523101806640625, -1.8596649169921875e-05, 0.0013151168823242188, 0.0026488304138183594, 0.0039825439453125, 0.005316257476806641, 0.006649971008300781, 0.007983684539794922, 0.009317398071289062, 0.010651111602783203, 0.011984825134277344, 0.013318538665771484, 0.014652252197265625, 0.015985965728759766, 0.017319679260253906, 0.018653392791748047, 0.019987106323242188, 0.021320819854736328, 0.02265453338623047, 0.02398824691772461, 0.02532196044921875, 0.02665567398071289, 0.02798938751220703, 0.029323101043701172, 0.030656814575195312, 0.03199052810668945, 0.033324241638183594, 0.034657955169677734, 0.035991668701171875, 0.037325382232666016, 0.038659095764160156, 0.0399928092956543, 0.04132652282714844, 0.04266023635864258, 0.04399394989013672, 0.04532766342163086, 0.046661376953125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 9.0, 15.0, 13.0, 25.0, 42.0, 66.0, 189.0, 832.0, 1775.0, 732.0, 176.0, 65.0, 41.0, 25.0, 13.0, 14.0, 11.0, 7.0, 6.0, 8.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.034515380859375, -0.033682823181152344, -0.03285026550292969, -0.03201770782470703, -0.031185150146484375, -0.03035259246826172, -0.029520034790039062, -0.028687477111816406, -0.02785491943359375, -0.027022361755371094, -0.026189804077148438, -0.02535724639892578, -0.024524688720703125, -0.02369213104248047, -0.022859573364257812, -0.022027015686035156, -0.0211944580078125, -0.020361900329589844, -0.019529342651367188, -0.01869678497314453, -0.017864227294921875, -0.01703166961669922, -0.016199111938476562, -0.015366554260253906, -0.01453399658203125, -0.013701438903808594, -0.012868881225585938, -0.012036323547363281, -0.011203765869140625, -0.010371208190917969, -0.009538650512695312, -0.008706092834472656, -0.00787353515625, -0.007040977478027344, -0.0062084197998046875, -0.005375862121582031, -0.004543304443359375, -0.0037107467651367188, -0.0028781890869140625, -0.0020456314086914062, -0.00121307373046875, -0.00038051605224609375, 0.0004520416259765625, 0.0012845993041992188, 0.002117156982421875, 0.0029497146606445312, 0.0037822723388671875, 0.004614830017089844, 0.0054473876953125, 0.006279945373535156, 0.0071125030517578125, 0.007945060729980469, 0.008777618408203125, 0.009610176086425781, 0.010442733764648438, 0.011275291442871094, 0.01210784912109375, 0.012940406799316406, 0.013772964477539062, 0.014605522155761719, 0.015438079833984375, 0.01627063751220703, 0.017103195190429688, 0.017935752868652344, 0.018768310546875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 4.0, 20.0, 63.0, 170.0, 396.0, 232.0, 73.0, 17.0, 9.0, 8.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.37230390310287476, -0.36357614398002625, -0.35484838485717773, -0.3461206257343292, -0.3373928666114807, -0.3286651074886322, -0.3199373483657837, -0.3112095892429352, -0.30248183012008667, -0.29375407099723816, -0.28502631187438965, -0.27629855275154114, -0.2675707936286926, -0.2588430345058441, -0.2501152753829956, -0.2413875162601471, -0.2326597422361374, -0.22393198311328888, -0.21520422399044037, -0.20647646486759186, -0.19774870574474335, -0.18902094662189484, -0.18029317259788513, -0.17156541347503662, -0.1628376543521881, -0.1541098952293396, -0.1453821361064911, -0.13665437698364258, -0.12792661786079407, -0.11919885873794556, -0.11047109216451645, -0.10174333304166794, -0.09301559627056122, -0.08428783714771271, -0.0755600780248642, -0.06683231890201569, -0.05810455605387688, -0.049376796931028366, -0.04064903408288956, -0.031921274960041046, -0.023193515837192535, -0.01446575578302145, -0.005737995728850365, 0.0029897652566432953, 0.011717524379491806, 0.020445283502340317, 0.029173046350479126, 0.03790080547332764, 0.04662856459617615, 0.05535632371902466, 0.06408408284187317, 0.07281184196472168, 0.08153960108757019, 0.0902673602104187, 0.09899512678384781, 0.10772288590669632, 0.11645064502954483, 0.12517841160297394, 0.13390617072582245, 0.14263392984867096, 0.15136168897151947, 0.16008944809436798, 0.1688172072172165, 0.177544966340065, 0.1862727254629135]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 3.0, 7.0, 10.0, 8.0, 12.0, 20.0, 38.0, 33.0, 47.0, 67.0, 79.0, 75.0, 81.0, 82.0, 83.0, 77.0, 79.0, 47.0, 37.0, 42.0, 25.0, 20.0, 14.0, 11.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13930761814117432, -0.1355796456336975, -0.1318516731262207, -0.1281237006187439, -0.12439573556184769, -0.12066776305437088, -0.11693979799747467, -0.11321182548999786, -0.10948385298252106, -0.10575588047504425, -0.10202790796756744, -0.09829994291067123, -0.09457197040319443, -0.09084399789571762, -0.08711603283882141, -0.0833880603313446, -0.0796600878238678, -0.07593211531639099, -0.07220414280891418, -0.06847617775201797, -0.06474820524454117, -0.06102023273706436, -0.05729226395487785, -0.053564295172691345, -0.04983632266521454, -0.04610835015773773, -0.042380381375551224, -0.038652412593364716, -0.03492444008588791, -0.03119646944105625, -0.027468498796224594, -0.023740528151392937, -0.02001255750656128, -0.016284586861729622, -0.012556616216897964, -0.008828645572066307, -0.00510067492723465, -0.0013727042824029922, 0.002355266362428665, 0.006083237007260323, 0.00981120765209198, 0.013539178296923637, 0.017267148941755295, 0.020995119586586952, 0.02472309023141861, 0.028451060876250267, 0.032179031521081924, 0.03590700030326843, 0.03963497281074524, 0.043362945318222046, 0.047090914100408554, 0.05081888288259506, 0.05454685539007187, 0.058274827897548676, 0.062002796679735184, 0.06573076546192169, 0.0694587379693985, 0.0731867104768753, 0.07691468298435211, 0.08064264804124832, 0.08437062054872513, 0.08809859305620193, 0.09182655811309814, 0.09555453062057495, 0.09928250312805176]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 6.0, 4.0, 7.0, 16.0, 16.0, 25.0, 26.0, 47.0, 79.0, 117.0, 213.0, 380.0, 664.0, 1336.0, 3087.0, 9310.0, 41401.0, 302556.0, 584488.0, 81272.0, 15374.0, 4349.0, 1772.0, 837.0, 468.0, 257.0, 174.0, 94.0, 61.0, 43.0, 27.0, 18.0, 6.0, 9.0, 8.0, 6.0, 1.0, 7.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0255279541015625, -0.02455306053161621, -0.023578166961669922, -0.022603273391723633, -0.021628379821777344, -0.020653486251831055, -0.019678592681884766, -0.018703699111938477, -0.017728805541992188, -0.0167539119720459, -0.01577901840209961, -0.01480412483215332, -0.013829231262207031, -0.012854337692260742, -0.011879444122314453, -0.010904550552368164, -0.009929656982421875, -0.008954763412475586, -0.007979869842529297, -0.007004976272583008, -0.006030082702636719, -0.00505518913269043, -0.004080295562744141, -0.0031054019927978516, -0.0021305084228515625, -0.0011556148529052734, -0.00018072128295898438, 0.0007941722869873047, 0.0017690658569335938, 0.002743959426879883, 0.003718852996826172, 0.004693746566772461, 0.00566864013671875, 0.006643533706665039, 0.007618427276611328, 0.008593320846557617, 0.009568214416503906, 0.010543107986450195, 0.011518001556396484, 0.012492895126342773, 0.013467788696289062, 0.014442682266235352, 0.01541757583618164, 0.01639246940612793, 0.01736736297607422, 0.018342256546020508, 0.019317150115966797, 0.020292043685913086, 0.021266937255859375, 0.022241830825805664, 0.023216724395751953, 0.024191617965698242, 0.02516651153564453, 0.02614140510559082, 0.02711629867553711, 0.0280911922454834, 0.029066085815429688, 0.030040979385375977, 0.031015872955322266, 0.031990766525268555, 0.032965660095214844, 0.03394055366516113, 0.03491544723510742, 0.03589034080505371, 0.036865234375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 7.0, 4.0, 7.0, 7.0, 16.0, 27.0, 32.0, 66.0, 80.0, 129.0, 139.0, 146.0, 114.0, 74.0, 50.0, 37.0, 28.0, 15.0, 6.0, 11.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0182952880859375, -0.017702341079711914, -0.017109394073486328, -0.016516447067260742, -0.015923500061035156, -0.01533055305480957, -0.014737606048583984, -0.014144659042358398, -0.013551712036132812, -0.012958765029907227, -0.01236581802368164, -0.011772871017456055, -0.011179924011230469, -0.010586977005004883, -0.009994029998779297, -0.009401082992553711, -0.008808135986328125, -0.008215188980102539, -0.007622241973876953, -0.007029294967651367, -0.006436347961425781, -0.005843400955200195, -0.005250453948974609, -0.0046575069427490234, -0.0040645599365234375, -0.0034716129302978516, -0.0028786659240722656, -0.0022857189178466797, -0.0016927719116210938, -0.0010998249053955078, -0.0005068778991699219, 8.606910705566406e-05, 0.00067901611328125, 0.001271963119506836, 0.0018649101257324219, 0.002457857131958008, 0.0030508041381835938, 0.0036437511444091797, 0.004236698150634766, 0.0048296451568603516, 0.0054225921630859375, 0.0060155391693115234, 0.006608486175537109, 0.007201433181762695, 0.007794380187988281, 0.008387327194213867, 0.008980274200439453, 0.009573221206665039, 0.010166168212890625, 0.010759115219116211, 0.011352062225341797, 0.011945009231567383, 0.012537956237792969, 0.013130903244018555, 0.01372385025024414, 0.014316797256469727, 0.014909744262695312, 0.015502691268920898, 0.016095638275146484, 0.01668858528137207, 0.017281532287597656, 0.017874479293823242, 0.018467426300048828, 0.019060373306274414, 0.0196533203125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 6.0, 6.0, 13.0, 16.0, 34.0, 30.0, 65.0, 112.0, 123.0, 202.0, 378.0, 669.0, 1255.0, 2807.0, 6433.0, 17953.0, 60927.0, 249572.0, 551606.0, 109338.0, 29403.0, 9837.0, 3943.0, 1714.0, 878.0, 483.0, 264.0, 158.0, 89.0, 71.0, 43.0, 35.0, 27.0, 15.0, 10.0, 7.0, 9.0, 3.0, 4.0, 5.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0224151611328125, -0.021673202514648438, -0.020931243896484375, -0.020189285278320312, -0.01944732666015625, -0.018705368041992188, -0.017963409423828125, -0.017221450805664062, -0.0164794921875, -0.015737533569335938, -0.014995574951171875, -0.014253616333007812, -0.01351165771484375, -0.012769699096679688, -0.012027740478515625, -0.011285781860351562, -0.0105438232421875, -0.009801864624023438, -0.009059906005859375, -0.008317947387695312, -0.00757598876953125, -0.0068340301513671875, -0.006092071533203125, -0.0053501129150390625, -0.004608154296875, -0.0038661956787109375, -0.003124237060546875, -0.0023822784423828125, -0.00164031982421875, -0.0008983612060546875, -0.000156402587890625, 0.0005855560302734375, 0.0013275146484375, 0.0020694732666015625, 0.002811431884765625, 0.0035533905029296875, 0.00429534912109375, 0.0050373077392578125, 0.005779266357421875, 0.0065212249755859375, 0.00726318359375, 0.008005142211914062, 0.008747100830078125, 0.009489059448242188, 0.01023101806640625, 0.010972976684570312, 0.011714935302734375, 0.012456893920898438, 0.0131988525390625, 0.013940811157226562, 0.014682769775390625, 0.015424728393554688, 0.01616668701171875, 0.016908645629882812, 0.017650604248046875, 0.018392562866210938, 0.019134521484375, 0.019876480102539062, 0.020618438720703125, 0.021360397338867188, 0.02210235595703125, 0.022844314575195312, 0.023586273193359375, 0.024328231811523438, 0.0250701904296875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 5.0, 3.0, 8.0, 6.0, 12.0, 12.0, 17.0, 17.0, 15.0, 16.0, 27.0, 24.0, 30.0, 40.0, 24.0, 37.0, 32.0, 39.0, 37.0, 37.0, 34.0, 53.0, 35.0, 43.0, 32.0, 33.0, 40.0, 39.0, 30.0, 37.0, 35.0, 21.0, 24.0, 8.0, 12.0, 14.0, 14.0, 9.0, 4.0, 5.0, 6.0, 6.0, 4.0, 4.0, 3.0, 3.0, 1.0, 5.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.02728271484375, -0.02645087242126465, -0.025619029998779297, -0.024787187576293945, -0.023955345153808594, -0.023123502731323242, -0.02229166030883789, -0.02145981788635254, -0.020627975463867188, -0.019796133041381836, -0.018964290618896484, -0.018132448196411133, -0.01730060577392578, -0.01646876335144043, -0.015636920928955078, -0.014805078506469727, -0.013973236083984375, -0.013141393661499023, -0.012309551239013672, -0.01147770881652832, -0.010645866394042969, -0.009814023971557617, -0.008982181549072266, -0.008150339126586914, -0.0073184967041015625, -0.006486654281616211, -0.005654811859130859, -0.004822969436645508, -0.003991127014160156, -0.0031592845916748047, -0.002327442169189453, -0.0014955997467041016, -0.00066375732421875, 0.00016808509826660156, 0.0009999275207519531, 0.0018317699432373047, 0.0026636123657226562, 0.003495454788208008, 0.004327297210693359, 0.005159139633178711, 0.0059909820556640625, 0.006822824478149414, 0.007654666900634766, 0.008486509323120117, 0.009318351745605469, 0.01015019416809082, 0.010982036590576172, 0.011813879013061523, 0.012645721435546875, 0.013477563858032227, 0.014309406280517578, 0.01514124870300293, 0.01597309112548828, 0.016804933547973633, 0.017636775970458984, 0.018468618392944336, 0.019300460815429688, 0.02013230323791504, 0.02096414566040039, 0.021795988082885742, 0.022627830505371094, 0.023459672927856445, 0.024291515350341797, 0.02512335777282715, 0.0259552001953125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 6.0, 5.0, 11.0, 14.0, 16.0, 26.0, 41.0, 63.0, 127.0, 215.0, 395.0, 831.0, 1870.0, 5055.0, 18826.0, 117266.0, 747040.0, 127586.0, 20120.0, 5339.0, 1950.0, 797.0, 403.0, 233.0, 117.0, 69.0, 51.0, 27.0, 15.0, 13.0, 5.0, 6.0, 6.0, 6.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005924224853515625, -0.005716502666473389, -0.005508780479431152, -0.005301058292388916, -0.00509333610534668, -0.004885613918304443, -0.004677891731262207, -0.004470169544219971, -0.004262447357177734, -0.004054725170135498, -0.0038470029830932617, -0.0036392807960510254, -0.003431558609008789, -0.0032238364219665527, -0.0030161142349243164, -0.00280839204788208, -0.0026006698608398438, -0.0023929476737976074, -0.002185225486755371, -0.0019775032997131348, -0.0017697811126708984, -0.0015620589256286621, -0.0013543367385864258, -0.0011466145515441895, -0.0009388923645019531, -0.0007311701774597168, -0.0005234479904174805, -0.00031572580337524414, -0.00010800361633300781, 9.971857070922852e-05, 0.00030744075775146484, 0.0005151629447937012, 0.0007228851318359375, 0.0009306073188781738, 0.0011383295059204102, 0.0013460516929626465, 0.0015537738800048828, 0.0017614960670471191, 0.0019692182540893555, 0.002176940441131592, 0.002384662628173828, 0.0025923848152160645, 0.0028001070022583008, 0.003007829189300537, 0.0032155513763427734, 0.0034232735633850098, 0.003630995750427246, 0.0038387179374694824, 0.004046440124511719, 0.004254162311553955, 0.004461884498596191, 0.004669606685638428, 0.004877328872680664, 0.0050850510597229, 0.005292773246765137, 0.005500495433807373, 0.005708217620849609, 0.005915939807891846, 0.006123661994934082, 0.006331384181976318, 0.006539106369018555, 0.006746828556060791, 0.006954550743103027, 0.007162272930145264, 0.0073699951171875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 7.0, 4.0, 12.0, 17.0, 17.0, 24.0, 38.0, 56.0, 57.0, 81.0, 69.0, 83.0, 64.0, 69.0, 81.0, 63.0, 51.0, 39.0, 37.0, 40.0, 23.0, 14.0, 12.0, 11.0, 9.0, 4.0, 3.0, 6.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.735324859619141e-06, -6.545335054397583e-06, -6.355345249176025e-06, -6.165355443954468e-06, -5.97536563873291e-06, -5.7853758335113525e-06, -5.595386028289795e-06, -5.405396223068237e-06, -5.21540641784668e-06, -5.025416612625122e-06, -4.8354268074035645e-06, -4.645437002182007e-06, -4.455447196960449e-06, -4.265457391738892e-06, -4.075467586517334e-06, -3.885477781295776e-06, -3.6954879760742188e-06, -3.505498170852661e-06, -3.3155083656311035e-06, -3.125518560409546e-06, -2.9355287551879883e-06, -2.7455389499664307e-06, -2.555549144744873e-06, -2.3655593395233154e-06, -2.175569534301758e-06, -1.9855797290802e-06, -1.7955899238586426e-06, -1.605600118637085e-06, -1.4156103134155273e-06, -1.2256205081939697e-06, -1.0356307029724121e-06, -8.456408977508545e-07, -6.556510925292969e-07, -4.6566128730773926e-07, -2.7567148208618164e-07, -8.568167686462402e-08, 1.043081283569336e-07, 2.942979335784912e-07, 4.842877388000488e-07, 6.742775440216064e-07, 8.642673492431641e-07, 1.0542571544647217e-06, 1.2442469596862793e-06, 1.434236764907837e-06, 1.6242265701293945e-06, 1.8142163753509521e-06, 2.0042061805725098e-06, 2.1941959857940674e-06, 2.384185791015625e-06, 2.5741755962371826e-06, 2.7641654014587402e-06, 2.954155206680298e-06, 3.1441450119018555e-06, 3.334134817123413e-06, 3.5241246223449707e-06, 3.7141144275665283e-06, 3.904104232788086e-06, 4.0940940380096436e-06, 4.284083843231201e-06, 4.474073648452759e-06, 4.664063453674316e-06, 4.854053258895874e-06, 5.044043064117432e-06, 5.234032869338989e-06, 5.424022674560547e-06]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 4.0, 12.0, 4.0, 14.0, 23.0, 24.0, 24.0, 41.0, 76.0, 116.0, 199.0, 304.0, 562.0, 992.0, 2085.0, 5140.0, 15600.0, 65178.0, 527149.0, 349122.0, 58339.0, 14387.0, 4814.0, 2032.0, 958.0, 514.0, 289.0, 173.0, 125.0, 85.0, 34.0, 43.0, 23.0, 12.0, 10.0, 6.0, 8.0, 11.0, 3.0, 5.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.00551605224609375, -0.005343496799468994, -0.005170941352844238, -0.004998385906219482, -0.0048258304595947266, -0.004653275012969971, -0.004480719566345215, -0.004308164119720459, -0.004135608673095703, -0.003963053226470947, -0.0037904977798461914, -0.0036179423332214355, -0.0034453868865966797, -0.003272831439971924, -0.003100275993347168, -0.002927720546722412, -0.0027551651000976562, -0.0025826096534729004, -0.0024100542068481445, -0.0022374987602233887, -0.002064943313598633, -0.001892387866973877, -0.001719832420349121, -0.0015472769737243652, -0.0013747215270996094, -0.0012021660804748535, -0.0010296106338500977, -0.0008570551872253418, -0.0006844997406005859, -0.0005119442939758301, -0.0003393888473510742, -0.00016683340072631836, 5.7220458984375e-06, 0.00017827749252319336, 0.0003508329391479492, 0.0005233883857727051, 0.0006959438323974609, 0.0008684992790222168, 0.0010410547256469727, 0.0012136101722717285, 0.0013861656188964844, 0.0015587210655212402, 0.001731276512145996, 0.001903831958770752, 0.002076387405395508, 0.0022489428520202637, 0.0024214982986450195, 0.0025940537452697754, 0.0027666091918945312, 0.002939164638519287, 0.003111720085144043, 0.003284275531768799, 0.0034568309783935547, 0.0036293864250183105, 0.0038019418716430664, 0.003974497318267822, 0.004147052764892578, 0.004319608211517334, 0.00449216365814209, 0.004664719104766846, 0.0048372745513916016, 0.005009829998016357, 0.005182385444641113, 0.005354940891265869, 0.005527496337890625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 7.0, 9.0, 5.0, 16.0, 20.0, 14.0, 30.0, 38.0, 50.0, 59.0, 84.0, 94.0, 93.0, 104.0, 87.0, 68.0, 44.0, 48.0, 37.0, 24.0, 17.0, 15.0, 8.0, 5.0, 6.0, 8.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0081787109375, -0.007892131805419922, -0.007605552673339844, -0.007318973541259766, -0.0070323944091796875, -0.006745815277099609, -0.006459236145019531, -0.006172657012939453, -0.005886077880859375, -0.005599498748779297, -0.005312919616699219, -0.005026340484619141, -0.0047397613525390625, -0.004453182220458984, -0.004166603088378906, -0.003880023956298828, -0.00359344482421875, -0.003306865692138672, -0.0030202865600585938, -0.0027337074279785156, -0.0024471282958984375, -0.0021605491638183594, -0.0018739700317382812, -0.0015873908996582031, -0.001300811767578125, -0.0010142326354980469, -0.0007276535034179688, -0.0004410743713378906, -0.0001544952392578125, 0.00013208389282226562, 0.00041866302490234375, 0.0007052421569824219, 0.0009918212890625, 0.0012784004211425781, 0.0015649795532226562, 0.0018515586853027344, 0.0021381378173828125, 0.0024247169494628906, 0.0027112960815429688, 0.002997875213623047, 0.003284454345703125, 0.003571033477783203, 0.0038576126098632812, 0.004144191741943359, 0.0044307708740234375, 0.004717350006103516, 0.005003929138183594, 0.005290508270263672, 0.00557708740234375, 0.005863666534423828, 0.006150245666503906, 0.006436824798583984, 0.0067234039306640625, 0.007009983062744141, 0.007296562194824219, 0.007583141326904297, 0.007869720458984375, 0.008156299591064453, 0.008442878723144531, 0.00872945785522461, 0.009016036987304688, 0.009302616119384766, 0.009589195251464844, 0.009875774383544922, 0.010162353515625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 5.0, 3.0, 1.0, 10.0, 13.0, 12.0, 23.0, 50.0, 85.0, 133.0, 221.0, 197.0, 112.0, 66.0, 27.0, 14.0, 12.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26822367310523987, -0.2616836726665497, -0.2551436722278595, -0.2486036717891693, -0.24206367135047913, -0.23552367091178894, -0.22898367047309875, -0.22244367003440857, -0.21590366959571838, -0.2093636691570282, -0.202823668718338, -0.19628366827964783, -0.18974366784095764, -0.18320366740226746, -0.17666366696357727, -0.17012366652488708, -0.1635836660861969, -0.1570436656475067, -0.15050366520881653, -0.14396366477012634, -0.13742366433143616, -0.13088366389274597, -0.12434366345405579, -0.1178036630153656, -0.11126366257667542, -0.10472366213798523, -0.09818366169929504, -0.09164366126060486, -0.08510366082191467, -0.07856366038322449, -0.0720236599445343, -0.06548365950584412, -0.05894364416599274, -0.05240364372730255, -0.045863643288612366, -0.03932364284992218, -0.032783642411231995, -0.02624364197254181, -0.019703641533851624, -0.013163641095161438, -0.0066236406564712524, -8.36402177810669e-05, 0.006456360220909119, 0.012996360659599304, 0.01953636109828949, 0.026076361536979675, 0.03261636197566986, 0.039156362414360046, 0.04569636285305023, 0.05223636329174042, 0.0587763637304306, 0.06531636416912079, 0.07185636460781097, 0.07839636504650116, 0.08493636548519135, 0.09147636592388153, 0.09801636636257172, 0.1045563668012619, 0.11109636723995209, 0.11763636767864227, 0.12417636811733246, 0.13071636855602264, 0.13725636899471283, 0.14379636943340302, 0.1503363698720932]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 5.0, 1.0, 4.0, 12.0, 9.0, 12.0, 8.0, 12.0, 19.0, 19.0, 11.0, 16.0, 17.0, 19.0, 28.0, 33.0, 19.0, 33.0, 39.0, 49.0, 66.0, 73.0, 73.0, 62.0, 49.0, 43.0, 29.0, 38.0, 28.0, 19.0, 22.0, 19.0, 26.0, 15.0, 14.0, 15.0, 9.0, 7.0, 5.0, 5.0, 6.0, 7.0, 7.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.12892520427703857, -0.12518279254436493, -0.12144038826227188, -0.11769797652959824, -0.11395557224750519, -0.11021316051483154, -0.1064707487821579, -0.10272833704948425, -0.0989859327673912, -0.09524352103471756, -0.09150111675262451, -0.08775870501995087, -0.08401629328727722, -0.08027388900518417, -0.07653147727251053, -0.07278907299041748, -0.06904666125774384, -0.06530424952507019, -0.06156184524297714, -0.0578194335103035, -0.05407702550292015, -0.050334617495536804, -0.04659220576286316, -0.04284979775547981, -0.039107389748096466, -0.03536498174071312, -0.03162257373332977, -0.027880162000656128, -0.02413775399327278, -0.020395345985889435, -0.01665293611586094, -0.012910526245832443, -0.009168118238449097, -0.0054257092997431755, -0.0016833003610372543, 0.002059108577668667, 0.005801517516374588, 0.009543925523757935, 0.01328633539378643, 0.017028745263814926, 0.020771153271198273, 0.02451356127858162, 0.028255971148610115, 0.03199838101863861, 0.03574078902602196, 0.039483197033405304, 0.04322560876607895, 0.046968016773462296, 0.05071042478084564, 0.05445283278822899, 0.058195240795612335, 0.06193765252828598, 0.06568005681037903, 0.06942246854305267, 0.07316488027572632, 0.07690729200839996, 0.08064969629049301, 0.08439210802316666, 0.0881345123052597, 0.09187692403793335, 0.095619335770607, 0.09936174005270004, 0.10310415178537369, 0.10684655606746674, 0.11058896780014038]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 3.0, 8.0, 3.0, 11.0, 9.0, 18.0, 21.0, 41.0, 51.0, 103.0, 179.0, 363.0, 820.0, 2116.0, 6987.0, 42268.0, 2654113.0, 1440820.0, 35181.0, 7297.0, 2241.0, 847.0, 360.0, 189.0, 91.0, 46.0, 33.0, 19.0, 18.0, 10.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 6.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0201416015625, -0.019610881805419922, -0.019080162048339844, -0.018549442291259766, -0.018018722534179688, -0.01748800277709961, -0.01695728302001953, -0.016426563262939453, -0.015895843505859375, -0.015365123748779297, -0.014834403991699219, -0.01430368423461914, -0.013772964477539062, -0.013242244720458984, -0.012711524963378906, -0.012180805206298828, -0.01165008544921875, -0.011119365692138672, -0.010588645935058594, -0.010057926177978516, -0.009527206420898438, -0.00899648666381836, -0.008465766906738281, -0.007935047149658203, -0.007404327392578125, -0.006873607635498047, -0.006342887878417969, -0.005812168121337891, -0.0052814483642578125, -0.004750728607177734, -0.004220008850097656, -0.003689289093017578, -0.0031585693359375, -0.002627849578857422, -0.0020971298217773438, -0.0015664100646972656, -0.0010356903076171875, -0.0005049705505371094, 2.574920654296875e-05, 0.0005564689636230469, 0.001087188720703125, 0.0016179084777832031, 0.0021486282348632812, 0.0026793479919433594, 0.0032100677490234375, 0.0037407875061035156, 0.004271507263183594, 0.004802227020263672, 0.00533294677734375, 0.005863666534423828, 0.006394386291503906, 0.006925106048583984, 0.0074558258056640625, 0.00798654556274414, 0.008517265319824219, 0.009047985076904297, 0.009578704833984375, 0.010109424591064453, 0.010640144348144531, 0.01117086410522461, 0.011701583862304688, 0.012232303619384766, 0.012763023376464844, 0.013293743133544922, 0.013824462890625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 6.0, 18.0, 25.0, 42.0, 59.0, 86.0, 104.0, 151.0, 135.0, 119.0, 84.0, 55.0, 45.0, 22.0, 17.0, 16.0, 6.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0184326171875, -0.0178377628326416, -0.017242908477783203, -0.016648054122924805, -0.016053199768066406, -0.015458345413208008, -0.01486349105834961, -0.014268636703491211, -0.013673782348632812, -0.013078927993774414, -0.012484073638916016, -0.011889219284057617, -0.011294364929199219, -0.01069951057434082, -0.010104656219482422, -0.009509801864624023, -0.008914947509765625, -0.008320093154907227, -0.007725238800048828, -0.00713038444519043, -0.006535530090332031, -0.005940675735473633, -0.005345821380615234, -0.004750967025756836, -0.0041561126708984375, -0.003561258316040039, -0.0029664039611816406, -0.002371549606323242, -0.0017766952514648438, -0.0011818408966064453, -0.0005869865417480469, 7.867813110351562e-06, 0.00060272216796875, 0.0011975765228271484, 0.0017924308776855469, 0.0023872852325439453, 0.0029821395874023438, 0.003576993942260742, 0.004171848297119141, 0.004766702651977539, 0.0053615570068359375, 0.005956411361694336, 0.006551265716552734, 0.007146120071411133, 0.007740974426269531, 0.00833582878112793, 0.008930683135986328, 0.009525537490844727, 0.010120391845703125, 0.010715246200561523, 0.011310100555419922, 0.01190495491027832, 0.012499809265136719, 0.013094663619995117, 0.013689517974853516, 0.014284372329711914, 0.014879226684570312, 0.015474081039428711, 0.01606893539428711, 0.016663789749145508, 0.017258644104003906, 0.017853498458862305, 0.018448352813720703, 0.0190432071685791, 0.0196380615234375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 7.0, 9.0, 20.0, 19.0, 20.0, 50.0, 70.0, 177.0, 561.0, 1684.0, 5762.0, 35450.0, 3840756.0, 290430.0, 14257.0, 3331.0, 1038.0, 349.0, 121.0, 52.0, 39.0, 25.0, 13.0, 8.0, 7.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0242767333984375, -0.023402929306030273, -0.022529125213623047, -0.02165532112121582, -0.020781517028808594, -0.019907712936401367, -0.01903390884399414, -0.018160104751586914, -0.017286300659179688, -0.01641249656677246, -0.015538692474365234, -0.014664888381958008, -0.013791084289550781, -0.012917280197143555, -0.012043476104736328, -0.011169672012329102, -0.010295867919921875, -0.009422063827514648, -0.008548259735107422, -0.007674455642700195, -0.006800651550292969, -0.005926847457885742, -0.005053043365478516, -0.004179239273071289, -0.0033054351806640625, -0.002431631088256836, -0.0015578269958496094, -0.0006840229034423828, 0.00018978118896484375, 0.0010635852813720703, 0.0019373893737792969, 0.0028111934661865234, 0.00368499755859375, 0.0045588016510009766, 0.005432605743408203, 0.00630640983581543, 0.007180213928222656, 0.008054018020629883, 0.00892782211303711, 0.009801626205444336, 0.010675430297851562, 0.011549234390258789, 0.012423038482666016, 0.013296842575073242, 0.014170646667480469, 0.015044450759887695, 0.015918254852294922, 0.01679205894470215, 0.017665863037109375, 0.0185396671295166, 0.019413471221923828, 0.020287275314331055, 0.02116107940673828, 0.022034883499145508, 0.022908687591552734, 0.02378249168395996, 0.024656295776367188, 0.025530099868774414, 0.02640390396118164, 0.027277708053588867, 0.028151512145996094, 0.02902531623840332, 0.029899120330810547, 0.030772924423217773, 0.031646728515625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 5.0, 9.0, 13.0, 21.0, 25.0, 39.0, 64.0, 130.0, 329.0, 814.0, 1340.0, 659.0, 265.0, 135.0, 59.0, 36.0, 31.0, 28.0, 7.0, 10.0, 6.0, 4.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0178680419921875, -0.017348527908325195, -0.01682901382446289, -0.016309499740600586, -0.01578998565673828, -0.015270471572875977, -0.014750957489013672, -0.014231443405151367, -0.013711929321289062, -0.013192415237426758, -0.012672901153564453, -0.012153387069702148, -0.011633872985839844, -0.011114358901977539, -0.010594844818115234, -0.01007533073425293, -0.009555816650390625, -0.00903630256652832, -0.008516788482666016, -0.007997274398803711, -0.007477760314941406, -0.0069582462310791016, -0.006438732147216797, -0.005919218063354492, -0.0053997039794921875, -0.004880189895629883, -0.004360675811767578, -0.0038411617279052734, -0.0033216476440429688, -0.002802133560180664, -0.0022826194763183594, -0.0017631053924560547, -0.00124359130859375, -0.0007240772247314453, -0.00020456314086914062, 0.00031495094299316406, 0.0008344650268554688, 0.0013539791107177734, 0.0018734931945800781, 0.002393007278442383, 0.0029125213623046875, 0.003432035446166992, 0.003951549530029297, 0.0044710636138916016, 0.004990577697753906, 0.005510091781616211, 0.006029605865478516, 0.00654911994934082, 0.007068634033203125, 0.00758814811706543, 0.008107662200927734, 0.008627176284790039, 0.009146690368652344, 0.009666204452514648, 0.010185718536376953, 0.010705232620239258, 0.011224746704101562, 0.011744260787963867, 0.012263774871826172, 0.012783288955688477, 0.013302803039550781, 0.013822317123413086, 0.01434183120727539, 0.014861345291137695, 0.015380859375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 12.0, 37.0, 109.0, 327.0, 335.0, 116.0, 44.0, 13.0, 7.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1360357701778412, -0.12922190129756927, -0.12240803986787796, -0.11559417843818665, -0.10878030955791473, -0.10196644812822342, -0.0951525866985321, -0.08833871781826019, -0.08152485638856888, -0.07471099495887756, -0.06789712607860565, -0.06108326464891434, -0.054269399493932724, -0.04745553433895111, -0.040641672909259796, -0.03382780775427818, -0.02701394259929657, -0.020200077444314957, -0.013386214151978493, -0.006572350859642029, 0.00024151429533958435, 0.0070553794503211975, 0.013869240880012512, 0.020683106034994125, 0.02749697118997574, 0.03431083634495735, 0.041124701499938965, 0.04793856292963028, 0.05475242808461189, 0.061566293239593506, 0.06838015466928482, 0.07519401609897614, 0.08200788497924805, 0.08882174640893936, 0.09563561528921127, 0.10244947671890259, 0.1092633455991745, 0.11607720702886581, 0.12289106845855713, 0.12970493733882904, 0.13651880621910095, 0.14333267509937286, 0.15014652907848358, 0.1569603979587555, 0.1637742668390274, 0.17058813571929932, 0.17740198969841003, 0.18421585857868195, 0.19102971255779266, 0.19784358143806458, 0.2046574354171753, 0.2114713042974472, 0.21828517317771912, 0.22509902715682983, 0.23191289603710175, 0.23872676491737366, 0.24554061889648438, 0.2523544728755951, 0.2591683566570282, 0.2659822106361389, 0.27279606461524963, 0.27960994839668274, 0.28642380237579346, 0.2932376563549042, 0.3000515401363373]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 8.0, 5.0, 7.0, 8.0, 15.0, 9.0, 8.0, 17.0, 19.0, 23.0, 26.0, 34.0, 34.0, 28.0, 46.0, 42.0, 47.0, 48.0, 51.0, 50.0, 50.0, 42.0, 39.0, 47.0, 41.0, 35.0, 31.0, 35.0, 21.0, 29.0, 14.0, 18.0, 13.0, 9.0, 12.0, 9.0, 6.0, 3.0, 3.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.05185800790786743, -0.050297170877456665, -0.0487363338470459, -0.04717549681663513, -0.045614659786224365, -0.0440538227558136, -0.04249298572540283, -0.040932148694992065, -0.0393713116645813, -0.03781047463417053, -0.036249637603759766, -0.034688800573349, -0.03312796354293823, -0.031567126512527466, -0.0300062894821167, -0.028445452451705933, -0.026884615421295166, -0.0253237783908844, -0.023762941360473633, -0.022202104330062866, -0.0206412672996521, -0.019080430269241333, -0.017519593238830566, -0.0159587562084198, -0.014397919178009033, -0.012837082147598267, -0.0112762451171875, -0.009715408086776733, -0.008154571056365967, -0.0065937340259552, -0.005032896995544434, -0.003472059965133667, -0.0019112229347229004, -0.0003503859043121338, 0.0012104511260986328, 0.0027712881565093994, 0.004332125186920166, 0.005892962217330933, 0.007453799247741699, 0.009014636278152466, 0.010575473308563232, 0.012136310338973999, 0.013697147369384766, 0.015257984399795532, 0.0168188214302063, 0.018379658460617065, 0.019940495491027832, 0.0215013325214386, 0.023062169551849365, 0.024623006582260132, 0.0261838436126709, 0.027744680643081665, 0.02930551767349243, 0.030866354703903198, 0.032427191734313965, 0.03398802876472473, 0.0355488657951355, 0.037109702825546265, 0.03867053985595703, 0.0402313768863678, 0.041792213916778564, 0.04335305094718933, 0.0449138879776001, 0.046474725008010864, 0.04803556203842163]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 8.0, 6.0, 10.0, 23.0, 22.0, 21.0, 31.0, 36.0, 60.0, 92.0, 140.0, 213.0, 312.0, 511.0, 894.0, 1693.0, 3247.0, 7777.0, 21607.0, 74377.0, 357908.0, 443938.0, 92898.0, 25535.0, 9011.0, 3795.0, 1842.0, 970.0, 579.0, 303.0, 219.0, 147.0, 82.0, 68.0, 52.0, 34.0, 24.0, 16.0, 20.0, 6.0, 10.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0233612060546875, -0.022609472274780273, -0.021857738494873047, -0.02110600471496582, -0.020354270935058594, -0.019602537155151367, -0.01885080337524414, -0.018099069595336914, -0.017347335815429688, -0.01659560203552246, -0.015843868255615234, -0.015092134475708008, -0.014340400695800781, -0.013588666915893555, -0.012836933135986328, -0.012085199356079102, -0.011333465576171875, -0.010581731796264648, -0.009829998016357422, -0.009078264236450195, -0.008326530456542969, -0.007574796676635742, -0.006823062896728516, -0.006071329116821289, -0.0053195953369140625, -0.004567861557006836, -0.0038161277770996094, -0.003064393997192383, -0.0023126602172851562, -0.0015609264373779297, -0.0008091926574707031, -5.745887756347656e-05, 0.00069427490234375, 0.0014460086822509766, 0.002197742462158203, 0.0029494762420654297, 0.0037012100219726562, 0.004452943801879883, 0.005204677581787109, 0.005956411361694336, 0.0067081451416015625, 0.007459878921508789, 0.008211612701416016, 0.008963346481323242, 0.009715080261230469, 0.010466814041137695, 0.011218547821044922, 0.011970281600952148, 0.012722015380859375, 0.013473749160766602, 0.014225482940673828, 0.014977216720581055, 0.01572895050048828, 0.016480684280395508, 0.017232418060302734, 0.01798415184020996, 0.018735885620117188, 0.019487619400024414, 0.02023935317993164, 0.020991086959838867, 0.021742820739746094, 0.02249455451965332, 0.023246288299560547, 0.023998022079467773, 0.024749755859375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 2.0, 4.0, 6.0, 18.0, 26.0, 51.0, 59.0, 89.0, 108.0, 142.0, 139.0, 110.0, 82.0, 58.0, 38.0, 20.0, 18.0, 7.0, 18.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0183868408203125, -0.0177919864654541, -0.017197132110595703, -0.016602277755737305, -0.016007423400878906, -0.015412569046020508, -0.01481771469116211, -0.014222860336303711, -0.013628005981445312, -0.013033151626586914, -0.012438297271728516, -0.011843442916870117, -0.011248588562011719, -0.01065373420715332, -0.010058879852294922, -0.009464025497436523, -0.008869171142578125, -0.008274316787719727, -0.007679462432861328, -0.00708460807800293, -0.006489753723144531, -0.005894899368286133, -0.005300045013427734, -0.004705190658569336, -0.0041103363037109375, -0.003515481948852539, -0.0029206275939941406, -0.002325773239135742, -0.0017309188842773438, -0.0011360645294189453, -0.0005412101745605469, 5.364418029785156e-05, 0.00064849853515625, 0.0012433528900146484, 0.0018382072448730469, 0.0024330615997314453, 0.0030279159545898438, 0.003622770309448242, 0.004217624664306641, 0.004812479019165039, 0.0054073333740234375, 0.006002187728881836, 0.006597042083740234, 0.007191896438598633, 0.007786750793457031, 0.00838160514831543, 0.008976459503173828, 0.009571313858032227, 0.010166168212890625, 0.010761022567749023, 0.011355876922607422, 0.01195073127746582, 0.012545585632324219, 0.013140439987182617, 0.013735294342041016, 0.014330148696899414, 0.014925003051757812, 0.015519857406616211, 0.01611471176147461, 0.016709566116333008, 0.017304420471191406, 0.017899274826049805, 0.018494129180908203, 0.0190889835357666, 0.019683837890625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 8.0, 19.0, 14.0, 26.0, 45.0, 58.0, 102.0, 167.0, 243.0, 426.0, 780.0, 1463.0, 3122.0, 7500.0, 21376.0, 80477.0, 610545.0, 247701.0, 49111.0, 14711.0, 5575.0, 2374.0, 1120.0, 604.0, 336.0, 238.0, 144.0, 76.0, 54.0, 38.0, 31.0, 21.0, 13.0, 4.0, 7.0, 7.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0274200439453125, -0.026558637619018555, -0.02569723129272461, -0.024835824966430664, -0.02397441864013672, -0.023113012313842773, -0.022251605987548828, -0.021390199661254883, -0.020528793334960938, -0.019667387008666992, -0.018805980682373047, -0.0179445743560791, -0.017083168029785156, -0.01622176170349121, -0.015360355377197266, -0.01449894905090332, -0.013637542724609375, -0.01277613639831543, -0.011914730072021484, -0.011053323745727539, -0.010191917419433594, -0.009330511093139648, -0.008469104766845703, -0.007607698440551758, -0.0067462921142578125, -0.005884885787963867, -0.005023479461669922, -0.0041620731353759766, -0.0033006668090820312, -0.002439260482788086, -0.0015778541564941406, -0.0007164478302001953, 0.00014495849609375, 0.0010063648223876953, 0.0018677711486816406, 0.002729177474975586, 0.0035905838012695312, 0.0044519901275634766, 0.005313396453857422, 0.006174802780151367, 0.0070362091064453125, 0.007897615432739258, 0.008759021759033203, 0.009620428085327148, 0.010481834411621094, 0.011343240737915039, 0.012204647064208984, 0.01306605339050293, 0.013927459716796875, 0.01478886604309082, 0.015650272369384766, 0.01651167869567871, 0.017373085021972656, 0.0182344913482666, 0.019095897674560547, 0.019957304000854492, 0.020818710327148438, 0.021680116653442383, 0.022541522979736328, 0.023402929306030273, 0.02426433563232422, 0.025125741958618164, 0.02598714828491211, 0.026848554611206055, 0.0277099609375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 8.0, 3.0, 4.0, 2.0, 7.0, 10.0, 11.0, 21.0, 19.0, 22.0, 20.0, 30.0, 32.0, 40.0, 35.0, 44.0, 49.0, 42.0, 52.0, 52.0, 65.0, 68.0, 56.0, 47.0, 39.0, 35.0, 28.0, 39.0, 27.0, 25.0, 14.0, 8.0, 10.0, 11.0, 7.0, 4.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.033416748046875, -0.03235816955566406, -0.031299591064453125, -0.030241012573242188, -0.02918243408203125, -0.028123855590820312, -0.027065277099609375, -0.026006698608398438, -0.0249481201171875, -0.023889541625976562, -0.022830963134765625, -0.021772384643554688, -0.02071380615234375, -0.019655227661132812, -0.018596649169921875, -0.017538070678710938, -0.0164794921875, -0.015420913696289062, -0.014362335205078125, -0.013303756713867188, -0.01224517822265625, -0.011186599731445312, -0.010128021240234375, -0.009069442749023438, -0.0080108642578125, -0.0069522857666015625, -0.005893707275390625, -0.0048351287841796875, -0.00377655029296875, -0.0027179718017578125, -0.001659393310546875, -0.0006008148193359375, 0.000457763671875, 0.0015163421630859375, 0.002574920654296875, 0.0036334991455078125, 0.00469207763671875, 0.0057506561279296875, 0.006809234619140625, 0.007867813110351562, 0.0089263916015625, 0.009984970092773438, 0.011043548583984375, 0.012102127075195312, 0.01316070556640625, 0.014219284057617188, 0.015277862548828125, 0.016336441040039062, 0.01739501953125, 0.018453598022460938, 0.019512176513671875, 0.020570755004882812, 0.02162933349609375, 0.022687911987304688, 0.023746490478515625, 0.024805068969726562, 0.0258636474609375, 0.026922225952148438, 0.027980804443359375, 0.029039382934570312, 0.03009796142578125, 0.031156539916992188, 0.032215118408203125, 0.03327369689941406, 0.034332275390625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 1.0, 4.0, 8.0, 15.0, 18.0, 22.0, 34.0, 68.0, 106.0, 181.0, 367.0, 756.0, 1883.0, 5716.0, 26944.0, 310126.0, 657158.0, 34398.0, 6919.0, 2070.0, 845.0, 408.0, 189.0, 117.0, 63.0, 41.0, 20.0, 13.0, 14.0, 10.0, 9.0, 4.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0083465576171875, -0.008077859878540039, -0.007809162139892578, -0.007540464401245117, -0.007271766662597656, -0.007003068923950195, -0.006734371185302734, -0.0064656734466552734, -0.0061969757080078125, -0.0059282779693603516, -0.005659580230712891, -0.00539088249206543, -0.005122184753417969, -0.004853487014770508, -0.004584789276123047, -0.004316091537475586, -0.004047393798828125, -0.003778696060180664, -0.003509998321533203, -0.003241300582885742, -0.0029726028442382812, -0.0027039051055908203, -0.0024352073669433594, -0.0021665096282958984, -0.0018978118896484375, -0.0016291141510009766, -0.0013604164123535156, -0.0010917186737060547, -0.0008230209350585938, -0.0005543231964111328, -0.0002856254577636719, -1.6927719116210938e-05, 0.00025177001953125, 0.0005204677581787109, 0.0007891654968261719, 0.0010578632354736328, 0.0013265609741210938, 0.0015952587127685547, 0.0018639564514160156, 0.0021326541900634766, 0.0024013519287109375, 0.0026700496673583984, 0.0029387474060058594, 0.0032074451446533203, 0.0034761428833007812, 0.003744840621948242, 0.004013538360595703, 0.004282236099243164, 0.004550933837890625, 0.004819631576538086, 0.005088329315185547, 0.005357027053833008, 0.005625724792480469, 0.00589442253112793, 0.006163120269775391, 0.0064318180084228516, 0.0067005157470703125, 0.0069692134857177734, 0.007237911224365234, 0.007506608963012695, 0.007775306701660156, 0.008044004440307617, 0.008312702178955078, 0.008581399917602539, 0.00885009765625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 9.0, 7.0, 7.0, 9.0, 13.0, 15.0, 31.0, 26.0, 29.0, 46.0, 47.0, 41.0, 77.0, 48.0, 57.0, 82.0, 46.0, 56.0, 62.0, 47.0, 42.0, 68.0, 21.0, 25.0, 24.0, 10.0, 13.0, 16.0, 6.0, 2.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.231929779052734e-06, -4.093162715435028e-06, -3.954395651817322e-06, -3.8156285881996155e-06, -3.676861524581909e-06, -3.538094460964203e-06, -3.3993273973464966e-06, -3.2605603337287903e-06, -3.121793270111084e-06, -2.9830262064933777e-06, -2.8442591428756714e-06, -2.705492079257965e-06, -2.566725015640259e-06, -2.4279579520225525e-06, -2.289190888404846e-06, -2.15042382478714e-06, -2.0116567611694336e-06, -1.8728896975517273e-06, -1.734122633934021e-06, -1.5953555703163147e-06, -1.4565885066986084e-06, -1.317821443080902e-06, -1.1790543794631958e-06, -1.0402873158454895e-06, -9.015202522277832e-07, -7.627531886100769e-07, -6.239861249923706e-07, -4.852190613746643e-07, -3.46451997756958e-07, -2.076849341392517e-07, -6.891787052154541e-08, 6.984919309616089e-08, 2.086162567138672e-07, 3.473833203315735e-07, 4.861503839492798e-07, 6.249174475669861e-07, 7.636845111846924e-07, 9.024515748023987e-07, 1.041218638420105e-06, 1.1799857020378113e-06, 1.3187527656555176e-06, 1.4575198292732239e-06, 1.5962868928909302e-06, 1.7350539565086365e-06, 1.8738210201263428e-06, 2.012588083744049e-06, 2.1513551473617554e-06, 2.2901222109794617e-06, 2.428889274597168e-06, 2.5676563382148743e-06, 2.7064234018325806e-06, 2.845190465450287e-06, 2.983957529067993e-06, 3.1227245926856995e-06, 3.2614916563034058e-06, 3.400258719921112e-06, 3.5390257835388184e-06, 3.6777928471565247e-06, 3.816559910774231e-06, 3.955326974391937e-06, 4.0940940380096436e-06, 4.23286110162735e-06, 4.371628165245056e-06, 4.5103952288627625e-06, 4.649162292480469e-06]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 8.0, 13.0, 22.0, 27.0, 42.0, 41.0, 80.0, 134.0, 209.0, 377.0, 642.0, 1151.0, 2572.0, 6293.0, 18668.0, 76075.0, 652451.0, 227269.0, 42157.0, 11897.0, 4377.0, 1821.0, 901.0, 510.0, 284.0, 178.0, 114.0, 73.0, 47.0, 36.0, 27.0, 17.0, 8.0, 12.0, 6.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005596160888671875, -0.005425572395324707, -0.005254983901977539, -0.005084395408630371, -0.004913806915283203, -0.004743218421936035, -0.004572629928588867, -0.004402041435241699, -0.004231452941894531, -0.004060864448547363, -0.0038902759552001953, -0.0037196874618530273, -0.0035490989685058594, -0.0033785104751586914, -0.0032079219818115234, -0.0030373334884643555, -0.0028667449951171875, -0.0026961565017700195, -0.0025255680084228516, -0.0023549795150756836, -0.0021843910217285156, -0.0020138025283813477, -0.0018432140350341797, -0.0016726255416870117, -0.0015020370483398438, -0.0013314485549926758, -0.0011608600616455078, -0.0009902715682983398, -0.0008196830749511719, -0.0006490945816040039, -0.00047850608825683594, -0.00030791759490966797, -0.0001373291015625, 3.325939178466797e-05, 0.00020384788513183594, 0.0003744363784790039, 0.0005450248718261719, 0.0007156133651733398, 0.0008862018585205078, 0.0010567903518676758, 0.0012273788452148438, 0.0013979673385620117, 0.0015685558319091797, 0.0017391443252563477, 0.0019097328186035156, 0.0020803213119506836, 0.0022509098052978516, 0.0024214982986450195, 0.0025920867919921875, 0.0027626752853393555, 0.0029332637786865234, 0.0031038522720336914, 0.0032744407653808594, 0.0034450292587280273, 0.0036156177520751953, 0.0037862062454223633, 0.003956794738769531, 0.004127383232116699, 0.004297971725463867, 0.004468560218811035, 0.004639148712158203, 0.004809737205505371, 0.004980325698852539, 0.005150914192199707, 0.005321502685546875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 4.0, 5.0, 7.0, 5.0, 10.0, 18.0, 20.0, 23.0, 28.0, 41.0, 52.0, 89.0, 83.0, 108.0, 99.0, 92.0, 82.0, 59.0, 38.0, 32.0, 23.0, 16.0, 12.0, 8.0, 14.0, 7.0, 6.0, 3.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00861358642578125, -0.008326530456542969, -0.008039474487304688, -0.007752418518066406, -0.007465362548828125, -0.007178306579589844, -0.0068912506103515625, -0.006604194641113281, -0.006317138671875, -0.006030082702636719, -0.0057430267333984375, -0.005455970764160156, -0.005168914794921875, -0.004881858825683594, -0.0045948028564453125, -0.004307746887207031, -0.00402069091796875, -0.0037336349487304688, -0.0034465789794921875, -0.0031595230102539062, -0.002872467041015625, -0.0025854110717773438, -0.0022983551025390625, -0.0020112991333007812, -0.0017242431640625, -0.0014371871948242188, -0.0011501312255859375, -0.0008630752563476562, -0.000576019287109375, -0.00028896331787109375, -1.9073486328125e-06, 0.00028514862060546875, 0.00057220458984375, 0.0008592605590820312, 0.0011463165283203125, 0.0014333724975585938, 0.001720428466796875, 0.0020074844360351562, 0.0022945404052734375, 0.0025815963745117188, 0.00286865234375, 0.0031557083129882812, 0.0034427642822265625, 0.0037298202514648438, 0.004016876220703125, 0.004303932189941406, 0.0045909881591796875, 0.004878044128417969, 0.00516510009765625, 0.005452156066894531, 0.0057392120361328125, 0.006026268005371094, 0.006313323974609375, 0.006600379943847656, 0.0068874359130859375, 0.007174491882324219, 0.0074615478515625, 0.007748603820800781, 0.008035659790039062, 0.008322715759277344, 0.008609771728515625, 0.008896827697753906, 0.009183883666992188, 0.009470939636230469, 0.00975799560546875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 8.0, 4.0, 14.0, 13.0, 13.0, 37.0, 31.0, 58.0, 102.0, 130.0, 254.0, 141.0, 73.0, 47.0, 21.0, 12.0, 14.0, 9.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2625066637992859, -0.2566257417201996, -0.2507448196411133, -0.24486388266086578, -0.23898296058177948, -0.23310202360153198, -0.22722110152244568, -0.22134017944335938, -0.21545924246311188, -0.20957832038402557, -0.20369738340377808, -0.19781646132469177, -0.19193553924560547, -0.18605460226535797, -0.18017368018627167, -0.17429274320602417, -0.16841182112693787, -0.16253089904785156, -0.15664996206760406, -0.15076903998851776, -0.14488811790943146, -0.13900718092918396, -0.13312625885009766, -0.12724533677101135, -0.12136441469192505, -0.11548348516225815, -0.10960256308317184, -0.10372163355350494, -0.09784070402383804, -0.09195977449417114, -0.08607885241508484, -0.08019792288541794, -0.07431699335575104, -0.06843606382608414, -0.06255514174699783, -0.05667421221733093, -0.05079328268766403, -0.04491235688328743, -0.03903143107891083, -0.03315050154924393, -0.027269575744867325, -0.021388648077845573, -0.015507721342146397, -0.00962679460644722, -0.0037458669394254684, 0.002135060727596283, 0.008015986531972885, 0.013896916061639786, 0.019777841866016388, 0.02565876953303814, 0.03153969720005989, 0.03742062300443649, 0.043301552534103394, 0.049182478338479996, 0.0550634041428566, 0.0609443336725235, 0.0668252557516098, 0.0727061852812767, 0.078587107360363, 0.08446803689002991, 0.09034896641969681, 0.09622989594936371, 0.10211081802845001, 0.10799174755811691, 0.11387267708778381]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 6.0, 3.0, 9.0, 12.0, 6.0, 8.0, 11.0, 7.0, 12.0, 25.0, 8.0, 11.0, 23.0, 21.0, 27.0, 34.0, 37.0, 36.0, 52.0, 72.0, 66.0, 71.0, 58.0, 42.0, 45.0, 25.0, 27.0, 23.0, 29.0, 16.0, 14.0, 22.0, 17.0, 18.0, 15.0, 15.0, 13.0, 13.0, 8.0, 4.0, 10.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.09438371658325195, -0.091534823179245, -0.08868593722581863, -0.08583704382181168, -0.08298815786838531, -0.08013926446437836, -0.0772903710603714, -0.07444147765636444, -0.07159259170293808, -0.06874369829893112, -0.06589481234550476, -0.0630459189414978, -0.06019702926278114, -0.057348139584064484, -0.054499246180057526, -0.051650356501340866, -0.04880146682262421, -0.04595257714390755, -0.04310368746519089, -0.04025479406118393, -0.03740590438246727, -0.03455701470375061, -0.03170812129974365, -0.028859231621026993, -0.026010341942310333, -0.023161452263593674, -0.020312560722231865, -0.017463669180870056, -0.014614779502153397, -0.011765888892114162, -0.008916998282074928, -0.0060681067407131195, -0.00321921706199646, -0.0003703264519572258, 0.0024785641580820084, 0.0053274547681212425, 0.008176345378160477, 0.01102523598819971, 0.013874126598238945, 0.016723018139600754, 0.019571907818317413, 0.022420797497034073, 0.02526968903839588, 0.02811858057975769, 0.03096747025847435, 0.03381635993719101, 0.03666525334119797, 0.03951414301991463, 0.04236303269863129, 0.045211922377347946, 0.048060812056064606, 0.050909705460071564, 0.05375859513878822, 0.05660748481750488, 0.05945637822151184, 0.0623052679002285, 0.06515415757894516, 0.06800305098295212, 0.07085193693637848, 0.07370083034038544, 0.0765497237443924, 0.07939860969781876, 0.08224750310182571, 0.08509638905525208, 0.08794528245925903]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 6.0, 12.0, 7.0, 26.0, 30.0, 34.0, 55.0, 105.0, 211.0, 394.0, 863.0, 2140.0, 7024.0, 44198.0, 2409457.0, 1677919.0, 40288.0, 7580.0, 2169.0, 864.0, 401.0, 205.0, 117.0, 64.0, 48.0, 15.0, 16.0, 6.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0235137939453125, -0.022910356521606445, -0.02230691909790039, -0.021703481674194336, -0.02110004425048828, -0.020496606826782227, -0.019893169403076172, -0.019289731979370117, -0.018686294555664062, -0.018082857131958008, -0.017479419708251953, -0.0168759822845459, -0.016272544860839844, -0.01566910743713379, -0.015065670013427734, -0.01446223258972168, -0.013858795166015625, -0.01325535774230957, -0.012651920318603516, -0.012048482894897461, -0.011445045471191406, -0.010841608047485352, -0.010238170623779297, -0.009634733200073242, -0.009031295776367188, -0.008427858352661133, -0.007824420928955078, -0.0072209835052490234, -0.006617546081542969, -0.006014108657836914, -0.005410671234130859, -0.004807233810424805, -0.00420379638671875, -0.0036003589630126953, -0.0029969215393066406, -0.002393484115600586, -0.0017900466918945312, -0.0011866092681884766, -0.0005831718444824219, 2.0265579223632812e-05, 0.0006237030029296875, 0.0012271404266357422, 0.0018305778503417969, 0.0024340152740478516, 0.0030374526977539062, 0.003640890121459961, 0.004244327545166016, 0.00484776496887207, 0.005451202392578125, 0.00605463981628418, 0.006658077239990234, 0.007261514663696289, 0.007864952087402344, 0.008468389511108398, 0.009071826934814453, 0.009675264358520508, 0.010278701782226562, 0.010882139205932617, 0.011485576629638672, 0.012089014053344727, 0.012692451477050781, 0.013295888900756836, 0.01389932632446289, 0.014502763748168945, 0.015106201171875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 7.0, 7.0, 5.0, 19.0, 20.0, 33.0, 59.0, 98.0, 103.0, 131.0, 146.0, 106.0, 86.0, 55.0, 53.0, 31.0, 17.0, 12.0, 9.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0185089111328125, -0.017913341522216797, -0.017317771911621094, -0.01672220230102539, -0.016126632690429688, -0.015531063079833984, -0.014935493469238281, -0.014339923858642578, -0.013744354248046875, -0.013148784637451172, -0.012553215026855469, -0.011957645416259766, -0.011362075805664062, -0.01076650619506836, -0.010170936584472656, -0.009575366973876953, -0.00897979736328125, -0.008384227752685547, -0.007788658142089844, -0.007193088531494141, -0.0065975189208984375, -0.006001949310302734, -0.005406379699707031, -0.004810810089111328, -0.004215240478515625, -0.003619670867919922, -0.0030241012573242188, -0.0024285316467285156, -0.0018329620361328125, -0.0012373924255371094, -0.0006418228149414062, -4.6253204345703125e-05, 0.00054931640625, 0.0011448860168457031, 0.0017404556274414062, 0.0023360252380371094, 0.0029315948486328125, 0.0035271644592285156, 0.004122734069824219, 0.004718303680419922, 0.005313873291015625, 0.005909442901611328, 0.006505012512207031, 0.007100582122802734, 0.0076961517333984375, 0.00829172134399414, 0.008887290954589844, 0.009482860565185547, 0.01007843017578125, 0.010673999786376953, 0.011269569396972656, 0.01186513900756836, 0.012460708618164062, 0.013056278228759766, 0.013651847839355469, 0.014247417449951172, 0.014842987060546875, 0.015438556671142578, 0.01603412628173828, 0.016629695892333984, 0.017225265502929688, 0.01782083511352539, 0.018416404724121094, 0.019011974334716797, 0.0196075439453125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 5.0, 13.0, 15.0, 24.0, 33.0, 65.0, 137.0, 319.0, 943.0, 3456.0, 19323.0, 1973645.0, 2170640.0, 20482.0, 3522.0, 1003.0, 349.0, 145.0, 50.0, 37.0, 28.0, 15.0, 8.0, 4.0, 2.0, 4.0, 4.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031341552734375, -0.030180931091308594, -0.029020309448242188, -0.02785968780517578, -0.026699066162109375, -0.02553844451904297, -0.024377822875976562, -0.023217201232910156, -0.02205657958984375, -0.020895957946777344, -0.019735336303710938, -0.01857471466064453, -0.017414093017578125, -0.01625347137451172, -0.015092849731445312, -0.013932228088378906, -0.0127716064453125, -0.011610984802246094, -0.010450363159179688, -0.009289741516113281, -0.008129119873046875, -0.006968498229980469, -0.0058078765869140625, -0.004647254943847656, -0.00348663330078125, -0.0023260116577148438, -0.0011653900146484375, -4.76837158203125e-06, 0.001155853271484375, 0.0023164749145507812, 0.0034770965576171875, 0.004637718200683594, 0.00579833984375, 0.006958961486816406, 0.008119583129882812, 0.009280204772949219, 0.010440826416015625, 0.011601448059082031, 0.012762069702148438, 0.013922691345214844, 0.01508331298828125, 0.016243934631347656, 0.017404556274414062, 0.01856517791748047, 0.019725799560546875, 0.02088642120361328, 0.022047042846679688, 0.023207664489746094, 0.0243682861328125, 0.025528907775878906, 0.026689529418945312, 0.02785015106201172, 0.029010772705078125, 0.03017139434814453, 0.03133201599121094, 0.032492637634277344, 0.03365325927734375, 0.034813880920410156, 0.03597450256347656, 0.03713512420654297, 0.038295745849609375, 0.03945636749267578, 0.04061698913574219, 0.041777610778808594, 0.042938232421875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 6.0, 6.0, 13.0, 17.0, 18.0, 42.0, 73.0, 184.0, 565.0, 1461.0, 1051.0, 323.0, 125.0, 60.0, 25.0, 31.0, 17.0, 14.0, 10.0, 7.0, 4.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0308380126953125, -0.029950380325317383, -0.029062747955322266, -0.02817511558532715, -0.02728748321533203, -0.026399850845336914, -0.025512218475341797, -0.02462458610534668, -0.023736953735351562, -0.022849321365356445, -0.021961688995361328, -0.02107405662536621, -0.020186424255371094, -0.019298791885375977, -0.01841115951538086, -0.017523527145385742, -0.016635894775390625, -0.015748262405395508, -0.01486063003540039, -0.013972997665405273, -0.013085365295410156, -0.012197732925415039, -0.011310100555419922, -0.010422468185424805, -0.009534835815429688, -0.00864720344543457, -0.007759571075439453, -0.006871938705444336, -0.005984306335449219, -0.0050966739654541016, -0.004209041595458984, -0.003321409225463867, -0.00243377685546875, -0.0015461444854736328, -0.0006585121154785156, 0.00022912025451660156, 0.0011167526245117188, 0.002004384994506836, 0.002892017364501953, 0.0037796497344970703, 0.0046672821044921875, 0.005554914474487305, 0.006442546844482422, 0.007330179214477539, 0.008217811584472656, 0.009105443954467773, 0.00999307632446289, 0.010880708694458008, 0.011768341064453125, 0.012655973434448242, 0.01354360580444336, 0.014431238174438477, 0.015318870544433594, 0.01620650291442871, 0.017094135284423828, 0.017981767654418945, 0.018869400024414062, 0.01975703239440918, 0.020644664764404297, 0.021532297134399414, 0.02241992950439453, 0.02330756187438965, 0.024195194244384766, 0.025082826614379883, 0.025970458984375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 8.0, 6.0, 14.0, 25.0, 35.0, 94.0, 115.0, 192.0, 198.0, 141.0, 74.0, 40.0, 23.0, 12.0, 12.0, 7.0, 8.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08114591985940933, -0.07632295042276382, -0.07149998098611832, -0.06667700409889221, -0.061854034662246704, -0.057031065225601196, -0.05220809578895569, -0.04738512262701988, -0.042562153190374374, -0.03773918375372887, -0.03291621059179306, -0.028093241155147552, -0.023270269855856895, -0.01844729855656624, -0.01362432911992073, -0.008801355957984924, -0.0039783865213394165, 0.0008445843122899532, 0.005667555145919323, 0.010490525513887405, 0.015313496813178062, 0.02013646811246872, 0.024959437549114227, 0.029782410711050034, 0.03460538014769554, 0.03942834958434105, 0.044251322746276855, 0.04907429218292236, 0.05389726161956787, 0.05872023478150368, 0.06354320049285889, 0.06836617738008499, 0.0731891542673111, 0.0780121237039566, 0.08283509314060211, 0.08765806257724762, 0.09248103946447372, 0.09730400890111923, 0.10212697833776474, 0.10694995522499084, 0.11177292466163635, 0.11659589409828186, 0.12141886353492737, 0.12624183297157288, 0.13106480240821838, 0.1358877718448639, 0.1407107412815094, 0.1455337256193161, 0.15035668015480042, 0.15517964959144592, 0.16000261902809143, 0.16482558846473694, 0.16964855790138245, 0.17447152733802795, 0.17929449677467346, 0.18411748111248016, 0.18894045054912567, 0.19376341998577118, 0.1985863894224167, 0.2034093588590622, 0.2082323282957077, 0.2130553126335144, 0.2178782820701599, 0.22270125150680542, 0.22752422094345093]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 5.0, 4.0, 8.0, 7.0, 10.0, 5.0, 7.0, 17.0, 18.0, 21.0, 31.0, 22.0, 30.0, 43.0, 47.0, 37.0, 38.0, 53.0, 46.0, 46.0, 51.0, 36.0, 50.0, 48.0, 37.0, 42.0, 41.0, 40.0, 26.0, 28.0, 23.0, 22.0, 12.0, 5.0, 15.0, 6.0, 5.0, 7.0, 2.0, 1.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09113991260528564, -0.08831251412630081, -0.08548511564731598, -0.08265771716833115, -0.07983031868934631, -0.07700292766094208, -0.07417552918195724, -0.07134813070297241, -0.06852073222398758, -0.06569333374500275, -0.06286593526601791, -0.06003854051232338, -0.05721114203333855, -0.054383743554353714, -0.05155634880065918, -0.04872895032167435, -0.045901551842689514, -0.04307415336370468, -0.04024675488471985, -0.037419360131025314, -0.03459196165204048, -0.03176456317305565, -0.028937166556715965, -0.026109769940376282, -0.02328237146139145, -0.020454972982406616, -0.017627576366066933, -0.014800178818404675, -0.011972781270742416, -0.009145383723080158, -0.0063179861754179, -0.0034905895590782166, -0.0006631910800933838, 0.0021642064675688744, 0.0049916040152311325, 0.00781900156289339, 0.010646399110555649, 0.013473796658217907, 0.016301194205880165, 0.01912859082221985, 0.02195598930120468, 0.024783387780189514, 0.027610784396529198, 0.03043818101286888, 0.033265579491853714, 0.03609297797083855, 0.03892037272453308, 0.041747771203517914, 0.04457516968250275, 0.04740256816148758, 0.05022996664047241, 0.053057361394166946, 0.05588475987315178, 0.05871215835213661, 0.061539553105831146, 0.06436695158481598, 0.06719435006380081, 0.07002174854278564, 0.07284914702177048, 0.07567654550075531, 0.07850393652915955, 0.08133133500814438, 0.08415873348712921, 0.08698613196611404, 0.08981353044509888]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 0.0, 4.0, 4.0, 7.0, 6.0, 21.0, 18.0, 29.0, 55.0, 52.0, 85.0, 119.0, 198.0, 356.0, 576.0, 1063.0, 2113.0, 4179.0, 9616.0, 25827.0, 88883.0, 460747.0, 347137.0, 69994.0, 21488.0, 8136.0, 3597.0, 1798.0, 1013.0, 536.0, 324.0, 180.0, 131.0, 88.0, 57.0, 47.0, 14.0, 28.0, 15.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.032501220703125, -0.03144979476928711, -0.03039836883544922, -0.029346942901611328, -0.028295516967773438, -0.027244091033935547, -0.026192665100097656, -0.025141239166259766, -0.024089813232421875, -0.023038387298583984, -0.021986961364746094, -0.020935535430908203, -0.019884109497070312, -0.018832683563232422, -0.01778125762939453, -0.01672983169555664, -0.01567840576171875, -0.01462697982788086, -0.013575553894042969, -0.012524127960205078, -0.011472702026367188, -0.010421276092529297, -0.009369850158691406, -0.008318424224853516, -0.007266998291015625, -0.006215572357177734, -0.005164146423339844, -0.004112720489501953, -0.0030612945556640625, -0.002009868621826172, -0.0009584426879882812, 9.298324584960938e-05, 0.0011444091796875, 0.0021958351135253906, 0.0032472610473632812, 0.004298686981201172, 0.0053501129150390625, 0.006401538848876953, 0.007452964782714844, 0.008504390716552734, 0.009555816650390625, 0.010607242584228516, 0.011658668518066406, 0.012710094451904297, 0.013761520385742188, 0.014812946319580078, 0.01586437225341797, 0.01691579818725586, 0.01796722412109375, 0.01901865005493164, 0.02007007598876953, 0.021121501922607422, 0.022172927856445312, 0.023224353790283203, 0.024275779724121094, 0.025327205657958984, 0.026378631591796875, 0.027430057525634766, 0.028481483459472656, 0.029532909393310547, 0.030584335327148438, 0.03163576126098633, 0.03268718719482422, 0.03373861312866211, 0.0347900390625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 7.0, 5.0, 10.0, 16.0, 15.0, 30.0, 42.0, 67.0, 96.0, 104.0, 127.0, 108.0, 109.0, 75.0, 60.0, 47.0, 26.0, 28.0, 11.0, 10.0, 11.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018341064453125, -0.017747879028320312, -0.017154693603515625, -0.016561508178710938, -0.01596832275390625, -0.015375137329101562, -0.014781951904296875, -0.014188766479492188, -0.0135955810546875, -0.013002395629882812, -0.012409210205078125, -0.011816024780273438, -0.01122283935546875, -0.010629653930664062, -0.010036468505859375, -0.009443283081054688, -0.00885009765625, -0.008256912231445312, -0.007663726806640625, -0.0070705413818359375, -0.00647735595703125, -0.0058841705322265625, -0.005290985107421875, -0.0046977996826171875, -0.0041046142578125, -0.0035114288330078125, -0.002918243408203125, -0.0023250579833984375, -0.00173187255859375, -0.0011386871337890625, -0.000545501708984375, 4.76837158203125e-05, 0.000640869140625, 0.0012340545654296875, 0.001827239990234375, 0.0024204254150390625, 0.00301361083984375, 0.0036067962646484375, 0.004199981689453125, 0.0047931671142578125, 0.0053863525390625, 0.0059795379638671875, 0.006572723388671875, 0.0071659088134765625, 0.00775909423828125, 0.008352279663085938, 0.008945465087890625, 0.009538650512695312, 0.0101318359375, 0.010725021362304688, 0.011318206787109375, 0.011911392211914062, 0.01250457763671875, 0.013097763061523438, 0.013690948486328125, 0.014284133911132812, 0.0148773193359375, 0.015470504760742188, 0.016063690185546875, 0.016656875610351562, 0.01725006103515625, 0.017843246459960938, 0.018436431884765625, 0.019029617309570312, 0.019622802734375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 5.0, 10.0, 13.0, 15.0, 17.0, 31.0, 45.0, 65.0, 101.0, 143.0, 244.0, 359.0, 653.0, 1085.0, 2222.0, 4958.0, 13483.0, 49961.0, 596189.0, 314173.0, 43458.0, 12087.0, 4519.0, 2043.0, 1079.0, 568.0, 355.0, 201.0, 139.0, 94.0, 62.0, 51.0, 39.0, 25.0, 21.0, 7.0, 6.0, 7.0, 5.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042449951171875, -0.041121482849121094, -0.03979301452636719, -0.03846454620361328, -0.037136077880859375, -0.03580760955810547, -0.03447914123535156, -0.033150672912597656, -0.03182220458984375, -0.030493736267089844, -0.029165267944335938, -0.02783679962158203, -0.026508331298828125, -0.02517986297607422, -0.023851394653320312, -0.022522926330566406, -0.0211944580078125, -0.019865989685058594, -0.018537521362304688, -0.01720905303955078, -0.015880584716796875, -0.014552116394042969, -0.013223648071289062, -0.011895179748535156, -0.01056671142578125, -0.009238243103027344, -0.007909774780273438, -0.006581306457519531, -0.005252838134765625, -0.003924369812011719, -0.0025959014892578125, -0.0012674331665039062, 6.103515625e-05, 0.0013895034790039062, 0.0027179718017578125, 0.004046440124511719, 0.005374908447265625, 0.006703376770019531, 0.008031845092773438, 0.009360313415527344, 0.01068878173828125, 0.012017250061035156, 0.013345718383789062, 0.014674186706542969, 0.016002655029296875, 0.01733112335205078, 0.018659591674804688, 0.019988059997558594, 0.0213165283203125, 0.022644996643066406, 0.023973464965820312, 0.02530193328857422, 0.026630401611328125, 0.02795886993408203, 0.029287338256835938, 0.030615806579589844, 0.03194427490234375, 0.033272743225097656, 0.03460121154785156, 0.03592967987060547, 0.037258148193359375, 0.03858661651611328, 0.03991508483886719, 0.041243553161621094, 0.042572021484375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 11.0, 12.0, 12.0, 19.0, 21.0, 15.0, 30.0, 31.0, 34.0, 33.0, 64.0, 58.0, 73.0, 53.0, 57.0, 69.0, 54.0, 53.0, 51.0, 53.0, 36.0, 27.0, 32.0, 20.0, 10.0, 21.0, 9.0, 9.0, 9.0, 7.0, 5.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.048492431640625, -0.047118186950683594, -0.04574394226074219, -0.04436969757080078, -0.042995452880859375, -0.04162120819091797, -0.04024696350097656, -0.038872718811035156, -0.03749847412109375, -0.036124229431152344, -0.03474998474121094, -0.03337574005126953, -0.032001495361328125, -0.03062725067138672, -0.029253005981445312, -0.027878761291503906, -0.0265045166015625, -0.025130271911621094, -0.023756027221679688, -0.02238178253173828, -0.021007537841796875, -0.01963329315185547, -0.018259048461914062, -0.016884803771972656, -0.01551055908203125, -0.014136314392089844, -0.012762069702148438, -0.011387825012207031, -0.010013580322265625, -0.008639335632324219, -0.0072650909423828125, -0.005890846252441406, -0.0045166015625, -0.0031423568725585938, -0.0017681121826171875, -0.00039386749267578125, 0.000980377197265625, 0.0023546218872070312, 0.0037288665771484375, 0.005103111267089844, 0.00647735595703125, 0.007851600646972656, 0.009225845336914062, 0.010600090026855469, 0.011974334716796875, 0.013348579406738281, 0.014722824096679688, 0.016097068786621094, 0.0174713134765625, 0.018845558166503906, 0.020219802856445312, 0.02159404754638672, 0.022968292236328125, 0.02434253692626953, 0.025716781616210938, 0.027091026306152344, 0.02846527099609375, 0.029839515686035156, 0.031213760375976562, 0.03258800506591797, 0.033962249755859375, 0.03533649444580078, 0.03671073913574219, 0.038084983825683594, 0.039459228515625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 9.0, 3.0, 11.0, 12.0, 20.0, 43.0, 45.0, 78.0, 136.0, 233.0, 536.0, 1580.0, 6369.0, 39824.0, 826847.0, 153044.0, 14994.0, 3063.0, 885.0, 346.0, 176.0, 106.0, 54.0, 34.0, 27.0, 13.0, 15.0, 12.0, 14.0, 7.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0132598876953125, -0.012855052947998047, -0.012450218200683594, -0.01204538345336914, -0.011640548706054688, -0.011235713958740234, -0.010830879211425781, -0.010426044464111328, -0.010021209716796875, -0.009616374969482422, -0.009211540222167969, -0.008806705474853516, -0.008401870727539062, -0.00799703598022461, -0.007592201232910156, -0.007187366485595703, -0.00678253173828125, -0.006377696990966797, -0.005972862243652344, -0.005568027496337891, -0.0051631927490234375, -0.004758358001708984, -0.004353523254394531, -0.003948688507080078, -0.003543853759765625, -0.003139019012451172, -0.0027341842651367188, -0.0023293495178222656, -0.0019245147705078125, -0.0015196800231933594, -0.0011148452758789062, -0.0007100105285644531, -0.00030517578125, 9.965896606445312e-05, 0.0005044937133789062, 0.0009093284606933594, 0.0013141632080078125, 0.0017189979553222656, 0.0021238327026367188, 0.002528667449951172, 0.002933502197265625, 0.003338336944580078, 0.0037431716918945312, 0.004148006439208984, 0.0045528411865234375, 0.004957675933837891, 0.005362510681152344, 0.005767345428466797, 0.00617218017578125, 0.006577014923095703, 0.006981849670410156, 0.007386684417724609, 0.0077915191650390625, 0.008196353912353516, 0.008601188659667969, 0.009006023406982422, 0.009410858154296875, 0.009815692901611328, 0.010220527648925781, 0.010625362396240234, 0.011030197143554688, 0.01143503189086914, 0.011839866638183594, 0.012244701385498047, 0.0126495361328125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 0.0, 4.0, 4.0, 5.0, 5.0, 11.0, 2.0, 5.0, 14.0, 11.0, 9.0, 14.0, 23.0, 16.0, 38.0, 44.0, 32.0, 56.0, 68.0, 70.0, 49.0, 73.0, 66.0, 51.0, 60.0, 69.0, 47.0, 29.0, 44.0, 15.0, 15.0, 16.0, 5.0, 4.0, 6.0, 7.0, 7.0, 2.0, 2.0, 1.0, 1.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.066394805908203e-06, -4.905276000499725e-06, -4.7441571950912476e-06, -4.58303838968277e-06, -4.421919584274292e-06, -4.260800778865814e-06, -4.0996819734573364e-06, -3.938563168048859e-06, -3.777444362640381e-06, -3.616325557231903e-06, -3.4552067518234253e-06, -3.2940879464149475e-06, -3.1329691410064697e-06, -2.971850335597992e-06, -2.810731530189514e-06, -2.6496127247810364e-06, -2.4884939193725586e-06, -2.327375113964081e-06, -2.166256308555603e-06, -2.0051375031471252e-06, -1.8440186977386475e-06, -1.6828998923301697e-06, -1.521781086921692e-06, -1.3606622815132141e-06, -1.1995434761047363e-06, -1.0384246706962585e-06, -8.773058652877808e-07, -7.16187059879303e-07, -5.550682544708252e-07, -3.939494490623474e-07, -2.3283064365386963e-07, -7.171183824539185e-08, 8.940696716308594e-08, 2.505257725715637e-07, 4.116445779800415e-07, 5.727633833885193e-07, 7.338821887969971e-07, 8.950009942054749e-07, 1.0561197996139526e-06, 1.2172386050224304e-06, 1.3783574104309082e-06, 1.539476215839386e-06, 1.7005950212478638e-06, 1.8617138266563416e-06, 2.0228326320648193e-06, 2.183951437473297e-06, 2.345070242881775e-06, 2.5061890482902527e-06, 2.6673078536987305e-06, 2.8284266591072083e-06, 2.989545464515686e-06, 3.150664269924164e-06, 3.3117830753326416e-06, 3.4729018807411194e-06, 3.634020686149597e-06, 3.795139491558075e-06, 3.956258296966553e-06, 4.1173771023750305e-06, 4.278495907783508e-06, 4.439614713191986e-06, 4.600733518600464e-06, 4.761852324008942e-06, 4.9229711294174194e-06, 5.084089934825897e-06, 5.245208740234375e-06]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 3.0, 13.0, 9.0, 23.0, 29.0, 40.0, 65.0, 85.0, 114.0, 164.0, 284.0, 471.0, 790.0, 1414.0, 3084.0, 7706.0, 23491.0, 107738.0, 739355.0, 122895.0, 25836.0, 7972.0, 3209.0, 1540.0, 863.0, 482.0, 290.0, 187.0, 120.0, 78.0, 55.0, 42.0, 34.0, 10.0, 14.0, 12.0, 10.0, 8.0, 6.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.007781982421875, -0.007562994956970215, -0.00734400749206543, -0.0071250200271606445, -0.006906032562255859, -0.006687045097351074, -0.006468057632446289, -0.006249070167541504, -0.006030082702636719, -0.005811095237731934, -0.0055921077728271484, -0.005373120307922363, -0.005154132843017578, -0.004935145378112793, -0.004716157913208008, -0.004497170448303223, -0.0042781829833984375, -0.004059195518493652, -0.003840208053588867, -0.003621220588684082, -0.003402233123779297, -0.0031832456588745117, -0.0029642581939697266, -0.0027452707290649414, -0.0025262832641601562, -0.002307295799255371, -0.002088308334350586, -0.0018693208694458008, -0.0016503334045410156, -0.0014313459396362305, -0.0012123584747314453, -0.0009933710098266602, -0.000774383544921875, -0.0005553960800170898, -0.0003364086151123047, -0.00011742115020751953, 0.00010156631469726562, 0.0003205537796020508, 0.0005395412445068359, 0.0007585287094116211, 0.0009775161743164062, 0.0011965036392211914, 0.0014154911041259766, 0.0016344785690307617, 0.0018534660339355469, 0.002072453498840332, 0.002291440963745117, 0.0025104284286499023, 0.0027294158935546875, 0.0029484033584594727, 0.003167390823364258, 0.003386378288269043, 0.003605365753173828, 0.0038243532180786133, 0.0040433406829833984, 0.004262328147888184, 0.004481315612792969, 0.004700303077697754, 0.004919290542602539, 0.005138278007507324, 0.005357265472412109, 0.0055762529373168945, 0.00579524040222168, 0.006014227867126465, 0.00623321533203125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 3.0, 5.0, 11.0, 6.0, 14.0, 11.0, 25.0, 22.0, 32.0, 43.0, 52.0, 42.0, 54.0, 78.0, 84.0, 87.0, 79.0, 75.0, 58.0, 51.0, 29.0, 28.0, 18.0, 16.0, 7.0, 19.0, 15.0, 8.0, 6.0, 2.0, 2.0, 6.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0100250244140625, -0.00970911979675293, -0.00939321517944336, -0.009077310562133789, -0.008761405944824219, -0.008445501327514648, -0.008129596710205078, -0.007813692092895508, -0.0074977874755859375, -0.007181882858276367, -0.006865978240966797, -0.0065500736236572266, -0.006234169006347656, -0.005918264389038086, -0.005602359771728516, -0.005286455154418945, -0.004970550537109375, -0.004654645919799805, -0.004338741302490234, -0.004022836685180664, -0.0037069320678710938, -0.0033910274505615234, -0.003075122833251953, -0.002759218215942383, -0.0024433135986328125, -0.002127408981323242, -0.0018115043640136719, -0.0014955997467041016, -0.0011796951293945312, -0.0008637905120849609, -0.0005478858947753906, -0.0002319812774658203, 8.392333984375e-05, 0.0003998279571533203, 0.0007157325744628906, 0.001031637191772461, 0.0013475418090820312, 0.0016634464263916016, 0.001979351043701172, 0.002295255661010742, 0.0026111602783203125, 0.002927064895629883, 0.003242969512939453, 0.0035588741302490234, 0.0038747787475585938, 0.004190683364868164, 0.004506587982177734, 0.004822492599487305, 0.005138397216796875, 0.005454301834106445, 0.005770206451416016, 0.006086111068725586, 0.006402015686035156, 0.0067179203033447266, 0.007033824920654297, 0.007349729537963867, 0.0076656341552734375, 0.007981538772583008, 0.008297443389892578, 0.008613348007202148, 0.008929252624511719, 0.009245157241821289, 0.00956106185913086, 0.00987696647644043, 0.01019287109375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 10.0, 11.0, 12.0, 11.0, 43.0, 49.0, 139.0, 347.0, 278.0, 64.0, 20.0, 7.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5150738954544067, -0.4994322657585144, -0.48379063606262207, -0.46814897656440735, -0.452507346868515, -0.4368657171726227, -0.42122405767440796, -0.4055824279785156, -0.3899407982826233, -0.37429916858673096, -0.3586575388908386, -0.3430158793926239, -0.32737424969673157, -0.31173262000083923, -0.2960909605026245, -0.2804493308067322, -0.26480770111083984, -0.2491660714149475, -0.23352442681789398, -0.21788278222084045, -0.20224115252494812, -0.1865995228290558, -0.17095787823200226, -0.15531623363494873, -0.1396746039390564, -0.12403296679258347, -0.10839132964611053, -0.0927496924996376, -0.07710805535316467, -0.06146641820669174, -0.04582478106021881, -0.03018314391374588, -0.014541566371917725, 0.0011000707745552063, 0.016741707921028137, 0.03238334506750107, 0.048024982213974, 0.06366661936044693, 0.07930825650691986, 0.09494989365339279, 0.11059153079986572, 0.12623316049575806, 0.14187480509281158, 0.1575164496898651, 0.17315807938575745, 0.18879970908164978, 0.2044413536787033, 0.22008299827575684, 0.23572462797164917, 0.2513662576675415, 0.26700788736343384, 0.28264954686164856, 0.2982911765575409, 0.3139328062534332, 0.32957446575164795, 0.3452160954475403, 0.3608577251434326, 0.37649935483932495, 0.3921409845352173, 0.407782644033432, 0.42342427372932434, 0.4390659034252167, 0.4547075629234314, 0.47034919261932373, 0.48599082231521606]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 8.0, 5.0, 3.0, 6.0, 4.0, 3.0, 14.0, 11.0, 9.0, 17.0, 23.0, 15.0, 25.0, 15.0, 22.0, 26.0, 28.0, 32.0, 47.0, 88.0, 107.0, 106.0, 64.0, 49.0, 28.0, 30.0, 29.0, 26.0, 17.0, 19.0, 18.0, 20.0, 14.0, 15.0, 15.0, 11.0, 7.0, 4.0, 8.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.11476194858551025, -0.11114710569381714, -0.10753225535154343, -0.10391741245985031, -0.1003025621175766, -0.09668771922588348, -0.09307287633419037, -0.08945803344249725, -0.08584318310022354, -0.08222834020853043, -0.07861348986625671, -0.0749986469745636, -0.07138380408287048, -0.06776895374059677, -0.06415411084890366, -0.06053926423192024, -0.05692441761493683, -0.053309570997953415, -0.04969472438097, -0.046079881489276886, -0.04246503487229347, -0.03885018825531006, -0.03523534536361694, -0.03162049874663353, -0.028005652129650116, -0.024390805512666702, -0.020775960758328438, -0.017161116003990173, -0.01354626938700676, -0.009931422770023346, -0.0063165780156850815, -0.002701733261346817, 0.0009131133556365967, 0.004527959041297436, 0.008142804726958275, 0.011757650412619114, 0.015372496098279953, 0.018987342715263367, 0.02260218746960163, 0.026217032223939896, 0.02983187884092331, 0.03344672545790672, 0.03706157207489014, 0.04067641496658325, 0.044291261583566666, 0.04790610820055008, 0.051520951092243195, 0.05513579770922661, 0.05875064432621002, 0.062365490943193436, 0.06598033756017685, 0.06959518045186996, 0.07321003079414368, 0.07682487368583679, 0.08043971657752991, 0.08405455946922302, 0.08766940981149673, 0.09128425270318985, 0.09489910304546356, 0.09851394593715668, 0.10212878882884979, 0.1057436391711235, 0.10935848206281662, 0.11297333240509033, 0.11658817529678345]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 0.0, 7.0, 5.0, 8.0, 17.0, 12.0, 18.0, 32.0, 25.0, 49.0, 60.0, 107.0, 141.0, 212.0, 306.0, 430.0, 623.0, 1041.0, 1607.0, 2753.0, 5450.0, 12193.0, 36961.0, 198086.0, 2689070.0, 1103875.0, 97411.0, 24334.0, 9142.0, 4278.0, 2237.0, 1369.0, 816.0, 519.0, 352.0, 240.0, 146.0, 95.0, 78.0, 62.0, 44.0, 25.0, 14.0, 10.0, 10.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.027435302734375, -0.02657294273376465, -0.025710582733154297, -0.024848222732543945, -0.023985862731933594, -0.023123502731323242, -0.02226114273071289, -0.02139878273010254, -0.020536422729492188, -0.019674062728881836, -0.018811702728271484, -0.017949342727661133, -0.01708698272705078, -0.01622462272644043, -0.015362262725830078, -0.014499902725219727, -0.013637542724609375, -0.012775182723999023, -0.011912822723388672, -0.01105046272277832, -0.010188102722167969, -0.009325742721557617, -0.008463382720947266, -0.007601022720336914, -0.0067386627197265625, -0.005876302719116211, -0.005013942718505859, -0.004151582717895508, -0.0032892227172851562, -0.0024268627166748047, -0.0015645027160644531, -0.0007021427154541016, 0.00016021728515625, 0.0010225772857666016, 0.0018849372863769531, 0.0027472972869873047, 0.0036096572875976562, 0.004472017288208008, 0.005334377288818359, 0.006196737289428711, 0.0070590972900390625, 0.007921457290649414, 0.008783817291259766, 0.009646177291870117, 0.010508537292480469, 0.01137089729309082, 0.012233257293701172, 0.013095617294311523, 0.013957977294921875, 0.014820337295532227, 0.015682697296142578, 0.01654505729675293, 0.01740741729736328, 0.018269777297973633, 0.019132137298583984, 0.019994497299194336, 0.020856857299804688, 0.02171921730041504, 0.02258157730102539, 0.023443937301635742, 0.024306297302246094, 0.025168657302856445, 0.026031017303466797, 0.02689337730407715, 0.0277557373046875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 7.0, 11.0, 18.0, 23.0, 25.0, 65.0, 93.0, 114.0, 120.0, 120.0, 103.0, 88.0, 58.0, 51.0, 32.0, 33.0, 14.0, 7.0, 6.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0185546875, -0.0179598331451416, -0.017364978790283203, -0.016770124435424805, -0.016175270080566406, -0.015580415725708008, -0.01498556137084961, -0.014390707015991211, -0.013795852661132812, -0.013200998306274414, -0.012606143951416016, -0.012011289596557617, -0.011416435241699219, -0.01082158088684082, -0.010226726531982422, -0.009631872177124023, -0.009037017822265625, -0.008442163467407227, -0.007847309112548828, -0.00725245475769043, -0.006657600402832031, -0.006062746047973633, -0.005467891693115234, -0.004873037338256836, -0.0042781829833984375, -0.003683328628540039, -0.0030884742736816406, -0.002493619918823242, -0.0018987655639648438, -0.0013039112091064453, -0.0007090568542480469, -0.00011420249938964844, 0.00048065185546875, 0.0010755062103271484, 0.0016703605651855469, 0.0022652149200439453, 0.0028600692749023438, 0.003454923629760742, 0.004049777984619141, 0.004644632339477539, 0.0052394866943359375, 0.005834341049194336, 0.006429195404052734, 0.007024049758911133, 0.007618904113769531, 0.00821375846862793, 0.008808612823486328, 0.009403467178344727, 0.009998321533203125, 0.010593175888061523, 0.011188030242919922, 0.01178288459777832, 0.012377738952636719, 0.012972593307495117, 0.013567447662353516, 0.014162302017211914, 0.014757156372070312, 0.015352010726928711, 0.01594686508178711, 0.016541719436645508, 0.017136573791503906, 0.017731428146362305, 0.018326282501220703, 0.0189211368560791, 0.0195159912109375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 8.0, 10.0, 13.0, 33.0, 68.0, 147.0, 439.0, 2143.0, 74696.0, 4111088.0, 4555.0, 663.0, 217.0, 78.0, 43.0, 24.0, 17.0, 10.0, 6.0, 7.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.228759765625, -0.22034835815429688, -0.21193695068359375, -0.20352554321289062, -0.1951141357421875, -0.18670272827148438, -0.17829132080078125, -0.16987991333007812, -0.161468505859375, -0.15305709838867188, -0.14464569091796875, -0.13623428344726562, -0.1278228759765625, -0.11941146850585938, -0.11100006103515625, -0.10258865356445312, -0.09417724609375, -0.08576583862304688, -0.07735443115234375, -0.06894302368164062, -0.0605316162109375, -0.052120208740234375, -0.04370880126953125, -0.035297393798828125, -0.026885986328125, -0.018474578857421875, -0.01006317138671875, -0.001651763916015625, 0.0067596435546875, 0.015171051025390625, 0.02358245849609375, 0.031993865966796875, 0.0404052734375, 0.048816680908203125, 0.05722808837890625, 0.06563949584960938, 0.0740509033203125, 0.08246231079101562, 0.09087371826171875, 0.09928512573242188, 0.107696533203125, 0.11610794067382812, 0.12451934814453125, 0.13293075561523438, 0.1413421630859375, 0.14975357055664062, 0.15816497802734375, 0.16657638549804688, 0.17498779296875, 0.18339920043945312, 0.19181060791015625, 0.20022201538085938, 0.2086334228515625, 0.21704483032226562, 0.22545623779296875, 0.23386764526367188, 0.242279052734375, 0.2506904602050781, 0.25910186767578125, 0.2675132751464844, 0.2759246826171875, 0.2843360900878906, 0.29274749755859375, 0.3011589050292969, 0.3095703125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 6.0, 6.0, 1.0, 5.0, 7.0, 7.0, 12.0, 15.0, 19.0, 50.0, 74.0, 149.0, 299.0, 869.0, 1491.0, 607.0, 226.0, 116.0, 59.0, 28.0, 11.0, 12.0, 7.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1168212890625, -0.11351394653320312, -0.11020660400390625, -0.10689926147460938, -0.1035919189453125, -0.10028457641601562, -0.09697723388671875, -0.09366989135742188, -0.090362548828125, -0.08705520629882812, -0.08374786376953125, -0.08044052124023438, -0.0771331787109375, -0.07382583618164062, -0.07051849365234375, -0.06721115112304688, -0.06390380859375, -0.060596466064453125, -0.05728912353515625, -0.053981781005859375, -0.0506744384765625, -0.047367095947265625, -0.04405975341796875, -0.040752410888671875, -0.037445068359375, -0.034137725830078125, -0.03083038330078125, -0.027523040771484375, -0.0242156982421875, -0.020908355712890625, -0.01760101318359375, -0.014293670654296875, -0.010986328125, -0.007678985595703125, -0.00437164306640625, -0.001064300537109375, 0.0022430419921875, 0.005550384521484375, 0.00885772705078125, 0.012165069580078125, 0.015472412109375, 0.018779754638671875, 0.02208709716796875, 0.025394439697265625, 0.0287017822265625, 0.032009124755859375, 0.03531646728515625, 0.038623809814453125, 0.04193115234375, 0.045238494873046875, 0.04854583740234375, 0.051853179931640625, 0.0551605224609375, 0.058467864990234375, 0.06177520751953125, 0.06508255004882812, 0.068389892578125, 0.07169723510742188, 0.07500457763671875, 0.07831192016601562, 0.0816192626953125, 0.08492660522460938, 0.08823394775390625, 0.09154129028320312, 0.0948486328125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 10.0, 14.0, 21.0, 44.0, 43.0, 98.0, 161.0, 254.0, 165.0, 73.0, 39.0, 23.0, 18.0, 14.0, 7.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0], "bins": [-1.0359103679656982, -1.015360951423645, -0.994811475276947, -0.974261999130249, -0.9537125825881958, -0.9331631660461426, -0.9126136898994446, -0.8920642137527466, -0.8715147972106934, -0.8509653806686401, -0.8304159045219421, -0.8098664283752441, -0.7893170118331909, -0.7687675952911377, -0.7482181191444397, -0.7276686429977417, -0.7071192264556885, -0.6865698099136353, -0.6660203337669373, -0.6454708576202393, -0.624921441078186, -0.6043720245361328, -0.5838225483894348, -0.5632730722427368, -0.5427236557006836, -0.5221742391586304, -0.5016247630119324, -0.48107531666755676, -0.46052587032318115, -0.43997642397880554, -0.41942697763442993, -0.3988775312900543, -0.3783281147480011, -0.3577786684036255, -0.3372292220592499, -0.31667977571487427, -0.29613032937049866, -0.27558088302612305, -0.25503143668174744, -0.23448199033737183, -0.21393254399299622, -0.1933830976486206, -0.172833651304245, -0.15228420495986938, -0.13173475861549377, -0.11118531227111816, -0.09063586592674255, -0.07008641958236694, -0.04953697323799133, -0.028987526893615723, -0.008438080549240112, 0.012111365795135498, 0.03266081213951111, 0.05321025848388672, 0.07375970482826233, 0.09430915117263794, 0.11485859751701355, 0.13540804386138916, 0.15595749020576477, 0.17650693655014038, 0.197056382894516, 0.2176058292388916, 0.2381552755832672, 0.2587047219276428, 0.27925416827201843]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 4.0, 3.0, 4.0, 5.0, 9.0, 9.0, 17.0, 25.0, 26.0, 24.0, 37.0, 43.0, 57.0, 72.0, 80.0, 105.0, 77.0, 71.0, 64.0, 49.0, 64.0, 39.0, 32.0, 27.0, 21.0, 16.0, 8.0, 9.0, 3.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.566375195980072, -0.5489749312400818, -0.5315747261047363, -0.5141744613647461, -0.49677419662475586, -0.4793739318847656, -0.4619736969470978, -0.44457346200942993, -0.4271731972694397, -0.40977293252944946, -0.3923726975917816, -0.37497246265411377, -0.35757219791412354, -0.3401719331741333, -0.32277169823646545, -0.3053714632987976, -0.2879711985588074, -0.27057093381881714, -0.2531706988811493, -0.23577044904232025, -0.2183701992034912, -0.20096994936466217, -0.18356969952583313, -0.1661694496870041, -0.14876919984817505, -0.131368950009346, -0.11396870017051697, -0.09656845033168793, -0.07916820049285889, -0.061767950654029846, -0.044367700815200806, -0.026967450976371765, -0.0095672607421875, 0.00783298909664154, 0.02523323893547058, 0.04263348877429962, 0.06003373861312866, 0.0774339884519577, 0.09483423829078674, 0.11223448812961578, 0.12963473796844482, 0.14703498780727386, 0.1644352376461029, 0.18183548748493195, 0.199235737323761, 0.21663598716259003, 0.23403623700141907, 0.2514364719390869, 0.26883673667907715, 0.2862370014190674, 0.30363723635673523, 0.3210374712944031, 0.3384377360343933, 0.35583800077438354, 0.3732382357120514, 0.39063847064971924, 0.4080387353897095, 0.4254390001296997, 0.44283923506736755, 0.4602394700050354, 0.47763973474502563, 0.49503999948501587, 0.5124402046203613, 0.5298404693603516, 0.5472407341003418]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 7.0, 2.0, 2.0, 6.0, 12.0, 22.0, 33.0, 53.0, 96.0, 158.0, 373.0, 904.0, 3346.0, 19965.0, 757643.0, 250296.0, 11870.0, 2413.0, 736.0, 275.0, 139.0, 88.0, 46.0, 27.0, 13.0, 10.0, 4.0, 3.0, 3.0, 5.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1527099609375, -0.14806556701660156, -0.14342117309570312, -0.1387767791748047, -0.13413238525390625, -0.1294879913330078, -0.12484359741210938, -0.12019920349121094, -0.1155548095703125, -0.11091041564941406, -0.10626602172851562, -0.10162162780761719, -0.09697723388671875, -0.09233283996582031, -0.08768844604492188, -0.08304405212402344, -0.078399658203125, -0.07375526428222656, -0.06911087036132812, -0.06446647644042969, -0.05982208251953125, -0.05517768859863281, -0.050533294677734375, -0.04588890075683594, -0.0412445068359375, -0.03660011291503906, -0.031955718994140625, -0.027311325073242188, -0.02266693115234375, -0.018022537231445312, -0.013378143310546875, -0.008733749389648438, -0.00408935546875, 0.0005550384521484375, 0.005199432373046875, 0.009843826293945312, 0.01448822021484375, 0.019132614135742188, 0.023777008056640625, 0.028421401977539062, 0.0330657958984375, 0.03771018981933594, 0.042354583740234375, 0.04699897766113281, 0.05164337158203125, 0.05628776550292969, 0.060932159423828125, 0.06557655334472656, 0.070220947265625, 0.07486534118652344, 0.07950973510742188, 0.08415412902832031, 0.08879852294921875, 0.09344291687011719, 0.09808731079101562, 0.10273170471191406, 0.1073760986328125, 0.11202049255371094, 0.11666488647460938, 0.12130928039550781, 0.12595367431640625, 0.1305980682373047, 0.13524246215820312, 0.13988685607910156, 0.14453125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 7.0, 15.0, 20.0, 23.0, 33.0, 52.0, 50.0, 74.0, 99.0, 117.0, 111.0, 108.0, 83.0, 60.0, 39.0, 33.0, 26.0, 16.0, 13.0, 9.0, 6.0, 7.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04345703125, -0.042314767837524414, -0.04117250442504883, -0.04003024101257324, -0.038887977600097656, -0.03774571418762207, -0.036603450775146484, -0.0354611873626709, -0.03431892395019531, -0.03317666053771973, -0.03203439712524414, -0.030892133712768555, -0.02974987030029297, -0.028607606887817383, -0.027465343475341797, -0.02632308006286621, -0.025180816650390625, -0.02403855323791504, -0.022896289825439453, -0.021754026412963867, -0.02061176300048828, -0.019469499588012695, -0.01832723617553711, -0.017184972763061523, -0.016042709350585938, -0.014900445938110352, -0.013758182525634766, -0.01261591911315918, -0.011473655700683594, -0.010331392288208008, -0.009189128875732422, -0.008046865463256836, -0.00690460205078125, -0.005762338638305664, -0.004620075225830078, -0.003477811813354492, -0.0023355484008789062, -0.0011932849884033203, -5.1021575927734375e-05, 0.0010912418365478516, 0.0022335052490234375, 0.0033757686614990234, 0.004518032073974609, 0.005660295486450195, 0.006802558898925781, 0.007944822311401367, 0.009087085723876953, 0.010229349136352539, 0.011371612548828125, 0.012513875961303711, 0.013656139373779297, 0.014798402786254883, 0.01594066619873047, 0.017082929611206055, 0.01822519302368164, 0.019367456436157227, 0.020509719848632812, 0.0216519832611084, 0.022794246673583984, 0.02393651008605957, 0.025078773498535156, 0.026221036911010742, 0.027363300323486328, 0.028505563735961914, 0.0296478271484375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 7.0, 9.0, 6.0, 23.0, 36.0, 69.0, 119.0, 295.0, 695.0, 2842.0, 37206.0, 986371.0, 17721.0, 2026.0, 599.0, 236.0, 120.0, 66.0, 37.0, 23.0, 16.0, 11.0, 8.0, 3.0, 4.0, 5.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1195068359375, -0.11334419250488281, -0.10718154907226562, -0.10101890563964844, -0.09485626220703125, -0.08869361877441406, -0.08253097534179688, -0.07636833190917969, -0.0702056884765625, -0.06404304504394531, -0.057880401611328125, -0.05171775817871094, -0.04555511474609375, -0.03939247131347656, -0.033229827880859375, -0.027067184448242188, -0.020904541015625, -0.014741897583007812, -0.008579254150390625, -0.0024166107177734375, 0.00374603271484375, 0.009908676147460938, 0.016071319580078125, 0.022233963012695312, 0.0283966064453125, 0.03455924987792969, 0.040721893310546875, 0.04688453674316406, 0.05304718017578125, 0.05920982360839844, 0.06537246704101562, 0.07153511047363281, 0.07769775390625, 0.08386039733886719, 0.09002304077148438, 0.09618568420410156, 0.10234832763671875, 0.10851097106933594, 0.11467361450195312, 0.12083625793457031, 0.1269989013671875, 0.1331615447998047, 0.13932418823242188, 0.14548683166503906, 0.15164947509765625, 0.15781211853027344, 0.16397476196289062, 0.1701374053955078, 0.176300048828125, 0.1824626922607422, 0.18862533569335938, 0.19478797912597656, 0.20095062255859375, 0.20711326599121094, 0.21327590942382812, 0.2194385528564453, 0.2256011962890625, 0.2317638397216797, 0.23792648315429688, 0.24408912658691406, 0.25025177001953125, 0.25641441345214844, 0.2625770568847656, 0.2687397003173828, 0.27490234375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 2.0, 6.0, 17.0, 7.0, 20.0, 27.0, 31.0, 42.0, 60.0, 78.0, 128.0, 134.0, 120.0, 81.0, 60.0, 48.0, 32.0, 30.0, 23.0, 18.0, 12.0, 9.0, 6.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1607666015625, -0.15582275390625, -0.15087890625, -0.14593505859375, -0.1409912109375, -0.13604736328125, -0.131103515625, -0.12615966796875, -0.1212158203125, -0.11627197265625, -0.111328125, -0.10638427734375, -0.1014404296875, -0.09649658203125, -0.091552734375, -0.08660888671875, -0.0816650390625, -0.07672119140625, -0.07177734375, -0.06683349609375, -0.0618896484375, -0.05694580078125, -0.052001953125, -0.04705810546875, -0.0421142578125, -0.03717041015625, -0.0322265625, -0.02728271484375, -0.0223388671875, -0.01739501953125, -0.012451171875, -0.00750732421875, -0.0025634765625, 0.00238037109375, 0.00732421875, 0.01226806640625, 0.0172119140625, 0.02215576171875, 0.027099609375, 0.03204345703125, 0.0369873046875, 0.04193115234375, 0.046875, 0.05181884765625, 0.0567626953125, 0.06170654296875, 0.066650390625, 0.07159423828125, 0.0765380859375, 0.08148193359375, 0.08642578125, 0.09136962890625, 0.0963134765625, 0.10125732421875, 0.106201171875, 0.11114501953125, 0.1160888671875, 0.12103271484375, 0.1259765625, 0.13092041015625, 0.1358642578125, 0.14080810546875, 0.145751953125, 0.15069580078125, 0.1556396484375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 7.0, 5.0, 5.0, 12.0, 16.0, 9.0, 25.0, 34.0, 45.0, 62.0, 88.0, 157.0, 258.0, 532.0, 1228.0, 2930.0, 8880.0, 40186.0, 862049.0, 107795.0, 16326.0, 4539.0, 1731.0, 700.0, 352.0, 193.0, 128.0, 73.0, 54.0, 39.0, 21.0, 13.0, 12.0, 4.0, 9.0, 6.0, 4.0, 2.0, 6.0, 6.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0166168212890625, -0.016108989715576172, -0.015601158142089844, -0.015093326568603516, -0.014585494995117188, -0.01407766342163086, -0.013569831848144531, -0.013062000274658203, -0.012554168701171875, -0.012046337127685547, -0.011538505554199219, -0.01103067398071289, -0.010522842407226562, -0.010015010833740234, -0.009507179260253906, -0.008999347686767578, -0.00849151611328125, -0.007983684539794922, -0.007475852966308594, -0.006968021392822266, -0.0064601898193359375, -0.005952358245849609, -0.005444526672363281, -0.004936695098876953, -0.004428863525390625, -0.003921031951904297, -0.0034132003784179688, -0.0029053688049316406, -0.0023975372314453125, -0.0018897056579589844, -0.0013818740844726562, -0.0008740425109863281, -0.0003662109375, 0.00014162063598632812, 0.0006494522094726562, 0.0011572837829589844, 0.0016651153564453125, 0.0021729469299316406, 0.0026807785034179688, 0.003188610076904297, 0.003696441650390625, 0.004204273223876953, 0.004712104797363281, 0.005219936370849609, 0.0057277679443359375, 0.006235599517822266, 0.006743431091308594, 0.007251262664794922, 0.00775909423828125, 0.008266925811767578, 0.008774757385253906, 0.009282588958740234, 0.009790420532226562, 0.01029825210571289, 0.010806083679199219, 0.011313915252685547, 0.011821746826171875, 0.012329578399658203, 0.012837409973144531, 0.01334524154663086, 0.013853073120117188, 0.014360904693603516, 0.014868736267089844, 0.015376567840576172, 0.0158843994140625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 9.0, 5.0, 6.0, 11.0, 8.0, 18.0, 12.0, 16.0, 18.0, 36.0, 41.0, 45.0, 46.0, 70.0, 69.0, 81.0, 83.0, 60.0, 74.0, 61.0, 53.0, 45.0, 20.0, 25.0, 22.0, 14.0, 5.0, 8.0, 7.0, 12.0, 3.0, 4.0, 1.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.867813110351562e-06, -7.642433047294617e-06, -7.417052984237671e-06, -7.191672921180725e-06, -6.966292858123779e-06, -6.7409127950668335e-06, -6.515532732009888e-06, -6.290152668952942e-06, -6.064772605895996e-06, -5.83939254283905e-06, -5.6140124797821045e-06, -5.388632416725159e-06, -5.163252353668213e-06, -4.937872290611267e-06, -4.712492227554321e-06, -4.4871121644973755e-06, -4.26173210144043e-06, -4.036352038383484e-06, -3.810971975326538e-06, -3.5855919122695923e-06, -3.3602118492126465e-06, -3.1348317861557007e-06, -2.909451723098755e-06, -2.684071660041809e-06, -2.4586915969848633e-06, -2.2333115339279175e-06, -2.0079314708709717e-06, -1.7825514078140259e-06, -1.55717134475708e-06, -1.3317912817001343e-06, -1.1064112186431885e-06, -8.810311555862427e-07, -6.556510925292969e-07, -4.302710294723511e-07, -2.0489096641540527e-07, 2.0489096641540527e-08, 2.4586915969848633e-07, 4.7124922275543213e-07, 6.966292858123779e-07, 9.220093488693237e-07, 1.1473894119262695e-06, 1.3727694749832153e-06, 1.5981495380401611e-06, 1.823529601097107e-06, 2.0489096641540527e-06, 2.2742897272109985e-06, 2.4996697902679443e-06, 2.72504985332489e-06, 2.950429916381836e-06, 3.1758099794387817e-06, 3.4011900424957275e-06, 3.6265701055526733e-06, 3.851950168609619e-06, 4.077330231666565e-06, 4.302710294723511e-06, 4.5280903577804565e-06, 4.753470420837402e-06, 4.978850483894348e-06, 5.204230546951294e-06, 5.42961061000824e-06, 5.6549906730651855e-06, 5.880370736122131e-06, 6.105750799179077e-06, 6.331130862236023e-06, 6.556510925292969e-06]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 4.0, 6.0, 7.0, 6.0, 19.0, 15.0, 31.0, 43.0, 55.0, 92.0, 124.0, 215.0, 384.0, 711.0, 1496.0, 3978.0, 17798.0, 659033.0, 340635.0, 17040.0, 3909.0, 1378.0, 671.0, 343.0, 189.0, 138.0, 75.0, 57.0, 29.0, 26.0, 15.0, 11.0, 8.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.011077880859375, -0.010770082473754883, -0.010462284088134766, -0.010154485702514648, -0.009846687316894531, -0.009538888931274414, -0.009231090545654297, -0.00892329216003418, -0.008615493774414062, -0.008307695388793945, -0.007999897003173828, -0.007692098617553711, -0.007384300231933594, -0.0070765018463134766, -0.006768703460693359, -0.006460905075073242, -0.006153106689453125, -0.005845308303833008, -0.005537509918212891, -0.0052297115325927734, -0.004921913146972656, -0.004614114761352539, -0.004306316375732422, -0.003998517990112305, -0.0036907196044921875, -0.0033829212188720703, -0.003075122833251953, -0.002767324447631836, -0.0024595260620117188, -0.0021517276763916016, -0.0018439292907714844, -0.0015361309051513672, -0.00122833251953125, -0.0009205341339111328, -0.0006127357482910156, -0.00030493736267089844, 2.86102294921875e-06, 0.00031065940856933594, 0.0006184577941894531, 0.0009262561798095703, 0.0012340545654296875, 0.0015418529510498047, 0.0018496513366699219, 0.002157449722290039, 0.0024652481079101562, 0.0027730464935302734, 0.0030808448791503906, 0.003388643264770508, 0.003696441650390625, 0.004004240036010742, 0.004312038421630859, 0.0046198368072509766, 0.004927635192871094, 0.005235433578491211, 0.005543231964111328, 0.005851030349731445, 0.0061588287353515625, 0.00646662712097168, 0.006774425506591797, 0.007082223892211914, 0.007390022277832031, 0.0076978206634521484, 0.008005619049072266, 0.008313417434692383, 0.0086212158203125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 5.0, 6.0, 14.0, 21.0, 21.0, 38.0, 51.0, 91.0, 119.0, 138.0, 120.0, 100.0, 95.0, 61.0, 36.0, 21.0, 23.0, 8.0, 8.0, 7.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0209503173828125, -0.020254850387573242, -0.019559383392333984, -0.018863916397094727, -0.01816844940185547, -0.01747298240661621, -0.016777515411376953, -0.016082048416137695, -0.015386581420898438, -0.01469111442565918, -0.013995647430419922, -0.013300180435180664, -0.012604713439941406, -0.011909246444702148, -0.01121377944946289, -0.010518312454223633, -0.009822845458984375, -0.009127378463745117, -0.00843191146850586, -0.0077364444732666016, -0.007040977478027344, -0.006345510482788086, -0.005650043487548828, -0.00495457649230957, -0.0042591094970703125, -0.0035636425018310547, -0.002868175506591797, -0.002172708511352539, -0.0014772415161132812, -0.0007817745208740234, -8.630752563476562e-05, 0.0006091594696044922, 0.00130462646484375, 0.002000093460083008, 0.0026955604553222656, 0.0033910274505615234, 0.004086494445800781, 0.004781961441040039, 0.005477428436279297, 0.006172895431518555, 0.0068683624267578125, 0.00756382942199707, 0.008259296417236328, 0.008954763412475586, 0.009650230407714844, 0.010345697402954102, 0.01104116439819336, 0.011736631393432617, 0.012432098388671875, 0.013127565383911133, 0.01382303237915039, 0.014518499374389648, 0.015213966369628906, 0.015909433364868164, 0.016604900360107422, 0.01730036735534668, 0.017995834350585938, 0.018691301345825195, 0.019386768341064453, 0.02008223533630371, 0.02077770233154297, 0.021473169326782227, 0.022168636322021484, 0.022864103317260742, 0.0235595703125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 0.0, 10.0, 18.0, 35.0, 103.0, 511.0, 246.0, 46.0, 24.0, 10.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.8921020030975342, -1.8548486232757568, -1.81759512424469, -1.7803417444229126, -1.7430883646011353, -1.7058348655700684, -1.668581485748291, -1.6313281059265137, -1.5940747261047363, -1.556821346282959, -1.519567847251892, -1.4823144674301147, -1.4450610876083374, -1.4078075885772705, -1.3705542087554932, -1.3333008289337158, -1.296047329902649, -1.2587939500808716, -1.2215404510498047, -1.1842870712280273, -1.14703369140625, -1.1097803115844727, -1.0725268125534058, -1.0352734327316284, -0.9980199933052063, -0.9607665538787842, -0.9235131740570068, -0.8862597346305847, -0.8490062952041626, -0.8117529153823853, -0.7744994759559631, -0.737246036529541, -0.6999927759170532, -0.6627393364906311, -0.6254859566688538, -0.5882325172424316, -0.5509791374206543, -0.5137256979942322, -0.47647225856781006, -0.4392188489437103, -0.4019654393196106, -0.36471202969551086, -0.32745862007141113, -0.290205180644989, -0.2529517710208893, -0.21569836139678955, -0.17844493687152863, -0.1411915123462677, -0.10393810272216797, -0.06668468564748764, -0.029431268572807312, 0.007822148501873016, 0.045075565576553345, 0.08232897520065308, 0.119582399725914, 0.15683582425117493, 0.19408923387527466, 0.2313426434993744, 0.2685960531234741, 0.30584949254989624, 0.34310290217399597, 0.3803563117980957, 0.4176097512245178, 0.45486316084861755, 0.4921165704727173]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 4.0, 4.0, 7.0, 9.0, 5.0, 8.0, 12.0, 32.0, 22.0, 23.0, 28.0, 29.0, 36.0, 89.0, 103.0, 64.0, 48.0, 93.0, 108.0, 78.0, 39.0, 21.0, 19.0, 15.0, 17.0, 10.0, 10.0, 14.0, 11.0, 8.0, 4.0, 2.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 3.0, 2.0], "bins": [-0.3038482069969177, -0.2952592968940735, -0.28667035698890686, -0.27808141708374023, -0.269492506980896, -0.26090359687805176, -0.25231465697288513, -0.2437257319688797, -0.23513680696487427, -0.22654788196086884, -0.2179589569568634, -0.20937003195285797, -0.20078110694885254, -0.1921921819448471, -0.18360325694084167, -0.17501433193683624, -0.1664254069328308, -0.15783648192882538, -0.14924755692481995, -0.14065863192081451, -0.13206970691680908, -0.12348078191280365, -0.11489185690879822, -0.10630293190479279, -0.09771400690078735, -0.08912508189678192, -0.08053615689277649, -0.07194723188877106, -0.06335830688476562, -0.05476938188076019, -0.04618045687675476, -0.03759153187274933, -0.029002606868743896, -0.020413681864738464, -0.011824756860733032, -0.0032358318567276, 0.005353093147277832, 0.013942018151283264, 0.022530943155288696, 0.03111986815929413, 0.03970879316329956, 0.04829771816730499, 0.056886643171310425, 0.06547556817531586, 0.07406449317932129, 0.08265341818332672, 0.09124234318733215, 0.09983126819133759, 0.10842019319534302, 0.11700911819934845, 0.12559804320335388, 0.13418696820735931, 0.14277589321136475, 0.15136481821537018, 0.1599537432193756, 0.16854266822338104, 0.17713159322738647, 0.1857205182313919, 0.19430944323539734, 0.20289836823940277, 0.2114872932434082, 0.22007621824741364, 0.22866514325141907, 0.2372540682554245, 0.24584299325942993]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 2.0, 9.0, 9.0, 17.0, 16.0, 29.0, 39.0, 34.0, 62.0, 213.0, 284.0, 78.0, 48.0, 45.0, 33.0, 28.0, 11.0, 15.0, 11.0, 4.0, 6.0, 1.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031524658203125, -0.030510902404785156, -0.029497146606445312, -0.02848339080810547, -0.027469635009765625, -0.02645587921142578, -0.025442123413085938, -0.024428367614746094, -0.02341461181640625, -0.022400856018066406, -0.021387100219726562, -0.02037334442138672, -0.019359588623046875, -0.01834583282470703, -0.017332077026367188, -0.016318321228027344, -0.0153045654296875, -0.014290809631347656, -0.013277053833007812, -0.012263298034667969, -0.011249542236328125, -0.010235786437988281, -0.009222030639648438, -0.008208274841308594, -0.00719451904296875, -0.006180763244628906, -0.0051670074462890625, -0.004153251647949219, -0.003139495849609375, -0.0021257400512695312, -0.0011119842529296875, -9.822845458984375e-05, 0.00091552734375, 0.0019292831420898438, 0.0029430389404296875, 0.003956794738769531, 0.004970550537109375, 0.005984306335449219, 0.0069980621337890625, 0.008011817932128906, 0.00902557373046875, 0.010039329528808594, 0.011053085327148438, 0.012066841125488281, 0.013080596923828125, 0.014094352722167969, 0.015108108520507812, 0.016121864318847656, 0.0171356201171875, 0.018149375915527344, 0.019163131713867188, 0.02017688751220703, 0.021190643310546875, 0.02220439910888672, 0.023218154907226562, 0.024231910705566406, 0.02524566650390625, 0.026259422302246094, 0.027273178100585938, 0.02828693389892578, 0.029300689697265625, 0.03031444549560547, 0.03132820129394531, 0.032341957092285156, 0.033355712890625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 1.0, 1.0, 9.0, 0.0, 12.0, 3.0, 3.0, 12.0, 27.0, 18.0, 17.0, 30.0, 65.0, 76.0, 171.0, 420.0, 1627.0, 33356.0, 8348995.0, 2780.0, 522.0, 176.0, 90.0, 59.0, 45.0, 22.0, 15.0, 2.0, 7.0, 5.0, 5.0, 3.0, 4.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4398147165775299, -0.42886215448379517, -0.4179095923900604, -0.4069570302963257, -0.39600449800491333, -0.3850519359111786, -0.37409937381744385, -0.3631468117237091, -0.35219424962997437, -0.3412416875362396, -0.3302891254425049, -0.31933656334877014, -0.3083840012550354, -0.29743146896362305, -0.2864789068698883, -0.27552634477615356, -0.2645737826824188, -0.2536212205886841, -0.24266865849494934, -0.2317161113023758, -0.22076354920864105, -0.2098109871149063, -0.19885843992233276, -0.18790587782859802, -0.17695331573486328, -0.16600075364112854, -0.1550481915473938, -0.14409564435482025, -0.1331430822610855, -0.12219052016735077, -0.11123796552419662, -0.10028541088104248, -0.08933281898498535, -0.07838025689125061, -0.06742770224809647, -0.05647514387965202, -0.04552258551120758, -0.03457002714276314, -0.023617468774318695, -0.01266491413116455, -0.0017123520374298096, 0.009240206331014633, 0.020192764699459076, 0.03114532306790352, 0.04209788143634796, 0.053050439804792404, 0.06400299817323685, 0.07495555281639099, 0.08590811491012573, 0.09686067700386047, 0.10781323164701462, 0.11876578629016876, 0.1297183483839035, 0.14067091047763824, 0.1516234576702118, 0.16257601976394653, 0.17352858185768127, 0.18448114395141602, 0.19543370604515076, 0.2063862532377243, 0.21733881533145905, 0.2282913774251938, 0.23924392461776733, 0.2501964867115021, 0.2611490488052368]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 2.0, 1.0, 3.0, 5.0, 0.0, 3.0, 5.0, 2.0, 2.0, 7.0, 5.0, 8.0, 7.0, 2.0, 8.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.07983268797397614, -0.07632064074277878, -0.07280860096216202, -0.06929655373096466, -0.0657845139503479, -0.06227246671915054, -0.058760419487953186, -0.05524837598204613, -0.05173633247613907, -0.04822428897023201, -0.04471224546432495, -0.041200198233127594, -0.037688154727220535, -0.03417611122131348, -0.03066406585276127, -0.02715202048420906, -0.023639976978302002, -0.020127933472394943, -0.016615888103842735, -0.013103843666613102, -0.009591799229383469, -0.00607975572347641, -0.002567710354924202, 0.000944335013628006, 0.004456378519535065, 0.007968422956764698, 0.011480467393994331, 0.014992511831223965, 0.018504556268453598, 0.022016599774360657, 0.025528645142912865, 0.029040690511465073, 0.03255273401737213, 0.03606477752327919, 0.03957682102918625, 0.043088868260383606, 0.046600911766290665, 0.05011295527219772, 0.05362500250339508, 0.05713704600930214, 0.0606490895152092, 0.06416113674640656, 0.06767317652702332, 0.07118522375822067, 0.07469727098941803, 0.07820931077003479, 0.08172135800123215, 0.0852334052324295, 0.08874544501304626, 0.09225749224424362, 0.09576953202486038, 0.09928157925605774, 0.1027936190366745, 0.10630566626787186, 0.10981771349906921, 0.11332975327968597, 0.11684180051088333, 0.12035384774208069, 0.12386588752269745, 0.1273779273033142, 0.13088998198509216, 0.13440202176570892, 0.13791406154632568, 0.14142611622810364, 0.1449381560087204]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 3.0, 6.0, 9.0, 11.0, 19.0, 25.0, 19.0, 46.0, 55.0, 106.0, 140.0, 287.0, 516.0, 981.0, 2429.0, 6230.0, 19363.0, 73765.0, 243797.0, 128471.0, 31796.0, 9601.0, 3511.0, 1422.0, 710.0, 364.0, 230.0, 120.0, 75.0, 56.0, 37.0, 16.0, 10.0, 8.0, 10.0, 7.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1815185546875, -0.17670249938964844, -0.17188644409179688, -0.1670703887939453, -0.16225433349609375, -0.1574382781982422, -0.15262222290039062, -0.14780616760253906, -0.1429901123046875, -0.13817405700683594, -0.13335800170898438, -0.1285419464111328, -0.12372589111328125, -0.11890983581542969, -0.11409378051757812, -0.10927772521972656, -0.104461669921875, -0.09964561462402344, -0.09482955932617188, -0.09001350402832031, -0.08519744873046875, -0.08038139343261719, -0.07556533813476562, -0.07074928283691406, -0.0659332275390625, -0.06111717224121094, -0.056301116943359375, -0.05148506164550781, -0.04666900634765625, -0.04185295104980469, -0.037036895751953125, -0.03222084045410156, -0.02740478515625, -0.022588729858398438, -0.017772674560546875, -0.012956619262695312, -0.00814056396484375, -0.0033245086669921875, 0.001491546630859375, 0.0063076019287109375, 0.0111236572265625, 0.015939712524414062, 0.020755767822265625, 0.025571823120117188, 0.03038787841796875, 0.03520393371582031, 0.040019989013671875, 0.04483604431152344, 0.049652099609375, 0.05446815490722656, 0.059284210205078125, 0.06410026550292969, 0.06891632080078125, 0.07373237609863281, 0.07854843139648438, 0.08336448669433594, 0.0881805419921875, 0.09299659729003906, 0.09781265258789062, 0.10262870788574219, 0.10744476318359375, 0.11226081848144531, 0.11707687377929688, 0.12189292907714844, 0.126708984375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 7.0, 5.0, 3.0, 7.0, 9.0, 12.0, 11.0, 22.0, 26.0, 30.0, 44.0, 63.0, 74.0, 88.0, 99.0, 90.0, 102.0, 61.0, 54.0, 36.0, 40.0, 16.0, 28.0, 10.0, 17.0, 10.0, 11.0, 7.0, 8.0, 3.0, 5.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0380859375, -0.037030696868896484, -0.03597545623779297, -0.03492021560668945, -0.03386497497558594, -0.03280973434448242, -0.031754493713378906, -0.03069925308227539, -0.029644012451171875, -0.02858877182006836, -0.027533531188964844, -0.026478290557861328, -0.025423049926757812, -0.024367809295654297, -0.02331256866455078, -0.022257328033447266, -0.02120208740234375, -0.020146846771240234, -0.01909160614013672, -0.018036365509033203, -0.016981124877929688, -0.015925884246826172, -0.014870643615722656, -0.01381540298461914, -0.012760162353515625, -0.01170492172241211, -0.010649681091308594, -0.009594440460205078, -0.008539199829101562, -0.007483959197998047, -0.006428718566894531, -0.005373477935791016, -0.0043182373046875, -0.0032629966735839844, -0.0022077560424804688, -0.0011525154113769531, -9.72747802734375e-05, 0.0009579658508300781, 0.0020132064819335938, 0.0030684471130371094, 0.004123687744140625, 0.005178928375244141, 0.006234169006347656, 0.007289409637451172, 0.008344650268554688, 0.009399890899658203, 0.010455131530761719, 0.011510372161865234, 0.01256561279296875, 0.013620853424072266, 0.014676094055175781, 0.015731334686279297, 0.016786575317382812, 0.017841815948486328, 0.018897056579589844, 0.01995229721069336, 0.021007537841796875, 0.02206277847290039, 0.023118019104003906, 0.024173259735107422, 0.025228500366210938, 0.026283740997314453, 0.02733898162841797, 0.028394222259521484, 0.029449462890625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 18.0, 105.0, 197.0, 78.0, 41.0, 22.0, 10.0, 8.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8479621410369873, -0.8298379778862, -0.8117138743400574, -0.79358971118927, -0.7754656076431274, -0.7573414444923401, -0.7392173409461975, -0.7210931777954102, -0.7029690742492676, -0.6848449110984802, -0.6667208075523376, -0.6485966444015503, -0.6304725408554077, -0.6123483777046204, -0.5942242741584778, -0.5761001110076904, -0.5579760074615479, -0.5398518443107605, -0.5217277407646179, -0.5036035776138306, -0.485479474067688, -0.467355340719223, -0.44923120737075806, -0.4311070442199707, -0.41298288106918335, -0.3948587477207184, -0.3767346143722534, -0.35861048102378845, -0.3404863476753235, -0.3223622143268585, -0.30423808097839355, -0.2861139178276062, -0.267989844083786, -0.24986571073532104, -0.23174157738685608, -0.2136174440383911, -0.19549331068992615, -0.17736917734146118, -0.15924502909183502, -0.14112089574337006, -0.12299676239490509, -0.10487262904644012, -0.08674849569797516, -0.0686243548989296, -0.05050022155046463, -0.032376088201999664, -0.014251947402954102, 0.0038721859455108643, 0.02199631929397583, 0.040120452642440796, 0.05824458971619606, 0.07636872678995132, 0.09449286013841629, 0.11261699348688126, 0.13074113428592682, 0.14886526763439178, 0.16698940098285675, 0.18511353433132172, 0.20323766767978668, 0.22136181592941284, 0.2394859492778778, 0.2576100826263428, 0.27573421597480774, 0.2938583493232727, 0.31198248267173767]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 2.0, 9.0, 11.0, 10.0, 53.0, 113.0, 124.0, 85.0, 22.0, 19.0, 11.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1873171329498291, -0.1781158745288849, -0.16891461610794067, -0.15971335768699646, -0.15051209926605225, -0.14131084084510803, -0.132109597325325, -0.1229083389043808, -0.11370708048343658, -0.10450582206249237, -0.09530456364154816, -0.08610331267118454, -0.07690205425024033, -0.06770079582929611, -0.0584995411336422, -0.04929828643798828, -0.04009702801704407, -0.030895771458745003, -0.021694514900445938, -0.012493258342146873, -0.003292001783847809, 0.005909256637096405, 0.01511051133275032, 0.024311766028404236, 0.03351302444934845, 0.042714282870292664, 0.05191553756594658, 0.061116792261600494, 0.07031805068254471, 0.07951930910348892, 0.08872056007385254, 0.09792181849479675, 0.10712307691574097, 0.11632433533668518, 0.1255255937576294, 0.1347268521785736, 0.14392811059951782, 0.15312936902046204, 0.16233061254024506, 0.17153187096118927, 0.18073312938213348, 0.1899343878030777, 0.1991356462240219, 0.20833690464496613, 0.21753814816474915, 0.22673940658569336, 0.23594066500663757, 0.2451419234275818, 0.254343181848526, 0.2635444402694702, 0.27274569869041443, 0.28194695711135864, 0.29114821553230286, 0.30034947395324707, 0.3095507323741913, 0.3187519907951355, 0.3279532194137573, 0.33715447783470154, 0.34635573625564575, 0.35555699467658997, 0.3647582530975342, 0.3739595115184784, 0.3831607699394226, 0.39236199855804443, 0.40156328678131104]}, "eval/loss": 5.038694858551025, "eval/wer": 1.9940103133677112, "eval/runtime": 799.2667, "eval/samples_per_second": 3.306, "eval/steps_per_second": 0.277, "train/train_runtime": 6750.5443, "train/train_samples_per_second": 4.228, "train/train_steps_per_second": 0.176, "train/total_flos": 0.0, "train/train_loss": 4.993681282832704} \ No newline at end of file +{"train/loss": 4.843, "train/learning_rate": 4.354136429608128e-06, "train/epoch": 1.0, "train/global_step": 1189, "_runtime": 7982, "_timestamp": 1646301438, "_step": 1192, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 217.0, 781.0, 18.0], "bins": [-1056.006591796875, -1039.0478515625, -1022.089111328125, -1005.13037109375, -988.1715698242188, -971.2128295898438, -954.2540893554688, -937.2953491210938, -920.3366088867188, -903.3778686523438, -886.4191284179688, -869.4603271484375, -852.5015869140625, -835.5428466796875, -818.5841064453125, -801.6253662109375, -784.6666259765625, -767.7078857421875, -750.7491455078125, -733.7904052734375, -716.8316040039062, -699.8728637695312, -682.9141235351562, -665.9553833007812, -648.99658203125, -632.037841796875, -615.0791015625, -598.120361328125, -581.1615600585938, -564.2028198242188, -547.2440795898438, -530.2853393554688, -513.32666015625, -496.367919921875, -479.4091491699219, -462.4504089355469, -445.4916687011719, -428.53289794921875, -411.57415771484375, -394.61541748046875, -377.6566467285156, -360.6979064941406, -343.7391357421875, -326.7803955078125, -309.8216552734375, -292.8629150390625, -275.9041442871094, -258.9454040527344, -241.98663330078125, -225.0278778076172, -208.0691375732422, -191.11038208007812, -174.15164184570312, -157.19288635253906, -140.234130859375, -123.27538299560547, -106.31664276123047, -89.35789489746094, -72.39913940429688, -55.440391540527344, -38.48164367675781, -21.52289581298828, -4.564140319824219, 12.394607543945312, 29.353355407714844]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 7.0, 9.0, 8.0, 10.0, 13.0, 13.0, 16.0, 18.0, 24.0, 20.0, 22.0, 34.0, 28.0, 28.0, 38.0, 38.0, 39.0, 42.0, 42.0, 36.0, 43.0, 41.0, 29.0, 45.0, 38.0, 34.0, 36.0, 33.0, 21.0, 30.0, 20.0, 23.0, 22.0, 14.0, 13.0, 13.0, 13.0, 11.0, 5.0, 3.0, 2.0, 3.0, 2.0, 5.0, 1.0, 4.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-114.42926025390625, -110.70561981201172, -106.98198699951172, -103.25834655761719, -99.53471374511719, -95.81107330322266, -92.08743286132812, -88.36380004882812, -84.6401596069336, -80.91651916503906, -77.19288635253906, -73.46924591064453, -69.74560546875, -66.02197265625, -62.29833221435547, -58.5746955871582, -54.85105895996094, -51.12742233276367, -47.403785705566406, -43.680145263671875, -39.95650863647461, -36.232872009277344, -32.50923156738281, -28.785594940185547, -25.06195831298828, -21.338321685791016, -17.614683151245117, -13.891045570373535, -10.167407989501953, -6.4437713623046875, -2.720132827758789, 1.0035057067871094, 4.727142333984375, 8.450779914855957, 12.174417495727539, 15.898055076599121, 19.621692657470703, 23.34532928466797, 27.068967819213867, 30.792606353759766, 34.51624298095703, 38.2398796081543, 41.96351623535156, 45.687156677246094, 49.41079330444336, 53.134429931640625, 56.858070373535156, 60.58170700073242, 64.30534362792969, 68.02898406982422, 71.75261688232422, 75.47625732421875, 79.19989013671875, 82.92353057861328, 86.64717102050781, 90.37080383300781, 94.09444427490234, 97.81808471679688, 101.54171752929688, 105.2653579711914, 108.98899841308594, 112.71263122558594, 116.43627166748047, 120.159912109375, 123.883544921875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 7.0, 15.0, 17.0, 24.0, 28.0, 30.0, 42.0, 38.0, 64.0, 59.0, 65.0, 83.0, 72.0, 57.0, 71.0, 69.0, 62.0, 47.0, 36.0, 33.0, 19.0, 27.0, 12.0, 7.0, 6.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.900390625, -3.80816650390625, -3.7159423828125, -3.62371826171875, -3.531494140625, -3.43927001953125, -3.3470458984375, -3.25482177734375, -3.16259765625, -3.07037353515625, -2.9781494140625, -2.88592529296875, -2.793701171875, -2.70147705078125, -2.6092529296875, -2.51702880859375, -2.4248046875, -2.33258056640625, -2.2403564453125, -2.14813232421875, -2.055908203125, -1.96368408203125, -1.8714599609375, -1.77923583984375, -1.68701171875, -1.59478759765625, -1.5025634765625, -1.41033935546875, -1.318115234375, -1.22589111328125, -1.1336669921875, -1.04144287109375, -0.94921875, -0.85699462890625, -0.7647705078125, -0.67254638671875, -0.580322265625, -0.48809814453125, -0.3958740234375, -0.30364990234375, -0.21142578125, -0.11920166015625, -0.0269775390625, 0.06524658203125, 0.157470703125, 0.24969482421875, 0.3419189453125, 0.43414306640625, 0.5263671875, 0.61859130859375, 0.7108154296875, 0.80303955078125, 0.895263671875, 0.98748779296875, 1.0797119140625, 1.17193603515625, 1.26416015625, 1.35638427734375, 1.4486083984375, 1.54083251953125, 1.633056640625, 1.72528076171875, 1.8175048828125, 1.90972900390625, 2.001953125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 7.0, 15.0, 12.0, 22.0, 28.0, 49.0, 86.0, 120.0, 207.0, 382.0, 700.0, 1239.0, 2570.0, 7192.0, 74633.0, 4046930.0, 48887.0, 6218.0, 2302.0, 1196.0, 614.0, 331.0, 205.0, 116.0, 80.0, 50.0, 25.0, 26.0, 15.0, 8.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0], "bins": [-33.5, -32.710693359375, -31.92138671875, -31.132080078125, -30.3427734375, -29.553466796875, -28.76416015625, -27.974853515625, -27.185546875, -26.396240234375, -25.60693359375, -24.817626953125, -24.0283203125, -23.239013671875, -22.44970703125, -21.660400390625, -20.87109375, -20.081787109375, -19.29248046875, -18.503173828125, -17.7138671875, -16.924560546875, -16.13525390625, -15.345947265625, -14.556640625, -13.767333984375, -12.97802734375, -12.188720703125, -11.3994140625, -10.610107421875, -9.82080078125, -9.031494140625, -8.2421875, -7.452880859375, -6.66357421875, -5.874267578125, -5.0849609375, -4.295654296875, -3.50634765625, -2.717041015625, -1.927734375, -1.138427734375, -0.34912109375, 0.440185546875, 1.2294921875, 2.018798828125, 2.80810546875, 3.597412109375, 4.38671875, 5.176025390625, 5.96533203125, 6.754638671875, 7.5439453125, 8.333251953125, 9.12255859375, 9.911865234375, 10.701171875, 11.490478515625, 12.27978515625, 13.069091796875, 13.8583984375, 14.647705078125, 15.43701171875, 16.226318359375, 17.015625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 7.0, 21.0, 33.0, 33.0, 84.0, 166.0, 389.0, 1046.0, 1220.0, 553.0, 259.0, 132.0, 59.0, 35.0, 21.0, 11.0, 9.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.0625, -23.517333984375, -22.97216796875, -22.427001953125, -21.8818359375, -21.336669921875, -20.79150390625, -20.246337890625, -19.701171875, -19.156005859375, -18.61083984375, -18.065673828125, -17.5205078125, -16.975341796875, -16.43017578125, -15.885009765625, -15.33984375, -14.794677734375, -14.24951171875, -13.704345703125, -13.1591796875, -12.614013671875, -12.06884765625, -11.523681640625, -10.978515625, -10.433349609375, -9.88818359375, -9.343017578125, -8.7978515625, -8.252685546875, -7.70751953125, -7.162353515625, -6.6171875, -6.072021484375, -5.52685546875, -4.981689453125, -4.4365234375, -3.891357421875, -3.34619140625, -2.801025390625, -2.255859375, -1.710693359375, -1.16552734375, -0.620361328125, -0.0751953125, 0.469970703125, 1.01513671875, 1.560302734375, 2.10546875, 2.650634765625, 3.19580078125, 3.740966796875, 4.2861328125, 4.831298828125, 5.37646484375, 5.921630859375, 6.466796875, 7.011962890625, 7.55712890625, 8.102294921875, 8.6474609375, 9.192626953125, 9.73779296875, 10.282958984375, 10.828125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 0.0, 2.0, 12.0, 22.0, 46.0, 98.0, 231.0, 652.0, 3396.0, 3978798.0, 208211.0, 2032.0, 479.0, 169.0, 70.0, 35.0, 13.0, 5.0, 3.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.65625, -46.84423828125, -45.0322265625, -43.22021484375, -41.408203125, -39.59619140625, -37.7841796875, -35.97216796875, -34.16015625, -32.34814453125, -30.5361328125, -28.72412109375, -26.912109375, -25.10009765625, -23.2880859375, -21.47607421875, -19.6640625, -17.85205078125, -16.0400390625, -14.22802734375, -12.416015625, -10.60400390625, -8.7919921875, -6.97998046875, -5.16796875, -3.35595703125, -1.5439453125, 0.26806640625, 2.080078125, 3.89208984375, 5.7041015625, 7.51611328125, 9.328125, 11.14013671875, 12.9521484375, 14.76416015625, 16.576171875, 18.38818359375, 20.2001953125, 22.01220703125, 23.82421875, 25.63623046875, 27.4482421875, 29.26025390625, 31.072265625, 32.88427734375, 34.6962890625, 36.50830078125, 38.3203125, 40.13232421875, 41.9443359375, 43.75634765625, 45.568359375, 47.38037109375, 49.1923828125, 51.00439453125, 52.81640625, 54.62841796875, 56.4404296875, 58.25244140625, 60.064453125, 61.87646484375, 63.6884765625, 65.50048828125, 67.3125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 49.0, 264.0, 437.0, 201.0, 46.0, 6.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-123.02286529541016, -120.75912475585938, -118.4953842163086, -116.23163604736328, -113.9678955078125, -111.70415496826172, -109.44041442871094, -107.17667388916016, -104.91293334960938, -102.6491928100586, -100.38545227050781, -98.1217041015625, -95.85796356201172, -93.59422302246094, -91.33048248291016, -89.06674194335938, -86.80299377441406, -84.53925323486328, -82.2755126953125, -80.01176452636719, -77.7480239868164, -75.48428344726562, -73.22054290771484, -70.95680236816406, -68.69305419921875, -66.42931365966797, -64.16557312011719, -61.90182876586914, -59.638084411621094, -57.37434387207031, -55.11060333251953, -52.84686279296875, -50.58312225341797, -48.31938171386719, -46.05563735961914, -43.79189682006836, -41.52815246582031, -39.26441192626953, -37.00067138671875, -34.73693084716797, -32.47318649291992, -30.209444046020508, -27.945701599121094, -25.681961059570312, -23.4182186126709, -21.154476165771484, -18.890735626220703, -16.62699317932129, -14.363250732421875, -12.099508285522461, -9.835766792297363, -7.572024822235107, -5.308282852172852, -3.0445404052734375, -0.7807989120483398, 1.4829425811767578, 3.746685028076172, 6.010426998138428, 8.274168968200684, 10.537910461425781, 12.801652908325195, 15.06539535522461, 17.32913589477539, 19.592878341674805, 21.85662078857422]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 6.0, 6.0, 9.0, 3.0, 6.0, 12.0, 11.0, 16.0, 22.0, 21.0, 25.0, 23.0, 34.0, 35.0, 43.0, 26.0, 35.0, 35.0, 38.0, 45.0, 43.0, 37.0, 59.0, 43.0, 36.0, 51.0, 36.0, 24.0, 33.0, 27.0, 22.0, 28.0, 24.0, 16.0, 14.0, 14.0, 7.0, 8.0, 7.0, 9.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-34.01847839355469, -33.0948600769043, -32.171241760253906, -31.24762535095215, -30.32400894165039, -29.400390625, -28.47677230834961, -27.55315589904785, -26.629539489746094, -25.705921173095703, -24.782304763793945, -23.858686447143555, -22.935070037841797, -22.011451721191406, -21.087833404541016, -20.164216995239258, -19.240598678588867, -18.316980361938477, -17.39336395263672, -16.469745635986328, -15.54612922668457, -14.62251091003418, -13.698893547058105, -12.775276184082031, -11.851658821105957, -10.928041458129883, -10.004424095153809, -9.080806732177734, -8.157188415527344, -7.233571529388428, -6.309953689575195, -5.386336326599121, -4.462718963623047, -3.5391016006469727, -2.6154839992523193, -1.691866397857666, -0.7682490348815918, 0.15536832809448242, 1.0789861679077148, 2.002603530883789, 2.9262208938598633, 3.8498382568359375, 4.773455619812012, 5.697073459625244, 6.620690822601318, 7.544308185577393, 8.467926025390625, 9.3915433883667, 10.315160751342773, 11.238778114318848, 12.162395477294922, 13.086013793945312, 14.00963020324707, 14.933248519897461, 15.856865882873535, 16.78048324584961, 17.7041015625, 18.62771987915039, 19.55133628845215, 20.47495460510254, 21.398571014404297, 22.322189331054688, 23.245807647705078, 24.169424057006836, 25.093040466308594]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 10.0, 6.0, 15.0, 21.0, 27.0, 21.0, 28.0, 36.0, 40.0, 55.0, 63.0, 54.0, 75.0, 86.0, 60.0, 52.0, 61.0, 65.0, 71.0, 28.0, 29.0, 30.0, 27.0, 13.0, 12.0, 4.0, 6.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.791015625, -3.70184326171875, -3.6126708984375, -3.52349853515625, -3.434326171875, -3.34515380859375, -3.2559814453125, -3.16680908203125, -3.07763671875, -2.98846435546875, -2.8992919921875, -2.81011962890625, -2.720947265625, -2.63177490234375, -2.5426025390625, -2.45343017578125, -2.3642578125, -2.27508544921875, -2.1859130859375, -2.09674072265625, -2.007568359375, -1.91839599609375, -1.8292236328125, -1.74005126953125, -1.65087890625, -1.56170654296875, -1.4725341796875, -1.38336181640625, -1.294189453125, -1.20501708984375, -1.1158447265625, -1.02667236328125, -0.9375, -0.84832763671875, -0.7591552734375, -0.66998291015625, -0.580810546875, -0.49163818359375, -0.4024658203125, -0.31329345703125, -0.22412109375, -0.13494873046875, -0.0457763671875, 0.04339599609375, 0.132568359375, 0.22174072265625, 0.3109130859375, 0.40008544921875, 0.4892578125, 0.57843017578125, 0.6676025390625, 0.75677490234375, 0.845947265625, 0.93511962890625, 1.0242919921875, 1.11346435546875, 1.20263671875, 1.29180908203125, 1.3809814453125, 1.47015380859375, 1.559326171875, 1.64849853515625, 1.7376708984375, 1.82684326171875, 1.916015625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 7.0, 5.0, 7.0, 6.0, 6.0, 7.0, 5.0, 13.0, 17.0, 17.0, 16.0, 39.0, 78.0, 116.0, 212.0, 420.0, 748.0, 1611.0, 3090.0, 6104.0, 12240.0, 27212.0, 64617.0, 171225.0, 427432.0, 200779.0, 73960.0, 30795.0, 14087.0, 6834.0, 3285.0, 1639.0, 866.0, 470.0, 223.0, 140.0, 65.0, 48.0, 27.0, 18.0, 15.0, 17.0, 7.0, 10.0, 4.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.0265960693359375, -0.02575373649597168, -0.02491140365600586, -0.02406907081604004, -0.02322673797607422, -0.0223844051361084, -0.021542072296142578, -0.020699739456176758, -0.019857406616210938, -0.019015073776245117, -0.018172740936279297, -0.017330408096313477, -0.016488075256347656, -0.015645742416381836, -0.014803409576416016, -0.013961076736450195, -0.013118743896484375, -0.012276411056518555, -0.011434078216552734, -0.010591745376586914, -0.009749412536621094, -0.008907079696655273, -0.008064746856689453, -0.007222414016723633, -0.0063800811767578125, -0.005537748336791992, -0.004695415496826172, -0.0038530826568603516, -0.0030107498168945312, -0.002168416976928711, -0.0013260841369628906, -0.0004837512969970703, 0.00035858154296875, 0.0012009143829345703, 0.0020432472229003906, 0.002885580062866211, 0.0037279129028320312, 0.0045702457427978516, 0.005412578582763672, 0.006254911422729492, 0.0070972442626953125, 0.007939577102661133, 0.008781909942626953, 0.009624242782592773, 0.010466575622558594, 0.011308908462524414, 0.012151241302490234, 0.012993574142456055, 0.013835906982421875, 0.014678239822387695, 0.015520572662353516, 0.016362905502319336, 0.017205238342285156, 0.018047571182250977, 0.018889904022216797, 0.019732236862182617, 0.020574569702148438, 0.021416902542114258, 0.022259235382080078, 0.0231015682220459, 0.02394390106201172, 0.02478623390197754, 0.02562856674194336, 0.02647089958190918, 0.027313232421875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 5.0, 4.0, 2.0, 1.0, 15.0, 13.0, 8.0, 11.0, 9.0, 16.0, 18.0, 20.0, 20.0, 30.0, 31.0, 42.0, 36.0, 36.0, 25.0, 41.0, 33.0, 40.0, 1067.0, 54.0, 44.0, 33.0, 30.0, 41.0, 35.0, 28.0, 27.0, 29.0, 29.0, 23.0, 14.0, 20.0, 16.0, 14.0, 12.0, 16.0, 4.0, 8.0, 8.0, 2.0, 10.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.36328125, -1.318939208984375, -1.27459716796875, -1.230255126953125, -1.1859130859375, -1.141571044921875, -1.09722900390625, -1.052886962890625, -1.008544921875, -0.964202880859375, -0.91986083984375, -0.875518798828125, -0.8311767578125, -0.786834716796875, -0.74249267578125, -0.698150634765625, -0.65380859375, -0.609466552734375, -0.56512451171875, -0.520782470703125, -0.4764404296875, -0.432098388671875, -0.38775634765625, -0.343414306640625, -0.299072265625, -0.254730224609375, -0.21038818359375, -0.166046142578125, -0.1217041015625, -0.077362060546875, -0.03302001953125, 0.011322021484375, 0.0556640625, 0.100006103515625, 0.14434814453125, 0.188690185546875, 0.2330322265625, 0.277374267578125, 0.32171630859375, 0.366058349609375, 0.410400390625, 0.454742431640625, 0.49908447265625, 0.543426513671875, 0.5877685546875, 0.632110595703125, 0.67645263671875, 0.720794677734375, 0.76513671875, 0.809478759765625, 0.85382080078125, 0.898162841796875, 0.9425048828125, 0.986846923828125, 1.03118896484375, 1.075531005859375, 1.119873046875, 1.164215087890625, 1.20855712890625, 1.252899169921875, 1.2972412109375, 1.341583251953125, 1.38592529296875, 1.430267333984375, 1.474609375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 7.0, 23.0, 35.0, 41.0, 54.0, 83.0, 139.0, 217.0, 378.0, 511.0, 747.0, 1248.0, 1904.0, 2893.0, 4715.0, 7578.0, 12278.0, 20482.0, 33846.0, 57472.0, 100595.0, 180120.0, 1291669.0, 160061.0, 90063.0, 51384.0, 30446.0, 18190.0, 11123.0, 6870.0, 4364.0, 2676.0, 1766.0, 1074.0, 724.0, 450.0, 331.0, 185.0, 136.0, 98.0, 52.0, 35.0, 32.0, 20.0, 10.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.00634002685546875, -0.006150186061859131, -0.005960345268249512, -0.005770504474639893, -0.0055806636810302734, -0.005390822887420654, -0.005200982093811035, -0.005011141300201416, -0.004821300506591797, -0.004631459712982178, -0.004441618919372559, -0.0042517781257629395, -0.00406193733215332, -0.003872096538543701, -0.003682255744934082, -0.003492414951324463, -0.0033025741577148438, -0.0031127333641052246, -0.0029228925704956055, -0.0027330517768859863, -0.002543210983276367, -0.002353370189666748, -0.002163529396057129, -0.0019736886024475098, -0.0017838478088378906, -0.0015940070152282715, -0.0014041662216186523, -0.0012143254280090332, -0.001024484634399414, -0.0008346438407897949, -0.0006448030471801758, -0.00045496225357055664, -0.0002651214599609375, -7.528066635131836e-05, 0.00011456012725830078, 0.0003044009208679199, 0.0004942417144775391, 0.0006840825080871582, 0.0008739233016967773, 0.0010637640953063965, 0.0012536048889160156, 0.0014434456825256348, 0.001633286476135254, 0.001823127269744873, 0.002012968063354492, 0.0022028088569641113, 0.0023926496505737305, 0.0025824904441833496, 0.0027723312377929688, 0.002962172031402588, 0.003152012825012207, 0.003341853618621826, 0.0035316944122314453, 0.0037215352058410645, 0.003911375999450684, 0.004101216793060303, 0.004291057586669922, 0.004480898380279541, 0.00467073917388916, 0.004860579967498779, 0.0050504207611083984, 0.005240261554718018, 0.005430102348327637, 0.005619943141937256, 0.005809783935546875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 0.0, 0.0, 5.0, 0.0, 0.0, 11.0, 0.0, 13.0, 0.0, 0.0, 18.0, 0.0, 0.0, 19.0, 0.0, 40.0, 0.0, 0.0, 44.0, 0.0, 0.0, 74.0, 0.0, 145.0, 0.0, 0.0, 286.0, 0.0, 0.0, 132.0, 0.0, 62.0, 0.0, 0.0, 46.0, 0.0, 0.0, 42.0, 0.0, 20.0, 0.0, 0.0, 20.0, 0.0, 0.0, 16.0, 0.0, 5.0, 0.0, 0.0, 10.0, 0.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.556510925292969e-07, -6.332993507385254e-07, -6.109476089477539e-07, -5.885958671569824e-07, -5.662441253662109e-07, -5.438923835754395e-07, -5.21540641784668e-07, -4.991888999938965e-07, -4.76837158203125e-07, -4.544854164123535e-07, -4.3213367462158203e-07, -4.0978193283081055e-07, -3.8743019104003906e-07, -3.650784492492676e-07, -3.427267074584961e-07, -3.203749656677246e-07, -2.980232238769531e-07, -2.7567148208618164e-07, -2.5331974029541016e-07, -2.3096799850463867e-07, -2.086162567138672e-07, -1.862645149230957e-07, -1.6391277313232422e-07, -1.4156103134155273e-07, -1.1920928955078125e-07, -9.685754776000977e-08, -7.450580596923828e-08, -5.21540641784668e-08, -2.9802322387695312e-08, -7.450580596923828e-09, 1.4901161193847656e-08, 3.725290298461914e-08, 5.960464477539063e-08, 8.195638656616211e-08, 1.043081283569336e-07, 1.2665987014770508e-07, 1.4901161193847656e-07, 1.7136335372924805e-07, 1.9371509552001953e-07, 2.1606683731079102e-07, 2.384185791015625e-07, 2.60770320892334e-07, 2.8312206268310547e-07, 3.0547380447387695e-07, 3.2782554626464844e-07, 3.501772880554199e-07, 3.725290298461914e-07, 3.948807716369629e-07, 4.172325134277344e-07, 4.3958425521850586e-07, 4.6193599700927734e-07, 4.842877388000488e-07, 5.066394805908203e-07, 5.289912223815918e-07, 5.513429641723633e-07, 5.736947059631348e-07, 5.960464477539062e-07, 6.183981895446777e-07, 6.407499313354492e-07, 6.631016731262207e-07, 6.854534149169922e-07, 7.078051567077637e-07, 7.301568984985352e-07, 7.525086402893066e-07, 7.748603820800781e-07]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 7.0, 3.0, 1.0, 0.0, 4.0, 3.0, 10.0, 10.0, 7.0, 15.0, 11.0, 15.0, 18.0, 18.0, 38.0, 42.0, 55.0, 53.0, 38.0, 107.0, 108.0, 178.0, 238.0, 611.0, 903227.0, 142241.0, 526.0, 243.0, 175.0, 89.0, 92.0, 68.0, 54.0, 53.0, 31.0, 44.0, 21.0, 23.0, 15.0, 6.0, 19.0, 8.0, 5.0, 9.0, 5.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.7881393432617188e-05, -1.7354264855384827e-05, -1.6827136278152466e-05, -1.6300007700920105e-05, -1.5772879123687744e-05, -1.5245750546455383e-05, -1.4718621969223022e-05, -1.4191493391990662e-05, -1.36643648147583e-05, -1.313723623752594e-05, -1.2610107660293579e-05, -1.2082979083061218e-05, -1.1555850505828857e-05, -1.1028721928596497e-05, -1.0501593351364136e-05, -9.974464774131775e-06, -9.447336196899414e-06, -8.920207619667053e-06, -8.393079042434692e-06, -7.865950465202332e-06, -7.338821887969971e-06, -6.81169331073761e-06, -6.284564733505249e-06, -5.757436156272888e-06, -5.230307579040527e-06, -4.7031790018081665e-06, -4.176050424575806e-06, -3.648921847343445e-06, -3.121793270111084e-06, -2.594664692878723e-06, -2.0675361156463623e-06, -1.5404075384140015e-06, -1.0132789611816406e-06, -4.861503839492798e-07, 4.0978193283081055e-08, 5.681067705154419e-07, 1.0952353477478027e-06, 1.6223639249801636e-06, 2.1494925022125244e-06, 2.6766210794448853e-06, 3.203749656677246e-06, 3.730878233909607e-06, 4.258006811141968e-06, 4.785135388374329e-06, 5.3122639656066895e-06, 5.83939254283905e-06, 6.366521120071411e-06, 6.893649697303772e-06, 7.420778274536133e-06, 7.947906851768494e-06, 8.475035429000854e-06, 9.002164006233215e-06, 9.529292583465576e-06, 1.0056421160697937e-05, 1.0583549737930298e-05, 1.1110678315162659e-05, 1.163780689239502e-05, 1.216493546962738e-05, 1.2692064046859741e-05, 1.3219192624092102e-05, 1.3746321201324463e-05, 1.4273449778556824e-05, 1.4800578355789185e-05, 1.5327706933021545e-05, 1.5854835510253906e-05]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 17.0, 143.0, 601.0, 215.0, 32.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.332940749118279e-07, -8.995003213385644e-07, -8.65706510921882e-07, -8.319127573486185e-07, -7.981190037753549e-07, -7.643251933586725e-07, -7.30531439785409e-07, -6.967376293687266e-07, -6.629438757954631e-07, -6.291501222221996e-07, -5.953563118055172e-07, -5.615625582322537e-07, -5.277687478155713e-07, -4.939749942423077e-07, -4.601812406690442e-07, -4.2638745867407124e-07, -3.925936766790983e-07, -3.587998946841253e-07, -3.2500611268915236e-07, -2.9121235911588883e-07, -2.5741857712091587e-07, -2.236247951259429e-07, -1.8983102734182467e-07, -1.5603725955770642e-07, -1.2224347756273346e-07, -8.844970267318786e-08, -5.4655927783642255e-08, -2.0862152894096653e-08, 1.293162199544895e-08, 4.672540399042191e-08, 8.051917177454015e-08, 1.143129395586584e-07, 1.481066647102125e-07, 1.8190044670518546e-07, 2.156942144893037e-07, 2.4948798227342195e-07, 2.832817642683949e-07, 3.1707554626336787e-07, 3.508692998366314e-07, 3.8466308183160436e-07, 4.184568638265773e-07, 4.522506458215503e-07, 4.860444278165232e-07, 5.198381813897868e-07, 5.536319349630503e-07, 5.874257453797327e-07, 6.212194989529962e-07, 6.550133093696786e-07, 6.888070629429421e-07, 7.226008165162057e-07, 7.563946269328881e-07, 7.901883805061516e-07, 8.23982190922834e-07, 8.577759444960975e-07, 8.91569698069361e-07, 9.253634516426246e-07, 9.59157205215888e-07, 9.929509587891516e-07, 1.0267447123624152e-06, 1.0605385796225164e-06, 1.09433233319578e-06, 1.1281260867690435e-06, 1.161919840342307e-06, 1.1957135939155705e-06, 1.2295074611756718e-06]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 0.0, 28.0, 0.0, 0.0, 0.0, 0.0, 56.0, 0.0, 0.0, 0.0, 106.0, 0.0, 0.0, 0.0, 156.0, 0.0, 0.0, 0.0, 242.0, 0.0, 0.0, 0.0, 0.0, 184.0, 0.0, 0.0, 0.0, 112.0, 0.0, 0.0, 0.0, 62.0, 0.0, 0.0, 0.0, 29.0, 0.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.172325134277344e-07, -4.032626748085022e-07, -3.8929283618927e-07, -3.7532299757003784e-07, -3.6135315895080566e-07, -3.473833203315735e-07, -3.334134817123413e-07, -3.1944364309310913e-07, -3.0547380447387695e-07, -2.915039658546448e-07, -2.775341272354126e-07, -2.635642886161804e-07, -2.4959444999694824e-07, -2.3562461137771606e-07, -2.2165477275848389e-07, -2.076849341392517e-07, -1.9371509552001953e-07, -1.7974525690078735e-07, -1.6577541828155518e-07, -1.51805579662323e-07, -1.3783574104309082e-07, -1.2386590242385864e-07, -1.0989606380462646e-07, -9.592622518539429e-08, -8.195638656616211e-08, -6.798654794692993e-08, -5.4016709327697754e-08, -4.0046870708465576e-08, -2.60770320892334e-08, -1.210719347000122e-08, 1.862645149230957e-09, 1.5832483768463135e-08, 2.9802322387695312e-08, 4.377216100692749e-08, 5.774199962615967e-08, 7.171183824539185e-08, 8.568167686462402e-08, 9.96515154838562e-08, 1.1362135410308838e-07, 1.2759119272232056e-07, 1.4156103134155273e-07, 1.555308699607849e-07, 1.695007085800171e-07, 1.8347054719924927e-07, 1.9744038581848145e-07, 2.1141022443771362e-07, 2.253800630569458e-07, 2.39349901676178e-07, 2.5331974029541016e-07, 2.6728957891464233e-07, 2.812594175338745e-07, 2.952292561531067e-07, 3.0919909477233887e-07, 3.2316893339157104e-07, 3.371387720108032e-07, 3.511086106300354e-07, 3.650784492492676e-07, 3.7904828786849976e-07, 3.9301812648773193e-07, 4.069879651069641e-07, 4.209578037261963e-07, 4.3492764234542847e-07, 4.4889748096466064e-07, 4.628673195838928e-07, 4.76837158203125e-07]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 10.0, 6.0, 15.0, 21.0, 27.0, 21.0, 28.0, 36.0, 40.0, 55.0, 63.0, 54.0, 75.0, 86.0, 60.0, 52.0, 61.0, 65.0, 71.0, 28.0, 29.0, 30.0, 27.0, 13.0, 12.0, 4.0, 6.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.791015625, -3.70184326171875, -3.6126708984375, -3.52349853515625, -3.434326171875, -3.34515380859375, -3.2559814453125, -3.16680908203125, -3.07763671875, -2.98846435546875, -2.8992919921875, -2.81011962890625, -2.720947265625, -2.63177490234375, -2.5426025390625, -2.45343017578125, -2.3642578125, -2.27508544921875, -2.1859130859375, -2.09674072265625, -2.007568359375, -1.91839599609375, -1.8292236328125, -1.74005126953125, -1.65087890625, -1.56170654296875, -1.4725341796875, -1.38336181640625, -1.294189453125, -1.20501708984375, -1.1158447265625, -1.02667236328125, -0.9375, -0.84832763671875, -0.7591552734375, -0.66998291015625, -0.580810546875, -0.49163818359375, -0.4024658203125, -0.31329345703125, -0.22412109375, -0.13494873046875, -0.0457763671875, 0.04339599609375, 0.132568359375, 0.22174072265625, 0.3109130859375, 0.40008544921875, 0.4892578125, 0.57843017578125, 0.6676025390625, 0.75677490234375, 0.845947265625, 0.93511962890625, 1.0242919921875, 1.11346435546875, 1.20263671875, 1.29180908203125, 1.3809814453125, 1.47015380859375, 1.559326171875, 1.64849853515625, 1.7376708984375, 1.82684326171875, 1.916015625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 10.0, 17.0, 41.0, 76.0, 140.0, 243.0, 395.0, 659.0, 1025.0, 1766.0, 3819.0, 10559.0, 83112.0, 890555.0, 41001.0, 8067.0, 3192.0, 1591.0, 899.0, 571.0, 342.0, 200.0, 131.0, 63.0, 29.0, 12.0, 14.0, 6.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-22.40625, -21.735107421875, -21.06396484375, -20.392822265625, -19.7216796875, -19.050537109375, -18.37939453125, -17.708251953125, -17.037109375, -16.365966796875, -15.69482421875, -15.023681640625, -14.3525390625, -13.681396484375, -13.01025390625, -12.339111328125, -11.66796875, -10.996826171875, -10.32568359375, -9.654541015625, -8.9833984375, -8.312255859375, -7.64111328125, -6.969970703125, -6.298828125, -5.627685546875, -4.95654296875, -4.285400390625, -3.6142578125, -2.943115234375, -2.27197265625, -1.600830078125, -0.9296875, -0.258544921875, 0.41259765625, 1.083740234375, 1.7548828125, 2.426025390625, 3.09716796875, 3.768310546875, 4.439453125, 5.110595703125, 5.78173828125, 6.452880859375, 7.1240234375, 7.795166015625, 8.46630859375, 9.137451171875, 9.80859375, 10.479736328125, 11.15087890625, 11.822021484375, 12.4931640625, 13.164306640625, 13.83544921875, 14.506591796875, 15.177734375, 15.848876953125, 16.52001953125, 17.191162109375, 17.8623046875, 18.533447265625, 19.20458984375, 19.875732421875, 20.546875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 11.0, 6.0, 12.0, 10.0, 17.0, 17.0, 17.0, 21.0, 30.0, 27.0, 36.0, 43.0, 45.0, 31.0, 49.0, 64.0, 93.0, 164.0, 1496.0, 258.0, 105.0, 72.0, 49.0, 53.0, 51.0, 48.0, 24.0, 28.0, 32.0, 16.0, 21.0, 14.0, 18.0, 14.0, 13.0, 5.0, 3.0, 5.0, 12.0, 5.0, 6.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.0078125, -4.83306884765625, -4.6583251953125, -4.48358154296875, -4.308837890625, -4.13409423828125, -3.9593505859375, -3.78460693359375, -3.60986328125, -3.43511962890625, -3.2603759765625, -3.08563232421875, -2.910888671875, -2.73614501953125, -2.5614013671875, -2.38665771484375, -2.2119140625, -2.03717041015625, -1.8624267578125, -1.68768310546875, -1.512939453125, -1.33819580078125, -1.1634521484375, -0.98870849609375, -0.81396484375, -0.63922119140625, -0.4644775390625, -0.28973388671875, -0.114990234375, 0.05975341796875, 0.2344970703125, 0.40924072265625, 0.583984375, 0.75872802734375, 0.9334716796875, 1.10821533203125, 1.282958984375, 1.45770263671875, 1.6324462890625, 1.80718994140625, 1.98193359375, 2.15667724609375, 2.3314208984375, 2.50616455078125, 2.680908203125, 2.85565185546875, 3.0303955078125, 3.20513916015625, 3.3798828125, 3.55462646484375, 3.7293701171875, 3.90411376953125, 4.078857421875, 4.25360107421875, 4.4283447265625, 4.60308837890625, 4.77783203125, 4.95257568359375, 5.1273193359375, 5.30206298828125, 5.476806640625, 5.65155029296875, 5.8262939453125, 6.00103759765625, 6.17578125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 7.0, 10.0, 4.0, 2.0, 6.0, 13.0, 12.0, 22.0, 20.0, 20.0, 20.0, 37.0, 39.0, 63.0, 95.0, 131.0, 242.0, 650.0, 3617.0, 254763.0, 2874626.0, 9446.0, 994.0, 332.0, 164.0, 75.0, 62.0, 41.0, 33.0, 32.0, 25.0, 17.0, 20.0, 16.0, 8.0, 11.0, 3.0, 10.0, 4.0, 6.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-25.59375, -24.885986328125, -24.17822265625, -23.470458984375, -22.7626953125, -22.054931640625, -21.34716796875, -20.639404296875, -19.931640625, -19.223876953125, -18.51611328125, -17.808349609375, -17.1005859375, -16.392822265625, -15.68505859375, -14.977294921875, -14.26953125, -13.561767578125, -12.85400390625, -12.146240234375, -11.4384765625, -10.730712890625, -10.02294921875, -9.315185546875, -8.607421875, -7.899658203125, -7.19189453125, -6.484130859375, -5.7763671875, -5.068603515625, -4.36083984375, -3.653076171875, -2.9453125, -2.237548828125, -1.52978515625, -0.822021484375, -0.1142578125, 0.593505859375, 1.30126953125, 2.009033203125, 2.716796875, 3.424560546875, 4.13232421875, 4.840087890625, 5.5478515625, 6.255615234375, 6.96337890625, 7.671142578125, 8.37890625, 9.086669921875, 9.79443359375, 10.502197265625, 11.2099609375, 11.917724609375, 12.62548828125, 13.333251953125, 14.041015625, 14.748779296875, 15.45654296875, 16.164306640625, 16.8720703125, 17.579833984375, 18.28759765625, 18.995361328125, 19.703125]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 29.0, 921.0, 66.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-289.0257873535156, -283.7305908203125, -278.43536376953125, -273.1401672363281, -267.8449401855469, -262.54974365234375, -257.2545166015625, -251.9593048095703, -246.66409301757812, -241.36888122558594, -236.07366943359375, -230.77845764160156, -225.48324584960938, -220.1880340576172, -214.892822265625, -209.5976104736328, -204.30239868164062, -199.00718688964844, -193.71197509765625, -188.41676330566406, -183.12155151367188, -177.8263397216797, -172.5311279296875, -167.2359161376953, -161.9407196044922, -156.6455078125, -151.3502960205078, -146.05508422851562, -140.75987243652344, -135.46466064453125, -130.16944885253906, -124.87423706054688, -119.57903289794922, -114.28382110595703, -108.98860931396484, -103.69339752197266, -98.39818572998047, -93.10297393798828, -87.80776977539062, -82.51255798339844, -77.21734619140625, -71.92213439941406, -66.62692260742188, -61.33171081542969, -56.0364990234375, -50.74128723144531, -45.44607925415039, -40.1508674621582, -34.85565185546875, -29.560440063476562, -24.265228271484375, -18.97001838684082, -13.674806594848633, -8.379594802856445, -3.0843849182128906, 2.210826873779297, 7.506038665771484, 12.801250457763672, 18.09646224975586, 23.391672134399414, 28.6868839263916, 33.982093811035156, 39.277305603027344, 44.57251739501953, 49.86772918701172]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 3.0, 5.0, 10.0, 13.0, 25.0, 19.0, 18.0, 28.0, 30.0, 34.0, 24.0, 38.0, 40.0, 48.0, 32.0, 47.0, 59.0, 42.0, 45.0, 47.0, 50.0, 39.0, 35.0, 42.0, 43.0, 35.0, 27.0, 25.0, 17.0, 21.0, 12.0, 9.0, 7.0, 5.0, 3.0, 4.0, 4.0, 11.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.69549560546875, -19.965490341186523, -19.23548698425293, -18.505481719970703, -17.77547836303711, -17.045473098754883, -16.315467834472656, -15.585463523864746, -14.855459213256836, -14.125454902648926, -13.395450592041016, -12.665445327758789, -11.935441017150879, -11.205436706542969, -10.475431442260742, -9.745427131652832, -9.015422821044922, -8.285418510437012, -7.555413722991943, -6.825408935546875, -6.095404624938965, -5.365400314331055, -4.635395526885986, -3.905390739440918, -3.175386428833008, -2.4453818798065186, -1.7153773307800293, -0.98537278175354, -0.2553682327270508, 0.4746363162994385, 1.2046408653259277, 1.934645652770996, 2.6646499633789062, 3.3946545124053955, 4.124659061431885, 4.854663848876953, 5.584668159484863, 6.314672470092773, 7.044677257537842, 7.77468204498291, 8.50468635559082, 9.23469066619873, 9.96469497680664, 10.694700241088867, 11.424704551696777, 12.154708862304688, 12.884714126586914, 13.614718437194824, 14.344722747802734, 15.074727058410645, 15.804731369018555, 16.53473663330078, 17.264739990234375, 17.9947452545166, 18.724750518798828, 19.454753875732422, 20.18475914001465, 20.914764404296875, 21.64476776123047, 22.374773025512695, 23.104778289794922, 23.834781646728516, 24.564786911010742, 25.29479217529297, 26.024795532226562]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 8.0, 6.0, 11.0, 15.0, 29.0, 19.0, 22.0, 31.0, 29.0, 53.0, 67.0, 46.0, 67.0, 79.0, 65.0, 59.0, 61.0, 60.0, 74.0, 49.0, 35.0, 28.0, 28.0, 18.0, 19.0, 7.0, 6.0, 5.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.775390625, -3.685943603515625, -3.59649658203125, -3.507049560546875, -3.4176025390625, -3.328155517578125, -3.23870849609375, -3.149261474609375, -3.059814453125, -2.970367431640625, -2.88092041015625, -2.791473388671875, -2.7020263671875, -2.612579345703125, -2.52313232421875, -2.433685302734375, -2.34423828125, -2.254791259765625, -2.16534423828125, -2.075897216796875, -1.9864501953125, -1.897003173828125, -1.80755615234375, -1.718109130859375, -1.628662109375, -1.539215087890625, -1.44976806640625, -1.360321044921875, -1.2708740234375, -1.181427001953125, -1.09197998046875, -1.002532958984375, -0.9130859375, -0.823638916015625, -0.73419189453125, -0.644744873046875, -0.5552978515625, -0.465850830078125, -0.37640380859375, -0.286956787109375, -0.197509765625, -0.108062744140625, -0.01861572265625, 0.070831298828125, 0.1602783203125, 0.249725341796875, 0.33917236328125, 0.428619384765625, 0.51806640625, 0.607513427734375, 0.69696044921875, 0.786407470703125, 0.8758544921875, 0.965301513671875, 1.05474853515625, 1.144195556640625, 1.233642578125, 1.323089599609375, 1.41253662109375, 1.501983642578125, 1.5914306640625, 1.680877685546875, 1.77032470703125, 1.859771728515625, 1.94921875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 4.0, 13.0, 18.0, 32.0, 36.0, 79.0, 132.0, 168.0, 370.0, 640.0, 1587.0, 10153.0, 3024651.0, 1146519.0, 7178.0, 1338.0, 575.0, 307.0, 194.0, 106.0, 68.0, 30.0, 34.0, 13.0, 13.0, 7.0, 5.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-37.90625, -37.04345703125, -36.1806640625, -35.31787109375, -34.455078125, -33.59228515625, -32.7294921875, -31.86669921875, -31.00390625, -30.14111328125, -29.2783203125, -28.41552734375, -27.552734375, -26.68994140625, -25.8271484375, -24.96435546875, -24.1015625, -23.23876953125, -22.3759765625, -21.51318359375, -20.650390625, -19.78759765625, -18.9248046875, -18.06201171875, -17.19921875, -16.33642578125, -15.4736328125, -14.61083984375, -13.748046875, -12.88525390625, -12.0224609375, -11.15966796875, -10.296875, -9.43408203125, -8.5712890625, -7.70849609375, -6.845703125, -5.98291015625, -5.1201171875, -4.25732421875, -3.39453125, -2.53173828125, -1.6689453125, -0.80615234375, 0.056640625, 0.91943359375, 1.7822265625, 2.64501953125, 3.5078125, 4.37060546875, 5.2333984375, 6.09619140625, 6.958984375, 7.82177734375, 8.6845703125, 9.54736328125, 10.41015625, 11.27294921875, 12.1357421875, 12.99853515625, 13.861328125, 14.72412109375, 15.5869140625, 16.44970703125, 17.3125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 9.0, 3.0, 7.0, 15.0, 27.0, 49.0, 109.0, 194.0, 379.0, 587.0, 979.0, 762.0, 417.0, 248.0, 148.0, 69.0, 26.0, 20.0, 11.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4140625, -10.0234375, -9.6328125, -9.2421875, -8.8515625, -8.4609375, -8.0703125, -7.6796875, -7.2890625, -6.8984375, -6.5078125, -6.1171875, -5.7265625, -5.3359375, -4.9453125, -4.5546875, -4.1640625, -3.7734375, -3.3828125, -2.9921875, -2.6015625, -2.2109375, -1.8203125, -1.4296875, -1.0390625, -0.6484375, -0.2578125, 0.1328125, 0.5234375, 0.9140625, 1.3046875, 1.6953125, 2.0859375, 2.4765625, 2.8671875, 3.2578125, 3.6484375, 4.0390625, 4.4296875, 4.8203125, 5.2109375, 5.6015625, 5.9921875, 6.3828125, 6.7734375, 7.1640625, 7.5546875, 7.9453125, 8.3359375, 8.7265625, 9.1171875, 9.5078125, 9.8984375, 10.2890625, 10.6796875, 11.0703125, 11.4609375, 11.8515625, 12.2421875, 12.6328125, 13.0234375, 13.4140625, 13.8046875, 14.1953125, 14.5859375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 3.0, 15.0, 24.0, 34.0, 82.0, 142.0, 285.0, 759.0, 2619.0, 22624.0, 1816579.0, 2320396.0, 26527.0, 2745.0, 840.0, 336.0, 126.0, 69.0, 41.0, 16.0, 15.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.28125, -18.40576171875, -17.5302734375, -16.65478515625, -15.779296875, -14.90380859375, -14.0283203125, -13.15283203125, -12.27734375, -11.40185546875, -10.5263671875, -9.65087890625, -8.775390625, -7.89990234375, -7.0244140625, -6.14892578125, -5.2734375, -4.39794921875, -3.5224609375, -2.64697265625, -1.771484375, -0.89599609375, -0.0205078125, 0.85498046875, 1.73046875, 2.60595703125, 3.4814453125, 4.35693359375, 5.232421875, 6.10791015625, 6.9833984375, 7.85888671875, 8.734375, 9.60986328125, 10.4853515625, 11.36083984375, 12.236328125, 13.11181640625, 13.9873046875, 14.86279296875, 15.73828125, 16.61376953125, 17.4892578125, 18.36474609375, 19.240234375, 20.11572265625, 20.9912109375, 21.86669921875, 22.7421875, 23.61767578125, 24.4931640625, 25.36865234375, 26.244140625, 27.11962890625, 27.9951171875, 28.87060546875, 29.74609375, 30.62158203125, 31.4970703125, 32.37255859375, 33.248046875, 34.12353515625, 34.9990234375, 35.87451171875, 36.75]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 110.0, 393.0, 411.0, 92.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.30104064941406, -32.240684509277344, -28.18033218383789, -24.119977951049805, -20.05962371826172, -15.999269485473633, -11.938915252685547, -7.878561019897461, -3.818206787109375, 0.24214744567871094, 4.302501678466797, 8.362855911254883, 12.423210144042969, 16.483564376831055, 20.54391860961914, 24.604272842407227, 28.664627075195312, 32.72498321533203, 36.785335540771484, 40.84568786621094, 44.906044006347656, 48.966400146484375, 53.02675247192383, 57.08710479736328, 61.1474609375, 65.20781707763672, 69.26817321777344, 73.32852172851562, 77.38887786865234, 81.44923400878906, 85.50958251953125, 89.56993865966797, 93.63031005859375, 97.69066619873047, 101.75102233886719, 105.81137084960938, 109.8717269897461, 113.93208312988281, 117.992431640625, 122.05278778076172, 126.11314392089844, 130.17349243164062, 134.23385620117188, 138.29420471191406, 142.35455322265625, 146.4149169921875, 150.4752655029297, 154.53562927246094, 158.59597778320312, 162.6563262939453, 166.71669006347656, 170.77703857421875, 174.83740234375, 178.8977508544922, 182.95809936523438, 187.01846313476562, 191.0788116455078, 195.13916015625, 199.19952392578125, 203.25987243652344, 207.32022094726562, 211.38058471679688, 215.44093322753906, 219.5012969970703, 223.5616455078125]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 7.0, 7.0, 8.0, 7.0, 13.0, 22.0, 18.0, 20.0, 18.0, 32.0, 33.0, 29.0, 36.0, 40.0, 31.0, 36.0, 38.0, 38.0, 46.0, 43.0, 38.0, 38.0, 45.0, 29.0, 35.0, 44.0, 28.0, 30.0, 25.0, 22.0, 26.0, 17.0, 14.0, 10.0, 15.0, 9.0, 13.0, 7.0, 9.0, 2.0, 4.0, 8.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-25.921432495117188, -25.211803436279297, -24.502172470092773, -23.79254150390625, -23.08291244506836, -22.37328338623047, -21.663652420043945, -20.954021453857422, -20.24439239501953, -19.53476333618164, -18.825132369995117, -18.115501403808594, -17.405872344970703, -16.696243286132812, -15.986612319946289, -15.276982307434082, -14.567352294921875, -13.857722282409668, -13.148092269897461, -12.438462257385254, -11.728832244873047, -11.01920223236084, -10.309572219848633, -9.599942207336426, -8.890312194824219, -8.180682182312012, -7.471052169799805, -6.761422157287598, -6.051792144775391, -5.342162132263184, -4.632532119750977, -3.9229021072387695, -3.2132720947265625, -2.5036420822143555, -1.7940120697021484, -1.0843820571899414, -0.3747520446777344, 0.33487796783447266, 1.0445079803466797, 1.7541379928588867, 2.4637680053710938, 3.173398017883301, 3.883028030395508, 4.592658042907715, 5.302288055419922, 6.011918067932129, 6.721548080444336, 7.431178092956543, 8.14080810546875, 8.850438117980957, 9.560068130493164, 10.269698143005371, 10.979328155517578, 11.688958168029785, 12.398588180541992, 13.1082181930542, 13.817848205566406, 14.527478218078613, 15.23710823059082, 15.946738243103027, 16.656368255615234, 17.365997314453125, 18.07562828063965, 18.785259246826172, 19.494888305664062]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 4.0, 5.0, 12.0, 10.0, 18.0, 19.0, 25.0, 22.0, 33.0, 37.0, 56.0, 45.0, 72.0, 53.0, 71.0, 64.0, 56.0, 62.0, 48.0, 62.0, 56.0, 40.0, 33.0, 30.0, 20.0, 16.0, 8.0, 8.0, 5.0, 6.0, 2.0, 4.0, 5.0, 0.0, 0.0, 2.0], "bins": [-3.736328125, -3.6497955322265625, -3.563262939453125, -3.4767303466796875, -3.39019775390625, -3.3036651611328125, -3.217132568359375, -3.1305999755859375, -3.0440673828125, -2.9575347900390625, -2.871002197265625, -2.7844696044921875, -2.69793701171875, -2.6114044189453125, -2.524871826171875, -2.4383392333984375, -2.351806640625, -2.2652740478515625, -2.178741455078125, -2.0922088623046875, -2.00567626953125, -1.9191436767578125, -1.832611083984375, -1.7460784912109375, -1.6595458984375, -1.5730133056640625, -1.486480712890625, -1.3999481201171875, -1.31341552734375, -1.2268829345703125, -1.140350341796875, -1.0538177490234375, -0.96728515625, -0.8807525634765625, -0.794219970703125, -0.7076873779296875, -0.62115478515625, -0.5346221923828125, -0.448089599609375, -0.3615570068359375, -0.2750244140625, -0.1884918212890625, -0.101959228515625, -0.0154266357421875, 0.07110595703125, 0.1576385498046875, 0.244171142578125, 0.3307037353515625, 0.417236328125, 0.5037689208984375, 0.590301513671875, 0.6768341064453125, 0.76336669921875, 0.8498992919921875, 0.936431884765625, 1.0229644775390625, 1.1094970703125, 1.1960296630859375, 1.282562255859375, 1.3690948486328125, 1.45562744140625, 1.5421600341796875, 1.628692626953125, 1.7152252197265625, 1.8017578125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 7.0, 3.0, 11.0, 11.0, 12.0, 11.0, 20.0, 35.0, 37.0, 55.0, 102.0, 213.0, 429.0, 777.0, 1460.0, 2843.0, 5659.0, 11488.0, 23987.0, 52751.0, 127213.0, 360338.0, 277276.0, 101336.0, 43218.0, 19756.0, 9440.0, 4781.0, 2517.0, 1275.0, 698.0, 344.0, 174.0, 95.0, 49.0, 24.0, 25.0, 15.0, 9.0, 10.0, 15.0, 7.0, 3.0, 6.0, 7.0, 4.0, 5.0, 1.0, 4.0, 2.0, 0.0, 2.0], "bins": [-0.027557373046875, -0.02674388885498047, -0.025930404663085938, -0.025116920471191406, -0.024303436279296875, -0.023489952087402344, -0.022676467895507812, -0.02186298370361328, -0.02104949951171875, -0.02023601531982422, -0.019422531127929688, -0.018609046936035156, -0.017795562744140625, -0.016982078552246094, -0.016168594360351562, -0.015355110168457031, -0.0145416259765625, -0.013728141784667969, -0.012914657592773438, -0.012101173400878906, -0.011287689208984375, -0.010474205017089844, -0.009660720825195312, -0.008847236633300781, -0.00803375244140625, -0.007220268249511719, -0.0064067840576171875, -0.005593299865722656, -0.004779815673828125, -0.003966331481933594, -0.0031528472900390625, -0.0023393630981445312, -0.00152587890625, -0.0007123947143554688, 0.0001010894775390625, 0.0009145736694335938, 0.001728057861328125, 0.0025415420532226562, 0.0033550262451171875, 0.004168510437011719, 0.00498199462890625, 0.005795478820800781, 0.0066089630126953125, 0.007422447204589844, 0.008235931396484375, 0.009049415588378906, 0.009862899780273438, 0.010676383972167969, 0.0114898681640625, 0.012303352355957031, 0.013116836547851562, 0.013930320739746094, 0.014743804931640625, 0.015557289123535156, 0.016370773315429688, 0.01718425750732422, 0.01799774169921875, 0.01881122589111328, 0.019624710083007812, 0.020438194274902344, 0.021251678466796875, 0.022065162658691406, 0.022878646850585938, 0.02369213104248047, 0.024505615234375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 6.0, 4.0, 7.0, 13.0, 7.0, 13.0, 14.0, 21.0, 18.0, 21.0, 24.0, 28.0, 25.0, 24.0, 34.0, 40.0, 29.0, 41.0, 41.0, 46.0, 1085.0, 44.0, 53.0, 37.0, 41.0, 41.0, 29.0, 35.0, 30.0, 40.0, 29.0, 23.0, 19.0, 11.0, 13.0, 11.0, 7.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7021484375, -1.6480865478515625, -1.594024658203125, -1.5399627685546875, -1.48590087890625, -1.4318389892578125, -1.377777099609375, -1.3237152099609375, -1.2696533203125, -1.2155914306640625, -1.161529541015625, -1.1074676513671875, -1.05340576171875, -0.9993438720703125, -0.945281982421875, -0.8912200927734375, -0.837158203125, -0.7830963134765625, -0.729034423828125, -0.6749725341796875, -0.62091064453125, -0.5668487548828125, -0.512786865234375, -0.4587249755859375, -0.4046630859375, -0.3506011962890625, -0.296539306640625, -0.2424774169921875, -0.18841552734375, -0.1343536376953125, -0.080291748046875, -0.0262298583984375, 0.02783203125, 0.0818939208984375, 0.135955810546875, 0.1900177001953125, 0.24407958984375, 0.2981414794921875, 0.352203369140625, 0.4062652587890625, 0.4603271484375, 0.5143890380859375, 0.568450927734375, 0.6225128173828125, 0.67657470703125, 0.7306365966796875, 0.784698486328125, 0.8387603759765625, 0.892822265625, 0.9468841552734375, 1.000946044921875, 1.0550079345703125, 1.10906982421875, 1.1631317138671875, 1.217193603515625, 1.2712554931640625, 1.3253173828125, 1.3793792724609375, 1.433441162109375, 1.4875030517578125, 1.54156494140625, 1.5956268310546875, 1.649688720703125, 1.7037506103515625, 1.7578125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 6.0, 15.0, 21.0, 36.0, 38.0, 56.0, 71.0, 102.0, 160.0, 284.0, 415.0, 536.0, 876.0, 1339.0, 1934.0, 3010.0, 4578.0, 7278.0, 11484.0, 17901.0, 28492.0, 46532.0, 76664.0, 130806.0, 1264656.0, 199455.0, 116468.0, 69290.0, 42481.0, 25956.0, 16593.0, 10429.0, 6649.0, 4250.0, 2825.0, 1848.0, 1115.0, 846.0, 538.0, 351.0, 235.0, 162.0, 109.0, 89.0, 48.0, 33.0, 28.0, 17.0, 12.0, 8.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.0061798095703125, -0.0059860944747924805, -0.005792379379272461, -0.005598664283752441, -0.005404949188232422, -0.005211234092712402, -0.005017518997192383, -0.004823803901672363, -0.004630088806152344, -0.004436373710632324, -0.004242658615112305, -0.004048943519592285, -0.0038552284240722656, -0.003661513328552246, -0.0034677982330322266, -0.003274083137512207, -0.0030803680419921875, -0.002886652946472168, -0.0026929378509521484, -0.002499222755432129, -0.0023055076599121094, -0.00211179256439209, -0.0019180774688720703, -0.0017243623733520508, -0.0015306472778320312, -0.0013369321823120117, -0.0011432170867919922, -0.0009495019912719727, -0.0007557868957519531, -0.0005620718002319336, -0.00036835670471191406, -0.00017464160919189453, 1.9073486328125e-05, 0.00021278858184814453, 0.00040650367736816406, 0.0006002187728881836, 0.0007939338684082031, 0.0009876489639282227, 0.0011813640594482422, 0.0013750791549682617, 0.0015687942504882812, 0.0017625093460083008, 0.0019562244415283203, 0.00214993953704834, 0.0023436546325683594, 0.002537369728088379, 0.0027310848236083984, 0.002924799919128418, 0.0031185150146484375, 0.003312230110168457, 0.0035059452056884766, 0.003699660301208496, 0.0038933753967285156, 0.004087090492248535, 0.004280805587768555, 0.004474520683288574, 0.004668235778808594, 0.004861950874328613, 0.005055665969848633, 0.005249381065368652, 0.005443096160888672, 0.005636811256408691, 0.005830526351928711, 0.0060242414474487305, 0.00621795654296875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 6.0, 0.0, 0.0, 10.0, 0.0, 0.0, 14.0, 0.0, 0.0, 31.0, 0.0, 0.0, 39.0, 0.0, 0.0, 60.0, 0.0, 145.0, 0.0, 0.0, 388.0, 0.0, 0.0, 156.0, 0.0, 0.0, 81.0, 0.0, 0.0, 38.0, 0.0, 0.0, 27.0, 0.0, 0.0, 11.0, 0.0, 0.0, 9.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.748603820800781e-07, -7.543712854385376e-07, -7.338821887969971e-07, -7.133930921554565e-07, -6.92903995513916e-07, -6.724148988723755e-07, -6.51925802230835e-07, -6.314367055892944e-07, -6.109476089477539e-07, -5.904585123062134e-07, -5.699694156646729e-07, -5.494803190231323e-07, -5.289912223815918e-07, -5.085021257400513e-07, -4.880130290985107e-07, -4.675239324569702e-07, -4.470348358154297e-07, -4.2654573917388916e-07, -4.0605664253234863e-07, -3.855675458908081e-07, -3.650784492492676e-07, -3.4458935260772705e-07, -3.241002559661865e-07, -3.03611159324646e-07, -2.8312206268310547e-07, -2.6263296604156494e-07, -2.421438694000244e-07, -2.2165477275848389e-07, -2.0116567611694336e-07, -1.8067657947540283e-07, -1.601874828338623e-07, -1.3969838619232178e-07, -1.1920928955078125e-07, -9.872019290924072e-08, -7.82310962677002e-08, -5.774199962615967e-08, -3.725290298461914e-08, -1.6763806343078613e-08, 3.725290298461914e-09, 2.421438694000244e-08, 4.470348358154297e-08, 6.51925802230835e-08, 8.568167686462402e-08, 1.0617077350616455e-07, 1.2665987014770508e-07, 1.471489667892456e-07, 1.6763806343078613e-07, 1.8812716007232666e-07, 2.086162567138672e-07, 2.2910535335540771e-07, 2.4959444999694824e-07, 2.7008354663848877e-07, 2.905726432800293e-07, 3.110617399215698e-07, 3.3155083656311035e-07, 3.520399332046509e-07, 3.725290298461914e-07, 3.9301812648773193e-07, 4.1350722312927246e-07, 4.33996319770813e-07, 4.544854164123535e-07, 4.7497451305389404e-07, 4.954636096954346e-07, 5.159527063369751e-07, 5.364418029785156e-07]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 10.0, 20.0, 14.0, 22.0, 11.0, 26.0, 33.0, 25.0, 35.0, 74.0, 40.0, 129.0, 96.0, 119.0, 479.0, 3769.0, 977561.0, 64696.0, 552.0, 275.0, 71.0, 135.0, 53.0, 48.0, 71.0, 37.0, 34.0, 18.0, 22.0, 21.0, 13.0, 12.0, 8.0, 3.0, 6.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.233816146850586e-05, -1.194886863231659e-05, -1.155957579612732e-05, -1.117028295993805e-05, -1.078099012374878e-05, -1.039169728755951e-05, -1.000240445137024e-05, -9.61311161518097e-06, -9.2238187789917e-06, -8.83452594280243e-06, -8.44523310661316e-06, -8.05594027042389e-06, -7.666647434234619e-06, -7.277354598045349e-06, -6.888061761856079e-06, -6.498768925666809e-06, -6.109476089477539e-06, -5.720183253288269e-06, -5.330890417098999e-06, -4.941597580909729e-06, -4.552304744720459e-06, -4.163011908531189e-06, -3.773719072341919e-06, -3.384426236152649e-06, -2.995133399963379e-06, -2.605840563774109e-06, -2.216547727584839e-06, -1.8272548913955688e-06, -1.4379620552062988e-06, -1.0486692190170288e-06, -6.593763828277588e-07, -2.7008354663848877e-07, 1.1920928955078125e-07, 5.085021257400513e-07, 8.977949619293213e-07, 1.2870877981185913e-06, 1.6763806343078613e-06, 2.0656734704971313e-06, 2.4549663066864014e-06, 2.8442591428756714e-06, 3.2335519790649414e-06, 3.6228448152542114e-06, 4.0121376514434814e-06, 4.4014304876327515e-06, 4.7907233238220215e-06, 5.1800161600112915e-06, 5.5693089962005615e-06, 5.9586018323898315e-06, 6.3478946685791016e-06, 6.737187504768372e-06, 7.126480340957642e-06, 7.515773177146912e-06, 7.905066013336182e-06, 8.294358849525452e-06, 8.683651685714722e-06, 9.072944521903992e-06, 9.462237358093262e-06, 9.851530194282532e-06, 1.0240823030471802e-05, 1.0630115866661072e-05, 1.1019408702850342e-05, 1.1408701539039612e-05, 1.1797994375228882e-05, 1.2187287211418152e-05, 1.2576580047607422e-05]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 51.0, 289.0, 594.0, 73.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0107694379257737e-06, -9.478548577135371e-07, -8.849402775013004e-07, -8.220257541324827e-07, -7.591111739202461e-07, -6.961965937080095e-07, -6.332820703391917e-07, -5.703674901269551e-07, -5.074529099147185e-07, -4.4453832970248186e-07, -3.816237779119547e-07, -3.187092261214275e-07, -2.557946459091909e-07, -1.9288006569695426e-07, -1.2996551390642708e-07, -6.705096211589989e-08, -4.136381903663278e-09, 5.877818409771862e-08, 1.2169275009910052e-07, 1.8460731610048242e-07, 2.475218821018643e-07, 3.1043646231410094e-07, 3.733510141046281e-07, 4.362655658951553e-07, 4.991801461073919e-07, 5.620947263196285e-07, 6.250093065318651e-07, 6.879238299006829e-07, 7.508384101129195e-07, 8.137529903251561e-07, 8.766675136939739e-07, 9.395820939062105e-07, 1.0024969014921226e-06, 1.0654114248609403e-06, 1.1283260619165958e-06, 1.1912405852854135e-06, 1.254155222341069e-06, 1.3170697457098868e-06, 1.3799842690787045e-06, 1.4428987924475223e-06, 1.5058134295031778e-06, 1.5687279528719955e-06, 1.631642589927651e-06, 1.6945571132964687e-06, 1.7574716366652865e-06, 1.820386273720942e-06, 1.8833007970897597e-06, 1.946215434145415e-06, 2.009129957514233e-06, 2.0720444808830507e-06, 2.1349590042518685e-06, 2.1978737549943617e-06, 2.2607882783631794e-06, 2.323702801731997e-06, 2.386617325100815e-06, 2.4495318484696327e-06, 2.5124463718384504e-06, 2.575360895207268e-06, 2.638275418576086e-06, 2.701190169318579e-06, 2.764104692687397e-06, 2.8270192160562146e-06, 2.8899337394250324e-06, 2.95284826279385e-06, 3.0157630135363434e-06]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 12.0, 0.0, 0.0, 0.0, 0.0, 22.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.0, 0.0, 0.0, 0.0, 0.0, 179.0, 0.0, 0.0, 0.0, 0.0, 376.0, 0.0, 0.0, 0.0, 0.0, 0.0, 220.0, 0.0, 0.0, 0.0, 0.0, 79.0, 0.0, 0.0, 0.0, 0.0, 34.0, 0.0, 0.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.980232238769531e-07, -2.868473529815674e-07, -2.7567148208618164e-07, -2.644956111907959e-07, -2.5331974029541016e-07, -2.421438694000244e-07, -2.3096799850463867e-07, -2.1979212760925293e-07, -2.086162567138672e-07, -1.9744038581848145e-07, -1.862645149230957e-07, -1.7508864402770996e-07, -1.6391277313232422e-07, -1.5273690223693848e-07, -1.4156103134155273e-07, -1.30385160446167e-07, -1.1920928955078125e-07, -1.0803341865539551e-07, -9.685754776000977e-08, -8.568167686462402e-08, -7.450580596923828e-08, -6.332993507385254e-08, -5.21540641784668e-08, -4.0978193283081055e-08, -2.9802322387695312e-08, -1.862645149230957e-08, -7.450580596923828e-09, 3.725290298461914e-09, 1.4901161193847656e-08, 2.60770320892334e-08, 3.725290298461914e-08, 4.842877388000488e-08, 5.960464477539063e-08, 7.078051567077637e-08, 8.195638656616211e-08, 9.313225746154785e-08, 1.043081283569336e-07, 1.1548399925231934e-07, 1.2665987014770508e-07, 1.3783574104309082e-07, 1.4901161193847656e-07, 1.601874828338623e-07, 1.7136335372924805e-07, 1.825392246246338e-07, 1.9371509552001953e-07, 2.0489096641540527e-07, 2.1606683731079102e-07, 2.2724270820617676e-07, 2.384185791015625e-07, 2.4959444999694824e-07, 2.60770320892334e-07, 2.7194619178771973e-07, 2.8312206268310547e-07, 2.942979335784912e-07, 3.0547380447387695e-07, 3.166496753692627e-07, 3.2782554626464844e-07, 3.390014171600342e-07, 3.501772880554199e-07, 3.6135315895080566e-07, 3.725290298461914e-07, 3.8370490074157715e-07, 3.948807716369629e-07, 4.0605664253234863e-07, 4.172325134277344e-07]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 4.0, 5.0, 12.0, 10.0, 18.0, 19.0, 25.0, 22.0, 33.0, 37.0, 56.0, 45.0, 72.0, 53.0, 71.0, 64.0, 56.0, 62.0, 48.0, 62.0, 56.0, 40.0, 33.0, 30.0, 20.0, 16.0, 8.0, 8.0, 5.0, 6.0, 2.0, 4.0, 5.0, 0.0, 0.0, 2.0], "bins": [-3.736328125, -3.6497955322265625, -3.563262939453125, -3.4767303466796875, -3.39019775390625, -3.3036651611328125, -3.217132568359375, -3.1305999755859375, -3.0440673828125, -2.9575347900390625, -2.871002197265625, -2.7844696044921875, -2.69793701171875, -2.6114044189453125, -2.524871826171875, -2.4383392333984375, -2.351806640625, -2.2652740478515625, -2.178741455078125, -2.0922088623046875, -2.00567626953125, -1.9191436767578125, -1.832611083984375, -1.7460784912109375, -1.6595458984375, -1.5730133056640625, -1.486480712890625, -1.3999481201171875, -1.31341552734375, -1.2268829345703125, -1.140350341796875, -1.0538177490234375, -0.96728515625, -0.8807525634765625, -0.794219970703125, -0.7076873779296875, -0.62115478515625, -0.5346221923828125, -0.448089599609375, -0.3615570068359375, -0.2750244140625, -0.1884918212890625, -0.101959228515625, -0.0154266357421875, 0.07110595703125, 0.1576385498046875, 0.244171142578125, 0.3307037353515625, 0.417236328125, 0.5037689208984375, 0.590301513671875, 0.6768341064453125, 0.76336669921875, 0.8498992919921875, 0.936431884765625, 1.0229644775390625, 1.1094970703125, 1.1960296630859375, 1.282562255859375, 1.3690948486328125, 1.45562744140625, 1.5421600341796875, 1.628692626953125, 1.7152252197265625, 1.8017578125]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 8.0, 12.0, 26.0, 36.0, 53.0, 91.0, 136.0, 271.0, 490.0, 945.0, 1790.0, 3532.0, 7688.0, 18684.0, 54566.0, 240565.0, 559026.0, 106590.0, 31270.0, 12226.0, 5224.0, 2560.0, 1254.0, 646.0, 383.0, 186.0, 125.0, 70.0, 50.0, 22.0, 14.0, 8.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.236328125, -3.14453125, -3.052734375, -2.9609375, -2.869140625, -2.77734375, -2.685546875, -2.59375, -2.501953125, -2.41015625, -2.318359375, -2.2265625, -2.134765625, -2.04296875, -1.951171875, -1.859375, -1.767578125, -1.67578125, -1.583984375, -1.4921875, -1.400390625, -1.30859375, -1.216796875, -1.125, -1.033203125, -0.94140625, -0.849609375, -0.7578125, -0.666015625, -0.57421875, -0.482421875, -0.390625, -0.298828125, -0.20703125, -0.115234375, -0.0234375, 0.068359375, 0.16015625, 0.251953125, 0.34375, 0.435546875, 0.52734375, 0.619140625, 0.7109375, 0.802734375, 0.89453125, 0.986328125, 1.078125, 1.169921875, 1.26171875, 1.353515625, 1.4453125, 1.537109375, 1.62890625, 1.720703125, 1.8125, 1.904296875, 1.99609375, 2.087890625, 2.1796875, 2.271484375, 2.36328125, 2.455078125, 2.546875, 2.638671875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 10.0, 7.0, 7.0, 6.0, 12.0, 10.0, 9.0, 12.0, 16.0, 21.0, 17.0, 19.0, 23.0, 23.0, 31.0, 27.0, 39.0, 31.0, 53.0, 49.0, 84.0, 222.0, 1664.0, 156.0, 71.0, 54.0, 43.0, 31.0, 40.0, 35.0, 29.0, 23.0, 25.0, 26.0, 18.0, 20.0, 14.0, 13.0, 12.0, 8.0, 8.0, 7.0, 8.0, 4.0, 3.0, 4.0, 2.0, 2.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-5.81640625, -5.63092041015625, -5.4454345703125, -5.25994873046875, -5.074462890625, -4.88897705078125, -4.7034912109375, -4.51800537109375, -4.33251953125, -4.14703369140625, -3.9615478515625, -3.77606201171875, -3.590576171875, -3.40509033203125, -3.2196044921875, -3.03411865234375, -2.8486328125, -2.66314697265625, -2.4776611328125, -2.29217529296875, -2.106689453125, -1.92120361328125, -1.7357177734375, -1.55023193359375, -1.36474609375, -1.17926025390625, -0.9937744140625, -0.80828857421875, -0.622802734375, -0.43731689453125, -0.2518310546875, -0.06634521484375, 0.119140625, 0.30462646484375, 0.4901123046875, 0.67559814453125, 0.861083984375, 1.04656982421875, 1.2320556640625, 1.41754150390625, 1.60302734375, 1.78851318359375, 1.9739990234375, 2.15948486328125, 2.344970703125, 2.53045654296875, 2.7159423828125, 2.90142822265625, 3.0869140625, 3.27239990234375, 3.4578857421875, 3.64337158203125, 3.828857421875, 4.01434326171875, 4.1998291015625, 4.38531494140625, 4.57080078125, 4.75628662109375, 4.9417724609375, 5.12725830078125, 5.312744140625, 5.49822998046875, 5.6837158203125, 5.86920166015625, 6.0546875]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 5.0, 1.0, 2.0, 1.0, 7.0, 1.0, 7.0, 8.0, 7.0, 3.0, 9.0, 18.0, 13.0, 20.0, 18.0, 28.0, 31.0, 26.0, 50.0, 45.0, 80.0, 111.0, 206.0, 344.0, 858.0, 5916.0, 533397.0, 2592067.0, 10384.0, 1002.0, 379.0, 194.0, 124.0, 67.0, 53.0, 40.0, 26.0, 31.0, 17.0, 17.0, 22.0, 18.0, 12.0, 10.0, 9.0, 7.0, 2.0, 5.0, 13.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.796875, -11.4173583984375, -11.037841796875, -10.6583251953125, -10.27880859375, -9.8992919921875, -9.519775390625, -9.1402587890625, -8.7607421875, -8.3812255859375, -8.001708984375, -7.6221923828125, -7.24267578125, -6.8631591796875, -6.483642578125, -6.1041259765625, -5.724609375, -5.3450927734375, -4.965576171875, -4.5860595703125, -4.20654296875, -3.8270263671875, -3.447509765625, -3.0679931640625, -2.6884765625, -2.3089599609375, -1.929443359375, -1.5499267578125, -1.17041015625, -0.7908935546875, -0.411376953125, -0.0318603515625, 0.34765625, 0.7271728515625, 1.106689453125, 1.4862060546875, 1.86572265625, 2.2452392578125, 2.624755859375, 3.0042724609375, 3.3837890625, 3.7633056640625, 4.142822265625, 4.5223388671875, 4.90185546875, 5.2813720703125, 5.660888671875, 6.0404052734375, 6.419921875, 6.7994384765625, 7.178955078125, 7.5584716796875, 7.93798828125, 8.3175048828125, 8.697021484375, 9.0765380859375, 9.4560546875, 9.8355712890625, 10.215087890625, 10.5946044921875, 10.97412109375, 11.3536376953125, 11.733154296875, 12.1126708984375, 12.4921875]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 8.0, 1011.0], "bins": [-361.3667907714844, -355.6764831542969, -349.9861755371094, -344.29583740234375, -338.60552978515625, -332.91522216796875, -327.22491455078125, -321.53460693359375, -315.84429931640625, -310.15399169921875, -304.46368408203125, -298.77337646484375, -293.0830383300781, -287.3927307128906, -281.7024230957031, -276.0121154785156, -270.32177734375, -264.6314697265625, -258.941162109375, -253.25083923339844, -247.56053161621094, -241.87020874023438, -236.17990112304688, -230.48959350585938, -224.79928588867188, -219.10897827148438, -213.4186553955078, -207.7283477783203, -202.0380401611328, -196.34771728515625, -190.65740966796875, -184.96710205078125, -179.27679443359375, -173.58648681640625, -167.8961639404297, -162.2058563232422, -156.5155487060547, -150.82522583007812, -145.13491821289062, -139.44461059570312, -133.75428771972656, -128.06398010253906, -122.37366485595703, -116.683349609375, -110.9930419921875, -105.30272674560547, -99.61241149902344, -93.92210388183594, -88.2317886352539, -82.54147338867188, -76.85116577148438, -71.16085052490234, -65.47053527832031, -59.78022766113281, -54.08991241455078, -48.399600982666016, -42.70928955078125, -37.018978118896484, -31.328664779663086, -25.638351440429688, -19.948040008544922, -14.257728576660156, -8.567413330078125, -2.8771018981933594, 2.813208818435669]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 5.0, 3.0, 7.0, 12.0, 9.0, 9.0, 10.0, 10.0, 14.0, 20.0, 34.0, 24.0, 16.0, 29.0, 28.0, 28.0, 47.0, 39.0, 41.0, 24.0, 33.0, 42.0, 39.0, 49.0, 51.0, 28.0, 32.0, 40.0, 35.0, 26.0, 28.0, 24.0, 11.0, 24.0, 17.0, 21.0, 24.0, 14.0, 4.0, 14.0, 5.0, 3.0, 6.0, 4.0, 4.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-22.755081176757812, -22.09783363342285, -21.44058609008789, -20.783340454101562, -20.1260929107666, -19.46884536743164, -18.81159782409668, -18.15435028076172, -17.497102737426758, -16.839855194091797, -16.182607650756836, -15.525361061096191, -14.86811351776123, -14.210866928100586, -13.553619384765625, -12.896371841430664, -12.23912525177002, -11.581877708435059, -10.924631118774414, -10.267383575439453, -9.610136032104492, -8.952888488769531, -8.295641899108887, -7.638394355773926, -6.981147289276123, -6.32390022277832, -5.666652679443359, -5.009405612945557, -4.352158546447754, -3.694911003112793, -3.0376639366149902, -2.3804163932800293, -1.7231693267822266, -1.0659220218658447, -0.40867483615875244, 0.24857234954833984, 0.9058196544647217, 1.5630669593811035, 2.2203140258789062, 2.877561569213867, 3.53480863571167, 4.192055702209473, 4.849303245544434, 5.506550312042236, 6.163797378540039, 6.821044921875, 7.478291988372803, 8.135540008544922, 8.792786598205566, 9.450034141540527, 10.107280731201172, 10.764528274536133, 11.421775817871094, 12.079023361206055, 12.7362699508667, 13.39351749420166, 14.050764083862305, 14.708011627197266, 15.36525821685791, 16.022506713867188, 16.679752349853516, 17.336999893188477, 17.994247436523438, 18.6514949798584, 19.30874252319336]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 1.0, 5.0, 3.0, 3.0, 15.0, 10.0, 23.0, 14.0, 29.0, 20.0, 31.0, 40.0, 48.0, 52.0, 59.0, 66.0, 67.0, 65.0, 54.0, 57.0, 47.0, 71.0, 45.0, 42.0, 43.0, 26.0, 19.0, 16.0, 8.0, 10.0, 6.0, 4.0, 4.0, 5.0, 2.0, 3.0, 0.0, 2.0], "bins": [-3.74609375, -3.6594696044921875, -3.572845458984375, -3.4862213134765625, -3.39959716796875, -3.3129730224609375, -3.226348876953125, -3.1397247314453125, -3.0531005859375, -2.9664764404296875, -2.879852294921875, -2.7932281494140625, -2.70660400390625, -2.6199798583984375, -2.533355712890625, -2.4467315673828125, -2.360107421875, -2.2734832763671875, -2.186859130859375, -2.1002349853515625, -2.01361083984375, -1.9269866943359375, -1.840362548828125, -1.7537384033203125, -1.6671142578125, -1.5804901123046875, -1.493865966796875, -1.4072418212890625, -1.32061767578125, -1.2339935302734375, -1.147369384765625, -1.0607452392578125, -0.97412109375, -0.8874969482421875, -0.800872802734375, -0.7142486572265625, -0.62762451171875, -0.5410003662109375, -0.454376220703125, -0.3677520751953125, -0.2811279296875, -0.1945037841796875, -0.107879638671875, -0.0212554931640625, 0.06536865234375, 0.1519927978515625, 0.238616943359375, 0.3252410888671875, 0.411865234375, 0.4984893798828125, 0.585113525390625, 0.6717376708984375, 0.75836181640625, 0.8449859619140625, 0.931610107421875, 1.0182342529296875, 1.1048583984375, 1.1914825439453125, 1.278106689453125, 1.3647308349609375, 1.45135498046875, 1.5379791259765625, 1.624603271484375, 1.7112274169921875, 1.7978515625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 2.0, 7.0, 9.0, 25.0, 21.0, 36.0, 42.0, 56.0, 85.0, 157.0, 319.0, 796.0, 3442.0, 66607.0, 3872211.0, 241569.0, 6868.0, 1168.0, 366.0, 175.0, 114.0, 61.0, 37.0, 32.0, 32.0, 19.0, 5.0, 6.0, 3.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-28.34375, -27.6943359375, -27.044921875, -26.3955078125, -25.74609375, -25.0966796875, -24.447265625, -23.7978515625, -23.1484375, -22.4990234375, -21.849609375, -21.2001953125, -20.55078125, -19.9013671875, -19.251953125, -18.6025390625, -17.953125, -17.3037109375, -16.654296875, -16.0048828125, -15.35546875, -14.7060546875, -14.056640625, -13.4072265625, -12.7578125, -12.1083984375, -11.458984375, -10.8095703125, -10.16015625, -9.5107421875, -8.861328125, -8.2119140625, -7.5625, -6.9130859375, -6.263671875, -5.6142578125, -4.96484375, -4.3154296875, -3.666015625, -3.0166015625, -2.3671875, -1.7177734375, -1.068359375, -0.4189453125, 0.23046875, 0.8798828125, 1.529296875, 2.1787109375, 2.828125, 3.4775390625, 4.126953125, 4.7763671875, 5.42578125, 6.0751953125, 6.724609375, 7.3740234375, 8.0234375, 8.6728515625, 9.322265625, 9.9716796875, 10.62109375, 11.2705078125, 11.919921875, 12.5693359375, 13.21875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 9.0, 18.0, 25.0, 44.0, 103.0, 178.0, 271.0, 462.0, 730.0, 822.0, 573.0, 391.0, 204.0, 98.0, 57.0, 30.0, 27.0, 14.0, 8.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.28125, -9.9029541015625, -9.524658203125, -9.1463623046875, -8.76806640625, -8.3897705078125, -8.011474609375, -7.6331787109375, -7.2548828125, -6.8765869140625, -6.498291015625, -6.1199951171875, -5.74169921875, -5.3634033203125, -4.985107421875, -4.6068115234375, -4.228515625, -3.8502197265625, -3.471923828125, -3.0936279296875, -2.71533203125, -2.3370361328125, -1.958740234375, -1.5804443359375, -1.2021484375, -0.8238525390625, -0.445556640625, -0.0672607421875, 0.31103515625, 0.6893310546875, 1.067626953125, 1.4459228515625, 1.82421875, 2.2025146484375, 2.580810546875, 2.9591064453125, 3.33740234375, 3.7156982421875, 4.093994140625, 4.4722900390625, 4.8505859375, 5.2288818359375, 5.607177734375, 5.9854736328125, 6.36376953125, 6.7420654296875, 7.120361328125, 7.4986572265625, 7.876953125, 8.2552490234375, 8.633544921875, 9.0118408203125, 9.39013671875, 9.7684326171875, 10.146728515625, 10.5250244140625, 10.9033203125, 11.2816162109375, 11.659912109375, 12.0382080078125, 12.41650390625, 12.7947998046875, 13.173095703125, 13.5513916015625, 13.9296875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 15.0, 8.0, 9.0, 23.0, 20.0, 32.0, 58.0, 66.0, 86.0, 143.0, 224.0, 370.0, 721.0, 1581.0, 5462.0, 43604.0, 891865.0, 3080171.0, 152690.0, 12379.0, 2499.0, 956.0, 469.0, 261.0, 163.0, 120.0, 83.0, 56.0, 43.0, 25.0, 28.0, 19.0, 14.0, 7.0, 1.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.953125, -20.322509765625, -19.69189453125, -19.061279296875, -18.4306640625, -17.800048828125, -17.16943359375, -16.538818359375, -15.908203125, -15.277587890625, -14.64697265625, -14.016357421875, -13.3857421875, -12.755126953125, -12.12451171875, -11.493896484375, -10.86328125, -10.232666015625, -9.60205078125, -8.971435546875, -8.3408203125, -7.710205078125, -7.07958984375, -6.448974609375, -5.818359375, -5.187744140625, -4.55712890625, -3.926513671875, -3.2958984375, -2.665283203125, -2.03466796875, -1.404052734375, -0.7734375, -0.142822265625, 0.48779296875, 1.118408203125, 1.7490234375, 2.379638671875, 3.01025390625, 3.640869140625, 4.271484375, 4.902099609375, 5.53271484375, 6.163330078125, 6.7939453125, 7.424560546875, 8.05517578125, 8.685791015625, 9.31640625, 9.947021484375, 10.57763671875, 11.208251953125, 11.8388671875, 12.469482421875, 13.10009765625, 13.730712890625, 14.361328125, 14.991943359375, 15.62255859375, 16.253173828125, 16.8837890625, 17.514404296875, 18.14501953125, 18.775634765625, 19.40625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 23.0, 72.0, 180.0, 280.0, 259.0, 139.0, 45.0, 9.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.13874053955078, -64.05313110351562, -60.9675178527832, -57.88190460205078, -54.796295166015625, -51.7106819152832, -48.62506866455078, -45.539459228515625, -42.4538459777832, -39.36823272705078, -36.282623291015625, -33.1970100402832, -30.111398696899414, -27.025787353515625, -23.940174102783203, -20.854562759399414, -17.768951416015625, -14.683340072631836, -11.59772777557373, -8.512115478515625, -5.426504135131836, -2.340892791748047, 0.744720458984375, 3.830331802368164, 6.915943145751953, 10.001554489135742, 13.087166786193848, 16.172779083251953, 19.258390426635742, 22.34400177001953, 25.429615020751953, 28.515226364135742, 31.600845336914062, 34.686458587646484, 37.77206802368164, 40.85768127441406, 43.94329071044922, 47.02890396118164, 50.11451721191406, 53.20012664794922, 56.28573989868164, 59.37135314941406, 62.45696258544922, 65.54257202148438, 68.62818908691406, 71.71379852294922, 74.79940795898438, 77.88502502441406, 80.97063446044922, 84.05624389648438, 87.14186096191406, 90.22747039794922, 93.31307983398438, 96.39869689941406, 99.48430633544922, 102.56991577148438, 105.65553283691406, 108.74114227294922, 111.8267593383789, 114.91236877441406, 117.99797821044922, 121.08358764648438, 124.16920471191406, 127.25481414794922, 130.34042358398438]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 6.0, 7.0, 11.0, 13.0, 14.0, 9.0, 8.0, 7.0, 19.0, 22.0, 22.0, 27.0, 19.0, 30.0, 27.0, 25.0, 34.0, 31.0, 32.0, 30.0, 44.0, 44.0, 41.0, 38.0, 35.0, 39.0, 35.0, 23.0, 33.0, 29.0, 31.0, 33.0, 10.0, 32.0, 15.0, 18.0, 14.0, 18.0, 14.0, 14.0, 7.0, 7.0, 8.0, 5.0, 4.0, 7.0, 3.0, 1.0, 3.0, 0.0, 3.0], "bins": [-23.70941162109375, -23.038780212402344, -22.36815071105957, -21.697519302368164, -21.026887893676758, -20.356258392333984, -19.685626983642578, -19.014995574951172, -18.344364166259766, -17.67373275756836, -17.003103256225586, -16.33247184753418, -15.661840438842773, -14.991209983825684, -14.320579528808594, -13.649948120117188, -12.979318618774414, -12.308688163757324, -11.638056755065918, -10.967426300048828, -10.296794891357422, -9.626164436340332, -8.955533981323242, -8.284902572631836, -7.614272117614746, -6.943641185760498, -6.27301025390625, -5.60237979888916, -4.931748867034912, -4.261117935180664, -3.590487480163574, -2.919856548309326, -2.249225616455078, -1.5785948038101196, -0.9079639911651611, -0.2373332977294922, 0.43329763412475586, 1.103928565979004, 1.7745590209960938, 2.445189952850342, 3.11582088470459, 3.786451816558838, 4.457082748413086, 5.127713203430176, 5.798344135284424, 6.468975067138672, 7.139605522155762, 7.81023645401001, 8.480867385864258, 9.151497840881348, 9.822129249572754, 10.492759704589844, 11.16339111328125, 11.83402156829834, 12.50465202331543, 13.175283432006836, 13.845913887023926, 14.516544342041016, 15.187175750732422, 15.857806205749512, 16.5284366607666, 17.199068069458008, 17.86969757080078, 18.540328979492188, 19.210960388183594]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 10.0, 6.0, 15.0, 13.0, 14.0, 35.0, 20.0, 24.0, 38.0, 47.0, 51.0, 50.0, 61.0, 71.0, 61.0, 62.0, 57.0, 57.0, 43.0, 46.0, 45.0, 39.0, 30.0, 30.0, 17.0, 19.0, 12.0, 8.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 4.0], "bins": [-3.72265625, -3.6373138427734375, -3.551971435546875, -3.4666290283203125, -3.38128662109375, -3.2959442138671875, -3.210601806640625, -3.1252593994140625, -3.0399169921875, -2.9545745849609375, -2.869232177734375, -2.7838897705078125, -2.69854736328125, -2.6132049560546875, -2.527862548828125, -2.4425201416015625, -2.357177734375, -2.2718353271484375, -2.186492919921875, -2.1011505126953125, -2.01580810546875, -1.9304656982421875, -1.845123291015625, -1.7597808837890625, -1.6744384765625, -1.5890960693359375, -1.503753662109375, -1.4184112548828125, -1.33306884765625, -1.2477264404296875, -1.162384033203125, -1.0770416259765625, -0.99169921875, -0.9063568115234375, -0.821014404296875, -0.7356719970703125, -0.65032958984375, -0.5649871826171875, -0.479644775390625, -0.3943023681640625, -0.3089599609375, -0.2236175537109375, -0.138275146484375, -0.0529327392578125, 0.03240966796875, 0.1177520751953125, 0.203094482421875, 0.2884368896484375, 0.373779296875, 0.4591217041015625, 0.544464111328125, 0.6298065185546875, 0.71514892578125, 0.8004913330078125, 0.885833740234375, 0.9711761474609375, 1.0565185546875, 1.1418609619140625, 1.227203369140625, 1.3125457763671875, 1.39788818359375, 1.4832305908203125, 1.568572998046875, 1.6539154052734375, 1.7392578125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 8.0, 6.0, 3.0, 7.0, 5.0, 16.0, 24.0, 32.0, 35.0, 79.0, 169.0, 228.0, 505.0, 989.0, 1951.0, 4191.0, 8994.0, 20010.0, 46774.0, 120663.0, 392351.0, 290792.0, 92919.0, 37680.0, 15978.0, 7243.0, 3423.0, 1696.0, 798.0, 445.0, 240.0, 114.0, 61.0, 40.0, 21.0, 13.0, 10.0, 16.0, 9.0, 2.0, 7.0, 3.0, 3.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.033721923828125, -0.03278183937072754, -0.03184175491333008, -0.030901670455932617, -0.029961585998535156, -0.029021501541137695, -0.028081417083740234, -0.027141332626342773, -0.026201248168945312, -0.02526116371154785, -0.02432107925415039, -0.02338099479675293, -0.02244091033935547, -0.021500825881958008, -0.020560741424560547, -0.019620656967163086, -0.018680572509765625, -0.017740488052368164, -0.016800403594970703, -0.015860319137573242, -0.014920234680175781, -0.01398015022277832, -0.01304006576538086, -0.012099981307983398, -0.011159896850585938, -0.010219812393188477, -0.009279727935791016, -0.008339643478393555, -0.007399559020996094, -0.006459474563598633, -0.005519390106201172, -0.004579305648803711, -0.00363922119140625, -0.002699136734008789, -0.0017590522766113281, -0.0008189678192138672, 0.00012111663818359375, 0.0010612010955810547, 0.0020012855529785156, 0.0029413700103759766, 0.0038814544677734375, 0.0048215389251708984, 0.005761623382568359, 0.00670170783996582, 0.007641792297363281, 0.008581876754760742, 0.009521961212158203, 0.010462045669555664, 0.011402130126953125, 0.012342214584350586, 0.013282299041748047, 0.014222383499145508, 0.015162467956542969, 0.01610255241394043, 0.01704263687133789, 0.01798272132873535, 0.018922805786132812, 0.019862890243530273, 0.020802974700927734, 0.021743059158325195, 0.022683143615722656, 0.023623228073120117, 0.024563312530517578, 0.02550339698791504, 0.0264434814453125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 5.0, 8.0, 4.0, 5.0, 11.0, 13.0, 11.0, 21.0, 22.0, 19.0, 26.0, 26.0, 24.0, 35.0, 24.0, 34.0, 43.0, 42.0, 49.0, 43.0, 1079.0, 28.0, 41.0, 44.0, 43.0, 41.0, 41.0, 33.0, 33.0, 27.0, 26.0, 17.0, 18.0, 20.0, 19.0, 14.0, 10.0, 9.0, 3.0, 6.0, 2.0, 2.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.41015625, -1.3609466552734375, -1.311737060546875, -1.2625274658203125, -1.21331787109375, -1.1641082763671875, -1.114898681640625, -1.0656890869140625, -1.0164794921875, -0.9672698974609375, -0.918060302734375, -0.8688507080078125, -0.81964111328125, -0.7704315185546875, -0.721221923828125, -0.6720123291015625, -0.622802734375, -0.5735931396484375, -0.524383544921875, -0.4751739501953125, -0.42596435546875, -0.3767547607421875, -0.327545166015625, -0.2783355712890625, -0.2291259765625, -0.1799163818359375, -0.130706787109375, -0.0814971923828125, -0.03228759765625, 0.0169219970703125, 0.066131591796875, 0.1153411865234375, 0.16455078125, 0.2137603759765625, 0.262969970703125, 0.3121795654296875, 0.36138916015625, 0.4105987548828125, 0.459808349609375, 0.5090179443359375, 0.5582275390625, 0.6074371337890625, 0.656646728515625, 0.7058563232421875, 0.75506591796875, 0.8042755126953125, 0.853485107421875, 0.9026947021484375, 0.951904296875, 1.0011138916015625, 1.050323486328125, 1.0995330810546875, 1.14874267578125, 1.1979522705078125, 1.247161865234375, 1.2963714599609375, 1.3455810546875, 1.3947906494140625, 1.444000244140625, 1.4932098388671875, 1.54241943359375, 1.5916290283203125, 1.640838623046875, 1.6900482177734375, 1.7392578125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 5.0, 6.0, 3.0, 11.0, 11.0, 25.0, 19.0, 50.0, 71.0, 100.0, 150.0, 167.0, 283.0, 396.0, 563.0, 888.0, 1261.0, 1882.0, 2821.0, 4419.0, 6614.0, 10492.0, 16334.0, 25679.0, 40772.0, 65585.0, 109625.0, 183174.0, 1263852.0, 139629.0, 82857.0, 50899.0, 31712.0, 19751.0, 12736.0, 8236.0, 5514.0, 3464.0, 2306.0, 1571.0, 1037.0, 685.0, 439.0, 343.0, 244.0, 149.0, 91.0, 68.0, 44.0, 33.0, 34.0, 13.0, 6.0, 2.0, 9.0, 8.0, 2.0, 0.0, 4.0, 3.0], "bins": [-0.005870819091796875, -0.005688667297363281, -0.0055065155029296875, -0.005324363708496094, -0.0051422119140625, -0.004960060119628906, -0.0047779083251953125, -0.004595756530761719, -0.004413604736328125, -0.004231452941894531, -0.0040493011474609375, -0.0038671493530273438, -0.00368499755859375, -0.0035028457641601562, -0.0033206939697265625, -0.0031385421752929688, -0.002956390380859375, -0.0027742385864257812, -0.0025920867919921875, -0.0024099349975585938, -0.002227783203125, -0.0020456314086914062, -0.0018634796142578125, -0.0016813278198242188, -0.001499176025390625, -0.0013170242309570312, -0.0011348724365234375, -0.0009527206420898438, -0.00077056884765625, -0.0005884170532226562, -0.0004062652587890625, -0.00022411346435546875, -4.1961669921875e-05, 0.00014019012451171875, 0.0003223419189453125, 0.0005044937133789062, 0.0006866455078125, 0.0008687973022460938, 0.0010509490966796875, 0.0012331008911132812, 0.001415252685546875, 0.0015974044799804688, 0.0017795562744140625, 0.0019617080688476562, 0.00214385986328125, 0.0023260116577148438, 0.0025081634521484375, 0.0026903152465820312, 0.002872467041015625, 0.0030546188354492188, 0.0032367706298828125, 0.0034189224243164062, 0.00360107421875, 0.0037832260131835938, 0.0039653778076171875, 0.004147529602050781, 0.004329681396484375, 0.004511833190917969, 0.0046939849853515625, 0.004876136779785156, 0.00505828857421875, 0.005240440368652344, 0.0054225921630859375, 0.005604743957519531, 0.005786895751953125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 28.0, 0.0, 0.0, 0.0, 71.0, 0.0, 0.0, 0.0, 147.0, 0.0, 0.0, 475.0, 0.0, 0.0, 0.0, 131.0, 0.0, 0.0, 93.0, 0.0, 0.0, 0.0, 42.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539062e-07, -5.792826414108276e-07, -5.62518835067749e-07, -5.457550287246704e-07, -5.289912223815918e-07, -5.122274160385132e-07, -4.954636096954346e-07, -4.78699803352356e-07, -4.6193599700927734e-07, -4.4517219066619873e-07, -4.284083843231201e-07, -4.116445779800415e-07, -3.948807716369629e-07, -3.781169652938843e-07, -3.6135315895080566e-07, -3.4458935260772705e-07, -3.2782554626464844e-07, -3.110617399215698e-07, -2.942979335784912e-07, -2.775341272354126e-07, -2.60770320892334e-07, -2.4400651454925537e-07, -2.2724270820617676e-07, -2.1047890186309814e-07, -1.9371509552001953e-07, -1.7695128917694092e-07, -1.601874828338623e-07, -1.434236764907837e-07, -1.2665987014770508e-07, -1.0989606380462646e-07, -9.313225746154785e-08, -7.636845111846924e-08, -5.960464477539063e-08, -4.284083843231201e-08, -2.60770320892334e-08, -9.313225746154785e-09, 7.450580596923828e-09, 2.421438694000244e-08, 4.0978193283081055e-08, 5.774199962615967e-08, 7.450580596923828e-08, 9.12696123123169e-08, 1.0803341865539551e-07, 1.2479722499847412e-07, 1.4156103134155273e-07, 1.5832483768463135e-07, 1.7508864402770996e-07, 1.9185245037078857e-07, 2.086162567138672e-07, 2.253800630569458e-07, 2.421438694000244e-07, 2.5890767574310303e-07, 2.7567148208618164e-07, 2.9243528842926025e-07, 3.0919909477233887e-07, 3.259629011154175e-07, 3.427267074584961e-07, 3.594905138015747e-07, 3.762543201446533e-07, 3.9301812648773193e-07, 4.0978193283081055e-07, 4.2654573917388916e-07, 4.4330954551696777e-07, 4.600733518600464e-07, 4.76837158203125e-07]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 7.0, 8.0, 9.0, 19.0, 22.0, 15.0, 43.0, 50.0, 13.0, 70.0, 154.0, 58.0, 114.0, 400.0, 1162.0, 68787.0, 950934.0, 25219.0, 529.0, 405.0, 69.0, 52.0, 177.0, 51.0, 25.0, 43.0, 28.0, 12.0, 24.0, 21.0, 6.0, 6.0, 4.0, 4.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.808208465576172e-06, -7.533468306064606e-06, -7.2587281465530396e-06, -6.983987987041473e-06, -6.709247827529907e-06, -6.434507668018341e-06, -6.159767508506775e-06, -5.885027348995209e-06, -5.610287189483643e-06, -5.335547029972076e-06, -5.06080687046051e-06, -4.786066710948944e-06, -4.511326551437378e-06, -4.236586391925812e-06, -3.961846232414246e-06, -3.6871060729026794e-06, -3.4123659133911133e-06, -3.137625753879547e-06, -2.862885594367981e-06, -2.588145434856415e-06, -2.3134052753448486e-06, -2.0386651158332825e-06, -1.7639249563217163e-06, -1.4891847968101501e-06, -1.214444637298584e-06, -9.397044777870178e-07, -6.649643182754517e-07, -3.902241587638855e-07, -1.1548399925231934e-07, 1.5925616025924683e-07, 4.33996319770813e-07, 7.087364792823792e-07, 9.834766387939453e-07, 1.2582167983055115e-06, 1.5329569578170776e-06, 1.8076971173286438e-06, 2.08243727684021e-06, 2.357177436351776e-06, 2.6319175958633423e-06, 2.9066577553749084e-06, 3.1813979148864746e-06, 3.4561380743980408e-06, 3.730878233909607e-06, 4.005618393421173e-06, 4.280358552932739e-06, 4.555098712444305e-06, 4.829838871955872e-06, 5.104579031467438e-06, 5.379319190979004e-06, 5.65405935049057e-06, 5.928799510002136e-06, 6.203539669513702e-06, 6.4782798290252686e-06, 6.753019988536835e-06, 7.027760148048401e-06, 7.302500307559967e-06, 7.577240467071533e-06, 7.8519806265831e-06, 8.126720786094666e-06, 8.401460945606232e-06, 8.676201105117798e-06, 8.950941264629364e-06, 9.22568142414093e-06, 9.500421583652496e-06, 9.775161743164062e-06]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 9.0, 13.0, 19.0, 32.0, 39.0, 60.0, 65.0, 469.0, 95.0, 81.0, 36.0, 39.0, 25.0, 16.0, 6.0, 6.0, 3.0, 2.0, 2.0], "bins": [-8.073860158219759e-07, -7.921365181573492e-07, -7.768870204927225e-07, -7.616375228280958e-07, -7.463880251634691e-07, -7.311385274988424e-07, -7.158890298342158e-07, -7.006394753261702e-07, -6.853899776615435e-07, -6.701404799969168e-07, -6.548909823322902e-07, -6.396414846676635e-07, -6.243919870030368e-07, -6.091424893384101e-07, -5.938929916737834e-07, -5.786434940091567e-07, -5.6339399634453e-07, -5.481444986799033e-07, -5.328950010152766e-07, -5.1764550335065e-07, -5.023960056860233e-07, -4.871465080213966e-07, -4.7189698193506047e-07, -4.566474842704338e-07, -4.413979866058071e-07, -4.261484889411804e-07, -4.108989912765537e-07, -3.9564949361192703e-07, -3.803999675255909e-07, -3.651504698609642e-07, -3.4990097219633753e-07, -3.3465147453171085e-07, -3.19402033710503e-07, -3.0415253604587633e-07, -2.8890303838124964e-07, -2.7365354071662296e-07, -2.5840404305199627e-07, -2.431545453873696e-07, -2.2790501930103346e-07, -2.1265552163640677e-07, -1.974060239717801e-07, -1.821565263071534e-07, -1.669070286425267e-07, -1.516575167670453e-07, -1.3640801910241862e-07, -1.2115852143779193e-07, -1.0590901666773789e-07, -9.065951189768384e-08, -7.541001423305715e-08, -6.016051656843047e-08, -4.491101179837642e-08, -2.9661510581036055e-08, -1.4412009363695688e-08, 8.374883009309997e-10, 1.6086993070985045e-08, 3.133649784103909e-08, 4.658599550566578e-08, 6.183549317029247e-08, 7.708499794034651e-08, 9.233450271040056e-08, 1.0758400037502724e-07, 1.2283349803965393e-07, 1.3808300991513534e-07, 1.5333250757976202e-07, 1.685820052443887e-07]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 192.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 485.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 199.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.980232238769531e-07, -2.896413207054138e-07, -2.812594175338745e-07, -2.728775143623352e-07, -2.644956111907959e-07, -2.561137080192566e-07, -2.477318048477173e-07, -2.39349901676178e-07, -2.3096799850463867e-07, -2.2258609533309937e-07, -2.1420419216156006e-07, -2.0582228899002075e-07, -1.9744038581848145e-07, -1.8905848264694214e-07, -1.8067657947540283e-07, -1.7229467630386353e-07, -1.6391277313232422e-07, -1.555308699607849e-07, -1.471489667892456e-07, -1.387670636177063e-07, -1.30385160446167e-07, -1.2200325727462769e-07, -1.1362135410308838e-07, -1.0523945093154907e-07, -9.685754776000977e-08, -8.847564458847046e-08, -8.009374141693115e-08, -7.171183824539185e-08, -6.332993507385254e-08, -5.494803190231323e-08, -4.6566128730773926e-08, -3.818422555923462e-08, -2.9802322387695312e-08, -2.1420419216156006e-08, -1.30385160446167e-08, -4.6566128730773926e-09, 3.725290298461914e-09, 1.210719347000122e-08, 2.0489096641540527e-08, 2.8870999813079834e-08, 3.725290298461914e-08, 4.563480615615845e-08, 5.4016709327697754e-08, 6.239861249923706e-08, 7.078051567077637e-08, 7.916241884231567e-08, 8.754432201385498e-08, 9.592622518539429e-08, 1.043081283569336e-07, 1.126900315284729e-07, 1.210719347000122e-07, 1.2945383787155151e-07, 1.3783574104309082e-07, 1.4621764421463013e-07, 1.5459954738616943e-07, 1.6298145055770874e-07, 1.7136335372924805e-07, 1.7974525690078735e-07, 1.8812716007232666e-07, 1.9650906324386597e-07, 2.0489096641540527e-07, 2.1327286958694458e-07, 2.2165477275848389e-07, 2.300366759300232e-07, 2.384185791015625e-07]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 10.0, 6.0, 15.0, 13.0, 14.0, 35.0, 20.0, 24.0, 38.0, 47.0, 51.0, 50.0, 61.0, 71.0, 61.0, 62.0, 57.0, 57.0, 43.0, 46.0, 45.0, 39.0, 30.0, 30.0, 17.0, 19.0, 12.0, 8.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 4.0], "bins": [-3.72265625, -3.6373138427734375, -3.551971435546875, -3.4666290283203125, -3.38128662109375, -3.2959442138671875, -3.210601806640625, -3.1252593994140625, -3.0399169921875, -2.9545745849609375, -2.869232177734375, -2.7838897705078125, -2.69854736328125, -2.6132049560546875, -2.527862548828125, -2.4425201416015625, -2.357177734375, -2.2718353271484375, -2.186492919921875, -2.1011505126953125, -2.01580810546875, -1.9304656982421875, -1.845123291015625, -1.7597808837890625, -1.6744384765625, -1.5890960693359375, -1.503753662109375, -1.4184112548828125, -1.33306884765625, -1.2477264404296875, -1.162384033203125, -1.0770416259765625, -0.99169921875, -0.9063568115234375, -0.821014404296875, -0.7356719970703125, -0.65032958984375, -0.5649871826171875, -0.479644775390625, -0.3943023681640625, -0.3089599609375, -0.2236175537109375, -0.138275146484375, -0.0529327392578125, 0.03240966796875, 0.1177520751953125, 0.203094482421875, 0.2884368896484375, 0.373779296875, 0.4591217041015625, 0.544464111328125, 0.6298065185546875, 0.71514892578125, 0.8004913330078125, 0.885833740234375, 0.9711761474609375, 1.0565185546875, 1.1418609619140625, 1.227203369140625, 1.3125457763671875, 1.39788818359375, 1.4832305908203125, 1.568572998046875, 1.6539154052734375, 1.7392578125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 6.0, 9.0, 3.0, 8.0, 13.0, 19.0, 27.0, 32.0, 43.0, 67.0, 104.0, 169.0, 286.0, 388.0, 704.0, 1135.0, 1861.0, 3099.0, 5562.0, 10882.0, 24094.0, 65284.0, 409928.0, 411091.0, 65019.0, 24087.0, 10945.0, 5669.0, 3118.0, 1888.0, 1060.0, 706.0, 468.0, 260.0, 184.0, 110.0, 70.0, 54.0, 38.0, 21.0, 15.0, 10.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.771484375, -2.689971923828125, -2.60845947265625, -2.526947021484375, -2.4454345703125, -2.363922119140625, -2.28240966796875, -2.200897216796875, -2.119384765625, -2.037872314453125, -1.95635986328125, -1.874847412109375, -1.7933349609375, -1.711822509765625, -1.63031005859375, -1.548797607421875, -1.46728515625, -1.385772705078125, -1.30426025390625, -1.222747802734375, -1.1412353515625, -1.059722900390625, -0.97821044921875, -0.896697998046875, -0.815185546875, -0.733673095703125, -0.65216064453125, -0.570648193359375, -0.4891357421875, -0.407623291015625, -0.32611083984375, -0.244598388671875, -0.1630859375, -0.081573486328125, -6.103515625e-05, 0.081451416015625, 0.1629638671875, 0.244476318359375, 0.32598876953125, 0.407501220703125, 0.489013671875, 0.570526123046875, 0.65203857421875, 0.733551025390625, 0.8150634765625, 0.896575927734375, 0.97808837890625, 1.059600830078125, 1.14111328125, 1.222625732421875, 1.30413818359375, 1.385650634765625, 1.4671630859375, 1.548675537109375, 1.63018798828125, 1.711700439453125, 1.793212890625, 1.874725341796875, 1.95623779296875, 2.037750244140625, 2.1192626953125, 2.200775146484375, 2.28228759765625, 2.363800048828125, 2.4453125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 6.0, 10.0, 1.0, 8.0, 7.0, 7.0, 7.0, 16.0, 11.0, 12.0, 12.0, 21.0, 37.0, 27.0, 31.0, 32.0, 46.0, 36.0, 48.0, 54.0, 64.0, 139.0, 1802.0, 135.0, 52.0, 46.0, 54.0, 50.0, 42.0, 35.0, 24.0, 28.0, 24.0, 14.0, 22.0, 17.0, 12.0, 15.0, 10.0, 14.0, 8.0, 10.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-7.69140625, -7.474609375, -7.2578125, -7.041015625, -6.82421875, -6.607421875, -6.390625, -6.173828125, -5.95703125, -5.740234375, -5.5234375, -5.306640625, -5.08984375, -4.873046875, -4.65625, -4.439453125, -4.22265625, -4.005859375, -3.7890625, -3.572265625, -3.35546875, -3.138671875, -2.921875, -2.705078125, -2.48828125, -2.271484375, -2.0546875, -1.837890625, -1.62109375, -1.404296875, -1.1875, -0.970703125, -0.75390625, -0.537109375, -0.3203125, -0.103515625, 0.11328125, 0.330078125, 0.546875, 0.763671875, 0.98046875, 1.197265625, 1.4140625, 1.630859375, 1.84765625, 2.064453125, 2.28125, 2.498046875, 2.71484375, 2.931640625, 3.1484375, 3.365234375, 3.58203125, 3.798828125, 4.015625, 4.232421875, 4.44921875, 4.666015625, 4.8828125, 5.099609375, 5.31640625, 5.533203125, 5.75, 5.966796875, 6.18359375]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 4.0, 4.0, 9.0, 6.0, 12.0, 15.0, 9.0, 12.0, 16.0, 22.0, 18.0, 22.0, 33.0, 41.0, 58.0, 101.0, 142.0, 288.0, 787.0, 3938.0, 66115.0, 3019429.0, 49836.0, 3294.0, 717.0, 275.0, 121.0, 93.0, 58.0, 44.0, 49.0, 25.0, 20.0, 15.0, 13.0, 10.0, 10.0, 11.0, 4.0, 6.0, 11.0, 5.0, 8.0, 3.0, 0.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.21875, -10.8245849609375, -10.430419921875, -10.0362548828125, -9.64208984375, -9.2479248046875, -8.853759765625, -8.4595947265625, -8.0654296875, -7.6712646484375, -7.277099609375, -6.8829345703125, -6.48876953125, -6.0946044921875, -5.700439453125, -5.3062744140625, -4.912109375, -4.5179443359375, -4.123779296875, -3.7296142578125, -3.33544921875, -2.9412841796875, -2.547119140625, -2.1529541015625, -1.7587890625, -1.3646240234375, -0.970458984375, -0.5762939453125, -0.18212890625, 0.2120361328125, 0.606201171875, 1.0003662109375, 1.39453125, 1.7886962890625, 2.182861328125, 2.5770263671875, 2.97119140625, 3.3653564453125, 3.759521484375, 4.1536865234375, 4.5478515625, 4.9420166015625, 5.336181640625, 5.7303466796875, 6.12451171875, 6.5186767578125, 6.912841796875, 7.3070068359375, 7.701171875, 8.0953369140625, 8.489501953125, 8.8836669921875, 9.27783203125, 9.6719970703125, 10.066162109375, 10.4603271484375, 10.8544921875, 11.2486572265625, 11.642822265625, 12.0369873046875, 12.43115234375, 12.8253173828125, 13.219482421875, 13.6136474609375, 14.0078125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 23.0, 340.0, 580.0, 70.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-90.37042999267578, -88.49588775634766, -86.62135314941406, -84.74681091308594, -82.87227630615234, -80.99773406982422, -79.12319946289062, -77.2486572265625, -75.37411499023438, -73.49957275390625, -71.62503814697266, -69.75049591064453, -67.87596130371094, -66.00141906738281, -64.12688446044922, -62.252342224121094, -60.3778076171875, -58.50326919555664, -56.62873077392578, -54.75419235229492, -52.87965393066406, -51.00511169433594, -49.13057327270508, -47.25603485107422, -45.38149642944336, -43.5069580078125, -41.63241958618164, -39.75788116455078, -37.883338928222656, -36.00880432128906, -34.13426208496094, -32.25972366333008, -30.38518714904785, -28.510648727416992, -26.6361083984375, -24.76156997680664, -22.88703155517578, -21.012493133544922, -19.137954711914062, -17.26341438293457, -15.388875961303711, -13.514337539672852, -11.639798164367676, -9.7652587890625, -7.890720367431641, -6.016181945800781, -4.1416425704956055, -2.2671031951904297, -0.3925647735595703, 1.4819741249084473, 3.356513023376465, 5.231051921844482, 7.1055908203125, 8.98012924194336, 10.854668617248535, 12.729207992553711, 14.60374641418457, 16.47828483581543, 18.352825164794922, 20.22736358642578, 22.10190200805664, 23.9764404296875, 25.85097885131836, 27.72551918029785, 29.60005760192871]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 3.0, 5.0, 2.0, 9.0, 8.0, 10.0, 9.0, 9.0, 9.0, 16.0, 17.0, 17.0, 27.0, 32.0, 27.0, 45.0, 35.0, 30.0, 48.0, 40.0, 45.0, 39.0, 48.0, 40.0, 41.0, 47.0, 39.0, 38.0, 40.0, 24.0, 30.0, 13.0, 30.0, 24.0, 22.0, 15.0, 17.0, 7.0, 10.0, 7.0, 7.0, 3.0, 4.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.774188995361328, -23.012977600097656, -22.251768112182617, -21.490556716918945, -20.729345321655273, -19.968135833740234, -19.206924438476562, -18.44571304321289, -17.68450355529785, -16.92329216003418, -16.16208267211914, -15.400871276855469, -14.639660835266113, -13.878450393676758, -13.117238998413086, -12.35602855682373, -11.594817161560059, -10.833606719970703, -10.072395324707031, -9.311184883117676, -8.54997444152832, -7.788763523101807, -7.027552604675293, -6.2663421630859375, -5.505131244659424, -4.74392032623291, -3.9827098846435547, -3.221498966217041, -2.4602882862091064, -1.6990776062011719, -0.9378666877746582, -0.17665624618530273, 0.5845546722412109, 1.3457653522491455, 2.10697603225708, 2.8681869506835938, 3.6293976306915283, 4.390608310699463, 5.151819229125977, 5.913029670715332, 6.674240589141846, 7.435451507568359, 8.196661949157715, 8.95787239074707, 9.719083786010742, 10.480294227600098, 11.241504669189453, 12.002716064453125, 12.76392650604248, 13.525136947631836, 14.286348342895508, 15.047558784484863, 15.808769226074219, 16.56998062133789, 17.331192016601562, 18.0924015045166, 18.853612899780273, 19.614824295043945, 20.376033782958984, 21.137245178222656, 21.898456573486328, 22.659666061401367, 23.42087745666504, 24.182086944580078, 24.94329833984375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 6.0, 5.0, 2.0, 5.0, 9.0, 17.0, 7.0, 14.0, 19.0, 30.0, 23.0, 33.0, 41.0, 39.0, 48.0, 65.0, 60.0, 66.0, 64.0, 59.0, 59.0, 45.0, 53.0, 32.0, 51.0, 38.0, 33.0, 23.0, 18.0, 17.0, 10.0, 8.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 4.0], "bins": [-3.705078125, -3.6194915771484375, -3.533905029296875, -3.4483184814453125, -3.36273193359375, -3.2771453857421875, -3.191558837890625, -3.1059722900390625, -3.0203857421875, -2.9347991943359375, -2.849212646484375, -2.7636260986328125, -2.67803955078125, -2.5924530029296875, -2.506866455078125, -2.4212799072265625, -2.335693359375, -2.2501068115234375, -2.164520263671875, -2.0789337158203125, -1.99334716796875, -1.9077606201171875, -1.822174072265625, -1.7365875244140625, -1.6510009765625, -1.5654144287109375, -1.479827880859375, -1.3942413330078125, -1.30865478515625, -1.2230682373046875, -1.137481689453125, -1.0518951416015625, -0.96630859375, -0.8807220458984375, -0.795135498046875, -0.7095489501953125, -0.62396240234375, -0.5383758544921875, -0.452789306640625, -0.3672027587890625, -0.2816162109375, -0.1960296630859375, -0.110443115234375, -0.0248565673828125, 0.06072998046875, 0.1463165283203125, 0.231903076171875, 0.3174896240234375, 0.403076171875, 0.4886627197265625, 0.574249267578125, 0.6598358154296875, 0.74542236328125, 0.8310089111328125, 0.916595458984375, 1.0021820068359375, 1.0877685546875, 1.1733551025390625, 1.258941650390625, 1.3445281982421875, 1.43011474609375, 1.5157012939453125, 1.601287841796875, 1.6868743896484375, 1.7724609375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 7.0, 9.0, 14.0, 13.0, 22.0, 20.0, 36.0, 49.0, 62.0, 98.0, 174.0, 328.0, 995.0, 4125.0, 38003.0, 1332077.0, 2745402.0, 65162.0, 5682.0, 1172.0, 318.0, 165.0, 93.0, 78.0, 52.0, 41.0, 23.0, 26.0, 11.0, 5.0, 6.0, 7.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.140625, -18.6632080078125, -18.185791015625, -17.7083740234375, -17.23095703125, -16.7535400390625, -16.276123046875, -15.7987060546875, -15.3212890625, -14.8438720703125, -14.366455078125, -13.8890380859375, -13.41162109375, -12.9342041015625, -12.456787109375, -11.9793701171875, -11.501953125, -11.0245361328125, -10.547119140625, -10.0697021484375, -9.59228515625, -9.1148681640625, -8.637451171875, -8.1600341796875, -7.6826171875, -7.2052001953125, -6.727783203125, -6.2503662109375, -5.77294921875, -5.2955322265625, -4.818115234375, -4.3406982421875, -3.86328125, -3.3858642578125, -2.908447265625, -2.4310302734375, -1.95361328125, -1.4761962890625, -0.998779296875, -0.5213623046875, -0.0439453125, 0.4334716796875, 0.910888671875, 1.3883056640625, 1.86572265625, 2.3431396484375, 2.820556640625, 3.2979736328125, 3.775390625, 4.2528076171875, 4.730224609375, 5.2076416015625, 5.68505859375, 6.1624755859375, 6.639892578125, 7.1173095703125, 7.5947265625, 8.0721435546875, 8.549560546875, 9.0269775390625, 9.50439453125, 9.9818115234375, 10.459228515625, 10.9366455078125, 11.4140625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 9.0, 4.0, 11.0, 6.0, 23.0, 47.0, 72.0, 140.0, 241.0, 526.0, 855.0, 882.0, 554.0, 309.0, 186.0, 100.0, 61.0, 17.0, 14.0, 12.0, 5.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.765625, -19.35467529296875, -18.9437255859375, -18.53277587890625, -18.121826171875, -17.71087646484375, -17.2999267578125, -16.88897705078125, -16.47802734375, -16.06707763671875, -15.6561279296875, -15.24517822265625, -14.834228515625, -14.42327880859375, -14.0123291015625, -13.60137939453125, -13.1904296875, -12.77947998046875, -12.3685302734375, -11.95758056640625, -11.546630859375, -11.13568115234375, -10.7247314453125, -10.31378173828125, -9.90283203125, -9.49188232421875, -9.0809326171875, -8.66998291015625, -8.259033203125, -7.84808349609375, -7.4371337890625, -7.02618408203125, -6.615234375, -6.20428466796875, -5.7933349609375, -5.38238525390625, -4.971435546875, -4.56048583984375, -4.1495361328125, -3.73858642578125, -3.32763671875, -2.91668701171875, -2.5057373046875, -2.09478759765625, -1.683837890625, -1.27288818359375, -0.8619384765625, -0.45098876953125, -0.0400390625, 0.37091064453125, 0.7818603515625, 1.19281005859375, 1.603759765625, 2.01470947265625, 2.4256591796875, 2.83660888671875, 3.24755859375, 3.65850830078125, 4.0694580078125, 4.48040771484375, 4.891357421875, 5.30230712890625, 5.7132568359375, 6.12420654296875, 6.53515625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 5.0, 7.0, 9.0, 11.0, 24.0, 32.0, 32.0, 61.0, 101.0, 202.0, 462.0, 1493.0, 9233.0, 535381.0, 3603709.0, 39293.0, 2881.0, 727.0, 258.0, 125.0, 80.0, 38.0, 31.0, 30.0, 22.0, 8.0, 9.0, 6.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.0625, -25.9453125, -24.828125, -23.7109375, -22.59375, -21.4765625, -20.359375, -19.2421875, -18.125, -17.0078125, -15.890625, -14.7734375, -13.65625, -12.5390625, -11.421875, -10.3046875, -9.1875, -8.0703125, -6.953125, -5.8359375, -4.71875, -3.6015625, -2.484375, -1.3671875, -0.25, 0.8671875, 1.984375, 3.1015625, 4.21875, 5.3359375, 6.453125, 7.5703125, 8.6875, 9.8046875, 10.921875, 12.0390625, 13.15625, 14.2734375, 15.390625, 16.5078125, 17.625, 18.7421875, 19.859375, 20.9765625, 22.09375, 23.2109375, 24.328125, 25.4453125, 26.5625, 27.6796875, 28.796875, 29.9140625, 31.03125, 32.1484375, 33.265625, 34.3828125, 35.5, 36.6171875, 37.734375, 38.8515625, 39.96875, 41.0859375, 42.203125, 43.3203125, 44.4375]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 19.0, 26.0, 38.0, 106.0, 142.0, 177.0, 166.0, 154.0, 84.0, 49.0, 26.0, 12.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.0624008178711, -79.03031158447266, -76.99822235107422, -74.96613311767578, -72.93403625488281, -70.90194702148438, -68.86985778808594, -66.8377685546875, -64.80567932128906, -62.773590087890625, -60.74150085449219, -58.709407806396484, -56.67731857299805, -54.64522933959961, -52.613136291503906, -50.58104705810547, -48.54895782470703, -46.516868591308594, -44.484779357910156, -42.45268630981445, -40.420597076416016, -38.38850784301758, -36.356414794921875, -34.32432556152344, -32.292236328125, -30.260147094726562, -28.228055953979492, -26.195964813232422, -24.163875579833984, -22.131786346435547, -20.099695205688477, -18.067604064941406, -16.0355224609375, -14.003432273864746, -11.971342086791992, -9.939251899719238, -7.907161712646484, -5.8750715255737305, -3.8429813385009766, -1.8108911514282227, 0.22119903564453125, 2.253289222717285, 4.285379409790039, 6.317469596862793, 8.349559783935547, 10.3816499710083, 12.413740158081055, 14.445830345153809, 16.477920532226562, 18.510009765625, 20.54210090637207, 22.57419204711914, 24.606281280517578, 26.638370513916016, 28.670461654663086, 30.702552795410156, 32.734642028808594, 34.76673126220703, 36.79882049560547, 38.83091354370117, 40.86300277709961, 42.89509201049805, 44.92718505859375, 46.95927429199219, 48.991363525390625]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 8.0, 4.0, 7.0, 10.0, 10.0, 9.0, 14.0, 17.0, 14.0, 10.0, 22.0, 23.0, 32.0, 30.0, 36.0, 25.0, 39.0, 37.0, 44.0, 50.0, 37.0, 40.0, 41.0, 34.0, 48.0, 42.0, 35.0, 50.0, 39.0, 29.0, 33.0, 26.0, 27.0, 14.0, 17.0, 13.0, 7.0, 10.0, 8.0, 1.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.678138732910156, -29.807748794555664, -28.937358856201172, -28.06696891784668, -27.196578979492188, -26.326189041137695, -25.455799102783203, -24.58540916442871, -23.71501922607422, -22.844629287719727, -21.974239349365234, -21.103849411010742, -20.23345947265625, -19.363069534301758, -18.492679595947266, -17.622289657592773, -16.75189971923828, -15.881509780883789, -15.011119842529297, -14.140729904174805, -13.270339965820312, -12.39995002746582, -11.529560089111328, -10.659170150756836, -9.788780212402344, -8.918390274047852, -8.04800033569336, -7.177610397338867, -6.307220458984375, -5.436830520629883, -4.566440582275391, -3.6960506439208984, -2.8256607055664062, -1.955270767211914, -1.0848808288574219, -0.2144908905029297, 0.6558990478515625, 1.5262889862060547, 2.396678924560547, 3.267068862915039, 4.137458801269531, 5.007848739624023, 5.878238677978516, 6.748628616333008, 7.6190185546875, 8.489408493041992, 9.359798431396484, 10.230188369750977, 11.100578308105469, 11.970968246459961, 12.841358184814453, 13.711748123168945, 14.582138061523438, 15.45252799987793, 16.322917938232422, 17.193307876586914, 18.063697814941406, 18.9340877532959, 19.80447769165039, 20.674867630004883, 21.545257568359375, 22.415647506713867, 23.28603744506836, 24.15642738342285, 25.026817321777344]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 6.0, 8.0, 11.0, 10.0, 16.0, 20.0, 23.0, 26.0, 33.0, 44.0, 47.0, 46.0, 58.0, 71.0, 55.0, 51.0, 65.0, 60.0, 57.0, 48.0, 31.0, 38.0, 47.0, 27.0, 25.0, 16.0, 19.0, 11.0, 13.0, 7.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0], "bins": [-3.88671875, -3.7968902587890625, -3.707061767578125, -3.6172332763671875, -3.52740478515625, -3.4375762939453125, -3.347747802734375, -3.2579193115234375, -3.1680908203125, -3.0782623291015625, -2.988433837890625, -2.8986053466796875, -2.80877685546875, -2.7189483642578125, -2.629119873046875, -2.5392913818359375, -2.449462890625, -2.3596343994140625, -2.269805908203125, -2.1799774169921875, -2.09014892578125, -2.0003204345703125, -1.910491943359375, -1.8206634521484375, -1.7308349609375, -1.6410064697265625, -1.551177978515625, -1.4613494873046875, -1.37152099609375, -1.2816925048828125, -1.191864013671875, -1.1020355224609375, -1.01220703125, -0.9223785400390625, -0.832550048828125, -0.7427215576171875, -0.65289306640625, -0.5630645751953125, -0.473236083984375, -0.3834075927734375, -0.2935791015625, -0.2037506103515625, -0.113922119140625, -0.0240936279296875, 0.06573486328125, 0.1555633544921875, 0.245391845703125, 0.3352203369140625, 0.425048828125, 0.5148773193359375, 0.604705810546875, 0.6945343017578125, 0.78436279296875, 0.8741912841796875, 0.964019775390625, 1.0538482666015625, 1.1436767578125, 1.2335052490234375, 1.323333740234375, 1.4131622314453125, 1.50299072265625, 1.5928192138671875, 1.682647705078125, 1.7724761962890625, 1.8623046875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 6.0, 9.0, 9.0, 10.0, 14.0, 19.0, 25.0, 33.0, 47.0, 88.0, 181.0, 369.0, 658.0, 1363.0, 2600.0, 4925.0, 9910.0, 19973.0, 42412.0, 97128.0, 287204.0, 364620.0, 119567.0, 50098.0, 23707.0, 11596.0, 5846.0, 2936.0, 1504.0, 785.0, 376.0, 223.0, 118.0, 58.0, 30.0, 25.0, 17.0, 16.0, 14.0, 5.0, 8.0, 3.0, 4.0, 4.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.025360107421875, -0.02448892593383789, -0.02361774444580078, -0.022746562957763672, -0.021875381469726562, -0.021004199981689453, -0.020133018493652344, -0.019261837005615234, -0.018390655517578125, -0.017519474029541016, -0.016648292541503906, -0.015777111053466797, -0.014905929565429688, -0.014034748077392578, -0.013163566589355469, -0.01229238510131836, -0.01142120361328125, -0.01055002212524414, -0.009678840637207031, -0.008807659149169922, -0.007936477661132812, -0.007065296173095703, -0.006194114685058594, -0.005322933197021484, -0.004451751708984375, -0.0035805702209472656, -0.0027093887329101562, -0.0018382072448730469, -0.0009670257568359375, -9.584426879882812e-05, 0.0007753372192382812, 0.0016465187072753906, 0.0025177001953125, 0.0033888816833496094, 0.004260063171386719, 0.005131244659423828, 0.0060024261474609375, 0.006873607635498047, 0.007744789123535156, 0.008615970611572266, 0.009487152099609375, 0.010358333587646484, 0.011229515075683594, 0.012100696563720703, 0.012971878051757812, 0.013843059539794922, 0.014714241027832031, 0.01558542251586914, 0.01645660400390625, 0.01732778549194336, 0.01819896697998047, 0.019070148468017578, 0.019941329956054688, 0.020812511444091797, 0.021683692932128906, 0.022554874420166016, 0.023426055908203125, 0.024297237396240234, 0.025168418884277344, 0.026039600372314453, 0.026910781860351562, 0.027781963348388672, 0.02865314483642578, 0.02952432632446289, 0.0303955078125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 7.0, 6.0, 10.0, 16.0, 10.0, 8.0, 9.0, 14.0, 17.0, 23.0, 26.0, 27.0, 43.0, 29.0, 34.0, 29.0, 32.0, 32.0, 28.0, 46.0, 1064.0, 49.0, 42.0, 39.0, 44.0, 27.0, 31.0, 35.0, 25.0, 29.0, 20.0, 16.0, 22.0, 11.0, 19.0, 14.0, 11.0, 11.0, 8.0, 7.0, 8.0, 7.0, 6.0, 4.0, 9.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-1.525390625, -1.4770965576171875, -1.428802490234375, -1.3805084228515625, -1.33221435546875, -1.2839202880859375, -1.235626220703125, -1.1873321533203125, -1.1390380859375, -1.0907440185546875, -1.042449951171875, -0.9941558837890625, -0.94586181640625, -0.8975677490234375, -0.849273681640625, -0.8009796142578125, -0.752685546875, -0.7043914794921875, -0.656097412109375, -0.6078033447265625, -0.55950927734375, -0.5112152099609375, -0.462921142578125, -0.4146270751953125, -0.3663330078125, -0.3180389404296875, -0.269744873046875, -0.2214508056640625, -0.17315673828125, -0.1248626708984375, -0.076568603515625, -0.0282745361328125, 0.02001953125, 0.0683135986328125, 0.116607666015625, 0.1649017333984375, 0.21319580078125, 0.2614898681640625, 0.309783935546875, 0.3580780029296875, 0.4063720703125, 0.4546661376953125, 0.502960205078125, 0.5512542724609375, 0.59954833984375, 0.6478424072265625, 0.696136474609375, 0.7444305419921875, 0.792724609375, 0.8410186767578125, 0.889312744140625, 0.9376068115234375, 0.98590087890625, 1.0341949462890625, 1.082489013671875, 1.1307830810546875, 1.1790771484375, 1.2273712158203125, 1.275665283203125, 1.3239593505859375, 1.37225341796875, 1.4205474853515625, 1.468841552734375, 1.5171356201171875, 1.5654296875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 9.0, 10.0, 15.0, 27.0, 34.0, 54.0, 81.0, 112.0, 177.0, 225.0, 342.0, 505.0, 724.0, 1007.0, 1594.0, 2203.0, 3244.0, 4990.0, 7429.0, 11256.0, 17022.0, 26036.0, 40485.0, 65056.0, 107252.0, 188773.0, 1269231.0, 132715.0, 78225.0, 48427.0, 30579.0, 19656.0, 13230.0, 8478.0, 5817.0, 3790.0, 2612.0, 1780.0, 1254.0, 847.0, 584.0, 385.0, 263.0, 189.0, 135.0, 95.0, 59.0, 46.0, 34.0, 15.0, 20.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00628662109375, -0.006085038185119629, -0.005883455276489258, -0.005681872367858887, -0.005480289459228516, -0.0052787065505981445, -0.0050771236419677734, -0.004875540733337402, -0.004673957824707031, -0.00447237491607666, -0.004270792007446289, -0.004069209098815918, -0.003867626190185547, -0.0036660432815551758, -0.0034644603729248047, -0.0032628774642944336, -0.0030612945556640625, -0.0028597116470336914, -0.0026581287384033203, -0.0024565458297729492, -0.002254962921142578, -0.002053380012512207, -0.001851797103881836, -0.0016502141952514648, -0.0014486312866210938, -0.0012470483779907227, -0.0010454654693603516, -0.0008438825607299805, -0.0006422996520996094, -0.0004407167434692383, -0.0002391338348388672, -3.7550926208496094e-05, 0.000164031982421875, 0.0003656148910522461, 0.0005671977996826172, 0.0007687807083129883, 0.0009703636169433594, 0.0011719465255737305, 0.0013735294342041016, 0.0015751123428344727, 0.0017766952514648438, 0.001978278160095215, 0.002179861068725586, 0.002381443977355957, 0.002583026885986328, 0.0027846097946166992, 0.0029861927032470703, 0.0031877756118774414, 0.0033893585205078125, 0.0035909414291381836, 0.0037925243377685547, 0.003994107246398926, 0.004195690155029297, 0.004397273063659668, 0.004598855972290039, 0.00480043888092041, 0.005002021789550781, 0.005203604698181152, 0.0054051876068115234, 0.0056067705154418945, 0.005808353424072266, 0.006009936332702637, 0.006211519241333008, 0.006413102149963379, 0.00661468505859375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 0.0, 29.0, 0.0, 0.0, 0.0, 43.0, 0.0, 0.0, 67.0, 0.0, 0.0, 0.0, 121.0, 0.0, 0.0, 0.0, 467.0, 0.0, 0.0, 0.0, 113.0, 0.0, 0.0, 77.0, 0.0, 0.0, 0.0, 37.0, 0.0, 0.0, 0.0, 23.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.172325134277344e-07, -4.0140002965927124e-07, -3.855675458908081e-07, -3.6973506212234497e-07, -3.5390257835388184e-07, -3.380700945854187e-07, -3.2223761081695557e-07, -3.0640512704849243e-07, -2.905726432800293e-07, -2.7474015951156616e-07, -2.5890767574310303e-07, -2.430751919746399e-07, -2.2724270820617676e-07, -2.1141022443771362e-07, -1.955777406692505e-07, -1.7974525690078735e-07, -1.6391277313232422e-07, -1.4808028936386108e-07, -1.3224780559539795e-07, -1.1641532182693481e-07, -1.0058283805847168e-07, -8.475035429000854e-08, -6.891787052154541e-08, -5.3085386753082275e-08, -3.725290298461914e-08, -2.1420419216156006e-08, -5.587935447692871e-09, 1.0244548320770264e-08, 2.60770320892334e-08, 4.190951585769653e-08, 5.774199962615967e-08, 7.35744833946228e-08, 8.940696716308594e-08, 1.0523945093154907e-07, 1.210719347000122e-07, 1.3690441846847534e-07, 1.5273690223693848e-07, 1.685693860054016e-07, 1.8440186977386475e-07, 2.0023435354232788e-07, 2.1606683731079102e-07, 2.3189932107925415e-07, 2.477318048477173e-07, 2.635642886161804e-07, 2.7939677238464355e-07, 2.952292561531067e-07, 3.110617399215698e-07, 3.2689422369003296e-07, 3.427267074584961e-07, 3.5855919122695923e-07, 3.7439167499542236e-07, 3.902241587638855e-07, 4.0605664253234863e-07, 4.2188912630081177e-07, 4.377216100692749e-07, 4.5355409383773804e-07, 4.6938657760620117e-07, 4.852190613746643e-07, 5.010515451431274e-07, 5.168840289115906e-07, 5.327165126800537e-07, 5.485489964485168e-07, 5.6438148021698e-07, 5.802139639854431e-07, 5.960464477539062e-07]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 5.0, 6.0, 3.0, 6.0, 3.0, 5.0, 12.0, 11.0, 16.0, 31.0, 19.0, 34.0, 41.0, 52.0, 67.0, 54.0, 104.0, 112.0, 113.0, 380.0, 1443.0, 40924.0, 909332.0, 89574.0, 5011.0, 448.0, 152.0, 124.0, 98.0, 76.0, 50.0, 51.0, 38.0, 29.0, 27.0, 28.0, 19.0, 18.0, 10.0, 8.0, 7.0, 7.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-8.285045623779297e-06, -8.023343980312347e-06, -7.761642336845398e-06, -7.4999406933784485e-06, -7.238239049911499e-06, -6.9765374064445496e-06, -6.7148357629776e-06, -6.453134119510651e-06, -6.191432476043701e-06, -5.929730832576752e-06, -5.668029189109802e-06, -5.406327545642853e-06, -5.144625902175903e-06, -4.882924258708954e-06, -4.621222615242004e-06, -4.359520971775055e-06, -4.0978193283081055e-06, -3.836117684841156e-06, -3.5744160413742065e-06, -3.312714397907257e-06, -3.0510127544403076e-06, -2.789311110973358e-06, -2.5276094675064087e-06, -2.2659078240394592e-06, -2.0042061805725098e-06, -1.7425045371055603e-06, -1.4808028936386108e-06, -1.2191012501716614e-06, -9.57399606704712e-07, -6.956979632377625e-07, -4.33996319770813e-07, -1.7229467630386353e-07, 8.940696716308594e-08, 3.511086106300354e-07, 6.128102540969849e-07, 8.745118975639343e-07, 1.1362135410308838e-06, 1.3979151844978333e-06, 1.6596168279647827e-06, 1.921318471431732e-06, 2.1830201148986816e-06, 2.444721758365631e-06, 2.7064234018325806e-06, 2.96812504529953e-06, 3.2298266887664795e-06, 3.491528332233429e-06, 3.7532299757003784e-06, 4.014931619167328e-06, 4.276633262634277e-06, 4.538334906101227e-06, 4.800036549568176e-06, 5.061738193035126e-06, 5.323439836502075e-06, 5.585141479969025e-06, 5.846843123435974e-06, 6.108544766902924e-06, 6.370246410369873e-06, 6.6319480538368225e-06, 6.893649697303772e-06, 7.1553513407707214e-06, 7.417052984237671e-06, 7.67875462770462e-06, 7.94045627117157e-06, 8.20215791463852e-06, 8.463859558105469e-06]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 9.0, 12.0, 17.0, 33.0, 42.0, 67.0, 77.0, 431.0, 69.0, 70.0, 52.0, 47.0, 29.0, 19.0, 11.0, 8.0, 7.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.444868970196694e-07, -7.28646341485728e-07, -7.128058427952055e-07, -6.969652872612642e-07, -6.811247317273228e-07, -6.652842330368003e-07, -6.494436775028589e-07, -6.336031219689175e-07, -6.17762623278395e-07, -6.019220677444537e-07, -5.860815690539312e-07, -5.702410135199898e-07, -5.544004579860484e-07, -5.385599592955259e-07, -5.227194037615845e-07, -5.068788482276432e-07, -4.910383495371207e-07, -4.7519782242488873e-07, -4.5935726689094736e-07, -4.435167397787154e-07, -4.276762126664835e-07, -4.1183568555425154e-07, -3.9599513002031017e-07, -3.8015460290807823e-07, -3.6431401895242743e-07, -3.484734918401955e-07, -3.326329363062541e-07, -3.167924091940222e-07, -3.0095188208179025e-07, -2.851113549695583e-07, -2.6927079943561694e-07, -2.53430272323385e-07, -2.375897736328625e-07, -2.2174923230977583e-07, -2.059087051975439e-07, -1.9006816387445724e-07, -1.742276367622253e-07, -1.5838709543913865e-07, -1.42546554116052e-07, -1.2670602700382005e-07, -1.108654856807334e-07, -9.50249514630741e-08, -7.91844172454148e-08, -6.334387592232815e-08, -4.7503341704668856e-08, -3.166280748700956e-08, -1.5822266163922905e-08, 1.8268053736392176e-11, 1.585880227139569e-08, 3.1699336489054986e-08, 4.753987425942796e-08, 6.338041202980094e-08, 7.922094624746023e-08, 9.506148046511953e-08, 1.1090202178820618e-07, 1.2674254890043812e-07, 1.4258309022352478e-07, 1.5842363154661143e-07, 1.7426415865884337e-07, 1.9010469998193003e-07, 2.0594524130501668e-07, 2.2178576841724862e-07, 2.3762630974033527e-07, 2.5346685106342193e-07, 2.6930737817565387e-07]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.0, 0.0, 0.0, 0.0, 0.0, 0.0, 186.0, 0.0, 0.0, 0.0, 0.0, 0.0, 445.0, 0.0, 0.0, 0.0, 0.0, 182.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.0, 0.0, 0.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.980232238769531e-07, -2.8777867555618286e-07, -2.775341272354126e-07, -2.6728957891464233e-07, -2.5704503059387207e-07, -2.468004822731018e-07, -2.3655593395233154e-07, -2.2631138563156128e-07, -2.1606683731079102e-07, -2.0582228899002075e-07, -1.955777406692505e-07, -1.8533319234848022e-07, -1.7508864402770996e-07, -1.648440957069397e-07, -1.5459954738616943e-07, -1.4435499906539917e-07, -1.341104507446289e-07, -1.2386590242385864e-07, -1.1362135410308838e-07, -1.0337680578231812e-07, -9.313225746154785e-08, -8.288770914077759e-08, -7.264316082000732e-08, -6.239861249923706e-08, -5.21540641784668e-08, -4.190951585769653e-08, -3.166496753692627e-08, -2.1420419216156006e-08, -1.1175870895385742e-08, -9.313225746154785e-10, 9.313225746154785e-09, 1.955777406692505e-08, 2.9802322387695312e-08, 4.0046870708465576e-08, 5.029141902923584e-08, 6.05359673500061e-08, 7.078051567077637e-08, 8.102506399154663e-08, 9.12696123123169e-08, 1.0151416063308716e-07, 1.1175870895385742e-07, 1.2200325727462769e-07, 1.3224780559539795e-07, 1.424923539161682e-07, 1.5273690223693848e-07, 1.6298145055770874e-07, 1.73225998878479e-07, 1.8347054719924927e-07, 1.9371509552001953e-07, 2.039596438407898e-07, 2.1420419216156006e-07, 2.2444874048233032e-07, 2.3469328880310059e-07, 2.4493783712387085e-07, 2.551823854446411e-07, 2.654269337654114e-07, 2.7567148208618164e-07, 2.859160304069519e-07, 2.9616057872772217e-07, 3.0640512704849243e-07, 3.166496753692627e-07, 3.2689422369003296e-07, 3.371387720108032e-07, 3.473833203315735e-07, 3.5762786865234375e-07]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 6.0, 8.0, 11.0, 10.0, 16.0, 20.0, 23.0, 26.0, 33.0, 44.0, 47.0, 46.0, 58.0, 71.0, 55.0, 51.0, 65.0, 60.0, 57.0, 48.0, 31.0, 38.0, 47.0, 27.0, 25.0, 16.0, 19.0, 11.0, 13.0, 7.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0], "bins": [-3.88671875, -3.7968902587890625, -3.707061767578125, -3.6172332763671875, -3.52740478515625, -3.4375762939453125, -3.347747802734375, -3.2579193115234375, -3.1680908203125, -3.0782623291015625, -2.988433837890625, -2.8986053466796875, -2.80877685546875, -2.7189483642578125, -2.629119873046875, -2.5392913818359375, -2.449462890625, -2.3596343994140625, -2.269805908203125, -2.1799774169921875, -2.09014892578125, -2.0003204345703125, -1.910491943359375, -1.8206634521484375, -1.7308349609375, -1.6410064697265625, -1.551177978515625, -1.4613494873046875, -1.37152099609375, -1.2816925048828125, -1.191864013671875, -1.1020355224609375, -1.01220703125, -0.9223785400390625, -0.832550048828125, -0.7427215576171875, -0.65289306640625, -0.5630645751953125, -0.473236083984375, -0.3834075927734375, -0.2935791015625, -0.2037506103515625, -0.113922119140625, -0.0240936279296875, 0.06573486328125, 0.1555633544921875, 0.245391845703125, 0.3352203369140625, 0.425048828125, 0.5148773193359375, 0.604705810546875, 0.6945343017578125, 0.78436279296875, 0.8741912841796875, 0.964019775390625, 1.0538482666015625, 1.1436767578125, 1.2335052490234375, 1.323333740234375, 1.4131622314453125, 1.50299072265625, 1.5928192138671875, 1.682647705078125, 1.7724761962890625, 1.8623046875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 9.0, 10.0, 29.0, 41.0, 66.0, 120.0, 255.0, 519.0, 1037.0, 2414.0, 7280.0, 32304.0, 239788.0, 682370.0, 63637.0, 12407.0, 3524.0, 1393.0, 662.0, 316.0, 163.0, 98.0, 46.0, 25.0, 18.0, 7.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-6.80078125, -6.617919921875, -6.43505859375, -6.252197265625, -6.0693359375, -5.886474609375, -5.70361328125, -5.520751953125, -5.337890625, -5.155029296875, -4.97216796875, -4.789306640625, -4.6064453125, -4.423583984375, -4.24072265625, -4.057861328125, -3.875, -3.692138671875, -3.50927734375, -3.326416015625, -3.1435546875, -2.960693359375, -2.77783203125, -2.594970703125, -2.412109375, -2.229248046875, -2.04638671875, -1.863525390625, -1.6806640625, -1.497802734375, -1.31494140625, -1.132080078125, -0.94921875, -0.766357421875, -0.58349609375, -0.400634765625, -0.2177734375, -0.034912109375, 0.14794921875, 0.330810546875, 0.513671875, 0.696533203125, 0.87939453125, 1.062255859375, 1.2451171875, 1.427978515625, 1.61083984375, 1.793701171875, 1.9765625, 2.159423828125, 2.34228515625, 2.525146484375, 2.7080078125, 2.890869140625, 3.07373046875, 3.256591796875, 3.439453125, 3.622314453125, 3.80517578125, 3.988037109375, 4.1708984375, 4.353759765625, 4.53662109375, 4.719482421875, 4.90234375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 17.0, 6.0, 22.0, 21.0, 27.0, 33.0, 34.0, 41.0, 44.0, 58.0, 72.0, 152.0, 1768.0, 267.0, 89.0, 56.0, 58.0, 49.0, 46.0, 35.0, 28.0, 14.0, 25.0, 13.0, 19.0, 8.0, 10.0, 10.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.390625, -9.0740966796875, -8.757568359375, -8.4410400390625, -8.12451171875, -7.8079833984375, -7.491455078125, -7.1749267578125, -6.8583984375, -6.5418701171875, -6.225341796875, -5.9088134765625, -5.59228515625, -5.2757568359375, -4.959228515625, -4.6427001953125, -4.326171875, -4.0096435546875, -3.693115234375, -3.3765869140625, -3.06005859375, -2.7435302734375, -2.427001953125, -2.1104736328125, -1.7939453125, -1.4774169921875, -1.160888671875, -0.8443603515625, -0.52783203125, -0.2113037109375, 0.105224609375, 0.4217529296875, 0.73828125, 1.0548095703125, 1.371337890625, 1.6878662109375, 2.00439453125, 2.3209228515625, 2.637451171875, 2.9539794921875, 3.2705078125, 3.5870361328125, 3.903564453125, 4.2200927734375, 4.53662109375, 4.8531494140625, 5.169677734375, 5.4862060546875, 5.802734375, 6.1192626953125, 6.435791015625, 6.7523193359375, 7.06884765625, 7.3853759765625, 7.701904296875, 8.0184326171875, 8.3349609375, 8.6514892578125, 8.968017578125, 9.2845458984375, 9.60107421875, 9.9176025390625, 10.234130859375, 10.5506591796875, 10.8671875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 14.0, 11.0, 16.0, 18.0, 14.0, 26.0, 27.0, 44.0, 55.0, 80.0, 146.0, 288.0, 604.0, 2319.0, 17220.0, 2034344.0, 1072040.0, 15015.0, 2166.0, 606.0, 233.0, 125.0, 83.0, 43.0, 38.0, 28.0, 27.0, 18.0, 12.0, 12.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.921875, -11.560302734375, -11.19873046875, -10.837158203125, -10.4755859375, -10.114013671875, -9.75244140625, -9.390869140625, -9.029296875, -8.667724609375, -8.30615234375, -7.944580078125, -7.5830078125, -7.221435546875, -6.85986328125, -6.498291015625, -6.13671875, -5.775146484375, -5.41357421875, -5.052001953125, -4.6904296875, -4.328857421875, -3.96728515625, -3.605712890625, -3.244140625, -2.882568359375, -2.52099609375, -2.159423828125, -1.7978515625, -1.436279296875, -1.07470703125, -0.713134765625, -0.3515625, 0.010009765625, 0.37158203125, 0.733154296875, 1.0947265625, 1.456298828125, 1.81787109375, 2.179443359375, 2.541015625, 2.902587890625, 3.26416015625, 3.625732421875, 3.9873046875, 4.348876953125, 4.71044921875, 5.072021484375, 5.43359375, 5.795166015625, 6.15673828125, 6.518310546875, 6.8798828125, 7.241455078125, 7.60302734375, 7.964599609375, 8.326171875, 8.687744140625, 9.04931640625, 9.410888671875, 9.7724609375, 10.134033203125, 10.49560546875, 10.857177734375, 11.21875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 109.0, 554.0, 322.0, 27.0, 2.0, 2.0], "bins": [-134.84300231933594, -132.58731079101562, -130.33163452148438, -128.07594299316406, -125.82025146484375, -123.56456756591797, -121.30887603759766, -119.05319213867188, -116.79750061035156, -114.54181671142578, -112.28612518310547, -110.03044128417969, -107.77474975585938, -105.5190658569336, -103.26337432861328, -101.0076904296875, -98.75199890136719, -96.4963150024414, -94.2406234741211, -91.98493957519531, -89.729248046875, -87.47356414794922, -85.2178726196289, -82.96218872070312, -80.70650482177734, -78.45082092285156, -76.19512939453125, -73.93944549560547, -71.68375396728516, -69.42807006835938, -67.17237854003906, -64.91669464111328, -62.661006927490234, -60.40531921386719, -58.14963150024414, -55.893943786621094, -53.63825607299805, -51.382568359375, -49.12688446044922, -46.871192932128906, -44.615509033203125, -42.35982131958008, -40.10413360595703, -37.848445892333984, -35.59275817871094, -33.33707046508789, -31.081384658813477, -28.82569694519043, -26.57000732421875, -24.314319610595703, -22.058631896972656, -19.80294418334961, -17.547256469726562, -15.291569709777832, -13.035882949829102, -10.780195236206055, -8.524507522583008, -6.268819808959961, -4.013132572174072, -1.7574453353881836, 0.4982423782348633, 2.75393009185791, 5.009616851806641, 7.2653045654296875, 9.520992279052734]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 4.0, 5.0, 6.0, 6.0, 8.0, 9.0, 13.0, 11.0, 16.0, 10.0, 23.0, 26.0, 23.0, 24.0, 27.0, 30.0, 40.0, 32.0, 33.0, 36.0, 34.0, 38.0, 43.0, 50.0, 39.0, 59.0, 36.0, 28.0, 34.0, 26.0, 23.0, 22.0, 29.0, 25.0, 25.0, 13.0, 20.0, 16.0, 16.0, 6.0, 7.0, 9.0, 5.0, 3.0, 5.0, 2.0, 2.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.819372177124023, -23.039987564086914, -22.260604858398438, -21.481220245361328, -20.70183753967285, -19.922452926635742, -19.143070220947266, -18.363685607910156, -17.584300994873047, -16.804916381835938, -16.02553367614746, -15.246149063110352, -14.466766357421875, -13.687381744384766, -12.907998085021973, -12.12861442565918, -11.349231719970703, -10.56984806060791, -9.790464401245117, -9.011079788208008, -8.231697082519531, -7.45231294631958, -6.672928810119629, -5.893545150756836, -5.114161491394043, -4.33477783203125, -3.555393934249878, -2.776010036468506, -1.996626377105713, -1.21724271774292, -0.43785858154296875, 0.3415250778198242, 1.12091064453125, 1.9002944231033325, 2.679678201675415, 3.459062099456787, 4.23844575881958, 5.017829418182373, 5.797213554382324, 6.576597213745117, 7.35598087310791, 8.135364532470703, 8.914748191833496, 9.694131851196289, 10.473516464233398, 11.252899169921875, 12.032283782958984, 12.811667442321777, 13.59105110168457, 14.370434761047363, 15.149818420410156, 15.929203033447266, 16.708585739135742, 17.48797035217285, 18.267353057861328, 19.046737670898438, 19.826122283935547, 20.605506896972656, 21.384889602661133, 22.164274215698242, 22.94365692138672, 23.723041534423828, 24.502426147460938, 25.281808853149414, 26.06119155883789]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 10.0, 8.0, 10.0, 10.0, 15.0, 17.0, 23.0, 21.0, 37.0, 41.0, 50.0, 47.0, 59.0, 52.0, 65.0, 51.0, 66.0, 64.0, 51.0, 52.0, 38.0, 32.0, 45.0, 32.0, 25.0, 17.0, 16.0, 17.0, 11.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0], "bins": [-3.92578125, -3.8353424072265625, -3.744903564453125, -3.6544647216796875, -3.56402587890625, -3.4735870361328125, -3.383148193359375, -3.2927093505859375, -3.2022705078125, -3.1118316650390625, -3.021392822265625, -2.9309539794921875, -2.84051513671875, -2.7500762939453125, -2.659637451171875, -2.5691986083984375, -2.478759765625, -2.3883209228515625, -2.297882080078125, -2.2074432373046875, -2.11700439453125, -2.0265655517578125, -1.936126708984375, -1.8456878662109375, -1.7552490234375, -1.6648101806640625, -1.574371337890625, -1.4839324951171875, -1.39349365234375, -1.3030548095703125, -1.212615966796875, -1.1221771240234375, -1.03173828125, -0.9412994384765625, -0.850860595703125, -0.7604217529296875, -0.66998291015625, -0.5795440673828125, -0.489105224609375, -0.3986663818359375, -0.3082275390625, -0.2177886962890625, -0.127349853515625, -0.0369110107421875, 0.05352783203125, 0.1439666748046875, 0.234405517578125, 0.3248443603515625, 0.415283203125, 0.5057220458984375, 0.596160888671875, 0.6865997314453125, 0.77703857421875, 0.8674774169921875, 0.957916259765625, 1.0483551025390625, 1.1387939453125, 1.2292327880859375, 1.319671630859375, 1.4101104736328125, 1.50054931640625, 1.5909881591796875, 1.681427001953125, 1.7718658447265625, 1.8623046875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 6.0, 18.0, 10.0, 18.0, 30.0, 34.0, 55.0, 84.0, 184.0, 349.0, 860.0, 2489.0, 8812.0, 40269.0, 260567.0, 2598905.0, 1134948.0, 117659.0, 21160.0, 5183.0, 1468.0, 584.0, 257.0, 115.0, 83.0, 28.0, 39.0, 17.0, 14.0, 9.0, 5.0, 10.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-10.984375, -10.71514892578125, -10.4459228515625, -10.17669677734375, -9.907470703125, -9.63824462890625, -9.3690185546875, -9.09979248046875, -8.83056640625, -8.56134033203125, -8.2921142578125, -8.02288818359375, -7.753662109375, -7.48443603515625, -7.2152099609375, -6.94598388671875, -6.6767578125, -6.40753173828125, -6.1383056640625, -5.86907958984375, -5.599853515625, -5.33062744140625, -5.0614013671875, -4.79217529296875, -4.52294921875, -4.25372314453125, -3.9844970703125, -3.71527099609375, -3.446044921875, -3.17681884765625, -2.9075927734375, -2.63836669921875, -2.369140625, -2.09991455078125, -1.8306884765625, -1.56146240234375, -1.292236328125, -1.02301025390625, -0.7537841796875, -0.48455810546875, -0.21533203125, 0.05389404296875, 0.3231201171875, 0.59234619140625, 0.861572265625, 1.13079833984375, 1.4000244140625, 1.66925048828125, 1.9384765625, 2.20770263671875, 2.4769287109375, 2.74615478515625, 3.015380859375, 3.28460693359375, 3.5538330078125, 3.82305908203125, 4.09228515625, 4.36151123046875, 4.6307373046875, 4.89996337890625, 5.169189453125, 5.43841552734375, 5.7076416015625, 5.97686767578125, 6.24609375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 0.0, 1.0, 9.0, 19.0, 14.0, 27.0, 55.0, 56.0, 97.0, 154.0, 237.0, 347.0, 447.0, 582.0, 600.0, 461.0, 305.0, 207.0, 145.0, 105.0, 75.0, 40.0, 35.0, 21.0, 12.0, 11.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1484375, -10.869140625, -10.58984375, -10.310546875, -10.03125, -9.751953125, -9.47265625, -9.193359375, -8.9140625, -8.634765625, -8.35546875, -8.076171875, -7.796875, -7.517578125, -7.23828125, -6.958984375, -6.6796875, -6.400390625, -6.12109375, -5.841796875, -5.5625, -5.283203125, -5.00390625, -4.724609375, -4.4453125, -4.166015625, -3.88671875, -3.607421875, -3.328125, -3.048828125, -2.76953125, -2.490234375, -2.2109375, -1.931640625, -1.65234375, -1.373046875, -1.09375, -0.814453125, -0.53515625, -0.255859375, 0.0234375, 0.302734375, 0.58203125, 0.861328125, 1.140625, 1.419921875, 1.69921875, 1.978515625, 2.2578125, 2.537109375, 2.81640625, 3.095703125, 3.375, 3.654296875, 3.93359375, 4.212890625, 4.4921875, 4.771484375, 5.05078125, 5.330078125, 5.609375, 5.888671875, 6.16796875, 6.447265625, 6.7265625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 5.0, 0.0, 8.0, 10.0, 13.0, 16.0, 18.0, 28.0, 51.0, 96.0, 145.0, 215.0, 380.0, 729.0, 1393.0, 3482.0, 11489.0, 57761.0, 432752.0, 2752728.0, 809583.0, 97679.0, 17216.0, 4823.0, 1781.0, 822.0, 443.0, 242.0, 131.0, 91.0, 52.0, 36.0, 22.0, 13.0, 13.0, 9.0, 8.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.75, -9.3193359375, -8.888671875, -8.4580078125, -8.02734375, -7.5966796875, -7.166015625, -6.7353515625, -6.3046875, -5.8740234375, -5.443359375, -5.0126953125, -4.58203125, -4.1513671875, -3.720703125, -3.2900390625, -2.859375, -2.4287109375, -1.998046875, -1.5673828125, -1.13671875, -0.7060546875, -0.275390625, 0.1552734375, 0.5859375, 1.0166015625, 1.447265625, 1.8779296875, 2.30859375, 2.7392578125, 3.169921875, 3.6005859375, 4.03125, 4.4619140625, 4.892578125, 5.3232421875, 5.75390625, 6.1845703125, 6.615234375, 7.0458984375, 7.4765625, 7.9072265625, 8.337890625, 8.7685546875, 9.19921875, 9.6298828125, 10.060546875, 10.4912109375, 10.921875, 11.3525390625, 11.783203125, 12.2138671875, 12.64453125, 13.0751953125, 13.505859375, 13.9365234375, 14.3671875, 14.7978515625, 15.228515625, 15.6591796875, 16.08984375, 16.5205078125, 16.951171875, 17.3818359375, 17.8125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 14.0, 17.0, 36.0, 54.0, 75.0, 114.0, 124.0, 140.0, 120.0, 111.0, 75.0, 61.0, 33.0, 15.0, 13.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-35.715938568115234, -34.05451583862305, -32.393089294433594, -30.731666564941406, -29.070240020751953, -27.408817291259766, -25.747392654418945, -24.085968017578125, -22.424543380737305, -20.763118743896484, -19.101694107055664, -17.440269470214844, -15.77884578704834, -14.11742115020752, -12.455997467041016, -10.794572830200195, -9.133148193359375, -7.471723556518555, -5.810299396514893, -4.1488752365112305, -2.48745059967041, -0.8260259628295898, 0.8353977203369141, 2.4968223571777344, 4.158246994018555, 5.819671630859375, 7.481095790863037, 9.1425199508667, 10.80394458770752, 12.46536922454834, 14.126792907714844, 15.788217544555664, 17.44963836669922, 19.11106300354004, 20.77248764038086, 22.433910369873047, 24.0953369140625, 25.756759643554688, 27.418184280395508, 29.079608917236328, 30.74103355407715, 32.40245819091797, 34.063880920410156, 35.72530746459961, 37.3867301940918, 39.04815673828125, 40.70957946777344, 42.371002197265625, 44.03242874145508, 45.693851470947266, 47.35527801513672, 49.016700744628906, 50.67812728881836, 52.33955001831055, 54.0009765625, 55.66239929199219, 57.323822021484375, 58.98524475097656, 60.646671295166016, 62.3080940246582, 63.969520568847656, 65.63094329833984, 67.29236602783203, 68.95379638671875, 70.61521911621094]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 9.0, 5.0, 8.0, 10.0, 12.0, 11.0, 15.0, 18.0, 17.0, 19.0, 23.0, 19.0, 30.0, 33.0, 34.0, 36.0, 44.0, 34.0, 40.0, 40.0, 35.0, 43.0, 44.0, 59.0, 31.0, 40.0, 29.0, 31.0, 28.0, 28.0, 21.0, 25.0, 22.0, 19.0, 20.0, 14.0, 12.0, 14.0, 7.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-24.386524200439453, -23.668357849121094, -22.950193405151367, -22.232027053833008, -21.51386070251465, -20.795696258544922, -20.077529907226562, -19.359363555908203, -18.641199111938477, -17.923032760620117, -17.20486831665039, -16.48670196533203, -15.768536567687988, -15.050371170043945, -14.332204818725586, -13.614039421081543, -12.895873069763184, -12.17770767211914, -11.459541320800781, -10.741375923156738, -10.023210525512695, -9.305044174194336, -8.586878776550293, -7.86871337890625, -7.150547504425049, -6.432381629943848, -5.714216232299805, -4.9960503578186035, -4.277884483337402, -3.5597190856933594, -2.841553211212158, -2.1233878135681152, -1.405221939086914, -0.6870562434196472, 0.03110945224761963, 0.7492752075195312, 1.4674408435821533, 2.1856064796447754, 2.9037723541259766, 3.6219377517700195, 4.340103626251221, 5.058269500732422, 5.776434898376465, 6.494600772857666, 7.212766647338867, 7.93093204498291, 8.649097442626953, 9.367263793945312, 10.085429191589355, 10.803594589233398, 11.521760940551758, 12.2399263381958, 12.958091735839844, 13.676258087158203, 14.394423484802246, 15.112588882446289, 15.830755233764648, 16.548921585083008, 17.267086029052734, 17.985252380371094, 18.703418731689453, 19.42158317565918, 20.13974952697754, 20.857913970947266, 21.576080322265625]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 7.0, 6.0, 8.0, 8.0, 6.0, 13.0, 18.0, 20.0, 16.0, 24.0, 33.0, 38.0, 40.0, 53.0, 43.0, 53.0, 55.0, 62.0, 54.0, 46.0, 45.0, 47.0, 36.0, 44.0, 44.0, 36.0, 23.0, 28.0, 28.0, 16.0, 12.0, 13.0, 13.0, 2.0, 7.0, 6.0, 3.0, 1.0, 1.0, 2.0], "bins": [-3.560546875, -3.4758453369140625, -3.391143798828125, -3.3064422607421875, -3.22174072265625, -3.1370391845703125, -3.052337646484375, -2.9676361083984375, -2.8829345703125, -2.7982330322265625, -2.713531494140625, -2.6288299560546875, -2.54412841796875, -2.4594268798828125, -2.374725341796875, -2.2900238037109375, -2.205322265625, -2.1206207275390625, -2.035919189453125, -1.9512176513671875, -1.86651611328125, -1.7818145751953125, -1.697113037109375, -1.6124114990234375, -1.5277099609375, -1.4430084228515625, -1.358306884765625, -1.2736053466796875, -1.18890380859375, -1.1042022705078125, -1.019500732421875, -0.9347991943359375, -0.85009765625, -0.7653961181640625, -0.680694580078125, -0.5959930419921875, -0.51129150390625, -0.4265899658203125, -0.341888427734375, -0.2571868896484375, -0.1724853515625, -0.0877838134765625, -0.003082275390625, 0.0816192626953125, 0.16632080078125, 0.2510223388671875, 0.335723876953125, 0.4204254150390625, 0.505126953125, 0.5898284912109375, 0.674530029296875, 0.7592315673828125, 0.84393310546875, 0.9286346435546875, 1.013336181640625, 1.0980377197265625, 1.1827392578125, 1.2674407958984375, 1.352142333984375, 1.4368438720703125, 1.52154541015625, 1.6062469482421875, 1.690948486328125, 1.7756500244140625, 1.8603515625]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 4.0, 7.0, 18.0, 18.0, 42.0, 42.0, 66.0, 148.0, 197.0, 375.0, 695.0, 1200.0, 2033.0, 3673.0, 6664.0, 12229.0, 23275.0, 46202.0, 100237.0, 252107.0, 339586.0, 136093.0, 60524.0, 29384.0, 15252.0, 8037.0, 4461.0, 2533.0, 1430.0, 835.0, 464.0, 284.0, 168.0, 88.0, 65.0, 34.0, 24.0, 14.0, 13.0, 5.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0264739990234375, -0.02567601203918457, -0.02487802505493164, -0.02408003807067871, -0.02328205108642578, -0.02248406410217285, -0.021686077117919922, -0.020888090133666992, -0.020090103149414062, -0.019292116165161133, -0.018494129180908203, -0.017696142196655273, -0.016898155212402344, -0.016100168228149414, -0.015302181243896484, -0.014504194259643555, -0.013706207275390625, -0.012908220291137695, -0.012110233306884766, -0.011312246322631836, -0.010514259338378906, -0.009716272354125977, -0.008918285369873047, -0.008120298385620117, -0.0073223114013671875, -0.006524324417114258, -0.005726337432861328, -0.0049283504486083984, -0.004130363464355469, -0.003332376480102539, -0.0025343894958496094, -0.0017364025115966797, -0.00093841552734375, -0.0001404285430908203, 0.0006575584411621094, 0.001455545425415039, 0.0022535324096679688, 0.0030515193939208984, 0.003849506378173828, 0.004647493362426758, 0.0054454803466796875, 0.006243467330932617, 0.007041454315185547, 0.007839441299438477, 0.008637428283691406, 0.009435415267944336, 0.010233402252197266, 0.011031389236450195, 0.011829376220703125, 0.012627363204956055, 0.013425350189208984, 0.014223337173461914, 0.015021324157714844, 0.015819311141967773, 0.016617298126220703, 0.017415285110473633, 0.018213272094726562, 0.019011259078979492, 0.019809246063232422, 0.02060723304748535, 0.02140522003173828, 0.02220320701599121, 0.02300119400024414, 0.02379918098449707, 0.02459716796875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 2.0, 5.0, 7.0, 9.0, 8.0, 10.0, 11.0, 19.0, 20.0, 16.0, 30.0, 21.0, 38.0, 29.0, 22.0, 27.0, 39.0, 41.0, 31.0, 51.0, 54.0, 1072.0, 36.0, 42.0, 44.0, 30.0, 42.0, 26.0, 34.0, 17.0, 23.0, 32.0, 18.0, 21.0, 23.0, 19.0, 9.0, 10.0, 12.0, 6.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.673828125, -1.62078857421875, -1.5677490234375, -1.51470947265625, -1.461669921875, -1.40863037109375, -1.3555908203125, -1.30255126953125, -1.24951171875, -1.19647216796875, -1.1434326171875, -1.09039306640625, -1.037353515625, -0.98431396484375, -0.9312744140625, -0.87823486328125, -0.8251953125, -0.77215576171875, -0.7191162109375, -0.66607666015625, -0.613037109375, -0.55999755859375, -0.5069580078125, -0.45391845703125, -0.40087890625, -0.34783935546875, -0.2947998046875, -0.24176025390625, -0.188720703125, -0.13568115234375, -0.0826416015625, -0.02960205078125, 0.0234375, 0.07647705078125, 0.1295166015625, 0.18255615234375, 0.235595703125, 0.28863525390625, 0.3416748046875, 0.39471435546875, 0.44775390625, 0.50079345703125, 0.5538330078125, 0.60687255859375, 0.659912109375, 0.71295166015625, 0.7659912109375, 0.81903076171875, 0.8720703125, 0.92510986328125, 0.9781494140625, 1.03118896484375, 1.084228515625, 1.13726806640625, 1.1903076171875, 1.24334716796875, 1.29638671875, 1.34942626953125, 1.4024658203125, 1.45550537109375, 1.508544921875, 1.56158447265625, 1.6146240234375, 1.66766357421875, 1.720703125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 5.0, 5.0, 5.0, 6.0, 3.0, 19.0, 24.0, 40.0, 65.0, 88.0, 99.0, 174.0, 230.0, 341.0, 516.0, 730.0, 1134.0, 1712.0, 2593.0, 3898.0, 5938.0, 8976.0, 14274.0, 21864.0, 34276.0, 53709.0, 85772.0, 143603.0, 1264873.0, 172471.0, 102471.0, 63815.0, 40097.0, 25912.0, 16534.0, 10467.0, 6966.0, 4455.0, 2943.0, 1984.0, 1362.0, 816.0, 585.0, 396.0, 306.0, 178.0, 123.0, 86.0, 81.0, 46.0, 24.0, 15.0, 9.0, 6.0, 8.0, 6.0, 4.0, 4.0, 2.0, 1.0], "bins": [-0.0065155029296875, -0.006316125392913818, -0.006116747856140137, -0.005917370319366455, -0.0057179927825927734, -0.005518615245819092, -0.00531923770904541, -0.0051198601722717285, -0.004920482635498047, -0.004721105098724365, -0.004521727561950684, -0.004322350025177002, -0.00412297248840332, -0.003923594951629639, -0.003724217414855957, -0.0035248398780822754, -0.0033254623413085938, -0.003126084804534912, -0.0029267072677612305, -0.002727329730987549, -0.002527952194213867, -0.0023285746574401855, -0.002129197120666504, -0.0019298195838928223, -0.0017304420471191406, -0.001531064510345459, -0.0013316869735717773, -0.0011323094367980957, -0.0009329319000244141, -0.0007335543632507324, -0.0005341768264770508, -0.00033479928970336914, -0.0001354217529296875, 6.395578384399414e-05, 0.0002633333206176758, 0.0004627108573913574, 0.0006620883941650391, 0.0008614659309387207, 0.0010608434677124023, 0.001260221004486084, 0.0014595985412597656, 0.0016589760780334473, 0.001858353614807129, 0.0020577311515808105, 0.002257108688354492, 0.002456486225128174, 0.0026558637619018555, 0.002855241298675537, 0.0030546188354492188, 0.0032539963722229004, 0.003453373908996582, 0.0036527514457702637, 0.0038521289825439453, 0.004051506519317627, 0.004250884056091309, 0.00445026159286499, 0.004649639129638672, 0.0048490166664123535, 0.005048394203186035, 0.005247771739959717, 0.0054471492767333984, 0.00564652681350708, 0.005845904350280762, 0.006045281887054443, 0.006244659423828125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 8.0, 0.0, 0.0, 11.0, 0.0, 0.0, 0.0, 15.0, 0.0, 0.0, 15.0, 0.0, 0.0, 30.0, 0.0, 0.0, 67.0, 0.0, 0.0, 123.0, 0.0, 0.0, 0.0, 456.0, 0.0, 0.0, 159.0, 0.0, 0.0, 53.0, 0.0, 0.0, 34.0, 0.0, 0.0, 17.0, 0.0, 0.0, 0.0, 17.0, 0.0, 0.0, 8.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539062e-07, -5.774199962615967e-07, -5.587935447692871e-07, -5.401670932769775e-07, -5.21540641784668e-07, -5.029141902923584e-07, -4.842877388000488e-07, -4.6566128730773926e-07, -4.470348358154297e-07, -4.284083843231201e-07, -4.0978193283081055e-07, -3.91155481338501e-07, -3.725290298461914e-07, -3.5390257835388184e-07, -3.3527612686157227e-07, -3.166496753692627e-07, -2.980232238769531e-07, -2.7939677238464355e-07, -2.60770320892334e-07, -2.421438694000244e-07, -2.2351741790771484e-07, -2.0489096641540527e-07, -1.862645149230957e-07, -1.6763806343078613e-07, -1.4901161193847656e-07, -1.30385160446167e-07, -1.1175870895385742e-07, -9.313225746154785e-08, -7.450580596923828e-08, -5.587935447692871e-08, -3.725290298461914e-08, -1.862645149230957e-08, 0.0, 1.862645149230957e-08, 3.725290298461914e-08, 5.587935447692871e-08, 7.450580596923828e-08, 9.313225746154785e-08, 1.1175870895385742e-07, 1.30385160446167e-07, 1.4901161193847656e-07, 1.6763806343078613e-07, 1.862645149230957e-07, 2.0489096641540527e-07, 2.2351741790771484e-07, 2.421438694000244e-07, 2.60770320892334e-07, 2.7939677238464355e-07, 2.980232238769531e-07, 3.166496753692627e-07, 3.3527612686157227e-07, 3.5390257835388184e-07, 3.725290298461914e-07, 3.91155481338501e-07, 4.0978193283081055e-07, 4.284083843231201e-07, 4.470348358154297e-07, 4.6566128730773926e-07, 4.842877388000488e-07, 5.029141902923584e-07, 5.21540641784668e-07, 5.401670932769775e-07, 5.587935447692871e-07, 5.774199962615967e-07, 5.960464477539062e-07]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 9.0, 5.0, 12.0, 10.0, 7.0, 18.0, 10.0, 14.0, 14.0, 23.0, 32.0, 33.0, 36.0, 35.0, 82.0, 74.0, 132.0, 211.0, 684.0, 3215.0, 94573.0, 925283.0, 20795.0, 2193.0, 395.0, 144.0, 90.0, 104.0, 57.0, 42.0, 35.0, 32.0, 22.0, 26.0, 15.0, 13.0, 16.0, 9.0, 14.0, 7.0, 8.0, 6.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.119510650634766e-06, -8.837319910526276e-06, -8.555129170417786e-06, -8.272938430309296e-06, -7.990747690200806e-06, -7.708556950092316e-06, -7.426366209983826e-06, -7.144175469875336e-06, -6.861984729766846e-06, -6.579793989658356e-06, -6.297603249549866e-06, -6.015412509441376e-06, -5.733221769332886e-06, -5.451031029224396e-06, -5.168840289115906e-06, -4.886649549007416e-06, -4.604458808898926e-06, -4.322268068790436e-06, -4.040077328681946e-06, -3.757886588573456e-06, -3.475695848464966e-06, -3.193505108356476e-06, -2.911314368247986e-06, -2.629123628139496e-06, -2.346932888031006e-06, -2.064742147922516e-06, -1.7825514078140259e-06, -1.5003606677055359e-06, -1.218169927597046e-06, -9.359791874885559e-07, -6.537884473800659e-07, -3.7159770727157593e-07, -8.940696716308594e-08, 1.9278377294540405e-07, 4.7497451305389404e-07, 7.57165253162384e-07, 1.039355993270874e-06, 1.321546733379364e-06, 1.603737473487854e-06, 1.885928213596344e-06, 2.168118953704834e-06, 2.450309693813324e-06, 2.732500433921814e-06, 3.014691174030304e-06, 3.296881914138794e-06, 3.579072654247284e-06, 3.861263394355774e-06, 4.143454134464264e-06, 4.425644874572754e-06, 4.707835614681244e-06, 4.990026354789734e-06, 5.272217094898224e-06, 5.554407835006714e-06, 5.836598575115204e-06, 6.118789315223694e-06, 6.400980055332184e-06, 6.683170795440674e-06, 6.965361535549164e-06, 7.247552275657654e-06, 7.529743015766144e-06, 7.811933755874634e-06, 8.094124495983124e-06, 8.376315236091614e-06, 8.658505976200104e-06, 8.940696716308594e-06]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 15.0, 33.0, 60.0, 118.0, 434.0, 136.0, 95.0, 52.0, 33.0, 14.0, 9.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.125636799770291e-06, -1.0994504009431694e-06, -1.0732640021160478e-06, -1.0470774896020885e-06, -1.0208910907749669e-06, -9.947046919478453e-07, -9.685182931207237e-07, -9.423318374501832e-07, -9.161453817796428e-07, -8.899589829525212e-07, -8.637725272819807e-07, -8.375861284548591e-07, -8.113996727843187e-07, -7.852132739571971e-07, -7.590268751300755e-07, -7.32840419459535e-07, -7.066540206324134e-07, -6.804676218052919e-07, -6.542811661347514e-07, -6.280947673076298e-07, -6.019083116370894e-07, -5.757219128099678e-07, -5.495354571394273e-07, -5.233490583123057e-07, -4.971626594851841e-07, -4.709762322363531e-07, -4.447898049875221e-07, -4.186034061604005e-07, -3.9241695048986003e-07, -3.6623055166273843e-07, -3.400441244139074e-07, -3.138576971650764e-07, -2.8767124149453593e-07, -2.614848142457049e-07, -2.352983869968739e-07, -2.0911197395889758e-07, -1.8292554671006656e-07, -1.5673911946123553e-07, -1.3055270642325922e-07, -1.043662791744282e-07, -7.817985192559718e-08, -5.199342822947983e-08, -2.5807004533362488e-08, 3.794156100411783e-10, 2.6565842858872202e-08, 5.2752270107703225e-08, 7.893868314567953e-08, 1.0512511039451056e-07, 1.3131153764334158e-07, 1.574979648921726e-07, 1.8368439214100363e-07, 2.0987080517897994e-07, 2.3605723242781096e-07, 2.6224364546578727e-07, 2.884300727146183e-07, 3.146164999634493e-07, 3.4080292721228034e-07, 3.6698935446111136e-07, 3.931757817099424e-07, 4.193622089587734e-07, 4.45548607785895e-07, 4.7173506345643546e-07, 4.97921462283557e-07, 5.241079179540975e-07, 5.502943167812191e-07]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 17.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 204.0, 0.0, 0.0, 0.0, 0.0, 0.0, 420.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 228.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.384185791015625e-07, -2.2910535335540771e-07, -2.1979212760925293e-07, -2.1047890186309814e-07, -2.0116567611694336e-07, -1.9185245037078857e-07, -1.825392246246338e-07, -1.73225998878479e-07, -1.6391277313232422e-07, -1.5459954738616943e-07, -1.4528632164001465e-07, -1.3597309589385986e-07, -1.2665987014770508e-07, -1.1734664440155029e-07, -1.0803341865539551e-07, -9.872019290924072e-08, -8.940696716308594e-08, -8.009374141693115e-08, -7.078051567077637e-08, -6.146728992462158e-08, -5.21540641784668e-08, -4.284083843231201e-08, -3.3527612686157227e-08, -2.421438694000244e-08, -1.4901161193847656e-08, -5.587935447692871e-09, 3.725290298461914e-09, 1.30385160446167e-08, 2.2351741790771484e-08, 3.166496753692627e-08, 4.0978193283081055e-08, 5.029141902923584e-08, 5.960464477539063e-08, 6.891787052154541e-08, 7.82310962677002e-08, 8.754432201385498e-08, 9.685754776000977e-08, 1.0617077350616455e-07, 1.1548399925231934e-07, 1.2479722499847412e-07, 1.341104507446289e-07, 1.434236764907837e-07, 1.5273690223693848e-07, 1.6205012798309326e-07, 1.7136335372924805e-07, 1.8067657947540283e-07, 1.8998980522155762e-07, 1.993030309677124e-07, 2.086162567138672e-07, 2.1792948246002197e-07, 2.2724270820617676e-07, 2.3655593395233154e-07, 2.4586915969848633e-07, 2.551823854446411e-07, 2.644956111907959e-07, 2.738088369369507e-07, 2.8312206268310547e-07, 2.9243528842926025e-07, 3.0174851417541504e-07, 3.110617399215698e-07, 3.203749656677246e-07, 3.296881914138794e-07, 3.390014171600342e-07, 3.4831464290618896e-07, 3.5762786865234375e-07]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 7.0, 6.0, 8.0, 8.0, 6.0, 13.0, 18.0, 20.0, 16.0, 24.0, 33.0, 38.0, 40.0, 53.0, 43.0, 53.0, 55.0, 62.0, 54.0, 46.0, 45.0, 47.0, 36.0, 44.0, 44.0, 36.0, 23.0, 28.0, 28.0, 16.0, 12.0, 13.0, 13.0, 2.0, 7.0, 6.0, 3.0, 1.0, 1.0, 2.0], "bins": [-3.560546875, -3.4758453369140625, -3.391143798828125, -3.3064422607421875, -3.22174072265625, -3.1370391845703125, -3.052337646484375, -2.9676361083984375, -2.8829345703125, -2.7982330322265625, -2.713531494140625, -2.6288299560546875, -2.54412841796875, -2.4594268798828125, -2.374725341796875, -2.2900238037109375, -2.205322265625, -2.1206207275390625, -2.035919189453125, -1.9512176513671875, -1.86651611328125, -1.7818145751953125, -1.697113037109375, -1.6124114990234375, -1.5277099609375, -1.4430084228515625, -1.358306884765625, -1.2736053466796875, -1.18890380859375, -1.1042022705078125, -1.019500732421875, -0.9347991943359375, -0.85009765625, -0.7653961181640625, -0.680694580078125, -0.5959930419921875, -0.51129150390625, -0.4265899658203125, -0.341888427734375, -0.2571868896484375, -0.1724853515625, -0.0877838134765625, -0.003082275390625, 0.0816192626953125, 0.16632080078125, 0.2510223388671875, 0.335723876953125, 0.4204254150390625, 0.505126953125, 0.5898284912109375, 0.674530029296875, 0.7592315673828125, 0.84393310546875, 0.9286346435546875, 1.013336181640625, 1.0980377197265625, 1.1827392578125, 1.2674407958984375, 1.352142333984375, 1.4368438720703125, 1.52154541015625, 1.6062469482421875, 1.690948486328125, 1.7756500244140625, 1.8603515625]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 7.0, 9.0, 18.0, 22.0, 28.0, 55.0, 74.0, 116.0, 189.0, 317.0, 498.0, 822.0, 1418.0, 2444.0, 4112.0, 7767.0, 14554.0, 29042.0, 64633.0, 229951.0, 494509.0, 110647.0, 42539.0, 20672.0, 10611.0, 5642.0, 3144.0, 1902.0, 1047.0, 635.0, 420.0, 238.0, 172.0, 107.0, 60.0, 45.0, 27.0, 21.0, 13.0, 9.0, 2.0, 4.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0], "bins": [-3.91015625, -3.80230712890625, -3.6944580078125, -3.58660888671875, -3.478759765625, -3.37091064453125, -3.2630615234375, -3.15521240234375, -3.04736328125, -2.93951416015625, -2.8316650390625, -2.72381591796875, -2.615966796875, -2.50811767578125, -2.4002685546875, -2.29241943359375, -2.1845703125, -2.07672119140625, -1.9688720703125, -1.86102294921875, -1.753173828125, -1.64532470703125, -1.5374755859375, -1.42962646484375, -1.32177734375, -1.21392822265625, -1.1060791015625, -0.99822998046875, -0.890380859375, -0.78253173828125, -0.6746826171875, -0.56683349609375, -0.458984375, -0.35113525390625, -0.2432861328125, -0.13543701171875, -0.027587890625, 0.08026123046875, 0.1881103515625, 0.29595947265625, 0.40380859375, 0.51165771484375, 0.6195068359375, 0.72735595703125, 0.835205078125, 0.94305419921875, 1.0509033203125, 1.15875244140625, 1.2666015625, 1.37445068359375, 1.4822998046875, 1.59014892578125, 1.697998046875, 1.80584716796875, 1.9136962890625, 2.02154541015625, 2.12939453125, 2.23724365234375, 2.3450927734375, 2.45294189453125, 2.560791015625, 2.66864013671875, 2.7764892578125, 2.88433837890625, 2.9921875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 7.0, 2.0, 7.0, 10.0, 6.0, 10.0, 12.0, 16.0, 22.0, 21.0, 33.0, 35.0, 35.0, 12.0, 43.0, 40.0, 40.0, 55.0, 103.0, 181.0, 1501.0, 283.0, 113.0, 54.0, 48.0, 40.0, 47.0, 44.0, 24.0, 36.0, 21.0, 23.0, 19.0, 16.0, 18.0, 13.0, 11.0, 8.0, 9.0, 7.0, 6.0, 4.0, 5.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-7.88671875, -7.64593505859375, -7.4051513671875, -7.16436767578125, -6.923583984375, -6.68280029296875, -6.4420166015625, -6.20123291015625, -5.96044921875, -5.71966552734375, -5.4788818359375, -5.23809814453125, -4.997314453125, -4.75653076171875, -4.5157470703125, -4.27496337890625, -4.0341796875, -3.79339599609375, -3.5526123046875, -3.31182861328125, -3.071044921875, -2.83026123046875, -2.5894775390625, -2.34869384765625, -2.10791015625, -1.86712646484375, -1.6263427734375, -1.38555908203125, -1.144775390625, -0.90399169921875, -0.6632080078125, -0.42242431640625, -0.181640625, 0.05914306640625, 0.2999267578125, 0.54071044921875, 0.781494140625, 1.02227783203125, 1.2630615234375, 1.50384521484375, 1.74462890625, 1.98541259765625, 2.2261962890625, 2.46697998046875, 2.707763671875, 2.94854736328125, 3.1893310546875, 3.43011474609375, 3.6708984375, 3.91168212890625, 4.1524658203125, 4.39324951171875, 4.634033203125, 4.87481689453125, 5.1156005859375, 5.35638427734375, 5.59716796875, 5.83795166015625, 6.0787353515625, 6.31951904296875, 6.560302734375, 6.80108642578125, 7.0418701171875, 7.28265380859375, 7.5234375]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 4.0, 3.0, 3.0, 9.0, 7.0, 7.0, 7.0, 13.0, 12.0, 7.0, 25.0, 19.0, 34.0, 37.0, 40.0, 67.0, 85.0, 147.0, 214.0, 480.0, 1525.0, 7339.0, 56584.0, 2559039.0, 489275.0, 24924.0, 3886.0, 959.0, 338.0, 155.0, 128.0, 71.0, 46.0, 48.0, 39.0, 27.0, 18.0, 21.0, 15.0, 12.0, 7.0, 7.0, 4.0, 7.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.1484375, -10.8087158203125, -10.468994140625, -10.1292724609375, -9.78955078125, -9.4498291015625, -9.110107421875, -8.7703857421875, -8.4306640625, -8.0909423828125, -7.751220703125, -7.4114990234375, -7.07177734375, -6.7320556640625, -6.392333984375, -6.0526123046875, -5.712890625, -5.3731689453125, -5.033447265625, -4.6937255859375, -4.35400390625, -4.0142822265625, -3.674560546875, -3.3348388671875, -2.9951171875, -2.6553955078125, -2.315673828125, -1.9759521484375, -1.63623046875, -1.2965087890625, -0.956787109375, -0.6170654296875, -0.27734375, 0.0623779296875, 0.402099609375, 0.7418212890625, 1.08154296875, 1.4212646484375, 1.760986328125, 2.1007080078125, 2.4404296875, 2.7801513671875, 3.119873046875, 3.4595947265625, 3.79931640625, 4.1390380859375, 4.478759765625, 4.8184814453125, 5.158203125, 5.4979248046875, 5.837646484375, 6.1773681640625, 6.51708984375, 6.8568115234375, 7.196533203125, 7.5362548828125, 7.8759765625, 8.2156982421875, 8.555419921875, 8.8951416015625, 9.23486328125, 9.5745849609375, 9.914306640625, 10.2540283203125, 10.59375]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 42.0, 259.0, 474.0, 211.0, 23.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-109.1397933959961, -107.01485443115234, -104.8899154663086, -102.76497650146484, -100.6400375366211, -98.51509094238281, -96.39015197753906, -94.26521301269531, -92.14027404785156, -90.01533508300781, -87.89039611816406, -85.76545715332031, -83.64051818847656, -81.51557922363281, -79.39064025878906, -77.26569366455078, -75.14076232910156, -73.01582336425781, -70.89088439941406, -68.76594543457031, -66.64100646972656, -64.51606750488281, -62.3911247253418, -60.26618576049805, -58.14124298095703, -56.01630401611328, -53.89136505126953, -51.76642608642578, -49.641483306884766, -47.516544342041016, -45.391605377197266, -43.266666412353516, -41.141727447509766, -39.016788482666016, -36.891849517822266, -34.76690673828125, -32.6419677734375, -30.51702880859375, -28.39208984375, -26.26715087890625, -24.142210006713867, -22.017271041870117, -19.892330169677734, -17.767391204833984, -15.642451286315918, -13.517511367797852, -11.392572402954102, -9.267632484436035, -7.142692565917969, -5.017752647399902, -2.892813205718994, -0.7678737640380859, 1.3570661544799805, 3.482006072998047, 5.606945037841797, 7.731884956359863, 9.85682487487793, 11.981764793395996, 14.106704711914062, 16.231643676757812, 18.356582641601562, 20.481523513793945, 22.606462478637695, 24.731403350830078, 26.856342315673828]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 10.0, 5.0, 9.0, 10.0, 9.0, 17.0, 12.0, 12.0, 32.0, 20.0, 27.0, 31.0, 29.0, 35.0, 42.0, 40.0, 29.0, 43.0, 53.0, 42.0, 39.0, 44.0, 40.0, 39.0, 37.0, 34.0, 31.0, 32.0, 31.0, 28.0, 22.0, 18.0, 22.0, 12.0, 13.0, 9.0, 5.0, 11.0, 5.0, 6.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.180843353271484, -27.292997360229492, -26.405149459838867, -25.517303466796875, -24.62945556640625, -23.741609573364258, -22.853761672973633, -21.96591567993164, -21.078067779541016, -20.190221786499023, -19.3023738861084, -18.414527893066406, -17.52667999267578, -16.63883399963379, -15.750986099243164, -14.863140106201172, -13.975293159484863, -13.087446212768555, -12.199599266052246, -11.311752319335938, -10.423905372619629, -9.53605842590332, -8.648212432861328, -7.760365009307861, -6.872518062591553, -5.984671115875244, -5.0968241691589355, -4.208977699279785, -3.3211305141448975, -2.433283805847168, -1.5454368591308594, -0.6575899124145508, 0.2302570343017578, 1.1181039810180664, 2.005950927734375, 2.8937976360321045, 3.781644582748413, 4.669491291046143, 5.557338237762451, 6.44518518447876, 7.333032131195068, 8.220878601074219, 9.108725547790527, 9.996572494506836, 10.884419441223145, 11.772266387939453, 12.660113334655762, 13.54796028137207, 14.435807228088379, 15.323654174804688, 16.21150016784668, 17.099348068237305, 17.987194061279297, 18.875041961669922, 19.762887954711914, 20.65073585510254, 21.53858184814453, 22.426427841186523, 23.31427574157715, 24.20212173461914, 25.089969635009766, 25.977815628051758, 26.865663528442383, 27.753509521484375, 28.641357421875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 6.0, 8.0, 9.0, 6.0, 8.0, 14.0, 21.0, 13.0, 25.0, 23.0, 32.0, 31.0, 43.0, 44.0, 58.0, 42.0, 52.0, 63.0, 55.0, 54.0, 49.0, 31.0, 40.0, 46.0, 37.0, 37.0, 32.0, 25.0, 28.0, 17.0, 8.0, 17.0, 6.0, 8.0, 8.0, 6.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.49609375, -3.410919189453125, -3.32574462890625, -3.240570068359375, -3.1553955078125, -3.070220947265625, -2.98504638671875, -2.899871826171875, -2.814697265625, -2.729522705078125, -2.64434814453125, -2.559173583984375, -2.4739990234375, -2.388824462890625, -2.30364990234375, -2.218475341796875, -2.13330078125, -2.048126220703125, -1.96295166015625, -1.877777099609375, -1.7926025390625, -1.707427978515625, -1.62225341796875, -1.537078857421875, -1.451904296875, -1.366729736328125, -1.28155517578125, -1.196380615234375, -1.1112060546875, -1.026031494140625, -0.94085693359375, -0.855682373046875, -0.7705078125, -0.685333251953125, -0.60015869140625, -0.514984130859375, -0.4298095703125, -0.344635009765625, -0.25946044921875, -0.174285888671875, -0.089111328125, -0.003936767578125, 0.08123779296875, 0.166412353515625, 0.2515869140625, 0.336761474609375, 0.42193603515625, 0.507110595703125, 0.59228515625, 0.677459716796875, 0.76263427734375, 0.847808837890625, 0.9329833984375, 1.018157958984375, 1.10333251953125, 1.188507080078125, 1.273681640625, 1.358856201171875, 1.44403076171875, 1.529205322265625, 1.6143798828125, 1.699554443359375, 1.78472900390625, 1.869903564453125, 1.955078125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 9.0, 4.0, 7.0, 6.0, 13.0, 14.0, 20.0, 25.0, 31.0, 53.0, 82.0, 153.0, 281.0, 641.0, 1794.0, 5829.0, 23584.0, 130019.0, 1330826.0, 2416278.0, 234868.0, 37435.0, 8399.0, 2366.0, 765.0, 322.0, 176.0, 91.0, 48.0, 39.0, 33.0, 20.0, 19.0, 10.0, 9.0, 10.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.828125, -10.54425048828125, -10.2603759765625, -9.97650146484375, -9.692626953125, -9.40875244140625, -9.1248779296875, -8.84100341796875, -8.55712890625, -8.27325439453125, -7.9893798828125, -7.70550537109375, -7.421630859375, -7.13775634765625, -6.8538818359375, -6.57000732421875, -6.2861328125, -6.00225830078125, -5.7183837890625, -5.43450927734375, -5.150634765625, -4.86676025390625, -4.5828857421875, -4.29901123046875, -4.01513671875, -3.73126220703125, -3.4473876953125, -3.16351318359375, -2.879638671875, -2.59576416015625, -2.3118896484375, -2.02801513671875, -1.744140625, -1.46026611328125, -1.1763916015625, -0.89251708984375, -0.608642578125, -0.32476806640625, -0.0408935546875, 0.24298095703125, 0.52685546875, 0.81072998046875, 1.0946044921875, 1.37847900390625, 1.662353515625, 1.94622802734375, 2.2301025390625, 2.51397705078125, 2.7978515625, 3.08172607421875, 3.3656005859375, 3.64947509765625, 3.933349609375, 4.21722412109375, 4.5010986328125, 4.78497314453125, 5.06884765625, 5.35272216796875, 5.6365966796875, 5.92047119140625, 6.204345703125, 6.48822021484375, 6.7720947265625, 7.05596923828125, 7.33984375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 12.0, 16.0, 28.0, 44.0, 48.0, 62.0, 108.0, 163.0, 233.0, 392.0, 567.0, 672.0, 528.0, 401.0, 272.0, 195.0, 114.0, 83.0, 57.0, 26.0, 18.0, 10.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5234375, -10.2269287109375, -9.930419921875, -9.6339111328125, -9.33740234375, -9.0408935546875, -8.744384765625, -8.4478759765625, -8.1513671875, -7.8548583984375, -7.558349609375, -7.2618408203125, -6.96533203125, -6.6688232421875, -6.372314453125, -6.0758056640625, -5.779296875, -5.4827880859375, -5.186279296875, -4.8897705078125, -4.59326171875, -4.2967529296875, -4.000244140625, -3.7037353515625, -3.4072265625, -3.1107177734375, -2.814208984375, -2.5177001953125, -2.22119140625, -1.9246826171875, -1.628173828125, -1.3316650390625, -1.03515625, -0.7386474609375, -0.442138671875, -0.1456298828125, 0.15087890625, 0.4473876953125, 0.743896484375, 1.0404052734375, 1.3369140625, 1.6334228515625, 1.929931640625, 2.2264404296875, 2.52294921875, 2.8194580078125, 3.115966796875, 3.4124755859375, 3.708984375, 4.0054931640625, 4.302001953125, 4.5985107421875, 4.89501953125, 5.1915283203125, 5.488037109375, 5.7845458984375, 6.0810546875, 6.3775634765625, 6.674072265625, 6.9705810546875, 7.26708984375, 7.5635986328125, 7.860107421875, 8.1566162109375, 8.453125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 11.0, 14.0, 16.0, 29.0, 49.0, 97.0, 122.0, 274.0, 636.0, 1405.0, 4200.0, 17776.0, 128007.0, 1645270.0, 2195144.0, 171556.0, 21964.0, 4905.0, 1488.0, 625.0, 307.0, 167.0, 83.0, 56.0, 26.0, 22.0, 11.0, 5.0, 6.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.8515625, -13.3397216796875, -12.827880859375, -12.3160400390625, -11.80419921875, -11.2923583984375, -10.780517578125, -10.2686767578125, -9.7568359375, -9.2449951171875, -8.733154296875, -8.2213134765625, -7.70947265625, -7.1976318359375, -6.685791015625, -6.1739501953125, -5.662109375, -5.1502685546875, -4.638427734375, -4.1265869140625, -3.61474609375, -3.1029052734375, -2.591064453125, -2.0792236328125, -1.5673828125, -1.0555419921875, -0.543701171875, -0.0318603515625, 0.47998046875, 0.9918212890625, 1.503662109375, 2.0155029296875, 2.52734375, 3.0391845703125, 3.551025390625, 4.0628662109375, 4.57470703125, 5.0865478515625, 5.598388671875, 6.1102294921875, 6.6220703125, 7.1339111328125, 7.645751953125, 8.1575927734375, 8.66943359375, 9.1812744140625, 9.693115234375, 10.2049560546875, 10.716796875, 11.2286376953125, 11.740478515625, 12.2523193359375, 12.76416015625, 13.2760009765625, 13.787841796875, 14.2996826171875, 14.8115234375, 15.3233642578125, 15.835205078125, 16.3470458984375, 16.85888671875, 17.3707275390625, 17.882568359375, 18.3944091796875, 18.90625]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 11.0, 18.0, 39.0, 75.0, 127.0, 140.0, 179.0, 157.0, 125.0, 71.0, 40.0, 17.0, 5.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.4660873413086, -87.30715942382812, -85.14822387695312, -82.98929595947266, -80.83036041259766, -78.67143249511719, -76.51249694824219, -74.35356903076172, -72.19463348388672, -70.03570556640625, -67.87677001953125, -65.71784210205078, -63.55890655517578, -61.39997482299805, -59.24104309082031, -57.082115173339844, -54.92318344116211, -52.764251708984375, -50.60531997680664, -48.446388244628906, -46.28745651245117, -44.12852478027344, -41.96959686279297, -39.81066131591797, -37.6517333984375, -35.492801666259766, -33.33386993408203, -31.174938201904297, -29.016006469726562, -26.857074737548828, -24.698144912719727, -22.539213180541992, -20.38028335571289, -18.221351623535156, -16.062419891357422, -13.903489112854004, -11.74455738067627, -9.585625648498535, -7.426694869995117, -5.267763137817383, -3.1088314056396484, -0.9498999118804932, 1.209031581878662, 3.3679628372192383, 5.526894569396973, 7.685826301574707, 9.844757080078125, 12.00368881225586, 14.162620544433594, 16.321552276611328, 18.480484008789062, 20.639415740966797, 22.79834747314453, 24.957279205322266, 27.116209030151367, 29.2751407623291, 31.434072494506836, 33.59300231933594, 35.75193405151367, 37.910865783691406, 40.06979751586914, 42.228729248046875, 44.38766098022461, 46.546592712402344, 48.70552444458008]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 6.0, 5.0, 2.0, 11.0, 9.0, 11.0, 17.0, 11.0, 6.0, 19.0, 19.0, 24.0, 26.0, 19.0, 43.0, 36.0, 32.0, 42.0, 29.0, 40.0, 41.0, 32.0, 43.0, 39.0, 41.0, 30.0, 42.0, 34.0, 36.0, 31.0, 33.0, 27.0, 23.0, 27.0, 17.0, 22.0, 7.0, 18.0, 7.0, 8.0, 11.0, 7.0, 7.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.8173828125, -23.04169464111328, -22.266006469726562, -21.490318298339844, -20.714630126953125, -19.938941955566406, -19.163253784179688, -18.38756561279297, -17.61187744140625, -16.83618927001953, -16.060501098632812, -15.284812927246094, -14.509124755859375, -13.733436584472656, -12.957748413085938, -12.182060241699219, -11.406371116638184, -10.630682945251465, -9.854994773864746, -9.079306602478027, -8.303618431091309, -7.52793025970459, -6.752241611480713, -5.976553440093994, -5.200865268707275, -4.425177097320557, -3.649488925933838, -2.87380051612854, -2.0981123447418213, -1.3224241733551025, -0.5467357635498047, 0.22895240783691406, 1.0046405792236328, 1.7803287506103516, 2.5560169219970703, 3.331705331802368, 4.107393264770508, 4.883081436157227, 5.6587700843811035, 6.434458255767822, 7.210146427154541, 7.98583459854126, 8.761523246765137, 9.537211418151855, 10.312899589538574, 11.088587760925293, 11.864275932312012, 12.63996410369873, 13.41565227508545, 14.191340446472168, 14.967028617858887, 15.742716789245605, 16.51840591430664, 17.29409408569336, 18.069782257080078, 18.845470428466797, 19.621158599853516, 20.396846771240234, 21.172534942626953, 21.948223114013672, 22.72391128540039, 23.49959945678711, 24.275287628173828, 25.050975799560547, 25.826663970947266]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 11.0, 5.0, 7.0, 8.0, 18.0, 6.0, 20.0, 23.0, 25.0, 27.0, 34.0, 34.0, 37.0, 46.0, 45.0, 43.0, 43.0, 41.0, 47.0, 52.0, 56.0, 36.0, 45.0, 32.0, 35.0, 39.0, 30.0, 36.0, 24.0, 22.0, 16.0, 7.0, 11.0, 10.0, 8.0, 5.0, 4.0, 2.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.84765625, -2.7667236328125, -2.685791015625, -2.6048583984375, -2.52392578125, -2.4429931640625, -2.362060546875, -2.2811279296875, -2.2001953125, -2.1192626953125, -2.038330078125, -1.9573974609375, -1.87646484375, -1.7955322265625, -1.714599609375, -1.6336669921875, -1.552734375, -1.4718017578125, -1.390869140625, -1.3099365234375, -1.22900390625, -1.1480712890625, -1.067138671875, -0.9862060546875, -0.9052734375, -0.8243408203125, -0.743408203125, -0.6624755859375, -0.58154296875, -0.5006103515625, -0.419677734375, -0.3387451171875, -0.2578125, -0.1768798828125, -0.095947265625, -0.0150146484375, 0.06591796875, 0.1468505859375, 0.227783203125, 0.3087158203125, 0.3896484375, 0.4705810546875, 0.551513671875, 0.6324462890625, 0.71337890625, 0.7943115234375, 0.875244140625, 0.9561767578125, 1.037109375, 1.1180419921875, 1.198974609375, 1.2799072265625, 1.36083984375, 1.4417724609375, 1.522705078125, 1.6036376953125, 1.6845703125, 1.7655029296875, 1.846435546875, 1.9273681640625, 2.00830078125, 2.0892333984375, 2.170166015625, 2.2510986328125, 2.33203125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 11.0, 13.0, 15.0, 34.0, 41.0, 100.0, 91.0, 158.0, 271.0, 393.0, 633.0, 909.0, 1501.0, 2274.0, 3601.0, 5668.0, 9213.0, 14961.0, 24773.0, 41512.0, 72850.0, 140577.0, 300815.0, 200347.0, 94747.0, 52862.0, 31032.0, 18674.0, 11412.0, 6914.0, 4422.0, 2702.0, 1787.0, 1166.0, 721.0, 456.0, 339.0, 181.0, 132.0, 80.0, 56.0, 40.0, 25.0, 17.0, 6.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.02142333984375, -0.020747900009155273, -0.020072460174560547, -0.01939702033996582, -0.018721580505371094, -0.018046140670776367, -0.01737070083618164, -0.016695261001586914, -0.016019821166992188, -0.015344381332397461, -0.014668941497802734, -0.013993501663208008, -0.013318061828613281, -0.012642621994018555, -0.011967182159423828, -0.011291742324829102, -0.010616302490234375, -0.009940862655639648, -0.009265422821044922, -0.008589982986450195, -0.007914543151855469, -0.007239103317260742, -0.006563663482666016, -0.005888223648071289, -0.0052127838134765625, -0.004537343978881836, -0.0038619041442871094, -0.003186464309692383, -0.0025110244750976562, -0.0018355846405029297, -0.0011601448059082031, -0.00048470497131347656, 0.00019073486328125, 0.0008661746978759766, 0.0015416145324707031, 0.0022170543670654297, 0.0028924942016601562, 0.003567934036254883, 0.004243373870849609, 0.004918813705444336, 0.0055942535400390625, 0.006269693374633789, 0.006945133209228516, 0.007620573043823242, 0.008296012878417969, 0.008971452713012695, 0.009646892547607422, 0.010322332382202148, 0.010997772216796875, 0.011673212051391602, 0.012348651885986328, 0.013024091720581055, 0.013699531555175781, 0.014374971389770508, 0.015050411224365234, 0.01572585105895996, 0.016401290893554688, 0.017076730728149414, 0.01775217056274414, 0.018427610397338867, 0.019103050231933594, 0.01977849006652832, 0.020453929901123047, 0.021129369735717773, 0.0218048095703125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 7.0, 6.0, 7.0, 12.0, 8.0, 15.0, 17.0, 23.0, 20.0, 35.0, 27.0, 48.0, 27.0, 40.0, 36.0, 46.0, 48.0, 44.0, 1070.0, 53.0, 47.0, 49.0, 57.0, 45.0, 34.0, 32.0, 32.0, 28.0, 21.0, 20.0, 24.0, 12.0, 7.0, 10.0, 6.0, 4.0, 8.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.400390625, -2.334197998046875, -2.26800537109375, -2.201812744140625, -2.1356201171875, -2.069427490234375, -2.00323486328125, -1.937042236328125, -1.870849609375, -1.804656982421875, -1.73846435546875, -1.672271728515625, -1.6060791015625, -1.539886474609375, -1.47369384765625, -1.407501220703125, -1.34130859375, -1.275115966796875, -1.20892333984375, -1.142730712890625, -1.0765380859375, -1.010345458984375, -0.94415283203125, -0.877960205078125, -0.811767578125, -0.745574951171875, -0.67938232421875, -0.613189697265625, -0.5469970703125, -0.480804443359375, -0.41461181640625, -0.348419189453125, -0.2822265625, -0.216033935546875, -0.14984130859375, -0.083648681640625, -0.0174560546875, 0.048736572265625, 0.11492919921875, 0.181121826171875, 0.247314453125, 0.313507080078125, 0.37969970703125, 0.445892333984375, 0.5120849609375, 0.578277587890625, 0.64447021484375, 0.710662841796875, 0.77685546875, 0.843048095703125, 0.90924072265625, 0.975433349609375, 1.0416259765625, 1.107818603515625, 1.17401123046875, 1.240203857421875, 1.306396484375, 1.372589111328125, 1.43878173828125, 1.504974365234375, 1.5711669921875, 1.637359619140625, 1.70355224609375, 1.769744873046875, 1.8359375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 2.0, 6.0, 9.0, 11.0, 9.0, 23.0, 44.0, 66.0, 91.0, 90.0, 181.0, 266.0, 436.0, 632.0, 999.0, 1614.0, 2596.0, 4368.0, 7090.0, 12139.0, 20638.0, 35946.0, 62580.0, 114231.0, 214788.0, 1299303.0, 139965.0, 75396.0, 42456.0, 24804.0, 14559.0, 8506.0, 5015.0, 3135.0, 1872.0, 1167.0, 748.0, 453.0, 307.0, 184.0, 116.0, 84.0, 65.0, 40.0, 31.0, 16.0, 13.0, 15.0, 9.0, 8.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00832366943359375, -0.008064866065979004, -0.007806062698364258, -0.007547259330749512, -0.007288455963134766, -0.0070296525955200195, -0.0067708492279052734, -0.006512045860290527, -0.006253242492675781, -0.005994439125061035, -0.005735635757446289, -0.005476832389831543, -0.005218029022216797, -0.004959225654602051, -0.004700422286987305, -0.004441618919372559, -0.0041828155517578125, -0.003924012184143066, -0.0036652088165283203, -0.0034064054489135742, -0.003147602081298828, -0.002888798713684082, -0.002629995346069336, -0.00237119197845459, -0.0021123886108398438, -0.0018535852432250977, -0.0015947818756103516, -0.0013359785079956055, -0.0010771751403808594, -0.0008183717727661133, -0.0005595684051513672, -0.0003007650375366211, -4.1961669921875e-05, 0.0002168416976928711, 0.0004756450653076172, 0.0007344484329223633, 0.0009932518005371094, 0.0012520551681518555, 0.0015108585357666016, 0.0017696619033813477, 0.0020284652709960938, 0.00228726863861084, 0.002546072006225586, 0.002804875373840332, 0.003063678741455078, 0.0033224821090698242, 0.0035812854766845703, 0.0038400888442993164, 0.0040988922119140625, 0.004357695579528809, 0.004616498947143555, 0.004875302314758301, 0.005134105682373047, 0.005392909049987793, 0.005651712417602539, 0.005910515785217285, 0.006169319152832031, 0.006428122520446777, 0.0066869258880615234, 0.0069457292556762695, 0.007204532623291016, 0.007463335990905762, 0.007722139358520508, 0.007980942726135254, 0.00823974609375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 8.0, 0.0, 8.0, 0.0, 0.0, 15.0, 0.0, 0.0, 28.0, 0.0, 0.0, 33.0, 0.0, 0.0, 69.0, 0.0, 152.0, 0.0, 0.0, 385.0, 0.0, 0.0, 136.0, 0.0, 0.0, 74.0, 0.0, 30.0, 0.0, 0.0, 27.0, 0.0, 0.0, 23.0, 0.0, 0.0, 11.0, 0.0, 0.0, 8.0, 0.0, 5.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.556510925292969e-07, -6.342306733131409e-07, -6.128102540969849e-07, -5.913898348808289e-07, -5.699694156646729e-07, -5.485489964485168e-07, -5.271285772323608e-07, -5.057081580162048e-07, -4.842877388000488e-07, -4.628673195838928e-07, -4.414469003677368e-07, -4.200264811515808e-07, -3.986060619354248e-07, -3.771856427192688e-07, -3.557652235031128e-07, -3.343448042869568e-07, -3.129243850708008e-07, -2.915039658546448e-07, -2.7008354663848877e-07, -2.4866312742233276e-07, -2.2724270820617676e-07, -2.0582228899002075e-07, -1.8440186977386475e-07, -1.6298145055770874e-07, -1.4156103134155273e-07, -1.2014061212539673e-07, -9.872019290924072e-08, -7.729977369308472e-08, -5.587935447692871e-08, -3.4458935260772705e-08, -1.30385160446167e-08, 8.381903171539307e-09, 2.9802322387695312e-08, 5.122274160385132e-08, 7.264316082000732e-08, 9.406358003616333e-08, 1.1548399925231934e-07, 1.3690441846847534e-07, 1.5832483768463135e-07, 1.7974525690078735e-07, 2.0116567611694336e-07, 2.2258609533309937e-07, 2.4400651454925537e-07, 2.654269337654114e-07, 2.868473529815674e-07, 3.082677721977234e-07, 3.296881914138794e-07, 3.511086106300354e-07, 3.725290298461914e-07, 3.939494490623474e-07, 4.153698682785034e-07, 4.367902874946594e-07, 4.5821070671081543e-07, 4.796311259269714e-07, 5.010515451431274e-07, 5.224719643592834e-07, 5.438923835754395e-07, 5.653128027915955e-07, 5.867332220077515e-07, 6.081536412239075e-07, 6.295740604400635e-07, 6.509944796562195e-07, 6.724148988723755e-07, 6.938353180885315e-07, 7.152557373046875e-07]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 1.0, 3.0, 3.0, 4.0, 4.0, 11.0, 18.0, 12.0, 19.0, 23.0, 17.0, 34.0, 39.0, 52.0, 44.0, 65.0, 113.0, 153.0, 243.0, 507.0, 2732.0, 33459.0, 880640.0, 121909.0, 6479.0, 952.0, 295.0, 126.0, 129.0, 67.0, 64.0, 61.0, 37.0, 42.0, 37.0, 25.0, 23.0, 25.0, 20.0, 15.0, 10.0, 8.0, 7.0, 6.0, 4.0, 7.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-9.894371032714844e-06, -9.601004421710968e-06, -9.307637810707092e-06, -9.014271199703217e-06, -8.72090458869934e-06, -8.427537977695465e-06, -8.13417136669159e-06, -7.840804755687714e-06, -7.547438144683838e-06, -7.254071533679962e-06, -6.9607049226760864e-06, -6.667338311672211e-06, -6.373971700668335e-06, -6.080605089664459e-06, -5.7872384786605835e-06, -5.493871867656708e-06, -5.200505256652832e-06, -4.907138645648956e-06, -4.6137720346450806e-06, -4.320405423641205e-06, -4.027038812637329e-06, -3.7336722016334534e-06, -3.4403055906295776e-06, -3.146938979625702e-06, -2.853572368621826e-06, -2.5602057576179504e-06, -2.2668391466140747e-06, -1.973472535610199e-06, -1.6801059246063232e-06, -1.3867393136024475e-06, -1.0933727025985718e-06, -8.00006091594696e-07, -5.066394805908203e-07, -2.1327286958694458e-07, 8.009374141693115e-08, 3.734603524208069e-07, 6.668269634246826e-07, 9.601935744285583e-07, 1.253560185432434e-06, 1.5469267964363098e-06, 1.8402934074401855e-06, 2.1336600184440613e-06, 2.427026629447937e-06, 2.7203932404518127e-06, 3.0137598514556885e-06, 3.307126462459564e-06, 3.60049307346344e-06, 3.893859684467316e-06, 4.187226295471191e-06, 4.480592906475067e-06, 4.773959517478943e-06, 5.067326128482819e-06, 5.360692739486694e-06, 5.65405935049057e-06, 5.947425961494446e-06, 6.2407925724983215e-06, 6.534159183502197e-06, 6.827525794506073e-06, 7.120892405509949e-06, 7.4142590165138245e-06, 7.7076256275177e-06, 8.000992238521576e-06, 8.294358849525452e-06, 8.587725460529327e-06, 8.881092071533203e-06]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 10.0, 11.0, 18.0, 50.0, 122.0, 380.0, 207.0, 125.0, 57.0, 21.0, 9.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2618720575119369e-06, -1.2197108389955247e-06, -1.1775496204791125e-06, -1.1353884019627003e-06, -1.0932271834462881e-06, -1.051065964929876e-06, -1.0089047464134637e-06, -9.667435278970515e-07, -9.245823093806393e-07, -8.824210908642272e-07, -8.40259872347815e-07, -7.980986538314028e-07, -7.559374353149906e-07, -7.137762167985784e-07, -6.716149982821662e-07, -6.29453779765754e-07, -5.872925612493418e-07, -5.451313427329296e-07, -5.029701242165174e-07, -4.6080890570010524e-07, -4.1864768718369305e-07, -3.7648646866728086e-07, -3.3432525015086867e-07, -2.921640316344565e-07, -2.500028131180443e-07, -2.078415946016321e-07, -1.656803760852199e-07, -1.2351915756880771e-07, -8.135793905239552e-08, -3.919672053598333e-08, 2.9644979804288596e-09, 4.512571649684105e-08, 8.728704870009096e-08, 1.2944826721650315e-07, 1.7160948573291535e-07, 2.1377070424932754e-07, 2.5593192276573973e-07, 2.980931412821519e-07, 3.402543597985641e-07, 3.824155783149763e-07, 4.245767968313885e-07, 4.667380153478007e-07, 5.088992338642129e-07, 5.510604523806251e-07, 5.932216708970373e-07, 6.353828894134494e-07, 6.775441079298616e-07, 7.197053264462738e-07, 7.61866544962686e-07, 8.040277634790982e-07, 8.461889819955104e-07, 8.883502005119226e-07, 9.305114190283348e-07, 9.72672637544747e-07, 1.0148338560611592e-06, 1.0569950745775714e-06, 1.0991562930939835e-06, 1.1413175116103957e-06, 1.183478730126808e-06, 1.2256399486432201e-06, 1.2678011671596323e-06, 1.3099623856760445e-06, 1.3521236041924567e-06, 1.3942848227088689e-06, 1.436446041225281e-06]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 15.0, 0.0, 0.0, 0.0, 0.0, 24.0, 0.0, 0.0, 0.0, 0.0, 37.0, 0.0, 0.0, 0.0, 0.0, 95.0, 0.0, 0.0, 0.0, 0.0, 188.0, 0.0, 0.0, 0.0, 0.0, 326.0, 0.0, 0.0, 0.0, 0.0, 192.0, 0.0, 0.0, 0.0, 0.0, 73.0, 0.0, 0.0, 0.0, 0.0, 37.0, 0.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 0.0, 4.0], "bins": [-4.172325134277344e-07, -4.0512531995773315e-07, -3.9301812648773193e-07, -3.809109330177307e-07, -3.688037395477295e-07, -3.5669654607772827e-07, -3.4458935260772705e-07, -3.3248215913772583e-07, -3.203749656677246e-07, -3.082677721977234e-07, -2.9616057872772217e-07, -2.8405338525772095e-07, -2.7194619178771973e-07, -2.598389983177185e-07, -2.477318048477173e-07, -2.3562461137771606e-07, -2.2351741790771484e-07, -2.1141022443771362e-07, -1.993030309677124e-07, -1.8719583749771118e-07, -1.7508864402770996e-07, -1.6298145055770874e-07, -1.5087425708770752e-07, -1.387670636177063e-07, -1.2665987014770508e-07, -1.1455267667770386e-07, -1.0244548320770264e-07, -9.033828973770142e-08, -7.82310962677002e-08, -6.612390279769897e-08, -5.4016709327697754e-08, -4.190951585769653e-08, -2.9802322387695312e-08, -1.7695128917694092e-08, -5.587935447692871e-09, 6.51925802230835e-09, 1.862645149230957e-08, 3.073364496231079e-08, 4.284083843231201e-08, 5.494803190231323e-08, 6.705522537231445e-08, 7.916241884231567e-08, 9.12696123123169e-08, 1.0337680578231812e-07, 1.1548399925231934e-07, 1.2759119272232056e-07, 1.3969838619232178e-07, 1.51805579662323e-07, 1.6391277313232422e-07, 1.7601996660232544e-07, 1.8812716007232666e-07, 2.0023435354232788e-07, 2.123415470123291e-07, 2.2444874048233032e-07, 2.3655593395233154e-07, 2.4866312742233276e-07, 2.60770320892334e-07, 2.728775143623352e-07, 2.849847078323364e-07, 2.9709190130233765e-07, 3.0919909477233887e-07, 3.213062882423401e-07, 3.334134817123413e-07, 3.4552067518234253e-07, 3.5762786865234375e-07]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 11.0, 5.0, 7.0, 8.0, 18.0, 6.0, 20.0, 23.0, 25.0, 27.0, 34.0, 34.0, 37.0, 46.0, 45.0, 43.0, 43.0, 41.0, 47.0, 52.0, 56.0, 36.0, 45.0, 32.0, 35.0, 39.0, 30.0, 36.0, 24.0, 22.0, 16.0, 7.0, 11.0, 10.0, 8.0, 5.0, 4.0, 2.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.84765625, -2.7667236328125, -2.685791015625, -2.6048583984375, -2.52392578125, -2.4429931640625, -2.362060546875, -2.2811279296875, -2.2001953125, -2.1192626953125, -2.038330078125, -1.9573974609375, -1.87646484375, -1.7955322265625, -1.714599609375, -1.6336669921875, -1.552734375, -1.4718017578125, -1.390869140625, -1.3099365234375, -1.22900390625, -1.1480712890625, -1.067138671875, -0.9862060546875, -0.9052734375, -0.8243408203125, -0.743408203125, -0.6624755859375, -0.58154296875, -0.5006103515625, -0.419677734375, -0.3387451171875, -0.2578125, -0.1768798828125, -0.095947265625, -0.0150146484375, 0.06591796875, 0.1468505859375, 0.227783203125, 0.3087158203125, 0.3896484375, 0.4705810546875, 0.551513671875, 0.6324462890625, 0.71337890625, 0.7943115234375, 0.875244140625, 0.9561767578125, 1.037109375, 1.1180419921875, 1.198974609375, 1.2799072265625, 1.36083984375, 1.4417724609375, 1.522705078125, 1.6036376953125, 1.6845703125, 1.7655029296875, 1.846435546875, 1.9273681640625, 2.00830078125, 2.0892333984375, 2.170166015625, 2.2510986328125, 2.33203125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 10.0, 11.0, 18.0, 31.0, 51.0, 62.0, 102.0, 160.0, 292.0, 484.0, 734.0, 1269.0, 2147.0, 3665.0, 6353.0, 11465.0, 20822.0, 40555.0, 90762.0, 510798.0, 226677.0, 63416.0, 30760.0, 16273.0, 9109.0, 5139.0, 2959.0, 1746.0, 1062.0, 620.0, 379.0, 240.0, 140.0, 94.0, 48.0, 41.0, 24.0, 16.0, 9.0, 4.0, 0.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1171875, -3.00506591796875, -2.8929443359375, -2.78082275390625, -2.668701171875, -2.55657958984375, -2.4444580078125, -2.33233642578125, -2.22021484375, -2.10809326171875, -1.9959716796875, -1.88385009765625, -1.771728515625, -1.65960693359375, -1.5474853515625, -1.43536376953125, -1.3232421875, -1.21112060546875, -1.0989990234375, -0.98687744140625, -0.874755859375, -0.76263427734375, -0.6505126953125, -0.53839111328125, -0.42626953125, -0.31414794921875, -0.2020263671875, -0.08990478515625, 0.022216796875, 0.13433837890625, 0.2464599609375, 0.35858154296875, 0.470703125, 0.58282470703125, 0.6949462890625, 0.80706787109375, 0.919189453125, 1.03131103515625, 1.1434326171875, 1.25555419921875, 1.36767578125, 1.47979736328125, 1.5919189453125, 1.70404052734375, 1.816162109375, 1.92828369140625, 2.0404052734375, 2.15252685546875, 2.2646484375, 2.37677001953125, 2.4888916015625, 2.60101318359375, 2.713134765625, 2.82525634765625, 2.9373779296875, 3.04949951171875, 3.16162109375, 3.27374267578125, 3.3858642578125, 3.49798583984375, 3.610107421875, 3.72222900390625, 3.8343505859375, 3.94647216796875, 4.05859375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 7.0, 3.0, 10.0, 10.0, 15.0, 13.0, 16.0, 19.0, 22.0, 22.0, 25.0, 28.0, 34.0, 28.0, 32.0, 41.0, 41.0, 47.0, 88.0, 126.0, 371.0, 1371.0, 146.0, 78.0, 72.0, 61.0, 37.0, 37.0, 32.0, 28.0, 26.0, 28.0, 14.0, 27.0, 14.0, 16.0, 14.0, 10.0, 8.0, 8.0, 4.0, 2.0, 6.0, 3.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-7.546875, -7.3111572265625, -7.075439453125, -6.8397216796875, -6.60400390625, -6.3682861328125, -6.132568359375, -5.8968505859375, -5.6611328125, -5.4254150390625, -5.189697265625, -4.9539794921875, -4.71826171875, -4.4825439453125, -4.246826171875, -4.0111083984375, -3.775390625, -3.5396728515625, -3.303955078125, -3.0682373046875, -2.83251953125, -2.5968017578125, -2.361083984375, -2.1253662109375, -1.8896484375, -1.6539306640625, -1.418212890625, -1.1824951171875, -0.94677734375, -0.7110595703125, -0.475341796875, -0.2396240234375, -0.00390625, 0.2318115234375, 0.467529296875, 0.7032470703125, 0.93896484375, 1.1746826171875, 1.410400390625, 1.6461181640625, 1.8818359375, 2.1175537109375, 2.353271484375, 2.5889892578125, 2.82470703125, 3.0604248046875, 3.296142578125, 3.5318603515625, 3.767578125, 4.0032958984375, 4.239013671875, 4.4747314453125, 4.71044921875, 4.9461669921875, 5.181884765625, 5.4176025390625, 5.6533203125, 5.8890380859375, 6.124755859375, 6.3604736328125, 6.59619140625, 6.8319091796875, 7.067626953125, 7.3033447265625, 7.5390625]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 6.0, 2.0, 3.0, 7.0, 7.0, 11.0, 8.0, 12.0, 18.0, 22.0, 29.0, 34.0, 44.0, 65.0, 79.0, 98.0, 148.0, 255.0, 531.0, 1636.0, 8006.0, 64218.0, 2248069.0, 772585.0, 41619.0, 5724.0, 1218.0, 444.0, 223.0, 149.0, 96.0, 74.0, 63.0, 39.0, 35.0, 27.0, 21.0, 13.0, 12.0, 13.0, 12.0, 9.0, 4.0, 7.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.046875, -11.6807861328125, -11.314697265625, -10.9486083984375, -10.58251953125, -10.2164306640625, -9.850341796875, -9.4842529296875, -9.1181640625, -8.7520751953125, -8.385986328125, -8.0198974609375, -7.65380859375, -7.2877197265625, -6.921630859375, -6.5555419921875, -6.189453125, -5.8233642578125, -5.457275390625, -5.0911865234375, -4.72509765625, -4.3590087890625, -3.992919921875, -3.6268310546875, -3.2607421875, -2.8946533203125, -2.528564453125, -2.1624755859375, -1.79638671875, -1.4302978515625, -1.064208984375, -0.6981201171875, -0.33203125, 0.0340576171875, 0.400146484375, 0.7662353515625, 1.13232421875, 1.4984130859375, 1.864501953125, 2.2305908203125, 2.5966796875, 2.9627685546875, 3.328857421875, 3.6949462890625, 4.06103515625, 4.4271240234375, 4.793212890625, 5.1593017578125, 5.525390625, 5.8914794921875, 6.257568359375, 6.6236572265625, 6.98974609375, 7.3558349609375, 7.721923828125, 8.0880126953125, 8.4541015625, 8.8201904296875, 9.186279296875, 9.5523681640625, 9.91845703125, 10.2845458984375, 10.650634765625, 11.0167236328125, 11.3828125]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 25.0, 115.0, 371.0, 353.0, 129.0, 20.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.97040367126465, -25.831098556518555, -23.691791534423828, -21.552486419677734, -19.41318130493164, -17.273876190185547, -15.134570121765137, -12.995264053344727, -10.855958938598633, -8.716653823852539, -6.577347755432129, -4.438042163848877, -2.298736572265625, -0.15943145751953125, 1.979874610900879, 4.119180679321289, 6.258485794067383, 8.397790908813477, 10.537096977233887, 12.676403045654297, 14.81570816040039, 16.955013275146484, 19.094318389892578, 21.233625411987305, 23.3729305267334, 25.512235641479492, 27.65154266357422, 29.790847778320312, 31.930152893066406, 34.0694580078125, 36.208763122558594, 38.34806823730469, 40.48738098144531, 42.626686096191406, 44.7659912109375, 46.905296325683594, 49.04460144042969, 51.18390655517578, 53.32321548461914, 55.462520599365234, 57.60182571411133, 59.74113082885742, 61.880435943603516, 64.01974487304688, 66.15904998779297, 68.29835510253906, 70.43766021728516, 72.57696533203125, 74.71627044677734, 76.85557556152344, 78.99488067626953, 81.13418579101562, 83.27349090576172, 85.41279602050781, 87.5521011352539, 89.69140625, 91.83071899414062, 93.97002410888672, 96.10932922363281, 98.2486343383789, 100.387939453125, 102.5272445678711, 104.66654968261719, 106.80586242675781, 108.94515991210938]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 5.0, 3.0, 10.0, 8.0, 10.0, 17.0, 19.0, 16.0, 25.0, 23.0, 31.0, 31.0, 23.0, 32.0, 41.0, 38.0, 37.0, 43.0, 53.0, 39.0, 52.0, 49.0, 48.0, 34.0, 31.0, 25.0, 28.0, 28.0, 28.0, 22.0, 22.0, 24.0, 25.0, 15.0, 16.0, 14.0, 8.0, 8.0, 5.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.498703002929688, -26.61612319946289, -25.733543395996094, -24.850963592529297, -23.9683837890625, -23.085803985595703, -22.203222274780273, -21.320642471313477, -20.43806266784668, -19.555482864379883, -18.672903060913086, -17.79032325744629, -16.90774154663086, -16.025161743164062, -15.142581939697266, -14.260002136230469, -13.377422332763672, -12.494842529296875, -11.612262725830078, -10.729681968688965, -9.847102165222168, -8.964522361755371, -8.081941604614258, -7.199361801147461, -6.316781997680664, -5.434202194213867, -4.551621913909912, -3.669041872024536, -2.78646183013916, -1.9038820266723633, -1.0213017463684082, -0.13872146606445312, 0.7438583374023438, 1.6264383792877197, 2.5090184211730957, 3.3915984630584717, 4.274178504943848, 5.1567583084106445, 6.0393385887146, 6.921918869018555, 7.804498672485352, 8.687078475952148, 9.569658279418945, 10.452239036560059, 11.334818840026855, 12.217398643493652, 13.099979400634766, 13.982559204101562, 14.86513900756836, 15.747718811035156, 16.630298614501953, 17.51287841796875, 18.395458221435547, 19.278038024902344, 20.160619735717773, 21.04319953918457, 21.925779342651367, 22.808359146118164, 23.69093894958496, 24.573518753051758, 25.456100463867188, 26.338680267333984, 27.22126007080078, 28.103839874267578, 28.986419677734375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 1.0, 5.0, 8.0, 10.0, 9.0, 9.0, 16.0, 17.0, 20.0, 18.0, 29.0, 39.0, 26.0, 40.0, 39.0, 38.0, 42.0, 45.0, 57.0, 40.0, 45.0, 55.0, 39.0, 47.0, 31.0, 36.0, 43.0, 37.0, 30.0, 25.0, 24.0, 17.0, 13.0, 9.0, 8.0, 9.0, 8.0, 6.0, 3.0, 2.0, 1.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.921875, -2.83978271484375, -2.7576904296875, -2.67559814453125, -2.593505859375, -2.51141357421875, -2.4293212890625, -2.34722900390625, -2.26513671875, -2.18304443359375, -2.1009521484375, -2.01885986328125, -1.936767578125, -1.85467529296875, -1.7725830078125, -1.69049072265625, -1.6083984375, -1.52630615234375, -1.4442138671875, -1.36212158203125, -1.280029296875, -1.19793701171875, -1.1158447265625, -1.03375244140625, -0.95166015625, -0.86956787109375, -0.7874755859375, -0.70538330078125, -0.623291015625, -0.54119873046875, -0.4591064453125, -0.37701416015625, -0.294921875, -0.21282958984375, -0.1307373046875, -0.04864501953125, 0.033447265625, 0.11553955078125, 0.1976318359375, 0.27972412109375, 0.36181640625, 0.44390869140625, 0.5260009765625, 0.60809326171875, 0.690185546875, 0.77227783203125, 0.8543701171875, 0.93646240234375, 1.0185546875, 1.10064697265625, 1.1827392578125, 1.26483154296875, 1.346923828125, 1.42901611328125, 1.5111083984375, 1.59320068359375, 1.67529296875, 1.75738525390625, 1.8394775390625, 1.92156982421875, 2.003662109375, 2.08575439453125, 2.1678466796875, 2.24993896484375, 2.33203125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 4.0, 2.0, 7.0, 9.0, 18.0, 26.0, 30.0, 47.0, 58.0, 110.0, 143.0, 242.0, 373.0, 623.0, 1208.0, 2147.0, 4592.0, 10749.0, 28554.0, 88735.0, 338832.0, 1601647.0, 1627736.0, 347646.0, 90778.0, 29420.0, 10783.0, 4668.0, 2270.0, 1171.0, 684.0, 341.0, 220.0, 132.0, 83.0, 62.0, 48.0, 30.0, 17.0, 16.0, 10.0, 6.0, 3.0, 6.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.25, -5.0806884765625, -4.911376953125, -4.7420654296875, -4.57275390625, -4.4034423828125, -4.234130859375, -4.0648193359375, -3.8955078125, -3.7261962890625, -3.556884765625, -3.3875732421875, -3.21826171875, -3.0489501953125, -2.879638671875, -2.7103271484375, -2.541015625, -2.3717041015625, -2.202392578125, -2.0330810546875, -1.86376953125, -1.6944580078125, -1.525146484375, -1.3558349609375, -1.1865234375, -1.0172119140625, -0.847900390625, -0.6785888671875, -0.50927734375, -0.3399658203125, -0.170654296875, -0.0013427734375, 0.16796875, 0.3372802734375, 0.506591796875, 0.6759033203125, 0.84521484375, 1.0145263671875, 1.183837890625, 1.3531494140625, 1.5224609375, 1.6917724609375, 1.861083984375, 2.0303955078125, 2.19970703125, 2.3690185546875, 2.538330078125, 2.7076416015625, 2.876953125, 3.0462646484375, 3.215576171875, 3.3848876953125, 3.55419921875, 3.7235107421875, 3.892822265625, 4.0621337890625, 4.2314453125, 4.4007568359375, 4.570068359375, 4.7393798828125, 4.90869140625, 5.0780029296875, 5.247314453125, 5.4166259765625, 5.5859375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 7.0, 11.0, 12.0, 23.0, 27.0, 36.0, 76.0, 95.0, 147.0, 175.0, 279.0, 328.0, 479.0, 550.0, 468.0, 409.0, 277.0, 212.0, 164.0, 99.0, 71.0, 48.0, 22.0, 11.0, 20.0, 11.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.4140625, -9.16363525390625, -8.9132080078125, -8.66278076171875, -8.412353515625, -8.16192626953125, -7.9114990234375, -7.66107177734375, -7.41064453125, -7.16021728515625, -6.9097900390625, -6.65936279296875, -6.408935546875, -6.15850830078125, -5.9080810546875, -5.65765380859375, -5.4072265625, -5.15679931640625, -4.9063720703125, -4.65594482421875, -4.405517578125, -4.15509033203125, -3.9046630859375, -3.65423583984375, -3.40380859375, -3.15338134765625, -2.9029541015625, -2.65252685546875, -2.402099609375, -2.15167236328125, -1.9012451171875, -1.65081787109375, -1.400390625, -1.14996337890625, -0.8995361328125, -0.64910888671875, -0.398681640625, -0.14825439453125, 0.1021728515625, 0.35260009765625, 0.60302734375, 0.85345458984375, 1.1038818359375, 1.35430908203125, 1.604736328125, 1.85516357421875, 2.1055908203125, 2.35601806640625, 2.6064453125, 2.85687255859375, 3.1072998046875, 3.35772705078125, 3.608154296875, 3.85858154296875, 4.1090087890625, 4.35943603515625, 4.60986328125, 4.86029052734375, 5.1107177734375, 5.36114501953125, 5.611572265625, 5.86199951171875, 6.1124267578125, 6.36285400390625, 6.61328125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 7.0, 7.0, 13.0, 11.0, 12.0, 26.0, 17.0, 38.0, 40.0, 63.0, 99.0, 119.0, 214.0, 338.0, 592.0, 1071.0, 2202.0, 5498.0, 17693.0, 71066.0, 358900.0, 1900467.0, 1489859.0, 268098.0, 54639.0, 14235.0, 4642.0, 1926.0, 941.0, 513.0, 321.0, 178.0, 125.0, 77.0, 53.0, 31.0, 33.0, 22.0, 23.0, 14.0, 16.0, 17.0, 7.0, 5.0, 10.0, 0.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.140625, -9.8228759765625, -9.505126953125, -9.1873779296875, -8.86962890625, -8.5518798828125, -8.234130859375, -7.9163818359375, -7.5986328125, -7.2808837890625, -6.963134765625, -6.6453857421875, -6.32763671875, -6.0098876953125, -5.692138671875, -5.3743896484375, -5.056640625, -4.7388916015625, -4.421142578125, -4.1033935546875, -3.78564453125, -3.4678955078125, -3.150146484375, -2.8323974609375, -2.5146484375, -2.1968994140625, -1.879150390625, -1.5614013671875, -1.24365234375, -0.9259033203125, -0.608154296875, -0.2904052734375, 0.02734375, 0.3450927734375, 0.662841796875, 0.9805908203125, 1.29833984375, 1.6160888671875, 1.933837890625, 2.2515869140625, 2.5693359375, 2.8870849609375, 3.204833984375, 3.5225830078125, 3.84033203125, 4.1580810546875, 4.475830078125, 4.7935791015625, 5.111328125, 5.4290771484375, 5.746826171875, 6.0645751953125, 6.38232421875, 6.7000732421875, 7.017822265625, 7.3355712890625, 7.6533203125, 7.9710693359375, 8.288818359375, 8.6065673828125, 8.92431640625, 9.2420654296875, 9.559814453125, 9.8775634765625, 10.1953125]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 14.0, 36.0, 83.0, 155.0, 189.0, 203.0, 167.0, 99.0, 43.0, 15.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.00029373168945, -38.296077728271484, -35.59185791015625, -32.88764190673828, -30.183422088623047, -27.479206085205078, -24.774988174438477, -22.070770263671875, -19.366552352905273, -16.662334442138672, -13.95811653137207, -11.253899574279785, -8.549681663513184, -5.845463752746582, -3.141246795654297, -0.4370288848876953, 2.2671890258789062, 4.971406936645508, 7.675624370574951, 10.379841804504395, 13.084059715270996, 15.788277626037598, 18.492494583129883, 21.196712493896484, 23.900930404663086, 26.605148315429688, 29.30936622619629, 32.01358413696289, 34.71780014038086, 37.422019958496094, 40.12623596191406, 42.83045196533203, 45.53467559814453, 48.2388916015625, 50.943111419677734, 53.6473274230957, 56.35154724121094, 59.055763244628906, 61.759979248046875, 64.46420288085938, 67.16841888427734, 69.87263488769531, 72.57685089111328, 75.28107452392578, 77.98529052734375, 80.68950653076172, 83.39372253417969, 86.09794616699219, 88.80215454101562, 91.5063705444336, 94.21058654785156, 96.91481018066406, 99.61902618408203, 102.3232421875, 105.02745819091797, 107.73167419433594, 110.43589782714844, 113.1401138305664, 115.84432983398438, 118.54855346679688, 121.25276947021484, 123.95698547363281, 126.66120147705078, 129.36541748046875, 132.06964111328125]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 2.0, 4.0, 4.0, 3.0, 12.0, 3.0, 12.0, 11.0, 10.0, 21.0, 19.0, 22.0, 13.0, 22.0, 26.0, 25.0, 34.0, 28.0, 33.0, 41.0, 38.0, 30.0, 31.0, 36.0, 40.0, 46.0, 33.0, 30.0, 31.0, 46.0, 27.0, 37.0, 28.0, 32.0, 23.0, 18.0, 17.0, 17.0, 20.0, 13.0, 11.0, 17.0, 10.0, 8.0, 3.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0], "bins": [-25.74560546875, -25.035871505737305, -24.32613754272461, -23.616405487060547, -22.90667152404785, -22.196937561035156, -21.48720359802246, -20.777469635009766, -20.067737579345703, -19.358003616333008, -18.648269653320312, -17.93853759765625, -17.228803634643555, -16.51906967163086, -15.809335708618164, -15.099601745605469, -14.389867782592773, -13.680133819580078, -12.9704008102417, -12.260666847229004, -11.550933837890625, -10.84119987487793, -10.131465911865234, -9.421731948852539, -8.71199893951416, -8.002264976501465, -7.292531967163086, -6.582798004150391, -5.8730645179748535, -5.163331031799316, -4.453597068786621, -3.743863582611084, -3.034130096435547, -2.3243966102600098, -1.6146628856658936, -0.9049291610717773, -0.19519567489624023, 0.5145378112792969, 1.2242717742919922, 1.9340052604675293, 2.6437387466430664, 3.3534722328186035, 4.063205718994141, 4.772939682006836, 5.482673168182373, 6.19240665435791, 6.9021406173706055, 7.611874103546143, 8.32160758972168, 9.031341552734375, 9.741074562072754, 10.45080852508545, 11.160541534423828, 11.870275497436523, 12.580009460449219, 13.289743423461914, 13.999476432800293, 14.709210395812988, 15.418943405151367, 16.128677368164062, 16.838411331176758, 17.548145294189453, 18.257877349853516, 18.96761131286621, 19.677345275878906]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 0.0, 5.0, 5.0, 13.0, 7.0, 17.0, 16.0, 14.0, 18.0, 30.0, 21.0, 18.0, 28.0, 33.0, 36.0, 49.0, 43.0, 49.0, 54.0, 55.0, 35.0, 37.0, 46.0, 41.0, 40.0, 42.0, 30.0, 31.0, 34.0, 34.0, 28.0, 17.0, 9.0, 15.0, 12.0, 10.0, 3.0, 5.0, 4.0, 10.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.748046875, -2.66461181640625, -2.5811767578125, -2.49774169921875, -2.414306640625, -2.33087158203125, -2.2474365234375, -2.16400146484375, -2.08056640625, -1.99713134765625, -1.9136962890625, -1.83026123046875, -1.746826171875, -1.66339111328125, -1.5799560546875, -1.49652099609375, -1.4130859375, -1.32965087890625, -1.2462158203125, -1.16278076171875, -1.079345703125, -0.99591064453125, -0.9124755859375, -0.82904052734375, -0.74560546875, -0.66217041015625, -0.5787353515625, -0.49530029296875, -0.411865234375, -0.32843017578125, -0.2449951171875, -0.16156005859375, -0.078125, 0.00531005859375, 0.0887451171875, 0.17218017578125, 0.255615234375, 0.33905029296875, 0.4224853515625, 0.50592041015625, 0.58935546875, 0.67279052734375, 0.7562255859375, 0.83966064453125, 0.923095703125, 1.00653076171875, 1.0899658203125, 1.17340087890625, 1.2568359375, 1.34027099609375, 1.4237060546875, 1.50714111328125, 1.590576171875, 1.67401123046875, 1.7574462890625, 1.84088134765625, 1.92431640625, 2.00775146484375, 2.0911865234375, 2.17462158203125, 2.258056640625, 2.34149169921875, 2.4249267578125, 2.50836181640625, 2.591796875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 5.0, 9.0, 15.0, 12.0, 29.0, 35.0, 69.0, 100.0, 146.0, 197.0, 350.0, 475.0, 707.0, 1047.0, 1559.0, 2426.0, 3775.0, 5978.0, 9393.0, 14680.0, 23543.0, 39386.0, 70109.0, 137571.0, 280601.0, 214469.0, 102225.0, 54540.0, 31938.0, 19399.0, 12004.0, 7542.0, 4899.0, 3169.0, 2095.0, 1357.0, 947.0, 579.0, 355.0, 277.0, 170.0, 115.0, 85.0, 57.0, 34.0, 34.0, 23.0, 8.0, 12.0, 2.0, 2.0, 7.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0198822021484375, -0.0192568302154541, -0.018631458282470703, -0.018006086349487305, -0.017380714416503906, -0.016755342483520508, -0.01612997055053711, -0.015504598617553711, -0.014879226684570312, -0.014253854751586914, -0.013628482818603516, -0.013003110885620117, -0.012377738952636719, -0.01175236701965332, -0.011126995086669922, -0.010501623153686523, -0.009876251220703125, -0.009250879287719727, -0.008625507354736328, -0.00800013542175293, -0.007374763488769531, -0.006749391555786133, -0.006124019622802734, -0.005498647689819336, -0.0048732757568359375, -0.004247903823852539, -0.0036225318908691406, -0.002997159957885742, -0.0023717880249023438, -0.0017464160919189453, -0.0011210441589355469, -0.0004956722259521484, 0.00012969970703125, 0.0007550716400146484, 0.0013804435729980469, 0.0020058155059814453, 0.0026311874389648438, 0.003256559371948242, 0.0038819313049316406, 0.004507303237915039, 0.0051326751708984375, 0.005758047103881836, 0.006383419036865234, 0.007008790969848633, 0.007634162902832031, 0.00825953483581543, 0.008884906768798828, 0.009510278701782227, 0.010135650634765625, 0.010761022567749023, 0.011386394500732422, 0.01201176643371582, 0.012637138366699219, 0.013262510299682617, 0.013887882232666016, 0.014513254165649414, 0.015138626098632812, 0.01576399803161621, 0.01638936996459961, 0.017014741897583008, 0.017640113830566406, 0.018265485763549805, 0.018890857696533203, 0.0195162296295166, 0.0201416015625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 9.0, 8.0, 2.0, 14.0, 11.0, 12.0, 21.0, 17.0, 32.0, 25.0, 28.0, 27.0, 36.0, 35.0, 45.0, 27.0, 43.0, 50.0, 1078.0, 38.0, 45.0, 43.0, 31.0, 36.0, 45.0, 30.0, 31.0, 27.0, 29.0, 19.0, 23.0, 21.0, 19.0, 17.0, 14.0, 9.0, 9.0, 3.0, 6.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.951171875, -1.888092041015625, -1.82501220703125, -1.761932373046875, -1.6988525390625, -1.635772705078125, -1.57269287109375, -1.509613037109375, -1.446533203125, -1.383453369140625, -1.32037353515625, -1.257293701171875, -1.1942138671875, -1.131134033203125, -1.06805419921875, -1.004974365234375, -0.94189453125, -0.878814697265625, -0.81573486328125, -0.752655029296875, -0.6895751953125, -0.626495361328125, -0.56341552734375, -0.500335693359375, -0.437255859375, -0.374176025390625, -0.31109619140625, -0.248016357421875, -0.1849365234375, -0.121856689453125, -0.05877685546875, 0.004302978515625, 0.0673828125, 0.130462646484375, 0.19354248046875, 0.256622314453125, 0.3197021484375, 0.382781982421875, 0.44586181640625, 0.508941650390625, 0.572021484375, 0.635101318359375, 0.69818115234375, 0.761260986328125, 0.8243408203125, 0.887420654296875, 0.95050048828125, 1.013580322265625, 1.07666015625, 1.139739990234375, 1.20281982421875, 1.265899658203125, 1.3289794921875, 1.392059326171875, 1.45513916015625, 1.518218994140625, 1.581298828125, 1.644378662109375, 1.70745849609375, 1.770538330078125, 1.8336181640625, 1.896697998046875, 1.95977783203125, 2.022857666015625, 2.0859375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 5.0, 8.0, 17.0, 12.0, 32.0, 39.0, 38.0, 85.0, 86.0, 154.0, 237.0, 314.0, 423.0, 629.0, 915.0, 1462.0, 1970.0, 2882.0, 4336.0, 6236.0, 9400.0, 14248.0, 21677.0, 32710.0, 49995.0, 76836.0, 122110.0, 1239452.0, 181921.0, 115776.0, 72908.0, 47602.0, 30718.0, 20289.0, 13513.0, 8911.0, 6085.0, 4125.0, 2850.0, 1916.0, 1285.0, 850.0, 631.0, 469.0, 297.0, 223.0, 146.0, 91.0, 73.0, 50.0, 28.0, 23.0, 16.0, 9.0, 11.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0], "bins": [-0.006374359130859375, -0.00616830587387085, -0.005962252616882324, -0.005756199359893799, -0.0055501461029052734, -0.005344092845916748, -0.005138039588928223, -0.004931986331939697, -0.004725933074951172, -0.0045198798179626465, -0.004313826560974121, -0.004107773303985596, -0.0039017200469970703, -0.003695666790008545, -0.0034896135330200195, -0.003283560276031494, -0.0030775070190429688, -0.0028714537620544434, -0.002665400505065918, -0.0024593472480773926, -0.002253293991088867, -0.002047240734100342, -0.0018411874771118164, -0.001635134220123291, -0.0014290809631347656, -0.0012230277061462402, -0.0010169744491577148, -0.0008109211921691895, -0.0006048679351806641, -0.00039881467819213867, -0.00019276142120361328, 1.329183578491211e-05, 0.0002193450927734375, 0.0004253983497619629, 0.0006314516067504883, 0.0008375048637390137, 0.001043558120727539, 0.0012496113777160645, 0.0014556646347045898, 0.0016617178916931152, 0.0018677711486816406, 0.002073824405670166, 0.0022798776626586914, 0.002485930919647217, 0.002691984176635742, 0.0028980374336242676, 0.003104090690612793, 0.0033101439476013184, 0.0035161972045898438, 0.003722250461578369, 0.0039283037185668945, 0.00413435697555542, 0.004340410232543945, 0.004546463489532471, 0.004752516746520996, 0.0049585700035095215, 0.005164623260498047, 0.005370676517486572, 0.005576729774475098, 0.005782783031463623, 0.0059888362884521484, 0.006194889545440674, 0.006400942802429199, 0.006606996059417725, 0.00681304931640625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 0.0, 8.0, 0.0, 7.0, 8.0, 0.0, 17.0, 0.0, 21.0, 30.0, 0.0, 69.0, 119.0, 0.0, 420.0, 0.0, 140.0, 67.0, 0.0, 40.0, 0.0, 20.0, 14.0, 0.0, 10.0, 0.0, 10.0, 5.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.940696716308594e-07, -8.577480912208557e-07, -8.21426510810852e-07, -7.851049304008484e-07, -7.487833499908447e-07, -7.124617695808411e-07, -6.761401891708374e-07, -6.398186087608337e-07, -6.034970283508301e-07, -5.671754479408264e-07, -5.308538675308228e-07, -4.945322871208191e-07, -4.5821070671081543e-07, -4.2188912630081177e-07, -3.855675458908081e-07, -3.4924596548080444e-07, -3.129243850708008e-07, -2.766028046607971e-07, -2.4028122425079346e-07, -2.039596438407898e-07, -1.6763806343078613e-07, -1.3131648302078247e-07, -9.499490261077881e-08, -5.8673322200775146e-08, -2.2351741790771484e-08, 1.3969838619232178e-08, 5.029141902923584e-08, 8.66129994392395e-08, 1.2293457984924316e-07, 1.5925616025924683e-07, 1.955777406692505e-07, 2.3189932107925415e-07, 2.682209014892578e-07, 3.045424818992615e-07, 3.4086406230926514e-07, 3.771856427192688e-07, 4.1350722312927246e-07, 4.498288035392761e-07, 4.861503839492798e-07, 5.224719643592834e-07, 5.587935447692871e-07, 5.951151251792908e-07, 6.314367055892944e-07, 6.677582859992981e-07, 7.040798664093018e-07, 7.404014468193054e-07, 7.767230272293091e-07, 8.130446076393127e-07, 8.493661880493164e-07, 8.856877684593201e-07, 9.220093488693237e-07, 9.583309292793274e-07, 9.94652509689331e-07, 1.0309740900993347e-06, 1.0672956705093384e-06, 1.103617250919342e-06, 1.1399388313293457e-06, 1.1762604117393494e-06, 1.212581992149353e-06, 1.2489035725593567e-06, 1.2852251529693604e-06, 1.321546733379364e-06, 1.3578683137893677e-06, 1.3941898941993713e-06, 1.430511474609375e-06]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 9.0, 19.0, 20.0, 22.0, 48.0, 43.0, 93.0, 104.0, 209.0, 602.0, 11232.0, 1000464.0, 34165.0, 815.0, 293.0, 146.0, 84.0, 55.0, 40.0, 21.0, 20.0, 12.0, 10.0, 5.0, 4.0, 5.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9729137420654297e-05, -1.9189901649951935e-05, -1.8650665879249573e-05, -1.811143010854721e-05, -1.757219433784485e-05, -1.7032958567142487e-05, -1.6493722796440125e-05, -1.5954487025737762e-05, -1.54152512550354e-05, -1.4876015484333038e-05, -1.4336779713630676e-05, -1.3797543942928314e-05, -1.3258308172225952e-05, -1.271907240152359e-05, -1.2179836630821228e-05, -1.1640600860118866e-05, -1.1101365089416504e-05, -1.0562129318714142e-05, -1.002289354801178e-05, -9.483657777309418e-06, -8.944422006607056e-06, -8.405186235904694e-06, -7.865950465202332e-06, -7.3267146944999695e-06, -6.787478923797607e-06, -6.248243153095245e-06, -5.709007382392883e-06, -5.169771611690521e-06, -4.630535840988159e-06, -4.091300070285797e-06, -3.552064299583435e-06, -3.012828528881073e-06, -2.473592758178711e-06, -1.934356987476349e-06, -1.3951212167739868e-06, -8.558854460716248e-07, -3.166496753692627e-07, 2.2258609533309937e-07, 7.618218660354614e-07, 1.3010576367378235e-06, 1.8402934074401855e-06, 2.3795291781425476e-06, 2.9187649488449097e-06, 3.4580007195472717e-06, 3.997236490249634e-06, 4.536472260951996e-06, 5.075708031654358e-06, 5.61494380235672e-06, 6.154179573059082e-06, 6.693415343761444e-06, 7.232651114463806e-06, 7.771886885166168e-06, 8.31112265586853e-06, 8.850358426570892e-06, 9.389594197273254e-06, 9.928829967975616e-06, 1.0468065738677979e-05, 1.100730150938034e-05, 1.1546537280082703e-05, 1.2085773050785065e-05, 1.2625008821487427e-05, 1.3164244592189789e-05, 1.3703480362892151e-05, 1.4242716133594513e-05, 1.4781951904296875e-05]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 5.0, 67.0, 627.0, 296.0, 21.0], "bins": [-7.136484327929793e-06, -7.021114470262546e-06, -6.90574506734265e-06, -6.790375209675403e-06, -6.675005806755507e-06, -6.5596359490882605e-06, -6.444266546168365e-06, -6.328896688501118e-06, -6.213526830833871e-06, -6.098156973166624e-06, -5.982787570246728e-06, -5.867417712579481e-06, -5.752048309659585e-06, -5.6366784519923385e-06, -5.521308594325092e-06, -5.405939191405196e-06, -5.2905697884853e-06, -5.175199930818053e-06, -5.059830527898157e-06, -4.94446067023091e-06, -4.829091267311014e-06, -4.713721409643767e-06, -4.5983515519765206e-06, -4.482982149056625e-06, -4.367612291389378e-06, -4.252242433722131e-06, -4.136873030802235e-06, -4.021503173134988e-06, -3.906133770215092e-06, -3.7907639125478454e-06, -3.675394282254274e-06, -3.5600246519607026e-06, -3.4446545669197803e-06, -3.329284936626209e-06, -3.2139153063326376e-06, -3.098545676039066e-06, -2.9831758183718193e-06, -2.867806188078248e-06, -2.7524365577846766e-06, -2.637066927491105e-06, -2.5216972971975338e-06, -2.4063276669039624e-06, -2.290958036610391e-06, -2.175588178943144e-06, -2.0602185486495728e-06, -1.9448489183560014e-06, -1.82947928806243e-06, -1.7141096577688586e-06, -1.5987398001016118e-06, -1.4833701698080404e-06, -1.3680004258276313e-06, -1.2526307955340599e-06, -1.1372610515536508e-06, -1.0218914212600794e-06, -9.06521790966508e-07, -7.911521038295177e-07, -6.757824735359463e-07, -5.604127863989561e-07, -4.4504312768367527e-07, -3.2967346896839445e-07, -2.143037818314042e-07, -9.893409469441394e-08, 1.6435535599157447e-08, 1.318052227361477e-07, 2.4717490987313795e-07]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 18.0, 0.0, 0.0, 0.0, 39.0, 0.0, 0.0, 0.0, 0.0, 107.0, 0.0, 0.0, 0.0, 189.0, 0.0, 0.0, 0.0, 0.0, 315.0, 0.0, 0.0, 0.0, 0.0, 172.0, 0.0, 0.0, 0.0, 95.0, 0.0, 0.0, 0.0, 0.0, 49.0, 0.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, -3.4458935260772705e-07, -3.3155083656311035e-07, -3.1851232051849365e-07, -3.0547380447387695e-07, -2.9243528842926025e-07, -2.7939677238464355e-07, -2.6635825634002686e-07, -2.5331974029541016e-07, -2.4028122425079346e-07, -2.2724270820617676e-07, -2.1420419216156006e-07, -2.0116567611694336e-07, -1.8812716007232666e-07, -1.7508864402770996e-07, -1.6205012798309326e-07, -1.4901161193847656e-07, -1.3597309589385986e-07, -1.2293457984924316e-07, -1.0989606380462646e-07, -9.685754776000977e-08, -8.381903171539307e-08, -7.078051567077637e-08, -5.774199962615967e-08, -4.470348358154297e-08, -3.166496753692627e-08, -1.862645149230957e-08, -5.587935447692871e-09, 7.450580596923828e-09, 2.0489096641540527e-08, 3.3527612686157227e-08, 4.6566128730773926e-08, 5.960464477539063e-08, 7.264316082000732e-08, 8.568167686462402e-08, 9.872019290924072e-08, 1.1175870895385742e-07, 1.2479722499847412e-07, 1.3783574104309082e-07, 1.5087425708770752e-07, 1.6391277313232422e-07, 1.7695128917694092e-07, 1.8998980522155762e-07, 2.0302832126617432e-07, 2.1606683731079102e-07, 2.2910535335540771e-07, 2.421438694000244e-07, 2.551823854446411e-07, 2.682209014892578e-07, 2.812594175338745e-07, 2.942979335784912e-07, 3.073364496231079e-07, 3.203749656677246e-07, 3.334134817123413e-07, 3.46451997756958e-07, 3.594905138015747e-07, 3.725290298461914e-07, 3.855675458908081e-07, 3.986060619354248e-07, 4.116445779800415e-07, 4.246830940246582e-07, 4.377216100692749e-07, 4.507601261138916e-07, 4.637986421585083e-07, 4.76837158203125e-07]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 0.0, 5.0, 5.0, 13.0, 7.0, 17.0, 16.0, 14.0, 18.0, 30.0, 21.0, 18.0, 28.0, 33.0, 36.0, 49.0, 43.0, 49.0, 54.0, 55.0, 35.0, 37.0, 46.0, 41.0, 40.0, 42.0, 30.0, 31.0, 34.0, 34.0, 28.0, 17.0, 9.0, 15.0, 12.0, 10.0, 3.0, 5.0, 4.0, 10.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.748046875, -2.66461181640625, -2.5811767578125, -2.49774169921875, -2.414306640625, -2.33087158203125, -2.2474365234375, -2.16400146484375, -2.08056640625, -1.99713134765625, -1.9136962890625, -1.83026123046875, -1.746826171875, -1.66339111328125, -1.5799560546875, -1.49652099609375, -1.4130859375, -1.32965087890625, -1.2462158203125, -1.16278076171875, -1.079345703125, -0.99591064453125, -0.9124755859375, -0.82904052734375, -0.74560546875, -0.66217041015625, -0.5787353515625, -0.49530029296875, -0.411865234375, -0.32843017578125, -0.2449951171875, -0.16156005859375, -0.078125, 0.00531005859375, 0.0887451171875, 0.17218017578125, 0.255615234375, 0.33905029296875, 0.4224853515625, 0.50592041015625, 0.58935546875, 0.67279052734375, 0.7562255859375, 0.83966064453125, 0.923095703125, 1.00653076171875, 1.0899658203125, 1.17340087890625, 1.2568359375, 1.34027099609375, 1.4237060546875, 1.50714111328125, 1.590576171875, 1.67401123046875, 1.7574462890625, 1.84088134765625, 1.92431640625, 2.00775146484375, 2.0911865234375, 2.17462158203125, 2.258056640625, 2.34149169921875, 2.4249267578125, 2.50836181640625, 2.591796875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 7.0, 17.0, 19.0, 40.0, 61.0, 91.0, 137.0, 220.0, 309.0, 523.0, 823.0, 1283.0, 1961.0, 3028.0, 4542.0, 7099.0, 11344.0, 19666.0, 37971.0, 95018.0, 418067.0, 292169.0, 75878.0, 32297.0, 17134.0, 10534.0, 6493.0, 4156.0, 2657.0, 1824.0, 1138.0, 687.0, 490.0, 322.0, 194.0, 131.0, 78.0, 56.0, 36.0, 27.0, 10.0, 5.0, 12.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.509765625, -3.39971923828125, -3.2896728515625, -3.17962646484375, -3.069580078125, -2.95953369140625, -2.8494873046875, -2.73944091796875, -2.62939453125, -2.51934814453125, -2.4093017578125, -2.29925537109375, -2.189208984375, -2.07916259765625, -1.9691162109375, -1.85906982421875, -1.7490234375, -1.63897705078125, -1.5289306640625, -1.41888427734375, -1.308837890625, -1.19879150390625, -1.0887451171875, -0.97869873046875, -0.86865234375, -0.75860595703125, -0.6485595703125, -0.53851318359375, -0.428466796875, -0.31842041015625, -0.2083740234375, -0.09832763671875, 0.01171875, 0.12176513671875, 0.2318115234375, 0.34185791015625, 0.451904296875, 0.56195068359375, 0.6719970703125, 0.78204345703125, 0.89208984375, 1.00213623046875, 1.1121826171875, 1.22222900390625, 1.332275390625, 1.44232177734375, 1.5523681640625, 1.66241455078125, 1.7724609375, 1.88250732421875, 1.9925537109375, 2.10260009765625, 2.212646484375, 2.32269287109375, 2.4327392578125, 2.54278564453125, 2.65283203125, 2.76287841796875, 2.8729248046875, 2.98297119140625, 3.093017578125, 3.20306396484375, 3.3131103515625, 3.42315673828125, 3.533203125]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 5.0, 1.0, 10.0, 10.0, 11.0, 11.0, 18.0, 24.0, 22.0, 23.0, 29.0, 25.0, 24.0, 43.0, 41.0, 54.0, 66.0, 74.0, 167.0, 1493.0, 291.0, 119.0, 78.0, 59.0, 57.0, 45.0, 39.0, 26.0, 20.0, 30.0, 22.0, 26.0, 17.0, 15.0, 6.0, 13.0, 5.0, 8.0, 4.0, 1.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1015625, -7.82958984375, -7.5576171875, -7.28564453125, -7.013671875, -6.74169921875, -6.4697265625, -6.19775390625, -5.92578125, -5.65380859375, -5.3818359375, -5.10986328125, -4.837890625, -4.56591796875, -4.2939453125, -4.02197265625, -3.75, -3.47802734375, -3.2060546875, -2.93408203125, -2.662109375, -2.39013671875, -2.1181640625, -1.84619140625, -1.57421875, -1.30224609375, -1.0302734375, -0.75830078125, -0.486328125, -0.21435546875, 0.0576171875, 0.32958984375, 0.6015625, 0.87353515625, 1.1455078125, 1.41748046875, 1.689453125, 1.96142578125, 2.2333984375, 2.50537109375, 2.77734375, 3.04931640625, 3.3212890625, 3.59326171875, 3.865234375, 4.13720703125, 4.4091796875, 4.68115234375, 4.953125, 5.22509765625, 5.4970703125, 5.76904296875, 6.041015625, 6.31298828125, 6.5849609375, 6.85693359375, 7.12890625, 7.40087890625, 7.6728515625, 7.94482421875, 8.216796875, 8.48876953125, 8.7607421875, 9.03271484375, 9.3046875]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 3.0, 6.0, 6.0, 13.0, 9.0, 15.0, 16.0, 23.0, 30.0, 40.0, 47.0, 50.0, 85.0, 124.0, 206.0, 383.0, 988.0, 4584.0, 34247.0, 1769883.0, 1297256.0, 31349.0, 4390.0, 941.0, 314.0, 182.0, 149.0, 86.0, 67.0, 39.0, 28.0, 33.0, 20.0, 22.0, 14.0, 13.0, 12.0, 6.0, 9.0, 1.0, 7.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.734375, -15.2713623046875, -14.808349609375, -14.3453369140625, -13.88232421875, -13.4193115234375, -12.956298828125, -12.4932861328125, -12.0302734375, -11.5672607421875, -11.104248046875, -10.6412353515625, -10.17822265625, -9.7152099609375, -9.252197265625, -8.7891845703125, -8.326171875, -7.8631591796875, -7.400146484375, -6.9371337890625, -6.47412109375, -6.0111083984375, -5.548095703125, -5.0850830078125, -4.6220703125, -4.1590576171875, -3.696044921875, -3.2330322265625, -2.77001953125, -2.3070068359375, -1.843994140625, -1.3809814453125, -0.91796875, -0.4549560546875, 0.008056640625, 0.4710693359375, 0.93408203125, 1.3970947265625, 1.860107421875, 2.3231201171875, 2.7861328125, 3.2491455078125, 3.712158203125, 4.1751708984375, 4.63818359375, 5.1011962890625, 5.564208984375, 6.0272216796875, 6.490234375, 6.9532470703125, 7.416259765625, 7.8792724609375, 8.34228515625, 8.8052978515625, 9.268310546875, 9.7313232421875, 10.1943359375, 10.6573486328125, 11.120361328125, 11.5833740234375, 12.04638671875, 12.5093994140625, 12.972412109375, 13.4354248046875, 13.8984375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 28.0, 65.0, 194.0, 315.0, 234.0, 117.0, 45.0, 10.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.07544708251953, -31.556636810302734, -30.03782844543457, -28.519018173217773, -27.000207901000977, -25.481399536132812, -23.962589263916016, -22.44377899169922, -20.924968719482422, -19.406158447265625, -17.88735008239746, -16.368539810180664, -14.849729537963867, -13.330920219421387, -11.812110900878906, -10.29330062866211, -8.774492263793945, -7.255682468414307, -5.736872673034668, -4.2180633544921875, -2.699253559112549, -1.1804437637329102, 0.3383655548095703, 1.8571758270263672, 3.3759851455688477, 4.894794940948486, 6.413604736328125, 7.9324140548706055, 9.451223373413086, 10.970033645629883, 12.488842964172363, 14.00765323638916, 15.52646255493164, 17.045272827148438, 18.5640811920166, 20.0828914642334, 21.601701736450195, 23.12051010131836, 24.639320373535156, 26.158130645751953, 27.67694091796875, 29.195751190185547, 30.71455955505371, 32.233367919921875, 33.75217819213867, 35.27098846435547, 36.789798736572266, 38.30860900878906, 39.827415466308594, 41.34622573852539, 42.86503601074219, 44.38384246826172, 45.902652740478516, 47.42146301269531, 48.94027328491211, 50.459083557128906, 51.9778938293457, 53.4967041015625, 55.0155143737793, 56.534324645996094, 58.053131103515625, 59.57194137573242, 61.09075164794922, 62.609561920166016, 64.12837219238281]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 4.0, 8.0, 6.0, 7.0, 8.0, 15.0, 19.0, 19.0, 20.0, 16.0, 20.0, 32.0, 22.0, 34.0, 37.0, 61.0, 25.0, 54.0, 45.0, 57.0, 44.0, 43.0, 49.0, 47.0, 36.0, 34.0, 28.0, 27.0, 26.0, 26.0, 30.0, 23.0, 17.0, 14.0, 10.0, 9.0, 5.0, 8.0, 3.0, 4.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.180925369262695, -21.36521339416504, -20.549503326416016, -19.73379135131836, -18.918079376220703, -18.102367401123047, -17.286657333374023, -16.470945358276367, -15.655233383178711, -14.839522361755371, -14.023810386657715, -13.208099365234375, -12.392387390136719, -11.576676368713379, -10.760965347290039, -9.945253372192383, -9.129542350769043, -8.313831329345703, -7.498119354248047, -6.682408332824707, -5.866696357727051, -5.050985336303711, -4.235273838043213, -3.419562339782715, -2.603850841522217, -1.7881393432617188, -0.9724279642105103, -0.15671658515930176, 0.6589949131011963, 1.4747061729431152, 2.2904176712036133, 3.1061291694641113, 3.9218406677246094, 4.737552165985107, 5.5532636642456055, 6.368974685668945, 7.184686660766602, 8.000397682189941, 8.816108703613281, 9.631820678710938, 10.447532653808594, 11.263243675231934, 12.07895565032959, 12.89466667175293, 13.710378646850586, 14.526089668273926, 15.341800689697266, 16.157512664794922, 16.973224639892578, 17.788936614990234, 18.604646682739258, 19.420358657836914, 20.23607063293457, 21.051780700683594, 21.86749267578125, 22.683204650878906, 23.49891471862793, 24.314626693725586, 25.13033676147461, 25.946048736572266, 26.761760711669922, 27.577472686767578, 28.3931827545166, 29.208894729614258, 30.024606704711914]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 4.0, 9.0, 8.0, 15.0, 14.0, 17.0, 24.0, 23.0, 20.0, 19.0, 29.0, 35.0, 37.0, 35.0, 45.0, 60.0, 47.0, 54.0, 44.0, 42.0, 29.0, 45.0, 47.0, 45.0, 33.0, 32.0, 38.0, 27.0, 24.0, 20.0, 15.0, 11.0, 11.0, 8.0, 8.0, 5.0, 5.0, 8.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.79296875, -2.706024169921875, -2.61907958984375, -2.532135009765625, -2.4451904296875, -2.358245849609375, -2.27130126953125, -2.184356689453125, -2.097412109375, -2.010467529296875, -1.92352294921875, -1.836578369140625, -1.7496337890625, -1.662689208984375, -1.57574462890625, -1.488800048828125, -1.40185546875, -1.314910888671875, -1.22796630859375, -1.141021728515625, -1.0540771484375, -0.967132568359375, -0.88018798828125, -0.793243408203125, -0.706298828125, -0.619354248046875, -0.53240966796875, -0.445465087890625, -0.3585205078125, -0.271575927734375, -0.18463134765625, -0.097686767578125, -0.0107421875, 0.076202392578125, 0.16314697265625, 0.250091552734375, 0.3370361328125, 0.423980712890625, 0.51092529296875, 0.597869873046875, 0.684814453125, 0.771759033203125, 0.85870361328125, 0.945648193359375, 1.0325927734375, 1.119537353515625, 1.20648193359375, 1.293426513671875, 1.38037109375, 1.467315673828125, 1.55426025390625, 1.641204833984375, 1.7281494140625, 1.815093994140625, 1.90203857421875, 1.988983154296875, 2.075927734375, 2.162872314453125, 2.24981689453125, 2.336761474609375, 2.4237060546875, 2.510650634765625, 2.59759521484375, 2.684539794921875, 2.771484375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 6.0, 3.0, 10.0, 4.0, 11.0, 2.0, 13.0, 16.0, 24.0, 28.0, 42.0, 59.0, 73.0, 141.0, 219.0, 459.0, 1138.0, 2987.0, 10215.0, 47130.0, 349899.0, 2862391.0, 809894.0, 85754.0, 16344.0, 4520.0, 1556.0, 571.0, 273.0, 169.0, 103.0, 61.0, 49.0, 25.0, 26.0, 13.0, 11.0, 9.0, 9.0, 7.0, 4.0, 9.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.59375, -9.300048828125, -9.00634765625, -8.712646484375, -8.4189453125, -8.125244140625, -7.83154296875, -7.537841796875, -7.244140625, -6.950439453125, -6.65673828125, -6.363037109375, -6.0693359375, -5.775634765625, -5.48193359375, -5.188232421875, -4.89453125, -4.600830078125, -4.30712890625, -4.013427734375, -3.7197265625, -3.426025390625, -3.13232421875, -2.838623046875, -2.544921875, -2.251220703125, -1.95751953125, -1.663818359375, -1.3701171875, -1.076416015625, -0.78271484375, -0.489013671875, -0.1953125, 0.098388671875, 0.39208984375, 0.685791015625, 0.9794921875, 1.273193359375, 1.56689453125, 1.860595703125, 2.154296875, 2.447998046875, 2.74169921875, 3.035400390625, 3.3291015625, 3.622802734375, 3.91650390625, 4.210205078125, 4.50390625, 4.797607421875, 5.09130859375, 5.385009765625, 5.6787109375, 5.972412109375, 6.26611328125, 6.559814453125, 6.853515625, 7.147216796875, 7.44091796875, 7.734619140625, 8.0283203125, 8.322021484375, 8.61572265625, 8.909423828125, 9.203125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 10.0, 10.0, 11.0, 14.0, 26.0, 44.0, 68.0, 92.0, 158.0, 200.0, 254.0, 337.0, 457.0, 540.0, 513.0, 408.0, 267.0, 206.0, 131.0, 94.0, 65.0, 53.0, 37.0, 32.0, 13.0, 14.0, 10.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.38671875, -7.14520263671875, -6.9036865234375, -6.66217041015625, -6.420654296875, -6.17913818359375, -5.9376220703125, -5.69610595703125, -5.45458984375, -5.21307373046875, -4.9715576171875, -4.73004150390625, -4.488525390625, -4.24700927734375, -4.0054931640625, -3.76397705078125, -3.5224609375, -3.28094482421875, -3.0394287109375, -2.79791259765625, -2.556396484375, -2.31488037109375, -2.0733642578125, -1.83184814453125, -1.59033203125, -1.34881591796875, -1.1072998046875, -0.86578369140625, -0.624267578125, -0.38275146484375, -0.1412353515625, 0.10028076171875, 0.341796875, 0.58331298828125, 0.8248291015625, 1.06634521484375, 1.307861328125, 1.54937744140625, 1.7908935546875, 2.03240966796875, 2.27392578125, 2.51544189453125, 2.7569580078125, 2.99847412109375, 3.239990234375, 3.48150634765625, 3.7230224609375, 3.96453857421875, 4.2060546875, 4.44757080078125, 4.6890869140625, 4.93060302734375, 5.172119140625, 5.41363525390625, 5.6551513671875, 5.89666748046875, 6.13818359375, 6.37969970703125, 6.6212158203125, 6.86273193359375, 7.104248046875, 7.34576416015625, 7.5872802734375, 7.82879638671875, 8.0703125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 16.0, 19.0, 23.0, 41.0, 52.0, 107.0, 194.0, 338.0, 630.0, 1606.0, 7380.0, 85722.0, 2039203.0, 1966070.0, 82789.0, 7127.0, 1536.0, 658.0, 348.0, 192.0, 90.0, 61.0, 28.0, 12.0, 16.0, 7.0, 11.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0], "bins": [-22.109375, -21.4951171875, -20.880859375, -20.2666015625, -19.65234375, -19.0380859375, -18.423828125, -17.8095703125, -17.1953125, -16.5810546875, -15.966796875, -15.3525390625, -14.73828125, -14.1240234375, -13.509765625, -12.8955078125, -12.28125, -11.6669921875, -11.052734375, -10.4384765625, -9.82421875, -9.2099609375, -8.595703125, -7.9814453125, -7.3671875, -6.7529296875, -6.138671875, -5.5244140625, -4.91015625, -4.2958984375, -3.681640625, -3.0673828125, -2.453125, -1.8388671875, -1.224609375, -0.6103515625, 0.00390625, 0.6181640625, 1.232421875, 1.8466796875, 2.4609375, 3.0751953125, 3.689453125, 4.3037109375, 4.91796875, 5.5322265625, 6.146484375, 6.7607421875, 7.375, 7.9892578125, 8.603515625, 9.2177734375, 9.83203125, 10.4462890625, 11.060546875, 11.6748046875, 12.2890625, 12.9033203125, 13.517578125, 14.1318359375, 14.74609375, 15.3603515625, 15.974609375, 16.5888671875, 17.203125]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [2.0, 12.0, 50.0, 112.0, 264.0, 281.0, 190.0, 78.0, 22.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.87179183959961, -15.284139633178711, -11.696486473083496, -8.108833312988281, -4.521181106567383, -0.9335289001464844, 2.654125213623047, 6.241777420043945, 9.829429626464844, 13.417081832885742, 17.00473403930664, 20.592388153076172, 24.18004035949707, 27.76769256591797, 31.3553466796875, 34.94300079345703, 38.5306510925293, 42.11830520629883, 45.705955505371094, 49.293609619140625, 52.881263732910156, 56.46891403198242, 60.05656814575195, 63.64421844482422, 67.23187255859375, 70.81952667236328, 74.40718078613281, 77.99482727050781, 81.58248138427734, 85.17013549804688, 88.7577896118164, 92.34544372558594, 95.93309020996094, 99.52074432373047, 103.1083984375, 106.696044921875, 110.28369903564453, 113.87135314941406, 117.4590072631836, 121.04666137695312, 124.63430786132812, 128.22195434570312, 131.8096160888672, 135.3972625732422, 138.98492431640625, 142.57257080078125, 146.16021728515625, 149.7478790283203, 153.33554077148438, 156.92318725585938, 160.51084899902344, 164.09849548339844, 167.6861572265625, 171.2738037109375, 174.8614501953125, 178.44911193847656, 182.03675842285156, 185.62440490722656, 189.21206665039062, 192.79971313476562, 196.3873748779297, 199.9750213623047, 203.56268310546875, 207.15032958984375, 210.73797607421875]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 4.0, 8.0, 6.0, 8.0, 9.0, 9.0, 15.0, 18.0, 23.0, 18.0, 26.0, 27.0, 31.0, 42.0, 35.0, 55.0, 46.0, 42.0, 65.0, 40.0, 39.0, 38.0, 46.0, 44.0, 33.0, 39.0, 30.0, 37.0, 28.0, 24.0, 27.0, 21.0, 17.0, 12.0, 17.0, 3.0, 4.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.712013244628906, -22.931381225585938, -22.1507511138916, -21.370121002197266, -20.589488983154297, -19.808856964111328, -19.028226852416992, -18.247596740722656, -17.466964721679688, -16.68633270263672, -15.905702590942383, -15.12507152557373, -14.344440460205078, -13.563809394836426, -12.783178329467773, -12.002547264099121, -11.221916198730469, -10.441285133361816, -9.660654067993164, -8.880023002624512, -8.09939193725586, -7.318760871887207, -6.538129806518555, -5.757498741149902, -4.97686767578125, -4.196236610412598, -3.4156055450439453, -2.634974479675293, -1.8543434143066406, -1.0737123489379883, -0.29308128356933594, 0.4875497817993164, 1.2681808471679688, 2.048811912536621, 2.8294429779052734, 3.610074043273926, 4.390705108642578, 5.1713361740112305, 5.951967239379883, 6.732598304748535, 7.5132293701171875, 8.29386043548584, 9.074491500854492, 9.855122566223145, 10.635753631591797, 11.41638469696045, 12.197015762329102, 12.977646827697754, 13.758277893066406, 14.538908958435059, 15.319540023803711, 16.100170135498047, 16.880802154541016, 17.661434173583984, 18.44206428527832, 19.222694396972656, 20.003326416015625, 20.783958435058594, 21.56458854675293, 22.345218658447266, 23.125850677490234, 23.906482696533203, 24.68711280822754, 25.467742919921875, 26.248374938964844]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 8.0, 8.0, 10.0, 9.0, 16.0, 17.0, 21.0, 20.0, 22.0, 32.0, 20.0, 26.0, 35.0, 41.0, 53.0, 40.0, 48.0, 51.0, 40.0, 56.0, 39.0, 41.0, 38.0, 46.0, 34.0, 33.0, 37.0, 30.0, 22.0, 28.0, 12.0, 16.0, 12.0, 7.0, 6.0, 5.0, 3.0, 5.0, 5.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.880859375, -2.7918701171875, -2.702880859375, -2.6138916015625, -2.52490234375, -2.4359130859375, -2.346923828125, -2.2579345703125, -2.1689453125, -2.0799560546875, -1.990966796875, -1.9019775390625, -1.81298828125, -1.7239990234375, -1.635009765625, -1.5460205078125, -1.45703125, -1.3680419921875, -1.279052734375, -1.1900634765625, -1.10107421875, -1.0120849609375, -0.923095703125, -0.8341064453125, -0.7451171875, -0.6561279296875, -0.567138671875, -0.4781494140625, -0.38916015625, -0.3001708984375, -0.211181640625, -0.1221923828125, -0.033203125, 0.0557861328125, 0.144775390625, 0.2337646484375, 0.32275390625, 0.4117431640625, 0.500732421875, 0.5897216796875, 0.6787109375, 0.7677001953125, 0.856689453125, 0.9456787109375, 1.03466796875, 1.1236572265625, 1.212646484375, 1.3016357421875, 1.390625, 1.4796142578125, 1.568603515625, 1.6575927734375, 1.74658203125, 1.8355712890625, 1.924560546875, 2.0135498046875, 2.1025390625, 2.1915283203125, 2.280517578125, 2.3695068359375, 2.45849609375, 2.5474853515625, 2.636474609375, 2.7254638671875, 2.814453125]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 8.0, 7.0, 9.0, 19.0, 22.0, 36.0, 61.0, 89.0, 101.0, 154.0, 234.0, 321.0, 492.0, 719.0, 1121.0, 1646.0, 2564.0, 3869.0, 6192.0, 9859.0, 15740.0, 25766.0, 44479.0, 79245.0, 148954.0, 270778.0, 194906.0, 101002.0, 56125.0, 32278.0, 19127.0, 11638.0, 7423.0, 4678.0, 2985.0, 1892.0, 1315.0, 871.0, 569.0, 383.0, 281.0, 204.0, 119.0, 93.0, 55.0, 37.0, 31.0, 20.0, 15.0, 6.0, 12.0, 0.0, 3.0, 4.0, 3.0, 2.0, 1.0], "bins": [-0.021026611328125, -0.020383596420288086, -0.019740581512451172, -0.019097566604614258, -0.018454551696777344, -0.01781153678894043, -0.017168521881103516, -0.0165255069732666, -0.015882492065429688, -0.015239477157592773, -0.01459646224975586, -0.013953447341918945, -0.013310432434082031, -0.012667417526245117, -0.012024402618408203, -0.011381387710571289, -0.010738372802734375, -0.010095357894897461, -0.009452342987060547, -0.008809328079223633, -0.008166313171386719, -0.007523298263549805, -0.006880283355712891, -0.0062372684478759766, -0.0055942535400390625, -0.0049512386322021484, -0.004308223724365234, -0.0036652088165283203, -0.0030221939086914062, -0.002379179000854492, -0.0017361640930175781, -0.001093149185180664, -0.00045013427734375, 0.00019288063049316406, 0.0008358955383300781, 0.0014789104461669922, 0.0021219253540039062, 0.0027649402618408203, 0.0034079551696777344, 0.0040509700775146484, 0.0046939849853515625, 0.0053369998931884766, 0.005980014801025391, 0.006623029708862305, 0.007266044616699219, 0.007909059524536133, 0.008552074432373047, 0.009195089340209961, 0.009838104248046875, 0.010481119155883789, 0.011124134063720703, 0.011767148971557617, 0.012410163879394531, 0.013053178787231445, 0.01369619369506836, 0.014339208602905273, 0.014982223510742188, 0.0156252384185791, 0.016268253326416016, 0.01691126823425293, 0.017554283142089844, 0.018197298049926758, 0.018840312957763672, 0.019483327865600586, 0.0201263427734375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 7.0, 4.0, 10.0, 6.0, 9.0, 8.0, 13.0, 17.0, 13.0, 23.0, 14.0, 21.0, 28.0, 31.0, 27.0, 21.0, 30.0, 28.0, 31.0, 46.0, 29.0, 40.0, 38.0, 1064.0, 41.0, 39.0, 32.0, 30.0, 30.0, 31.0, 27.0, 23.0, 22.0, 34.0, 14.0, 20.0, 24.0, 15.0, 16.0, 20.0, 12.0, 3.0, 9.0, 10.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7353515625, -1.6803741455078125, -1.625396728515625, -1.5704193115234375, -1.51544189453125, -1.4604644775390625, -1.405487060546875, -1.3505096435546875, -1.2955322265625, -1.2405548095703125, -1.185577392578125, -1.1305999755859375, -1.07562255859375, -1.0206451416015625, -0.965667724609375, -0.9106903076171875, -0.855712890625, -0.8007354736328125, -0.745758056640625, -0.6907806396484375, -0.63580322265625, -0.5808258056640625, -0.525848388671875, -0.4708709716796875, -0.4158935546875, -0.3609161376953125, -0.305938720703125, -0.2509613037109375, -0.19598388671875, -0.1410064697265625, -0.086029052734375, -0.0310516357421875, 0.02392578125, 0.0789031982421875, 0.133880615234375, 0.1888580322265625, 0.24383544921875, 0.2988128662109375, 0.353790283203125, 0.4087677001953125, 0.4637451171875, 0.5187225341796875, 0.573699951171875, 0.6286773681640625, 0.68365478515625, 0.7386322021484375, 0.793609619140625, 0.8485870361328125, 0.903564453125, 0.9585418701171875, 1.013519287109375, 1.0684967041015625, 1.12347412109375, 1.1784515380859375, 1.233428955078125, 1.2884063720703125, 1.3433837890625, 1.3983612060546875, 1.453338623046875, 1.5083160400390625, 1.56329345703125, 1.6182708740234375, 1.673248291015625, 1.7282257080078125, 1.783203125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 7.0, 13.0, 28.0, 33.0, 45.0, 71.0, 82.0, 126.0, 183.0, 336.0, 446.0, 687.0, 967.0, 1513.0, 2252.0, 3179.0, 5026.0, 7502.0, 11332.0, 17503.0, 26539.0, 40020.0, 60475.0, 92853.0, 146375.0, 1245461.0, 152208.0, 96928.0, 62689.0, 41650.0, 27400.0, 17994.0, 11878.0, 7825.0, 5099.0, 3404.0, 2302.0, 1548.0, 1062.0, 670.0, 478.0, 310.0, 204.0, 158.0, 78.0, 76.0, 48.0, 26.0, 24.0, 11.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.00675201416015625, -0.006544530391693115, -0.0063370466232299805, -0.006129562854766846, -0.005922079086303711, -0.005714595317840576, -0.005507111549377441, -0.005299627780914307, -0.005092144012451172, -0.004884660243988037, -0.004677176475524902, -0.004469692707061768, -0.004262208938598633, -0.004054725170135498, -0.0038472414016723633, -0.0036397576332092285, -0.0034322738647460938, -0.003224790096282959, -0.0030173063278198242, -0.0028098225593566895, -0.0026023387908935547, -0.00239485502243042, -0.002187371253967285, -0.0019798874855041504, -0.0017724037170410156, -0.0015649199485778809, -0.001357436180114746, -0.0011499524116516113, -0.0009424686431884766, -0.0007349848747253418, -0.000527501106262207, -0.00032001733779907227, -0.0001125335693359375, 9.495019912719727e-05, 0.00030243396759033203, 0.0005099177360534668, 0.0007174015045166016, 0.0009248852729797363, 0.001132369041442871, 0.0013398528099060059, 0.0015473365783691406, 0.0017548203468322754, 0.00196230411529541, 0.002169787883758545, 0.0023772716522216797, 0.0025847554206848145, 0.0027922391891479492, 0.002999722957611084, 0.0032072067260742188, 0.0034146904945373535, 0.0036221742630004883, 0.003829658031463623, 0.004037141799926758, 0.004244625568389893, 0.004452109336853027, 0.004659593105316162, 0.004867076873779297, 0.005074560642242432, 0.005282044410705566, 0.005489528179168701, 0.005697011947631836, 0.005904495716094971, 0.0061119794845581055, 0.00631946325302124, 0.006526947021484375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 6.0, 0.0, 0.0, 4.0, 0.0, 0.0, 11.0, 0.0, 9.0, 0.0, 0.0, 12.0, 0.0, 0.0, 8.0, 0.0, 14.0, 0.0, 0.0, 25.0, 0.0, 0.0, 33.0, 0.0, 69.0, 0.0, 0.0, 116.0, 0.0, 0.0, 399.0, 0.0, 113.0, 0.0, 0.0, 77.0, 0.0, 0.0, 29.0, 0.0, 27.0, 0.0, 0.0, 13.0, 0.0, 0.0, 21.0, 0.0, 11.0, 0.0, 0.0, 6.0, 0.0, 0.0, 7.0, 0.0, 5.0, 0.0, 0.0, 5.0, 0.0, 2.0], "bins": [-7.152557373046875e-07, -6.92903995513916e-07, -6.705522537231445e-07, -6.48200511932373e-07, -6.258487701416016e-07, -6.034970283508301e-07, -5.811452865600586e-07, -5.587935447692871e-07, -5.364418029785156e-07, -5.140900611877441e-07, -4.917383193969727e-07, -4.6938657760620117e-07, -4.470348358154297e-07, -4.246830940246582e-07, -4.023313522338867e-07, -3.7997961044311523e-07, -3.5762786865234375e-07, -3.3527612686157227e-07, -3.129243850708008e-07, -2.905726432800293e-07, -2.682209014892578e-07, -2.4586915969848633e-07, -2.2351741790771484e-07, -2.0116567611694336e-07, -1.7881393432617188e-07, -1.564621925354004e-07, -1.341104507446289e-07, -1.1175870895385742e-07, -8.940696716308594e-08, -6.705522537231445e-08, -4.470348358154297e-08, -2.2351741790771484e-08, 0.0, 2.2351741790771484e-08, 4.470348358154297e-08, 6.705522537231445e-08, 8.940696716308594e-08, 1.1175870895385742e-07, 1.341104507446289e-07, 1.564621925354004e-07, 1.7881393432617188e-07, 2.0116567611694336e-07, 2.2351741790771484e-07, 2.4586915969848633e-07, 2.682209014892578e-07, 2.905726432800293e-07, 3.129243850708008e-07, 3.3527612686157227e-07, 3.5762786865234375e-07, 3.7997961044311523e-07, 4.023313522338867e-07, 4.246830940246582e-07, 4.470348358154297e-07, 4.6938657760620117e-07, 4.917383193969727e-07, 5.140900611877441e-07, 5.364418029785156e-07, 5.587935447692871e-07, 5.811452865600586e-07, 6.034970283508301e-07, 6.258487701416016e-07, 6.48200511932373e-07, 6.705522537231445e-07, 6.92903995513916e-07, 7.152557373046875e-07]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 7.0, 5.0, 6.0, 11.0, 11.0, 13.0, 16.0, 22.0, 33.0, 37.0, 33.0, 48.0, 96.0, 130.0, 178.0, 328.0, 846.0, 13193.0, 763329.0, 264311.0, 4578.0, 471.0, 256.0, 149.0, 105.0, 84.0, 73.0, 29.0, 35.0, 24.0, 15.0, 15.0, 10.0, 6.0, 3.0, 2.0, 7.0, 4.0, 7.0, 3.0, 4.0, 5.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.1980533599853516e-05, -1.1604279279708862e-05, -1.1228024959564209e-05, -1.0851770639419556e-05, -1.0475516319274902e-05, -1.0099261999130249e-05, -9.723007678985596e-06, -9.346753358840942e-06, -8.970499038696289e-06, -8.594244718551636e-06, -8.217990398406982e-06, -7.841736078262329e-06, -7.465481758117676e-06, -7.0892274379730225e-06, -6.712973117828369e-06, -6.336718797683716e-06, -5.9604644775390625e-06, -5.584210157394409e-06, -5.207955837249756e-06, -4.8317015171051025e-06, -4.455447196960449e-06, -4.079192876815796e-06, -3.7029385566711426e-06, -3.3266842365264893e-06, -2.950429916381836e-06, -2.5741755962371826e-06, -2.1979212760925293e-06, -1.821666955947876e-06, -1.4454126358032227e-06, -1.0691583156585693e-06, -6.92903995513916e-07, -3.166496753692627e-07, 5.960464477539063e-08, 4.3585896492004395e-07, 8.121132850646973e-07, 1.1883676052093506e-06, 1.564621925354004e-06, 1.9408762454986572e-06, 2.3171305656433105e-06, 2.693384885787964e-06, 3.069639205932617e-06, 3.4458935260772705e-06, 3.822147846221924e-06, 4.198402166366577e-06, 4.5746564865112305e-06, 4.950910806655884e-06, 5.327165126800537e-06, 5.7034194469451904e-06, 6.079673767089844e-06, 6.455928087234497e-06, 6.83218240737915e-06, 7.208436727523804e-06, 7.584691047668457e-06, 7.96094536781311e-06, 8.337199687957764e-06, 8.713454008102417e-06, 9.08970832824707e-06, 9.465962648391724e-06, 9.842216968536377e-06, 1.021847128868103e-05, 1.0594725608825684e-05, 1.0970979928970337e-05, 1.134723424911499e-05, 1.1723488569259644e-05, 1.2099742889404297e-05]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 20.0, 26.0, 74.0, 118.0, 404.0, 168.0, 100.0, 49.0, 30.0, 11.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.429752374970121e-07, -6.088771442591678e-07, -5.747790510213235e-07, -5.406809009400604e-07, -5.065828077022161e-07, -4.724847144643718e-07, -4.3838659280481806e-07, -4.0428847114526434e-07, -3.7019037790742004e-07, -3.3609228466957575e-07, -3.01994163010022e-07, -2.678960413504683e-07, -2.33797948112624e-07, -1.99699840663925e-07, -1.6560173321522598e-07, -1.3150361155567225e-07, -9.740551831782795e-08, -6.330741086912894e-08, -2.9209303420429933e-08, 4.888804028269078e-09, 3.898691147696809e-08, 7.30850189256671e-08, 1.0718312637436611e-07, 1.4128124803391984e-07, 1.7537934127176413e-07, 2.0947744872046314e-07, 2.4357555616916216e-07, 2.776736778287159e-07, 3.117717710665602e-07, 3.4586986430440447e-07, 3.799679859639582e-07, 4.140661076235119e-07, 4.481640871745185e-07, 4.822621804123628e-07, 5.163602736502071e-07, 5.504584237314702e-07, 5.845565169693145e-07, 6.186546102071588e-07, 6.52752760288422e-07, 6.868508535262663e-07, 7.209489467641106e-07, 7.550470400019549e-07, 7.891451332397992e-07, 8.232432833210623e-07, 8.573413765589066e-07, 8.914394697967509e-07, 9.255376198780141e-07, 9.596357131158584e-07, 9.937338063537027e-07, 1.027831899591547e-06, 1.0619299928293913e-06, 1.0960280860672356e-06, 1.1301262929919176e-06, 1.1642243862297619e-06, 1.1983224794676062e-06, 1.2324205727054505e-06, 1.2665186659432948e-06, 1.300616759181139e-06, 1.3347148524189834e-06, 1.3688129456568277e-06, 1.402911038894672e-06, 1.437009245819354e-06, 1.4711073390571983e-06, 1.5052054322950426e-06, 1.5393035255328869e-06]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 0.0, 26.0, 0.0, 0.0, 0.0, 80.0, 0.0, 0.0, 0.0, 0.0, 198.0, 0.0, 0.0, 0.0, 0.0, 355.0, 0.0, 0.0, 0.0, 207.0, 0.0, 0.0, 0.0, 0.0, 78.0, 0.0, 0.0, 0.0, 31.0, 0.0, 0.0, 0.0, 0.0, 17.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.172325134277344e-07, -4.041939973831177e-07, -3.91155481338501e-07, -3.781169652938843e-07, -3.650784492492676e-07, -3.520399332046509e-07, -3.390014171600342e-07, -3.259629011154175e-07, -3.129243850708008e-07, -2.998858690261841e-07, -2.868473529815674e-07, -2.738088369369507e-07, -2.60770320892334e-07, -2.477318048477173e-07, -2.3469328880310059e-07, -2.2165477275848389e-07, -2.086162567138672e-07, -1.955777406692505e-07, -1.825392246246338e-07, -1.695007085800171e-07, -1.564621925354004e-07, -1.434236764907837e-07, -1.30385160446167e-07, -1.1734664440155029e-07, -1.043081283569336e-07, -9.12696123123169e-08, -7.82310962677002e-08, -6.51925802230835e-08, -5.21540641784668e-08, -3.91155481338501e-08, -2.60770320892334e-08, -1.30385160446167e-08, 0.0, 1.30385160446167e-08, 2.60770320892334e-08, 3.91155481338501e-08, 5.21540641784668e-08, 6.51925802230835e-08, 7.82310962677002e-08, 9.12696123123169e-08, 1.043081283569336e-07, 1.1734664440155029e-07, 1.30385160446167e-07, 1.434236764907837e-07, 1.564621925354004e-07, 1.695007085800171e-07, 1.825392246246338e-07, 1.955777406692505e-07, 2.086162567138672e-07, 2.2165477275848389e-07, 2.3469328880310059e-07, 2.477318048477173e-07, 2.60770320892334e-07, 2.738088369369507e-07, 2.868473529815674e-07, 2.998858690261841e-07, 3.129243850708008e-07, 3.259629011154175e-07, 3.390014171600342e-07, 3.520399332046509e-07, 3.650784492492676e-07, 3.781169652938843e-07, 3.91155481338501e-07, 4.041939973831177e-07, 4.172325134277344e-07]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 8.0, 8.0, 10.0, 9.0, 16.0, 17.0, 21.0, 20.0, 22.0, 32.0, 20.0, 26.0, 35.0, 41.0, 53.0, 40.0, 48.0, 51.0, 40.0, 56.0, 39.0, 41.0, 38.0, 46.0, 34.0, 33.0, 37.0, 30.0, 22.0, 28.0, 12.0, 16.0, 12.0, 7.0, 6.0, 5.0, 3.0, 5.0, 5.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.880859375, -2.7918701171875, -2.702880859375, -2.6138916015625, -2.52490234375, -2.4359130859375, -2.346923828125, -2.2579345703125, -2.1689453125, -2.0799560546875, -1.990966796875, -1.9019775390625, -1.81298828125, -1.7239990234375, -1.635009765625, -1.5460205078125, -1.45703125, -1.3680419921875, -1.279052734375, -1.1900634765625, -1.10107421875, -1.0120849609375, -0.923095703125, -0.8341064453125, -0.7451171875, -0.6561279296875, -0.567138671875, -0.4781494140625, -0.38916015625, -0.3001708984375, -0.211181640625, -0.1221923828125, -0.033203125, 0.0557861328125, 0.144775390625, 0.2337646484375, 0.32275390625, 0.4117431640625, 0.500732421875, 0.5897216796875, 0.6787109375, 0.7677001953125, 0.856689453125, 0.9456787109375, 1.03466796875, 1.1236572265625, 1.212646484375, 1.3016357421875, 1.390625, 1.4796142578125, 1.568603515625, 1.6575927734375, 1.74658203125, 1.8355712890625, 1.924560546875, 2.0135498046875, 2.1025390625, 2.1915283203125, 2.280517578125, 2.3695068359375, 2.45849609375, 2.5474853515625, 2.636474609375, 2.7254638671875, 2.814453125]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 14.0, 12.0, 19.0, 25.0, 32.0, 48.0, 63.0, 96.0, 149.0, 225.0, 296.0, 476.0, 662.0, 938.0, 1399.0, 2053.0, 2884.0, 4212.0, 6340.0, 9244.0, 14200.0, 22617.0, 38498.0, 78928.0, 324343.0, 352038.0, 81705.0, 39426.0, 23185.0, 14551.0, 9517.0, 6362.0, 4372.0, 3047.0, 2056.0, 1410.0, 925.0, 692.0, 455.0, 341.0, 244.0, 130.0, 113.0, 68.0, 46.0, 33.0, 32.0, 10.0, 7.0, 7.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.54296875, -2.46099853515625, -2.3790283203125, -2.29705810546875, -2.215087890625, -2.13311767578125, -2.0511474609375, -1.96917724609375, -1.88720703125, -1.80523681640625, -1.7232666015625, -1.64129638671875, -1.559326171875, -1.47735595703125, -1.3953857421875, -1.31341552734375, -1.2314453125, -1.14947509765625, -1.0675048828125, -0.98553466796875, -0.903564453125, -0.82159423828125, -0.7396240234375, -0.65765380859375, -0.57568359375, -0.49371337890625, -0.4117431640625, -0.32977294921875, -0.247802734375, -0.16583251953125, -0.0838623046875, -0.00189208984375, 0.080078125, 0.16204833984375, 0.2440185546875, 0.32598876953125, 0.407958984375, 0.48992919921875, 0.5718994140625, 0.65386962890625, 0.73583984375, 0.81781005859375, 0.8997802734375, 0.98175048828125, 1.063720703125, 1.14569091796875, 1.2276611328125, 1.30963134765625, 1.3916015625, 1.47357177734375, 1.5555419921875, 1.63751220703125, 1.719482421875, 1.80145263671875, 1.8834228515625, 1.96539306640625, 2.04736328125, 2.12933349609375, 2.2113037109375, 2.29327392578125, 2.375244140625, 2.45721435546875, 2.5391845703125, 2.62115478515625, 2.703125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 6.0, 10.0, 14.0, 16.0, 20.0, 11.0, 21.0, 28.0, 19.0, 18.0, 28.0, 31.0, 35.0, 29.0, 34.0, 53.0, 57.0, 116.0, 247.0, 1518.0, 169.0, 83.0, 56.0, 49.0, 28.0, 35.0, 43.0, 32.0, 34.0, 28.0, 18.0, 25.0, 18.0, 23.0, 13.0, 13.0, 15.0, 9.0, 12.0, 6.0, 5.0, 3.0, 3.0, 4.0, 0.0, 0.0, 3.0, 5.0, 2.0, 2.0], "bins": [-8.0546875, -7.81268310546875, -7.5706787109375, -7.32867431640625, -7.086669921875, -6.84466552734375, -6.6026611328125, -6.36065673828125, -6.11865234375, -5.87664794921875, -5.6346435546875, -5.39263916015625, -5.150634765625, -4.90863037109375, -4.6666259765625, -4.42462158203125, -4.1826171875, -3.94061279296875, -3.6986083984375, -3.45660400390625, -3.214599609375, -2.97259521484375, -2.7305908203125, -2.48858642578125, -2.24658203125, -2.00457763671875, -1.7625732421875, -1.52056884765625, -1.278564453125, -1.03656005859375, -0.7945556640625, -0.55255126953125, -0.310546875, -0.06854248046875, 0.1734619140625, 0.41546630859375, 0.657470703125, 0.89947509765625, 1.1414794921875, 1.38348388671875, 1.62548828125, 1.86749267578125, 2.1094970703125, 2.35150146484375, 2.593505859375, 2.83551025390625, 3.0775146484375, 3.31951904296875, 3.5615234375, 3.80352783203125, 4.0455322265625, 4.28753662109375, 4.529541015625, 4.77154541015625, 5.0135498046875, 5.25555419921875, 5.49755859375, 5.73956298828125, 5.9815673828125, 6.22357177734375, 6.465576171875, 6.70758056640625, 6.9495849609375, 7.19158935546875, 7.43359375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 1.0, 2.0, 7.0, 5.0, 10.0, 10.0, 10.0, 9.0, 12.0, 22.0, 26.0, 35.0, 41.0, 57.0, 71.0, 84.0, 111.0, 161.0, 243.0, 502.0, 1729.0, 9469.0, 98556.0, 2871154.0, 147948.0, 11967.0, 2018.0, 541.0, 282.0, 152.0, 125.0, 83.0, 49.0, 42.0, 39.0, 38.0, 23.0, 20.0, 13.0, 13.0, 13.0, 1.0, 1.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0], "bins": [-15.28125, -14.839111328125, -14.39697265625, -13.954833984375, -13.5126953125, -13.070556640625, -12.62841796875, -12.186279296875, -11.744140625, -11.302001953125, -10.85986328125, -10.417724609375, -9.9755859375, -9.533447265625, -9.09130859375, -8.649169921875, -8.20703125, -7.764892578125, -7.32275390625, -6.880615234375, -6.4384765625, -5.996337890625, -5.55419921875, -5.112060546875, -4.669921875, -4.227783203125, -3.78564453125, -3.343505859375, -2.9013671875, -2.459228515625, -2.01708984375, -1.574951171875, -1.1328125, -0.690673828125, -0.24853515625, 0.193603515625, 0.6357421875, 1.077880859375, 1.52001953125, 1.962158203125, 2.404296875, 2.846435546875, 3.28857421875, 3.730712890625, 4.1728515625, 4.614990234375, 5.05712890625, 5.499267578125, 5.94140625, 6.383544921875, 6.82568359375, 7.267822265625, 7.7099609375, 8.152099609375, 8.59423828125, 9.036376953125, 9.478515625, 9.920654296875, 10.36279296875, 10.804931640625, 11.2470703125, 11.689208984375, 12.13134765625, 12.573486328125, 13.015625]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 51.0, 428.0, 441.0, 88.0, 7.0], "bins": [-173.51063537597656, -170.66748046875, -167.82432556152344, -164.98117065429688, -162.13803100585938, -159.2948760986328, -156.45172119140625, -153.6085662841797, -150.76541137695312, -147.92225646972656, -145.0791015625, -142.23594665527344, -139.39279174804688, -136.54965209960938, -133.7064971923828, -130.86334228515625, -128.0201873779297, -125.17703247070312, -122.33387756347656, -119.49073028564453, -116.64757537841797, -113.8044204711914, -110.96127319335938, -108.11811828613281, -105.27496337890625, -102.43180847167969, -99.58865356445312, -96.7455062866211, -93.90235137939453, -91.05919647216797, -88.21604919433594, -85.37289428710938, -82.52973937988281, -79.68658447265625, -76.84342956542969, -74.00028228759766, -71.1571273803711, -68.31397247314453, -65.4708251953125, -62.62767028808594, -59.784515380859375, -56.94136047363281, -54.098209381103516, -51.25505828857422, -48.411903381347656, -45.568748474121094, -42.7255973815918, -39.8824462890625, -37.03929138183594, -34.196136474609375, -31.352985382080078, -28.50983238220215, -25.66667938232422, -22.82352638244629, -19.98037338256836, -17.13722038269043, -14.2940673828125, -11.45091438293457, -8.60776138305664, -5.764608383178711, -2.9214553833007812, -0.07830238342285156, 2.764850616455078, 5.608003616333008, 8.451156616210938]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 5.0, 2.0, 3.0, 5.0, 2.0, 9.0, 10.0, 7.0, 7.0, 15.0, 10.0, 22.0, 17.0, 22.0, 26.0, 22.0, 32.0, 28.0, 48.0, 32.0, 42.0, 42.0, 45.0, 44.0, 45.0, 47.0, 34.0, 46.0, 27.0, 30.0, 43.0, 22.0, 24.0, 19.0, 33.0, 15.0, 22.0, 9.0, 14.0, 10.0, 9.0, 16.0, 12.0, 14.0, 2.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 5.0, 0.0, 0.0, 1.0, 2.0], "bins": [-24.727693557739258, -23.95778465270996, -23.187877655029297, -22.41796875, -21.648059844970703, -20.878150939941406, -20.108243942260742, -19.338335037231445, -18.56842613220215, -17.79851722717285, -17.028610229492188, -16.25870132446289, -15.488792419433594, -14.718884468078613, -13.948976516723633, -13.179067611694336, -12.409159660339355, -11.639251708984375, -10.869342803955078, -10.099434852600098, -9.3295259475708, -8.55961799621582, -7.789709568023682, -7.019801139831543, -6.249892711639404, -5.479984283447266, -4.710075855255127, -3.9401676654815674, -3.1702592372894287, -2.40035080909729, -1.6304426193237305, -0.8605341911315918, -0.09062576293945312, 0.6792826056480408, 1.4491909742355347, 2.219099283218384, 2.9890077114105225, 3.758916139602661, 4.528824329376221, 5.298732757568359, 6.068641185760498, 6.838549613952637, 7.608458042144775, 8.378366470336914, 9.148274421691895, 9.918183326721191, 10.688091278076172, 11.458000183105469, 12.22790813446045, 12.99781608581543, 13.767724990844727, 14.537632942199707, 15.307541847229004, 16.077449798583984, 16.84735870361328, 17.617267608642578, 18.387174606323242, 19.15708351135254, 19.926990509033203, 20.6968994140625, 21.466808319091797, 22.236717224121094, 23.006624221801758, 23.776533126831055, 24.54644203186035]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 4.0, 10.0, 14.0, 13.0, 21.0, 16.0, 29.0, 21.0, 22.0, 30.0, 32.0, 36.0, 39.0, 48.0, 43.0, 47.0, 53.0, 57.0, 54.0, 26.0, 44.0, 51.0, 42.0, 37.0, 25.0, 39.0, 26.0, 23.0, 23.0, 14.0, 10.0, 8.0, 8.0, 2.0, 4.0, 8.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.98828125, -2.894805908203125, -2.80133056640625, -2.707855224609375, -2.6143798828125, -2.520904541015625, -2.42742919921875, -2.333953857421875, -2.240478515625, -2.147003173828125, -2.05352783203125, -1.960052490234375, -1.8665771484375, -1.773101806640625, -1.67962646484375, -1.586151123046875, -1.49267578125, -1.399200439453125, -1.30572509765625, -1.212249755859375, -1.1187744140625, -1.025299072265625, -0.93182373046875, -0.838348388671875, -0.744873046875, -0.651397705078125, -0.55792236328125, -0.464447021484375, -0.3709716796875, -0.277496337890625, -0.18402099609375, -0.090545654296875, 0.0029296875, 0.096405029296875, 0.18988037109375, 0.283355712890625, 0.3768310546875, 0.470306396484375, 0.56378173828125, 0.657257080078125, 0.750732421875, 0.844207763671875, 0.93768310546875, 1.031158447265625, 1.1246337890625, 1.218109130859375, 1.31158447265625, 1.405059814453125, 1.49853515625, 1.592010498046875, 1.68548583984375, 1.778961181640625, 1.8724365234375, 1.965911865234375, 2.05938720703125, 2.152862548828125, 2.246337890625, 2.339813232421875, 2.43328857421875, 2.526763916015625, 2.6202392578125, 2.713714599609375, 2.80718994140625, 2.900665283203125, 2.994140625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 4.0, 11.0, 11.0, 22.0, 15.0, 30.0, 38.0, 46.0, 64.0, 117.0, 133.0, 189.0, 289.0, 429.0, 771.0, 1361.0, 2410.0, 4966.0, 10401.0, 24482.0, 64533.0, 206539.0, 828174.0, 1966499.0, 779391.0, 196430.0, 62711.0, 23819.0, 9902.0, 4660.0, 2432.0, 1295.0, 680.0, 473.0, 295.0, 186.0, 127.0, 104.0, 62.0, 43.0, 31.0, 25.0, 17.0, 14.0, 11.0, 15.0, 9.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0], "bins": [-5.296875, -5.14324951171875, -4.9896240234375, -4.83599853515625, -4.682373046875, -4.52874755859375, -4.3751220703125, -4.22149658203125, -4.06787109375, -3.91424560546875, -3.7606201171875, -3.60699462890625, -3.453369140625, -3.29974365234375, -3.1461181640625, -2.99249267578125, -2.8388671875, -2.68524169921875, -2.5316162109375, -2.37799072265625, -2.224365234375, -2.07073974609375, -1.9171142578125, -1.76348876953125, -1.60986328125, -1.45623779296875, -1.3026123046875, -1.14898681640625, -0.995361328125, -0.84173583984375, -0.6881103515625, -0.53448486328125, -0.380859375, -0.22723388671875, -0.0736083984375, 0.08001708984375, 0.233642578125, 0.38726806640625, 0.5408935546875, 0.69451904296875, 0.84814453125, 1.00177001953125, 1.1553955078125, 1.30902099609375, 1.462646484375, 1.61627197265625, 1.7698974609375, 1.92352294921875, 2.0771484375, 2.23077392578125, 2.3843994140625, 2.53802490234375, 2.691650390625, 2.84527587890625, 2.9989013671875, 3.15252685546875, 3.30615234375, 3.45977783203125, 3.6134033203125, 3.76702880859375, 3.920654296875, 4.07427978515625, 4.2279052734375, 4.38153076171875, 4.53515625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 8.0, 4.0, 6.0, 9.0, 12.0, 20.0, 31.0, 56.0, 82.0, 127.0, 182.0, 269.0, 440.0, 573.0, 656.0, 519.0, 358.0, 245.0, 181.0, 101.0, 63.0, 49.0, 29.0, 31.0, 5.0, 7.0, 9.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.1484375, -10.871826171875, -10.59521484375, -10.318603515625, -10.0419921875, -9.765380859375, -9.48876953125, -9.212158203125, -8.935546875, -8.658935546875, -8.38232421875, -8.105712890625, -7.8291015625, -7.552490234375, -7.27587890625, -6.999267578125, -6.72265625, -6.446044921875, -6.16943359375, -5.892822265625, -5.6162109375, -5.339599609375, -5.06298828125, -4.786376953125, -4.509765625, -4.233154296875, -3.95654296875, -3.679931640625, -3.4033203125, -3.126708984375, -2.85009765625, -2.573486328125, -2.296875, -2.020263671875, -1.74365234375, -1.467041015625, -1.1904296875, -0.913818359375, -0.63720703125, -0.360595703125, -0.083984375, 0.192626953125, 0.46923828125, 0.745849609375, 1.0224609375, 1.299072265625, 1.57568359375, 1.852294921875, 2.12890625, 2.405517578125, 2.68212890625, 2.958740234375, 3.2353515625, 3.511962890625, 3.78857421875, 4.065185546875, 4.341796875, 4.618408203125, 4.89501953125, 5.171630859375, 5.4482421875, 5.724853515625, 6.00146484375, 6.278076171875, 6.5546875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 9.0, 20.0, 19.0, 32.0, 72.0, 111.0, 173.0, 305.0, 763.0, 2226.0, 13651.0, 176868.0, 3071076.0, 877040.0, 44686.0, 4999.0, 1190.0, 481.0, 247.0, 123.0, 65.0, 38.0, 28.0, 17.0, 13.0, 14.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.140625, -13.5693359375, -12.998046875, -12.4267578125, -11.85546875, -11.2841796875, -10.712890625, -10.1416015625, -9.5703125, -8.9990234375, -8.427734375, -7.8564453125, -7.28515625, -6.7138671875, -6.142578125, -5.5712890625, -5.0, -4.4287109375, -3.857421875, -3.2861328125, -2.71484375, -2.1435546875, -1.572265625, -1.0009765625, -0.4296875, 0.1416015625, 0.712890625, 1.2841796875, 1.85546875, 2.4267578125, 2.998046875, 3.5693359375, 4.140625, 4.7119140625, 5.283203125, 5.8544921875, 6.42578125, 6.9970703125, 7.568359375, 8.1396484375, 8.7109375, 9.2822265625, 9.853515625, 10.4248046875, 10.99609375, 11.5673828125, 12.138671875, 12.7099609375, 13.28125, 13.8525390625, 14.423828125, 14.9951171875, 15.56640625, 16.1376953125, 16.708984375, 17.2802734375, 17.8515625, 18.4228515625, 18.994140625, 19.5654296875, 20.13671875, 20.7080078125, 21.279296875, 21.8505859375, 22.421875]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 11.0, 22.0, 38.0, 58.0, 84.0, 89.0, 130.0, 116.0, 125.0, 99.0, 72.0, 66.0, 39.0, 24.0, 18.0, 8.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.1524658203125, -49.63003921508789, -48.107608795166016, -46.585182189941406, -45.0627555847168, -43.54032897949219, -42.01789855957031, -40.4954719543457, -38.973045349121094, -37.450618743896484, -35.92818832397461, -34.40576171875, -32.88333511352539, -31.36090660095215, -29.838478088378906, -28.316051483154297, -26.793621063232422, -25.27119255065918, -23.74876594543457, -22.226337432861328, -20.70391082763672, -19.181482315063477, -17.659053802490234, -16.136627197265625, -14.614198684692383, -13.091771125793457, -11.569343566894531, -10.046915054321289, -8.524487495422363, -7.0020599365234375, -5.479631423950195, -3.9572038650512695, -2.4347763061523438, -0.9123485088348389, 0.610079288482666, 2.13250732421875, 3.654934883117676, 5.177362442016602, 6.699790954589844, 8.22221851348877, 9.744646072387695, 11.267073631286621, 12.789501190185547, 14.311929702758789, 15.834357261657715, 17.35678482055664, 18.879213333129883, 20.401641845703125, 21.924068450927734, 23.446496963500977, 24.968923568725586, 26.491352081298828, 28.013778686523438, 29.53620719909668, 31.058635711669922, 32.58106231689453, 34.103492736816406, 35.625919342041016, 37.14834976196289, 38.6707763671875, 40.19320297241211, 41.71562957763672, 43.238059997558594, 44.7604866027832, 46.28291320800781]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 6.0, 5.0, 4.0, 8.0, 4.0, 8.0, 9.0, 18.0, 12.0, 13.0, 27.0, 13.0, 21.0, 24.0, 26.0, 31.0, 38.0, 43.0, 42.0, 35.0, 42.0, 36.0, 38.0, 45.0, 38.0, 42.0, 44.0, 39.0, 37.0, 31.0, 32.0, 25.0, 28.0, 23.0, 22.0, 12.0, 14.0, 14.0, 12.0, 12.0, 4.0, 5.0, 6.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-21.444656372070312, -20.770015716552734, -20.095375061035156, -19.420732498168945, -18.746091842651367, -18.07145118713379, -17.396808624267578, -16.72216796875, -16.047527313232422, -15.372886657714844, -14.69824504852295, -14.023603439331055, -13.348962783813477, -12.674322128295898, -11.999680519104004, -11.32503890991211, -10.650398254394531, -9.975757598876953, -9.301115989685059, -8.626474380493164, -7.951833724975586, -7.27719259262085, -6.602551460266113, -5.927910327911377, -5.253269195556641, -4.578628063201904, -3.903986930847168, -3.2293457984924316, -2.5547046661376953, -1.880063533782959, -1.2054224014282227, -0.5307812690734863, 0.14385986328125, 0.8185009956359863, 1.4931421279907227, 2.167783260345459, 2.8424243927001953, 3.5170655250549316, 4.191706657409668, 4.866347789764404, 5.540988922119141, 6.215630054473877, 6.890271186828613, 7.56491231918335, 8.239553451538086, 8.914194107055664, 9.588835716247559, 10.263477325439453, 10.938117980957031, 11.61275863647461, 12.287400245666504, 12.962041854858398, 13.636682510375977, 14.311323165893555, 14.98596477508545, 15.660606384277344, 16.335247039794922, 17.0098876953125, 17.684528350830078, 18.35917091369629, 19.033811569213867, 19.708452224731445, 20.383094787597656, 21.057735443115234, 21.732376098632812]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 7.0, 4.0, 9.0, 7.0, 9.0, 21.0, 13.0, 20.0, 14.0, 20.0, 28.0, 25.0, 35.0, 39.0, 36.0, 40.0, 36.0, 44.0, 59.0, 41.0, 52.0, 43.0, 40.0, 45.0, 42.0, 42.0, 34.0, 36.0, 24.0, 26.0, 20.0, 21.0, 16.0, 11.0, 11.0, 6.0, 4.0, 6.0, 7.0, 7.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.736328125, -2.64422607421875, -2.5521240234375, -2.46002197265625, -2.367919921875, -2.27581787109375, -2.1837158203125, -2.09161376953125, -1.99951171875, -1.90740966796875, -1.8153076171875, -1.72320556640625, -1.631103515625, -1.53900146484375, -1.4468994140625, -1.35479736328125, -1.2626953125, -1.17059326171875, -1.0784912109375, -0.98638916015625, -0.894287109375, -0.80218505859375, -0.7100830078125, -0.61798095703125, -0.52587890625, -0.43377685546875, -0.3416748046875, -0.24957275390625, -0.157470703125, -0.06536865234375, 0.0267333984375, 0.11883544921875, 0.2109375, 0.30303955078125, 0.3951416015625, 0.48724365234375, 0.579345703125, 0.67144775390625, 0.7635498046875, 0.85565185546875, 0.94775390625, 1.03985595703125, 1.1319580078125, 1.22406005859375, 1.316162109375, 1.40826416015625, 1.5003662109375, 1.59246826171875, 1.6845703125, 1.77667236328125, 1.8687744140625, 1.96087646484375, 2.052978515625, 2.14508056640625, 2.2371826171875, 2.32928466796875, 2.42138671875, 2.51348876953125, 2.6055908203125, 2.69769287109375, 2.789794921875, 2.88189697265625, 2.9739990234375, 3.06610107421875, 3.158203125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 2.0, 7.0, 5.0, 13.0, 17.0, 19.0, 32.0, 57.0, 75.0, 87.0, 151.0, 210.0, 347.0, 539.0, 879.0, 1411.0, 2207.0, 3724.0, 6135.0, 10572.0, 18215.0, 32543.0, 62250.0, 128957.0, 304194.0, 248561.0, 106992.0, 52668.0, 28192.0, 15892.0, 9260.0, 5563.0, 3380.0, 2018.0, 1242.0, 755.0, 492.0, 284.0, 192.0, 120.0, 95.0, 71.0, 35.0, 36.0, 29.0, 11.0, 4.0, 9.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.025665283203125, -0.024834156036376953, -0.024003028869628906, -0.02317190170288086, -0.022340774536132812, -0.021509647369384766, -0.02067852020263672, -0.019847393035888672, -0.019016265869140625, -0.018185138702392578, -0.01735401153564453, -0.016522884368896484, -0.015691757202148438, -0.01486063003540039, -0.014029502868652344, -0.013198375701904297, -0.01236724853515625, -0.011536121368408203, -0.010704994201660156, -0.00987386703491211, -0.009042739868164062, -0.008211612701416016, -0.007380485534667969, -0.006549358367919922, -0.005718231201171875, -0.004887104034423828, -0.004055976867675781, -0.0032248497009277344, -0.0023937225341796875, -0.0015625953674316406, -0.0007314682006835938, 9.965896606445312e-05, 0.0009307861328125, 0.0017619132995605469, 0.0025930404663085938, 0.0034241676330566406, 0.0042552947998046875, 0.005086421966552734, 0.005917549133300781, 0.006748676300048828, 0.007579803466796875, 0.008410930633544922, 0.009242057800292969, 0.010073184967041016, 0.010904312133789062, 0.01173543930053711, 0.012566566467285156, 0.013397693634033203, 0.01422882080078125, 0.015059947967529297, 0.015891075134277344, 0.01672220230102539, 0.017553329467773438, 0.018384456634521484, 0.01921558380126953, 0.020046710968017578, 0.020877838134765625, 0.021708965301513672, 0.02254009246826172, 0.023371219635009766, 0.024202346801757812, 0.02503347396850586, 0.025864601135253906, 0.026695728302001953, 0.02752685546875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 4.0, 10.0, 13.0, 16.0, 16.0, 15.0, 20.0, 19.0, 23.0, 33.0, 21.0, 25.0, 33.0, 37.0, 30.0, 27.0, 40.0, 37.0, 28.0, 1073.0, 36.0, 28.0, 36.0, 39.0, 37.0, 36.0, 40.0, 21.0, 23.0, 27.0, 22.0, 20.0, 25.0, 18.0, 12.0, 17.0, 10.0, 9.0, 10.0, 6.0, 5.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-1.931640625, -1.8748016357421875, -1.817962646484375, -1.7611236572265625, -1.70428466796875, -1.6474456787109375, -1.590606689453125, -1.5337677001953125, -1.4769287109375, -1.4200897216796875, -1.363250732421875, -1.3064117431640625, -1.24957275390625, -1.1927337646484375, -1.135894775390625, -1.0790557861328125, -1.022216796875, -0.9653778076171875, -0.908538818359375, -0.8516998291015625, -0.79486083984375, -0.7380218505859375, -0.681182861328125, -0.6243438720703125, -0.5675048828125, -0.5106658935546875, -0.453826904296875, -0.3969879150390625, -0.34014892578125, -0.2833099365234375, -0.226470947265625, -0.1696319580078125, -0.11279296875, -0.0559539794921875, 0.000885009765625, 0.0577239990234375, 0.11456298828125, 0.1714019775390625, 0.228240966796875, 0.2850799560546875, 0.3419189453125, 0.3987579345703125, 0.455596923828125, 0.5124359130859375, 0.56927490234375, 0.6261138916015625, 0.682952880859375, 0.7397918701171875, 0.796630859375, 0.8534698486328125, 0.910308837890625, 0.9671478271484375, 1.02398681640625, 1.0808258056640625, 1.137664794921875, 1.1945037841796875, 1.2513427734375, 1.3081817626953125, 1.365020751953125, 1.4218597412109375, 1.47869873046875, 1.5355377197265625, 1.592376708984375, 1.6492156982421875, 1.7060546875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 4.0, 7.0, 10.0, 8.0, 19.0, 26.0, 41.0, 69.0, 76.0, 120.0, 181.0, 250.0, 344.0, 489.0, 741.0, 1062.0, 1510.0, 2206.0, 3279.0, 4785.0, 7088.0, 10668.0, 15536.0, 23248.0, 35246.0, 53335.0, 81398.0, 125341.0, 1228896.0, 169504.0, 113221.0, 73586.0, 47609.0, 31746.0, 21446.0, 14224.0, 9552.0, 6363.0, 4428.0, 2947.0, 1997.0, 1455.0, 966.0, 657.0, 426.0, 295.0, 200.0, 164.0, 131.0, 67.0, 57.0, 35.0, 26.0, 26.0, 11.0, 11.0, 5.0, 3.0, 1.0, 1.0], "bins": [-0.00658416748046875, -0.0063838958740234375, -0.006183624267578125, -0.0059833526611328125, -0.0057830810546875, -0.0055828094482421875, -0.005382537841796875, -0.0051822662353515625, -0.00498199462890625, -0.0047817230224609375, -0.004581451416015625, -0.0043811798095703125, -0.004180908203125, -0.0039806365966796875, -0.003780364990234375, -0.0035800933837890625, -0.00337982177734375, -0.0031795501708984375, -0.002979278564453125, -0.0027790069580078125, -0.0025787353515625, -0.0023784637451171875, -0.002178192138671875, -0.0019779205322265625, -0.00177764892578125, -0.0015773773193359375, -0.001377105712890625, -0.0011768341064453125, -0.0009765625, -0.0007762908935546875, -0.000576019287109375, -0.0003757476806640625, -0.00017547607421875, 2.47955322265625e-05, 0.000225067138671875, 0.0004253387451171875, 0.0006256103515625, 0.0008258819580078125, 0.001026153564453125, 0.0012264251708984375, 0.00142669677734375, 0.0016269683837890625, 0.001827239990234375, 0.0020275115966796875, 0.002227783203125, 0.0024280548095703125, 0.002628326416015625, 0.0028285980224609375, 0.00302886962890625, 0.0032291412353515625, 0.003429412841796875, 0.0036296844482421875, 0.0038299560546875, 0.0040302276611328125, 0.004230499267578125, 0.0044307708740234375, 0.00463104248046875, 0.0048313140869140625, 0.005031585693359375, 0.0052318572998046875, 0.00543212890625, 0.0056324005126953125, 0.005832672119140625, 0.0060329437255859375, 0.00623321533203125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 5.0, 0.0, 5.0, 0.0, 6.0, 0.0, 10.0, 0.0, 0.0, 15.0, 0.0, 22.0, 0.0, 33.0, 0.0, 68.0, 0.0, 143.0, 0.0, 399.0, 0.0, 140.0, 0.0, 71.0, 0.0, 38.0, 0.0, 23.0, 0.0, 10.0, 0.0, 9.0, 0.0, 8.0, 0.0, 5.0, 0.0, 4.0, 0.0, 3.0], "bins": [-1.2516975402832031e-06, -1.2228265404701233e-06, -1.1939555406570435e-06, -1.1650845408439636e-06, -1.1362135410308838e-06, -1.107342541217804e-06, -1.0784715414047241e-06, -1.0496005415916443e-06, -1.0207295417785645e-06, -9.918585419654846e-07, -9.629875421524048e-07, -9.34116542339325e-07, -9.052455425262451e-07, -8.763745427131653e-07, -8.475035429000854e-07, -8.186325430870056e-07, -7.897615432739258e-07, -7.60890543460846e-07, -7.320195436477661e-07, -7.031485438346863e-07, -6.742775440216064e-07, -6.454065442085266e-07, -6.165355443954468e-07, -5.876645445823669e-07, -5.587935447692871e-07, -5.299225449562073e-07, -5.010515451431274e-07, -4.721805453300476e-07, -4.4330954551696777e-07, -4.1443854570388794e-07, -3.855675458908081e-07, -3.5669654607772827e-07, -3.2782554626464844e-07, -2.989545464515686e-07, -2.7008354663848877e-07, -2.4121254682540894e-07, -2.123415470123291e-07, -1.8347054719924927e-07, -1.5459954738616943e-07, -1.257285475730896e-07, -9.685754776000977e-08, -6.798654794692993e-08, -3.91155481338501e-08, -1.0244548320770264e-08, 1.862645149230957e-08, 4.7497451305389404e-08, 7.636845111846924e-08, 1.0523945093154907e-07, 1.341104507446289e-07, 1.6298145055770874e-07, 1.9185245037078857e-07, 2.207234501838684e-07, 2.4959444999694824e-07, 2.784654498100281e-07, 3.073364496231079e-07, 3.3620744943618774e-07, 3.650784492492676e-07, 3.939494490623474e-07, 4.2282044887542725e-07, 4.516914486885071e-07, 4.805624485015869e-07, 5.094334483146667e-07, 5.383044481277466e-07, 5.671754479408264e-07, 5.960464477539062e-07]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 6.0, 5.0, 13.0, 18.0, 10.0, 43.0, 68.0, 86.0, 154.0, 350.0, 2532.0, 273010.0, 767677.0, 3749.0, 395.0, 163.0, 88.0, 63.0, 44.0, 13.0, 16.0, 10.0, 10.0, 5.0, 3.0, 6.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.138448715209961e-05, -1.0868534445762634e-05, -1.035258173942566e-05, -9.836629033088684e-06, -9.320676326751709e-06, -8.804723620414734e-06, -8.288770914077759e-06, -7.772818207740784e-06, -7.256865501403809e-06, -6.7409127950668335e-06, -6.224960088729858e-06, -5.709007382392883e-06, -5.193054676055908e-06, -4.677101969718933e-06, -4.161149263381958e-06, -3.645196557044983e-06, -3.129243850708008e-06, -2.6132911443710327e-06, -2.0973384380340576e-06, -1.5813857316970825e-06, -1.0654330253601074e-06, -5.494803190231323e-07, -3.3527612686157227e-08, 4.824250936508179e-07, 9.98377799987793e-07, 1.514330506324768e-06, 2.030283212661743e-06, 2.5462359189987183e-06, 3.0621886253356934e-06, 3.5781413316726685e-06, 4.0940940380096436e-06, 4.610046744346619e-06, 5.125999450683594e-06, 5.641952157020569e-06, 6.157904863357544e-06, 6.673857569694519e-06, 7.189810276031494e-06, 7.70576298236847e-06, 8.221715688705444e-06, 8.73766839504242e-06, 9.253621101379395e-06, 9.76957380771637e-06, 1.0285526514053345e-05, 1.080147922039032e-05, 1.1317431926727295e-05, 1.183338463306427e-05, 1.2349337339401245e-05, 1.286529004573822e-05, 1.3381242752075195e-05, 1.389719545841217e-05, 1.4413148164749146e-05, 1.492910087108612e-05, 1.5445053577423096e-05, 1.596100628376007e-05, 1.6476958990097046e-05, 1.699291169643402e-05, 1.7508864402770996e-05, 1.802481710910797e-05, 1.8540769815444946e-05, 1.905672252178192e-05, 1.9572675228118896e-05, 2.008862793445587e-05, 2.0604580640792847e-05, 2.1120533347129822e-05, 2.1636486053466797e-05]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 15.0, 111.0, 555.0, 278.0, 51.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.494871402333956e-06, -5.396424512582598e-06, -5.297977168083889e-06, -5.1995302783325315e-06, -5.1010833885811735e-06, -5.002636044082465e-06, -4.904189154331107e-06, -4.805742264579749e-06, -4.70729492008104e-06, -4.608848030329682e-06, -4.510400685830973e-06, -4.411953796079615e-06, -4.313506906328257e-06, -4.215059561829548e-06, -4.11661267207819e-06, -4.018165782326832e-06, -3.9197188925754745e-06, -3.8212720028241165e-06, -3.722824885699083e-06, -3.6243777685740497e-06, -3.5259306514490163e-06, -3.4274837616976583e-06, -3.329036644572625e-06, -3.230589754821267e-06, -3.132142410322558e-06, -3.0336952931975247e-06, -2.9352484034461668e-06, -2.8368012863211334e-06, -2.7383541691961e-06, -2.639907279444742e-06, -2.5414601623197086e-06, -2.4430132725683507e-06, -2.3445663828169927e-06, -2.2461192656919593e-06, -2.1476723759406013e-06, -2.049225258815568e-06, -1.9507781416905345e-06, -1.8523312519391766e-06, -1.7538841348141432e-06, -1.6554371313759475e-06, -1.5569899005640764e-06, -1.4585428971258807e-06, -1.3600957800008473e-06, -1.2616487765626516e-06, -1.163201773124456e-06, -1.0647547696862603e-06, -9.663076525612269e-07, -8.678606491230312e-07, -7.694136456848355e-07, -6.70966585403221e-07, -5.725195819650253e-07, -4.7407252168341074e-07, -3.7562548982350563e-07, -2.771784579636005e-07, -1.7873139768198598e-07, -8.02843942437903e-08, 1.8162666037824238e-08, 1.166097050031567e-07, 2.1505674396848917e-07, 3.13503790039249e-07, 4.119508218991541e-07, 5.103978537590592e-07, 6.088449140406738e-07, 7.072919174788694e-07, 8.05738977760484e-07]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 11.0, 0.0, 0.0, 0.0, 0.0, 32.0, 0.0, 0.0, 0.0, 0.0, 93.0, 0.0, 0.0, 0.0, 0.0, 217.0, 0.0, 0.0, 0.0, 0.0, 323.0, 0.0, 0.0, 0.0, 0.0, 200.0, 0.0, 0.0, 0.0, 0.0, 84.0, 0.0, 0.0, 0.0, 0.0, 36.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.5762786865234375e-07, -3.4552067518234253e-07, -3.334134817123413e-07, -3.213062882423401e-07, -3.0919909477233887e-07, -2.9709190130233765e-07, -2.849847078323364e-07, -2.728775143623352e-07, -2.60770320892334e-07, -2.4866312742233276e-07, -2.3655593395233154e-07, -2.2444874048233032e-07, -2.123415470123291e-07, -2.0023435354232788e-07, -1.8812716007232666e-07, -1.7601996660232544e-07, -1.6391277313232422e-07, -1.51805579662323e-07, -1.3969838619232178e-07, -1.2759119272232056e-07, -1.1548399925231934e-07, -1.0337680578231812e-07, -9.12696123123169e-08, -7.916241884231567e-08, -6.705522537231445e-08, -5.494803190231323e-08, -4.284083843231201e-08, -3.073364496231079e-08, -1.862645149230957e-08, -6.51925802230835e-09, 5.587935447692871e-09, 1.7695128917694092e-08, 2.9802322387695312e-08, 4.190951585769653e-08, 5.4016709327697754e-08, 6.612390279769897e-08, 7.82310962677002e-08, 9.033828973770142e-08, 1.0244548320770264e-07, 1.1455267667770386e-07, 1.2665987014770508e-07, 1.387670636177063e-07, 1.5087425708770752e-07, 1.6298145055770874e-07, 1.7508864402770996e-07, 1.8719583749771118e-07, 1.993030309677124e-07, 2.1141022443771362e-07, 2.2351741790771484e-07, 2.3562461137771606e-07, 2.477318048477173e-07, 2.598389983177185e-07, 2.7194619178771973e-07, 2.8405338525772095e-07, 2.9616057872772217e-07, 3.082677721977234e-07, 3.203749656677246e-07, 3.3248215913772583e-07, 3.4458935260772705e-07, 3.5669654607772827e-07, 3.688037395477295e-07, 3.809109330177307e-07, 3.9301812648773193e-07, 4.0512531995773315e-07, 4.172325134277344e-07]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 7.0, 4.0, 9.0, 7.0, 9.0, 21.0, 13.0, 20.0, 14.0, 20.0, 28.0, 25.0, 35.0, 39.0, 36.0, 40.0, 36.0, 44.0, 59.0, 41.0, 52.0, 43.0, 40.0, 45.0, 42.0, 42.0, 34.0, 36.0, 24.0, 26.0, 20.0, 21.0, 16.0, 11.0, 11.0, 6.0, 4.0, 6.0, 7.0, 7.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.736328125, -2.64422607421875, -2.5521240234375, -2.46002197265625, -2.367919921875, -2.27581787109375, -2.1837158203125, -2.09161376953125, -1.99951171875, -1.90740966796875, -1.8153076171875, -1.72320556640625, -1.631103515625, -1.53900146484375, -1.4468994140625, -1.35479736328125, -1.2626953125, -1.17059326171875, -1.0784912109375, -0.98638916015625, -0.894287109375, -0.80218505859375, -0.7100830078125, -0.61798095703125, -0.52587890625, -0.43377685546875, -0.3416748046875, -0.24957275390625, -0.157470703125, -0.06536865234375, 0.0267333984375, 0.11883544921875, 0.2109375, 0.30303955078125, 0.3951416015625, 0.48724365234375, 0.579345703125, 0.67144775390625, 0.7635498046875, 0.85565185546875, 0.94775390625, 1.03985595703125, 1.1319580078125, 1.22406005859375, 1.316162109375, 1.40826416015625, 1.5003662109375, 1.59246826171875, 1.6845703125, 1.77667236328125, 1.8687744140625, 1.96087646484375, 2.052978515625, 2.14508056640625, 2.2371826171875, 2.32928466796875, 2.42138671875, 2.51348876953125, 2.6055908203125, 2.69769287109375, 2.789794921875, 2.88189697265625, 2.9739990234375, 3.06610107421875, 3.158203125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 6.0, 5.0, 15.0, 24.0, 40.0, 48.0, 82.0, 122.0, 180.0, 230.0, 398.0, 586.0, 881.0, 1287.0, 1851.0, 2783.0, 4172.0, 6280.0, 9782.0, 14900.0, 22460.0, 34396.0, 54104.0, 96864.0, 233302.0, 279519.0, 113787.0, 60257.0, 37792.0, 24432.0, 16390.0, 10640.0, 7022.0, 4669.0, 3137.0, 1995.0, 1373.0, 890.0, 597.0, 400.0, 304.0, 176.0, 119.0, 78.0, 62.0, 42.0, 27.0, 17.0, 10.0, 11.0, 8.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.931640625, -2.84033203125, -2.7490234375, -2.65771484375, -2.56640625, -2.47509765625, -2.3837890625, -2.29248046875, -2.201171875, -2.10986328125, -2.0185546875, -1.92724609375, -1.8359375, -1.74462890625, -1.6533203125, -1.56201171875, -1.470703125, -1.37939453125, -1.2880859375, -1.19677734375, -1.10546875, -1.01416015625, -0.9228515625, -0.83154296875, -0.740234375, -0.64892578125, -0.5576171875, -0.46630859375, -0.375, -0.28369140625, -0.1923828125, -0.10107421875, -0.009765625, 0.08154296875, 0.1728515625, 0.26416015625, 0.35546875, 0.44677734375, 0.5380859375, 0.62939453125, 0.720703125, 0.81201171875, 0.9033203125, 0.99462890625, 1.0859375, 1.17724609375, 1.2685546875, 1.35986328125, 1.451171875, 1.54248046875, 1.6337890625, 1.72509765625, 1.81640625, 1.90771484375, 1.9990234375, 2.09033203125, 2.181640625, 2.27294921875, 2.3642578125, 2.45556640625, 2.546875, 2.63818359375, 2.7294921875, 2.82080078125, 2.912109375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 9.0, 10.0, 12.0, 22.0, 19.0, 22.0, 25.0, 18.0, 32.0, 36.0, 58.0, 37.0, 66.0, 64.0, 81.0, 166.0, 301.0, 1379.0, 171.0, 89.0, 65.0, 59.0, 40.0, 33.0, 26.0, 24.0, 27.0, 21.0, 18.0, 23.0, 17.0, 10.0, 8.0, 12.0, 8.0, 7.0, 2.0, 4.0, 6.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.75, -9.4639892578125, -9.177978515625, -8.8919677734375, -8.60595703125, -8.3199462890625, -8.033935546875, -7.7479248046875, -7.4619140625, -7.1759033203125, -6.889892578125, -6.6038818359375, -6.31787109375, -6.0318603515625, -5.745849609375, -5.4598388671875, -5.173828125, -4.8878173828125, -4.601806640625, -4.3157958984375, -4.02978515625, -3.7437744140625, -3.457763671875, -3.1717529296875, -2.8857421875, -2.5997314453125, -2.313720703125, -2.0277099609375, -1.74169921875, -1.4556884765625, -1.169677734375, -0.8836669921875, -0.59765625, -0.3116455078125, -0.025634765625, 0.2603759765625, 0.54638671875, 0.8323974609375, 1.118408203125, 1.4044189453125, 1.6904296875, 1.9764404296875, 2.262451171875, 2.5484619140625, 2.83447265625, 3.1204833984375, 3.406494140625, 3.6925048828125, 3.978515625, 4.2645263671875, 4.550537109375, 4.8365478515625, 5.12255859375, 5.4085693359375, 5.694580078125, 5.9805908203125, 6.2666015625, 6.5526123046875, 6.838623046875, 7.1246337890625, 7.41064453125, 7.6966552734375, 7.982666015625, 8.2686767578125, 8.5546875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 9.0, 8.0, 17.0, 19.0, 22.0, 31.0, 51.0, 52.0, 79.0, 80.0, 104.0, 174.0, 274.0, 606.0, 1743.0, 9028.0, 96521.0, 2714278.0, 298031.0, 19469.0, 3077.0, 916.0, 364.0, 213.0, 138.0, 99.0, 77.0, 54.0, 46.0, 32.0, 24.0, 12.0, 12.0, 7.0, 9.0, 4.0, 8.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.03125, -16.49365234375, -15.9560546875, -15.41845703125, -14.880859375, -14.34326171875, -13.8056640625, -13.26806640625, -12.73046875, -12.19287109375, -11.6552734375, -11.11767578125, -10.580078125, -10.04248046875, -9.5048828125, -8.96728515625, -8.4296875, -7.89208984375, -7.3544921875, -6.81689453125, -6.279296875, -5.74169921875, -5.2041015625, -4.66650390625, -4.12890625, -3.59130859375, -3.0537109375, -2.51611328125, -1.978515625, -1.44091796875, -0.9033203125, -0.36572265625, 0.171875, 0.70947265625, 1.2470703125, 1.78466796875, 2.322265625, 2.85986328125, 3.3974609375, 3.93505859375, 4.47265625, 5.01025390625, 5.5478515625, 6.08544921875, 6.623046875, 7.16064453125, 7.6982421875, 8.23583984375, 8.7734375, 9.31103515625, 9.8486328125, 10.38623046875, 10.923828125, 11.46142578125, 11.9990234375, 12.53662109375, 13.07421875, 13.61181640625, 14.1494140625, 14.68701171875, 15.224609375, 15.76220703125, 16.2998046875, 16.83740234375, 17.375]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 12.0, 157.0, 570.0, 255.0, 23.0, 1.0], "bins": [-258.2127685546875, -253.9541015625, -249.6954345703125, -245.436767578125, -241.1781005859375, -236.91943359375, -232.6607666015625, -228.40211486816406, -224.14344787597656, -219.88478088378906, -215.62611389160156, -211.36744689941406, -207.10877990722656, -202.85012817382812, -198.59146118164062, -194.33279418945312, -190.07412719726562, -185.81546020507812, -181.55679321289062, -177.29812622070312, -173.03945922851562, -168.78079223632812, -164.52212524414062, -160.2634735107422, -156.00479125976562, -151.74612426757812, -147.48745727539062, -143.22879028320312, -138.97012329101562, -134.71145629882812, -130.45278930664062, -126.19412994384766, -121.93548583984375, -117.67681884765625, -113.41815185546875, -109.15948486328125, -104.90082550048828, -100.64215850830078, -96.38349151611328, -92.12482452392578, -87.86615753173828, -83.60749053955078, -79.34882354736328, -75.09016418457031, -70.83149719238281, -66.57283020019531, -62.31416320800781, -58.05549621582031, -53.796836853027344, -49.538169860839844, -45.27950668334961, -41.02083969116211, -36.762176513671875, -32.503509521484375, -28.244842529296875, -23.986177444458008, -19.727510452270508, -15.46884536743164, -11.210179328918457, -6.951513290405273, -2.6928482055664062, 1.565816879272461, 5.824483871459961, 10.083148956298828, 14.341814041137695]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 6.0, 8.0, 11.0, 8.0, 11.0, 14.0, 14.0, 21.0, 26.0, 24.0, 24.0, 32.0, 30.0, 25.0, 31.0, 46.0, 40.0, 42.0, 37.0, 33.0, 45.0, 31.0, 44.0, 40.0, 48.0, 42.0, 27.0, 31.0, 33.0, 23.0, 23.0, 16.0, 17.0, 16.0, 9.0, 10.0, 5.0, 10.0, 6.0, 15.0, 12.0, 5.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.24087142944336, -23.45634651184082, -22.67181968688965, -21.88729476928711, -21.102767944335938, -20.3182430267334, -19.533716201782227, -18.749191284179688, -17.964664459228516, -17.180139541625977, -16.395612716674805, -15.61108684539795, -14.826560974121094, -14.042035102844238, -13.257509231567383, -12.472984313964844, -11.688458442687988, -10.903932571411133, -10.119406700134277, -9.334880828857422, -8.550354957580566, -7.765829086303711, -6.981303691864014, -6.196777820587158, -5.412251949310303, -4.627726078033447, -3.843200206756592, -3.0586745738983154, -2.27414870262146, -1.4896228313446045, -0.7050971984863281, 0.07942867279052734, 0.8639545440673828, 1.6484804153442383, 2.4330062866210938, 3.21753191947937, 4.002058029174805, 4.78658390045166, 5.571109294891357, 6.355635166168213, 7.140161037445068, 7.924686908721924, 8.709212303161621, 9.493738174438477, 10.278264045715332, 11.062789916992188, 11.847315788269043, 12.631841659545898, 13.416367530822754, 14.20089340209961, 14.985419273376465, 15.76994514465332, 16.55447006225586, 17.33899688720703, 18.12352180480957, 18.908048629760742, 19.69257354736328, 20.47709846496582, 21.261625289916992, 22.04615020751953, 22.830677032470703, 23.615201950073242, 24.399728775024414, 25.184253692626953, 25.968780517578125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 9.0, 9.0, 8.0, 11.0, 10.0, 18.0, 15.0, 22.0, 20.0, 22.0, 23.0, 34.0, 39.0, 38.0, 41.0, 40.0, 41.0, 57.0, 45.0, 58.0, 42.0, 49.0, 39.0, 42.0, 39.0, 34.0, 29.0, 35.0, 23.0, 23.0, 18.0, 15.0, 11.0, 8.0, 9.0, 5.0, 5.0, 6.0, 6.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.896484375, -2.799224853515625, -2.70196533203125, -2.604705810546875, -2.5074462890625, -2.410186767578125, -2.31292724609375, -2.215667724609375, -2.118408203125, -2.021148681640625, -1.92388916015625, -1.826629638671875, -1.7293701171875, -1.632110595703125, -1.53485107421875, -1.437591552734375, -1.34033203125, -1.243072509765625, -1.14581298828125, -1.048553466796875, -0.9512939453125, -0.854034423828125, -0.75677490234375, -0.659515380859375, -0.562255859375, -0.464996337890625, -0.36773681640625, -0.270477294921875, -0.1732177734375, -0.075958251953125, 0.02130126953125, 0.118560791015625, 0.2158203125, 0.313079833984375, 0.41033935546875, 0.507598876953125, 0.6048583984375, 0.702117919921875, 0.79937744140625, 0.896636962890625, 0.993896484375, 1.091156005859375, 1.18841552734375, 1.285675048828125, 1.3829345703125, 1.480194091796875, 1.57745361328125, 1.674713134765625, 1.77197265625, 1.869232177734375, 1.96649169921875, 2.063751220703125, 2.1610107421875, 2.258270263671875, 2.35552978515625, 2.452789306640625, 2.550048828125, 2.647308349609375, 2.74456787109375, 2.841827392578125, 2.9390869140625, 3.036346435546875, 3.13360595703125, 3.230865478515625, 3.328125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 4.0, 6.0, 9.0, 11.0, 8.0, 16.0, 16.0, 19.0, 19.0, 35.0, 42.0, 65.0, 103.0, 261.0, 514.0, 1240.0, 3506.0, 11812.0, 56103.0, 394842.0, 2666773.0, 922823.0, 107962.0, 19949.0, 5101.0, 1716.0, 632.0, 305.0, 128.0, 67.0, 41.0, 32.0, 15.0, 24.0, 18.0, 7.0, 10.0, 12.0, 5.0, 4.0, 2.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.90625, -8.6251220703125, -8.343994140625, -8.0628662109375, -7.78173828125, -7.5006103515625, -7.219482421875, -6.9383544921875, -6.6572265625, -6.3760986328125, -6.094970703125, -5.8138427734375, -5.53271484375, -5.2515869140625, -4.970458984375, -4.6893310546875, -4.408203125, -4.1270751953125, -3.845947265625, -3.5648193359375, -3.28369140625, -3.0025634765625, -2.721435546875, -2.4403076171875, -2.1591796875, -1.8780517578125, -1.596923828125, -1.3157958984375, -1.03466796875, -0.7535400390625, -0.472412109375, -0.1912841796875, 0.08984375, 0.3709716796875, 0.652099609375, 0.9332275390625, 1.21435546875, 1.4954833984375, 1.776611328125, 2.0577392578125, 2.3388671875, 2.6199951171875, 2.901123046875, 3.1822509765625, 3.46337890625, 3.7445068359375, 4.025634765625, 4.3067626953125, 4.587890625, 4.8690185546875, 5.150146484375, 5.4312744140625, 5.71240234375, 5.9935302734375, 6.274658203125, 6.5557861328125, 6.8369140625, 7.1180419921875, 7.399169921875, 7.6802978515625, 7.96142578125, 8.2425537109375, 8.523681640625, 8.8048095703125, 9.0859375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 6.0, 5.0, 8.0, 11.0, 9.0, 14.0, 33.0, 43.0, 36.0, 57.0, 81.0, 133.0, 150.0, 190.0, 271.0, 326.0, 393.0, 452.0, 417.0, 370.0, 264.0, 205.0, 140.0, 113.0, 104.0, 63.0, 56.0, 38.0, 28.0, 22.0, 13.0, 4.0, 9.0, 1.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.19140625, -6.99493408203125, -6.7984619140625, -6.60198974609375, -6.405517578125, -6.20904541015625, -6.0125732421875, -5.81610107421875, -5.61962890625, -5.42315673828125, -5.2266845703125, -5.03021240234375, -4.833740234375, -4.63726806640625, -4.4407958984375, -4.24432373046875, -4.0478515625, -3.85137939453125, -3.6549072265625, -3.45843505859375, -3.261962890625, -3.06549072265625, -2.8690185546875, -2.67254638671875, -2.47607421875, -2.27960205078125, -2.0831298828125, -1.88665771484375, -1.690185546875, -1.49371337890625, -1.2972412109375, -1.10076904296875, -0.904296875, -0.70782470703125, -0.5113525390625, -0.31488037109375, -0.118408203125, 0.07806396484375, 0.2745361328125, 0.47100830078125, 0.66748046875, 0.86395263671875, 1.0604248046875, 1.25689697265625, 1.453369140625, 1.64984130859375, 1.8463134765625, 2.04278564453125, 2.2392578125, 2.43572998046875, 2.6322021484375, 2.82867431640625, 3.025146484375, 3.22161865234375, 3.4180908203125, 3.61456298828125, 3.81103515625, 4.00750732421875, 4.2039794921875, 4.40045166015625, 4.596923828125, 4.79339599609375, 4.9898681640625, 5.18634033203125, 5.3828125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 1.0, 2.0, 9.0, 4.0, 8.0, 17.0, 26.0, 31.0, 49.0, 61.0, 99.0, 174.0, 201.0, 373.0, 598.0, 1315.0, 3396.0, 12396.0, 63373.0, 427525.0, 2492910.0, 1021449.0, 136982.0, 23687.0, 5677.0, 1854.0, 819.0, 416.0, 255.0, 180.0, 110.0, 81.0, 65.0, 42.0, 28.0, 22.0, 16.0, 4.0, 9.0, 6.0, 0.0, 5.0, 0.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.984375, -10.626708984375, -10.26904296875, -9.911376953125, -9.5537109375, -9.196044921875, -8.83837890625, -8.480712890625, -8.123046875, -7.765380859375, -7.40771484375, -7.050048828125, -6.6923828125, -6.334716796875, -5.97705078125, -5.619384765625, -5.26171875, -4.904052734375, -4.54638671875, -4.188720703125, -3.8310546875, -3.473388671875, -3.11572265625, -2.758056640625, -2.400390625, -2.042724609375, -1.68505859375, -1.327392578125, -0.9697265625, -0.612060546875, -0.25439453125, 0.103271484375, 0.4609375, 0.818603515625, 1.17626953125, 1.533935546875, 1.8916015625, 2.249267578125, 2.60693359375, 2.964599609375, 3.322265625, 3.679931640625, 4.03759765625, 4.395263671875, 4.7529296875, 5.110595703125, 5.46826171875, 5.825927734375, 6.18359375, 6.541259765625, 6.89892578125, 7.256591796875, 7.6142578125, 7.971923828125, 8.32958984375, 8.687255859375, 9.044921875, 9.402587890625, 9.76025390625, 10.117919921875, 10.4755859375, 10.833251953125, 11.19091796875, 11.548583984375, 11.90625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 7.0, 22.0, 65.0, 87.0, 147.0, 128.0, 177.0, 156.0, 107.0, 57.0, 32.0, 14.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.0333251953125, -16.081329345703125, -14.129332542419434, -12.177335739135742, -10.225339889526367, -8.273344039916992, -6.321347236633301, -4.369350433349609, -2.4173545837402344, -0.46535825729370117, 1.486638069152832, 3.4386343955993652, 5.390630722045898, 7.342626571655273, 9.294623374938965, 11.246620178222656, 13.198616027832031, 15.150611877441406, 17.10260772705078, 19.05460548400879, 21.006601333618164, 22.95859718322754, 24.910594940185547, 26.862590789794922, 28.814586639404297, 30.766582489013672, 32.71857833862305, 34.67057418823242, 36.62257385253906, 38.57456970214844, 40.52656555175781, 42.47856140136719, 44.43055725097656, 46.38255310058594, 48.33454895019531, 50.28654479980469, 52.23854064941406, 54.19053649902344, 56.14253616333008, 58.09453201293945, 60.04652786254883, 61.9985237121582, 63.95051956176758, 65.90251922607422, 67.8545150756836, 69.80651092529297, 71.75850677490234, 73.71050262451172, 75.6624984741211, 77.61449432373047, 79.56649017333984, 81.51848602294922, 83.4704818725586, 85.42247772216797, 87.37447357177734, 89.32647705078125, 91.27847290039062, 93.23046875, 95.18246459960938, 97.13446044921875, 99.08645629882812, 101.0384521484375, 102.99044799804688, 104.94244384765625, 106.89443969726562]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 4.0, 9.0, 7.0, 7.0, 8.0, 16.0, 14.0, 15.0, 18.0, 26.0, 20.0, 29.0, 45.0, 31.0, 32.0, 39.0, 37.0, 37.0, 33.0, 47.0, 43.0, 36.0, 44.0, 27.0, 39.0, 49.0, 30.0, 38.0, 29.0, 25.0, 30.0, 33.0, 24.0, 11.0, 11.0, 16.0, 11.0, 8.0, 3.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-19.985031127929688, -19.326824188232422, -18.668617248535156, -18.01041030883789, -17.352203369140625, -16.69399642944336, -16.035789489746094, -15.377582550048828, -14.719375610351562, -14.061168670654297, -13.402961730957031, -12.744754791259766, -12.0865478515625, -11.428340911865234, -10.770133972167969, -10.111927032470703, -9.453720092773438, -8.795513153076172, -8.137306213378906, -7.479099273681641, -6.820892333984375, -6.162685394287109, -5.504478454589844, -4.846271514892578, -4.1880645751953125, -3.529857635498047, -2.8716506958007812, -2.2134437561035156, -1.55523681640625, -0.8970298767089844, -0.23882293701171875, 0.4193840026855469, 1.0775909423828125, 1.7357978820800781, 2.3940048217773438, 3.0522117614746094, 3.710418701171875, 4.368625640869141, 5.026832580566406, 5.685039520263672, 6.3432464599609375, 7.001453399658203, 7.659660339355469, 8.317867279052734, 8.97607421875, 9.634281158447266, 10.292488098144531, 10.950695037841797, 11.608901977539062, 12.267108917236328, 12.925315856933594, 13.58352279663086, 14.241729736328125, 14.89993667602539, 15.558143615722656, 16.216350555419922, 16.874557495117188, 17.532764434814453, 18.19097137451172, 18.849178314208984, 19.50738525390625, 20.165592193603516, 20.82379913330078, 21.482006072998047, 22.140213012695312]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 10.0, 8.0, 8.0, 10.0, 16.0, 20.0, 27.0, 16.0, 38.0, 26.0, 32.0, 36.0, 44.0, 41.0, 53.0, 59.0, 42.0, 65.0, 49.0, 42.0, 52.0, 39.0, 43.0, 27.0, 31.0, 37.0, 21.0, 23.0, 11.0, 14.0, 12.0, 10.0, 9.0, 4.0, 4.0, 5.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.216796875, -3.112548828125, -3.00830078125, -2.904052734375, -2.7998046875, -2.695556640625, -2.59130859375, -2.487060546875, -2.3828125, -2.278564453125, -2.17431640625, -2.070068359375, -1.9658203125, -1.861572265625, -1.75732421875, -1.653076171875, -1.548828125, -1.444580078125, -1.34033203125, -1.236083984375, -1.1318359375, -1.027587890625, -0.92333984375, -0.819091796875, -0.71484375, -0.610595703125, -0.50634765625, -0.402099609375, -0.2978515625, -0.193603515625, -0.08935546875, 0.014892578125, 0.119140625, 0.223388671875, 0.32763671875, 0.431884765625, 0.5361328125, 0.640380859375, 0.74462890625, 0.848876953125, 0.953125, 1.057373046875, 1.16162109375, 1.265869140625, 1.3701171875, 1.474365234375, 1.57861328125, 1.682861328125, 1.787109375, 1.891357421875, 1.99560546875, 2.099853515625, 2.2041015625, 2.308349609375, 2.41259765625, 2.516845703125, 2.62109375, 2.725341796875, 2.82958984375, 2.933837890625, 3.0380859375, 3.142333984375, 3.24658203125, 3.350830078125, 3.455078125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 2.0, 7.0, 0.0, 7.0, 11.0, 19.0, 20.0, 46.0, 45.0, 90.0, 121.0, 143.0, 241.0, 336.0, 492.0, 746.0, 1103.0, 1721.0, 2499.0, 3735.0, 5557.0, 8775.0, 13359.0, 20868.0, 33870.0, 57767.0, 104752.0, 199423.0, 259957.0, 140813.0, 75652.0, 42901.0, 25968.0, 16217.0, 10659.0, 6845.0, 4568.0, 2971.0, 2072.0, 1374.0, 872.0, 642.0, 392.0, 295.0, 191.0, 137.0, 104.0, 60.0, 41.0, 24.0, 24.0, 5.0, 7.0, 8.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0], "bins": [-0.021240234375, -0.02058124542236328, -0.019922256469726562, -0.019263267517089844, -0.018604278564453125, -0.017945289611816406, -0.017286300659179688, -0.01662731170654297, -0.01596832275390625, -0.015309333801269531, -0.014650344848632812, -0.013991355895996094, -0.013332366943359375, -0.012673377990722656, -0.012014389038085938, -0.011355400085449219, -0.0106964111328125, -0.010037422180175781, -0.009378433227539062, -0.008719444274902344, -0.008060455322265625, -0.007401466369628906, -0.0067424774169921875, -0.006083488464355469, -0.00542449951171875, -0.004765510559082031, -0.0041065216064453125, -0.0034475326538085938, -0.002788543701171875, -0.0021295547485351562, -0.0014705657958984375, -0.0008115768432617188, -0.000152587890625, 0.0005064010620117188, 0.0011653900146484375, 0.0018243789672851562, 0.002483367919921875, 0.0031423568725585938, 0.0038013458251953125, 0.004460334777832031, 0.00511932373046875, 0.005778312683105469, 0.0064373016357421875, 0.007096290588378906, 0.007755279541015625, 0.008414268493652344, 0.009073257446289062, 0.009732246398925781, 0.0103912353515625, 0.011050224304199219, 0.011709213256835938, 0.012368202209472656, 0.013027191162109375, 0.013686180114746094, 0.014345169067382812, 0.015004158020019531, 0.01566314697265625, 0.01632213592529297, 0.016981124877929688, 0.017640113830566406, 0.018299102783203125, 0.018958091735839844, 0.019617080688476562, 0.02027606964111328, 0.02093505859375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 9.0, 6.0, 4.0, 9.0, 10.0, 9.0, 17.0, 15.0, 15.0, 25.0, 29.0, 27.0, 29.0, 33.0, 31.0, 33.0, 50.0, 41.0, 31.0, 48.0, 1071.0, 44.0, 40.0, 30.0, 47.0, 33.0, 25.0, 30.0, 34.0, 29.0, 19.0, 23.0, 15.0, 29.0, 15.0, 8.0, 13.0, 6.0, 8.0, 9.0, 5.0, 4.0, 3.0, 3.0, 3.0, 5.0, 3.0, 2.0], "bins": [-2.4921875, -2.4244384765625, -2.356689453125, -2.2889404296875, -2.22119140625, -2.1534423828125, -2.085693359375, -2.0179443359375, -1.9501953125, -1.8824462890625, -1.814697265625, -1.7469482421875, -1.67919921875, -1.6114501953125, -1.543701171875, -1.4759521484375, -1.408203125, -1.3404541015625, -1.272705078125, -1.2049560546875, -1.13720703125, -1.0694580078125, -1.001708984375, -0.9339599609375, -0.8662109375, -0.7984619140625, -0.730712890625, -0.6629638671875, -0.59521484375, -0.5274658203125, -0.459716796875, -0.3919677734375, -0.32421875, -0.2564697265625, -0.188720703125, -0.1209716796875, -0.05322265625, 0.0145263671875, 0.082275390625, 0.1500244140625, 0.2177734375, 0.2855224609375, 0.353271484375, 0.4210205078125, 0.48876953125, 0.5565185546875, 0.624267578125, 0.6920166015625, 0.759765625, 0.8275146484375, 0.895263671875, 0.9630126953125, 1.03076171875, 1.0985107421875, 1.166259765625, 1.2340087890625, 1.3017578125, 1.3695068359375, 1.437255859375, 1.5050048828125, 1.57275390625, 1.6405029296875, 1.708251953125, 1.7760009765625, 1.84375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 15.0, 12.0, 21.0, 49.0, 55.0, 90.0, 116.0, 186.0, 247.0, 362.0, 519.0, 779.0, 1127.0, 1775.0, 2491.0, 3778.0, 5599.0, 8373.0, 13209.0, 19944.0, 30753.0, 47714.0, 76385.0, 124732.0, 1247160.0, 190729.0, 117746.0, 71987.0, 45624.0, 29100.0, 19220.0, 12520.0, 8127.0, 5443.0, 3723.0, 2350.0, 1608.0, 1127.0, 717.0, 496.0, 338.0, 275.0, 159.0, 118.0, 57.0, 61.0, 44.0, 21.0, 25.0, 12.0, 5.0, 5.0, 2.0, 4.0, 3.0], "bins": [-0.0082550048828125, -0.008011817932128906, -0.0077686309814453125, -0.007525444030761719, -0.007282257080078125, -0.007039070129394531, -0.0067958831787109375, -0.006552696228027344, -0.00630950927734375, -0.006066322326660156, -0.0058231353759765625, -0.005579948425292969, -0.005336761474609375, -0.005093574523925781, -0.0048503875732421875, -0.004607200622558594, -0.004364013671875, -0.004120826721191406, -0.0038776397705078125, -0.0036344528198242188, -0.003391265869140625, -0.0031480789184570312, -0.0029048919677734375, -0.0026617050170898438, -0.00241851806640625, -0.0021753311157226562, -0.0019321441650390625, -0.0016889572143554688, -0.001445770263671875, -0.0012025833129882812, -0.0009593963623046875, -0.0007162094116210938, -0.0004730224609375, -0.00022983551025390625, 1.33514404296875e-05, 0.00025653839111328125, 0.000499725341796875, 0.0007429122924804688, 0.0009860992431640625, 0.0012292861938476562, 0.00147247314453125, 0.0017156600952148438, 0.0019588470458984375, 0.0022020339965820312, 0.002445220947265625, 0.0026884078979492188, 0.0029315948486328125, 0.0031747817993164062, 0.00341796875, 0.0036611557006835938, 0.0039043426513671875, 0.004147529602050781, 0.004390716552734375, 0.004633903503417969, 0.0048770904541015625, 0.005120277404785156, 0.00536346435546875, 0.005606651306152344, 0.0058498382568359375, 0.006093025207519531, 0.006336212158203125, 0.006579399108886719, 0.0068225860595703125, 0.007065773010253906, 0.0073089599609375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 6.0, 0.0, 0.0, 6.0, 0.0, 6.0, 0.0, 9.0, 0.0, 0.0, 8.0, 0.0, 12.0, 0.0, 18.0, 0.0, 0.0, 19.0, 0.0, 29.0, 0.0, 0.0, 29.0, 0.0, 76.0, 0.0, 135.0, 0.0, 0.0, 309.0, 0.0, 161.0, 0.0, 78.0, 0.0, 0.0, 36.0, 0.0, 12.0, 0.0, 0.0, 16.0, 0.0, 14.0, 0.0, 10.0, 0.0, 0.0, 9.0, 0.0, 12.0, 0.0, 7.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.344650268554688e-07, -8.093193173408508e-07, -7.841736078262329e-07, -7.59027898311615e-07, -7.338821887969971e-07, -7.087364792823792e-07, -6.835907697677612e-07, -6.584450602531433e-07, -6.332993507385254e-07, -6.081536412239075e-07, -5.830079317092896e-07, -5.578622221946716e-07, -5.327165126800537e-07, -5.075708031654358e-07, -4.824250936508179e-07, -4.5727938413619995e-07, -4.3213367462158203e-07, -4.069879651069641e-07, -3.818422555923462e-07, -3.5669654607772827e-07, -3.3155083656311035e-07, -3.0640512704849243e-07, -2.812594175338745e-07, -2.561137080192566e-07, -2.3096799850463867e-07, -2.0582228899002075e-07, -1.8067657947540283e-07, -1.555308699607849e-07, -1.30385160446167e-07, -1.0523945093154907e-07, -8.009374141693115e-08, -5.494803190231323e-08, -2.9802322387695312e-08, -4.6566128730773926e-09, 2.0489096641540527e-08, 4.563480615615845e-08, 7.078051567077637e-08, 9.592622518539429e-08, 1.210719347000122e-07, 1.4621764421463013e-07, 1.7136335372924805e-07, 1.9650906324386597e-07, 2.2165477275848389e-07, 2.468004822731018e-07, 2.7194619178771973e-07, 2.9709190130233765e-07, 3.2223761081695557e-07, 3.473833203315735e-07, 3.725290298461914e-07, 3.976747393608093e-07, 4.2282044887542725e-07, 4.4796615839004517e-07, 4.731118679046631e-07, 4.98257577419281e-07, 5.234032869338989e-07, 5.485489964485168e-07, 5.736947059631348e-07, 5.988404154777527e-07, 6.239861249923706e-07, 6.491318345069885e-07, 6.742775440216064e-07, 6.994232535362244e-07, 7.245689630508423e-07, 7.497146725654602e-07, 7.748603820800781e-07]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 6.0, 2.0, 5.0, 3.0, 4.0, 2.0, 9.0, 6.0, 6.0, 6.0, 8.0, 11.0, 18.0, 17.0, 26.0, 40.0, 68.0, 118.0, 168.0, 329.0, 1606.0, 67539.0, 934463.0, 41656.0, 1625.0, 299.0, 165.0, 94.0, 50.0, 42.0, 31.0, 23.0, 16.0, 5.0, 19.0, 6.0, 12.0, 3.0, 5.0, 6.0, 7.0, 2.0, 7.0, 3.0, 1.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0], "bins": [-1.5556812286376953e-05, -1.5062279999256134e-05, -1.4567747712135315e-05, -1.4073215425014496e-05, -1.3578683137893677e-05, -1.3084150850772858e-05, -1.2589618563652039e-05, -1.209508627653122e-05, -1.16005539894104e-05, -1.1106021702289581e-05, -1.0611489415168762e-05, -1.0116957128047943e-05, -9.622424840927124e-06, -9.127892553806305e-06, -8.633360266685486e-06, -8.138827979564667e-06, -7.644295692443848e-06, -7.1497634053230286e-06, -6.6552311182022095e-06, -6.16069883108139e-06, -5.666166543960571e-06, -5.171634256839752e-06, -4.677101969718933e-06, -4.182569682598114e-06, -3.688037395477295e-06, -3.193505108356476e-06, -2.6989728212356567e-06, -2.2044405341148376e-06, -1.7099082469940186e-06, -1.2153759598731995e-06, -7.208436727523804e-07, -2.2631138563156128e-07, 2.682209014892578e-07, 7.627531886100769e-07, 1.257285475730896e-06, 1.751817762851715e-06, 2.246350049972534e-06, 2.7408823370933533e-06, 3.2354146242141724e-06, 3.7299469113349915e-06, 4.2244791984558105e-06, 4.71901148557663e-06, 5.213543772697449e-06, 5.708076059818268e-06, 6.202608346939087e-06, 6.697140634059906e-06, 7.191672921180725e-06, 7.686205208301544e-06, 8.180737495422363e-06, 8.675269782543182e-06, 9.169802069664001e-06, 9.66433435678482e-06, 1.015886664390564e-05, 1.0653398931026459e-05, 1.1147931218147278e-05, 1.1642463505268097e-05, 1.2136995792388916e-05, 1.2631528079509735e-05, 1.3126060366630554e-05, 1.3620592653751373e-05, 1.4115124940872192e-05, 1.4609657227993011e-05, 1.510418951511383e-05, 1.559872180223465e-05, 1.609325408935547e-05]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 14.0, 557.0, 436.0, 15.0], "bins": [-1.4749783076695167e-05, -1.4511805602523964e-05, -1.4273829037847463e-05, -1.403585156367626e-05, -1.379787499899976e-05, -1.3559897524828557e-05, -1.3321920050657354e-05, -1.3083943485980853e-05, -1.284596601180965e-05, -1.2607988537638448e-05, -1.2370011972961947e-05, -1.2132034498790745e-05, -1.1894057024619542e-05, -1.1656080459943041e-05, -1.1418102985771839e-05, -1.1180126421095338e-05, -1.0942148946924135e-05, -1.0704171472752932e-05, -1.0466194908076432e-05, -1.0228217433905229e-05, -9.990240869228728e-06, -9.752263395057525e-06, -9.514285920886323e-06, -9.276309356209822e-06, -9.03833188203862e-06, -8.800354407867417e-06, -8.562377843190916e-06, -8.324400369019713e-06, -8.08642289484851e-06, -7.84844633017201e-06, -7.610468856000807e-06, -7.372491836576955e-06, -7.1345152719004545e-06, -6.896538252476603e-06, -6.6585607783054e-06, -6.420583758881548e-06, -6.182606739457697e-06, -5.944629720033845e-06, -5.706652700609993e-06, -5.4686752264387906e-06, -5.230698207014939e-06, -4.992721187591087e-06, -4.7547437134198844e-06, -4.516766693996033e-06, -4.278789674572181e-06, -4.040812655148329e-06, -3.802835408350802e-06, -3.564858161553275e-06, -3.326881142129423e-06, -3.0889041227055714e-06, -2.850926875908044e-06, -2.612949629110517e-06, -2.3749726096866652e-06, -2.1369955902628135e-06, -1.8990183434652863e-06, -1.6610412103545968e-06, -1.4230640772439074e-06, -1.185086944133218e-06, -9.471098110225284e-07, -7.09132677911839e-07, -4.711555448011495e-07, -2.3317841169046005e-07, 4.798721420229413e-09, 2.427758545309189e-07, 4.807529876416083e-07]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 4.0, 0.0, 0.0, 14.0, 0.0, 0.0, 49.0, 0.0, 0.0, 114.0, 0.0, 0.0, 197.0, 0.0, 0.0, 255.0, 0.0, 0.0, 212.0, 0.0, 105.0, 0.0, 0.0, 42.0, 0.0, 0.0, 15.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539062e-07, -5.755573511123657e-07, -5.550682544708252e-07, -5.345791578292847e-07, -5.140900611877441e-07, -4.936009645462036e-07, -4.731118679046631e-07, -4.5262277126312256e-07, -4.3213367462158203e-07, -4.116445779800415e-07, -3.91155481338501e-07, -3.7066638469696045e-07, -3.501772880554199e-07, -3.296881914138794e-07, -3.0919909477233887e-07, -2.8870999813079834e-07, -2.682209014892578e-07, -2.477318048477173e-07, -2.2724270820617676e-07, -2.0675361156463623e-07, -1.862645149230957e-07, -1.6577541828155518e-07, -1.4528632164001465e-07, -1.2479722499847412e-07, -1.043081283569336e-07, -8.381903171539307e-08, -6.332993507385254e-08, -4.284083843231201e-08, -2.2351741790771484e-08, -1.862645149230957e-09, 1.862645149230957e-08, 3.91155481338501e-08, 5.960464477539063e-08, 8.009374141693115e-08, 1.0058283805847168e-07, 1.210719347000122e-07, 1.4156103134155273e-07, 1.6205012798309326e-07, 1.825392246246338e-07, 2.0302832126617432e-07, 2.2351741790771484e-07, 2.4400651454925537e-07, 2.644956111907959e-07, 2.849847078323364e-07, 3.0547380447387695e-07, 3.259629011154175e-07, 3.46451997756958e-07, 3.6694109439849854e-07, 3.8743019104003906e-07, 4.079192876815796e-07, 4.284083843231201e-07, 4.4889748096466064e-07, 4.6938657760620117e-07, 4.898756742477417e-07, 5.103647708892822e-07, 5.308538675308228e-07, 5.513429641723633e-07, 5.718320608139038e-07, 5.923211574554443e-07, 6.128102540969849e-07, 6.332993507385254e-07, 6.537884473800659e-07, 6.742775440216064e-07, 6.94766640663147e-07, 7.152557373046875e-07]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 10.0, 8.0, 8.0, 10.0, 16.0, 20.0, 27.0, 16.0, 38.0, 26.0, 32.0, 36.0, 44.0, 41.0, 53.0, 59.0, 42.0, 65.0, 49.0, 42.0, 52.0, 39.0, 43.0, 27.0, 31.0, 37.0, 21.0, 23.0, 11.0, 14.0, 12.0, 10.0, 9.0, 4.0, 4.0, 5.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.216796875, -3.112548828125, -3.00830078125, -2.904052734375, -2.7998046875, -2.695556640625, -2.59130859375, -2.487060546875, -2.3828125, -2.278564453125, -2.17431640625, -2.070068359375, -1.9658203125, -1.861572265625, -1.75732421875, -1.653076171875, -1.548828125, -1.444580078125, -1.34033203125, -1.236083984375, -1.1318359375, -1.027587890625, -0.92333984375, -0.819091796875, -0.71484375, -0.610595703125, -0.50634765625, -0.402099609375, -0.2978515625, -0.193603515625, -0.08935546875, 0.014892578125, 0.119140625, 0.223388671875, 0.32763671875, 0.431884765625, 0.5361328125, 0.640380859375, 0.74462890625, 0.848876953125, 0.953125, 1.057373046875, 1.16162109375, 1.265869140625, 1.3701171875, 1.474365234375, 1.57861328125, 1.682861328125, 1.787109375, 1.891357421875, 1.99560546875, 2.099853515625, 2.2041015625, 2.308349609375, 2.41259765625, 2.516845703125, 2.62109375, 2.725341796875, 2.82958984375, 2.933837890625, 3.0380859375, 3.142333984375, 3.24658203125, 3.350830078125, 3.455078125]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 13.0, 13.0, 28.0, 25.0, 52.0, 84.0, 132.0, 220.0, 328.0, 590.0, 938.0, 1537.0, 2369.0, 3801.0, 6246.0, 10002.0, 16018.0, 25299.0, 40877.0, 69737.0, 144521.0, 347585.0, 177670.0, 79820.0, 45388.0, 27950.0, 17751.0, 11412.0, 6861.0, 4333.0, 2736.0, 1597.0, 1006.0, 596.0, 405.0, 220.0, 137.0, 87.0, 69.0, 36.0, 28.0, 19.0, 9.0, 6.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.08984375, -2.992095947265625, -2.89434814453125, -2.796600341796875, -2.6988525390625, -2.601104736328125, -2.50335693359375, -2.405609130859375, -2.307861328125, -2.210113525390625, -2.11236572265625, -2.014617919921875, -1.9168701171875, -1.819122314453125, -1.72137451171875, -1.623626708984375, -1.52587890625, -1.428131103515625, -1.33038330078125, -1.232635498046875, -1.1348876953125, -1.037139892578125, -0.93939208984375, -0.841644287109375, -0.743896484375, -0.646148681640625, -0.54840087890625, -0.450653076171875, -0.3529052734375, -0.255157470703125, -0.15740966796875, -0.059661865234375, 0.0380859375, 0.135833740234375, 0.23358154296875, 0.331329345703125, 0.4290771484375, 0.526824951171875, 0.62457275390625, 0.722320556640625, 0.820068359375, 0.917816162109375, 1.01556396484375, 1.113311767578125, 1.2110595703125, 1.308807373046875, 1.40655517578125, 1.504302978515625, 1.60205078125, 1.699798583984375, 1.79754638671875, 1.895294189453125, 1.9930419921875, 2.090789794921875, 2.18853759765625, 2.286285400390625, 2.384033203125, 2.481781005859375, 2.57952880859375, 2.677276611328125, 2.7750244140625, 2.872772216796875, 2.97052001953125, 3.068267822265625, 3.166015625]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 1.0, 7.0, 6.0, 15.0, 8.0, 14.0, 13.0, 23.0, 19.0, 18.0, 29.0, 29.0, 25.0, 39.0, 27.0, 68.0, 63.0, 93.0, 174.0, 1559.0, 248.0, 137.0, 56.0, 56.0, 39.0, 38.0, 33.0, 40.0, 28.0, 25.0, 16.0, 26.0, 14.0, 16.0, 14.0, 10.0, 5.0, 6.0, 3.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.015625, -9.69970703125, -9.3837890625, -9.06787109375, -8.751953125, -8.43603515625, -8.1201171875, -7.80419921875, -7.48828125, -7.17236328125, -6.8564453125, -6.54052734375, -6.224609375, -5.90869140625, -5.5927734375, -5.27685546875, -4.9609375, -4.64501953125, -4.3291015625, -4.01318359375, -3.697265625, -3.38134765625, -3.0654296875, -2.74951171875, -2.43359375, -2.11767578125, -1.8017578125, -1.48583984375, -1.169921875, -0.85400390625, -0.5380859375, -0.22216796875, 0.09375, 0.40966796875, 0.7255859375, 1.04150390625, 1.357421875, 1.67333984375, 1.9892578125, 2.30517578125, 2.62109375, 2.93701171875, 3.2529296875, 3.56884765625, 3.884765625, 4.20068359375, 4.5166015625, 4.83251953125, 5.1484375, 5.46435546875, 5.7802734375, 6.09619140625, 6.412109375, 6.72802734375, 7.0439453125, 7.35986328125, 7.67578125, 7.99169921875, 8.3076171875, 8.62353515625, 8.939453125, 9.25537109375, 9.5712890625, 9.88720703125, 10.203125]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 11.0, 15.0, 9.0, 26.0, 17.0, 28.0, 31.0, 48.0, 43.0, 83.0, 109.0, 112.0, 173.0, 236.0, 526.0, 2041.0, 20179.0, 549162.0, 2519264.0, 47947.0, 3792.0, 752.0, 323.0, 186.0, 114.0, 102.0, 86.0, 68.0, 35.0, 34.0, 25.0, 25.0, 23.0, 13.0, 12.0, 14.0, 9.0, 7.0, 5.0, 1.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-17.71875, -17.167724609375, -16.61669921875, -16.065673828125, -15.5146484375, -14.963623046875, -14.41259765625, -13.861572265625, -13.310546875, -12.759521484375, -12.20849609375, -11.657470703125, -11.1064453125, -10.555419921875, -10.00439453125, -9.453369140625, -8.90234375, -8.351318359375, -7.80029296875, -7.249267578125, -6.6982421875, -6.147216796875, -5.59619140625, -5.045166015625, -4.494140625, -3.943115234375, -3.39208984375, -2.841064453125, -2.2900390625, -1.739013671875, -1.18798828125, -0.636962890625, -0.0859375, 0.465087890625, 1.01611328125, 1.567138671875, 2.1181640625, 2.669189453125, 3.22021484375, 3.771240234375, 4.322265625, 4.873291015625, 5.42431640625, 5.975341796875, 6.5263671875, 7.077392578125, 7.62841796875, 8.179443359375, 8.73046875, 9.281494140625, 9.83251953125, 10.383544921875, 10.9345703125, 11.485595703125, 12.03662109375, 12.587646484375, 13.138671875, 13.689697265625, 14.24072265625, 14.791748046875, 15.3427734375, 15.893798828125, 16.44482421875, 16.995849609375, 17.546875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 7.0, 5.0, 7.0, 11.0, 15.0, 15.0, 29.0, 39.0, 36.0, 47.0, 44.0, 60.0, 64.0, 69.0, 73.0, 54.0, 50.0, 52.0, 60.0, 45.0, 46.0, 33.0, 35.0, 30.0, 18.0, 18.0, 7.0, 13.0, 8.0, 7.0, 3.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.862521171569824, -13.496307373046875, -13.13009262084961, -12.76387882232666, -12.397665023803711, -12.031450271606445, -11.665236473083496, -11.299022674560547, -10.932807922363281, -10.566594123840332, -10.200379371643066, -9.834165573120117, -9.467950820922852, -9.101737022399902, -8.735523223876953, -8.369308471679688, -8.003094673156738, -7.636880397796631, -7.270666122436523, -6.904452323913574, -6.538238048553467, -6.172023773193359, -5.80580997467041, -5.439595699310303, -5.073381423950195, -4.707167148590088, -4.3409528732299805, -3.9747390747070312, -3.608524799346924, -3.2423105239868164, -2.876096487045288, -2.5098824501037598, -2.143667221069336, -1.777453064918518, -1.4112389087677002, -1.0450247526168823, -0.6788105964660645, -0.3125964403152466, 0.05361771583557129, 0.4198317527770996, 0.786046028137207, 1.152260184288025, 1.5184743404388428, 1.8846884965896606, 2.2509026527404785, 2.617116928100586, 2.9833309650421143, 3.3495450019836426, 3.71575927734375, 4.081973552703857, 4.448187828063965, 4.814401626586914, 5.1806159019470215, 5.546830177307129, 5.913043975830078, 6.2792582511901855, 6.645472526550293, 7.0116868019104, 7.377901077270508, 7.744114875793457, 8.110328674316406, 8.476543426513672, 8.842757225036621, 9.20897102355957, 9.575185775756836]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 3.0, 11.0, 12.0, 8.0, 14.0, 21.0, 20.0, 25.0, 21.0, 31.0, 28.0, 35.0, 34.0, 38.0, 38.0, 35.0, 51.0, 43.0, 49.0, 48.0, 32.0, 42.0, 39.0, 40.0, 34.0, 37.0, 16.0, 33.0, 20.0, 23.0, 19.0, 9.0, 17.0, 11.0, 11.0, 13.0, 6.0, 5.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-30.117591857910156, -29.18962287902832, -28.261655807495117, -27.33368682861328, -26.405719757080078, -25.477750778198242, -24.549781799316406, -23.621814727783203, -22.69384765625, -21.765878677368164, -20.83791160583496, -19.909942626953125, -18.981975555419922, -18.054006576538086, -17.12603759765625, -16.198070526123047, -15.270101547241211, -14.342133522033691, -13.414165496826172, -12.486196517944336, -11.558229446411133, -10.630260467529297, -9.702292442321777, -8.774324417114258, -7.846356391906738, -6.918388366699219, -5.990420341491699, -5.0624518394470215, -4.134483814239502, -3.2065157890319824, -2.2785472869873047, -1.3505792617797852, -0.42261314392089844, 0.5053550004959106, 1.4333231449127197, 2.3612914085388184, 3.289259433746338, 4.217227458953857, 5.145195960998535, 6.073163986206055, 7.001132011413574, 7.929100036621094, 8.857068061828613, 9.785036087036133, 10.713005065917969, 11.640972137451172, 12.568941116333008, 13.496909141540527, 14.424877166748047, 15.352845191955566, 16.280813217163086, 17.208782196044922, 18.136749267578125, 19.06471824645996, 19.992687225341797, 20.920654296875, 21.848621368408203, 22.77659034729004, 23.704557418823242, 24.632526397705078, 25.56049346923828, 26.488462448120117, 27.416431427001953, 28.344398498535156, 29.272367477416992]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 6.0, 5.0, 7.0, 18.0, 14.0, 23.0, 13.0, 24.0, 24.0, 28.0, 37.0, 32.0, 43.0, 39.0, 39.0, 54.0, 59.0, 52.0, 54.0, 53.0, 55.0, 33.0, 40.0, 35.0, 37.0, 34.0, 28.0, 20.0, 18.0, 15.0, 12.0, 10.0, 10.0, 5.0, 6.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.185546875, -3.077178955078125, -2.96881103515625, -2.860443115234375, -2.7520751953125, -2.643707275390625, -2.53533935546875, -2.426971435546875, -2.318603515625, -2.210235595703125, -2.10186767578125, -1.993499755859375, -1.8851318359375, -1.776763916015625, -1.66839599609375, -1.560028076171875, -1.45166015625, -1.343292236328125, -1.23492431640625, -1.126556396484375, -1.0181884765625, -0.909820556640625, -0.80145263671875, -0.693084716796875, -0.584716796875, -0.476348876953125, -0.36798095703125, -0.259613037109375, -0.1512451171875, -0.042877197265625, 0.06549072265625, 0.173858642578125, 0.2822265625, 0.390594482421875, 0.49896240234375, 0.607330322265625, 0.7156982421875, 0.824066162109375, 0.93243408203125, 1.040802001953125, 1.149169921875, 1.257537841796875, 1.36590576171875, 1.474273681640625, 1.5826416015625, 1.691009521484375, 1.79937744140625, 1.907745361328125, 2.01611328125, 2.124481201171875, 2.23284912109375, 2.341217041015625, 2.4495849609375, 2.557952880859375, 2.66632080078125, 2.774688720703125, 2.883056640625, 2.991424560546875, 3.09979248046875, 3.208160400390625, 3.3165283203125, 3.424896240234375, 3.53326416015625, 3.641632080078125, 3.75]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 4.0, 4.0, 10.0, 14.0, 19.0, 24.0, 43.0, 47.0, 70.0, 87.0, 138.0, 218.0, 371.0, 609.0, 1343.0, 3279.0, 9382.0, 31020.0, 137409.0, 868842.0, 2413792.0, 590936.0, 100293.0, 23660.0, 7342.0, 2709.0, 1211.0, 501.0, 316.0, 194.0, 119.0, 73.0, 53.0, 41.0, 22.0, 24.0, 13.0, 11.0, 5.0, 9.0, 3.0, 4.0, 3.0, 7.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.58203125, -7.3480224609375, -7.114013671875, -6.8800048828125, -6.64599609375, -6.4119873046875, -6.177978515625, -5.9439697265625, -5.7099609375, -5.4759521484375, -5.241943359375, -5.0079345703125, -4.77392578125, -4.5399169921875, -4.305908203125, -4.0718994140625, -3.837890625, -3.6038818359375, -3.369873046875, -3.1358642578125, -2.90185546875, -2.6678466796875, -2.433837890625, -2.1998291015625, -1.9658203125, -1.7318115234375, -1.497802734375, -1.2637939453125, -1.02978515625, -0.7957763671875, -0.561767578125, -0.3277587890625, -0.09375, 0.1402587890625, 0.374267578125, 0.6082763671875, 0.84228515625, 1.0762939453125, 1.310302734375, 1.5443115234375, 1.7783203125, 2.0123291015625, 2.246337890625, 2.4803466796875, 2.71435546875, 2.9483642578125, 3.182373046875, 3.4163818359375, 3.650390625, 3.8843994140625, 4.118408203125, 4.3524169921875, 4.58642578125, 4.8204345703125, 5.054443359375, 5.2884521484375, 5.5224609375, 5.7564697265625, 5.990478515625, 6.2244873046875, 6.45849609375, 6.6925048828125, 6.926513671875, 7.1605224609375, 7.39453125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 8.0, 5.0, 14.0, 8.0, 21.0, 27.0, 39.0, 73.0, 82.0, 113.0, 175.0, 235.0, 345.0, 403.0, 528.0, 488.0, 385.0, 313.0, 253.0, 176.0, 123.0, 77.0, 50.0, 46.0, 34.0, 21.0, 18.0, 6.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.078125, -8.84515380859375, -8.6121826171875, -8.37921142578125, -8.146240234375, -7.91326904296875, -7.6802978515625, -7.44732666015625, -7.21435546875, -6.98138427734375, -6.7484130859375, -6.51544189453125, -6.282470703125, -6.04949951171875, -5.8165283203125, -5.58355712890625, -5.3505859375, -5.11761474609375, -4.8846435546875, -4.65167236328125, -4.418701171875, -4.18572998046875, -3.9527587890625, -3.71978759765625, -3.48681640625, -3.25384521484375, -3.0208740234375, -2.78790283203125, -2.554931640625, -2.32196044921875, -2.0889892578125, -1.85601806640625, -1.623046875, -1.39007568359375, -1.1571044921875, -0.92413330078125, -0.691162109375, -0.45819091796875, -0.2252197265625, 0.00775146484375, 0.24072265625, 0.47369384765625, 0.7066650390625, 0.93963623046875, 1.172607421875, 1.40557861328125, 1.6385498046875, 1.87152099609375, 2.1044921875, 2.33746337890625, 2.5704345703125, 2.80340576171875, 3.036376953125, 3.26934814453125, 3.5023193359375, 3.73529052734375, 3.96826171875, 4.20123291015625, 4.4342041015625, 4.66717529296875, 4.900146484375, 5.13311767578125, 5.3660888671875, 5.59906005859375, 5.83203125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 3.0, 13.0, 14.0, 18.0, 22.0, 37.0, 42.0, 60.0, 104.0, 119.0, 244.0, 361.0, 753.0, 1935.0, 14287.0, 275164.0, 3401121.0, 474061.0, 21415.0, 2619.0, 754.0, 379.0, 232.0, 150.0, 106.0, 83.0, 57.0, 34.0, 25.0, 15.0, 10.0, 10.0, 10.0, 6.0, 8.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8671875, -14.2623291015625, -13.657470703125, -13.0526123046875, -12.44775390625, -11.8428955078125, -11.238037109375, -10.6331787109375, -10.0283203125, -9.4234619140625, -8.818603515625, -8.2137451171875, -7.60888671875, -7.0040283203125, -6.399169921875, -5.7943115234375, -5.189453125, -4.5845947265625, -3.979736328125, -3.3748779296875, -2.77001953125, -2.1651611328125, -1.560302734375, -0.9554443359375, -0.3505859375, 0.2542724609375, 0.859130859375, 1.4639892578125, 2.06884765625, 2.6737060546875, 3.278564453125, 3.8834228515625, 4.48828125, 5.0931396484375, 5.697998046875, 6.3028564453125, 6.90771484375, 7.5125732421875, 8.117431640625, 8.7222900390625, 9.3271484375, 9.9320068359375, 10.536865234375, 11.1417236328125, 11.74658203125, 12.3514404296875, 12.956298828125, 13.5611572265625, 14.166015625, 14.7708740234375, 15.375732421875, 15.9805908203125, 16.58544921875, 17.1903076171875, 17.795166015625, 18.4000244140625, 19.0048828125, 19.6097412109375, 20.214599609375, 20.8194580078125, 21.42431640625, 22.0291748046875, 22.634033203125, 23.2388916015625, 23.84375]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 13.0, 14.0, 28.0, 41.0, 60.0, 71.0, 85.0, 96.0, 98.0, 114.0, 101.0, 74.0, 67.0, 43.0, 35.0, 24.0, 16.0, 13.0, 10.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.36457633972168, -21.12825584411621, -19.891935348510742, -18.655614852905273, -17.419294357299805, -16.182973861694336, -14.946653366088867, -13.710332870483398, -12.47401237487793, -11.237691879272461, -10.001371383666992, -8.765050888061523, -7.528730392456055, -6.292409896850586, -5.056089401245117, -3.8197689056396484, -2.5834484100341797, -1.347127914428711, -0.11080741882324219, 1.1255130767822266, 2.3618335723876953, 3.598154067993164, 4.834474563598633, 6.070795059204102, 7.30711555480957, 8.543436050415039, 9.779756546020508, 11.016077041625977, 12.252397537231445, 13.488718032836914, 14.725038528442383, 15.961359024047852, 17.197681427001953, 18.434001922607422, 19.67032241821289, 20.90664291381836, 22.142963409423828, 23.379283905029297, 24.615604400634766, 25.851924896240234, 27.088245391845703, 28.324565887451172, 29.56088638305664, 30.79720687866211, 32.03352737426758, 33.26984786987305, 34.506168365478516, 35.742488861083984, 36.97880935668945, 38.21512985229492, 39.45145034790039, 40.68777084350586, 41.92409133911133, 43.1604118347168, 44.396732330322266, 45.633052825927734, 46.8693733215332, 48.10569381713867, 49.34201431274414, 50.57833480834961, 51.81465530395508, 53.05097579956055, 54.287296295166016, 55.523616790771484, 56.75993728637695]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 4.0, 5.0, 2.0, 10.0, 11.0, 10.0, 17.0, 17.0, 18.0, 20.0, 23.0, 25.0, 25.0, 35.0, 35.0, 38.0, 44.0, 42.0, 38.0, 32.0, 42.0, 41.0, 34.0, 40.0, 37.0, 33.0, 41.0, 33.0, 31.0, 20.0, 24.0, 33.0, 26.0, 17.0, 14.0, 15.0, 15.0, 22.0, 9.0, 6.0, 9.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.292266845703125, -19.617502212524414, -18.942737579345703, -18.267972946166992, -17.59320831298828, -16.918445587158203, -16.243680953979492, -15.568916320800781, -14.89415168762207, -14.21938705444336, -13.544622421264648, -12.869858741760254, -12.195094108581543, -11.520329475402832, -10.845565795898438, -10.170801162719727, -9.496036529541016, -8.821271896362305, -8.146507263183594, -7.471743583679199, -6.796978950500488, -6.122214317321777, -5.447450160980225, -4.772686004638672, -4.097921371459961, -3.423156976699829, -2.7483925819396973, -2.0736281871795654, -1.3988637924194336, -0.7240993976593018, -0.04933500289916992, 0.6254291534423828, 1.3001937866210938, 1.9749581813812256, 2.6497225761413574, 3.3244869709014893, 3.999251365661621, 4.674015998840332, 5.348780155181885, 6.0235443115234375, 6.698308944702148, 7.373073577880859, 8.04783821105957, 8.722601890563965, 9.397366523742676, 10.072131156921387, 10.746894836425781, 11.421659469604492, 12.096424102783203, 12.771188735961914, 13.445953369140625, 14.12071704864502, 14.79548168182373, 15.470246315002441, 16.145009994506836, 16.819774627685547, 17.494539260864258, 18.16930389404297, 18.84406852722168, 19.51883316040039, 20.19359588623047, 20.86836051940918, 21.54312515258789, 22.2178897857666, 22.892654418945312]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 8.0, 9.0, 17.0, 17.0, 13.0, 25.0, 18.0, 23.0, 22.0, 35.0, 33.0, 35.0, 49.0, 46.0, 43.0, 55.0, 54.0, 53.0, 53.0, 49.0, 40.0, 40.0, 42.0, 30.0, 36.0, 30.0, 21.0, 21.0, 17.0, 12.0, 16.0, 10.0, 6.0, 5.0, 3.0, 2.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.99609375, -2.88812255859375, -2.7801513671875, -2.67218017578125, -2.564208984375, -2.45623779296875, -2.3482666015625, -2.24029541015625, -2.13232421875, -2.02435302734375, -1.9163818359375, -1.80841064453125, -1.700439453125, -1.59246826171875, -1.4844970703125, -1.37652587890625, -1.2685546875, -1.16058349609375, -1.0526123046875, -0.94464111328125, -0.836669921875, -0.72869873046875, -0.6207275390625, -0.51275634765625, -0.40478515625, -0.29681396484375, -0.1888427734375, -0.08087158203125, 0.027099609375, 0.13507080078125, 0.2430419921875, 0.35101318359375, 0.458984375, 0.56695556640625, 0.6749267578125, 0.78289794921875, 0.890869140625, 0.99884033203125, 1.1068115234375, 1.21478271484375, 1.32275390625, 1.43072509765625, 1.5386962890625, 1.64666748046875, 1.754638671875, 1.86260986328125, 1.9705810546875, 2.07855224609375, 2.1865234375, 2.29449462890625, 2.4024658203125, 2.51043701171875, 2.618408203125, 2.72637939453125, 2.8343505859375, 2.94232177734375, 3.05029296875, 3.15826416015625, 3.2662353515625, 3.37420654296875, 3.482177734375, 3.59014892578125, 3.6981201171875, 3.80609130859375, 3.9140625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 7.0, 9.0, 12.0, 24.0, 29.0, 43.0, 67.0, 107.0, 129.0, 216.0, 369.0, 510.0, 830.0, 1264.0, 1855.0, 2822.0, 4251.0, 6854.0, 10624.0, 17129.0, 28195.0, 48015.0, 84003.0, 158603.0, 273268.0, 179847.0, 93977.0, 53097.0, 31310.0, 18792.0, 11362.0, 7270.0, 4723.0, 3031.0, 2055.0, 1359.0, 855.0, 544.0, 336.0, 244.0, 176.0, 126.0, 77.0, 50.0, 33.0, 15.0, 12.0, 9.0, 5.0, 5.0, 2.0, 6.0, 0.0, 3.0, 5.0, 0.0, 1.0], "bins": [-0.0206756591796875, -0.02002120018005371, -0.019366741180419922, -0.018712282180786133, -0.018057823181152344, -0.017403364181518555, -0.016748905181884766, -0.016094446182250977, -0.015439987182617188, -0.014785528182983398, -0.01413106918334961, -0.01347661018371582, -0.012822151184082031, -0.012167692184448242, -0.011513233184814453, -0.010858774185180664, -0.010204315185546875, -0.009549856185913086, -0.008895397186279297, -0.008240938186645508, -0.007586479187011719, -0.00693202018737793, -0.006277561187744141, -0.0056231021881103516, -0.0049686431884765625, -0.0043141841888427734, -0.0036597251892089844, -0.0030052661895751953, -0.0023508071899414062, -0.0016963481903076172, -0.0010418891906738281, -0.00038743019104003906, 0.00026702880859375, 0.0009214878082275391, 0.0015759468078613281, 0.002230405807495117, 0.0028848648071289062, 0.0035393238067626953, 0.004193782806396484, 0.0048482418060302734, 0.0055027008056640625, 0.0061571598052978516, 0.006811618804931641, 0.00746607780456543, 0.008120536804199219, 0.008774995803833008, 0.009429454803466797, 0.010083913803100586, 0.010738372802734375, 0.011392831802368164, 0.012047290802001953, 0.012701749801635742, 0.013356208801269531, 0.01401066780090332, 0.01466512680053711, 0.015319585800170898, 0.015974044799804688, 0.016628503799438477, 0.017282962799072266, 0.017937421798706055, 0.018591880798339844, 0.019246339797973633, 0.019900798797607422, 0.02055525779724121, 0.021209716796875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 7.0, 9.0, 12.0, 8.0, 13.0, 13.0, 17.0, 27.0, 28.0, 35.0, 30.0, 27.0, 44.0, 32.0, 35.0, 40.0, 37.0, 42.0, 1059.0, 52.0, 52.0, 43.0, 33.0, 43.0, 32.0, 43.0, 34.0, 29.0, 28.0, 18.0, 18.0, 21.0, 22.0, 13.0, 6.0, 6.0, 5.0, 7.0, 1.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7890625, -2.708740234375, -2.62841796875, -2.548095703125, -2.4677734375, -2.387451171875, -2.30712890625, -2.226806640625, -2.146484375, -2.066162109375, -1.98583984375, -1.905517578125, -1.8251953125, -1.744873046875, -1.66455078125, -1.584228515625, -1.50390625, -1.423583984375, -1.34326171875, -1.262939453125, -1.1826171875, -1.102294921875, -1.02197265625, -0.941650390625, -0.861328125, -0.781005859375, -0.70068359375, -0.620361328125, -0.5400390625, -0.459716796875, -0.37939453125, -0.299072265625, -0.21875, -0.138427734375, -0.05810546875, 0.022216796875, 0.1025390625, 0.182861328125, 0.26318359375, 0.343505859375, 0.423828125, 0.504150390625, 0.58447265625, 0.664794921875, 0.7451171875, 0.825439453125, 0.90576171875, 0.986083984375, 1.06640625, 1.146728515625, 1.22705078125, 1.307373046875, 1.3876953125, 1.468017578125, 1.54833984375, 1.628662109375, 1.708984375, 1.789306640625, 1.86962890625, 1.949951171875, 2.0302734375, 2.110595703125, 2.19091796875, 2.271240234375, 2.3515625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 5.0, 5.0, 16.0, 27.0, 29.0, 56.0, 97.0, 123.0, 178.0, 301.0, 430.0, 618.0, 1029.0, 1654.0, 2505.0, 3915.0, 6323.0, 10089.0, 16115.0, 25685.0, 41760.0, 66430.0, 108868.0, 179760.0, 1261693.0, 142289.0, 85391.0, 52979.0, 33188.0, 20493.0, 13061.0, 8163.0, 5041.0, 3154.0, 2056.0, 1237.0, 804.0, 527.0, 393.0, 228.0, 127.0, 83.0, 73.0, 44.0, 34.0, 16.0, 8.0, 7.0, 9.0, 4.0, 5.0, 2.0, 5.0, 0.0, 0.0, 1.0], "bins": [-0.008941650390625, -0.008664488792419434, -0.008387327194213867, -0.0081101655960083, -0.007833003997802734, -0.007555842399597168, -0.0072786808013916016, -0.007001519203186035, -0.006724357604980469, -0.006447196006774902, -0.006170034408569336, -0.0058928728103637695, -0.005615711212158203, -0.005338549613952637, -0.00506138801574707, -0.004784226417541504, -0.0045070648193359375, -0.004229903221130371, -0.003952741622924805, -0.0036755800247192383, -0.003398418426513672, -0.0031212568283081055, -0.002844095230102539, -0.0025669336318969727, -0.0022897720336914062, -0.00201261043548584, -0.0017354488372802734, -0.001458287239074707, -0.0011811256408691406, -0.0009039640426635742, -0.0006268024444580078, -0.0003496408462524414, -7.2479248046875e-05, 0.0002046823501586914, 0.0004818439483642578, 0.0007590055465698242, 0.0010361671447753906, 0.001313328742980957, 0.0015904903411865234, 0.0018676519393920898, 0.0021448135375976562, 0.0024219751358032227, 0.002699136734008789, 0.0029762983322143555, 0.003253459930419922, 0.0035306215286254883, 0.0038077831268310547, 0.004084944725036621, 0.0043621063232421875, 0.004639267921447754, 0.00491642951965332, 0.005193591117858887, 0.005470752716064453, 0.0057479143142700195, 0.006025075912475586, 0.006302237510681152, 0.006579399108886719, 0.006856560707092285, 0.0071337223052978516, 0.007410883903503418, 0.007688045501708984, 0.00796520709991455, 0.008242368698120117, 0.008519530296325684, 0.00879669189453125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 0.0, 11.0, 13.0, 0.0, 16.0, 23.0, 0.0, 25.0, 26.0, 0.0, 34.0, 0.0, 63.0, 149.0, 0.0, 261.0, 130.0, 0.0, 66.0, 34.0, 0.0, 35.0, 24.0, 0.0, 26.0, 13.0, 0.0, 8.0, 11.0, 0.0, 6.0, 8.0, 0.0, 2.0, 1.0, 0.0, 3.0, 8.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.3709068298339844e-06, -1.3317912817001343e-06, -1.2926757335662842e-06, -1.253560185432434e-06, -1.214444637298584e-06, -1.1753290891647339e-06, -1.1362135410308838e-06, -1.0970979928970337e-06, -1.0579824447631836e-06, -1.0188668966293335e-06, -9.797513484954834e-07, -9.406358003616333e-07, -9.015202522277832e-07, -8.624047040939331e-07, -8.23289155960083e-07, -7.841736078262329e-07, -7.450580596923828e-07, -7.059425115585327e-07, -6.668269634246826e-07, -6.277114152908325e-07, -5.885958671569824e-07, -5.494803190231323e-07, -5.103647708892822e-07, -4.7124922275543213e-07, -4.3213367462158203e-07, -3.9301812648773193e-07, -3.5390257835388184e-07, -3.1478703022003174e-07, -2.7567148208618164e-07, -2.3655593395233154e-07, -1.9744038581848145e-07, -1.5832483768463135e-07, -1.1920928955078125e-07, -8.009374141693115e-08, -4.0978193283081055e-08, -1.862645149230957e-09, 3.725290298461914e-08, 7.636845111846924e-08, 1.1548399925231934e-07, 1.5459954738616943e-07, 1.9371509552001953e-07, 2.3283064365386963e-07, 2.7194619178771973e-07, 3.110617399215698e-07, 3.501772880554199e-07, 3.8929283618927e-07, 4.284083843231201e-07, 4.675239324569702e-07, 5.066394805908203e-07, 5.457550287246704e-07, 5.848705768585205e-07, 6.239861249923706e-07, 6.631016731262207e-07, 7.022172212600708e-07, 7.413327693939209e-07, 7.80448317527771e-07, 8.195638656616211e-07, 8.586794137954712e-07, 8.977949619293213e-07, 9.369105100631714e-07, 9.760260581970215e-07, 1.0151416063308716e-06, 1.0542571544647217e-06, 1.0933727025985718e-06, 1.1324882507324219e-06]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 4.0, 4.0, 0.0, 6.0, 6.0, 6.0, 9.0, 2.0, 11.0, 13.0, 18.0, 16.0, 26.0, 35.0, 62.0, 80.0, 171.0, 372.0, 2182.0, 855843.0, 187524.0, 1440.0, 304.0, 142.0, 85.0, 52.0, 24.0, 21.0, 18.0, 18.0, 10.0, 9.0, 11.0, 6.0, 7.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.282857894897461e-05, -2.2038817405700684e-05, -2.1249055862426758e-05, -2.0459294319152832e-05, -1.9669532775878906e-05, -1.887977123260498e-05, -1.8090009689331055e-05, -1.730024814605713e-05, -1.6510486602783203e-05, -1.5720725059509277e-05, -1.4930963516235352e-05, -1.4141201972961426e-05, -1.33514404296875e-05, -1.2561678886413574e-05, -1.1771917343139648e-05, -1.0982155799865723e-05, -1.0192394256591797e-05, -9.402632713317871e-06, -8.612871170043945e-06, -7.82310962677002e-06, -7.033348083496094e-06, -6.243586540222168e-06, -5.453824996948242e-06, -4.664063453674316e-06, -3.874301910400391e-06, -3.084540367126465e-06, -2.294778823852539e-06, -1.5050172805786133e-06, -7.152557373046875e-07, 7.450580596923828e-08, 8.642673492431641e-07, 1.6540288925170898e-06, 2.4437904357910156e-06, 3.2335519790649414e-06, 4.023313522338867e-06, 4.813075065612793e-06, 5.602836608886719e-06, 6.3925981521606445e-06, 7.18235969543457e-06, 7.972121238708496e-06, 8.761882781982422e-06, 9.551644325256348e-06, 1.0341405868530273e-05, 1.11311674118042e-05, 1.1920928955078125e-05, 1.271069049835205e-05, 1.3500452041625977e-05, 1.4290213584899902e-05, 1.5079975128173828e-05, 1.5869736671447754e-05, 1.665949821472168e-05, 1.7449259757995605e-05, 1.823902130126953e-05, 1.9028782844543457e-05, 1.9818544387817383e-05, 2.060830593109131e-05, 2.1398067474365234e-05, 2.218782901763916e-05, 2.2977590560913086e-05, 2.3767352104187012e-05, 2.4557113647460938e-05, 2.5346875190734863e-05, 2.613663673400879e-05, 2.6926398277282715e-05, 2.771615982055664e-05]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 29.0, 433.0, 525.0, 28.0], "bins": [-1.2334198800090235e-05, -1.2135421457060147e-05, -1.193664411403006e-05, -1.1737867680494674e-05, -1.1539090337464586e-05, -1.1340312994434498e-05, -1.114153565140441e-05, -1.0942758308374323e-05, -1.0743980965344235e-05, -1.0545203622314148e-05, -1.034642627928406e-05, -1.0147648936253972e-05, -9.948872502718586e-06, -9.750095159688499e-06, -9.551317816658411e-06, -9.352540473628324e-06, -9.153764040092938e-06, -8.95498669706285e-06, -8.756209354032762e-06, -8.557432011002675e-06, -8.358655577467289e-06, -8.159878234437201e-06, -7.961100891407114e-06, -7.762323548377026e-06, -7.563546205346938e-06, -7.3647688623168506e-06, -7.165991974034114e-06, -6.967214631004026e-06, -6.7684372879739385e-06, -6.569660399691202e-06, -6.370883056661114e-06, -6.1721057136310264e-06, -5.97332882534829e-06, -5.774551482318202e-06, -5.575774594035465e-06, -5.376997251005378e-06, -5.17821990797529e-06, -4.979443019692553e-06, -4.7806656766624656e-06, -4.581888788379729e-06, -4.383111445349641e-06, -4.1843341023195535e-06, -3.985557214036817e-06, -3.786779871006729e-06, -3.588002755350317e-06, -3.3892256396939047e-06, -3.190448296663817e-06, -2.991671181007405e-06, -2.7928940653509926e-06, -2.5941169496945804e-06, -2.3953396066644927e-06, -2.1965624910080805e-06, -1.9977853753516683e-06, -1.7990081460084184e-06, -1.6002309166651685e-06, -1.4014538010087563e-06, -1.2026764579786686e-06, -1.0038992286354187e-06, -8.051221129790065e-07, -6.063448836357566e-07, -4.075677111359255e-07, -2.0879053863609442e-07, -1.0013309292844497e-08, 1.887638063635677e-07, 3.875410072851082e-07]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 9.0, 0.0, 0.0, 25.0, 0.0, 0.0, 53.0, 0.0, 0.0, 121.0, 0.0, 0.0, 184.0, 0.0, 0.0, 0.0, 253.0, 0.0, 0.0, 170.0, 0.0, 0.0, 103.0, 0.0, 0.0, 47.0, 0.0, 0.0, 23.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 7.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539062e-07, -5.774199962615967e-07, -5.587935447692871e-07, -5.401670932769775e-07, -5.21540641784668e-07, -5.029141902923584e-07, -4.842877388000488e-07, -4.6566128730773926e-07, -4.470348358154297e-07, -4.284083843231201e-07, -4.0978193283081055e-07, -3.91155481338501e-07, -3.725290298461914e-07, -3.5390257835388184e-07, -3.3527612686157227e-07, -3.166496753692627e-07, -2.980232238769531e-07, -2.7939677238464355e-07, -2.60770320892334e-07, -2.421438694000244e-07, -2.2351741790771484e-07, -2.0489096641540527e-07, -1.862645149230957e-07, -1.6763806343078613e-07, -1.4901161193847656e-07, -1.30385160446167e-07, -1.1175870895385742e-07, -9.313225746154785e-08, -7.450580596923828e-08, -5.587935447692871e-08, -3.725290298461914e-08, -1.862645149230957e-08, 0.0, 1.862645149230957e-08, 3.725290298461914e-08, 5.587935447692871e-08, 7.450580596923828e-08, 9.313225746154785e-08, 1.1175870895385742e-07, 1.30385160446167e-07, 1.4901161193847656e-07, 1.6763806343078613e-07, 1.862645149230957e-07, 2.0489096641540527e-07, 2.2351741790771484e-07, 2.421438694000244e-07, 2.60770320892334e-07, 2.7939677238464355e-07, 2.980232238769531e-07, 3.166496753692627e-07, 3.3527612686157227e-07, 3.5390257835388184e-07, 3.725290298461914e-07, 3.91155481338501e-07, 4.0978193283081055e-07, 4.284083843231201e-07, 4.470348358154297e-07, 4.6566128730773926e-07, 4.842877388000488e-07, 5.029141902923584e-07, 5.21540641784668e-07, 5.401670932769775e-07, 5.587935447692871e-07, 5.774199962615967e-07, 5.960464477539062e-07]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 8.0, 9.0, 17.0, 17.0, 13.0, 25.0, 18.0, 23.0, 22.0, 35.0, 33.0, 35.0, 49.0, 46.0, 43.0, 55.0, 54.0, 53.0, 53.0, 49.0, 40.0, 40.0, 42.0, 30.0, 36.0, 30.0, 21.0, 21.0, 17.0, 12.0, 16.0, 10.0, 6.0, 5.0, 3.0, 2.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.99609375, -2.88812255859375, -2.7801513671875, -2.67218017578125, -2.564208984375, -2.45623779296875, -2.3482666015625, -2.24029541015625, -2.13232421875, -2.02435302734375, -1.9163818359375, -1.80841064453125, -1.700439453125, -1.59246826171875, -1.4844970703125, -1.37652587890625, -1.2685546875, -1.16058349609375, -1.0526123046875, -0.94464111328125, -0.836669921875, -0.72869873046875, -0.6207275390625, -0.51275634765625, -0.40478515625, -0.29681396484375, -0.1888427734375, -0.08087158203125, 0.027099609375, 0.13507080078125, 0.2430419921875, 0.35101318359375, 0.458984375, 0.56695556640625, 0.6749267578125, 0.78289794921875, 0.890869140625, 0.99884033203125, 1.1068115234375, 1.21478271484375, 1.32275390625, 1.43072509765625, 1.5386962890625, 1.64666748046875, 1.754638671875, 1.86260986328125, 1.9705810546875, 2.07855224609375, 2.1865234375, 2.29449462890625, 2.4024658203125, 2.51043701171875, 2.618408203125, 2.72637939453125, 2.8343505859375, 2.94232177734375, 3.05029296875, 3.15826416015625, 3.2662353515625, 3.37420654296875, 3.482177734375, 3.59014892578125, 3.6981201171875, 3.80609130859375, 3.9140625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 8.0, 8.0, 15.0, 17.0, 20.0, 33.0, 37.0, 71.0, 87.0, 159.0, 241.0, 364.0, 513.0, 734.0, 1096.0, 1730.0, 2550.0, 4217.0, 6902.0, 11832.0, 21736.0, 44782.0, 101185.0, 246222.0, 322295.0, 150385.0, 63253.0, 29619.0, 15321.0, 8743.0, 5087.0, 3318.0, 2012.0, 1243.0, 921.0, 567.0, 403.0, 267.0, 191.0, 107.0, 83.0, 56.0, 41.0, 31.0, 17.0, 18.0, 8.0, 9.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.751953125, -3.639007568359375, -3.52606201171875, -3.413116455078125, -3.3001708984375, -3.187225341796875, -3.07427978515625, -2.961334228515625, -2.848388671875, -2.735443115234375, -2.62249755859375, -2.509552001953125, -2.3966064453125, -2.283660888671875, -2.17071533203125, -2.057769775390625, -1.94482421875, -1.831878662109375, -1.71893310546875, -1.605987548828125, -1.4930419921875, -1.380096435546875, -1.26715087890625, -1.154205322265625, -1.041259765625, -0.928314208984375, -0.81536865234375, -0.702423095703125, -0.5894775390625, -0.476531982421875, -0.36358642578125, -0.250640869140625, -0.1376953125, -0.024749755859375, 0.08819580078125, 0.201141357421875, 0.3140869140625, 0.427032470703125, 0.53997802734375, 0.652923583984375, 0.765869140625, 0.878814697265625, 0.99176025390625, 1.104705810546875, 1.2176513671875, 1.330596923828125, 1.44354248046875, 1.556488037109375, 1.66943359375, 1.782379150390625, 1.89532470703125, 2.008270263671875, 2.1212158203125, 2.234161376953125, 2.34710693359375, 2.460052490234375, 2.572998046875, 2.685943603515625, 2.79888916015625, 2.911834716796875, 3.0247802734375, 3.137725830078125, 3.25067138671875, 3.363616943359375, 3.4765625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 4.0, 8.0, 2.0, 8.0, 5.0, 13.0, 7.0, 12.0, 15.0, 12.0, 27.0, 22.0, 27.0, 27.0, 28.0, 34.0, 46.0, 40.0, 20.0, 56.0, 84.0, 139.0, 330.0, 1360.0, 195.0, 83.0, 55.0, 49.0, 42.0, 32.0, 32.0, 31.0, 33.0, 22.0, 21.0, 20.0, 17.0, 22.0, 6.0, 14.0, 9.0, 7.0, 6.0, 8.0, 8.0, 2.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5, -8.2352294921875, -7.970458984375, -7.7056884765625, -7.44091796875, -7.1761474609375, -6.911376953125, -6.6466064453125, -6.3818359375, -6.1170654296875, -5.852294921875, -5.5875244140625, -5.32275390625, -5.0579833984375, -4.793212890625, -4.5284423828125, -4.263671875, -3.9989013671875, -3.734130859375, -3.4693603515625, -3.20458984375, -2.9398193359375, -2.675048828125, -2.4102783203125, -2.1455078125, -1.8807373046875, -1.615966796875, -1.3511962890625, -1.08642578125, -0.8216552734375, -0.556884765625, -0.2921142578125, -0.02734375, 0.2374267578125, 0.502197265625, 0.7669677734375, 1.03173828125, 1.2965087890625, 1.561279296875, 1.8260498046875, 2.0908203125, 2.3555908203125, 2.620361328125, 2.8851318359375, 3.14990234375, 3.4146728515625, 3.679443359375, 3.9442138671875, 4.208984375, 4.4737548828125, 4.738525390625, 5.0032958984375, 5.26806640625, 5.5328369140625, 5.797607421875, 6.0623779296875, 6.3271484375, 6.5919189453125, 6.856689453125, 7.1214599609375, 7.38623046875, 7.6510009765625, 7.915771484375, 8.1805419921875, 8.4453125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 10.0, 6.0, 14.0, 14.0, 15.0, 26.0, 31.0, 28.0, 52.0, 60.0, 71.0, 84.0, 97.0, 165.0, 200.0, 289.0, 682.0, 1810.0, 6733.0, 50677.0, 2278920.0, 773761.0, 24600.0, 4405.0, 1302.0, 560.0, 282.0, 202.0, 135.0, 94.0, 92.0, 71.0, 48.0, 28.0, 34.0, 22.0, 24.0, 13.0, 13.0, 10.0, 4.0, 9.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.015625, -12.5797119140625, -12.143798828125, -11.7078857421875, -11.27197265625, -10.8360595703125, -10.400146484375, -9.9642333984375, -9.5283203125, -9.0924072265625, -8.656494140625, -8.2205810546875, -7.78466796875, -7.3487548828125, -6.912841796875, -6.4769287109375, -6.041015625, -5.6051025390625, -5.169189453125, -4.7332763671875, -4.29736328125, -3.8614501953125, -3.425537109375, -2.9896240234375, -2.5537109375, -2.1177978515625, -1.681884765625, -1.2459716796875, -0.81005859375, -0.3741455078125, 0.061767578125, 0.4976806640625, 0.93359375, 1.3695068359375, 1.805419921875, 2.2413330078125, 2.67724609375, 3.1131591796875, 3.549072265625, 3.9849853515625, 4.4208984375, 4.8568115234375, 5.292724609375, 5.7286376953125, 6.16455078125, 6.6004638671875, 7.036376953125, 7.4722900390625, 7.908203125, 8.3441162109375, 8.780029296875, 9.2159423828125, 9.65185546875, 10.0877685546875, 10.523681640625, 10.9595947265625, 11.3955078125, 11.8314208984375, 12.267333984375, 12.7032470703125, 13.13916015625, 13.5750732421875, 14.010986328125, 14.4468994140625, 14.8828125]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 52.0, 279.0, 531.0, 141.0, 8.0, 1.0, 1.0, 1.0], "bins": [-172.35409545898438, -169.39540100097656, -166.4366912841797, -163.47799682617188, -160.51930236816406, -157.56060791015625, -154.60189819335938, -151.64320373535156, -148.68450927734375, -145.72581481933594, -142.76710510253906, -139.80841064453125, -136.84971618652344, -133.89102172851562, -130.93231201171875, -127.97361755371094, -125.0149154663086, -122.05621337890625, -119.09751892089844, -116.1388168334961, -113.18012237548828, -110.22142028808594, -107.26272583007812, -104.30402374267578, -101.34532165527344, -98.3866195678711, -95.42792510986328, -92.46922302246094, -89.51052856445312, -86.55182647705078, -83.59312438964844, -80.63442993164062, -77.67574310302734, -74.717041015625, -71.75834655761719, -68.79964447021484, -65.84095001220703, -62.88224792480469, -59.92354965209961, -56.96485137939453, -54.00615310668945, -51.047454833984375, -48.0887565612793, -45.13005828857422, -42.171356201171875, -39.21266174316406, -36.25395965576172, -33.29526138305664, -30.336563110351562, -27.377864837646484, -24.419166564941406, -21.460466384887695, -18.501768112182617, -15.543069839477539, -12.584369659423828, -9.62567138671875, -6.666973114013672, -3.7082743644714355, -0.7495756149291992, 2.2091236114501953, 5.167821884155273, 8.126520156860352, 11.085220336914062, 14.04391860961914, 17.00261688232422]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 4.0, 0.0, 7.0, 12.0, 14.0, 19.0, 15.0, 22.0, 24.0, 17.0, 37.0, 36.0, 35.0, 33.0, 41.0, 52.0, 49.0, 59.0, 58.0, 43.0, 55.0, 47.0, 43.0, 41.0, 54.0, 28.0, 22.0, 20.0, 25.0, 22.0, 18.0, 13.0, 6.0, 3.0, 10.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-32.12200927734375, -31.067209243774414, -30.012407302856445, -28.95760726928711, -27.90280532836914, -26.848005294799805, -25.79320526123047, -24.7384033203125, -23.683603286743164, -22.628803253173828, -21.57400131225586, -20.519201278686523, -19.464401245117188, -18.40959930419922, -17.354799270629883, -16.299999237060547, -15.245197296142578, -14.190396308898926, -13.135595321655273, -12.080795288085938, -11.025994300842285, -9.971193313598633, -8.916393280029297, -7.8615922927856445, -6.806791305541992, -5.75199031829834, -4.697189807891846, -3.6423890590667725, -2.587588310241699, -1.5327873229980469, -0.47798681259155273, 0.5768136978149414, 1.6316146850585938, 2.686415433883667, 3.7412161827087402, 4.796016693115234, 5.850817680358887, 6.905618667602539, 7.960419178009033, 9.015219688415527, 10.07002067565918, 11.124821662902832, 12.179622650146484, 13.23442268371582, 14.289223670959473, 15.344024658203125, 16.39882469177246, 17.453624725341797, 18.508426666259766, 19.5632266998291, 20.61802864074707, 21.672828674316406, 22.727630615234375, 23.78243064880371, 24.837230682373047, 25.892032623291016, 26.94683265686035, 28.001632690429688, 29.056434631347656, 30.111234664916992, 31.166034698486328, 32.2208366394043, 33.275638580322266, 34.33043670654297, 35.38523864746094]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 8.0, 6.0, 8.0, 12.0, 24.0, 15.0, 19.0, 17.0, 27.0, 23.0, 26.0, 30.0, 41.0, 40.0, 54.0, 38.0, 43.0, 67.0, 46.0, 57.0, 45.0, 42.0, 45.0, 43.0, 30.0, 34.0, 33.0, 24.0, 20.0, 17.0, 19.0, 11.0, 9.0, 9.0, 4.0, 5.0, 2.0, 5.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.923828125, -2.815643310546875, -2.70745849609375, -2.599273681640625, -2.4910888671875, -2.382904052734375, -2.27471923828125, -2.166534423828125, -2.058349609375, -1.950164794921875, -1.84197998046875, -1.733795166015625, -1.6256103515625, -1.517425537109375, -1.40924072265625, -1.301055908203125, -1.19287109375, -1.084686279296875, -0.97650146484375, -0.868316650390625, -0.7601318359375, -0.651947021484375, -0.54376220703125, -0.435577392578125, -0.327392578125, -0.219207763671875, -0.11102294921875, -0.002838134765625, 0.1053466796875, 0.213531494140625, 0.32171630859375, 0.429901123046875, 0.5380859375, 0.646270751953125, 0.75445556640625, 0.862640380859375, 0.9708251953125, 1.079010009765625, 1.18719482421875, 1.295379638671875, 1.403564453125, 1.511749267578125, 1.61993408203125, 1.728118896484375, 1.8363037109375, 1.944488525390625, 2.05267333984375, 2.160858154296875, 2.26904296875, 2.377227783203125, 2.48541259765625, 2.593597412109375, 2.7017822265625, 2.809967041015625, 2.91815185546875, 3.026336669921875, 3.134521484375, 3.242706298828125, 3.35089111328125, 3.459075927734375, 3.5672607421875, 3.675445556640625, 3.78363037109375, 3.891815185546875, 4.0]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 9.0, 15.0, 7.0, 23.0, 17.0, 37.0, 41.0, 71.0, 98.0, 147.0, 206.0, 338.0, 566.0, 882.0, 1577.0, 2863.0, 5695.0, 11478.0, 25417.0, 63192.0, 184269.0, 640077.0, 1744201.0, 1055210.0, 295689.0, 94677.0, 36323.0, 15557.0, 7271.0, 3644.0, 1883.0, 1056.0, 598.0, 353.0, 240.0, 142.0, 125.0, 81.0, 55.0, 35.0, 25.0, 21.0, 20.0, 9.0, 11.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.55859375, -4.41009521484375, -4.2615966796875, -4.11309814453125, -3.964599609375, -3.81610107421875, -3.6676025390625, -3.51910400390625, -3.37060546875, -3.22210693359375, -3.0736083984375, -2.92510986328125, -2.776611328125, -2.62811279296875, -2.4796142578125, -2.33111572265625, -2.1826171875, -2.03411865234375, -1.8856201171875, -1.73712158203125, -1.588623046875, -1.44012451171875, -1.2916259765625, -1.14312744140625, -0.99462890625, -0.84613037109375, -0.6976318359375, -0.54913330078125, -0.400634765625, -0.25213623046875, -0.1036376953125, 0.04486083984375, 0.193359375, 0.34185791015625, 0.4903564453125, 0.63885498046875, 0.787353515625, 0.93585205078125, 1.0843505859375, 1.23284912109375, 1.38134765625, 1.52984619140625, 1.6783447265625, 1.82684326171875, 1.975341796875, 2.12384033203125, 2.2723388671875, 2.42083740234375, 2.5693359375, 2.71783447265625, 2.8663330078125, 3.01483154296875, 3.163330078125, 3.31182861328125, 3.4603271484375, 3.60882568359375, 3.75732421875, 3.90582275390625, 4.0543212890625, 4.20281982421875, 4.351318359375, 4.49981689453125, 4.6483154296875, 4.79681396484375, 4.9453125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 8.0, 14.0, 13.0, 14.0, 23.0, 37.0, 28.0, 47.0, 69.0, 98.0, 125.0, 168.0, 294.0, 353.0, 470.0, 527.0, 435.0, 357.0, 311.0, 208.0, 136.0, 90.0, 68.0, 60.0, 36.0, 28.0, 21.0, 11.0, 13.0, 4.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.25, -8.0465087890625, -7.843017578125, -7.6395263671875, -7.43603515625, -7.2325439453125, -7.029052734375, -6.8255615234375, -6.6220703125, -6.4185791015625, -6.215087890625, -6.0115966796875, -5.80810546875, -5.6046142578125, -5.401123046875, -5.1976318359375, -4.994140625, -4.7906494140625, -4.587158203125, -4.3836669921875, -4.18017578125, -3.9766845703125, -3.773193359375, -3.5697021484375, -3.3662109375, -3.1627197265625, -2.959228515625, -2.7557373046875, -2.55224609375, -2.3487548828125, -2.145263671875, -1.9417724609375, -1.73828125, -1.5347900390625, -1.331298828125, -1.1278076171875, -0.92431640625, -0.7208251953125, -0.517333984375, -0.3138427734375, -0.1103515625, 0.0931396484375, 0.296630859375, 0.5001220703125, 0.70361328125, 0.9071044921875, 1.110595703125, 1.3140869140625, 1.517578125, 1.7210693359375, 1.924560546875, 2.1280517578125, 2.33154296875, 2.5350341796875, 2.738525390625, 2.9420166015625, 3.1455078125, 3.3489990234375, 3.552490234375, 3.7559814453125, 3.95947265625, 4.1629638671875, 4.366455078125, 4.5699462890625, 4.7734375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 6.0, 11.0, 10.0, 19.0, 26.0, 28.0, 39.0, 58.0, 90.0, 133.0, 211.0, 345.0, 732.0, 2173.0, 13863.0, 228651.0, 3379683.0, 536788.0, 26129.0, 3224.0, 911.0, 418.0, 221.0, 152.0, 101.0, 71.0, 48.0, 39.0, 20.0, 21.0, 11.0, 18.0, 10.0, 9.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5859375, -15.0006103515625, -14.415283203125, -13.8299560546875, -13.24462890625, -12.6593017578125, -12.073974609375, -11.4886474609375, -10.9033203125, -10.3179931640625, -9.732666015625, -9.1473388671875, -8.56201171875, -7.9766845703125, -7.391357421875, -6.8060302734375, -6.220703125, -5.6353759765625, -5.050048828125, -4.4647216796875, -3.87939453125, -3.2940673828125, -2.708740234375, -2.1234130859375, -1.5380859375, -0.9527587890625, -0.367431640625, 0.2178955078125, 0.80322265625, 1.3885498046875, 1.973876953125, 2.5592041015625, 3.14453125, 3.7298583984375, 4.315185546875, 4.9005126953125, 5.48583984375, 6.0711669921875, 6.656494140625, 7.2418212890625, 7.8271484375, 8.4124755859375, 8.997802734375, 9.5831298828125, 10.16845703125, 10.7537841796875, 11.339111328125, 11.9244384765625, 12.509765625, 13.0950927734375, 13.680419921875, 14.2657470703125, 14.85107421875, 15.4364013671875, 16.021728515625, 16.6070556640625, 17.1923828125, 17.7777099609375, 18.363037109375, 18.9483642578125, 19.53369140625, 20.1190185546875, 20.704345703125, 21.2896728515625, 21.875]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 6.0, 10.0, 8.0, 20.0, 19.0, 31.0, 29.0, 44.0, 50.0, 72.0, 78.0, 98.0, 94.0, 79.0, 80.0, 69.0, 56.0, 40.0, 38.0, 26.0, 15.0, 16.0, 9.0, 5.0, 5.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.686321258544922, -15.83186149597168, -14.977402687072754, -14.122942924499512, -13.26848316192627, -12.414024353027344, -11.559564590454102, -10.70510482788086, -9.850645065307617, -8.996185302734375, -8.14172649383545, -7.287266731262207, -6.432806968688965, -5.578347682952881, -4.723888397216797, -3.8694286346435547, -3.014969825744629, -2.160510301589966, -1.3060508966445923, -0.45159149169921875, 0.40286803245544434, 1.2573275566101074, 2.1117868423461914, 2.9662466049194336, 3.8207058906555176, 4.675165176391602, 5.529624938964844, 6.384084224700928, 7.238543510437012, 8.093003273010254, 8.94746208190918, 9.801921844482422, 10.656381607055664, 11.510841369628906, 12.365300178527832, 13.219759941101074, 14.074219703674316, 14.928678512573242, 15.783138275146484, 16.637598037719727, 17.49205780029297, 18.34651756286621, 19.200977325439453, 20.055435180664062, 20.909894943237305, 21.764354705810547, 22.61881446838379, 23.47327423095703, 24.32773208618164, 25.182191848754883, 26.036651611328125, 26.891109466552734, 27.745569229125977, 28.60002899169922, 29.45448875427246, 30.308948516845703, 31.163408279418945, 32.01786804199219, 32.8723258972168, 33.72678756713867, 34.58124542236328, 35.435707092285156, 36.290164947509766, 37.144622802734375, 37.99908447265625]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 7.0, 5.0, 9.0, 11.0, 13.0, 10.0, 16.0, 20.0, 21.0, 17.0, 23.0, 28.0, 34.0, 36.0, 31.0, 31.0, 30.0, 41.0, 28.0, 45.0, 46.0, 52.0, 37.0, 45.0, 34.0, 30.0, 34.0, 32.0, 34.0, 30.0, 33.0, 28.0, 18.0, 12.0, 13.0, 17.0, 18.0, 6.0, 3.0, 4.0, 6.0, 1.0, 0.0, 7.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.021026611328125, -19.350439071655273, -18.679851531982422, -18.00926399230957, -17.33867645263672, -16.6680908203125, -15.997502326965332, -15.326915740966797, -14.656328201293945, -13.985740661621094, -13.315153121948242, -12.64456558227539, -11.973978996276855, -11.303391456604004, -10.632803916931152, -9.962217330932617, -9.29162883758545, -8.621041297912598, -7.950454235076904, -7.279866695404053, -6.609279632568359, -5.938692092895508, -5.268104553222656, -4.597517490386963, -3.9269299507141113, -3.256342649459839, -2.5857553482055664, -1.9151678085327148, -1.2445805072784424, -0.5739932060241699, 0.09659433364868164, 0.767181396484375, 1.4377689361572266, 2.108356237411499, 2.7789435386657715, 3.449531078338623, 4.120118141174316, 4.790705680847168, 5.4612932205200195, 6.131880283355713, 6.8024678230285645, 7.473055362701416, 8.14364242553711, 8.814229965209961, 9.484817504882812, 10.155405044555664, 10.825992584228516, 11.49657917022705, 12.167166709899902, 12.837754249572754, 13.508341789245605, 14.17892837524414, 14.849515914916992, 15.520103454589844, 16.190690994262695, 16.861278533935547, 17.5318660736084, 18.20245361328125, 18.8730411529541, 19.543628692626953, 20.214216232299805, 20.884803771972656, 21.555389404296875, 22.225976943969727, 22.896564483642578]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 6.0, 14.0, 10.0, 14.0, 18.0, 22.0, 24.0, 25.0, 32.0, 29.0, 34.0, 42.0, 43.0, 44.0, 56.0, 47.0, 58.0, 49.0, 64.0, 54.0, 46.0, 47.0, 35.0, 24.0, 28.0, 24.0, 32.0, 16.0, 13.0, 18.0, 9.0, 6.0, 3.0, 6.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.44921875, -3.3319091796875, -3.214599609375, -3.0972900390625, -2.97998046875, -2.8626708984375, -2.745361328125, -2.6280517578125, -2.5107421875, -2.3934326171875, -2.276123046875, -2.1588134765625, -2.04150390625, -1.9241943359375, -1.806884765625, -1.6895751953125, -1.572265625, -1.4549560546875, -1.337646484375, -1.2203369140625, -1.10302734375, -0.9857177734375, -0.868408203125, -0.7510986328125, -0.6337890625, -0.5164794921875, -0.399169921875, -0.2818603515625, -0.16455078125, -0.0472412109375, 0.070068359375, 0.1873779296875, 0.3046875, 0.4219970703125, 0.539306640625, 0.6566162109375, 0.77392578125, 0.8912353515625, 1.008544921875, 1.1258544921875, 1.2431640625, 1.3604736328125, 1.477783203125, 1.5950927734375, 1.71240234375, 1.8297119140625, 1.947021484375, 2.0643310546875, 2.181640625, 2.2989501953125, 2.416259765625, 2.5335693359375, 2.65087890625, 2.7681884765625, 2.885498046875, 3.0028076171875, 3.1201171875, 3.2374267578125, 3.354736328125, 3.4720458984375, 3.58935546875, 3.7066650390625, 3.823974609375, 3.9412841796875, 4.05859375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 9.0, 11.0, 10.0, 18.0, 26.0, 17.0, 35.0, 56.0, 98.0, 161.0, 262.0, 419.0, 598.0, 1030.0, 1714.0, 2666.0, 4668.0, 8363.0, 14584.0, 26489.0, 48453.0, 96082.0, 207880.0, 321786.0, 152113.0, 73483.0, 38716.0, 20793.0, 11528.0, 6626.0, 3949.0, 2281.0, 1377.0, 857.0, 491.0, 309.0, 172.0, 142.0, 105.0, 63.0, 50.0, 28.0, 15.0, 8.0, 6.0, 6.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0273895263671875, -0.02656722068786621, -0.025744915008544922, -0.024922609329223633, -0.024100303649902344, -0.023277997970581055, -0.022455692291259766, -0.021633386611938477, -0.020811080932617188, -0.0199887752532959, -0.01916646957397461, -0.01834416389465332, -0.01752185821533203, -0.016699552536010742, -0.015877246856689453, -0.015054941177368164, -0.014232635498046875, -0.013410329818725586, -0.012588024139404297, -0.011765718460083008, -0.010943412780761719, -0.01012110710144043, -0.00929880142211914, -0.008476495742797852, -0.0076541900634765625, -0.0068318843841552734, -0.006009578704833984, -0.005187273025512695, -0.004364967346191406, -0.003542661666870117, -0.002720355987548828, -0.001898050308227539, -0.00107574462890625, -0.00025343894958496094, 0.0005688667297363281, 0.0013911724090576172, 0.0022134780883789062, 0.0030357837677001953, 0.0038580894470214844, 0.0046803951263427734, 0.0055027008056640625, 0.0063250064849853516, 0.007147312164306641, 0.00796961784362793, 0.008791923522949219, 0.009614229202270508, 0.010436534881591797, 0.011258840560913086, 0.012081146240234375, 0.012903451919555664, 0.013725757598876953, 0.014548063278198242, 0.015370368957519531, 0.01619267463684082, 0.01701498031616211, 0.0178372859954834, 0.018659591674804688, 0.019481897354125977, 0.020304203033447266, 0.021126508712768555, 0.021948814392089844, 0.022771120071411133, 0.023593425750732422, 0.02441573143005371, 0.025238037109375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 3.0, 8.0, 6.0, 6.0, 9.0, 14.0, 17.0, 17.0, 20.0, 18.0, 27.0, 24.0, 33.0, 20.0, 26.0, 31.0, 33.0, 27.0, 41.0, 40.0, 36.0, 1060.0, 36.0, 34.0, 35.0, 44.0, 35.0, 37.0, 39.0, 28.0, 37.0, 26.0, 22.0, 19.0, 18.0, 17.0, 12.0, 11.0, 11.0, 10.0, 9.0, 6.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.193359375, -2.12420654296875, -2.0550537109375, -1.98590087890625, -1.916748046875, -1.84759521484375, -1.7784423828125, -1.70928955078125, -1.64013671875, -1.57098388671875, -1.5018310546875, -1.43267822265625, -1.363525390625, -1.29437255859375, -1.2252197265625, -1.15606689453125, -1.0869140625, -1.01776123046875, -0.9486083984375, -0.87945556640625, -0.810302734375, -0.74114990234375, -0.6719970703125, -0.60284423828125, -0.53369140625, -0.46453857421875, -0.3953857421875, -0.32623291015625, -0.257080078125, -0.18792724609375, -0.1187744140625, -0.04962158203125, 0.01953125, 0.08868408203125, 0.1578369140625, 0.22698974609375, 0.296142578125, 0.36529541015625, 0.4344482421875, 0.50360107421875, 0.57275390625, 0.64190673828125, 0.7110595703125, 0.78021240234375, 0.849365234375, 0.91851806640625, 0.9876708984375, 1.05682373046875, 1.1259765625, 1.19512939453125, 1.2642822265625, 1.33343505859375, 1.402587890625, 1.47174072265625, 1.5408935546875, 1.61004638671875, 1.67919921875, 1.74835205078125, 1.8175048828125, 1.88665771484375, 1.955810546875, 2.02496337890625, 2.0941162109375, 2.16326904296875, 2.232421875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 7.0, 7.0, 11.0, 17.0, 21.0, 31.0, 44.0, 78.0, 87.0, 134.0, 206.0, 280.0, 419.0, 617.0, 861.0, 1316.0, 1969.0, 2854.0, 4377.0, 6599.0, 10199.0, 15397.0, 23936.0, 36372.0, 56493.0, 88011.0, 140622.0, 1249659.0, 164833.0, 102920.0, 65708.0, 42585.0, 27834.0, 17920.0, 11655.0, 7626.0, 5153.0, 3350.0, 2236.0, 1492.0, 994.0, 686.0, 469.0, 326.0, 226.0, 162.0, 105.0, 63.0, 59.0, 34.0, 22.0, 18.0, 16.0, 9.0, 5.0, 5.0, 4.0, 0.0, 2.0, 1.0], "bins": [-0.00811767578125, -0.00786137580871582, -0.007605075836181641, -0.007348775863647461, -0.007092475891113281, -0.0068361759185791016, -0.006579875946044922, -0.006323575973510742, -0.0060672760009765625, -0.005810976028442383, -0.005554676055908203, -0.0052983760833740234, -0.005042076110839844, -0.004785776138305664, -0.004529476165771484, -0.004273176193237305, -0.004016876220703125, -0.0037605762481689453, -0.0035042762756347656, -0.003247976303100586, -0.0029916763305664062, -0.0027353763580322266, -0.002479076385498047, -0.002222776412963867, -0.0019664764404296875, -0.0017101764678955078, -0.0014538764953613281, -0.0011975765228271484, -0.0009412765502929688, -0.0006849765777587891, -0.0004286766052246094, -0.0001723766326904297, 8.392333984375e-05, 0.0003402233123779297, 0.0005965232849121094, 0.0008528232574462891, 0.0011091232299804688, 0.0013654232025146484, 0.0016217231750488281, 0.0018780231475830078, 0.0021343231201171875, 0.002390623092651367, 0.002646923065185547, 0.0029032230377197266, 0.0031595230102539062, 0.003415822982788086, 0.0036721229553222656, 0.003928422927856445, 0.004184722900390625, 0.004441022872924805, 0.004697322845458984, 0.004953622817993164, 0.005209922790527344, 0.0054662227630615234, 0.005722522735595703, 0.005978822708129883, 0.0062351226806640625, 0.006491422653198242, 0.006747722625732422, 0.0070040225982666016, 0.007260322570800781, 0.007516622543334961, 0.007772922515869141, 0.00802922248840332, 0.0082855224609375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 2.0, 6.0, 0.0, 5.0, 11.0, 9.0, 5.0, 0.0, 11.0, 15.0, 7.0, 0.0, 12.0, 8.0, 30.0, 0.0, 32.0, 45.0, 65.0, 0.0, 142.0, 220.0, 124.0, 73.0, 0.0, 39.0, 28.0, 19.0, 0.0, 16.0, 10.0, 12.0, 0.0, 10.0, 12.0, 8.0, 0.0, 9.0, 3.0, 6.0, 10.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.430511474609375e-06, -1.3848766684532166e-06, -1.339241862297058e-06, -1.2936070561408997e-06, -1.2479722499847412e-06, -1.2023374438285828e-06, -1.1567026376724243e-06, -1.1110678315162659e-06, -1.0654330253601074e-06, -1.019798219203949e-06, -9.741634130477905e-07, -9.285286068916321e-07, -8.828938007354736e-07, -8.372589945793152e-07, -7.916241884231567e-07, -7.459893822669983e-07, -7.003545761108398e-07, -6.547197699546814e-07, -6.09084963798523e-07, -5.634501576423645e-07, -5.178153514862061e-07, -4.721805453300476e-07, -4.2654573917388916e-07, -3.809109330177307e-07, -3.3527612686157227e-07, -2.896413207054138e-07, -2.4400651454925537e-07, -1.9837170839309692e-07, -1.5273690223693848e-07, -1.0710209608078003e-07, -6.146728992462158e-08, -1.5832483768463135e-08, 2.9802322387695312e-08, 7.543712854385376e-08, 1.210719347000122e-07, 1.6670674085617065e-07, 2.123415470123291e-07, 2.5797635316848755e-07, 3.03611159324646e-07, 3.4924596548080444e-07, 3.948807716369629e-07, 4.4051557779312134e-07, 4.861503839492798e-07, 5.317851901054382e-07, 5.774199962615967e-07, 6.230548024177551e-07, 6.686896085739136e-07, 7.14324414730072e-07, 7.599592208862305e-07, 8.055940270423889e-07, 8.512288331985474e-07, 8.968636393547058e-07, 9.424984455108643e-07, 9.881332516670227e-07, 1.0337680578231812e-06, 1.0794028639793396e-06, 1.125037670135498e-06, 1.1706724762916565e-06, 1.216307282447815e-06, 1.2619420886039734e-06, 1.3075768947601318e-06, 1.3532117009162903e-06, 1.3988465070724487e-06, 1.4444813132286072e-06, 1.4901161193847656e-06]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 6.0, 2.0, 9.0, 3.0, 7.0, 7.0, 13.0, 7.0, 11.0, 14.0, 13.0, 32.0, 40.0, 73.0, 143.0, 264.0, 788.0, 75989.0, 967226.0, 2988.0, 393.0, 187.0, 123.0, 51.0, 40.0, 20.0, 19.0, 10.0, 8.0, 6.0, 9.0, 9.0, 2.0, 5.0, 6.0, 12.0, 4.0, 3.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0219554901123047e-05, -2.928171306848526e-05, -2.8343871235847473e-05, -2.7406029403209686e-05, -2.64681875705719e-05, -2.5530345737934113e-05, -2.4592503905296326e-05, -2.365466207265854e-05, -2.2716820240020752e-05, -2.1778978407382965e-05, -2.0841136574745178e-05, -1.990329474210739e-05, -1.8965452909469604e-05, -1.8027611076831818e-05, -1.708976924419403e-05, -1.6151927411556244e-05, -1.5214085578918457e-05, -1.427624374628067e-05, -1.3338401913642883e-05, -1.2400560081005096e-05, -1.146271824836731e-05, -1.0524876415729523e-05, -9.587034583091736e-06, -8.649192750453949e-06, -7.711350917816162e-06, -6.773509085178375e-06, -5.835667252540588e-06, -4.8978254199028015e-06, -3.959983587265015e-06, -3.0221417546272278e-06, -2.084299921989441e-06, -1.146458089351654e-06, -2.086162567138672e-07, 7.292255759239197e-07, 1.6670674085617065e-06, 2.6049092411994934e-06, 3.5427510738372803e-06, 4.480592906475067e-06, 5.418434739112854e-06, 6.356276571750641e-06, 7.294118404388428e-06, 8.231960237026215e-06, 9.169802069664001e-06, 1.0107643902301788e-05, 1.1045485734939575e-05, 1.1983327567577362e-05, 1.2921169400215149e-05, 1.3859011232852936e-05, 1.4796853065490723e-05, 1.573469489812851e-05, 1.6672536730766296e-05, 1.7610378563404083e-05, 1.854822039604187e-05, 1.9486062228679657e-05, 2.0423904061317444e-05, 2.136174589395523e-05, 2.2299587726593018e-05, 2.3237429559230804e-05, 2.417527139186859e-05, 2.5113113224506378e-05, 2.6050955057144165e-05, 2.6988796889781952e-05, 2.792663872241974e-05, 2.8864480555057526e-05, 2.9802322387695312e-05]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 74.0, 905.0, 38.0, 1.0], "bins": [-2.0190791474306025e-05, -1.9862396584358066e-05, -1.9534001694410108e-05, -1.920560680446215e-05, -1.887721191451419e-05, -1.8548817024566233e-05, -1.822042031562887e-05, -1.7892025425680913e-05, -1.7563630535732955e-05, -1.7235235645784996e-05, -1.6906840755837038e-05, -1.657844586588908e-05, -1.625005097594112e-05, -1.592165426700376e-05, -1.5593261196045205e-05, -1.5264864487107843e-05, -1.4936470506654587e-05, -1.4608075616706628e-05, -1.427968072675867e-05, -1.395128492731601e-05, -1.3622890037368052e-05, -1.3294495147420093e-05, -1.2966100257472135e-05, -1.2637705367524177e-05, -1.2309310477576219e-05, -1.198091558762826e-05, -1.1652520697680302e-05, -1.1324125807732344e-05, -1.0995730008289684e-05, -1.0667335118341725e-05, -1.0338940228393767e-05, -1.0010545338445809e-05, -9.68215044849785e-06, -9.353755558549892e-06, -9.025360668601934e-06, -8.696964869159274e-06, -8.368569979211316e-06, -8.040175089263357e-06, -7.711780199315399e-06, -7.383385309367441e-06, -7.054989509924781e-06, -6.726594619976822e-06, -6.398199275281513e-06, -6.069804385333555e-06, -5.741409040638246e-06, -5.413014150690287e-06, -5.084619260742329e-06, -4.756224370794371e-06, -4.427829026099062e-06, -4.099434136151103e-06, -3.771038791455794e-06, -3.442643901507836e-06, -3.114248784186202e-06, -2.7858536668645684e-06, -2.45745877691661e-06, -2.1290636595949763e-06, -1.800668769647018e-06, -1.4722736523253843e-06, -1.1438786486905883e-06, -8.154836450557923e-07, -4.870885277341586e-07, -1.5869341041252483e-07, 1.6970147953543346e-07, 4.980965968570672e-07, 8.264917710221198e-07]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 9.0, 0.0, 9.0, 0.0, 0.0, 8.0, 0.0, 24.0, 0.0, 0.0, 28.0, 0.0, 56.0, 0.0, 0.0, 118.0, 0.0, 135.0, 0.0, 0.0, 217.0, 0.0, 145.0, 0.0, 0.0, 102.0, 0.0, 63.0, 0.0, 44.0, 0.0, 0.0, 26.0, 0.0, 9.0, 0.0, 0.0, 4.0, 0.0, 9.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.556510925292969e-07, -6.314367055892944e-07, -6.07222318649292e-07, -5.830079317092896e-07, -5.587935447692871e-07, -5.345791578292847e-07, -5.103647708892822e-07, -4.861503839492798e-07, -4.6193599700927734e-07, -4.377216100692749e-07, -4.1350722312927246e-07, -3.8929283618927e-07, -3.650784492492676e-07, -3.4086406230926514e-07, -3.166496753692627e-07, -2.9243528842926025e-07, -2.682209014892578e-07, -2.4400651454925537e-07, -2.1979212760925293e-07, -1.955777406692505e-07, -1.7136335372924805e-07, -1.471489667892456e-07, -1.2293457984924316e-07, -9.872019290924072e-08, -7.450580596923828e-08, -5.029141902923584e-08, -2.60770320892334e-08, -1.862645149230957e-09, 2.2351741790771484e-08, 4.6566128730773926e-08, 7.078051567077637e-08, 9.499490261077881e-08, 1.1920928955078125e-07, 1.434236764907837e-07, 1.6763806343078613e-07, 1.9185245037078857e-07, 2.1606683731079102e-07, 2.4028122425079346e-07, 2.644956111907959e-07, 2.8870999813079834e-07, 3.129243850708008e-07, 3.371387720108032e-07, 3.6135315895080566e-07, 3.855675458908081e-07, 4.0978193283081055e-07, 4.33996319770813e-07, 4.5821070671081543e-07, 4.824250936508179e-07, 5.066394805908203e-07, 5.308538675308228e-07, 5.550682544708252e-07, 5.792826414108276e-07, 6.034970283508301e-07, 6.277114152908325e-07, 6.51925802230835e-07, 6.761401891708374e-07, 7.003545761108398e-07, 7.245689630508423e-07, 7.487833499908447e-07, 7.729977369308472e-07, 7.972121238708496e-07, 8.21426510810852e-07, 8.456408977508545e-07, 8.698552846908569e-07, 8.940696716308594e-07]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 6.0, 14.0, 10.0, 14.0, 18.0, 22.0, 24.0, 25.0, 32.0, 29.0, 34.0, 42.0, 43.0, 44.0, 56.0, 47.0, 58.0, 49.0, 64.0, 54.0, 46.0, 47.0, 35.0, 24.0, 28.0, 24.0, 32.0, 16.0, 13.0, 18.0, 9.0, 6.0, 3.0, 6.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.44921875, -3.3319091796875, -3.214599609375, -3.0972900390625, -2.97998046875, -2.8626708984375, -2.745361328125, -2.6280517578125, -2.5107421875, -2.3934326171875, -2.276123046875, -2.1588134765625, -2.04150390625, -1.9241943359375, -1.806884765625, -1.6895751953125, -1.572265625, -1.4549560546875, -1.337646484375, -1.2203369140625, -1.10302734375, -0.9857177734375, -0.868408203125, -0.7510986328125, -0.6337890625, -0.5164794921875, -0.399169921875, -0.2818603515625, -0.16455078125, -0.0472412109375, 0.070068359375, 0.1873779296875, 0.3046875, 0.4219970703125, 0.539306640625, 0.6566162109375, 0.77392578125, 0.8912353515625, 1.008544921875, 1.1258544921875, 1.2431640625, 1.3604736328125, 1.477783203125, 1.5950927734375, 1.71240234375, 1.8297119140625, 1.947021484375, 2.0643310546875, 2.181640625, 2.2989501953125, 2.416259765625, 2.5335693359375, 2.65087890625, 2.7681884765625, 2.885498046875, 3.0028076171875, 3.1201171875, 3.2374267578125, 3.354736328125, 3.4720458984375, 3.58935546875, 3.7066650390625, 3.823974609375, 3.9412841796875, 4.05859375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 8.0, 5.0, 15.0, 10.0, 16.0, 26.0, 32.0, 45.0, 69.0, 92.0, 140.0, 191.0, 300.0, 399.0, 554.0, 844.0, 1158.0, 1669.0, 2348.0, 3672.0, 5827.0, 10050.0, 18897.0, 40409.0, 94434.0, 238008.0, 356344.0, 148276.0, 61579.0, 27751.0, 13649.0, 7614.0, 4629.0, 2964.0, 1931.0, 1351.0, 1006.0, 644.0, 464.0, 333.0, 231.0, 175.0, 141.0, 81.0, 59.0, 43.0, 28.0, 19.0, 6.0, 12.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.12890625, -3.025482177734375, -2.92205810546875, -2.818634033203125, -2.7152099609375, -2.611785888671875, -2.50836181640625, -2.404937744140625, -2.301513671875, -2.198089599609375, -2.09466552734375, -1.991241455078125, -1.8878173828125, -1.784393310546875, -1.68096923828125, -1.577545166015625, -1.47412109375, -1.370697021484375, -1.26727294921875, -1.163848876953125, -1.0604248046875, -0.957000732421875, -0.85357666015625, -0.750152587890625, -0.646728515625, -0.543304443359375, -0.43988037109375, -0.336456298828125, -0.2330322265625, -0.129608154296875, -0.02618408203125, 0.077239990234375, 0.1806640625, 0.284088134765625, 0.38751220703125, 0.490936279296875, 0.5943603515625, 0.697784423828125, 0.80120849609375, 0.904632568359375, 1.008056640625, 1.111480712890625, 1.21490478515625, 1.318328857421875, 1.4217529296875, 1.525177001953125, 1.62860107421875, 1.732025146484375, 1.83544921875, 1.938873291015625, 2.04229736328125, 2.145721435546875, 2.2491455078125, 2.352569580078125, 2.45599365234375, 2.559417724609375, 2.662841796875, 2.766265869140625, 2.86968994140625, 2.973114013671875, 3.0765380859375, 3.179962158203125, 3.28338623046875, 3.386810302734375, 3.490234375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 3.0, 13.0, 9.0, 13.0, 10.0, 21.0, 19.0, 19.0, 27.0, 37.0, 42.0, 46.0, 50.0, 68.0, 115.0, 223.0, 1547.0, 278.0, 110.0, 59.0, 54.0, 46.0, 40.0, 35.0, 37.0, 28.0, 22.0, 20.0, 11.0, 14.0, 6.0, 13.0, 4.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6328125, -10.260986328125, -9.88916015625, -9.517333984375, -9.1455078125, -8.773681640625, -8.40185546875, -8.030029296875, -7.658203125, -7.286376953125, -6.91455078125, -6.542724609375, -6.1708984375, -5.799072265625, -5.42724609375, -5.055419921875, -4.68359375, -4.311767578125, -3.93994140625, -3.568115234375, -3.1962890625, -2.824462890625, -2.45263671875, -2.080810546875, -1.708984375, -1.337158203125, -0.96533203125, -0.593505859375, -0.2216796875, 0.150146484375, 0.52197265625, 0.893798828125, 1.265625, 1.637451171875, 2.00927734375, 2.381103515625, 2.7529296875, 3.124755859375, 3.49658203125, 3.868408203125, 4.240234375, 4.612060546875, 4.98388671875, 5.355712890625, 5.7275390625, 6.099365234375, 6.47119140625, 6.843017578125, 7.21484375, 7.586669921875, 7.95849609375, 8.330322265625, 8.7021484375, 9.073974609375, 9.44580078125, 9.817626953125, 10.189453125, 10.561279296875, 10.93310546875, 11.304931640625, 11.6767578125, 12.048583984375, 12.42041015625, 12.792236328125, 13.1640625]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 4.0, 2.0, 6.0, 13.0, 14.0, 20.0, 30.0, 37.0, 50.0, 77.0, 122.0, 185.0, 302.0, 698.0, 2484.0, 18169.0, 2705061.0, 407408.0, 8242.0, 1570.0, 478.0, 252.0, 159.0, 95.0, 59.0, 40.0, 29.0, 30.0, 19.0, 16.0, 9.0, 6.0, 8.0, 1.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.40625, -19.744384765625, -19.08251953125, -18.420654296875, -17.7587890625, -17.096923828125, -16.43505859375, -15.773193359375, -15.111328125, -14.449462890625, -13.78759765625, -13.125732421875, -12.4638671875, -11.802001953125, -11.14013671875, -10.478271484375, -9.81640625, -9.154541015625, -8.49267578125, -7.830810546875, -7.1689453125, -6.507080078125, -5.84521484375, -5.183349609375, -4.521484375, -3.859619140625, -3.19775390625, -2.535888671875, -1.8740234375, -1.212158203125, -0.55029296875, 0.111572265625, 0.7734375, 1.435302734375, 2.09716796875, 2.759033203125, 3.4208984375, 4.082763671875, 4.74462890625, 5.406494140625, 6.068359375, 6.730224609375, 7.39208984375, 8.053955078125, 8.7158203125, 9.377685546875, 10.03955078125, 10.701416015625, 11.36328125, 12.025146484375, 12.68701171875, 13.348876953125, 14.0107421875, 14.672607421875, 15.33447265625, 15.996337890625, 16.658203125, 17.320068359375, 17.98193359375, 18.643798828125, 19.3056640625, 19.967529296875, 20.62939453125, 21.291259765625, 21.953125]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 329.0, 688.0], "bins": [-439.1383972167969, -432.17840576171875, -425.2184143066406, -418.2584228515625, -411.2984619140625, -404.3384704589844, -397.37847900390625, -390.4184875488281, -383.45849609375, -376.4985046386719, -369.53851318359375, -362.57855224609375, -355.6185607910156, -348.6585693359375, -341.6985778808594, -334.73858642578125, -327.77862548828125, -320.8186340332031, -313.858642578125, -306.898681640625, -299.9386901855469, -292.97869873046875, -286.0187072753906, -279.0587158203125, -272.0987243652344, -265.13873291015625, -258.1787414550781, -251.21876525878906, -244.25877380371094, -237.29879760742188, -230.33880615234375, -223.37881469726562, -216.41883850097656, -209.45884704589844, -202.49887084960938, -195.53887939453125, -188.57888793945312, -181.618896484375, -174.65892028808594, -167.6989288330078, -160.7389373779297, -153.77894592285156, -146.8189697265625, -139.85897827148438, -132.89898681640625, -125.93900299072266, -118.97901916503906, -112.01902770996094, -105.05905151367188, -98.09906768798828, -91.13907623291016, -84.17909240722656, -77.21910095214844, -70.25911712646484, -63.29913330078125, -56.33914566040039, -49.37915802001953, -42.41917037963867, -35.45918273925781, -28.49919891357422, -21.53921127319336, -14.5792236328125, -7.619239807128906, -0.6592521667480469, 6.300736904144287]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 4.0, 7.0, 5.0, 7.0, 10.0, 12.0, 21.0, 22.0, 25.0, 16.0, 24.0, 22.0, 34.0, 26.0, 34.0, 48.0, 43.0, 42.0, 53.0, 42.0, 43.0, 60.0, 38.0, 42.0, 38.0, 36.0, 39.0, 31.0, 29.0, 26.0, 22.0, 21.0, 12.0, 16.0, 12.0, 10.0, 10.0, 4.0, 5.0, 8.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.695337295532227, -28.728042602539062, -27.760746002197266, -26.79344940185547, -25.826154708862305, -24.85886001586914, -23.891563415527344, -22.924266815185547, -21.956972122192383, -20.98967742919922, -20.022380828857422, -19.055084228515625, -18.08778953552246, -17.120494842529297, -16.1531982421875, -15.18590259552002, -14.218606948852539, -13.251311302185059, -12.284015655517578, -11.316720008850098, -10.349424362182617, -9.382128715515137, -8.414833068847656, -7.447537422180176, -6.480241775512695, -5.512946128845215, -4.545650482177734, -3.578354835510254, -2.6110591888427734, -1.643763542175293, -0.6764678955078125, 0.29082775115966797, 1.2581253051757812, 2.2254209518432617, 3.192716598510742, 4.160012245178223, 5.127307891845703, 6.094603538513184, 7.061899185180664, 8.029194831848145, 8.996490478515625, 9.963786125183105, 10.931081771850586, 11.898377418518066, 12.865673065185547, 13.832968711853027, 14.800264358520508, 15.767560005187988, 16.73485565185547, 17.702152252197266, 18.66944694519043, 19.636741638183594, 20.60403823852539, 21.571334838867188, 22.53862953186035, 23.505924224853516, 24.473220825195312, 25.44051742553711, 26.407812118530273, 27.375106811523438, 28.342403411865234, 29.30970001220703, 30.276994705200195, 31.24428939819336, 32.211585998535156]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 10.0, 9.0, 14.0, 11.0, 21.0, 24.0, 30.0, 37.0, 32.0, 41.0, 35.0, 51.0, 50.0, 54.0, 41.0, 54.0, 63.0, 61.0, 55.0, 46.0, 37.0, 44.0, 27.0, 30.0, 26.0, 23.0, 16.0, 17.0, 12.0, 6.0, 7.0, 3.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.751953125, -3.628204345703125, -3.50445556640625, -3.380706787109375, -3.2569580078125, -3.133209228515625, -3.00946044921875, -2.885711669921875, -2.761962890625, -2.638214111328125, -2.51446533203125, -2.390716552734375, -2.2669677734375, -2.143218994140625, -2.01947021484375, -1.895721435546875, -1.77197265625, -1.648223876953125, -1.52447509765625, -1.400726318359375, -1.2769775390625, -1.153228759765625, -1.02947998046875, -0.905731201171875, -0.781982421875, -0.658233642578125, -0.53448486328125, -0.410736083984375, -0.2869873046875, -0.163238525390625, -0.03948974609375, 0.084259033203125, 0.2080078125, 0.331756591796875, 0.45550537109375, 0.579254150390625, 0.7030029296875, 0.826751708984375, 0.95050048828125, 1.074249267578125, 1.197998046875, 1.321746826171875, 1.44549560546875, 1.569244384765625, 1.6929931640625, 1.816741943359375, 1.94049072265625, 2.064239501953125, 2.18798828125, 2.311737060546875, 2.43548583984375, 2.559234619140625, 2.6829833984375, 2.806732177734375, 2.93048095703125, 3.054229736328125, 3.177978515625, 3.301727294921875, 3.42547607421875, 3.549224853515625, 3.6729736328125, 3.796722412109375, 3.92047119140625, 4.044219970703125, 4.16796875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 4.0, 4.0, 3.0, 6.0, 6.0, 11.0, 22.0, 28.0, 35.0, 52.0, 60.0, 92.0, 155.0, 249.0, 409.0, 639.0, 1094.0, 2062.0, 4024.0, 8969.0, 22586.0, 66099.0, 239046.0, 1041899.0, 1971188.0, 614388.0, 147739.0, 44116.0, 15903.0, 6488.0, 3049.0, 1554.0, 864.0, 519.0, 328.0, 183.0, 130.0, 81.0, 51.0, 52.0, 22.0, 28.0, 10.0, 12.0, 7.0, 2.0, 8.0, 5.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.05859375, -5.87677001953125, -5.6949462890625, -5.51312255859375, -5.331298828125, -5.14947509765625, -4.9676513671875, -4.78582763671875, -4.60400390625, -4.42218017578125, -4.2403564453125, -4.05853271484375, -3.876708984375, -3.69488525390625, -3.5130615234375, -3.33123779296875, -3.1494140625, -2.96759033203125, -2.7857666015625, -2.60394287109375, -2.422119140625, -2.24029541015625, -2.0584716796875, -1.87664794921875, -1.69482421875, -1.51300048828125, -1.3311767578125, -1.14935302734375, -0.967529296875, -0.78570556640625, -0.6038818359375, -0.42205810546875, -0.240234375, -0.05841064453125, 0.1234130859375, 0.30523681640625, 0.487060546875, 0.66888427734375, 0.8507080078125, 1.03253173828125, 1.21435546875, 1.39617919921875, 1.5780029296875, 1.75982666015625, 1.941650390625, 2.12347412109375, 2.3052978515625, 2.48712158203125, 2.6689453125, 2.85076904296875, 3.0325927734375, 3.21441650390625, 3.396240234375, 3.57806396484375, 3.7598876953125, 3.94171142578125, 4.12353515625, 4.30535888671875, 4.4871826171875, 4.66900634765625, 4.850830078125, 5.03265380859375, 5.2144775390625, 5.39630126953125, 5.578125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 6.0, 5.0, 9.0, 11.0, 18.0, 12.0, 26.0, 35.0, 36.0, 43.0, 66.0, 63.0, 115.0, 130.0, 174.0, 227.0, 250.0, 322.0, 401.0, 399.0, 346.0, 284.0, 247.0, 189.0, 160.0, 117.0, 95.0, 70.0, 52.0, 41.0, 30.0, 19.0, 24.0, 15.0, 10.0, 8.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.28515625, -6.1162109375, -5.947265625, -5.7783203125, -5.609375, -5.4404296875, -5.271484375, -5.1025390625, -4.93359375, -4.7646484375, -4.595703125, -4.4267578125, -4.2578125, -4.0888671875, -3.919921875, -3.7509765625, -3.58203125, -3.4130859375, -3.244140625, -3.0751953125, -2.90625, -2.7373046875, -2.568359375, -2.3994140625, -2.23046875, -2.0615234375, -1.892578125, -1.7236328125, -1.5546875, -1.3857421875, -1.216796875, -1.0478515625, -0.87890625, -0.7099609375, -0.541015625, -0.3720703125, -0.203125, -0.0341796875, 0.134765625, 0.3037109375, 0.47265625, 0.6416015625, 0.810546875, 0.9794921875, 1.1484375, 1.3173828125, 1.486328125, 1.6552734375, 1.82421875, 1.9931640625, 2.162109375, 2.3310546875, 2.5, 2.6689453125, 2.837890625, 3.0068359375, 3.17578125, 3.3447265625, 3.513671875, 3.6826171875, 3.8515625, 4.0205078125, 4.189453125, 4.3583984375, 4.52734375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 11.0, 13.0, 19.0, 15.0, 28.0, 30.0, 39.0, 57.0, 70.0, 115.0, 157.0, 194.0, 385.0, 947.0, 5814.0, 121376.0, 3559243.0, 488899.0, 13935.0, 1604.0, 439.0, 254.0, 156.0, 119.0, 72.0, 64.0, 48.0, 40.0, 35.0, 21.0, 21.0, 11.0, 12.0, 6.0, 6.0, 4.0, 2.0, 5.0, 4.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.015625, -18.27490234375, -17.5341796875, -16.79345703125, -16.052734375, -15.31201171875, -14.5712890625, -13.83056640625, -13.08984375, -12.34912109375, -11.6083984375, -10.86767578125, -10.126953125, -9.38623046875, -8.6455078125, -7.90478515625, -7.1640625, -6.42333984375, -5.6826171875, -4.94189453125, -4.201171875, -3.46044921875, -2.7197265625, -1.97900390625, -1.23828125, -0.49755859375, 0.2431640625, 0.98388671875, 1.724609375, 2.46533203125, 3.2060546875, 3.94677734375, 4.6875, 5.42822265625, 6.1689453125, 6.90966796875, 7.650390625, 8.39111328125, 9.1318359375, 9.87255859375, 10.61328125, 11.35400390625, 12.0947265625, 12.83544921875, 13.576171875, 14.31689453125, 15.0576171875, 15.79833984375, 16.5390625, 17.27978515625, 18.0205078125, 18.76123046875, 19.501953125, 20.24267578125, 20.9833984375, 21.72412109375, 22.46484375, 23.20556640625, 23.9462890625, 24.68701171875, 25.427734375, 26.16845703125, 26.9091796875, 27.64990234375, 28.390625]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 8.0, 10.0, 7.0, 21.0, 34.0, 70.0, 67.0, 81.0, 97.0, 127.0, 116.0, 107.0, 84.0, 62.0, 44.0, 29.0, 22.0, 17.0, 8.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.76214027404785, -21.62501335144043, -20.487886428833008, -19.350759506225586, -18.213634490966797, -17.076507568359375, -15.939380645751953, -14.802253723144531, -13.66512680053711, -12.527999877929688, -11.390872955322266, -10.25374698638916, -9.116620063781738, -7.979493141174316, -6.842366695404053, -5.705240249633789, -4.568113327026367, -3.4309866428375244, -2.2938599586486816, -1.1567332744598389, -0.019606590270996094, 1.1175203323364258, 2.2546467781066895, 3.391773223876953, 4.528900146484375, 5.666027069091797, 6.8031535148620605, 7.940279960632324, 9.077406883239746, 10.214533805847168, 11.351659774780273, 12.488786697387695, 13.625911712646484, 14.763038635253906, 15.900165557861328, 17.03729248046875, 18.174419403076172, 19.311546325683594, 20.448671340942383, 21.585798263549805, 22.722925186157227, 23.86005210876465, 24.99717903137207, 26.134305953979492, 27.27143096923828, 28.408557891845703, 29.545684814453125, 30.682811737060547, 31.81993865966797, 32.95706558227539, 34.09419250488281, 35.231319427490234, 36.368446350097656, 37.50557327270508, 38.6427001953125, 39.779823303222656, 40.916954040527344, 42.054080963134766, 43.19120788574219, 44.32833480834961, 45.46546173095703, 46.60258865356445, 47.739715576171875, 48.87683868408203, 50.01396560668945]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 6.0, 4.0, 6.0, 13.0, 7.0, 14.0, 8.0, 25.0, 22.0, 28.0, 25.0, 26.0, 23.0, 32.0, 38.0, 50.0, 53.0, 44.0, 47.0, 43.0, 43.0, 48.0, 40.0, 39.0, 35.0, 31.0, 31.0, 30.0, 29.0, 27.0, 30.0, 24.0, 20.0, 17.0, 10.0, 11.0, 8.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0], "bins": [-24.647010803222656, -23.960922241210938, -23.27483367919922, -22.5887451171875, -21.90265655517578, -21.21656608581543, -20.53047752380371, -19.844388961791992, -19.158300399780273, -18.472211837768555, -17.786123275756836, -17.100034713745117, -16.413944244384766, -15.727856636047363, -15.041767120361328, -14.35567855834961, -13.66958999633789, -12.983501434326172, -12.297412872314453, -11.611323356628418, -10.9252347946167, -10.23914623260498, -9.553056716918945, -8.866968154907227, -8.180879592895508, -7.494791030883789, -6.808701992034912, -6.122612953186035, -5.436524391174316, -4.750435829162598, -4.064346790313721, -3.3782577514648438, -2.692169189453125, -2.006080389022827, -1.3199915885925293, -0.6339027881622314, 0.052186012268066406, 0.7382748126983643, 1.424363613128662, 2.110452651977539, 2.796541213989258, 3.4826300144195557, 4.1687188148498535, 4.8548078536987305, 5.540896415710449, 6.226984977722168, 6.913074016571045, 7.599163055419922, 8.28525161743164, 8.97134017944336, 9.657428741455078, 10.343518257141113, 11.029606819152832, 11.71569538116455, 12.401784896850586, 13.087873458862305, 13.773962020874023, 14.460050582885742, 15.146139144897461, 15.832228660583496, 16.51831817626953, 17.20440673828125, 17.89049530029297, 18.576583862304688, 19.262672424316406]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 5.0, 5.0, 11.0, 8.0, 12.0, 19.0, 26.0, 28.0, 29.0, 35.0, 42.0, 44.0, 38.0, 47.0, 52.0, 46.0, 58.0, 45.0, 57.0, 57.0, 49.0, 35.0, 40.0, 40.0, 34.0, 26.0, 26.0, 20.0, 26.0, 5.0, 15.0, 4.0, 7.0, 5.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.798828125, -3.675811767578125, -3.55279541015625, -3.429779052734375, -3.3067626953125, -3.183746337890625, -3.06072998046875, -2.937713623046875, -2.814697265625, -2.691680908203125, -2.56866455078125, -2.445648193359375, -2.3226318359375, -2.199615478515625, -2.07659912109375, -1.953582763671875, -1.83056640625, -1.707550048828125, -1.58453369140625, -1.461517333984375, -1.3385009765625, -1.215484619140625, -1.09246826171875, -0.969451904296875, -0.846435546875, -0.723419189453125, -0.60040283203125, -0.477386474609375, -0.3543701171875, -0.231353759765625, -0.10833740234375, 0.014678955078125, 0.1376953125, 0.260711669921875, 0.38372802734375, 0.506744384765625, 0.6297607421875, 0.752777099609375, 0.87579345703125, 0.998809814453125, 1.121826171875, 1.244842529296875, 1.36785888671875, 1.490875244140625, 1.6138916015625, 1.736907958984375, 1.85992431640625, 1.982940673828125, 2.10595703125, 2.228973388671875, 2.35198974609375, 2.475006103515625, 2.5980224609375, 2.721038818359375, 2.84405517578125, 2.967071533203125, 3.090087890625, 3.213104248046875, 3.33612060546875, 3.459136962890625, 3.5821533203125, 3.705169677734375, 3.82818603515625, 3.951202392578125, 4.07421875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 13.0, 5.0, 6.0, 8.0, 16.0, 24.0, 31.0, 49.0, 67.0, 83.0, 157.0, 213.0, 311.0, 508.0, 802.0, 1224.0, 1862.0, 2806.0, 4532.0, 7057.0, 11148.0, 17907.0, 29474.0, 49576.0, 86947.0, 163233.0, 275186.0, 172044.0, 91017.0, 51166.0, 30430.0, 18637.0, 11614.0, 7277.0, 4653.0, 2975.0, 1952.0, 1204.0, 772.0, 496.0, 342.0, 233.0, 172.0, 104.0, 56.0, 38.0, 39.0, 18.0, 14.0, 18.0, 6.0, 8.0, 7.0, 6.0, 6.0, 2.0, 6.0], "bins": [-0.024810791015625, -0.02407097816467285, -0.023331165313720703, -0.022591352462768555, -0.021851539611816406, -0.021111726760864258, -0.02037191390991211, -0.01963210105895996, -0.018892288208007812, -0.018152475357055664, -0.017412662506103516, -0.016672849655151367, -0.01593303680419922, -0.01519322395324707, -0.014453411102294922, -0.013713598251342773, -0.012973785400390625, -0.012233972549438477, -0.011494159698486328, -0.01075434684753418, -0.010014533996582031, -0.009274721145629883, -0.008534908294677734, -0.007795095443725586, -0.0070552825927734375, -0.006315469741821289, -0.005575656890869141, -0.004835844039916992, -0.004096031188964844, -0.0033562183380126953, -0.002616405487060547, -0.0018765926361083984, -0.00113677978515625, -0.00039696693420410156, 0.0003428459167480469, 0.0010826587677001953, 0.0018224716186523438, 0.002562284469604492, 0.0033020973205566406, 0.004041910171508789, 0.0047817230224609375, 0.005521535873413086, 0.006261348724365234, 0.007001161575317383, 0.007740974426269531, 0.00848078727722168, 0.009220600128173828, 0.009960412979125977, 0.010700225830078125, 0.011440038681030273, 0.012179851531982422, 0.01291966438293457, 0.013659477233886719, 0.014399290084838867, 0.015139102935791016, 0.015878915786743164, 0.016618728637695312, 0.01735854148864746, 0.01809835433959961, 0.018838167190551758, 0.019577980041503906, 0.020317792892456055, 0.021057605743408203, 0.02179741859436035, 0.0225372314453125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 12.0, 8.0, 9.0, 10.0, 11.0, 21.0, 17.0, 22.0, 16.0, 27.0, 32.0, 34.0, 27.0, 28.0, 28.0, 43.0, 31.0, 46.0, 32.0, 1064.0, 50.0, 33.0, 40.0, 43.0, 38.0, 35.0, 38.0, 35.0, 35.0, 28.0, 20.0, 16.0, 9.0, 15.0, 6.0, 11.0, 10.0, 13.0, 4.0, 4.0, 5.0, 7.0, 0.0, 6.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.3671875, -2.291900634765625, -2.21661376953125, -2.141326904296875, -2.0660400390625, -1.990753173828125, -1.91546630859375, -1.840179443359375, -1.764892578125, -1.689605712890625, -1.61431884765625, -1.539031982421875, -1.4637451171875, -1.388458251953125, -1.31317138671875, -1.237884521484375, -1.16259765625, -1.087310791015625, -1.01202392578125, -0.936737060546875, -0.8614501953125, -0.786163330078125, -0.71087646484375, -0.635589599609375, -0.560302734375, -0.485015869140625, -0.40972900390625, -0.334442138671875, -0.2591552734375, -0.183868408203125, -0.10858154296875, -0.033294677734375, 0.0419921875, 0.117279052734375, 0.19256591796875, 0.267852783203125, 0.3431396484375, 0.418426513671875, 0.49371337890625, 0.569000244140625, 0.644287109375, 0.719573974609375, 0.79486083984375, 0.870147705078125, 0.9454345703125, 1.020721435546875, 1.09600830078125, 1.171295166015625, 1.24658203125, 1.321868896484375, 1.39715576171875, 1.472442626953125, 1.5477294921875, 1.623016357421875, 1.69830322265625, 1.773590087890625, 1.848876953125, 1.924163818359375, 1.99945068359375, 2.074737548828125, 2.1500244140625, 2.225311279296875, 2.30059814453125, 2.375885009765625, 2.451171875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 9.0, 10.0, 11.0, 20.0, 27.0, 41.0, 68.0, 86.0, 121.0, 175.0, 222.0, 336.0, 450.0, 668.0, 918.0, 1316.0, 1833.0, 2817.0, 3912.0, 5582.0, 8288.0, 12186.0, 18050.0, 26571.0, 39912.0, 59659.0, 91103.0, 137263.0, 1230176.0, 150792.0, 101191.0, 66533.0, 44202.0, 29576.0, 19849.0, 13494.0, 9096.0, 6249.0, 4319.0, 2999.0, 2105.0, 1470.0, 1009.0, 726.0, 536.0, 338.0, 246.0, 156.0, 131.0, 91.0, 74.0, 39.0, 28.0, 22.0, 11.0, 16.0, 7.0, 4.0, 3.0, 2.0], "bins": [-0.00789642333984375, -0.007654428482055664, -0.007412433624267578, -0.007170438766479492, -0.006928443908691406, -0.00668644905090332, -0.006444454193115234, -0.0062024593353271484, -0.0059604644775390625, -0.0057184696197509766, -0.005476474761962891, -0.005234479904174805, -0.004992485046386719, -0.004750490188598633, -0.004508495330810547, -0.004266500473022461, -0.004024505615234375, -0.003782510757446289, -0.003540515899658203, -0.003298521041870117, -0.0030565261840820312, -0.0028145313262939453, -0.0025725364685058594, -0.0023305416107177734, -0.0020885467529296875, -0.0018465518951416016, -0.0016045570373535156, -0.0013625621795654297, -0.0011205673217773438, -0.0008785724639892578, -0.0006365776062011719, -0.00039458274841308594, -0.000152587890625, 8.940696716308594e-05, 0.0003314018249511719, 0.0005733966827392578, 0.0008153915405273438, 0.0010573863983154297, 0.0012993812561035156, 0.0015413761138916016, 0.0017833709716796875, 0.0020253658294677734, 0.0022673606872558594, 0.0025093555450439453, 0.0027513504028320312, 0.002993345260620117, 0.003235340118408203, 0.003477334976196289, 0.003719329833984375, 0.003961324691772461, 0.004203319549560547, 0.004445314407348633, 0.004687309265136719, 0.004929304122924805, 0.005171298980712891, 0.0054132938385009766, 0.0056552886962890625, 0.0058972835540771484, 0.006139278411865234, 0.00638127326965332, 0.006623268127441406, 0.006865262985229492, 0.007107257843017578, 0.007349252700805664, 0.00759124755859375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 0.0, 5.0, 0.0, 16.0, 0.0, 12.0, 0.0, 17.0, 16.0, 0.0, 35.0, 0.0, 41.0, 0.0, 50.0, 65.0, 0.0, 139.0, 0.0, 212.0, 0.0, 142.0, 0.0, 92.0, 42.0, 0.0, 39.0, 0.0, 21.0, 0.0, 28.0, 8.0, 0.0, 6.0, 0.0, 6.0, 0.0, 1.0, 0.0, 5.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5367431640625e-07, -9.201467037200928e-07, -8.866190910339355e-07, -8.530914783477783e-07, -8.195638656616211e-07, -7.860362529754639e-07, -7.525086402893066e-07, -7.189810276031494e-07, -6.854534149169922e-07, -6.51925802230835e-07, -6.183981895446777e-07, -5.848705768585205e-07, -5.513429641723633e-07, -5.178153514862061e-07, -4.842877388000488e-07, -4.507601261138916e-07, -4.172325134277344e-07, -3.8370490074157715e-07, -3.501772880554199e-07, -3.166496753692627e-07, -2.8312206268310547e-07, -2.4959444999694824e-07, -2.1606683731079102e-07, -1.825392246246338e-07, -1.4901161193847656e-07, -1.1548399925231934e-07, -8.195638656616211e-08, -4.842877388000488e-08, -1.4901161193847656e-08, 1.862645149230957e-08, 5.21540641784668e-08, 8.568167686462402e-08, 1.1920928955078125e-07, 1.5273690223693848e-07, 1.862645149230957e-07, 2.1979212760925293e-07, 2.5331974029541016e-07, 2.868473529815674e-07, 3.203749656677246e-07, 3.5390257835388184e-07, 3.8743019104003906e-07, 4.209578037261963e-07, 4.544854164123535e-07, 4.880130290985107e-07, 5.21540641784668e-07, 5.550682544708252e-07, 5.885958671569824e-07, 6.221234798431396e-07, 6.556510925292969e-07, 6.891787052154541e-07, 7.227063179016113e-07, 7.562339305877686e-07, 7.897615432739258e-07, 8.23289155960083e-07, 8.568167686462402e-07, 8.903443813323975e-07, 9.238719940185547e-07, 9.57399606704712e-07, 9.909272193908691e-07, 1.0244548320770264e-06, 1.0579824447631836e-06, 1.0915100574493408e-06, 1.125037670135498e-06, 1.1585652828216553e-06, 1.1920928955078125e-06]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 5.0, 5.0, 8.0, 7.0, 15.0, 21.0, 22.0, 36.0, 45.0, 87.0, 168.0, 344.0, 2435.0, 215796.0, 822799.0, 5768.0, 466.0, 172.0, 92.0, 68.0, 47.0, 20.0, 26.0, 13.0, 10.0, 15.0, 4.0, 6.0, 9.0, 9.0, 8.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-2.580881118774414e-05, -2.5093555450439453e-05, -2.4378299713134766e-05, -2.3663043975830078e-05, -2.294778823852539e-05, -2.2232532501220703e-05, -2.1517276763916016e-05, -2.0802021026611328e-05, -2.008676528930664e-05, -1.9371509552001953e-05, -1.8656253814697266e-05, -1.7940998077392578e-05, -1.722574234008789e-05, -1.6510486602783203e-05, -1.5795230865478516e-05, -1.5079975128173828e-05, -1.436471939086914e-05, -1.3649463653564453e-05, -1.2934207916259766e-05, -1.2218952178955078e-05, -1.150369644165039e-05, -1.0788440704345703e-05, -1.0073184967041016e-05, -9.357929229736328e-06, -8.64267349243164e-06, -7.927417755126953e-06, -7.212162017822266e-06, -6.496906280517578e-06, -5.781650543212891e-06, -5.066394805908203e-06, -4.351139068603516e-06, -3.635883331298828e-06, -2.9206275939941406e-06, -2.205371856689453e-06, -1.4901161193847656e-06, -7.748603820800781e-07, -5.960464477539063e-08, 6.556510925292969e-07, 1.3709068298339844e-06, 2.086162567138672e-06, 2.8014183044433594e-06, 3.516674041748047e-06, 4.231929779052734e-06, 4.947185516357422e-06, 5.662441253662109e-06, 6.377696990966797e-06, 7.092952728271484e-06, 7.808208465576172e-06, 8.52346420288086e-06, 9.238719940185547e-06, 9.953975677490234e-06, 1.0669231414794922e-05, 1.138448715209961e-05, 1.2099742889404297e-05, 1.2814998626708984e-05, 1.3530254364013672e-05, 1.424551010131836e-05, 1.4960765838623047e-05, 1.5676021575927734e-05, 1.6391277313232422e-05, 1.710653305053711e-05, 1.7821788787841797e-05, 1.8537044525146484e-05, 1.9252300262451172e-05, 1.996755599975586e-05]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 9.0, 36.0, 129.0, 375.0, 321.0, 122.0, 19.0, 5.0, 4.0], "bins": [-6.3115667217061855e-06, -6.2043445723247714e-06, -6.097122422943357e-06, -5.989900728309294e-06, -5.88267857892788e-06, -5.775456429546466e-06, -5.668234280165052e-06, -5.561012585530989e-06, -5.453790436149575e-06, -5.346568286768161e-06, -5.239346137386747e-06, -5.1321244427526835e-06, -5.0249022933712695e-06, -4.9176801439898554e-06, -4.810457994608441e-06, -4.703236299974378e-06, -4.596014150592964e-06, -4.48879200121155e-06, -4.381569851830136e-06, -4.274348157196073e-06, -4.167126007814659e-06, -4.059903858433245e-06, -3.952681709051831e-06, -3.8454600144177675e-06, -3.738237637662678e-06, -3.631015488281264e-06, -3.5237935662735254e-06, -3.4165714168921113e-06, -3.3093494948843727e-06, -3.2021273455029586e-06, -3.09490542349522e-06, -2.987683274113806e-06, -2.8804613521060674e-06, -2.7732392027246533e-06, -2.6660172807169147e-06, -2.5587951313355006e-06, -2.451573209327762e-06, -2.344351059946348e-06, -2.2371291379386093e-06, -2.1299069885571953e-06, -2.0226848391757812e-06, -1.915462689794367e-06, -1.8082407677866286e-06, -1.7010187320920522e-06, -1.593796696397476e-06, -1.4865745470160618e-06, -1.3793526250083232e-06, -1.2721304756269092e-06, -1.1649085536191706e-06, -1.0576865179245942e-06, -9.504644822300179e-07, -8.432424465354416e-07, -7.360204108408652e-07, -6.2879831830287e-07, -5.215762826082937e-07, -4.1435424691371736e-07, -3.071322680625599e-07, -1.9991023236798355e-07, -9.26881824625525e-08, 1.4533867442878545e-08, 1.2175590313745488e-07, 2.2897796725374064e-07, 3.36200002948317e-07, 4.434220386428933e-07, 5.506440743374696e-07]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 13.0, 0.0, 0.0, 40.0, 0.0, 0.0, 60.0, 0.0, 0.0, 118.0, 0.0, 0.0, 0.0, 172.0, 0.0, 0.0, 186.0, 0.0, 0.0, 148.0, 0.0, 0.0, 115.0, 0.0, 0.0, 70.0, 0.0, 0.0, 0.0, 39.0, 0.0, 0.0, 21.0, 0.0, 0.0, 12.0, 0.0, 0.0, 6.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.556510925292969e-07, -6.370246410369873e-07, -6.183981895446777e-07, -5.997717380523682e-07, -5.811452865600586e-07, -5.62518835067749e-07, -5.438923835754395e-07, -5.252659320831299e-07, -5.066394805908203e-07, -4.880130290985107e-07, -4.6938657760620117e-07, -4.507601261138916e-07, -4.3213367462158203e-07, -4.1350722312927246e-07, -3.948807716369629e-07, -3.762543201446533e-07, -3.5762786865234375e-07, -3.390014171600342e-07, -3.203749656677246e-07, -3.0174851417541504e-07, -2.8312206268310547e-07, -2.644956111907959e-07, -2.4586915969848633e-07, -2.2724270820617676e-07, -2.086162567138672e-07, -1.8998980522155762e-07, -1.7136335372924805e-07, -1.5273690223693848e-07, -1.341104507446289e-07, -1.1548399925231934e-07, -9.685754776000977e-08, -7.82310962677002e-08, -5.960464477539063e-08, -4.0978193283081055e-08, -2.2351741790771484e-08, -3.725290298461914e-09, 1.4901161193847656e-08, 3.3527612686157227e-08, 5.21540641784668e-08, 7.078051567077637e-08, 8.940696716308594e-08, 1.0803341865539551e-07, 1.2665987014770508e-07, 1.4528632164001465e-07, 1.6391277313232422e-07, 1.825392246246338e-07, 2.0116567611694336e-07, 2.1979212760925293e-07, 2.384185791015625e-07, 2.5704503059387207e-07, 2.7567148208618164e-07, 2.942979335784912e-07, 3.129243850708008e-07, 3.3155083656311035e-07, 3.501772880554199e-07, 3.688037395477295e-07, 3.8743019104003906e-07, 4.0605664253234863e-07, 4.246830940246582e-07, 4.4330954551696777e-07, 4.6193599700927734e-07, 4.805624485015869e-07, 4.991888999938965e-07, 5.178153514862061e-07, 5.364418029785156e-07]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 5.0, 5.0, 11.0, 8.0, 12.0, 19.0, 26.0, 28.0, 29.0, 35.0, 42.0, 44.0, 38.0, 47.0, 52.0, 46.0, 58.0, 45.0, 57.0, 57.0, 49.0, 35.0, 40.0, 40.0, 34.0, 26.0, 26.0, 20.0, 26.0, 5.0, 15.0, 4.0, 7.0, 5.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.798828125, -3.675811767578125, -3.55279541015625, -3.429779052734375, -3.3067626953125, -3.183746337890625, -3.06072998046875, -2.937713623046875, -2.814697265625, -2.691680908203125, -2.56866455078125, -2.445648193359375, -2.3226318359375, -2.199615478515625, -2.07659912109375, -1.953582763671875, -1.83056640625, -1.707550048828125, -1.58453369140625, -1.461517333984375, -1.3385009765625, -1.215484619140625, -1.09246826171875, -0.969451904296875, -0.846435546875, -0.723419189453125, -0.60040283203125, -0.477386474609375, -0.3543701171875, -0.231353759765625, -0.10833740234375, 0.014678955078125, 0.1376953125, 0.260711669921875, 0.38372802734375, 0.506744384765625, 0.6297607421875, 0.752777099609375, 0.87579345703125, 0.998809814453125, 1.121826171875, 1.244842529296875, 1.36785888671875, 1.490875244140625, 1.6138916015625, 1.736907958984375, 1.85992431640625, 1.982940673828125, 2.10595703125, 2.228973388671875, 2.35198974609375, 2.475006103515625, 2.5980224609375, 2.721038818359375, 2.84405517578125, 2.967071533203125, 3.090087890625, 3.213104248046875, 3.33612060546875, 3.459136962890625, 3.5821533203125, 3.705169677734375, 3.82818603515625, 3.951202392578125, 4.07421875]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 10.0, 17.0, 24.0, 32.0, 62.0, 91.0, 151.0, 219.0, 359.0, 483.0, 779.0, 1178.0, 1830.0, 2827.0, 4223.0, 6614.0, 10804.0, 18373.0, 33154.0, 67223.0, 180458.0, 439811.0, 146155.0, 59300.0, 30003.0, 16852.0, 9964.0, 6174.0, 3931.0, 2614.0, 1746.0, 1075.0, 668.0, 482.0, 318.0, 181.0, 142.0, 78.0, 64.0, 46.0, 11.0, 15.0, 9.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.82421875, -3.70977783203125, -3.5953369140625, -3.48089599609375, -3.366455078125, -3.25201416015625, -3.1375732421875, -3.02313232421875, -2.90869140625, -2.79425048828125, -2.6798095703125, -2.56536865234375, -2.450927734375, -2.33648681640625, -2.2220458984375, -2.10760498046875, -1.9931640625, -1.87872314453125, -1.7642822265625, -1.64984130859375, -1.535400390625, -1.42095947265625, -1.3065185546875, -1.19207763671875, -1.07763671875, -0.96319580078125, -0.8487548828125, -0.73431396484375, -0.619873046875, -0.50543212890625, -0.3909912109375, -0.27655029296875, -0.162109375, -0.04766845703125, 0.0667724609375, 0.18121337890625, 0.295654296875, 0.41009521484375, 0.5245361328125, 0.63897705078125, 0.75341796875, 0.86785888671875, 0.9822998046875, 1.09674072265625, 1.211181640625, 1.32562255859375, 1.4400634765625, 1.55450439453125, 1.6689453125, 1.78338623046875, 1.8978271484375, 2.01226806640625, 2.126708984375, 2.24114990234375, 2.3555908203125, 2.47003173828125, 2.58447265625, 2.69891357421875, 2.8133544921875, 2.92779541015625, 3.042236328125, 3.15667724609375, 3.2711181640625, 3.38555908203125, 3.5]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 5.0, 4.0, 4.0, 4.0, 5.0, 9.0, 8.0, 22.0, 22.0, 26.0, 28.0, 30.0, 28.0, 27.0, 32.0, 35.0, 40.0, 39.0, 53.0, 84.0, 192.0, 1539.0, 217.0, 126.0, 68.0, 54.0, 44.0, 35.0, 34.0, 31.0, 27.0, 31.0, 23.0, 17.0, 17.0, 14.0, 14.0, 16.0, 10.0, 6.0, 4.0, 8.0, 8.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.328125, -8.0369873046875, -7.745849609375, -7.4547119140625, -7.16357421875, -6.8724365234375, -6.581298828125, -6.2901611328125, -5.9990234375, -5.7078857421875, -5.416748046875, -5.1256103515625, -4.83447265625, -4.5433349609375, -4.252197265625, -3.9610595703125, -3.669921875, -3.3787841796875, -3.087646484375, -2.7965087890625, -2.50537109375, -2.2142333984375, -1.923095703125, -1.6319580078125, -1.3408203125, -1.0496826171875, -0.758544921875, -0.4674072265625, -0.17626953125, 0.1148681640625, 0.406005859375, 0.6971435546875, 0.98828125, 1.2794189453125, 1.570556640625, 1.8616943359375, 2.15283203125, 2.4439697265625, 2.735107421875, 3.0262451171875, 3.3173828125, 3.6085205078125, 3.899658203125, 4.1907958984375, 4.48193359375, 4.7730712890625, 5.064208984375, 5.3553466796875, 5.646484375, 5.9376220703125, 6.228759765625, 6.5198974609375, 6.81103515625, 7.1021728515625, 7.393310546875, 7.6844482421875, 7.9755859375, 8.2667236328125, 8.557861328125, 8.8489990234375, 9.14013671875, 9.4312744140625, 9.722412109375, 10.0135498046875, 10.3046875]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 6.0, 6.0, 6.0, 5.0, 11.0, 9.0, 15.0, 19.0, 23.0, 22.0, 34.0, 28.0, 56.0, 64.0, 65.0, 93.0, 140.0, 165.0, 256.0, 552.0, 2321.0, 20963.0, 989638.0, 2100359.0, 26401.0, 2806.0, 603.0, 250.0, 167.0, 139.0, 115.0, 87.0, 67.0, 42.0, 39.0, 30.0, 31.0, 28.0, 10.0, 8.0, 5.0, 5.0, 4.0, 5.0, 6.0, 3.0, 1.0, 2.0, 4.0, 1.0], "bins": [-20.328125, -19.7794189453125, -19.230712890625, -18.6820068359375, -18.13330078125, -17.5845947265625, -17.035888671875, -16.4871826171875, -15.9384765625, -15.3897705078125, -14.841064453125, -14.2923583984375, -13.74365234375, -13.1949462890625, -12.646240234375, -12.0975341796875, -11.548828125, -11.0001220703125, -10.451416015625, -9.9027099609375, -9.35400390625, -8.8052978515625, -8.256591796875, -7.7078857421875, -7.1591796875, -6.6104736328125, -6.061767578125, -5.5130615234375, -4.96435546875, -4.4156494140625, -3.866943359375, -3.3182373046875, -2.76953125, -2.2208251953125, -1.672119140625, -1.1234130859375, -0.57470703125, -0.0260009765625, 0.522705078125, 1.0714111328125, 1.6201171875, 2.1688232421875, 2.717529296875, 3.2662353515625, 3.81494140625, 4.3636474609375, 4.912353515625, 5.4610595703125, 6.009765625, 6.5584716796875, 7.107177734375, 7.6558837890625, 8.20458984375, 8.7532958984375, 9.302001953125, 9.8507080078125, 10.3994140625, 10.9481201171875, 11.496826171875, 12.0455322265625, 12.59423828125, 13.1429443359375, 13.691650390625, 14.2403564453125, 14.7890625]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 17.0, 77.0, 208.0, 288.0, 243.0, 125.0, 42.0, 8.0, 2.0, 4.0], "bins": [-77.77172088623047, -76.42308807373047, -75.07445526123047, -73.72582244873047, -72.37718963623047, -71.02855682373047, -69.67992401123047, -68.331298828125, -66.982666015625, -65.634033203125, -64.285400390625, -62.936767578125, -61.588134765625, -60.239505767822266, -58.890872955322266, -57.542240142822266, -56.193603515625, -54.844970703125, -53.496337890625, -52.147705078125, -50.799072265625, -49.450443267822266, -48.101810455322266, -46.753177642822266, -45.404544830322266, -44.055912017822266, -42.707279205322266, -41.358646392822266, -40.01001739501953, -38.66138458251953, -37.31275177001953, -35.96411895751953, -34.6154899597168, -33.2668571472168, -31.918224334716797, -30.56959342956543, -29.22096061706543, -27.87232780456543, -26.523696899414062, -25.175064086914062, -23.826431274414062, -22.477798461914062, -21.129165649414062, -19.780534744262695, -18.431901931762695, -17.083269119262695, -15.734637260437012, -14.386005401611328, -13.037371635437012, -11.688739776611328, -10.340106964111328, -8.991474151611328, -7.6428422927856445, -6.294209957122803, -4.945577621459961, -3.5969457626342773, -2.2483129501342773, -0.8996806144714355, 0.44895172119140625, 1.797584056854248, 3.14621639251709, 4.494848728179932, 5.843481063842773, 7.192112922668457, 8.540745735168457]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 6.0, 2.0, 2.0, 3.0, 7.0, 3.0, 5.0, 11.0, 8.0, 12.0, 10.0, 14.0, 14.0, 20.0, 22.0, 30.0, 18.0, 22.0, 30.0, 26.0, 22.0, 24.0, 30.0, 22.0, 40.0, 31.0, 46.0, 32.0, 45.0, 41.0, 31.0, 29.0, 36.0, 32.0, 38.0, 26.0, 35.0, 28.0, 26.0, 11.0, 23.0, 23.0, 11.0, 11.0, 7.0, 6.0, 9.0, 7.0, 4.0, 4.0, 2.0, 5.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-21.958168029785156, -21.232492446899414, -20.506818771362305, -19.781143188476562, -19.05546760559082, -18.329792022705078, -17.60411834716797, -16.878442764282227, -16.152767181396484, -15.427092552185059, -14.701416969299316, -13.97574234008789, -13.250066757202148, -12.524392127990723, -11.798717498779297, -11.073041915893555, -10.347368240356445, -9.62169361114502, -8.896018028259277, -8.170343399047852, -7.444668292999268, -6.718993186950684, -5.993318557739258, -5.267643451690674, -4.54196834564209, -3.816293239593506, -3.090618371963501, -2.364943504333496, -1.639268398284912, -0.9135932922363281, -0.18791866302490234, 0.5377564430236816, 1.2634315490722656, 1.98910653591156, 2.7147815227508545, 3.4404563903808594, 4.166131496429443, 4.891806602478027, 5.617481231689453, 6.343156337738037, 7.068831443786621, 7.794506549835205, 8.520181655883789, 9.245856285095215, 9.97153091430664, 10.697206497192383, 11.422881126403809, 12.148555755615234, 12.874231338500977, 13.599905967712402, 14.325581550598145, 15.05125617980957, 15.776931762695312, 16.502605438232422, 17.228281021118164, 17.953956604003906, 18.679630279541016, 19.405305862426758, 20.130979537963867, 20.85665512084961, 21.58233070373535, 22.308006286621094, 23.033679962158203, 23.759355545043945, 24.485031127929688]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 11.0, 10.0, 9.0, 13.0, 30.0, 26.0, 31.0, 34.0, 38.0, 43.0, 38.0, 48.0, 53.0, 34.0, 61.0, 50.0, 55.0, 53.0, 55.0, 36.0, 41.0, 37.0, 37.0, 26.0, 23.0, 17.0, 27.0, 19.0, 10.0, 10.0, 4.0, 5.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.859375, -3.7354736328125, -3.611572265625, -3.4876708984375, -3.36376953125, -3.2398681640625, -3.115966796875, -2.9920654296875, -2.8681640625, -2.7442626953125, -2.620361328125, -2.4964599609375, -2.37255859375, -2.2486572265625, -2.124755859375, -2.0008544921875, -1.876953125, -1.7530517578125, -1.629150390625, -1.5052490234375, -1.38134765625, -1.2574462890625, -1.133544921875, -1.0096435546875, -0.8857421875, -0.7618408203125, -0.637939453125, -0.5140380859375, -0.39013671875, -0.2662353515625, -0.142333984375, -0.0184326171875, 0.10546875, 0.2293701171875, 0.353271484375, 0.4771728515625, 0.60107421875, 0.7249755859375, 0.848876953125, 0.9727783203125, 1.0966796875, 1.2205810546875, 1.344482421875, 1.4683837890625, 1.59228515625, 1.7161865234375, 1.840087890625, 1.9639892578125, 2.087890625, 2.2117919921875, 2.335693359375, 2.4595947265625, 2.58349609375, 2.7073974609375, 2.831298828125, 2.9552001953125, 3.0791015625, 3.2030029296875, 3.326904296875, 3.4508056640625, 3.57470703125, 3.6986083984375, 3.822509765625, 3.9464111328125, 4.0703125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 3.0, 8.0, 7.0, 19.0, 12.0, 23.0, 29.0, 34.0, 59.0, 72.0, 109.0, 189.0, 457.0, 1027.0, 2668.0, 7185.0, 22943.0, 95775.0, 624438.0, 2575965.0, 718075.0, 107954.0, 24765.0, 7634.0, 2788.0, 1054.0, 441.0, 203.0, 100.0, 76.0, 44.0, 34.0, 20.0, 18.0, 13.0, 5.0, 9.0, 9.0, 4.0, 2.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-8.21875, -7.96612548828125, -7.7135009765625, -7.46087646484375, -7.208251953125, -6.95562744140625, -6.7030029296875, -6.45037841796875, -6.19775390625, -5.94512939453125, -5.6925048828125, -5.43988037109375, -5.187255859375, -4.93463134765625, -4.6820068359375, -4.42938232421875, -4.1767578125, -3.92413330078125, -3.6715087890625, -3.41888427734375, -3.166259765625, -2.91363525390625, -2.6610107421875, -2.40838623046875, -2.15576171875, -1.90313720703125, -1.6505126953125, -1.39788818359375, -1.145263671875, -0.89263916015625, -0.6400146484375, -0.38739013671875, -0.134765625, 0.11785888671875, 0.3704833984375, 0.62310791015625, 0.875732421875, 1.12835693359375, 1.3809814453125, 1.63360595703125, 1.88623046875, 2.13885498046875, 2.3914794921875, 2.64410400390625, 2.896728515625, 3.14935302734375, 3.4019775390625, 3.65460205078125, 3.9072265625, 4.15985107421875, 4.4124755859375, 4.66510009765625, 4.917724609375, 5.17034912109375, 5.4229736328125, 5.67559814453125, 5.92822265625, 6.18084716796875, 6.4334716796875, 6.68609619140625, 6.938720703125, 7.19134521484375, 7.4439697265625, 7.69659423828125, 7.94921875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 9.0, 7.0, 23.0, 23.0, 45.0, 35.0, 82.0, 118.0, 159.0, 250.0, 365.0, 498.0, 653.0, 574.0, 390.0, 293.0, 203.0, 115.0, 63.0, 59.0, 37.0, 30.0, 17.0, 10.0, 8.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.37109375, -6.11285400390625, -5.8546142578125, -5.59637451171875, -5.338134765625, -5.07989501953125, -4.8216552734375, -4.56341552734375, -4.30517578125, -4.04693603515625, -3.7886962890625, -3.53045654296875, -3.272216796875, -3.01397705078125, -2.7557373046875, -2.49749755859375, -2.2392578125, -1.98101806640625, -1.7227783203125, -1.46453857421875, -1.206298828125, -0.94805908203125, -0.6898193359375, -0.43157958984375, -0.17333984375, 0.08489990234375, 0.3431396484375, 0.60137939453125, 0.859619140625, 1.11785888671875, 1.3760986328125, 1.63433837890625, 1.892578125, 2.15081787109375, 2.4090576171875, 2.66729736328125, 2.925537109375, 3.18377685546875, 3.4420166015625, 3.70025634765625, 3.95849609375, 4.21673583984375, 4.4749755859375, 4.73321533203125, 4.991455078125, 5.24969482421875, 5.5079345703125, 5.76617431640625, 6.0244140625, 6.28265380859375, 6.5408935546875, 6.79913330078125, 7.057373046875, 7.31561279296875, 7.5738525390625, 7.83209228515625, 8.09033203125, 8.34857177734375, 8.6068115234375, 8.86505126953125, 9.123291015625, 9.38153076171875, 9.6397705078125, 9.89801025390625, 10.15625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 5.0, 4.0, 7.0, 13.0, 17.0, 26.0, 43.0, 51.0, 85.0, 118.0, 217.0, 395.0, 847.0, 5118.0, 332208.0, 3804788.0, 46799.0, 2103.0, 605.0, 313.0, 172.0, 113.0, 79.0, 52.0, 34.0, 27.0, 17.0, 13.0, 10.0, 2.0, 5.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.78125, -34.767822265625, -33.75439453125, -32.740966796875, -31.7275390625, -30.714111328125, -29.70068359375, -28.687255859375, -27.673828125, -26.660400390625, -25.64697265625, -24.633544921875, -23.6201171875, -22.606689453125, -21.59326171875, -20.579833984375, -19.56640625, -18.552978515625, -17.53955078125, -16.526123046875, -15.5126953125, -14.499267578125, -13.48583984375, -12.472412109375, -11.458984375, -10.445556640625, -9.43212890625, -8.418701171875, -7.4052734375, -6.391845703125, -5.37841796875, -4.364990234375, -3.3515625, -2.338134765625, -1.32470703125, -0.311279296875, 0.7021484375, 1.715576171875, 2.72900390625, 3.742431640625, 4.755859375, 5.769287109375, 6.78271484375, 7.796142578125, 8.8095703125, 9.822998046875, 10.83642578125, 11.849853515625, 12.86328125, 13.876708984375, 14.89013671875, 15.903564453125, 16.9169921875, 17.930419921875, 18.94384765625, 19.957275390625, 20.970703125, 21.984130859375, 22.99755859375, 24.010986328125, 25.0244140625, 26.037841796875, 27.05126953125, 28.064697265625, 29.078125]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 8.0, 17.0, 38.0, 49.0, 93.0, 109.0, 143.0, 147.0, 131.0, 107.0, 68.0, 41.0, 33.0, 8.0, 9.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-70.85023498535156, -69.44483947753906, -68.03943634033203, -66.63404083251953, -65.22864532470703, -63.823246002197266, -62.4178466796875, -61.012451171875, -59.607051849365234, -58.20165252685547, -56.79625701904297, -55.3908576965332, -53.9854621887207, -52.58006286621094, -51.17466735839844, -49.76926803588867, -48.363868713378906, -46.95846939086914, -45.55307388305664, -44.147674560546875, -42.742279052734375, -41.33687973022461, -39.931480407714844, -38.526084899902344, -37.120689392089844, -35.71529006958008, -34.30989456176758, -32.90449523925781, -31.49909782409668, -30.093700408935547, -28.688302993774414, -27.28290557861328, -25.877504348754883, -24.47210693359375, -23.066709518432617, -21.661312103271484, -20.25591278076172, -18.850515365600586, -17.445117950439453, -16.039718627929688, -14.634322166442871, -13.228924751281738, -11.823526382446289, -10.418128967285156, -9.012731552124023, -7.607333183288574, -6.201935768127441, -4.796537399291992, -3.3911399841308594, -1.985742211341858, -0.5803444385528564, 0.8250532150268555, 2.2304511070251465, 3.6358489990234375, 5.04124641418457, 6.4466447830200195, 7.852042198181152, 9.257439613342285, 10.662837982177734, 12.068235397338867, 13.4736328125, 14.87903118133545, 16.284427642822266, 17.68982696533203, 19.095224380493164]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 8.0, 2.0, 7.0, 7.0, 9.0, 4.0, 7.0, 7.0, 16.0, 12.0, 13.0, 21.0, 25.0, 23.0, 23.0, 33.0, 37.0, 33.0, 40.0, 44.0, 54.0, 52.0, 50.0, 44.0, 57.0, 32.0, 42.0, 33.0, 38.0, 39.0, 29.0, 28.0, 26.0, 20.0, 16.0, 16.0, 14.0, 11.0, 8.0, 18.0, 2.0, 3.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.21916961669922, -25.479211807250977, -24.739255905151367, -23.999298095703125, -23.259340286254883, -22.51938247680664, -21.77942657470703, -21.03946876525879, -20.299510955810547, -19.559553146362305, -18.819597244262695, -18.079639434814453, -17.33968162536621, -16.59972381591797, -15.85976791381836, -15.119810104370117, -14.379854202270508, -13.639897346496582, -12.89993953704834, -12.159982681274414, -11.420024871826172, -10.680068016052246, -9.94011116027832, -9.200153350830078, -8.460196495056152, -7.720239162445068, -6.980281829833984, -6.240324974060059, -5.500367641448975, -4.760410308837891, -4.020453453063965, -3.280496120452881, -2.540538787841797, -1.8005815744400024, -1.060624361038208, -0.3206672668457031, 0.41929006576538086, 1.1592473983764648, 1.8992042541503906, 2.6391615867614746, 3.3791189193725586, 4.119076251983643, 4.859033584594727, 5.598990440368652, 6.338947772979736, 7.07890510559082, 7.818861961364746, 8.558818817138672, 9.298776626586914, 10.03873348236084, 10.778691291809082, 11.518648147583008, 12.25860595703125, 12.998562812805176, 13.738519668579102, 14.478477478027344, 15.21843433380127, 15.958391189575195, 16.698348999023438, 17.438304901123047, 18.17826271057129, 18.91822052001953, 19.65817642211914, 20.398134231567383, 21.138092041015625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 5.0, 6.0, 2.0, 4.0, 7.0, 6.0, 13.0, 13.0, 11.0, 23.0, 30.0, 36.0, 21.0, 37.0, 36.0, 36.0, 39.0, 41.0, 51.0, 48.0, 48.0, 40.0, 45.0, 37.0, 49.0, 44.0, 33.0, 37.0, 31.0, 33.0, 27.0, 21.0, 19.0, 16.0, 17.0, 11.0, 11.0, 6.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.484375, -3.371337890625, -3.25830078125, -3.145263671875, -3.0322265625, -2.919189453125, -2.80615234375, -2.693115234375, -2.580078125, -2.467041015625, -2.35400390625, -2.240966796875, -2.1279296875, -2.014892578125, -1.90185546875, -1.788818359375, -1.67578125, -1.562744140625, -1.44970703125, -1.336669921875, -1.2236328125, -1.110595703125, -0.99755859375, -0.884521484375, -0.771484375, -0.658447265625, -0.54541015625, -0.432373046875, -0.3193359375, -0.206298828125, -0.09326171875, 0.019775390625, 0.1328125, 0.245849609375, 0.35888671875, 0.471923828125, 0.5849609375, 0.697998046875, 0.81103515625, 0.924072265625, 1.037109375, 1.150146484375, 1.26318359375, 1.376220703125, 1.4892578125, 1.602294921875, 1.71533203125, 1.828369140625, 1.94140625, 2.054443359375, 2.16748046875, 2.280517578125, 2.3935546875, 2.506591796875, 2.61962890625, 2.732666015625, 2.845703125, 2.958740234375, 3.07177734375, 3.184814453125, 3.2978515625, 3.410888671875, 3.52392578125, 3.636962890625, 3.75]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 8.0, 10.0, 13.0, 16.0, 32.0, 38.0, 62.0, 119.0, 186.0, 297.0, 480.0, 860.0, 1432.0, 2475.0, 4249.0, 7955.0, 15053.0, 28498.0, 57613.0, 124255.0, 306941.0, 275974.0, 112141.0, 52361.0, 26570.0, 13764.0, 7550.0, 4057.0, 2304.0, 1311.0, 740.0, 460.0, 289.0, 155.0, 102.0, 64.0, 48.0, 22.0, 20.0, 7.0, 13.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03289794921875, -0.03183460235595703, -0.030771255493164062, -0.029707908630371094, -0.028644561767578125, -0.027581214904785156, -0.026517868041992188, -0.02545452117919922, -0.02439117431640625, -0.02332782745361328, -0.022264480590820312, -0.021201133728027344, -0.020137786865234375, -0.019074440002441406, -0.018011093139648438, -0.01694774627685547, -0.0158843994140625, -0.014821052551269531, -0.013757705688476562, -0.012694358825683594, -0.011631011962890625, -0.010567665100097656, -0.009504318237304688, -0.008440971374511719, -0.00737762451171875, -0.006314277648925781, -0.0052509307861328125, -0.004187583923339844, -0.003124237060546875, -0.0020608901977539062, -0.0009975433349609375, 6.580352783203125e-05, 0.001129150390625, 0.0021924972534179688, 0.0032558441162109375, 0.004319190979003906, 0.005382537841796875, 0.006445884704589844, 0.0075092315673828125, 0.008572578430175781, 0.00963592529296875, 0.010699272155761719, 0.011762619018554688, 0.012825965881347656, 0.013889312744140625, 0.014952659606933594, 0.016016006469726562, 0.01707935333251953, 0.0181427001953125, 0.01920604705810547, 0.020269393920898438, 0.021332740783691406, 0.022396087646484375, 0.023459434509277344, 0.024522781372070312, 0.02558612823486328, 0.02664947509765625, 0.02771282196044922, 0.028776168823242188, 0.029839515686035156, 0.030902862548828125, 0.031966209411621094, 0.03302955627441406, 0.03409290313720703, 0.03515625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 4.0, 5.0, 5.0, 9.0, 15.0, 18.0, 21.0, 20.0, 31.0, 31.0, 38.0, 32.0, 35.0, 48.0, 34.0, 42.0, 48.0, 36.0, 1061.0, 53.0, 49.0, 32.0, 43.0, 33.0, 42.0, 36.0, 32.0, 23.0, 22.0, 24.0, 23.0, 10.0, 13.0, 19.0, 6.0, 7.0, 11.0, 4.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.890625, -2.7991943359375, -2.707763671875, -2.6163330078125, -2.52490234375, -2.4334716796875, -2.342041015625, -2.2506103515625, -2.1591796875, -2.0677490234375, -1.976318359375, -1.8848876953125, -1.79345703125, -1.7020263671875, -1.610595703125, -1.5191650390625, -1.427734375, -1.3363037109375, -1.244873046875, -1.1534423828125, -1.06201171875, -0.9705810546875, -0.879150390625, -0.7877197265625, -0.6962890625, -0.6048583984375, -0.513427734375, -0.4219970703125, -0.33056640625, -0.2391357421875, -0.147705078125, -0.0562744140625, 0.03515625, 0.1265869140625, 0.218017578125, 0.3094482421875, 0.40087890625, 0.4923095703125, 0.583740234375, 0.6751708984375, 0.7666015625, 0.8580322265625, 0.949462890625, 1.0408935546875, 1.13232421875, 1.2237548828125, 1.315185546875, 1.4066162109375, 1.498046875, 1.5894775390625, 1.680908203125, 1.7723388671875, 1.86376953125, 1.9552001953125, 2.046630859375, 2.1380615234375, 2.2294921875, 2.3209228515625, 2.412353515625, 2.5037841796875, 2.59521484375, 2.6866455078125, 2.778076171875, 2.8695068359375, 2.9609375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 5.0, 7.0, 8.0, 21.0, 22.0, 22.0, 53.0, 63.0, 115.0, 147.0, 247.0, 342.0, 525.0, 775.0, 1153.0, 1723.0, 2722.0, 4152.0, 6355.0, 10198.0, 15983.0, 25092.0, 39969.0, 64394.0, 105689.0, 176607.0, 1264156.0, 145061.0, 86783.0, 53275.0, 33155.0, 20871.0, 13257.0, 8457.0, 5464.0, 3510.0, 2274.0, 1475.0, 1007.0, 673.0, 423.0, 278.0, 191.0, 141.0, 87.0, 72.0, 38.0, 34.0, 24.0, 14.0, 8.0, 5.0, 1.0, 5.0, 2.0, 3.0, 2.0, 2.0], "bins": [-0.0098419189453125, -0.009537220001220703, -0.009232521057128906, -0.00892782211303711, -0.008623123168945312, -0.008318424224853516, -0.008013725280761719, -0.007709026336669922, -0.007404327392578125, -0.007099628448486328, -0.006794929504394531, -0.006490230560302734, -0.0061855316162109375, -0.005880832672119141, -0.005576133728027344, -0.005271434783935547, -0.00496673583984375, -0.004662036895751953, -0.004357337951660156, -0.004052639007568359, -0.0037479400634765625, -0.0034432411193847656, -0.0031385421752929688, -0.002833843231201172, -0.002529144287109375, -0.002224445343017578, -0.0019197463989257812, -0.0016150474548339844, -0.0013103485107421875, -0.0010056495666503906, -0.0007009506225585938, -0.0003962516784667969, -9.1552734375e-05, 0.00021314620971679688, 0.0005178451538085938, 0.0008225440979003906, 0.0011272430419921875, 0.0014319419860839844, 0.0017366409301757812, 0.002041339874267578, 0.002346038818359375, 0.002650737762451172, 0.0029554367065429688, 0.0032601356506347656, 0.0035648345947265625, 0.0038695335388183594, 0.004174232482910156, 0.004478931427001953, 0.00478363037109375, 0.005088329315185547, 0.005393028259277344, 0.005697727203369141, 0.0060024261474609375, 0.006307125091552734, 0.006611824035644531, 0.006916522979736328, 0.007221221923828125, 0.007525920867919922, 0.007830619812011719, 0.008135318756103516, 0.008440017700195312, 0.00874471664428711, 0.009049415588378906, 0.009354114532470703, 0.0096588134765625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 10.0, 0.0, 12.0, 12.0, 0.0, 15.0, 0.0, 30.0, 32.0, 0.0, 52.0, 0.0, 84.0, 0.0, 137.0, 228.0, 0.0, 150.0, 0.0, 80.0, 0.0, 56.0, 49.0, 0.0, 22.0, 0.0, 14.0, 11.0, 0.0, 3.0, 0.0, 3.0, 0.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1324882507324219e-06, -1.0980293154716492e-06, -1.0635703802108765e-06, -1.0291114449501038e-06, -9.94652509689331e-07, -9.601935744285583e-07, -9.257346391677856e-07, -8.912757039070129e-07, -8.568167686462402e-07, -8.223578333854675e-07, -7.878988981246948e-07, -7.534399628639221e-07, -7.189810276031494e-07, -6.845220923423767e-07, -6.50063157081604e-07, -6.156042218208313e-07, -5.811452865600586e-07, -5.466863512992859e-07, -5.122274160385132e-07, -4.777684807777405e-07, -4.4330954551696777e-07, -4.0885061025619507e-07, -3.7439167499542236e-07, -3.3993273973464966e-07, -3.0547380447387695e-07, -2.7101486921310425e-07, -2.3655593395233154e-07, -2.0209699869155884e-07, -1.6763806343078613e-07, -1.3317912817001343e-07, -9.872019290924072e-08, -6.426125764846802e-08, -2.9802322387695312e-08, 4.6566128730773926e-09, 3.91155481338501e-08, 7.35744833946228e-08, 1.0803341865539551e-07, 1.424923539161682e-07, 1.7695128917694092e-07, 2.1141022443771362e-07, 2.4586915969848633e-07, 2.8032809495925903e-07, 3.1478703022003174e-07, 3.4924596548080444e-07, 3.8370490074157715e-07, 4.1816383600234985e-07, 4.5262277126312256e-07, 4.870817065238953e-07, 5.21540641784668e-07, 5.559995770454407e-07, 5.904585123062134e-07, 6.249174475669861e-07, 6.593763828277588e-07, 6.938353180885315e-07, 7.282942533493042e-07, 7.627531886100769e-07, 7.972121238708496e-07, 8.316710591316223e-07, 8.66129994392395e-07, 9.005889296531677e-07, 9.350478649139404e-07, 9.695068001747131e-07, 1.0039657354354858e-06, 1.0384246706962585e-06, 1.0728836059570312e-06]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 2.0, 4.0, 4.0, 14.0, 16.0, 14.0, 40.0, 38.0, 54.0, 101.0, 252.0, 2001.0, 354813.0, 688045.0, 2552.0, 251.0, 116.0, 74.0, 40.0, 24.0, 13.0, 27.0, 12.0, 5.0, 3.0, 10.0, 7.0, 3.0, 1.0, 4.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.396106719970703e-05, -2.31890007853508e-05, -2.2416934370994568e-05, -2.1644867956638336e-05, -2.0872801542282104e-05, -2.0100735127925873e-05, -1.932866871356964e-05, -1.855660229921341e-05, -1.7784535884857178e-05, -1.7012469470500946e-05, -1.6240403056144714e-05, -1.5468336641788483e-05, -1.4696270227432251e-05, -1.392420381307602e-05, -1.3152137398719788e-05, -1.2380070984363556e-05, -1.1608004570007324e-05, -1.0835938155651093e-05, -1.006387174129486e-05, -9.291805326938629e-06, -8.519738912582397e-06, -7.747672498226166e-06, -6.975606083869934e-06, -6.203539669513702e-06, -5.431473255157471e-06, -4.659406840801239e-06, -3.887340426445007e-06, -3.1152740120887756e-06, -2.343207597732544e-06, -1.5711411833763123e-06, -7.990747690200806e-07, -2.7008354663848877e-08, 7.450580596923828e-07, 1.5171244740486145e-06, 2.289190888404846e-06, 3.061257302761078e-06, 3.8333237171173096e-06, 4.605390131473541e-06, 5.377456545829773e-06, 6.149522960186005e-06, 6.921589374542236e-06, 7.693655788898468e-06, 8.4657222032547e-06, 9.237788617610931e-06, 1.0009855031967163e-05, 1.0781921446323395e-05, 1.1553987860679626e-05, 1.2326054275035858e-05, 1.309812068939209e-05, 1.3870187103748322e-05, 1.4642253518104553e-05, 1.5414319932460785e-05, 1.6186386346817017e-05, 1.6958452761173248e-05, 1.773051917552948e-05, 1.850258558988571e-05, 1.9274652004241943e-05, 2.0046718418598175e-05, 2.0818784832954407e-05, 2.159085124731064e-05, 2.236291766166687e-05, 2.3134984076023102e-05, 2.3907050490379333e-05, 2.4679116904735565e-05, 2.5451183319091797e-05]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 15.0, 32.0, 99.0, 217.0, 295.0, 215.0, 88.0, 25.0, 17.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.2235677736025536e-06, -3.1608997232979164e-06, -3.098231672993279e-06, -3.0355636226886418e-06, -2.97289579975768e-06, -2.9102277494530426e-06, -2.8475596991484053e-06, -2.784891648843768e-06, -2.7222235985391308e-06, -2.6595555482344935e-06, -2.596887497929856e-06, -2.534219447625219e-06, -2.4715513973205816e-06, -2.4088835743896198e-06, -2.3462155240849825e-06, -2.283547473780345e-06, -2.220879423475708e-06, -2.1582113731710706e-06, -2.0955433228664333e-06, -2.032875272561796e-06, -1.970207449630834e-06, -1.907539399326197e-06, -1.8448713490215596e-06, -1.7822032987169223e-06, -1.719535248412285e-06, -1.6568671981076477e-06, -1.5941991478030104e-06, -1.5315312111852109e-06, -1.4688631608805736e-06, -1.4061951105759363e-06, -1.3435271739581367e-06, -1.2808591236534994e-06, -1.2181911870356998e-06, -1.1555231367310626e-06, -1.092855200113263e-06, -1.0301871498086257e-06, -9.675190995039884e-07, -9.048510491993511e-07, -8.421830557381327e-07, -7.795150622769143e-07, -7.16847011972277e-07, -6.541789616676397e-07, -5.915109682064212e-07, -5.288429747452028e-07, -4.661749244405655e-07, -4.0350690255763766e-07, -3.408388806747098e-07, -2.7817085879178194e-07, -2.1550283690885408e-07, -1.5283481502592622e-07, -9.016679314299836e-08, -2.7498771260070498e-08, 3.516925062285736e-08, 9.783727250578522e-08, 1.6050529438871308e-07, 2.2317331627164094e-07, 2.858413381545688e-07, 3.4850936003749666e-07, 4.111773819204245e-07, 4.738454038033524e-07, 5.365134256862802e-07, 5.991814759909175e-07, 6.61849469452136e-07, 7.245174629133544e-07, 7.871855132179917e-07]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 15.0, 0.0, 0.0, 0.0, 27.0, 0.0, 0.0, 0.0, 64.0, 0.0, 0.0, 0.0, 109.0, 0.0, 0.0, 0.0, 192.0, 0.0, 0.0, 0.0, 217.0, 0.0, 0.0, 0.0, 189.0, 0.0, 0.0, 0.0, 104.0, 0.0, 0.0, 0.0, 54.0, 0.0, 0.0, 0.0, 27.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-07, -4.6193599700927734e-07, -4.470348358154297e-07, -4.3213367462158203e-07, -4.172325134277344e-07, -4.023313522338867e-07, -3.8743019104003906e-07, -3.725290298461914e-07, -3.5762786865234375e-07, -3.427267074584961e-07, -3.2782554626464844e-07, -3.129243850708008e-07, -2.980232238769531e-07, -2.8312206268310547e-07, -2.682209014892578e-07, -2.5331974029541016e-07, -2.384185791015625e-07, -2.2351741790771484e-07, -2.086162567138672e-07, -1.9371509552001953e-07, -1.7881393432617188e-07, -1.6391277313232422e-07, -1.4901161193847656e-07, -1.341104507446289e-07, -1.1920928955078125e-07, -1.043081283569336e-07, -8.940696716308594e-08, -7.450580596923828e-08, -5.960464477539063e-08, -4.470348358154297e-08, -2.9802322387695312e-08, -1.4901161193847656e-08, 0.0, 1.4901161193847656e-08, 2.9802322387695312e-08, 4.470348358154297e-08, 5.960464477539063e-08, 7.450580596923828e-08, 8.940696716308594e-08, 1.043081283569336e-07, 1.1920928955078125e-07, 1.341104507446289e-07, 1.4901161193847656e-07, 1.6391277313232422e-07, 1.7881393432617188e-07, 1.9371509552001953e-07, 2.086162567138672e-07, 2.2351741790771484e-07, 2.384185791015625e-07, 2.5331974029541016e-07, 2.682209014892578e-07, 2.8312206268310547e-07, 2.980232238769531e-07, 3.129243850708008e-07, 3.2782554626464844e-07, 3.427267074584961e-07, 3.5762786865234375e-07, 3.725290298461914e-07, 3.8743019104003906e-07, 4.023313522338867e-07, 4.172325134277344e-07, 4.3213367462158203e-07, 4.470348358154297e-07, 4.6193599700927734e-07, 4.76837158203125e-07]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 5.0, 6.0, 2.0, 4.0, 7.0, 6.0, 13.0, 13.0, 11.0, 23.0, 30.0, 36.0, 21.0, 37.0, 36.0, 36.0, 39.0, 41.0, 51.0, 48.0, 48.0, 40.0, 45.0, 37.0, 49.0, 44.0, 33.0, 37.0, 31.0, 33.0, 27.0, 21.0, 19.0, 16.0, 17.0, 11.0, 11.0, 6.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.484375, -3.371337890625, -3.25830078125, -3.145263671875, -3.0322265625, -2.919189453125, -2.80615234375, -2.693115234375, -2.580078125, -2.467041015625, -2.35400390625, -2.240966796875, -2.1279296875, -2.014892578125, -1.90185546875, -1.788818359375, -1.67578125, -1.562744140625, -1.44970703125, -1.336669921875, -1.2236328125, -1.110595703125, -0.99755859375, -0.884521484375, -0.771484375, -0.658447265625, -0.54541015625, -0.432373046875, -0.3193359375, -0.206298828125, -0.09326171875, 0.019775390625, 0.1328125, 0.245849609375, 0.35888671875, 0.471923828125, 0.5849609375, 0.697998046875, 0.81103515625, 0.924072265625, 1.037109375, 1.150146484375, 1.26318359375, 1.376220703125, 1.4892578125, 1.602294921875, 1.71533203125, 1.828369140625, 1.94140625, 2.054443359375, 2.16748046875, 2.280517578125, 2.3935546875, 2.506591796875, 2.61962890625, 2.732666015625, 2.845703125, 2.958740234375, 3.07177734375, 3.184814453125, 3.2978515625, 3.410888671875, 3.52392578125, 3.636962890625, 3.75]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 9.0, 8.0, 8.0, 11.0, 15.0, 23.0, 46.0, 81.0, 139.0, 219.0, 320.0, 606.0, 915.0, 1372.0, 2234.0, 3562.0, 5609.0, 9200.0, 14500.0, 24102.0, 43947.0, 86170.0, 227802.0, 375069.0, 118786.0, 56375.0, 30585.0, 17610.0, 11037.0, 6752.0, 4284.0, 2618.0, 1732.0, 1060.0, 646.0, 442.0, 260.0, 141.0, 112.0, 65.0, 35.0, 31.0, 15.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.736328125, -2.642608642578125, -2.54888916015625, -2.455169677734375, -2.3614501953125, -2.267730712890625, -2.17401123046875, -2.080291748046875, -1.986572265625, -1.892852783203125, -1.79913330078125, -1.705413818359375, -1.6116943359375, -1.517974853515625, -1.42425537109375, -1.330535888671875, -1.23681640625, -1.143096923828125, -1.04937744140625, -0.955657958984375, -0.8619384765625, -0.768218994140625, -0.67449951171875, -0.580780029296875, -0.487060546875, -0.393341064453125, -0.29962158203125, -0.205902099609375, -0.1121826171875, -0.018463134765625, 0.07525634765625, 0.168975830078125, 0.2626953125, 0.356414794921875, 0.45013427734375, 0.543853759765625, 0.6375732421875, 0.731292724609375, 0.82501220703125, 0.918731689453125, 1.012451171875, 1.106170654296875, 1.19989013671875, 1.293609619140625, 1.3873291015625, 1.481048583984375, 1.57476806640625, 1.668487548828125, 1.76220703125, 1.855926513671875, 1.94964599609375, 2.043365478515625, 2.1370849609375, 2.230804443359375, 2.32452392578125, 2.418243408203125, 2.511962890625, 2.605682373046875, 2.69940185546875, 2.793121337890625, 2.8868408203125, 2.980560302734375, 3.07427978515625, 3.167999267578125, 3.26171875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 7.0, 5.0, 14.0, 15.0, 12.0, 14.0, 13.0, 21.0, 22.0, 35.0, 28.0, 36.0, 31.0, 39.0, 56.0, 56.0, 87.0, 178.0, 1581.0, 264.0, 79.0, 54.0, 45.0, 63.0, 34.0, 38.0, 27.0, 24.0, 17.0, 27.0, 23.0, 19.0, 17.0, 15.0, 9.0, 11.0, 8.0, 8.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.671875, -9.365966796875, -9.06005859375, -8.754150390625, -8.4482421875, -8.142333984375, -7.83642578125, -7.530517578125, -7.224609375, -6.918701171875, -6.61279296875, -6.306884765625, -6.0009765625, -5.695068359375, -5.38916015625, -5.083251953125, -4.77734375, -4.471435546875, -4.16552734375, -3.859619140625, -3.5537109375, -3.247802734375, -2.94189453125, -2.635986328125, -2.330078125, -2.024169921875, -1.71826171875, -1.412353515625, -1.1064453125, -0.800537109375, -0.49462890625, -0.188720703125, 0.1171875, 0.423095703125, 0.72900390625, 1.034912109375, 1.3408203125, 1.646728515625, 1.95263671875, 2.258544921875, 2.564453125, 2.870361328125, 3.17626953125, 3.482177734375, 3.7880859375, 4.093994140625, 4.39990234375, 4.705810546875, 5.01171875, 5.317626953125, 5.62353515625, 5.929443359375, 6.2353515625, 6.541259765625, 6.84716796875, 7.153076171875, 7.458984375, 7.764892578125, 8.07080078125, 8.376708984375, 8.6826171875, 8.988525390625, 9.29443359375, 9.600341796875, 9.90625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 6.0, 5.0, 10.0, 15.0, 18.0, 31.0, 29.0, 56.0, 49.0, 66.0, 108.0, 118.0, 204.0, 257.0, 475.0, 1214.0, 6324.0, 87333.0, 2863403.0, 172818.0, 10011.0, 1558.0, 558.0, 289.0, 199.0, 140.0, 117.0, 59.0, 50.0, 46.0, 26.0, 32.0, 20.0, 11.0, 12.0, 9.0, 8.0, 6.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.359375, -15.8575439453125, -15.355712890625, -14.8538818359375, -14.35205078125, -13.8502197265625, -13.348388671875, -12.8465576171875, -12.3447265625, -11.8428955078125, -11.341064453125, -10.8392333984375, -10.33740234375, -9.8355712890625, -9.333740234375, -8.8319091796875, -8.330078125, -7.8282470703125, -7.326416015625, -6.8245849609375, -6.32275390625, -5.8209228515625, -5.319091796875, -4.8172607421875, -4.3154296875, -3.8135986328125, -3.311767578125, -2.8099365234375, -2.30810546875, -1.8062744140625, -1.304443359375, -0.8026123046875, -0.30078125, 0.2010498046875, 0.702880859375, 1.2047119140625, 1.70654296875, 2.2083740234375, 2.710205078125, 3.2120361328125, 3.7138671875, 4.2156982421875, 4.717529296875, 5.2193603515625, 5.72119140625, 6.2230224609375, 6.724853515625, 7.2266845703125, 7.728515625, 8.2303466796875, 8.732177734375, 9.2340087890625, 9.73583984375, 10.2376708984375, 10.739501953125, 11.2413330078125, 11.7431640625, 12.2449951171875, 12.746826171875, 13.2486572265625, 13.75048828125, 14.2523193359375, 14.754150390625, 15.2559814453125, 15.7578125]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 15.0, 176.0, 509.0, 281.0, 28.0, 5.0, 0.0, 0.0, 1.0], "bins": [-152.0040283203125, -149.3657684326172, -146.72750854492188, -144.08924865722656, -141.45098876953125, -138.812744140625, -136.1744842529297, -133.53622436523438, -130.89796447753906, -128.25970458984375, -125.62144470214844, -122.98319244384766, -120.34493255615234, -117.70667266845703, -115.06842041015625, -112.43016052246094, -109.79190063476562, -107.15364074707031, -104.515380859375, -101.87712860107422, -99.2388687133789, -96.6006088256836, -93.96235656738281, -91.3240966796875, -88.68583679199219, -86.04757690429688, -83.40931701660156, -80.77106475830078, -78.13280487060547, -75.49454498291016, -72.85629272460938, -70.21803283691406, -67.57976531982422, -64.9415054321289, -62.30324935913086, -59.66499328613281, -57.0267333984375, -54.38847351074219, -51.75021743774414, -49.111961364746094, -46.47370147705078, -43.83544158935547, -41.19718551635742, -38.558929443359375, -35.92066955566406, -33.28240966796875, -30.644153594970703, -28.005895614624023, -25.367639541625977, -22.729381561279297, -20.091123580932617, -17.452865600585938, -14.814607620239258, -12.176349639892578, -9.538091659545898, -6.899833679199219, -4.261575698852539, -1.6233177185058594, 1.0149402618408203, 3.6531982421875, 6.29145622253418, 8.92971420288086, 11.567972183227539, 14.206230163574219, 16.8444881439209]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 2.0, 5.0, 12.0, 9.0, 16.0, 20.0, 13.0, 25.0, 26.0, 34.0, 18.0, 38.0, 38.0, 53.0, 31.0, 43.0, 33.0, 38.0, 44.0, 49.0, 43.0, 44.0, 55.0, 43.0, 36.0, 32.0, 37.0, 28.0, 29.0, 25.0, 18.0, 13.0, 9.0, 8.0, 11.0, 11.0, 7.0, 4.0, 3.0, 7.0, 0.0, 0.0, 1.0, 2.0], "bins": [-38.28861999511719, -37.29345703125, -36.29829406738281, -35.303131103515625, -34.30796432495117, -33.312801361083984, -32.3176383972168, -31.32247543334961, -30.327312469482422, -29.332149505615234, -28.336984634399414, -27.341821670532227, -26.34665870666504, -25.35149383544922, -24.35633087158203, -23.361167907714844, -22.366003036499023, -21.370840072631836, -20.375675201416016, -19.380512237548828, -18.38534927368164, -17.390186309814453, -16.395021438598633, -15.399858474731445, -14.404694557189941, -13.409530639648438, -12.41436767578125, -11.419203758239746, -10.424039840698242, -9.428876876831055, -8.43371295928955, -7.438549518585205, -6.443386077880859, -5.448222637176514, -4.453059196472168, -3.457895278930664, -2.4627318382263184, -1.4675683975219727, -0.47240447998046875, 0.522758960723877, 1.5179224014282227, 2.5130858421325684, 3.508249521255493, 4.503413200378418, 5.498576641082764, 6.493740081787109, 7.488903999328613, 8.484067916870117, 9.479230880737305, 10.474394798278809, 11.469557762145996, 12.4647216796875, 13.459884643554688, 14.455048561096191, 15.450212478637695, 16.445375442504883, 17.440540313720703, 18.43570327758789, 19.43086814880371, 20.4260311126709, 21.421194076538086, 22.416358947753906, 23.411521911621094, 24.40668487548828, 25.40184783935547]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 4.0, 1.0, 9.0, 6.0, 14.0, 9.0, 16.0, 21.0, 16.0, 24.0, 39.0, 31.0, 35.0, 46.0, 42.0, 40.0, 48.0, 56.0, 38.0, 45.0, 50.0, 46.0, 30.0, 42.0, 47.0, 40.0, 37.0, 30.0, 21.0, 25.0, 23.0, 18.0, 13.0, 11.0, 7.0, 8.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.763671875, -3.642486572265625, -3.52130126953125, -3.400115966796875, -3.2789306640625, -3.157745361328125, -3.03656005859375, -2.915374755859375, -2.794189453125, -2.673004150390625, -2.55181884765625, -2.430633544921875, -2.3094482421875, -2.188262939453125, -2.06707763671875, -1.945892333984375, -1.82470703125, -1.703521728515625, -1.58233642578125, -1.461151123046875, -1.3399658203125, -1.218780517578125, -1.09759521484375, -0.976409912109375, -0.855224609375, -0.734039306640625, -0.61285400390625, -0.491668701171875, -0.3704833984375, -0.249298095703125, -0.12811279296875, -0.006927490234375, 0.1142578125, 0.235443115234375, 0.35662841796875, 0.477813720703125, 0.5989990234375, 0.720184326171875, 0.84136962890625, 0.962554931640625, 1.083740234375, 1.204925537109375, 1.32611083984375, 1.447296142578125, 1.5684814453125, 1.689666748046875, 1.81085205078125, 1.932037353515625, 2.05322265625, 2.174407958984375, 2.29559326171875, 2.416778564453125, 2.5379638671875, 2.659149169921875, 2.78033447265625, 2.901519775390625, 3.022705078125, 3.143890380859375, 3.26507568359375, 3.386260986328125, 3.5074462890625, 3.628631591796875, 3.74981689453125, 3.871002197265625, 3.9921875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 2.0, 15.0, 11.0, 13.0, 27.0, 34.0, 37.0, 52.0, 67.0, 98.0, 170.0, 299.0, 451.0, 853.0, 1754.0, 3871.0, 10810.0, 34493.0, 152549.0, 1047642.0, 2404297.0, 428335.0, 76246.0, 19911.0, 6648.0, 2699.0, 1254.0, 620.0, 372.0, 197.0, 137.0, 83.0, 66.0, 31.0, 34.0, 35.0, 23.0, 11.0, 8.0, 6.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-8.4765625, -8.22186279296875, -7.9671630859375, -7.71246337890625, -7.457763671875, -7.20306396484375, -6.9483642578125, -6.69366455078125, -6.43896484375, -6.18426513671875, -5.9295654296875, -5.67486572265625, -5.420166015625, -5.16546630859375, -4.9107666015625, -4.65606689453125, -4.4013671875, -4.14666748046875, -3.8919677734375, -3.63726806640625, -3.382568359375, -3.12786865234375, -2.8731689453125, -2.61846923828125, -2.36376953125, -2.10906982421875, -1.8543701171875, -1.59967041015625, -1.344970703125, -1.09027099609375, -0.8355712890625, -0.58087158203125, -0.326171875, -0.07147216796875, 0.1832275390625, 0.43792724609375, 0.692626953125, 0.94732666015625, 1.2020263671875, 1.45672607421875, 1.71142578125, 1.96612548828125, 2.2208251953125, 2.47552490234375, 2.730224609375, 2.98492431640625, 3.2396240234375, 3.49432373046875, 3.7490234375, 4.00372314453125, 4.2584228515625, 4.51312255859375, 4.767822265625, 5.02252197265625, 5.2772216796875, 5.53192138671875, 5.78662109375, 6.04132080078125, 6.2960205078125, 6.55072021484375, 6.805419921875, 7.06011962890625, 7.3148193359375, 7.56951904296875, 7.82421875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 0.0, 5.0, 15.0, 14.0, 28.0, 44.0, 51.0, 77.0, 98.0, 169.0, 211.0, 289.0, 405.0, 565.0, 560.0, 478.0, 327.0, 221.0, 164.0, 113.0, 82.0, 47.0, 30.0, 25.0, 14.0, 15.0, 4.0, 7.0, 4.0, 1.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.859375, -8.62109375, -8.3828125, -8.14453125, -7.90625, -7.66796875, -7.4296875, -7.19140625, -6.953125, -6.71484375, -6.4765625, -6.23828125, -6.0, -5.76171875, -5.5234375, -5.28515625, -5.046875, -4.80859375, -4.5703125, -4.33203125, -4.09375, -3.85546875, -3.6171875, -3.37890625, -3.140625, -2.90234375, -2.6640625, -2.42578125, -2.1875, -1.94921875, -1.7109375, -1.47265625, -1.234375, -0.99609375, -0.7578125, -0.51953125, -0.28125, -0.04296875, 0.1953125, 0.43359375, 0.671875, 0.91015625, 1.1484375, 1.38671875, 1.625, 1.86328125, 2.1015625, 2.33984375, 2.578125, 2.81640625, 3.0546875, 3.29296875, 3.53125, 3.76953125, 4.0078125, 4.24609375, 4.484375, 4.72265625, 4.9609375, 5.19921875, 5.4375, 5.67578125, 5.9140625, 6.15234375, 6.390625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 10.0, 19.0, 25.0, 34.0, 43.0, 89.0, 120.0, 182.0, 311.0, 1009.0, 12094.0, 3055910.0, 1116114.0, 6660.0, 766.0, 318.0, 181.0, 127.0, 80.0, 52.0, 45.0, 27.0, 20.0, 13.0, 8.0, 2.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.8125, -33.5654296875, -32.318359375, -31.0712890625, -29.82421875, -28.5771484375, -27.330078125, -26.0830078125, -24.8359375, -23.5888671875, -22.341796875, -21.0947265625, -19.84765625, -18.6005859375, -17.353515625, -16.1064453125, -14.859375, -13.6123046875, -12.365234375, -11.1181640625, -9.87109375, -8.6240234375, -7.376953125, -6.1298828125, -4.8828125, -3.6357421875, -2.388671875, -1.1416015625, 0.10546875, 1.3525390625, 2.599609375, 3.8466796875, 5.09375, 6.3408203125, 7.587890625, 8.8349609375, 10.08203125, 11.3291015625, 12.576171875, 13.8232421875, 15.0703125, 16.3173828125, 17.564453125, 18.8115234375, 20.05859375, 21.3056640625, 22.552734375, 23.7998046875, 25.046875, 26.2939453125, 27.541015625, 28.7880859375, 30.03515625, 31.2822265625, 32.529296875, 33.7763671875, 35.0234375, 36.2705078125, 37.517578125, 38.7646484375, 40.01171875, 41.2587890625, 42.505859375, 43.7529296875, 45.0]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 10.0, 20.0, 34.0, 42.0, 58.0, 84.0, 100.0, 110.0, 119.0, 106.0, 80.0, 85.0, 55.0, 51.0, 22.0, 14.0, 11.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.600330352783203, -20.448476791381836, -19.29662322998047, -18.144771575927734, -16.992918014526367, -15.841064453125, -14.689210891723633, -13.537358283996582, -12.385504722595215, -11.233651161193848, -10.081798553466797, -8.92994499206543, -7.778091907501221, -6.626238822937012, -5.4743852615356445, -4.322532653808594, -3.1706790924072266, -2.0188260078430176, -0.8669726848602295, 0.2848806381225586, 1.4367337226867676, 2.5885868072509766, 3.7404403686523438, 4.8922929763793945, 6.044146537780762, 7.195999622344971, 8.34785270690918, 9.499706268310547, 10.651559829711914, 11.803412437438965, 12.955265998840332, 14.107118606567383, 15.25897216796875, 16.410825729370117, 17.562679290771484, 18.71453094482422, 19.866384506225586, 21.018238067626953, 22.17009162902832, 23.321945190429688, 24.473796844482422, 25.62565040588379, 26.777503967285156, 27.92935562133789, 29.081209182739258, 30.233062744140625, 31.384916305541992, 32.53676986694336, 33.688621520996094, 34.84047317504883, 35.99232864379883, 37.14418029785156, 38.29603576660156, 39.4478874206543, 40.59973907470703, 41.75159454345703, 42.90345001220703, 44.055301666259766, 45.207157135009766, 46.3590087890625, 47.5108642578125, 48.662715911865234, 49.81456756591797, 50.96642303466797, 52.1182746887207]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 2.0, 5.0, 5.0, 10.0, 14.0, 8.0, 14.0, 14.0, 21.0, 13.0, 22.0, 19.0, 24.0, 30.0, 43.0, 40.0, 35.0, 45.0, 54.0, 49.0, 41.0, 43.0, 40.0, 34.0, 32.0, 23.0, 43.0, 37.0, 32.0, 30.0, 23.0, 17.0, 18.0, 16.0, 16.0, 18.0, 9.0, 16.0, 14.0, 4.0, 10.0, 8.0, 2.0, 3.0, 6.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.611778259277344, -21.919265747070312, -21.22675323486328, -20.53424072265625, -19.841726303100586, -19.149213790893555, -18.456701278686523, -17.764188766479492, -17.071674346923828, -16.379161834716797, -15.68664836883545, -14.994135856628418, -14.30162239074707, -13.609109878540039, -12.916597366333008, -12.224084854125977, -11.531572341918945, -10.839059829711914, -10.146546363830566, -9.454033851623535, -8.761520385742188, -8.069007873535156, -7.376495361328125, -6.6839823722839355, -5.991469383239746, -5.298956394195557, -4.606443405151367, -3.913930892944336, -3.2214179039001465, -2.528904914855957, -1.8363924026489258, -1.1438794136047363, -0.45136451721191406, 0.24114835262298584, 0.9336612224578857, 1.626173973083496, 2.3186869621276855, 3.011199951171875, 3.7037124633789062, 4.396225452423096, 5.088738441467285, 5.781251430511475, 6.473764419555664, 7.166276931762695, 7.858789920806885, 8.551302909851074, 9.243815422058105, 9.936328887939453, 10.628841400146484, 11.321353912353516, 12.013867378234863, 12.706379890441895, 13.398893356323242, 14.091405868530273, 14.783918380737305, 15.476430892944336, 16.1689453125, 16.86145782470703, 17.553970336914062, 18.246482849121094, 18.938997268676758, 19.63150978088379, 20.32402229309082, 21.01653480529785, 21.709047317504883]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 6.0, 6.0, 9.0, 12.0, 9.0, 4.0, 12.0, 21.0, 17.0, 18.0, 38.0, 32.0, 44.0, 59.0, 54.0, 34.0, 47.0, 56.0, 54.0, 55.0, 47.0, 50.0, 44.0, 56.0, 34.0, 33.0, 16.0, 35.0, 24.0, 28.0, 11.0, 18.0, 2.0, 9.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.36328125, -4.2288818359375, -4.094482421875, -3.9600830078125, -3.82568359375, -3.6912841796875, -3.556884765625, -3.4224853515625, -3.2880859375, -3.1536865234375, -3.019287109375, -2.8848876953125, -2.75048828125, -2.6160888671875, -2.481689453125, -2.3472900390625, -2.212890625, -2.0784912109375, -1.944091796875, -1.8096923828125, -1.67529296875, -1.5408935546875, -1.406494140625, -1.2720947265625, -1.1376953125, -1.0032958984375, -0.868896484375, -0.7344970703125, -0.60009765625, -0.4656982421875, -0.331298828125, -0.1968994140625, -0.0625, 0.0718994140625, 0.206298828125, 0.3406982421875, 0.47509765625, 0.6094970703125, 0.743896484375, 0.8782958984375, 1.0126953125, 1.1470947265625, 1.281494140625, 1.4158935546875, 1.55029296875, 1.6846923828125, 1.819091796875, 1.9534912109375, 2.087890625, 2.2222900390625, 2.356689453125, 2.4910888671875, 2.62548828125, 2.7598876953125, 2.894287109375, 3.0286865234375, 3.1630859375, 3.2974853515625, 3.431884765625, 3.5662841796875, 3.70068359375, 3.8350830078125, 3.969482421875, 4.1038818359375, 4.23828125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 4.0, 5.0, 10.0, 13.0, 15.0, 25.0, 47.0, 61.0, 92.0, 145.0, 256.0, 381.0, 634.0, 1019.0, 1747.0, 2906.0, 5014.0, 8693.0, 15161.0, 27513.0, 53400.0, 107975.0, 232777.0, 300490.0, 141963.0, 68574.0, 35019.0, 19032.0, 10617.0, 6084.0, 3500.0, 2130.0, 1254.0, 760.0, 475.0, 265.0, 168.0, 108.0, 81.0, 46.0, 38.0, 17.0, 11.0, 9.0, 11.0, 9.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.030792236328125, -0.02986431121826172, -0.028936386108398438, -0.028008460998535156, -0.027080535888671875, -0.026152610778808594, -0.025224685668945312, -0.02429676055908203, -0.02336883544921875, -0.02244091033935547, -0.021512985229492188, -0.020585060119628906, -0.019657135009765625, -0.018729209899902344, -0.017801284790039062, -0.01687335968017578, -0.0159454345703125, -0.015017509460449219, -0.014089584350585938, -0.013161659240722656, -0.012233734130859375, -0.011305809020996094, -0.010377883911132812, -0.009449958801269531, -0.00852203369140625, -0.007594108581542969, -0.0066661834716796875, -0.005738258361816406, -0.004810333251953125, -0.0038824081420898438, -0.0029544830322265625, -0.0020265579223632812, -0.0010986328125, -0.00017070770263671875, 0.0007572174072265625, 0.0016851425170898438, 0.002613067626953125, 0.0035409927368164062, 0.0044689178466796875, 0.005396842956542969, 0.00632476806640625, 0.007252693176269531, 0.008180618286132812, 0.009108543395996094, 0.010036468505859375, 0.010964393615722656, 0.011892318725585938, 0.012820243835449219, 0.0137481689453125, 0.014676094055175781, 0.015604019165039062, 0.016531944274902344, 0.017459869384765625, 0.018387794494628906, 0.019315719604492188, 0.02024364471435547, 0.02117156982421875, 0.02209949493408203, 0.023027420043945312, 0.023955345153808594, 0.024883270263671875, 0.025811195373535156, 0.026739120483398438, 0.02766704559326172, 0.028594970703125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 5.0, 5.0, 7.0, 8.0, 15.0, 12.0, 10.0, 17.0, 20.0, 25.0, 40.0, 21.0, 29.0, 27.0, 32.0, 43.0, 55.0, 47.0, 46.0, 44.0, 1064.0, 33.0, 33.0, 33.0, 50.0, 23.0, 36.0, 23.0, 24.0, 20.0, 29.0, 19.0, 22.0, 15.0, 16.0, 15.0, 15.0, 4.0, 5.0, 6.0, 4.0, 8.0, 3.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.640625, -2.55615234375, -2.4716796875, -2.38720703125, -2.302734375, -2.21826171875, -2.1337890625, -2.04931640625, -1.96484375, -1.88037109375, -1.7958984375, -1.71142578125, -1.626953125, -1.54248046875, -1.4580078125, -1.37353515625, -1.2890625, -1.20458984375, -1.1201171875, -1.03564453125, -0.951171875, -0.86669921875, -0.7822265625, -0.69775390625, -0.61328125, -0.52880859375, -0.4443359375, -0.35986328125, -0.275390625, -0.19091796875, -0.1064453125, -0.02197265625, 0.0625, 0.14697265625, 0.2314453125, 0.31591796875, 0.400390625, 0.48486328125, 0.5693359375, 0.65380859375, 0.73828125, 0.82275390625, 0.9072265625, 0.99169921875, 1.076171875, 1.16064453125, 1.2451171875, 1.32958984375, 1.4140625, 1.49853515625, 1.5830078125, 1.66748046875, 1.751953125, 1.83642578125, 1.9208984375, 2.00537109375, 2.08984375, 2.17431640625, 2.2587890625, 2.34326171875, 2.427734375, 2.51220703125, 2.5966796875, 2.68115234375, 2.765625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 7.0, 12.0, 22.0, 33.0, 52.0, 71.0, 80.0, 124.0, 182.0, 257.0, 323.0, 549.0, 740.0, 1066.0, 1597.0, 2470.0, 3667.0, 5412.0, 8015.0, 12240.0, 18519.0, 28481.0, 44568.0, 71075.0, 117896.0, 189888.0, 1247939.0, 127852.0, 77102.0, 47617.0, 30507.0, 19670.0, 12877.0, 8578.0, 5669.0, 3934.0, 2529.0, 1757.0, 1150.0, 821.0, 550.0, 367.0, 274.0, 196.0, 118.0, 85.0, 56.0, 44.0, 37.0, 27.0, 16.0, 10.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0], "bins": [-0.0096282958984375, -0.009328126907348633, -0.009027957916259766, -0.008727788925170898, -0.008427619934082031, -0.008127450942993164, -0.007827281951904297, -0.00752711296081543, -0.0072269439697265625, -0.006926774978637695, -0.006626605987548828, -0.006326436996459961, -0.006026268005371094, -0.0057260990142822266, -0.005425930023193359, -0.005125761032104492, -0.004825592041015625, -0.004525423049926758, -0.004225254058837891, -0.0039250850677490234, -0.0036249160766601562, -0.003324747085571289, -0.003024578094482422, -0.0027244091033935547, -0.0024242401123046875, -0.0021240711212158203, -0.0018239021301269531, -0.001523733139038086, -0.0012235641479492188, -0.0009233951568603516, -0.0006232261657714844, -0.0003230571746826172, -2.288818359375e-05, 0.0002772808074951172, 0.0005774497985839844, 0.0008776187896728516, 0.0011777877807617188, 0.001477956771850586, 0.0017781257629394531, 0.0020782947540283203, 0.0023784637451171875, 0.0026786327362060547, 0.002978801727294922, 0.003278970718383789, 0.0035791397094726562, 0.0038793087005615234, 0.004179477691650391, 0.004479646682739258, 0.004779815673828125, 0.005079984664916992, 0.005380153656005859, 0.0056803226470947266, 0.005980491638183594, 0.006280660629272461, 0.006580829620361328, 0.006880998611450195, 0.0071811676025390625, 0.00748133659362793, 0.007781505584716797, 0.008081674575805664, 0.008381843566894531, 0.008682012557983398, 0.008982181549072266, 0.009282350540161133, 0.00958251953125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 6.0, 2.0, 6.0, 0.0, 6.0, 7.0, 12.0, 0.0, 19.0, 42.0, 46.0, 0.0, 77.0, 144.0, 245.0, 0.0, 136.0, 98.0, 51.0, 0.0, 41.0, 15.0, 13.0, 0.0, 10.0, 4.0, 4.0, 0.0, 5.0, 9.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5497207641601562e-06, -1.5050172805786133e-06, -1.4603137969970703e-06, -1.4156103134155273e-06, -1.3709068298339844e-06, -1.3262033462524414e-06, -1.2814998626708984e-06, -1.2367963790893555e-06, -1.1920928955078125e-06, -1.1473894119262695e-06, -1.1026859283447266e-06, -1.0579824447631836e-06, -1.0132789611816406e-06, -9.685754776000977e-07, -9.238719940185547e-07, -8.791685104370117e-07, -8.344650268554688e-07, -7.897615432739258e-07, -7.450580596923828e-07, -7.003545761108398e-07, -6.556510925292969e-07, -6.109476089477539e-07, -5.662441253662109e-07, -5.21540641784668e-07, -4.76837158203125e-07, -4.3213367462158203e-07, -3.8743019104003906e-07, -3.427267074584961e-07, -2.980232238769531e-07, -2.5331974029541016e-07, -2.086162567138672e-07, -1.6391277313232422e-07, -1.1920928955078125e-07, -7.450580596923828e-08, -2.9802322387695312e-08, 1.4901161193847656e-08, 5.960464477539063e-08, 1.043081283569336e-07, 1.4901161193847656e-07, 1.9371509552001953e-07, 2.384185791015625e-07, 2.8312206268310547e-07, 3.2782554626464844e-07, 3.725290298461914e-07, 4.172325134277344e-07, 4.6193599700927734e-07, 5.066394805908203e-07, 5.513429641723633e-07, 5.960464477539062e-07, 6.407499313354492e-07, 6.854534149169922e-07, 7.301568984985352e-07, 7.748603820800781e-07, 8.195638656616211e-07, 8.642673492431641e-07, 9.08970832824707e-07, 9.5367431640625e-07, 9.98377799987793e-07, 1.043081283569336e-06, 1.087784767150879e-06, 1.1324882507324219e-06, 1.1771917343139648e-06, 1.2218952178955078e-06, 1.2665987014770508e-06, 1.3113021850585938e-06]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 8.0, 4.0, 3.0, 6.0, 3.0, 12.0, 10.0, 16.0, 32.0, 60.0, 82.0, 218.0, 1043.0, 707537.0, 338427.0, 681.0, 164.0, 95.0, 55.0, 30.0, 21.0, 9.0, 7.0, 5.0, 10.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.9265880584716797e-05, -2.828892320394516e-05, -2.7311965823173523e-05, -2.6335008442401886e-05, -2.535805106163025e-05, -2.4381093680858612e-05, -2.3404136300086975e-05, -2.2427178919315338e-05, -2.14502215385437e-05, -2.0473264157772064e-05, -1.9496306777000427e-05, -1.851934939622879e-05, -1.7542392015457153e-05, -1.6565434634685516e-05, -1.558847725391388e-05, -1.4611519873142242e-05, -1.3634562492370605e-05, -1.2657605111598969e-05, -1.1680647730827332e-05, -1.0703690350055695e-05, -9.726732969284058e-06, -8.74977558851242e-06, -7.772818207740784e-06, -6.795860826969147e-06, -5.81890344619751e-06, -4.841946065425873e-06, -3.864988684654236e-06, -2.888031303882599e-06, -1.911073923110962e-06, -9.34116542339325e-07, 4.284083843231201e-08, 1.019798219203949e-06, 1.996755599975586e-06, 2.973712980747223e-06, 3.95067036151886e-06, 4.927627742290497e-06, 5.904585123062134e-06, 6.881542503833771e-06, 7.858499884605408e-06, 8.835457265377045e-06, 9.812414646148682e-06, 1.0789372026920319e-05, 1.1766329407691956e-05, 1.2743286788463593e-05, 1.372024416923523e-05, 1.4697201550006866e-05, 1.5674158930778503e-05, 1.665111631155014e-05, 1.7628073692321777e-05, 1.8605031073093414e-05, 1.958198845386505e-05, 2.0558945834636688e-05, 2.1535903215408325e-05, 2.2512860596179962e-05, 2.34898179769516e-05, 2.4466775357723236e-05, 2.5443732738494873e-05, 2.642069011926651e-05, 2.7397647500038147e-05, 2.8374604880809784e-05, 2.935156226158142e-05, 3.0328519642353058e-05, 3.1305477023124695e-05, 3.228243440389633e-05, 3.325939178466797e-05]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 12.0, 36.0, 149.0, 381.0, 290.0, 113.0, 31.0, 2.0, 2.0, 1.0, 4.0], "bins": [-4.538730536296498e-06, -4.45892055722652e-06, -4.379110578156542e-06, -4.299300144339213e-06, -4.219490165269235e-06, -4.139680186199257e-06, -4.059870207129279e-06, -3.980060228059301e-06, -3.900249794241972e-06, -3.820439815171994e-06, -3.740629608728341e-06, -3.660819629658363e-06, -3.5810094232147094e-06, -3.5011994441447314e-06, -3.4213894650747534e-06, -3.3415794860047754e-06, -3.2617695069347974e-06, -3.1819595278648194e-06, -3.102149321421166e-06, -3.022339342351188e-06, -2.9425291359075345e-06, -2.8627191568375565e-06, -2.7829091777675785e-06, -2.7030991986976005e-06, -2.623288992253947e-06, -2.543479013183969e-06, -2.4636688067403156e-06, -2.3838588276703376e-06, -2.3040488486003596e-06, -2.224238642156706e-06, -2.144428663086728e-06, -2.0646184566430748e-06, -1.9848084775730968e-06, -1.904998384816281e-06, -1.8251882920594653e-06, -1.7453783129894873e-06, -1.6655682202326716e-06, -1.5857581274758559e-06, -1.5059481484058779e-06, -1.4261380556490622e-06, -1.3463279628922464e-06, -1.2665178701354307e-06, -1.186707777378615e-06, -1.106897798308637e-06, -1.0270877055518213e-06, -9.472776127950056e-07, -8.674675768816087e-07, -7.876575409682118e-07, -7.07847505054815e-07, -6.280374691414181e-07, -5.482273763846024e-07, -4.684173120494961e-07, -3.886072477143898e-07, -3.087971833792835e-07, -2.2898711904417723e-07, -1.4917708313078037e-07, -6.936699037396465e-08, 1.0443073961141636e-08, 9.025313829624793e-08, 1.7006320263135422e-07, 2.498732669664605e-07, 3.296833313015668e-07, 4.094933956366731e-07, 4.893034315500699e-07, 5.691135243068857e-07]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 0.0, 65.0, 0.0, 0.0, 112.0, 0.0, 0.0, 0.0, 167.0, 0.0, 0.0, 0.0, 221.0, 0.0, 0.0, 0.0, 185.0, 0.0, 0.0, 132.0, 0.0, 0.0, 0.0, 52.0, 0.0, 0.0, 0.0, 34.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.172325134277344e-07, -4.0140002965927124e-07, -3.855675458908081e-07, -3.6973506212234497e-07, -3.5390257835388184e-07, -3.380700945854187e-07, -3.2223761081695557e-07, -3.0640512704849243e-07, -2.905726432800293e-07, -2.7474015951156616e-07, -2.5890767574310303e-07, -2.430751919746399e-07, -2.2724270820617676e-07, -2.1141022443771362e-07, -1.955777406692505e-07, -1.7974525690078735e-07, -1.6391277313232422e-07, -1.4808028936386108e-07, -1.3224780559539795e-07, -1.1641532182693481e-07, -1.0058283805847168e-07, -8.475035429000854e-08, -6.891787052154541e-08, -5.3085386753082275e-08, -3.725290298461914e-08, -2.1420419216156006e-08, -5.587935447692871e-09, 1.0244548320770264e-08, 2.60770320892334e-08, 4.190951585769653e-08, 5.774199962615967e-08, 7.35744833946228e-08, 8.940696716308594e-08, 1.0523945093154907e-07, 1.210719347000122e-07, 1.3690441846847534e-07, 1.5273690223693848e-07, 1.685693860054016e-07, 1.8440186977386475e-07, 2.0023435354232788e-07, 2.1606683731079102e-07, 2.3189932107925415e-07, 2.477318048477173e-07, 2.635642886161804e-07, 2.7939677238464355e-07, 2.952292561531067e-07, 3.110617399215698e-07, 3.2689422369003296e-07, 3.427267074584961e-07, 3.5855919122695923e-07, 3.7439167499542236e-07, 3.902241587638855e-07, 4.0605664253234863e-07, 4.2188912630081177e-07, 4.377216100692749e-07, 4.5355409383773804e-07, 4.6938657760620117e-07, 4.852190613746643e-07, 5.010515451431274e-07, 5.168840289115906e-07, 5.327165126800537e-07, 5.485489964485168e-07, 5.6438148021698e-07, 5.802139639854431e-07, 5.960464477539062e-07]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 6.0, 6.0, 9.0, 12.0, 9.0, 4.0, 12.0, 21.0, 17.0, 18.0, 38.0, 32.0, 44.0, 59.0, 54.0, 34.0, 47.0, 56.0, 54.0, 55.0, 47.0, 50.0, 44.0, 56.0, 34.0, 33.0, 16.0, 35.0, 24.0, 28.0, 11.0, 18.0, 2.0, 9.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.36328125, -4.2288818359375, -4.094482421875, -3.9600830078125, -3.82568359375, -3.6912841796875, -3.556884765625, -3.4224853515625, -3.2880859375, -3.1536865234375, -3.019287109375, -2.8848876953125, -2.75048828125, -2.6160888671875, -2.481689453125, -2.3472900390625, -2.212890625, -2.0784912109375, -1.944091796875, -1.8096923828125, -1.67529296875, -1.5408935546875, -1.406494140625, -1.2720947265625, -1.1376953125, -1.0032958984375, -0.868896484375, -0.7344970703125, -0.60009765625, -0.4656982421875, -0.331298828125, -0.1968994140625, -0.0625, 0.0718994140625, 0.206298828125, 0.3406982421875, 0.47509765625, 0.6094970703125, 0.743896484375, 0.8782958984375, 1.0126953125, 1.1470947265625, 1.281494140625, 1.4158935546875, 1.55029296875, 1.6846923828125, 1.819091796875, 1.9534912109375, 2.087890625, 2.2222900390625, 2.356689453125, 2.4910888671875, 2.62548828125, 2.7598876953125, 2.894287109375, 3.0286865234375, 3.1630859375, 3.2974853515625, 3.431884765625, 3.5662841796875, 3.70068359375, 3.8350830078125, 3.969482421875, 4.1038818359375, 4.23828125]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 1.0, 6.0, 6.0, 10.0, 12.0, 10.0, 21.0, 31.0, 31.0, 52.0, 51.0, 83.0, 127.0, 184.0, 258.0, 387.0, 610.0, 867.0, 1316.0, 2048.0, 3171.0, 5078.0, 8454.0, 14790.0, 27272.0, 56413.0, 165846.0, 514303.0, 136205.0, 50845.0, 24956.0, 13624.0, 8061.0, 4661.0, 3053.0, 1960.0, 1203.0, 780.0, 550.0, 367.0, 254.0, 174.0, 127.0, 95.0, 50.0, 46.0, 34.0, 24.0, 22.0, 7.0, 10.0, 3.0, 5.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.9921875, -3.86517333984375, -3.7381591796875, -3.61114501953125, -3.484130859375, -3.35711669921875, -3.2301025390625, -3.10308837890625, -2.97607421875, -2.84906005859375, -2.7220458984375, -2.59503173828125, -2.468017578125, -2.34100341796875, -2.2139892578125, -2.08697509765625, -1.9599609375, -1.83294677734375, -1.7059326171875, -1.57891845703125, -1.451904296875, -1.32489013671875, -1.1978759765625, -1.07086181640625, -0.94384765625, -0.81683349609375, -0.6898193359375, -0.56280517578125, -0.435791015625, -0.30877685546875, -0.1817626953125, -0.05474853515625, 0.072265625, 0.19927978515625, 0.3262939453125, 0.45330810546875, 0.580322265625, 0.70733642578125, 0.8343505859375, 0.96136474609375, 1.08837890625, 1.21539306640625, 1.3424072265625, 1.46942138671875, 1.596435546875, 1.72344970703125, 1.8504638671875, 1.97747802734375, 2.1044921875, 2.23150634765625, 2.3585205078125, 2.48553466796875, 2.612548828125, 2.73956298828125, 2.8665771484375, 2.99359130859375, 3.12060546875, 3.24761962890625, 3.3746337890625, 3.50164794921875, 3.628662109375, 3.75567626953125, 3.8826904296875, 4.00970458984375, 4.13671875]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 5.0, 6.0, 7.0, 7.0, 8.0, 10.0, 15.0, 17.0, 16.0, 27.0, 28.0, 19.0, 35.0, 31.0, 29.0, 58.0, 64.0, 68.0, 74.0, 163.0, 1544.0, 266.0, 101.0, 75.0, 42.0, 46.0, 24.0, 36.0, 29.0, 27.0, 17.0, 17.0, 19.0, 16.0, 24.0, 12.0, 11.0, 11.0, 5.0, 7.0, 9.0, 5.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-10.765625, -10.4468994140625, -10.128173828125, -9.8094482421875, -9.49072265625, -9.1719970703125, -8.853271484375, -8.5345458984375, -8.2158203125, -7.8970947265625, -7.578369140625, -7.2596435546875, -6.94091796875, -6.6221923828125, -6.303466796875, -5.9847412109375, -5.666015625, -5.3472900390625, -5.028564453125, -4.7098388671875, -4.39111328125, -4.0723876953125, -3.753662109375, -3.4349365234375, -3.1162109375, -2.7974853515625, -2.478759765625, -2.1600341796875, -1.84130859375, -1.5225830078125, -1.203857421875, -0.8851318359375, -0.56640625, -0.2476806640625, 0.071044921875, 0.3897705078125, 0.70849609375, 1.0272216796875, 1.345947265625, 1.6646728515625, 1.9833984375, 2.3021240234375, 2.620849609375, 2.9395751953125, 3.25830078125, 3.5770263671875, 3.895751953125, 4.2144775390625, 4.533203125, 4.8519287109375, 5.170654296875, 5.4893798828125, 5.80810546875, 6.1268310546875, 6.445556640625, 6.7642822265625, 7.0830078125, 7.4017333984375, 7.720458984375, 8.0391845703125, 8.35791015625, 8.6766357421875, 8.995361328125, 9.3140869140625, 9.6328125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 3.0, 3.0, 7.0, 5.0, 8.0, 10.0, 9.0, 20.0, 20.0, 24.0, 26.0, 27.0, 30.0, 33.0, 62.0, 67.0, 108.0, 151.0, 333.0, 733.0, 2821.0, 15735.0, 189543.0, 2809978.0, 110939.0, 11262.0, 2174.0, 665.0, 287.0, 148.0, 114.0, 78.0, 54.0, 58.0, 34.0, 26.0, 29.0, 16.0, 15.0, 6.0, 8.0, 10.0, 4.0, 2.0, 7.0, 5.0, 1.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-15.28125, -14.77880859375, -14.2763671875, -13.77392578125, -13.271484375, -12.76904296875, -12.2666015625, -11.76416015625, -11.26171875, -10.75927734375, -10.2568359375, -9.75439453125, -9.251953125, -8.74951171875, -8.2470703125, -7.74462890625, -7.2421875, -6.73974609375, -6.2373046875, -5.73486328125, -5.232421875, -4.72998046875, -4.2275390625, -3.72509765625, -3.22265625, -2.72021484375, -2.2177734375, -1.71533203125, -1.212890625, -0.71044921875, -0.2080078125, 0.29443359375, 0.796875, 1.29931640625, 1.8017578125, 2.30419921875, 2.806640625, 3.30908203125, 3.8115234375, 4.31396484375, 4.81640625, 5.31884765625, 5.8212890625, 6.32373046875, 6.826171875, 7.32861328125, 7.8310546875, 8.33349609375, 8.8359375, 9.33837890625, 9.8408203125, 10.34326171875, 10.845703125, 11.34814453125, 11.8505859375, 12.35302734375, 12.85546875, 13.35791015625, 13.8603515625, 14.36279296875, 14.865234375, 15.36767578125, 15.8701171875, 16.37255859375, 16.875]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.0, 133.0, 370.0, 333.0, 123.0, 19.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.88629913330078, -65.94255828857422, -63.99882125854492, -62.05508041381836, -60.11134338378906, -58.1676025390625, -56.22386169433594, -54.280120849609375, -52.33638381958008, -50.392642974853516, -48.44890594482422, -46.505165100097656, -44.561424255371094, -42.6176872253418, -40.673946380615234, -38.73020935058594, -36.786468505859375, -34.84272766113281, -32.898990631103516, -30.955249786376953, -29.011510848999023, -27.067771911621094, -25.12403106689453, -23.1802921295166, -21.236553192138672, -19.292814254760742, -17.349075317382812, -15.40533447265625, -13.46159553527832, -11.51785659790039, -9.574116706848145, -7.630376815795898, -5.686641693115234, -3.7429022789001465, -1.7991628646850586, 0.1445765495300293, 2.088315963745117, 4.032054901123047, 5.975794792175293, 7.919534683227539, 9.863273620605469, 11.807012557983398, 13.750752449035645, 15.69449234008789, 17.63823127746582, 19.58197021484375, 21.525711059570312, 23.469449996948242, 25.413188934326172, 27.3569278717041, 29.30066680908203, 31.244407653808594, 33.188148498535156, 35.13188552856445, 37.075626373291016, 39.01936340332031, 40.963104248046875, 42.90684509277344, 44.850582122802734, 46.7943229675293, 48.738059997558594, 50.681800842285156, 52.62554168701172, 54.56928253173828, 56.51301956176758]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 8.0, 3.0, 3.0, 11.0, 4.0, 7.0, 8.0, 8.0, 7.0, 25.0, 16.0, 25.0, 29.0, 34.0, 35.0, 34.0, 33.0, 31.0, 33.0, 43.0, 40.0, 49.0, 57.0, 49.0, 53.0, 40.0, 36.0, 26.0, 36.0, 28.0, 27.0, 27.0, 28.0, 19.0, 19.0, 17.0, 11.0, 19.0, 9.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.740440368652344, -33.620113372802734, -32.499786376953125, -31.379457473754883, -30.25912857055664, -29.13880157470703, -28.018474578857422, -26.898147583007812, -25.77781867980957, -24.65749168395996, -23.53716278076172, -22.41683578491211, -21.2965087890625, -20.176179885864258, -19.05585289001465, -17.935523986816406, -16.815196990966797, -15.694869041442871, -14.574541091918945, -13.454214096069336, -12.33388614654541, -11.213558197021484, -10.093231201171875, -8.97290325164795, -7.852575302124023, -6.732247352600098, -5.61191987991333, -4.4915924072265625, -3.3712644577026367, -2.250936508178711, -1.1306090354919434, -0.010281562805175781, 1.1100425720214844, 2.230370283126831, 3.3506979942321777, 4.471025466918945, 5.591353416442871, 6.711681365966797, 7.8320088386535645, 8.952336311340332, 10.072664260864258, 11.192992210388184, 12.31332015991211, 13.433647155761719, 14.553975105285645, 15.67430305480957, 16.79463005065918, 17.914958953857422, 19.03528594970703, 20.15561294555664, 21.275941848754883, 22.396268844604492, 23.516597747802734, 24.636924743652344, 25.757251739501953, 26.877578735351562, 27.997907638549805, 29.118234634399414, 30.238563537597656, 31.358890533447266, 32.479217529296875, 33.59954833984375, 34.71987533569336, 35.84020233154297, 36.96052932739258]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 7.0, 9.0, 10.0, 7.0, 14.0, 8.0, 16.0, 17.0, 16.0, 34.0, 36.0, 39.0, 48.0, 49.0, 34.0, 48.0, 46.0, 39.0, 50.0, 51.0, 56.0, 41.0, 36.0, 35.0, 39.0, 34.0, 30.0, 28.0, 28.0, 23.0, 13.0, 18.0, 11.0, 10.0, 8.0, 3.0, 5.0, 0.0, 0.0, 8.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.22265625, -4.095611572265625, -3.96856689453125, -3.841522216796875, -3.7144775390625, -3.587432861328125, -3.46038818359375, -3.333343505859375, -3.206298828125, -3.079254150390625, -2.95220947265625, -2.825164794921875, -2.6981201171875, -2.571075439453125, -2.44403076171875, -2.316986083984375, -2.18994140625, -2.062896728515625, -1.93585205078125, -1.808807373046875, -1.6817626953125, -1.554718017578125, -1.42767333984375, -1.300628662109375, -1.173583984375, -1.046539306640625, -0.91949462890625, -0.792449951171875, -0.6654052734375, -0.538360595703125, -0.41131591796875, -0.284271240234375, -0.1572265625, -0.030181884765625, 0.09686279296875, 0.223907470703125, 0.3509521484375, 0.477996826171875, 0.60504150390625, 0.732086181640625, 0.859130859375, 0.986175537109375, 1.11322021484375, 1.240264892578125, 1.3673095703125, 1.494354248046875, 1.62139892578125, 1.748443603515625, 1.87548828125, 2.002532958984375, 2.12957763671875, 2.256622314453125, 2.3836669921875, 2.510711669921875, 2.63775634765625, 2.764801025390625, 2.891845703125, 3.018890380859375, 3.14593505859375, 3.272979736328125, 3.4000244140625, 3.527069091796875, 3.65411376953125, 3.781158447265625, 3.908203125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 4.0, 8.0, 10.0, 17.0, 33.0, 47.0, 70.0, 86.0, 138.0, 260.0, 394.0, 548.0, 827.0, 1340.0, 2279.0, 3525.0, 6110.0, 10495.0, 19181.0, 37373.0, 79999.0, 188504.0, 475043.0, 1105554.0, 1253570.0, 585309.0, 231622.0, 96429.0, 44179.0, 22393.0, 11834.0, 6591.0, 3919.0, 2383.0, 1497.0, 968.0, 602.0, 404.0, 253.0, 169.0, 112.0, 70.0, 43.0, 40.0, 20.0, 13.0, 6.0, 5.0, 3.0, 1.0, 4.0, 1.0], "bins": [-4.3828125, -4.261444091796875, -4.14007568359375, -4.018707275390625, -3.8973388671875, -3.775970458984375, -3.65460205078125, -3.533233642578125, -3.411865234375, -3.290496826171875, -3.16912841796875, -3.047760009765625, -2.9263916015625, -2.805023193359375, -2.68365478515625, -2.562286376953125, -2.44091796875, -2.319549560546875, -2.19818115234375, -2.076812744140625, -1.9554443359375, -1.834075927734375, -1.71270751953125, -1.591339111328125, -1.469970703125, -1.348602294921875, -1.22723388671875, -1.105865478515625, -0.9844970703125, -0.863128662109375, -0.74176025390625, -0.620391845703125, -0.4990234375, -0.377655029296875, -0.25628662109375, -0.134918212890625, -0.0135498046875, 0.107818603515625, 0.22918701171875, 0.350555419921875, 0.471923828125, 0.593292236328125, 0.71466064453125, 0.836029052734375, 0.9573974609375, 1.078765869140625, 1.20013427734375, 1.321502685546875, 1.44287109375, 1.564239501953125, 1.68560791015625, 1.806976318359375, 1.9283447265625, 2.049713134765625, 2.17108154296875, 2.292449951171875, 2.413818359375, 2.535186767578125, 2.65655517578125, 2.777923583984375, 2.8992919921875, 3.020660400390625, 3.14202880859375, 3.263397216796875, 3.384765625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 1.0, 8.0, 6.0, 10.0, 13.0, 19.0, 28.0, 19.0, 47.0, 41.0, 64.0, 81.0, 90.0, 120.0, 178.0, 222.0, 264.0, 357.0, 374.0, 441.0, 329.0, 298.0, 242.0, 188.0, 131.0, 112.0, 85.0, 69.0, 54.0, 45.0, 25.0, 26.0, 14.0, 13.0, 14.0, 12.0, 9.0, 8.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.61328125, -5.4439697265625, -5.274658203125, -5.1053466796875, -4.93603515625, -4.7667236328125, -4.597412109375, -4.4281005859375, -4.2587890625, -4.0894775390625, -3.920166015625, -3.7508544921875, -3.58154296875, -3.4122314453125, -3.242919921875, -3.0736083984375, -2.904296875, -2.7349853515625, -2.565673828125, -2.3963623046875, -2.22705078125, -2.0577392578125, -1.888427734375, -1.7191162109375, -1.5498046875, -1.3804931640625, -1.211181640625, -1.0418701171875, -0.87255859375, -0.7032470703125, -0.533935546875, -0.3646240234375, -0.1953125, -0.0260009765625, 0.143310546875, 0.3126220703125, 0.48193359375, 0.6512451171875, 0.820556640625, 0.9898681640625, 1.1591796875, 1.3284912109375, 1.497802734375, 1.6671142578125, 1.83642578125, 2.0057373046875, 2.175048828125, 2.3443603515625, 2.513671875, 2.6829833984375, 2.852294921875, 3.0216064453125, 3.19091796875, 3.3602294921875, 3.529541015625, 3.6988525390625, 3.8681640625, 4.0374755859375, 4.206787109375, 4.3760986328125, 4.54541015625, 4.7147216796875, 4.884033203125, 5.0533447265625, 5.22265625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 8.0, 6.0, 9.0, 7.0, 18.0, 21.0, 27.0, 35.0, 42.0, 67.0, 102.0, 134.0, 196.0, 321.0, 610.0, 1542.0, 6671.0, 69963.0, 2326284.0, 1724043.0, 55435.0, 5732.0, 1439.0, 590.0, 329.0, 191.0, 118.0, 83.0, 66.0, 41.0, 35.0, 23.0, 24.0, 17.0, 9.0, 7.0, 6.0, 7.0, 5.0, 5.0, 2.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.265625, -18.643310546875, -18.02099609375, -17.398681640625, -16.7763671875, -16.154052734375, -15.53173828125, -14.909423828125, -14.287109375, -13.664794921875, -13.04248046875, -12.420166015625, -11.7978515625, -11.175537109375, -10.55322265625, -9.930908203125, -9.30859375, -8.686279296875, -8.06396484375, -7.441650390625, -6.8193359375, -6.197021484375, -5.57470703125, -4.952392578125, -4.330078125, -3.707763671875, -3.08544921875, -2.463134765625, -1.8408203125, -1.218505859375, -0.59619140625, 0.026123046875, 0.6484375, 1.270751953125, 1.89306640625, 2.515380859375, 3.1376953125, 3.760009765625, 4.38232421875, 5.004638671875, 5.626953125, 6.249267578125, 6.87158203125, 7.493896484375, 8.1162109375, 8.738525390625, 9.36083984375, 9.983154296875, 10.60546875, 11.227783203125, 11.85009765625, 12.472412109375, 13.0947265625, 13.717041015625, 14.33935546875, 14.961669921875, 15.583984375, 16.206298828125, 16.82861328125, 17.450927734375, 18.0732421875, 18.695556640625, 19.31787109375, 19.940185546875, 20.5625]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 16.0, 78.0, 248.0, 331.0, 233.0, 88.0, 18.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-172.13938903808594, -168.85865783691406, -165.5779266357422, -162.2971954345703, -159.01646423339844, -155.73573303222656, -152.4550018310547, -149.1742706298828, -145.89353942871094, -142.61280822753906, -139.3320770263672, -136.0513458251953, -132.77061462402344, -129.48988342285156, -126.20915222167969, -122.92842102050781, -119.64768981933594, -116.36695861816406, -113.08622741699219, -109.80549621582031, -106.52476501464844, -103.24403381347656, -99.96330261230469, -96.68257141113281, -93.4018325805664, -90.12110137939453, -86.84037017822266, -83.55963897705078, -80.2789077758789, -76.99817657470703, -73.71744537353516, -70.43671417236328, -67.1559829711914, -63.87525177001953, -60.594520568847656, -57.31378936767578, -54.033058166503906, -50.75232696533203, -47.471595764160156, -44.19086456298828, -40.910133361816406, -37.62940216064453, -34.348670959472656, -31.06793975830078, -27.787208557128906, -24.5064754486084, -21.225744247436523, -17.94501304626465, -14.66427993774414, -11.383548736572266, -8.10281753540039, -4.822085380554199, -1.5413541793823242, 1.7393779754638672, 5.020109176635742, 8.300840377807617, 11.581571578979492, 14.862302780151367, 18.143033981323242, 21.42376708984375, 24.704498291015625, 27.9852294921875, 31.265960693359375, 34.54669189453125, 37.827423095703125]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 3.0, 9.0, 7.0, 17.0, 11.0, 15.0, 16.0, 22.0, 17.0, 15.0, 25.0, 23.0, 27.0, 32.0, 50.0, 41.0, 45.0, 32.0, 46.0, 50.0, 34.0, 40.0, 39.0, 36.0, 32.0, 28.0, 39.0, 35.0, 27.0, 23.0, 26.0, 20.0, 10.0, 20.0, 14.0, 13.0, 14.0, 12.0, 10.0, 7.0, 4.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.730224609375, -21.10227394104004, -20.474321365356445, -19.846370697021484, -19.21841812133789, -18.59046745300293, -17.962514877319336, -17.334564208984375, -16.70661163330078, -16.07866096496582, -15.450708389282227, -14.82275676727295, -14.194805145263672, -13.566854476928711, -12.938902854919434, -12.310951232910156, -11.683000564575195, -11.055048942565918, -10.42709732055664, -9.799145698547363, -9.171194076538086, -8.543243408203125, -7.915291786193848, -7.28734016418457, -6.659388542175293, -6.031436920166016, -5.403485298156738, -4.775534152984619, -4.147582530975342, -3.5196309089660645, -2.891679525375366, -2.263728141784668, -1.6357765197753906, -1.0078250169754028, -0.37987351417541504, 0.24807798862457275, 0.8760294914245605, 1.503981113433838, 2.131932497024536, 2.7598838806152344, 3.3878355026245117, 4.015787124633789, 4.643738746643066, 5.2716898918151855, 5.899641513824463, 6.52759313583374, 7.155544281005859, 7.783495903015137, 8.411447525024414, 9.039399147033691, 9.667350769042969, 10.295302391052246, 10.923254013061523, 11.551204681396484, 12.179156303405762, 12.807107925415039, 13.435059547424316, 14.063011169433594, 14.690962791442871, 15.318914413452148, 15.94686508178711, 16.574817657470703, 17.202768325805664, 17.830718994140625, 18.45867156982422]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 4.0, 3.0, 9.0, 8.0, 10.0, 9.0, 18.0, 15.0, 23.0, 9.0, 19.0, 27.0, 28.0, 34.0, 46.0, 36.0, 54.0, 45.0, 40.0, 43.0, 39.0, 49.0, 37.0, 46.0, 46.0, 41.0, 33.0, 37.0, 24.0, 24.0, 28.0, 21.0, 23.0, 18.0, 15.0, 10.0, 10.0, 5.0, 5.0, 3.0, 5.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.87890625, -3.759674072265625, -3.64044189453125, -3.521209716796875, -3.4019775390625, -3.282745361328125, -3.16351318359375, -3.044281005859375, -2.925048828125, -2.805816650390625, -2.68658447265625, -2.567352294921875, -2.4481201171875, -2.328887939453125, -2.20965576171875, -2.090423583984375, -1.97119140625, -1.851959228515625, -1.73272705078125, -1.613494873046875, -1.4942626953125, -1.375030517578125, -1.25579833984375, -1.136566162109375, -1.017333984375, -0.898101806640625, -0.77886962890625, -0.659637451171875, -0.5404052734375, -0.421173095703125, -0.30194091796875, -0.182708740234375, -0.0634765625, 0.055755615234375, 0.17498779296875, 0.294219970703125, 0.4134521484375, 0.532684326171875, 0.65191650390625, 0.771148681640625, 0.890380859375, 1.009613037109375, 1.12884521484375, 1.248077392578125, 1.3673095703125, 1.486541748046875, 1.60577392578125, 1.725006103515625, 1.84423828125, 1.963470458984375, 2.08270263671875, 2.201934814453125, 2.3211669921875, 2.440399169921875, 2.55963134765625, 2.678863525390625, 2.798095703125, 2.917327880859375, 3.03656005859375, 3.155792236328125, 3.2750244140625, 3.394256591796875, 3.51348876953125, 3.632720947265625, 3.751953125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 10.0, 11.0, 9.0, 27.0, 36.0, 38.0, 60.0, 85.0, 143.0, 193.0, 366.0, 470.0, 742.0, 1282.0, 1928.0, 3009.0, 5156.0, 8281.0, 13524.0, 23544.0, 42242.0, 82175.0, 173123.0, 307131.0, 188411.0, 88507.0, 45385.0, 25330.0, 14486.0, 8681.0, 5258.0, 3222.0, 2054.0, 1262.0, 817.0, 542.0, 337.0, 213.0, 166.0, 95.0, 57.0, 45.0, 29.0, 24.0, 15.0, 12.0, 11.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.0290985107421875, -0.028204679489135742, -0.027310848236083984, -0.026417016983032227, -0.02552318572998047, -0.02462935447692871, -0.023735523223876953, -0.022841691970825195, -0.021947860717773438, -0.02105402946472168, -0.020160198211669922, -0.019266366958618164, -0.018372535705566406, -0.01747870445251465, -0.01658487319946289, -0.015691041946411133, -0.014797210693359375, -0.013903379440307617, -0.01300954818725586, -0.012115716934204102, -0.011221885681152344, -0.010328054428100586, -0.009434223175048828, -0.00854039192199707, -0.0076465606689453125, -0.006752729415893555, -0.005858898162841797, -0.004965066909790039, -0.004071235656738281, -0.0031774044036865234, -0.0022835731506347656, -0.0013897418975830078, -0.00049591064453125, 0.0003979206085205078, 0.0012917518615722656, 0.0021855831146240234, 0.0030794143676757812, 0.003973245620727539, 0.004867076873779297, 0.005760908126831055, 0.0066547393798828125, 0.00754857063293457, 0.008442401885986328, 0.009336233139038086, 0.010230064392089844, 0.011123895645141602, 0.01201772689819336, 0.012911558151245117, 0.013805389404296875, 0.014699220657348633, 0.01559305191040039, 0.01648688316345215, 0.017380714416503906, 0.018274545669555664, 0.019168376922607422, 0.02006220817565918, 0.020956039428710938, 0.021849870681762695, 0.022743701934814453, 0.02363753318786621, 0.02453136444091797, 0.025425195693969727, 0.026319026947021484, 0.027212858200073242, 0.028106689453125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 8.0, 3.0, 3.0, 5.0, 5.0, 3.0, 13.0, 4.0, 10.0, 9.0, 15.0, 15.0, 14.0, 21.0, 18.0, 20.0, 27.0, 28.0, 34.0, 27.0, 31.0, 33.0, 47.0, 42.0, 38.0, 27.0, 1079.0, 28.0, 35.0, 43.0, 29.0, 26.0, 35.0, 29.0, 33.0, 29.0, 22.0, 23.0, 14.0, 21.0, 21.0, 14.0, 10.0, 6.0, 8.0, 13.0, 2.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.60546875, -2.522430419921875, -2.43939208984375, -2.356353759765625, -2.2733154296875, -2.190277099609375, -2.10723876953125, -2.024200439453125, -1.941162109375, -1.858123779296875, -1.77508544921875, -1.692047119140625, -1.6090087890625, -1.525970458984375, -1.44293212890625, -1.359893798828125, -1.27685546875, -1.193817138671875, -1.11077880859375, -1.027740478515625, -0.9447021484375, -0.861663818359375, -0.77862548828125, -0.695587158203125, -0.612548828125, -0.529510498046875, -0.44647216796875, -0.363433837890625, -0.2803955078125, -0.197357177734375, -0.11431884765625, -0.031280517578125, 0.0517578125, 0.134796142578125, 0.21783447265625, 0.300872802734375, 0.3839111328125, 0.466949462890625, 0.54998779296875, 0.633026123046875, 0.716064453125, 0.799102783203125, 0.88214111328125, 0.965179443359375, 1.0482177734375, 1.131256103515625, 1.21429443359375, 1.297332763671875, 1.38037109375, 1.463409423828125, 1.54644775390625, 1.629486083984375, 1.7125244140625, 1.795562744140625, 1.87860107421875, 1.961639404296875, 2.044677734375, 2.127716064453125, 2.21075439453125, 2.293792724609375, 2.3768310546875, 2.459869384765625, 2.54290771484375, 2.625946044921875, 2.708984375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 3.0, 5.0, 4.0, 14.0, 28.0, 41.0, 68.0, 65.0, 108.0, 141.0, 237.0, 326.0, 502.0, 703.0, 1155.0, 1696.0, 2553.0, 3930.0, 6188.0, 9447.0, 15185.0, 23862.0, 38394.0, 61938.0, 102020.0, 171177.0, 1267023.0, 151168.0, 90133.0, 55187.0, 34479.0, 21351.0, 13405.0, 8627.0, 5485.0, 3498.0, 2329.0, 1524.0, 1027.0, 698.0, 463.0, 314.0, 192.0, 159.0, 103.0, 76.0, 40.0, 23.0, 19.0, 10.0, 8.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.01013946533203125, -0.009805679321289062, -0.009471893310546875, -0.009138107299804688, -0.0088043212890625, -0.008470535278320312, -0.008136749267578125, -0.0078029632568359375, -0.00746917724609375, -0.0071353912353515625, -0.006801605224609375, -0.0064678192138671875, -0.006134033203125, -0.0058002471923828125, -0.005466461181640625, -0.0051326751708984375, -0.00479888916015625, -0.0044651031494140625, -0.004131317138671875, -0.0037975311279296875, -0.0034637451171875, -0.0031299591064453125, -0.002796173095703125, -0.0024623870849609375, -0.00212860107421875, -0.0017948150634765625, -0.001461029052734375, -0.0011272430419921875, -0.00079345703125, -0.0004596710205078125, -0.000125885009765625, 0.0002079010009765625, 0.00054168701171875, 0.0008754730224609375, 0.001209259033203125, 0.0015430450439453125, 0.0018768310546875, 0.0022106170654296875, 0.002544403076171875, 0.0028781890869140625, 0.00321197509765625, 0.0035457611083984375, 0.003879547119140625, 0.0042133331298828125, 0.004547119140625, 0.0048809051513671875, 0.005214691162109375, 0.0055484771728515625, 0.00588226318359375, 0.0062160491943359375, 0.006549835205078125, 0.0068836212158203125, 0.0072174072265625, 0.0075511932373046875, 0.007884979248046875, 0.008218765258789062, 0.00855255126953125, 0.008886337280273438, 0.009220123291015625, 0.009553909301757812, 0.0098876953125, 0.010221481323242188, 0.010555267333984375, 0.010889053344726562, 0.01122283935546875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 0.0, 2.0, 0.0, 6.0, 0.0, 8.0, 0.0, 13.0, 0.0, 10.0, 0.0, 32.0, 0.0, 25.0, 41.0, 0.0, 98.0, 0.0, 125.0, 0.0, 260.0, 0.0, 136.0, 0.0, 89.0, 0.0, 50.0, 0.0, 40.0, 0.0, 23.0, 0.0, 18.0, 0.0, 13.0, 0.0, 5.0, 0.0, 7.0, 0.0, 3.0, 0.0, 4.0, 0.0, 3.0, 1.0], "bins": [-1.1920928955078125e-06, -1.1613592505455017e-06, -1.130625605583191e-06, -1.0998919606208801e-06, -1.0691583156585693e-06, -1.0384246706962585e-06, -1.0076910257339478e-06, -9.76957380771637e-07, -9.462237358093262e-07, -9.154900908470154e-07, -8.847564458847046e-07, -8.540228009223938e-07, -8.23289155960083e-07, -7.925555109977722e-07, -7.618218660354614e-07, -7.310882210731506e-07, -7.003545761108398e-07, -6.69620931148529e-07, -6.388872861862183e-07, -6.081536412239075e-07, -5.774199962615967e-07, -5.466863512992859e-07, -5.159527063369751e-07, -4.852190613746643e-07, -4.544854164123535e-07, -4.237517714500427e-07, -3.9301812648773193e-07, -3.6228448152542114e-07, -3.3155083656311035e-07, -3.0081719160079956e-07, -2.7008354663848877e-07, -2.39349901676178e-07, -2.086162567138672e-07, -1.778826117515564e-07, -1.471489667892456e-07, -1.1641532182693481e-07, -8.568167686462402e-08, -5.494803190231323e-08, -2.421438694000244e-08, 6.51925802230835e-09, 3.725290298461914e-08, 6.798654794692993e-08, 9.872019290924072e-08, 1.2945383787155151e-07, 1.601874828338623e-07, 1.909211277961731e-07, 2.2165477275848389e-07, 2.523884177207947e-07, 2.8312206268310547e-07, 3.1385570764541626e-07, 3.4458935260772705e-07, 3.7532299757003784e-07, 4.0605664253234863e-07, 4.367902874946594e-07, 4.675239324569702e-07, 4.98257577419281e-07, 5.289912223815918e-07, 5.597248673439026e-07, 5.904585123062134e-07, 6.211921572685242e-07, 6.51925802230835e-07, 6.826594471931458e-07, 7.133930921554565e-07, 7.441267371177673e-07, 7.748603820800781e-07]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 3.0, 7.0, 10.0, 5.0, 19.0, 8.0, 20.0, 37.0, 36.0, 58.0, 95.0, 179.0, 459.0, 17120.0, 1019398.0, 10270.0, 362.0, 175.0, 92.0, 61.0, 22.0, 25.0, 14.0, 14.0, 18.0, 3.0, 4.0, 10.0, 6.0, 5.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7404556274414062e-05, -1.669209450483322e-05, -1.597963273525238e-05, -1.526717096567154e-05, -1.4554709196090698e-05, -1.3842247426509857e-05, -1.3129785656929016e-05, -1.2417323887348175e-05, -1.1704862117767334e-05, -1.0992400348186493e-05, -1.0279938578605652e-05, -9.56747680902481e-06, -8.85501503944397e-06, -8.142553269863129e-06, -7.430091500282288e-06, -6.7176297307014465e-06, -6.0051679611206055e-06, -5.292706191539764e-06, -4.580244421958923e-06, -3.867782652378082e-06, -3.155320882797241e-06, -2.4428591132164e-06, -1.730397343635559e-06, -1.017935574054718e-06, -3.0547380447387695e-07, 4.069879651069641e-07, 1.1194497346878052e-06, 1.8319115042686462e-06, 2.5443732738494873e-06, 3.2568350434303284e-06, 3.9692968130111694e-06, 4.6817585825920105e-06, 5.3942203521728516e-06, 6.106682121753693e-06, 6.819143891334534e-06, 7.531605660915375e-06, 8.244067430496216e-06, 8.956529200077057e-06, 9.668990969657898e-06, 1.0381452739238739e-05, 1.109391450881958e-05, 1.1806376278400421e-05, 1.2518838047981262e-05, 1.3231299817562103e-05, 1.3943761587142944e-05, 1.4656223356723785e-05, 1.5368685126304626e-05, 1.6081146895885468e-05, 1.679360866546631e-05, 1.750607043504715e-05, 1.821853220462799e-05, 1.8930993974208832e-05, 1.9643455743789673e-05, 2.0355917513370514e-05, 2.1068379282951355e-05, 2.1780841052532196e-05, 2.2493302822113037e-05, 2.3205764591693878e-05, 2.391822636127472e-05, 2.463068813085556e-05, 2.53431499004364e-05, 2.6055611670017242e-05, 2.6768073439598083e-05, 2.7480535209178925e-05, 2.8192996978759766e-05]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 30.0, 96.0, 286.0, 426.0, 131.0, 32.0, 7.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.9762257983966265e-06, -3.904108780261595e-06, -3.831991762126563e-06, -3.759874516617856e-06, -3.6877574984828243e-06, -3.6156404803477926e-06, -3.543523462212761e-06, -3.4714064440777292e-06, -3.399289198569022e-06, -3.3271721804339904e-06, -3.2550551622989587e-06, -3.1829379167902516e-06, -3.11082089865522e-06, -3.0387038805201882e-06, -2.9665868623851566e-06, -2.894469844250125e-06, -2.822352826115093e-06, -2.7502358079800615e-06, -2.67811878984503e-06, -2.6060015443363227e-06, -2.533884526201291e-06, -2.4617675080662593e-06, -2.3896504899312276e-06, -2.317533471796196e-06, -2.2454164536611643e-06, -2.1732994355261326e-06, -2.101182417391101e-06, -2.0290651718823938e-06, -1.956948153747362e-06, -1.8848311356123304e-06, -1.8127141174772987e-06, -1.740597099342267e-06, -1.6684796264598845e-06, -1.5963626083248528e-06, -1.5242454765029834e-06, -1.4521284583679517e-06, -1.3800113265460823e-06, -1.3078943084110506e-06, -1.235777290276019e-06, -1.1636602721409872e-06, -1.0915432540059555e-06, -1.0194262358709238e-06, -9.473091040490544e-07, -8.751920859140228e-07, -8.030750109355722e-07, -7.309579359571217e-07, -6.5884091782209e-07, -5.867238428436394e-07, -5.1460671102177e-07, -4.424896360433195e-07, -3.7037258948657836e-07, -2.9825554292983725e-07, -2.261384679513867e-07, -1.5402139297293616e-07, -8.190434641619504e-08, -9.787299859453924e-09, 6.232977511899662e-08, 1.3444683588659245e-07, 2.0656389665418828e-07, 2.786809432109294e-07, 3.5079801818937995e-07, 4.229150931678305e-07, 4.95032168146281e-07, 5.671491862813127e-07, 6.392662612597633e-07]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 56.0, 0.0, 0.0, 0.0, 103.0, 0.0, 0.0, 0.0, 206.0, 0.0, 0.0, 0.0, 0.0, 239.0, 0.0, 0.0, 0.0, 184.0, 0.0, 0.0, 0.0, 122.0, 0.0, 0.0, 0.0, 48.0, 0.0, 0.0, 0.0, 0.0, 19.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.76837158203125e-07, -4.628673195838928e-07, -4.4889748096466064e-07, -4.3492764234542847e-07, -4.209578037261963e-07, -4.069879651069641e-07, -3.9301812648773193e-07, -3.7904828786849976e-07, -3.650784492492676e-07, -3.511086106300354e-07, -3.371387720108032e-07, -3.2316893339157104e-07, -3.0919909477233887e-07, -2.952292561531067e-07, -2.812594175338745e-07, -2.6728957891464233e-07, -2.5331974029541016e-07, -2.39349901676178e-07, -2.253800630569458e-07, -2.1141022443771362e-07, -1.9744038581848145e-07, -1.8347054719924927e-07, -1.695007085800171e-07, -1.555308699607849e-07, -1.4156103134155273e-07, -1.2759119272232056e-07, -1.1362135410308838e-07, -9.96515154838562e-08, -8.568167686462402e-08, -7.171183824539185e-08, -5.774199962615967e-08, -4.377216100692749e-08, -2.9802322387695312e-08, -1.5832483768463135e-08, -1.862645149230957e-09, 1.210719347000122e-08, 2.60770320892334e-08, 4.0046870708465576e-08, 5.4016709327697754e-08, 6.798654794692993e-08, 8.195638656616211e-08, 9.592622518539429e-08, 1.0989606380462646e-07, 1.2386590242385864e-07, 1.3783574104309082e-07, 1.51805579662323e-07, 1.6577541828155518e-07, 1.7974525690078735e-07, 1.9371509552001953e-07, 2.076849341392517e-07, 2.2165477275848389e-07, 2.3562461137771606e-07, 2.4959444999694824e-07, 2.635642886161804e-07, 2.775341272354126e-07, 2.915039658546448e-07, 3.0547380447387695e-07, 3.1944364309310913e-07, 3.334134817123413e-07, 3.473833203315735e-07, 3.6135315895080566e-07, 3.7532299757003784e-07, 3.8929283618927e-07, 4.032626748085022e-07, 4.172325134277344e-07]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 4.0, 3.0, 9.0, 8.0, 10.0, 9.0, 18.0, 15.0, 23.0, 9.0, 19.0, 27.0, 28.0, 34.0, 46.0, 36.0, 54.0, 45.0, 40.0, 43.0, 39.0, 49.0, 37.0, 46.0, 46.0, 41.0, 33.0, 37.0, 24.0, 24.0, 28.0, 21.0, 23.0, 18.0, 15.0, 10.0, 10.0, 5.0, 5.0, 3.0, 5.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.87890625, -3.759674072265625, -3.64044189453125, -3.521209716796875, -3.4019775390625, -3.282745361328125, -3.16351318359375, -3.044281005859375, -2.925048828125, -2.805816650390625, -2.68658447265625, -2.567352294921875, -2.4481201171875, -2.328887939453125, -2.20965576171875, -2.090423583984375, -1.97119140625, -1.851959228515625, -1.73272705078125, -1.613494873046875, -1.4942626953125, -1.375030517578125, -1.25579833984375, -1.136566162109375, -1.017333984375, -0.898101806640625, -0.77886962890625, -0.659637451171875, -0.5404052734375, -0.421173095703125, -0.30194091796875, -0.182708740234375, -0.0634765625, 0.055755615234375, 0.17498779296875, 0.294219970703125, 0.4134521484375, 0.532684326171875, 0.65191650390625, 0.771148681640625, 0.890380859375, 1.009613037109375, 1.12884521484375, 1.248077392578125, 1.3673095703125, 1.486541748046875, 1.60577392578125, 1.725006103515625, 1.84423828125, 1.963470458984375, 2.08270263671875, 2.201934814453125, 2.3211669921875, 2.440399169921875, 2.55963134765625, 2.678863525390625, 2.798095703125, 2.917327880859375, 3.03656005859375, 3.155792236328125, 3.2750244140625, 3.394256591796875, 3.51348876953125, 3.632720947265625, 3.751953125]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 5.0, 6.0, 10.0, 27.0, 21.0, 24.0, 53.0, 68.0, 120.0, 148.0, 205.0, 327.0, 467.0, 680.0, 1000.0, 1509.0, 2352.0, 3523.0, 5434.0, 8473.0, 14204.0, 24426.0, 44029.0, 83841.0, 175314.0, 326400.0, 169772.0, 81485.0, 42499.0, 23849.0, 14052.0, 8477.0, 5413.0, 3434.0, 2223.0, 1572.0, 1005.0, 639.0, 475.0, 321.0, 212.0, 165.0, 80.0, 70.0, 48.0, 37.0, 30.0, 12.0, 13.0, 3.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.294921875, -3.179229736328125, -3.06353759765625, -2.947845458984375, -2.8321533203125, -2.716461181640625, -2.60076904296875, -2.485076904296875, -2.369384765625, -2.253692626953125, -2.13800048828125, -2.022308349609375, -1.9066162109375, -1.790924072265625, -1.67523193359375, -1.559539794921875, -1.44384765625, -1.328155517578125, -1.21246337890625, -1.096771240234375, -0.9810791015625, -0.865386962890625, -0.74969482421875, -0.634002685546875, -0.518310546875, -0.402618408203125, -0.28692626953125, -0.171234130859375, -0.0555419921875, 0.060150146484375, 0.17584228515625, 0.291534423828125, 0.4072265625, 0.522918701171875, 0.63861083984375, 0.754302978515625, 0.8699951171875, 0.985687255859375, 1.10137939453125, 1.217071533203125, 1.332763671875, 1.448455810546875, 1.56414794921875, 1.679840087890625, 1.7955322265625, 1.911224365234375, 2.02691650390625, 2.142608642578125, 2.25830078125, 2.373992919921875, 2.48968505859375, 2.605377197265625, 2.7210693359375, 2.836761474609375, 2.95245361328125, 3.068145751953125, 3.183837890625, 3.299530029296875, 3.41522216796875, 3.530914306640625, 3.6466064453125, 3.762298583984375, 3.87799072265625, 3.993682861328125, 4.109375]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 4.0, 4.0, 6.0, 16.0, 10.0, 14.0, 20.0, 22.0, 26.0, 26.0, 36.0, 34.0, 34.0, 37.0, 50.0, 53.0, 91.0, 169.0, 1391.0, 327.0, 151.0, 81.0, 54.0, 34.0, 59.0, 32.0, 27.0, 30.0, 41.0, 28.0, 18.0, 14.0, 22.0, 22.0, 7.0, 10.0, 10.0, 10.0, 4.0, 5.0, 4.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.59375, -9.2626953125, -8.931640625, -8.6005859375, -8.26953125, -7.9384765625, -7.607421875, -7.2763671875, -6.9453125, -6.6142578125, -6.283203125, -5.9521484375, -5.62109375, -5.2900390625, -4.958984375, -4.6279296875, -4.296875, -3.9658203125, -3.634765625, -3.3037109375, -2.97265625, -2.6416015625, -2.310546875, -1.9794921875, -1.6484375, -1.3173828125, -0.986328125, -0.6552734375, -0.32421875, 0.0068359375, 0.337890625, 0.6689453125, 1.0, 1.3310546875, 1.662109375, 1.9931640625, 2.32421875, 2.6552734375, 2.986328125, 3.3173828125, 3.6484375, 3.9794921875, 4.310546875, 4.6416015625, 4.97265625, 5.3037109375, 5.634765625, 5.9658203125, 6.296875, 6.6279296875, 6.958984375, 7.2900390625, 7.62109375, 7.9521484375, 8.283203125, 8.6142578125, 8.9453125, 9.2763671875, 9.607421875, 9.9384765625, 10.26953125, 10.6005859375, 10.931640625, 11.2626953125, 11.59375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 6.0, 10.0, 11.0, 15.0, 17.0, 23.0, 26.0, 41.0, 62.0, 66.0, 85.0, 150.0, 199.0, 354.0, 626.0, 1575.0, 5374.0, 28479.0, 273984.0, 2587046.0, 215353.0, 24414.0, 4772.0, 1458.0, 594.0, 326.0, 225.0, 135.0, 74.0, 41.0, 56.0, 20.0, 24.0, 14.0, 11.0, 10.0, 7.0, 4.0, 5.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.5625, -11.182861328125, -10.80322265625, -10.423583984375, -10.0439453125, -9.664306640625, -9.28466796875, -8.905029296875, -8.525390625, -8.145751953125, -7.76611328125, -7.386474609375, -7.0068359375, -6.627197265625, -6.24755859375, -5.867919921875, -5.48828125, -5.108642578125, -4.72900390625, -4.349365234375, -3.9697265625, -3.590087890625, -3.21044921875, -2.830810546875, -2.451171875, -2.071533203125, -1.69189453125, -1.312255859375, -0.9326171875, -0.552978515625, -0.17333984375, 0.206298828125, 0.5859375, 0.965576171875, 1.34521484375, 1.724853515625, 2.1044921875, 2.484130859375, 2.86376953125, 3.243408203125, 3.623046875, 4.002685546875, 4.38232421875, 4.761962890625, 5.1416015625, 5.521240234375, 5.90087890625, 6.280517578125, 6.66015625, 7.039794921875, 7.41943359375, 7.799072265625, 8.1787109375, 8.558349609375, 8.93798828125, 9.317626953125, 9.697265625, 10.076904296875, 10.45654296875, 10.836181640625, 11.2158203125, 11.595458984375, 11.97509765625, 12.354736328125, 12.734375]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 18.0, 70.0, 170.0, 291.0, 254.0, 131.0, 61.0, 13.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.1630973815918, -59.54860305786133, -57.934104919433594, -56.319610595703125, -54.70511245727539, -53.09061813354492, -51.47611999511719, -49.86162567138672, -48.24713134765625, -46.63263702392578, -45.01813888549805, -43.40364456176758, -41.789146423339844, -40.174652099609375, -38.560157775878906, -36.94565963745117, -35.33116149902344, -33.71666717529297, -32.102169036865234, -30.487674713134766, -28.873178482055664, -27.258682250976562, -25.64418601989746, -24.02968978881836, -22.41519546508789, -20.80069923400879, -19.186203002929688, -17.57170867919922, -15.957212448120117, -14.342716217041016, -12.728219985961914, -11.113724708557129, -9.499229431152344, -7.8847336769104, -6.270237922668457, -4.6557416915893555, -3.041245937347412, -1.4267501831054688, 0.1877460479736328, 1.802241325378418, 3.4167375564575195, 5.031233310699463, 6.645729064941406, 8.260225296020508, 9.87472152709961, 11.489216804504395, 13.103713035583496, 14.718208312988281, 16.332704544067383, 17.947200775146484, 19.561697006225586, 21.176193237304688, 22.790687561035156, 24.405183792114258, 26.01968002319336, 27.634174346923828, 29.248672485351562, 30.863168716430664, 32.477664947509766, 34.092159271240234, 35.70665740966797, 37.32115173339844, 38.935646057128906, 40.55014419555664, 42.16463851928711]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 8.0, 6.0, 6.0, 6.0, 19.0, 17.0, 19.0, 22.0, 18.0, 21.0, 27.0, 32.0, 31.0, 45.0, 47.0, 42.0, 27.0, 38.0, 44.0, 54.0, 34.0, 48.0, 47.0, 36.0, 35.0, 38.0, 38.0, 27.0, 24.0, 26.0, 24.0, 17.0, 14.0, 7.0, 23.0, 12.0, 4.0, 5.0, 3.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-32.847381591796875, -31.868642807006836, -30.88990592956543, -29.91116714477539, -28.932430267333984, -27.953691482543945, -26.974952697753906, -25.9962158203125, -25.017478942871094, -24.038740158081055, -23.06000328063965, -22.08126449584961, -21.102527618408203, -20.123788833618164, -19.145050048828125, -18.16631317138672, -17.18757438659668, -16.20883560180664, -15.230098724365234, -14.251359939575195, -13.272623062133789, -12.29388427734375, -11.315146446228027, -10.336408615112305, -9.357670783996582, -8.37893295288086, -7.400195121765137, -6.421456813812256, -5.442718982696533, -4.4639811515808105, -3.4852428436279297, -2.506505012512207, -1.5277671813964844, -0.5490292310714722, 0.42970871925354004, 1.4084467887878418, 2.3871846199035645, 3.365922451019287, 4.344660758972168, 5.323398590087891, 6.302136421203613, 7.280874252319336, 8.259612083435059, 9.238349914550781, 10.21708869934082, 11.195825576782227, 12.174564361572266, 13.153302192687988, 14.132040023803711, 15.110777854919434, 16.089515686035156, 17.068254470825195, 18.0469913482666, 19.02573013305664, 20.004467010498047, 20.983205795288086, 21.961944580078125, 22.940683364868164, 23.91942024230957, 24.89815902709961, 25.876895904541016, 26.855634689331055, 27.834373474121094, 28.8131103515625, 29.791847229003906]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 10.0, 5.0, 11.0, 11.0, 21.0, 11.0, 17.0, 17.0, 24.0, 21.0, 26.0, 46.0, 40.0, 47.0, 54.0, 39.0, 50.0, 35.0, 42.0, 46.0, 46.0, 50.0, 40.0, 41.0, 33.0, 25.0, 28.0, 24.0, 26.0, 24.0, 13.0, 18.0, 13.0, 8.0, 5.0, 5.0, 8.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.015625, -3.894073486328125, -3.77252197265625, -3.650970458984375, -3.5294189453125, -3.407867431640625, -3.28631591796875, -3.164764404296875, -3.043212890625, -2.921661376953125, -2.80010986328125, -2.678558349609375, -2.5570068359375, -2.435455322265625, -2.31390380859375, -2.192352294921875, -2.07080078125, -1.949249267578125, -1.82769775390625, -1.706146240234375, -1.5845947265625, -1.463043212890625, -1.34149169921875, -1.219940185546875, -1.098388671875, -0.976837158203125, -0.85528564453125, -0.733734130859375, -0.6121826171875, -0.490631103515625, -0.36907958984375, -0.247528076171875, -0.1259765625, -0.004425048828125, 0.11712646484375, 0.238677978515625, 0.3602294921875, 0.481781005859375, 0.60333251953125, 0.724884033203125, 0.846435546875, 0.967987060546875, 1.08953857421875, 1.211090087890625, 1.3326416015625, 1.454193115234375, 1.57574462890625, 1.697296142578125, 1.81884765625, 1.940399169921875, 2.06195068359375, 2.183502197265625, 2.3050537109375, 2.426605224609375, 2.54815673828125, 2.669708251953125, 2.791259765625, 2.912811279296875, 3.03436279296875, 3.155914306640625, 3.2774658203125, 3.399017333984375, 3.52056884765625, 3.642120361328125, 3.763671875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 7.0, 4.0, 6.0, 7.0, 6.0, 15.0, 15.0, 23.0, 29.0, 48.0, 55.0, 126.0, 228.0, 445.0, 902.0, 2148.0, 5572.0, 15704.0, 55088.0, 269880.0, 1926734.0, 1619431.0, 226474.0, 48555.0, 14008.0, 4981.0, 1982.0, 870.0, 417.0, 198.0, 103.0, 55.0, 47.0, 27.0, 25.0, 15.0, 8.0, 12.0, 10.0, 8.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.9765625, -8.712158203125, -8.44775390625, -8.183349609375, -7.9189453125, -7.654541015625, -7.39013671875, -7.125732421875, -6.861328125, -6.596923828125, -6.33251953125, -6.068115234375, -5.8037109375, -5.539306640625, -5.27490234375, -5.010498046875, -4.74609375, -4.481689453125, -4.21728515625, -3.952880859375, -3.6884765625, -3.424072265625, -3.15966796875, -2.895263671875, -2.630859375, -2.366455078125, -2.10205078125, -1.837646484375, -1.5732421875, -1.308837890625, -1.04443359375, -0.780029296875, -0.515625, -0.251220703125, 0.01318359375, 0.277587890625, 0.5419921875, 0.806396484375, 1.07080078125, 1.335205078125, 1.599609375, 1.864013671875, 2.12841796875, 2.392822265625, 2.6572265625, 2.921630859375, 3.18603515625, 3.450439453125, 3.71484375, 3.979248046875, 4.24365234375, 4.508056640625, 4.7724609375, 5.036865234375, 5.30126953125, 5.565673828125, 5.830078125, 6.094482421875, 6.35888671875, 6.623291015625, 6.8876953125, 7.152099609375, 7.41650390625, 7.680908203125, 7.9453125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 7.0, 12.0, 16.0, 15.0, 19.0, 27.0, 58.0, 84.0, 123.0, 174.0, 241.0, 402.0, 579.0, 649.0, 491.0, 350.0, 282.0, 165.0, 102.0, 95.0, 52.0, 45.0, 29.0, 20.0, 14.0, 4.0, 9.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.20703125, -6.96270751953125, -6.7183837890625, -6.47406005859375, -6.229736328125, -5.98541259765625, -5.7410888671875, -5.49676513671875, -5.25244140625, -5.00811767578125, -4.7637939453125, -4.51947021484375, -4.275146484375, -4.03082275390625, -3.7864990234375, -3.54217529296875, -3.2978515625, -3.05352783203125, -2.8092041015625, -2.56488037109375, -2.320556640625, -2.07623291015625, -1.8319091796875, -1.58758544921875, -1.34326171875, -1.09893798828125, -0.8546142578125, -0.61029052734375, -0.365966796875, -0.12164306640625, 0.1226806640625, 0.36700439453125, 0.611328125, 0.85565185546875, 1.0999755859375, 1.34429931640625, 1.588623046875, 1.83294677734375, 2.0772705078125, 2.32159423828125, 2.56591796875, 2.81024169921875, 3.0545654296875, 3.29888916015625, 3.543212890625, 3.78753662109375, 4.0318603515625, 4.27618408203125, 4.5205078125, 4.76483154296875, 5.0091552734375, 5.25347900390625, 5.497802734375, 5.74212646484375, 5.9864501953125, 6.23077392578125, 6.47509765625, 6.71942138671875, 6.9637451171875, 7.20806884765625, 7.452392578125, 7.69671630859375, 7.9410400390625, 8.18536376953125, 8.4296875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 6.0, 8.0, 7.0, 21.0, 27.0, 51.0, 66.0, 112.0, 206.0, 428.0, 1377.0, 8413.0, 212779.0, 3800108.0, 161231.0, 7284.0, 1285.0, 396.0, 192.0, 106.0, 69.0, 39.0, 23.0, 17.0, 10.0, 14.0, 6.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.6875, -29.822265625, -28.95703125, -28.091796875, -27.2265625, -26.361328125, -25.49609375, -24.630859375, -23.765625, -22.900390625, -22.03515625, -21.169921875, -20.3046875, -19.439453125, -18.57421875, -17.708984375, -16.84375, -15.978515625, -15.11328125, -14.248046875, -13.3828125, -12.517578125, -11.65234375, -10.787109375, -9.921875, -9.056640625, -8.19140625, -7.326171875, -6.4609375, -5.595703125, -4.73046875, -3.865234375, -3.0, -2.134765625, -1.26953125, -0.404296875, 0.4609375, 1.326171875, 2.19140625, 3.056640625, 3.921875, 4.787109375, 5.65234375, 6.517578125, 7.3828125, 8.248046875, 9.11328125, 9.978515625, 10.84375, 11.708984375, 12.57421875, 13.439453125, 14.3046875, 15.169921875, 16.03515625, 16.900390625, 17.765625, 18.630859375, 19.49609375, 20.361328125, 21.2265625, 22.091796875, 22.95703125, 23.822265625, 24.6875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 7.0, 46.0, 97.0, 228.0, 253.0, 193.0, 124.0, 49.0, 7.0, 7.0, 0.0, 2.0, 1.0, 1.0], "bins": [-129.52093505859375, -127.14391326904297, -124.76689910888672, -122.38987731933594, -120.01285552978516, -117.6358413696289, -115.25881958007812, -112.88180541992188, -110.5047836303711, -108.12776184082031, -105.75074768066406, -103.37372589111328, -100.9967041015625, -98.61968994140625, -96.24266815185547, -93.86564636230469, -91.48863220214844, -89.11161041259766, -86.7345962524414, -84.35757446289062, -81.98055267333984, -79.6035385131836, -77.22651672363281, -74.84950256347656, -72.47247314453125, -70.09545135498047, -67.71843719482422, -65.34141540527344, -62.96439743041992, -60.587379455566406, -58.210357666015625, -55.83333969116211, -53.456321716308594, -51.07930374145508, -48.7022819519043, -46.32526397705078, -43.948246002197266, -41.57122802734375, -39.19420623779297, -36.81718826293945, -34.44017028808594, -32.06315231323242, -29.686132431030273, -27.309112548828125, -24.93209457397461, -22.55507469177246, -20.178054809570312, -17.801036834716797, -15.424016952514648, -13.046998023986816, -10.669979095458984, -8.292959213256836, -5.915940284729004, -3.538921356201172, -1.1619014739990234, 1.2151165008544922, 3.5921363830566406, 5.969155311584473, 8.346174240112305, 10.723194122314453, 13.100213050842285, 15.477231979370117, 17.854251861572266, 20.23126983642578, 22.60828971862793]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 5.0, 6.0, 0.0, 11.0, 14.0, 14.0, 13.0, 15.0, 17.0, 22.0, 19.0, 23.0, 23.0, 42.0, 39.0, 31.0, 36.0, 38.0, 40.0, 37.0, 39.0, 31.0, 29.0, 38.0, 27.0, 43.0, 52.0, 37.0, 37.0, 33.0, 30.0, 29.0, 22.0, 10.0, 16.0, 10.0, 14.0, 15.0, 10.0, 10.0, 3.0, 4.0, 7.0, 6.0, 1.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.04638671875, -21.394601821899414, -20.742816925048828, -20.091032028198242, -19.439247131347656, -18.78746223449707, -18.135677337646484, -17.48389434814453, -16.832107543945312, -16.180322647094727, -15.52853775024414, -14.876752853393555, -14.224967956542969, -13.573183059692383, -12.921399116516113, -12.269614219665527, -11.617830276489258, -10.966045379638672, -10.314260482788086, -9.6624755859375, -9.010690689086914, -8.358905792236328, -7.707121849060059, -7.055336952209473, -6.403552055358887, -5.751767158508301, -5.099982261657715, -4.448197841644287, -3.796412944793701, -3.1446280479431152, -2.4928433895111084, -1.8410587310791016, -1.1892738342285156, -0.5374890565872192, 0.11429572105407715, 0.7660804986953735, 1.41786527633667, 2.069650173187256, 2.7214348316192627, 3.3732194900512695, 4.0250043869018555, 4.676789283752441, 5.328574180603027, 5.980358600616455, 6.632143497467041, 7.283928394317627, 7.935712814331055, 8.58749771118164, 9.239282608032227, 9.891067504882812, 10.542852401733398, 11.194637298583984, 11.84642219543457, 12.498207092285156, 13.149991035461426, 13.801775932312012, 14.453560829162598, 15.105345726013184, 15.75713062286377, 16.40891456604004, 17.060699462890625, 17.71248435974121, 18.364269256591797, 19.016054153442383, 19.66783905029297]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 4.0, 10.0, 7.0, 7.0, 9.0, 13.0, 17.0, 19.0, 18.0, 18.0, 27.0, 19.0, 30.0, 31.0, 34.0, 31.0, 54.0, 54.0, 51.0, 44.0, 38.0, 39.0, 53.0, 32.0, 35.0, 42.0, 24.0, 26.0, 29.0, 26.0, 35.0, 19.0, 27.0, 12.0, 14.0, 15.0, 10.0, 11.0, 2.0, 8.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.88671875, -3.7667236328125, -3.646728515625, -3.5267333984375, -3.40673828125, -3.2867431640625, -3.166748046875, -3.0467529296875, -2.9267578125, -2.8067626953125, -2.686767578125, -2.5667724609375, -2.44677734375, -2.3267822265625, -2.206787109375, -2.0867919921875, -1.966796875, -1.8468017578125, -1.726806640625, -1.6068115234375, -1.48681640625, -1.3668212890625, -1.246826171875, -1.1268310546875, -1.0068359375, -0.8868408203125, -0.766845703125, -0.6468505859375, -0.52685546875, -0.4068603515625, -0.286865234375, -0.1668701171875, -0.046875, 0.0731201171875, 0.193115234375, 0.3131103515625, 0.43310546875, 0.5531005859375, 0.673095703125, 0.7930908203125, 0.9130859375, 1.0330810546875, 1.153076171875, 1.2730712890625, 1.39306640625, 1.5130615234375, 1.633056640625, 1.7530517578125, 1.873046875, 1.9930419921875, 2.113037109375, 2.2330322265625, 2.35302734375, 2.4730224609375, 2.593017578125, 2.7130126953125, 2.8330078125, 2.9530029296875, 3.072998046875, 3.1929931640625, 3.31298828125, 3.4329833984375, 3.552978515625, 3.6729736328125, 3.79296875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 9.0, 6.0, 8.0, 17.0, 13.0, 24.0, 47.0, 56.0, 72.0, 115.0, 203.0, 254.0, 344.0, 554.0, 876.0, 1314.0, 1940.0, 3048.0, 4645.0, 7312.0, 11670.0, 18224.0, 28931.0, 47650.0, 82464.0, 147939.0, 255492.0, 183010.0, 101539.0, 57146.0, 34518.0, 21354.0, 13415.0, 8541.0, 5516.0, 3530.0, 2298.0, 1438.0, 1002.0, 658.0, 420.0, 323.0, 211.0, 131.0, 82.0, 63.0, 50.0, 26.0, 16.0, 22.0, 10.0, 5.0, 6.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.025238037109375, -0.024441242218017578, -0.023644447326660156, -0.022847652435302734, -0.022050857543945312, -0.02125406265258789, -0.02045726776123047, -0.019660472869873047, -0.018863677978515625, -0.018066883087158203, -0.01727008819580078, -0.01647329330444336, -0.015676498413085938, -0.014879703521728516, -0.014082908630371094, -0.013286113739013672, -0.01248931884765625, -0.011692523956298828, -0.010895729064941406, -0.010098934173583984, -0.009302139282226562, -0.00850534439086914, -0.007708549499511719, -0.006911754608154297, -0.006114959716796875, -0.005318164825439453, -0.004521369934082031, -0.0037245750427246094, -0.0029277801513671875, -0.0021309852600097656, -0.0013341903686523438, -0.0005373954772949219, 0.0002593994140625, 0.0010561943054199219, 0.0018529891967773438, 0.0026497840881347656, 0.0034465789794921875, 0.004243373870849609, 0.005040168762207031, 0.005836963653564453, 0.006633758544921875, 0.007430553436279297, 0.008227348327636719, 0.00902414321899414, 0.009820938110351562, 0.010617733001708984, 0.011414527893066406, 0.012211322784423828, 0.01300811767578125, 0.013804912567138672, 0.014601707458496094, 0.015398502349853516, 0.016195297241210938, 0.01699209213256836, 0.01778888702392578, 0.018585681915283203, 0.019382476806640625, 0.020179271697998047, 0.02097606658935547, 0.02177286148071289, 0.022569656372070312, 0.023366451263427734, 0.024163246154785156, 0.024960041046142578, 0.0257568359375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 3.0, 0.0, 1.0, 6.0, 6.0, 5.0, 6.0, 9.0, 13.0, 14.0, 13.0, 21.0, 21.0, 19.0, 20.0, 20.0, 35.0, 34.0, 26.0, 32.0, 45.0, 38.0, 40.0, 34.0, 1065.0, 50.0, 44.0, 34.0, 45.0, 40.0, 30.0, 35.0, 26.0, 32.0, 27.0, 25.0, 21.0, 15.0, 17.0, 16.0, 11.0, 8.0, 8.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.2734375, -3.168914794921875, -3.06439208984375, -2.959869384765625, -2.8553466796875, -2.750823974609375, -2.64630126953125, -2.541778564453125, -2.437255859375, -2.332733154296875, -2.22821044921875, -2.123687744140625, -2.0191650390625, -1.914642333984375, -1.81011962890625, -1.705596923828125, -1.60107421875, -1.496551513671875, -1.39202880859375, -1.287506103515625, -1.1829833984375, -1.078460693359375, -0.97393798828125, -0.869415283203125, -0.764892578125, -0.660369873046875, -0.55584716796875, -0.451324462890625, -0.3468017578125, -0.242279052734375, -0.13775634765625, -0.033233642578125, 0.0712890625, 0.175811767578125, 0.28033447265625, 0.384857177734375, 0.4893798828125, 0.593902587890625, 0.69842529296875, 0.802947998046875, 0.907470703125, 1.011993408203125, 1.11651611328125, 1.221038818359375, 1.3255615234375, 1.430084228515625, 1.53460693359375, 1.639129638671875, 1.74365234375, 1.848175048828125, 1.95269775390625, 2.057220458984375, 2.1617431640625, 2.266265869140625, 2.37078857421875, 2.475311279296875, 2.579833984375, 2.684356689453125, 2.78887939453125, 2.893402099609375, 2.9979248046875, 3.102447509765625, 3.20697021484375, 3.311492919921875, 3.416015625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 5.0, 3.0, 6.0, 12.0, 11.0, 20.0, 18.0, 37.0, 47.0, 78.0, 90.0, 125.0, 189.0, 210.0, 380.0, 535.0, 716.0, 1028.0, 1572.0, 2177.0, 3077.0, 4431.0, 6765.0, 10007.0, 15081.0, 22758.0, 34779.0, 54396.0, 86785.0, 143799.0, 1263456.0, 166463.0, 98845.0, 61632.0, 39460.0, 25876.0, 16974.0, 11342.0, 7493.0, 5133.0, 3479.0, 2345.0, 1661.0, 1106.0, 795.0, 557.0, 382.0, 270.0, 222.0, 137.0, 110.0, 89.0, 61.0, 31.0, 27.0, 20.0, 20.0, 11.0, 6.0, 5.0, 2.0, 0.0, 2.0], "bins": [-0.01081085205078125, -0.010469198226928711, -0.010127544403076172, -0.009785890579223633, -0.009444236755371094, -0.009102582931518555, -0.008760929107666016, -0.008419275283813477, -0.008077621459960938, -0.0077359676361083984, -0.007394313812255859, -0.00705265998840332, -0.006711006164550781, -0.006369352340698242, -0.006027698516845703, -0.005686044692993164, -0.005344390869140625, -0.005002737045288086, -0.004661083221435547, -0.004319429397583008, -0.003977775573730469, -0.0036361217498779297, -0.0032944679260253906, -0.0029528141021728516, -0.0026111602783203125, -0.0022695064544677734, -0.0019278526306152344, -0.0015861988067626953, -0.0012445449829101562, -0.0009028911590576172, -0.0005612373352050781, -0.00021958351135253906, 0.0001220703125, 0.00046372413635253906, 0.0008053779602050781, 0.0011470317840576172, 0.0014886856079101562, 0.0018303394317626953, 0.0021719932556152344, 0.0025136470794677734, 0.0028553009033203125, 0.0031969547271728516, 0.0035386085510253906, 0.0038802623748779297, 0.004221916198730469, 0.004563570022583008, 0.004905223846435547, 0.005246877670288086, 0.005588531494140625, 0.005930185317993164, 0.006271839141845703, 0.006613492965698242, 0.006955146789550781, 0.00729680061340332, 0.007638454437255859, 0.007980108261108398, 0.008321762084960938, 0.008663415908813477, 0.009005069732666016, 0.009346723556518555, 0.009688377380371094, 0.010030031204223633, 0.010371685028076172, 0.010713338851928711, 0.01105499267578125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 8.0, 0.0, 3.0, 9.0, 0.0, 5.0, 9.0, 0.0, 26.0, 35.0, 0.0, 30.0, 45.0, 0.0, 94.0, 0.0, 128.0, 230.0, 0.0, 146.0, 81.0, 0.0, 48.0, 43.0, 0.0, 21.0, 0.0, 18.0, 16.0, 0.0, 12.0, 1.0, 0.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.1324882507324219e-06, -1.0943040251731873e-06, -1.0561197996139526e-06, -1.017935574054718e-06, -9.797513484954834e-07, -9.415671229362488e-07, -9.033828973770142e-07, -8.651986718177795e-07, -8.270144462585449e-07, -7.888302206993103e-07, -7.506459951400757e-07, -7.124617695808411e-07, -6.742775440216064e-07, -6.360933184623718e-07, -5.979090929031372e-07, -5.597248673439026e-07, -5.21540641784668e-07, -4.833564162254333e-07, -4.4517219066619873e-07, -4.069879651069641e-07, -3.688037395477295e-07, -3.3061951398849487e-07, -2.9243528842926025e-07, -2.5425106287002563e-07, -2.1606683731079102e-07, -1.778826117515564e-07, -1.3969838619232178e-07, -1.0151416063308716e-07, -6.332993507385254e-08, -2.514570951461792e-08, 1.30385160446167e-08, 5.122274160385132e-08, 8.940696716308594e-08, 1.2759119272232056e-07, 1.6577541828155518e-07, 2.039596438407898e-07, 2.421438694000244e-07, 2.8032809495925903e-07, 3.1851232051849365e-07, 3.5669654607772827e-07, 3.948807716369629e-07, 4.330649971961975e-07, 4.7124922275543213e-07, 5.094334483146667e-07, 5.476176738739014e-07, 5.85801899433136e-07, 6.239861249923706e-07, 6.621703505516052e-07, 7.003545761108398e-07, 7.385388016700745e-07, 7.767230272293091e-07, 8.149072527885437e-07, 8.530914783477783e-07, 8.912757039070129e-07, 9.294599294662476e-07, 9.676441550254822e-07, 1.0058283805847168e-06, 1.0440126061439514e-06, 1.082196831703186e-06, 1.1203810572624207e-06, 1.1585652828216553e-06, 1.1967495083808899e-06, 1.2349337339401245e-06, 1.2731179594993591e-06, 1.3113021850585938e-06]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 8.0, 12.0, 16.0, 12.0, 17.0, 21.0, 45.0, 64.0, 98.0, 204.0, 1458.0, 854987.0, 190355.0, 762.0, 215.0, 83.0, 47.0, 40.0, 29.0, 19.0, 24.0, 10.0, 3.0, 5.0, 5.0, 4.0, 4.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9921531677246094e-05, -2.903863787651062e-05, -2.8155744075775146e-05, -2.7272850275039673e-05, -2.63899564743042e-05, -2.5507062673568726e-05, -2.4624168872833252e-05, -2.374127507209778e-05, -2.2858381271362305e-05, -2.197548747062683e-05, -2.1092593669891357e-05, -2.0209699869155884e-05, -1.932680606842041e-05, -1.8443912267684937e-05, -1.7561018466949463e-05, -1.667812466621399e-05, -1.5795230865478516e-05, -1.4912337064743042e-05, -1.4029443264007568e-05, -1.3146549463272095e-05, -1.2263655662536621e-05, -1.1380761861801147e-05, -1.0497868061065674e-05, -9.6149742603302e-06, -8.732080459594727e-06, -7.849186658859253e-06, -6.966292858123779e-06, -6.083399057388306e-06, -5.200505256652832e-06, -4.317611455917358e-06, -3.4347176551818848e-06, -2.551823854446411e-06, -1.6689300537109375e-06, -7.860362529754639e-07, 9.685754776000977e-08, 9.797513484954834e-07, 1.862645149230957e-06, 2.7455389499664307e-06, 3.6284327507019043e-06, 4.511326551437378e-06, 5.3942203521728516e-06, 6.277114152908325e-06, 7.160007953643799e-06, 8.042901754379272e-06, 8.925795555114746e-06, 9.80868935585022e-06, 1.0691583156585693e-05, 1.1574476957321167e-05, 1.245737075805664e-05, 1.3340264558792114e-05, 1.4223158359527588e-05, 1.5106052160263062e-05, 1.5988945960998535e-05, 1.687183976173401e-05, 1.7754733562469482e-05, 1.8637627363204956e-05, 1.952052116394043e-05, 2.0403414964675903e-05, 2.1286308765411377e-05, 2.216920256614685e-05, 2.3052096366882324e-05, 2.3934990167617798e-05, 2.481788396835327e-05, 2.5700777769088745e-05, 2.658367156982422e-05]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [6.0, 11.0, 35.0, 99.0, 279.0, 350.0, 159.0, 51.0, 22.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8575390703954326e-07, -3.1141877343543456e-07, -2.3708366825303528e-07, -1.627485488597813e-07, -8.84134294665273e-08, -1.407832428412803e-08, 6.025680931998068e-08, 1.3459194292408938e-07, 2.0892704810648866e-07, 2.8326218171059736e-07, 3.5759728689299664e-07, 4.319323920753959e-07, 5.062674972577952e-07, 5.806026592836133e-07, 6.549377644660126e-07, 7.292728696484119e-07, 8.0360803167423e-07, 8.779431368566293e-07, 9.522782420390286e-07, 1.0266134040648467e-06, 1.1009485660906648e-06, 1.1752836144296452e-06, 1.2496187764554634e-06, 1.3239539384812815e-06, 1.398288986820262e-06, 1.47262414884608e-06, 1.5469591971850605e-06, 1.6212943592108786e-06, 1.695629407549859e-06, 1.7699645695756772e-06, 1.8442997316014953e-06, 1.9186347799404757e-06, 1.992969828279456e-06, 2.0673048766184365e-06, 2.1416401523310924e-06, 2.215975200670073e-06, 2.2903102490090532e-06, 2.3646452973480336e-06, 2.4389805730606895e-06, 2.51331562139967e-06, 2.5876506697386503e-06, 2.6619857180776307e-06, 2.7363209937902866e-06, 2.810656042129267e-06, 2.8849910904682474e-06, 2.959326138807228e-06, 3.0336614145198837e-06, 3.107996462858864e-06, 3.18233173857152e-06, 3.2566667869105004e-06, 3.3310020626231562e-06, 3.4053371109621366e-06, 3.479672159301117e-06, 3.554007435013773e-06, 3.6283424833527533e-06, 3.7026775316917337e-06, 3.7770128074043896e-06, 3.8513480831170455e-06, 3.9256829040823504e-06, 4.000018179795006e-06, 4.074353455507662e-06, 4.148688276472967e-06, 4.223023552185623e-06, 4.297358827898279e-06, 4.371693648863584e-06]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 35.0, 0.0, 0.0, 0.0, 67.0, 0.0, 0.0, 0.0, 105.0, 0.0, 0.0, 0.0, 168.0, 0.0, 0.0, 0.0, 207.0, 0.0, 0.0, 0.0, 166.0, 0.0, 0.0, 0.0, 123.0, 0.0, 0.0, 0.0, 68.0, 0.0, 0.0, 0.0, 36.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-07, -4.6193599700927734e-07, -4.470348358154297e-07, -4.3213367462158203e-07, -4.172325134277344e-07, -4.023313522338867e-07, -3.8743019104003906e-07, -3.725290298461914e-07, -3.5762786865234375e-07, -3.427267074584961e-07, -3.2782554626464844e-07, -3.129243850708008e-07, -2.980232238769531e-07, -2.8312206268310547e-07, -2.682209014892578e-07, -2.5331974029541016e-07, -2.384185791015625e-07, -2.2351741790771484e-07, -2.086162567138672e-07, -1.9371509552001953e-07, -1.7881393432617188e-07, -1.6391277313232422e-07, -1.4901161193847656e-07, -1.341104507446289e-07, -1.1920928955078125e-07, -1.043081283569336e-07, -8.940696716308594e-08, -7.450580596923828e-08, -5.960464477539063e-08, -4.470348358154297e-08, -2.9802322387695312e-08, -1.4901161193847656e-08, 0.0, 1.4901161193847656e-08, 2.9802322387695312e-08, 4.470348358154297e-08, 5.960464477539063e-08, 7.450580596923828e-08, 8.940696716308594e-08, 1.043081283569336e-07, 1.1920928955078125e-07, 1.341104507446289e-07, 1.4901161193847656e-07, 1.6391277313232422e-07, 1.7881393432617188e-07, 1.9371509552001953e-07, 2.086162567138672e-07, 2.2351741790771484e-07, 2.384185791015625e-07, 2.5331974029541016e-07, 2.682209014892578e-07, 2.8312206268310547e-07, 2.980232238769531e-07, 3.129243850708008e-07, 3.2782554626464844e-07, 3.427267074584961e-07, 3.5762786865234375e-07, 3.725290298461914e-07, 3.8743019104003906e-07, 4.023313522338867e-07, 4.172325134277344e-07, 4.3213367462158203e-07, 4.470348358154297e-07, 4.6193599700927734e-07, 4.76837158203125e-07]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 4.0, 10.0, 7.0, 7.0, 9.0, 13.0, 17.0, 19.0, 18.0, 18.0, 27.0, 19.0, 30.0, 31.0, 34.0, 31.0, 54.0, 54.0, 51.0, 44.0, 38.0, 39.0, 53.0, 32.0, 35.0, 42.0, 24.0, 26.0, 29.0, 26.0, 35.0, 19.0, 27.0, 12.0, 14.0, 15.0, 10.0, 11.0, 2.0, 8.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.88671875, -3.7667236328125, -3.646728515625, -3.5267333984375, -3.40673828125, -3.2867431640625, -3.166748046875, -3.0467529296875, -2.9267578125, -2.8067626953125, -2.686767578125, -2.5667724609375, -2.44677734375, -2.3267822265625, -2.206787109375, -2.0867919921875, -1.966796875, -1.8468017578125, -1.726806640625, -1.6068115234375, -1.48681640625, -1.3668212890625, -1.246826171875, -1.1268310546875, -1.0068359375, -0.8868408203125, -0.766845703125, -0.6468505859375, -0.52685546875, -0.4068603515625, -0.286865234375, -0.1668701171875, -0.046875, 0.0731201171875, 0.193115234375, 0.3131103515625, 0.43310546875, 0.5531005859375, 0.673095703125, 0.7930908203125, 0.9130859375, 1.0330810546875, 1.153076171875, 1.2730712890625, 1.39306640625, 1.5130615234375, 1.633056640625, 1.7530517578125, 1.873046875, 1.9930419921875, 2.113037109375, 2.2330322265625, 2.35302734375, 2.4730224609375, 2.593017578125, 2.7130126953125, 2.8330078125, 2.9530029296875, 3.072998046875, 3.1929931640625, 3.31298828125, 3.4329833984375, 3.552978515625, 3.6729736328125, 3.79296875]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 1.0, 4.0, 6.0, 14.0, 21.0, 26.0, 41.0, 56.0, 108.0, 164.0, 257.0, 418.0, 695.0, 1019.0, 1895.0, 3085.0, 5060.0, 8407.0, 15094.0, 28542.0, 73623.0, 300296.0, 431562.0, 100828.0, 35560.0, 17506.0, 9615.0, 5881.0, 3442.0, 2042.0, 1248.0, 762.0, 496.0, 305.0, 178.0, 126.0, 70.0, 43.0, 22.0, 14.0, 9.0, 5.0, 7.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.859375, -4.7081298828125, -4.556884765625, -4.4056396484375, -4.25439453125, -4.1031494140625, -3.951904296875, -3.8006591796875, -3.6494140625, -3.4981689453125, -3.346923828125, -3.1956787109375, -3.04443359375, -2.8931884765625, -2.741943359375, -2.5906982421875, -2.439453125, -2.2882080078125, -2.136962890625, -1.9857177734375, -1.83447265625, -1.6832275390625, -1.531982421875, -1.3807373046875, -1.2294921875, -1.0782470703125, -0.927001953125, -0.7757568359375, -0.62451171875, -0.4732666015625, -0.322021484375, -0.1707763671875, -0.01953125, 0.1317138671875, 0.282958984375, 0.4342041015625, 0.58544921875, 0.7366943359375, 0.887939453125, 1.0391845703125, 1.1904296875, 1.3416748046875, 1.492919921875, 1.6441650390625, 1.79541015625, 1.9466552734375, 2.097900390625, 2.2491455078125, 2.400390625, 2.5516357421875, 2.702880859375, 2.8541259765625, 3.00537109375, 3.1566162109375, 3.307861328125, 3.4591064453125, 3.6103515625, 3.7615966796875, 3.912841796875, 4.0640869140625, 4.21533203125, 4.3665771484375, 4.517822265625, 4.6690673828125, 4.8203125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 4.0, 5.0, 10.0, 8.0, 16.0, 13.0, 15.0, 16.0, 22.0, 26.0, 17.0, 28.0, 33.0, 40.0, 41.0, 29.0, 46.0, 71.0, 114.0, 385.0, 1510.0, 166.0, 63.0, 36.0, 40.0, 36.0, 31.0, 27.0, 36.0, 33.0, 29.0, 21.0, 14.0, 19.0, 10.0, 13.0, 6.0, 5.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1015625, -10.7452392578125, -10.388916015625, -10.0325927734375, -9.67626953125, -9.3199462890625, -8.963623046875, -8.6072998046875, -8.2509765625, -7.8946533203125, -7.538330078125, -7.1820068359375, -6.82568359375, -6.4693603515625, -6.113037109375, -5.7567138671875, -5.400390625, -5.0440673828125, -4.687744140625, -4.3314208984375, -3.97509765625, -3.6187744140625, -3.262451171875, -2.9061279296875, -2.5498046875, -2.1934814453125, -1.837158203125, -1.4808349609375, -1.12451171875, -0.7681884765625, -0.411865234375, -0.0555419921875, 0.30078125, 0.6571044921875, 1.013427734375, 1.3697509765625, 1.72607421875, 2.0823974609375, 2.438720703125, 2.7950439453125, 3.1513671875, 3.5076904296875, 3.864013671875, 4.2203369140625, 4.57666015625, 4.9329833984375, 5.289306640625, 5.6456298828125, 6.001953125, 6.3582763671875, 6.714599609375, 7.0709228515625, 7.42724609375, 7.7835693359375, 8.139892578125, 8.4962158203125, 8.8525390625, 9.2088623046875, 9.565185546875, 9.9215087890625, 10.27783203125, 10.6341552734375, 10.990478515625, 11.3468017578125, 11.703125]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 5.0, 9.0, 13.0, 22.0, 34.0, 41.0, 52.0, 66.0, 103.0, 111.0, 166.0, 318.0, 847.0, 3134.0, 14541.0, 146782.0, 2832732.0, 128140.0, 13923.0, 2782.0, 856.0, 323.0, 206.0, 114.0, 80.0, 78.0, 54.0, 39.0, 33.0, 29.0, 18.0, 9.0, 11.0, 7.0, 8.0, 1.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.484375, -13.0560302734375, -12.627685546875, -12.1993408203125, -11.77099609375, -11.3426513671875, -10.914306640625, -10.4859619140625, -10.0576171875, -9.6292724609375, -9.200927734375, -8.7725830078125, -8.34423828125, -7.9158935546875, -7.487548828125, -7.0592041015625, -6.630859375, -6.2025146484375, -5.774169921875, -5.3458251953125, -4.91748046875, -4.4891357421875, -4.060791015625, -3.6324462890625, -3.2041015625, -2.7757568359375, -2.347412109375, -1.9190673828125, -1.49072265625, -1.0623779296875, -0.634033203125, -0.2056884765625, 0.22265625, 0.6510009765625, 1.079345703125, 1.5076904296875, 1.93603515625, 2.3643798828125, 2.792724609375, 3.2210693359375, 3.6494140625, 4.0777587890625, 4.506103515625, 4.9344482421875, 5.36279296875, 5.7911376953125, 6.219482421875, 6.6478271484375, 7.076171875, 7.5045166015625, 7.932861328125, 8.3612060546875, 8.78955078125, 9.2178955078125, 9.646240234375, 10.0745849609375, 10.5029296875, 10.9312744140625, 11.359619140625, 11.7879638671875, 12.21630859375, 12.6446533203125, 13.072998046875, 13.5013427734375, 13.9296875]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [36.0, 437.0, 512.0, 32.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.806355953216553, -3.492382764816284, -0.17840957641601562, 3.135563373565674, 6.4495368003845215, 9.763509750366211, 13.077482223510742, 16.391456604003906, 19.705429077148438, 23.01940155029297, 26.333375930786133, 29.647348403930664, 32.96132278442383, 36.27529525756836, 39.58926773071289, 42.90324401855469, 46.21721649169922, 49.53118896484375, 52.84516143798828, 56.15913391113281, 59.47311019897461, 62.78708267211914, 66.10105895996094, 69.41503143310547, 72.72900390625, 76.04297637939453, 79.35694885253906, 82.6709213256836, 85.98489379882812, 89.29887390136719, 92.61283874511719, 95.92681884765625, 99.24079132080078, 102.55476379394531, 105.86873626708984, 109.18270874023438, 112.4966812133789, 115.81065368652344, 119.1246337890625, 122.43860626220703, 125.75257873535156, 129.06655883789062, 132.38052368164062, 135.6945037841797, 139.0084686279297, 142.32244873046875, 145.63641357421875, 148.9503936767578, 152.2643585205078, 155.57833862304688, 158.89230346679688, 162.20628356933594, 165.52024841308594, 168.834228515625, 172.148193359375, 175.46217346191406, 178.77615356445312, 182.0901336669922, 185.4040985107422, 188.71807861328125, 192.03204345703125, 195.3460235595703, 198.6599884033203, 201.97396850585938, 205.28793334960938]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 9.0, 8.0, 17.0, 17.0, 9.0, 8.0, 18.0, 24.0, 28.0, 25.0, 49.0, 30.0, 38.0, 41.0, 31.0, 33.0, 59.0, 49.0, 46.0, 49.0, 36.0, 41.0, 41.0, 35.0, 37.0, 35.0, 25.0, 23.0, 26.0, 20.0, 19.0, 16.0, 10.0, 5.0, 12.0, 8.0, 5.0, 7.0, 0.0, 2.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.620820999145508, -28.647905349731445, -27.67498779296875, -26.702072143554688, -25.729154586791992, -24.75623893737793, -23.783321380615234, -22.810405731201172, -21.83749008178711, -20.864574432373047, -19.89165687561035, -18.91874122619629, -17.945823669433594, -16.97290802001953, -15.999991416931152, -15.027074813842773, -14.054157257080078, -13.0812406539917, -12.10832405090332, -11.135408401489258, -10.162490844726562, -9.1895751953125, -8.216658592224121, -7.243741989135742, -6.270825386047363, -5.297908782958984, -4.3249921798706055, -3.3520760536193848, -2.379159450531006, -1.406242847442627, -0.43332672119140625, 0.5395898818969727, 1.5125083923339844, 2.4854249954223633, 3.458341360092163, 4.431257724761963, 5.404174327850342, 6.377090930938721, 7.350007057189941, 8.32292366027832, 9.2958402633667, 10.268756866455078, 11.241673469543457, 12.214590072631836, 13.187505722045898, 14.160423278808594, 15.133338928222656, 16.10625457763672, 17.079172134399414, 18.052087783813477, 19.025005340576172, 19.997920989990234, 20.97083854675293, 21.943754196166992, 22.916671752929688, 23.88958740234375, 24.862503051757812, 25.835418701171875, 26.80833625793457, 27.781251907348633, 28.754169464111328, 29.72708511352539, 30.700000762939453, 31.67291831970215, 32.645835876464844]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 3.0, 7.0, 5.0, 11.0, 15.0, 17.0, 15.0, 20.0, 23.0, 19.0, 21.0, 24.0, 31.0, 27.0, 32.0, 39.0, 44.0, 53.0, 53.0, 44.0, 37.0, 33.0, 45.0, 40.0, 34.0, 35.0, 29.0, 33.0, 23.0, 25.0, 31.0, 15.0, 23.0, 17.0, 15.0, 15.0, 9.0, 10.0, 5.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.9765625, -3.856170654296875, -3.73577880859375, -3.615386962890625, -3.4949951171875, -3.374603271484375, -3.25421142578125, -3.133819580078125, -3.013427734375, -2.893035888671875, -2.77264404296875, -2.652252197265625, -2.5318603515625, -2.411468505859375, -2.29107666015625, -2.170684814453125, -2.05029296875, -1.929901123046875, -1.80950927734375, -1.689117431640625, -1.5687255859375, -1.448333740234375, -1.32794189453125, -1.207550048828125, -1.087158203125, -0.966766357421875, -0.84637451171875, -0.725982666015625, -0.6055908203125, -0.485198974609375, -0.36480712890625, -0.244415283203125, -0.1240234375, -0.003631591796875, 0.11676025390625, 0.237152099609375, 0.3575439453125, 0.477935791015625, 0.59832763671875, 0.718719482421875, 0.839111328125, 0.959503173828125, 1.07989501953125, 1.200286865234375, 1.3206787109375, 1.441070556640625, 1.56146240234375, 1.681854248046875, 1.80224609375, 1.922637939453125, 2.04302978515625, 2.163421630859375, 2.2838134765625, 2.404205322265625, 2.52459716796875, 2.644989013671875, 2.765380859375, 2.885772705078125, 3.00616455078125, 3.126556396484375, 3.2469482421875, 3.367340087890625, 3.48773193359375, 3.608123779296875, 3.728515625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 5.0, 1.0, 2.0, 4.0, 6.0, 15.0, 12.0, 18.0, 26.0, 42.0, 46.0, 75.0, 99.0, 135.0, 224.0, 331.0, 463.0, 685.0, 1171.0, 1979.0, 3397.0, 5811.0, 11036.0, 22702.0, 52305.0, 140142.0, 470734.0, 1599023.0, 1324111.0, 359749.0, 112734.0, 43659.0, 19988.0, 10068.0, 5459.0, 3075.0, 1753.0, 1086.0, 689.0, 447.0, 294.0, 195.0, 132.0, 93.0, 60.0, 66.0, 43.0, 29.0, 23.0, 9.0, 9.0, 10.0, 7.0, 5.0, 4.0, 3.0, 2.0, 3.0], "bins": [-5.95703125, -5.78131103515625, -5.6055908203125, -5.42987060546875, -5.254150390625, -5.07843017578125, -4.9027099609375, -4.72698974609375, -4.55126953125, -4.37554931640625, -4.1998291015625, -4.02410888671875, -3.848388671875, -3.67266845703125, -3.4969482421875, -3.32122802734375, -3.1455078125, -2.96978759765625, -2.7940673828125, -2.61834716796875, -2.442626953125, -2.26690673828125, -2.0911865234375, -1.91546630859375, -1.73974609375, -1.56402587890625, -1.3883056640625, -1.21258544921875, -1.036865234375, -0.86114501953125, -0.6854248046875, -0.50970458984375, -0.333984375, -0.15826416015625, 0.0174560546875, 0.19317626953125, 0.368896484375, 0.54461669921875, 0.7203369140625, 0.89605712890625, 1.07177734375, 1.24749755859375, 1.4232177734375, 1.59893798828125, 1.774658203125, 1.95037841796875, 2.1260986328125, 2.30181884765625, 2.4775390625, 2.65325927734375, 2.8289794921875, 3.00469970703125, 3.180419921875, 3.35614013671875, 3.5318603515625, 3.70758056640625, 3.88330078125, 4.05902099609375, 4.2347412109375, 4.41046142578125, 4.586181640625, 4.76190185546875, 4.9376220703125, 5.11334228515625, 5.2890625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 9.0, 9.0, 16.0, 12.0, 23.0, 47.0, 45.0, 64.0, 82.0, 118.0, 161.0, 195.0, 316.0, 393.0, 495.0, 517.0, 414.0, 283.0, 241.0, 164.0, 111.0, 93.0, 60.0, 47.0, 47.0, 19.0, 22.0, 16.0, 11.0, 7.0, 5.0, 11.0, 9.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.109375, -6.90020751953125, -6.6910400390625, -6.48187255859375, -6.272705078125, -6.06353759765625, -5.8543701171875, -5.64520263671875, -5.43603515625, -5.22686767578125, -5.0177001953125, -4.80853271484375, -4.599365234375, -4.39019775390625, -4.1810302734375, -3.97186279296875, -3.7626953125, -3.55352783203125, -3.3443603515625, -3.13519287109375, -2.926025390625, -2.71685791015625, -2.5076904296875, -2.29852294921875, -2.08935546875, -1.88018798828125, -1.6710205078125, -1.46185302734375, -1.252685546875, -1.04351806640625, -0.8343505859375, -0.62518310546875, -0.416015625, -0.20684814453125, 0.0023193359375, 0.21148681640625, 0.420654296875, 0.62982177734375, 0.8389892578125, 1.04815673828125, 1.25732421875, 1.46649169921875, 1.6756591796875, 1.88482666015625, 2.093994140625, 2.30316162109375, 2.5123291015625, 2.72149658203125, 2.9306640625, 3.13983154296875, 3.3489990234375, 3.55816650390625, 3.767333984375, 3.97650146484375, 4.1856689453125, 4.39483642578125, 4.60400390625, 4.81317138671875, 5.0223388671875, 5.23150634765625, 5.440673828125, 5.64984130859375, 5.8590087890625, 6.06817626953125, 6.27734375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 9.0, 8.0, 13.0, 13.0, 19.0, 18.0, 33.0, 42.0, 66.0, 118.0, 184.0, 305.0, 541.0, 1269.0, 3242.0, 11446.0, 64011.0, 689405.0, 3071211.0, 304870.0, 35425.0, 7602.0, 2367.0, 947.0, 437.0, 241.0, 159.0, 81.0, 56.0, 44.0, 25.0, 25.0, 14.0, 10.0, 9.0, 3.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.984375, -14.50634765625, -14.0283203125, -13.55029296875, -13.072265625, -12.59423828125, -12.1162109375, -11.63818359375, -11.16015625, -10.68212890625, -10.2041015625, -9.72607421875, -9.248046875, -8.77001953125, -8.2919921875, -7.81396484375, -7.3359375, -6.85791015625, -6.3798828125, -5.90185546875, -5.423828125, -4.94580078125, -4.4677734375, -3.98974609375, -3.51171875, -3.03369140625, -2.5556640625, -2.07763671875, -1.599609375, -1.12158203125, -0.6435546875, -0.16552734375, 0.3125, 0.79052734375, 1.2685546875, 1.74658203125, 2.224609375, 2.70263671875, 3.1806640625, 3.65869140625, 4.13671875, 4.61474609375, 5.0927734375, 5.57080078125, 6.048828125, 6.52685546875, 7.0048828125, 7.48291015625, 7.9609375, 8.43896484375, 8.9169921875, 9.39501953125, 9.873046875, 10.35107421875, 10.8291015625, 11.30712890625, 11.78515625, 12.26318359375, 12.7412109375, 13.21923828125, 13.697265625, 14.17529296875, 14.6533203125, 15.13134765625, 15.609375]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 17.0, 61.0, 212.0, 353.0, 264.0, 86.0, 15.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-170.74615478515625, -167.5551300048828, -164.36410522460938, -161.17308044433594, -157.98207092285156, -154.79104614257812, -151.6000213623047, -148.40899658203125, -145.2179718017578, -142.02694702148438, -138.83592224121094, -135.6448974609375, -132.45388793945312, -129.2628631591797, -126.07183837890625, -122.88081359863281, -119.68978881835938, -116.49876403808594, -113.30774688720703, -110.1167221069336, -106.92569732666016, -103.73467254638672, -100.54365539550781, -97.35263061523438, -94.16161346435547, -90.97058868408203, -87.77957153320312, -84.58854675292969, -81.39752197265625, -78.20649719238281, -75.0154800415039, -71.82445526123047, -68.63343048095703, -65.4424057006836, -62.25138473510742, -59.06036376953125, -55.86933898925781, -52.67831802368164, -49.48729705810547, -46.29627227783203, -43.105247497558594, -39.91422653198242, -36.723201751708984, -33.53218078613281, -30.341156005859375, -27.150135040283203, -23.9591121673584, -20.768089294433594, -17.577068328857422, -14.386045455932617, -11.195022583007812, -8.004000663757324, -4.8129777908325195, -1.6219549179077148, 1.5690670013427734, 4.760089874267578, 7.951112747192383, 11.142135620117188, 14.333158493041992, 17.524181365966797, 20.71520233154297, 23.906227111816406, 27.097248077392578, 30.288270950317383, 33.47929382324219]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 3.0, 8.0, 4.0, 13.0, 9.0, 9.0, 6.0, 20.0, 13.0, 15.0, 22.0, 19.0, 27.0, 20.0, 36.0, 37.0, 32.0, 49.0, 48.0, 44.0, 44.0, 40.0, 60.0, 45.0, 39.0, 38.0, 39.0, 32.0, 43.0, 24.0, 24.0, 26.0, 28.0, 23.0, 13.0, 15.0, 6.0, 6.0, 8.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.090110778808594, -22.3328914642334, -21.575674057006836, -20.81845474243164, -20.061235427856445, -19.30401611328125, -18.546798706054688, -17.789579391479492, -17.032360076904297, -16.2751407623291, -15.517922401428223, -14.760704040527344, -14.003484725952148, -13.24626636505127, -12.48904800415039, -11.731828689575195, -10.974611282348633, -10.217392921447754, -9.460173606872559, -8.70295524597168, -7.945736408233643, -7.1885175704956055, -6.431299209594727, -5.6740803718566895, -4.916861534118652, -4.159642696380615, -3.4024240970611572, -2.645205497741699, -1.887986660003662, -1.130767822265625, -0.3735494613647461, 0.383669376373291, 1.1408882141113281, 1.8981069326400757, 2.6553256511688232, 3.4125442504882812, 4.169763088226318, 4.9269819259643555, 5.684200286865234, 6.4414191246032715, 7.198637962341309, 7.955856800079346, 8.713075637817383, 9.470293998718262, 10.22751235961914, 10.984731674194336, 11.741950035095215, 12.499168395996094, 13.256387710571289, 14.013606071472168, 14.770825386047363, 15.528043746948242, 16.285263061523438, 17.04248046875, 17.799699783325195, 18.55691909790039, 19.314136505126953, 20.07135581970215, 20.82857322692871, 21.585792541503906, 22.3430118560791, 23.100231170654297, 23.85744857788086, 24.614667892456055, 25.37188720703125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 1.0, 3.0, 5.0, 6.0, 5.0, 4.0, 12.0, 15.0, 21.0, 23.0, 16.0, 22.0, 27.0, 24.0, 33.0, 34.0, 33.0, 27.0, 48.0, 49.0, 41.0, 44.0, 54.0, 47.0, 52.0, 27.0, 48.0, 32.0, 33.0, 29.0, 26.0, 29.0, 28.0, 14.0, 15.0, 12.0, 9.0, 16.0, 4.0, 9.0, 13.0, 7.0, 6.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.896484375, -3.766815185546875, -3.63714599609375, -3.507476806640625, -3.3778076171875, -3.248138427734375, -3.11846923828125, -2.988800048828125, -2.859130859375, -2.729461669921875, -2.59979248046875, -2.470123291015625, -2.3404541015625, -2.210784912109375, -2.08111572265625, -1.951446533203125, -1.82177734375, -1.692108154296875, -1.56243896484375, -1.432769775390625, -1.3031005859375, -1.173431396484375, -1.04376220703125, -0.914093017578125, -0.784423828125, -0.654754638671875, -0.52508544921875, -0.395416259765625, -0.2657470703125, -0.136077880859375, -0.00640869140625, 0.123260498046875, 0.2529296875, 0.382598876953125, 0.51226806640625, 0.641937255859375, 0.7716064453125, 0.901275634765625, 1.03094482421875, 1.160614013671875, 1.290283203125, 1.419952392578125, 1.54962158203125, 1.679290771484375, 1.8089599609375, 1.938629150390625, 2.06829833984375, 2.197967529296875, 2.32763671875, 2.457305908203125, 2.58697509765625, 2.716644287109375, 2.8463134765625, 2.975982666015625, 3.10565185546875, 3.235321044921875, 3.364990234375, 3.494659423828125, 3.62432861328125, 3.753997802734375, 3.8836669921875, 4.013336181640625, 4.14300537109375, 4.272674560546875, 4.40234375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 6.0, 3.0, 7.0, 6.0, 15.0, 23.0, 28.0, 45.0, 59.0, 76.0, 142.0, 166.0, 238.0, 336.0, 484.0, 718.0, 949.0, 1453.0, 2032.0, 3038.0, 4137.0, 5982.0, 8689.0, 12872.0, 19053.0, 28976.0, 45226.0, 73658.0, 126919.0, 221421.0, 195757.0, 109671.0, 64975.0, 40383.0, 25914.0, 17329.0, 11605.0, 8081.0, 5509.0, 3779.0, 2618.0, 1836.0, 1296.0, 923.0, 670.0, 449.0, 296.0, 192.0, 153.0, 112.0, 86.0, 53.0, 31.0, 41.0, 20.0, 9.0, 14.0, 4.0, 5.0, 1.0, 2.0], "bins": [-0.0235595703125, -0.022842884063720703, -0.022126197814941406, -0.02140951156616211, -0.020692825317382812, -0.019976139068603516, -0.01925945281982422, -0.018542766571044922, -0.017826080322265625, -0.017109394073486328, -0.01639270782470703, -0.015676021575927734, -0.014959335327148438, -0.01424264907836914, -0.013525962829589844, -0.012809276580810547, -0.01209259033203125, -0.011375904083251953, -0.010659217834472656, -0.00994253158569336, -0.009225845336914062, -0.008509159088134766, -0.007792472839355469, -0.007075786590576172, -0.006359100341796875, -0.005642414093017578, -0.004925727844238281, -0.004209041595458984, -0.0034923553466796875, -0.0027756690979003906, -0.0020589828491210938, -0.0013422966003417969, -0.0006256103515625, 9.107589721679688e-05, 0.0008077621459960938, 0.0015244483947753906, 0.0022411346435546875, 0.0029578208923339844, 0.0036745071411132812, 0.004391193389892578, 0.005107879638671875, 0.005824565887451172, 0.006541252136230469, 0.007257938385009766, 0.007974624633789062, 0.00869131088256836, 0.009407997131347656, 0.010124683380126953, 0.01084136962890625, 0.011558055877685547, 0.012274742126464844, 0.01299142837524414, 0.013708114624023438, 0.014424800872802734, 0.015141487121582031, 0.015858173370361328, 0.016574859619140625, 0.017291545867919922, 0.01800823211669922, 0.018724918365478516, 0.019441604614257812, 0.02015829086303711, 0.020874977111816406, 0.021591663360595703, 0.022308349609375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 7.0, 1.0, 3.0, 9.0, 18.0, 10.0, 12.0, 5.0, 21.0, 13.0, 18.0, 34.0, 22.0, 23.0, 22.0, 31.0, 36.0, 28.0, 30.0, 46.0, 40.0, 32.0, 48.0, 1060.0, 32.0, 38.0, 34.0, 31.0, 28.0, 34.0, 30.0, 33.0, 24.0, 28.0, 25.0, 24.0, 15.0, 16.0, 13.0, 8.0, 7.0, 8.0, 8.0, 8.0, 1.0, 6.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.486328125, -3.378021240234375, -3.26971435546875, -3.161407470703125, -3.0531005859375, -2.944793701171875, -2.83648681640625, -2.728179931640625, -2.619873046875, -2.511566162109375, -2.40325927734375, -2.294952392578125, -2.1866455078125, -2.078338623046875, -1.97003173828125, -1.861724853515625, -1.75341796875, -1.645111083984375, -1.53680419921875, -1.428497314453125, -1.3201904296875, -1.211883544921875, -1.10357666015625, -0.995269775390625, -0.886962890625, -0.778656005859375, -0.67034912109375, -0.562042236328125, -0.4537353515625, -0.345428466796875, -0.23712158203125, -0.128814697265625, -0.0205078125, 0.087799072265625, 0.19610595703125, 0.304412841796875, 0.4127197265625, 0.521026611328125, 0.62933349609375, 0.737640380859375, 0.845947265625, 0.954254150390625, 1.06256103515625, 1.170867919921875, 1.2791748046875, 1.387481689453125, 1.49578857421875, 1.604095458984375, 1.71240234375, 1.820709228515625, 1.92901611328125, 2.037322998046875, 2.1456298828125, 2.253936767578125, 2.36224365234375, 2.470550537109375, 2.578857421875, 2.687164306640625, 2.79547119140625, 2.903778076171875, 3.0120849609375, 3.120391845703125, 3.22869873046875, 3.337005615234375, 3.4453125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 14.0, 6.0, 23.0, 38.0, 34.0, 67.0, 91.0, 127.0, 166.0, 248.0, 386.0, 555.0, 729.0, 1124.0, 1582.0, 2344.0, 3392.0, 5299.0, 7841.0, 11614.0, 17411.0, 27463.0, 42470.0, 67740.0, 113124.0, 194589.0, 1259575.0, 127986.0, 75648.0, 46810.0, 30423.0, 19333.0, 12706.0, 8554.0, 5730.0, 3642.0, 2576.0, 1775.0, 1206.0, 754.0, 603.0, 424.0, 302.0, 167.0, 112.0, 101.0, 74.0, 59.0, 38.0, 21.0, 13.0, 6.0, 5.0, 9.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.012420654296875, -0.012033820152282715, -0.01164698600769043, -0.011260151863098145, -0.01087331771850586, -0.010486483573913574, -0.010099649429321289, -0.009712815284729004, -0.009325981140136719, -0.008939146995544434, -0.008552312850952148, -0.008165478706359863, -0.007778644561767578, -0.007391810417175293, -0.007004976272583008, -0.006618142127990723, -0.0062313079833984375, -0.005844473838806152, -0.005457639694213867, -0.005070805549621582, -0.004683971405029297, -0.004297137260437012, -0.0039103031158447266, -0.0035234689712524414, -0.0031366348266601562, -0.002749800682067871, -0.002362966537475586, -0.0019761323928833008, -0.0015892982482910156, -0.0012024641036987305, -0.0008156299591064453, -0.00042879581451416016, -4.1961669921875e-05, 0.00034487247467041016, 0.0007317066192626953, 0.0011185407638549805, 0.0015053749084472656, 0.0018922090530395508, 0.002279043197631836, 0.002665877342224121, 0.0030527114868164062, 0.0034395456314086914, 0.0038263797760009766, 0.004213213920593262, 0.004600048065185547, 0.004986882209777832, 0.005373716354370117, 0.005760550498962402, 0.0061473846435546875, 0.006534218788146973, 0.006921052932739258, 0.007307887077331543, 0.007694721221923828, 0.008081555366516113, 0.008468389511108398, 0.008855223655700684, 0.009242057800292969, 0.009628891944885254, 0.010015726089477539, 0.010402560234069824, 0.01078939437866211, 0.011176228523254395, 0.01156306266784668, 0.011949896812438965, 0.01233673095703125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 5.0, 5.0, 0.0, 4.0, 8.0, 0.0, 8.0, 8.0, 0.0, 21.0, 24.0, 0.0, 39.0, 80.0, 0.0, 154.0, 267.0, 0.0, 148.0, 79.0, 0.0, 52.0, 33.0, 0.0, 29.0, 12.0, 0.0, 8.0, 9.0, 0.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-06, -1.152046024799347e-06, -1.1119991540908813e-06, -1.0719522833824158e-06, -1.0319054126739502e-06, -9.918585419654846e-07, -9.51811671257019e-07, -9.117648005485535e-07, -8.717179298400879e-07, -8.316710591316223e-07, -7.916241884231567e-07, -7.515773177146912e-07, -7.115304470062256e-07, -6.7148357629776e-07, -6.314367055892944e-07, -5.913898348808289e-07, -5.513429641723633e-07, -5.112960934638977e-07, -4.7124922275543213e-07, -4.3120235204696655e-07, -3.91155481338501e-07, -3.511086106300354e-07, -3.110617399215698e-07, -2.7101486921310425e-07, -2.3096799850463867e-07, -1.909211277961731e-07, -1.5087425708770752e-07, -1.1082738637924194e-07, -7.078051567077637e-08, -3.073364496231079e-08, 9.313225746154785e-09, 4.936009645462036e-08, 8.940696716308594e-08, 1.2945383787155151e-07, 1.695007085800171e-07, 2.0954757928848267e-07, 2.4959444999694824e-07, 2.896413207054138e-07, 3.296881914138794e-07, 3.6973506212234497e-07, 4.0978193283081055e-07, 4.498288035392761e-07, 4.898756742477417e-07, 5.299225449562073e-07, 5.699694156646729e-07, 6.100162863731384e-07, 6.50063157081604e-07, 6.901100277900696e-07, 7.301568984985352e-07, 7.702037692070007e-07, 8.102506399154663e-07, 8.502975106239319e-07, 8.903443813323975e-07, 9.30391252040863e-07, 9.704381227493286e-07, 1.0104849934577942e-06, 1.0505318641662598e-06, 1.0905787348747253e-06, 1.130625605583191e-06, 1.1706724762916565e-06, 1.210719347000122e-06, 1.2507662177085876e-06, 1.2908130884170532e-06, 1.3308599591255188e-06, 1.3709068298339844e-06]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 7.0, 7.0, 7.0, 10.0, 19.0, 22.0, 40.0, 66.0, 82.0, 185.0, 712.0, 170858.0, 875121.0, 982.0, 187.0, 87.0, 49.0, 25.0, 22.0, 19.0, 6.0, 8.0, 5.0, 4.0, 4.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.1948089599609375e-05, -3.101024776697159e-05, -3.00724059343338e-05, -2.9134564101696014e-05, -2.8196722269058228e-05, -2.725888043642044e-05, -2.6321038603782654e-05, -2.5383196771144867e-05, -2.444535493850708e-05, -2.3507513105869293e-05, -2.2569671273231506e-05, -2.163182944059372e-05, -2.0693987607955933e-05, -1.9756145775318146e-05, -1.881830394268036e-05, -1.7880462110042572e-05, -1.6942620277404785e-05, -1.6004778444766998e-05, -1.5066936612129211e-05, -1.4129094779491425e-05, -1.3191252946853638e-05, -1.225341111421585e-05, -1.1315569281578064e-05, -1.0377727448940277e-05, -9.43988561630249e-06, -8.502043783664703e-06, -7.5642019510269165e-06, -6.62636011838913e-06, -5.688518285751343e-06, -4.750676453113556e-06, -3.812834620475769e-06, -2.874992787837982e-06, -1.9371509552001953e-06, -9.993091225624084e-07, -6.146728992462158e-08, 8.763745427131653e-07, 1.8142163753509521e-06, 2.752058207988739e-06, 3.689900040626526e-06, 4.627741873264313e-06, 5.5655837059021e-06, 6.5034255385398865e-06, 7.441267371177673e-06, 8.37910920381546e-06, 9.316951036453247e-06, 1.0254792869091034e-05, 1.119263470172882e-05, 1.2130476534366608e-05, 1.3068318367004395e-05, 1.4006160199642181e-05, 1.4944002032279968e-05, 1.5881843864917755e-05, 1.6819685697555542e-05, 1.775752753019333e-05, 1.8695369362831116e-05, 1.9633211195468903e-05, 2.057105302810669e-05, 2.1508894860744476e-05, 2.2446736693382263e-05, 2.338457852602005e-05, 2.4322420358657837e-05, 2.5260262191295624e-05, 2.619810402393341e-05, 2.7135945856571198e-05, 2.8073787689208984e-05]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 6.0, 6.0, 17.0, 51.0, 131.0, 204.0, 288.0, 167.0, 78.0, 34.0, 17.0, 9.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.900216481473763e-07, -4.425238842031831e-07, -3.9502612025899e-07, -3.475283278930874e-07, -3.0003056394889427e-07, -2.5253280000470113e-07, -2.0503500763879856e-07, -1.5753724369460542e-07, -1.1003947975041228e-07, -6.254170870079179e-08, -1.504393765117129e-08, 3.245384050387656e-08, 7.99516044480697e-08, 1.2744936839226284e-07, 1.749471607581654e-07, 2.2244492470235855e-07, 2.699426886465517e-07, 3.174404525907448e-07, 3.6493821653493796e-07, 4.1243600890084053e-07, 4.5993377284503367e-07, 5.074315367892268e-07, 5.549293291551294e-07, 6.02427121521032e-07, 6.499248570435157e-07, 6.974226494094182e-07, 7.449203849319019e-07, 7.924181772978045e-07, 8.399159696637071e-07, 8.874137051861908e-07, 9.349114975520934e-07, 9.82409233074577e-07, 1.0299070254404796e-06, 1.0774048178063822e-06, 1.1249026101722848e-06, 1.1724002888513496e-06, 1.2198980812172522e-06, 1.2673958735831548e-06, 1.3148936659490573e-06, 1.3623914583149599e-06, 1.4098891369940247e-06, 1.4573869293599273e-06, 1.5048847217258299e-06, 1.5523824004048947e-06, 1.5998801927707973e-06, 1.6473779851366999e-06, 1.6948757775026024e-06, 1.742373569868505e-06, 1.7898713622344076e-06, 1.8373691546003101e-06, 1.8848669469662127e-06, 1.9323647393321153e-06, 1.97986241801118e-06, 2.027360096690245e-06, 2.0748580027429853e-06, 2.12235568142205e-06, 2.1698535874747904e-06, 2.2173512661538552e-06, 2.2648491722065955e-06, 2.3123468508856604e-06, 2.3598447569384007e-06, 2.4073424356174655e-06, 2.454840341670206e-06, 2.5023380203492707e-06, 2.5498356990283355e-06]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 30.0, 0.0, 0.0, 0.0, 0.0, 43.0, 0.0, 0.0, 0.0, 103.0, 0.0, 0.0, 0.0, 192.0, 0.0, 0.0, 0.0, 228.0, 0.0, 0.0, 0.0, 0.0, 203.0, 0.0, 0.0, 0.0, 110.0, 0.0, 0.0, 0.0, 66.0, 0.0, 0.0, 0.0, 18.0, 0.0, 0.0, 0.0, 0.0, 11.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.172325134277344e-07, -4.032626748085022e-07, -3.8929283618927e-07, -3.7532299757003784e-07, -3.6135315895080566e-07, -3.473833203315735e-07, -3.334134817123413e-07, -3.1944364309310913e-07, -3.0547380447387695e-07, -2.915039658546448e-07, -2.775341272354126e-07, -2.635642886161804e-07, -2.4959444999694824e-07, -2.3562461137771606e-07, -2.2165477275848389e-07, -2.076849341392517e-07, -1.9371509552001953e-07, -1.7974525690078735e-07, -1.6577541828155518e-07, -1.51805579662323e-07, -1.3783574104309082e-07, -1.2386590242385864e-07, -1.0989606380462646e-07, -9.592622518539429e-08, -8.195638656616211e-08, -6.798654794692993e-08, -5.4016709327697754e-08, -4.0046870708465576e-08, -2.60770320892334e-08, -1.210719347000122e-08, 1.862645149230957e-09, 1.5832483768463135e-08, 2.9802322387695312e-08, 4.377216100692749e-08, 5.774199962615967e-08, 7.171183824539185e-08, 8.568167686462402e-08, 9.96515154838562e-08, 1.1362135410308838e-07, 1.2759119272232056e-07, 1.4156103134155273e-07, 1.555308699607849e-07, 1.695007085800171e-07, 1.8347054719924927e-07, 1.9744038581848145e-07, 2.1141022443771362e-07, 2.253800630569458e-07, 2.39349901676178e-07, 2.5331974029541016e-07, 2.6728957891464233e-07, 2.812594175338745e-07, 2.952292561531067e-07, 3.0919909477233887e-07, 3.2316893339157104e-07, 3.371387720108032e-07, 3.511086106300354e-07, 3.650784492492676e-07, 3.7904828786849976e-07, 3.9301812648773193e-07, 4.069879651069641e-07, 4.209578037261963e-07, 4.3492764234542847e-07, 4.4889748096466064e-07, 4.628673195838928e-07, 4.76837158203125e-07]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 1.0, 3.0, 5.0, 6.0, 5.0, 4.0, 12.0, 15.0, 21.0, 23.0, 16.0, 22.0, 27.0, 24.0, 33.0, 34.0, 33.0, 27.0, 48.0, 49.0, 41.0, 44.0, 54.0, 47.0, 52.0, 27.0, 48.0, 32.0, 33.0, 29.0, 26.0, 29.0, 28.0, 14.0, 15.0, 12.0, 9.0, 16.0, 4.0, 9.0, 13.0, 7.0, 6.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.896484375, -3.766815185546875, -3.63714599609375, -3.507476806640625, -3.3778076171875, -3.248138427734375, -3.11846923828125, -2.988800048828125, -2.859130859375, -2.729461669921875, -2.59979248046875, -2.470123291015625, -2.3404541015625, -2.210784912109375, -2.08111572265625, -1.951446533203125, -1.82177734375, -1.692108154296875, -1.56243896484375, -1.432769775390625, -1.3031005859375, -1.173431396484375, -1.04376220703125, -0.914093017578125, -0.784423828125, -0.654754638671875, -0.52508544921875, -0.395416259765625, -0.2657470703125, -0.136077880859375, -0.00640869140625, 0.123260498046875, 0.2529296875, 0.382598876953125, 0.51226806640625, 0.641937255859375, 0.7716064453125, 0.901275634765625, 1.03094482421875, 1.160614013671875, 1.290283203125, 1.419952392578125, 1.54962158203125, 1.679290771484375, 1.8089599609375, 1.938629150390625, 2.06829833984375, 2.197967529296875, 2.32763671875, 2.457305908203125, 2.58697509765625, 2.716644287109375, 2.8463134765625, 2.975982666015625, 3.10565185546875, 3.235321044921875, 3.364990234375, 3.494659423828125, 3.62432861328125, 3.753997802734375, 3.8836669921875, 4.013336181640625, 4.14300537109375, 4.272674560546875, 4.40234375]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 6.0, 2.0, 14.0, 6.0, 15.0, 16.0, 29.0, 26.0, 44.0, 58.0, 93.0, 133.0, 200.0, 275.0, 433.0, 611.0, 896.0, 1450.0, 2226.0, 3546.0, 5311.0, 8293.0, 13026.0, 21130.0, 37355.0, 91105.0, 572685.0, 171428.0, 48967.0, 25637.0, 15533.0, 9931.0, 6268.0, 4170.0, 2651.0, 1653.0, 1084.0, 756.0, 449.0, 313.0, 216.0, 164.0, 106.0, 70.0, 45.0, 48.0, 32.0, 16.0, 15.0, 7.0, 8.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.890625, -4.72589111328125, -4.5611572265625, -4.39642333984375, -4.231689453125, -4.06695556640625, -3.9022216796875, -3.73748779296875, -3.57275390625, -3.40802001953125, -3.2432861328125, -3.07855224609375, -2.913818359375, -2.74908447265625, -2.5843505859375, -2.41961669921875, -2.2548828125, -2.09014892578125, -1.9254150390625, -1.76068115234375, -1.595947265625, -1.43121337890625, -1.2664794921875, -1.10174560546875, -0.93701171875, -0.77227783203125, -0.6075439453125, -0.44281005859375, -0.278076171875, -0.11334228515625, 0.0513916015625, 0.21612548828125, 0.380859375, 0.54559326171875, 0.7103271484375, 0.87506103515625, 1.039794921875, 1.20452880859375, 1.3692626953125, 1.53399658203125, 1.69873046875, 1.86346435546875, 2.0281982421875, 2.19293212890625, 2.357666015625, 2.52239990234375, 2.6871337890625, 2.85186767578125, 3.0166015625, 3.18133544921875, 3.3460693359375, 3.51080322265625, 3.675537109375, 3.84027099609375, 4.0050048828125, 4.16973876953125, 4.33447265625, 4.49920654296875, 4.6639404296875, 4.82867431640625, 4.993408203125, 5.15814208984375, 5.3228759765625, 5.48760986328125, 5.65234375]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 8.0, 4.0, 15.0, 7.0, 9.0, 17.0, 14.0, 26.0, 28.0, 22.0, 16.0, 29.0, 32.0, 46.0, 29.0, 52.0, 34.0, 78.0, 106.0, 291.0, 1494.0, 116.0, 97.0, 50.0, 53.0, 43.0, 33.0, 37.0, 33.0, 25.0, 32.0, 22.0, 15.0, 15.0, 24.0, 21.0, 14.0, 11.0, 14.0, 6.0, 7.0, 6.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-11.28125, -10.9501953125, -10.619140625, -10.2880859375, -9.95703125, -9.6259765625, -9.294921875, -8.9638671875, -8.6328125, -8.3017578125, -7.970703125, -7.6396484375, -7.30859375, -6.9775390625, -6.646484375, -6.3154296875, -5.984375, -5.6533203125, -5.322265625, -4.9912109375, -4.66015625, -4.3291015625, -3.998046875, -3.6669921875, -3.3359375, -3.0048828125, -2.673828125, -2.3427734375, -2.01171875, -1.6806640625, -1.349609375, -1.0185546875, -0.6875, -0.3564453125, -0.025390625, 0.3056640625, 0.63671875, 0.9677734375, 1.298828125, 1.6298828125, 1.9609375, 2.2919921875, 2.623046875, 2.9541015625, 3.28515625, 3.6162109375, 3.947265625, 4.2783203125, 4.609375, 4.9404296875, 5.271484375, 5.6025390625, 5.93359375, 6.2646484375, 6.595703125, 6.9267578125, 7.2578125, 7.5888671875, 7.919921875, 8.2509765625, 8.58203125, 8.9130859375, 9.244140625, 9.5751953125, 9.90625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 9.0, 12.0, 13.0, 25.0, 37.0, 53.0, 72.0, 81.0, 145.0, 235.0, 350.0, 910.0, 3741.0, 20809.0, 205423.0, 2792103.0, 104153.0, 13362.0, 2594.0, 753.0, 311.0, 158.0, 125.0, 88.0, 35.0, 36.0, 24.0, 18.0, 8.0, 3.0, 10.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.25, -16.71728515625, -16.1845703125, -15.65185546875, -15.119140625, -14.58642578125, -14.0537109375, -13.52099609375, -12.98828125, -12.45556640625, -11.9228515625, -11.39013671875, -10.857421875, -10.32470703125, -9.7919921875, -9.25927734375, -8.7265625, -8.19384765625, -7.6611328125, -7.12841796875, -6.595703125, -6.06298828125, -5.5302734375, -4.99755859375, -4.46484375, -3.93212890625, -3.3994140625, -2.86669921875, -2.333984375, -1.80126953125, -1.2685546875, -0.73583984375, -0.203125, 0.32958984375, 0.8623046875, 1.39501953125, 1.927734375, 2.46044921875, 2.9931640625, 3.52587890625, 4.05859375, 4.59130859375, 5.1240234375, 5.65673828125, 6.189453125, 6.72216796875, 7.2548828125, 7.78759765625, 8.3203125, 8.85302734375, 9.3857421875, 9.91845703125, 10.451171875, 10.98388671875, 11.5166015625, 12.04931640625, 12.58203125, 13.11474609375, 13.6474609375, 14.18017578125, 14.712890625, 15.24560546875, 15.7783203125, 16.31103515625, 16.84375]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 8.0, 3.0, 9.0, 18.0, 14.0, 26.0, 41.0, 50.0, 59.0, 87.0, 90.0, 101.0, 94.0, 92.0, 71.0, 69.0, 46.0, 40.0, 30.0, 19.0, 11.0, 14.0, 6.0, 5.0, 0.0, 4.0, 1.0, 3.0], "bins": [-23.106103897094727, -22.62194061279297, -22.137779235839844, -21.653615951538086, -21.16945457458496, -20.685291290283203, -20.201129913330078, -19.71696662902832, -19.232805252075195, -18.748641967773438, -18.264480590820312, -17.780317306518555, -17.29615592956543, -16.811992645263672, -16.327831268310547, -15.843667984008789, -15.359504699707031, -14.87534236907959, -14.391180038452148, -13.907017707824707, -13.422855377197266, -12.938692092895508, -12.454530715942383, -11.970367431640625, -11.4862060546875, -11.002043724060059, -10.517881393432617, -10.033719062805176, -9.549556732177734, -9.065393447875977, -8.581232070922852, -8.097068786621094, -7.612906455993652, -7.128744125366211, -6.6445817947387695, -6.160419464111328, -5.6762566566467285, -5.192094326019287, -4.707931995391846, -4.223769187927246, -3.739607095718384, -3.2554447650909424, -2.771282196044922, -2.2871198654174805, -1.8029574155807495, -1.3187949657440186, -0.8346326351165771, -0.35047006607055664, 0.13369226455688477, 0.6178547143936157, 1.1020171642303467, 1.586179494857788, 2.0703420639038086, 2.55450439453125, 3.0386667251586914, 3.522829294204712, 4.006991386413574, 4.491153717041016, 4.975316047668457, 5.459478378295898, 5.943641185760498, 6.4278035163879395, 6.911965847015381, 7.3961286544799805, 7.880290985107422]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 5.0, 4.0, 6.0, 5.0, 13.0, 17.0, 18.0, 16.0, 25.0, 29.0, 22.0, 21.0, 28.0, 37.0, 28.0, 33.0, 31.0, 51.0, 36.0, 47.0, 47.0, 37.0, 42.0, 33.0, 40.0, 32.0, 41.0, 38.0, 31.0, 20.0, 22.0, 20.0, 21.0, 15.0, 18.0, 15.0, 11.0, 14.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 6.0, 4.0, 2.0, 4.0, 0.0, 3.0, 0.0, 2.0], "bins": [-30.62610626220703, -29.68626594543457, -28.746423721313477, -27.806583404541016, -26.866743087768555, -25.926902770996094, -24.987060546875, -24.04722023010254, -23.107379913330078, -22.167539596557617, -21.227697372436523, -20.287857055664062, -19.3480167388916, -18.40817642211914, -17.468334197998047, -16.528493881225586, -15.588652610778809, -14.648811340332031, -13.70897102355957, -12.769129753112793, -11.829289436340332, -10.889448165893555, -9.949607849121094, -9.009766578674316, -8.069925308227539, -7.13008451461792, -6.190243721008301, -5.250402450561523, -4.3105621337890625, -3.370720863342285, -2.430880069732666, -1.4910392761230469, -0.5511989593505859, 0.388641893863678, 1.328482747077942, 2.2683236598968506, 3.2081644535064697, 4.148005485534668, 5.087846279144287, 6.027687072753906, 6.967527866363525, 7.9073686599731445, 8.847209930419922, 9.787050247192383, 10.72689151763916, 11.666732788085938, 12.606573104858398, 13.54641342163086, 14.486254692077637, 15.426095962524414, 16.365936279296875, 17.305776596069336, 18.24561882019043, 19.18545913696289, 20.12529945373535, 21.065139770507812, 22.004981994628906, 22.944822311401367, 23.88466453552246, 24.824504852294922, 25.764345169067383, 26.704185485839844, 27.644027709960938, 28.5838680267334, 29.52370834350586]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 6.0, 1.0, 7.0, 4.0, 6.0, 7.0, 12.0, 10.0, 18.0, 22.0, 15.0, 23.0, 24.0, 13.0, 28.0, 28.0, 37.0, 35.0, 40.0, 38.0, 44.0, 41.0, 25.0, 58.0, 44.0, 31.0, 44.0, 26.0, 41.0, 29.0, 37.0, 34.0, 31.0, 23.0, 14.0, 21.0, 15.0, 11.0, 14.0, 4.0, 7.0, 10.0, 10.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.662109375, -3.536529541015625, -3.41094970703125, -3.285369873046875, -3.1597900390625, -3.034210205078125, -2.90863037109375, -2.783050537109375, -2.657470703125, -2.531890869140625, -2.40631103515625, -2.280731201171875, -2.1551513671875, -2.029571533203125, -1.90399169921875, -1.778411865234375, -1.65283203125, -1.527252197265625, -1.40167236328125, -1.276092529296875, -1.1505126953125, -1.024932861328125, -0.89935302734375, -0.773773193359375, -0.648193359375, -0.522613525390625, -0.39703369140625, -0.271453857421875, -0.1458740234375, -0.020294189453125, 0.10528564453125, 0.230865478515625, 0.3564453125, 0.482025146484375, 0.60760498046875, 0.733184814453125, 0.8587646484375, 0.984344482421875, 1.10992431640625, 1.235504150390625, 1.361083984375, 1.486663818359375, 1.61224365234375, 1.737823486328125, 1.8634033203125, 1.988983154296875, 2.11456298828125, 2.240142822265625, 2.36572265625, 2.491302490234375, 2.61688232421875, 2.742462158203125, 2.8680419921875, 2.993621826171875, 3.11920166015625, 3.244781494140625, 3.370361328125, 3.495941162109375, 3.62152099609375, 3.747100830078125, 3.8726806640625, 3.998260498046875, 4.12384033203125, 4.249420166015625, 4.375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 13.0, 24.0, 25.0, 28.0, 51.0, 78.0, 115.0, 145.0, 196.0, 282.0, 428.0, 583.0, 904.0, 1347.0, 2119.0, 3508.0, 6048.0, 10629.0, 20813.0, 43880.0, 103609.0, 283978.0, 890806.0, 1686886.0, 734457.0, 233958.0, 87618.0, 38012.0, 18800.0, 9837.0, 5463.0, 3282.0, 2115.0, 1331.0, 909.0, 603.0, 388.0, 320.0, 212.0, 145.0, 92.0, 71.0, 46.0, 40.0, 29.0, 19.0, 9.0, 10.0, 2.0, 5.0, 4.0, 3.0, 2.0, 3.0], "bins": [-5.3046875, -5.14593505859375, -4.9871826171875, -4.82843017578125, -4.669677734375, -4.51092529296875, -4.3521728515625, -4.19342041015625, -4.03466796875, -3.87591552734375, -3.7171630859375, -3.55841064453125, -3.399658203125, -3.24090576171875, -3.0821533203125, -2.92340087890625, -2.7646484375, -2.60589599609375, -2.4471435546875, -2.28839111328125, -2.129638671875, -1.97088623046875, -1.8121337890625, -1.65338134765625, -1.49462890625, -1.33587646484375, -1.1771240234375, -1.01837158203125, -0.859619140625, -0.70086669921875, -0.5421142578125, -0.38336181640625, -0.224609375, -0.06585693359375, 0.0928955078125, 0.25164794921875, 0.410400390625, 0.56915283203125, 0.7279052734375, 0.88665771484375, 1.04541015625, 1.20416259765625, 1.3629150390625, 1.52166748046875, 1.680419921875, 1.83917236328125, 1.9979248046875, 2.15667724609375, 2.3154296875, 2.47418212890625, 2.6329345703125, 2.79168701171875, 2.950439453125, 3.10919189453125, 3.2679443359375, 3.42669677734375, 3.58544921875, 3.74420166015625, 3.9029541015625, 4.06170654296875, 4.220458984375, 4.37921142578125, 4.5379638671875, 4.69671630859375, 4.85546875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 11.0, 8.0, 25.0, 27.0, 42.0, 77.0, 127.0, 194.0, 304.0, 503.0, 788.0, 737.0, 490.0, 299.0, 182.0, 93.0, 52.0, 47.0, 27.0, 18.0, 6.0, 7.0, 6.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.7890625, -11.4420166015625, -11.094970703125, -10.7479248046875, -10.40087890625, -10.0538330078125, -9.706787109375, -9.3597412109375, -9.0126953125, -8.6656494140625, -8.318603515625, -7.9715576171875, -7.62451171875, -7.2774658203125, -6.930419921875, -6.5833740234375, -6.236328125, -5.8892822265625, -5.542236328125, -5.1951904296875, -4.84814453125, -4.5010986328125, -4.154052734375, -3.8070068359375, -3.4599609375, -3.1129150390625, -2.765869140625, -2.4188232421875, -2.07177734375, -1.7247314453125, -1.377685546875, -1.0306396484375, -0.68359375, -0.3365478515625, 0.010498046875, 0.3575439453125, 0.70458984375, 1.0516357421875, 1.398681640625, 1.7457275390625, 2.0927734375, 2.4398193359375, 2.786865234375, 3.1339111328125, 3.48095703125, 3.8280029296875, 4.175048828125, 4.5220947265625, 4.869140625, 5.2161865234375, 5.563232421875, 5.9102783203125, 6.25732421875, 6.6043701171875, 6.951416015625, 7.2984619140625, 7.6455078125, 7.9925537109375, 8.339599609375, 8.6866455078125, 9.03369140625, 9.3807373046875, 9.727783203125, 10.0748291015625, 10.421875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 7.0, 15.0, 29.0, 37.0, 66.0, 121.0, 208.0, 359.0, 730.0, 1711.0, 5582.0, 34162.0, 696045.0, 3300701.0, 136130.0, 13018.0, 3045.0, 1183.0, 494.0, 274.0, 151.0, 80.0, 50.0, 36.0, 14.0, 13.0, 7.0, 7.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.421875, -18.734619140625, -18.04736328125, -17.360107421875, -16.6728515625, -15.985595703125, -15.29833984375, -14.611083984375, -13.923828125, -13.236572265625, -12.54931640625, -11.862060546875, -11.1748046875, -10.487548828125, -9.80029296875, -9.113037109375, -8.42578125, -7.738525390625, -7.05126953125, -6.364013671875, -5.6767578125, -4.989501953125, -4.30224609375, -3.614990234375, -2.927734375, -2.240478515625, -1.55322265625, -0.865966796875, -0.1787109375, 0.508544921875, 1.19580078125, 1.883056640625, 2.5703125, 3.257568359375, 3.94482421875, 4.632080078125, 5.3193359375, 6.006591796875, 6.69384765625, 7.381103515625, 8.068359375, 8.755615234375, 9.44287109375, 10.130126953125, 10.8173828125, 11.504638671875, 12.19189453125, 12.879150390625, 13.56640625, 14.253662109375, 14.94091796875, 15.628173828125, 16.3154296875, 17.002685546875, 17.68994140625, 18.377197265625, 19.064453125, 19.751708984375, 20.43896484375, 21.126220703125, 21.8134765625, 22.500732421875, 23.18798828125, 23.875244140625, 24.5625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 15.0, 29.0, 133.0, 321.0, 366.0, 118.0, 31.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.84858703613281, -79.87300109863281, -75.89741516113281, -71.92182922363281, -67.94624328613281, -63.97065734863281, -59.99507141113281, -56.01948547363281, -52.04389953613281, -48.06831359863281, -44.09272766113281, -40.11714172363281, -36.14155578613281, -32.16596984863281, -28.190383911132812, -24.214797973632812, -20.239212036132812, -16.263626098632812, -12.288040161132812, -8.312454223632812, -4.3368682861328125, -0.3612823486328125, 3.6143035888671875, 7.5898895263671875, 11.565475463867188, 15.541061401367188, 19.516647338867188, 23.492233276367188, 27.467819213867188, 31.443405151367188, 35.41899108886719, 39.39457702636719, 43.37016296386719, 47.34574890136719, 51.32133483886719, 55.29692077636719, 59.27250671386719, 63.24809265136719, 67.22367858886719, 71.19926452636719, 75.17485046386719, 79.15043640136719, 83.12602233886719, 87.10160827636719, 91.07719421386719, 95.05278015136719, 99.02836608886719, 103.00395202636719, 106.97953796386719, 110.95512390136719, 114.93070983886719, 118.90629577636719, 122.88188171386719, 126.85746765136719, 130.8330535888672, 134.8086395263672, 138.7842254638672, 142.7598114013672, 146.7353973388672, 150.7109832763672, 154.6865692138672, 158.6621551513672, 162.6377410888672, 166.6133270263672, 170.5889129638672]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 3.0, 6.0, 6.0, 8.0, 11.0, 14.0, 21.0, 18.0, 19.0, 17.0, 28.0, 38.0, 31.0, 40.0, 48.0, 32.0, 51.0, 40.0, 45.0, 42.0, 33.0, 53.0, 48.0, 37.0, 30.0, 33.0, 33.0, 20.0, 33.0, 27.0, 30.0, 20.0, 14.0, 13.0, 13.0, 6.0, 9.0, 9.0, 7.0, 2.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.58300018310547, -27.684797286987305, -26.78659439086914, -25.888391494750977, -24.990188598632812, -24.091983795166016, -23.19378089904785, -22.295578002929688, -21.397375106811523, -20.49917221069336, -19.600969314575195, -18.70276641845703, -17.804561614990234, -16.906360626220703, -16.008155822753906, -15.109952926635742, -14.211750030517578, -13.313547134399414, -12.41534423828125, -11.51714038848877, -10.618937492370605, -9.720734596252441, -8.822530746459961, -7.924327850341797, -7.026124954223633, -6.127922058105469, -5.2297186851501465, -4.331515312194824, -3.43331241607666, -2.535109519958496, -1.6369061470031738, -0.7387027740478516, 0.1595001220703125, 1.0577032566070557, 1.9559063911437988, 2.854109525680542, 3.752312660217285, 4.650515556335449, 5.5487189292907715, 6.446922302246094, 7.345125198364258, 8.243328094482422, 9.141530990600586, 10.039734840393066, 10.93793773651123, 11.836140632629395, 12.734344482421875, 13.632547378540039, 14.530750274658203, 15.428953170776367, 16.32715606689453, 17.225358963012695, 18.12356185913086, 19.021766662597656, 19.91996955871582, 20.818172454833984, 21.71637535095215, 22.614578247070312, 23.512781143188477, 24.41098403930664, 25.309188842773438, 26.20738983154297, 27.105594635009766, 28.00379753112793, 28.902000427246094]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 3.0, 10.0, 6.0, 8.0, 9.0, 8.0, 11.0, 22.0, 24.0, 13.0, 25.0, 32.0, 29.0, 30.0, 32.0, 39.0, 33.0, 33.0, 35.0, 40.0, 38.0, 50.0, 49.0, 34.0, 33.0, 43.0, 35.0, 44.0, 26.0, 32.0, 25.0, 25.0, 28.0, 12.0, 22.0, 8.0, 13.0, 8.0, 7.0, 9.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.953125, -3.821044921875, -3.68896484375, -3.556884765625, -3.4248046875, -3.292724609375, -3.16064453125, -3.028564453125, -2.896484375, -2.764404296875, -2.63232421875, -2.500244140625, -2.3681640625, -2.236083984375, -2.10400390625, -1.971923828125, -1.83984375, -1.707763671875, -1.57568359375, -1.443603515625, -1.3115234375, -1.179443359375, -1.04736328125, -0.915283203125, -0.783203125, -0.651123046875, -0.51904296875, -0.386962890625, -0.2548828125, -0.122802734375, 0.00927734375, 0.141357421875, 0.2734375, 0.405517578125, 0.53759765625, 0.669677734375, 0.8017578125, 0.933837890625, 1.06591796875, 1.197998046875, 1.330078125, 1.462158203125, 1.59423828125, 1.726318359375, 1.8583984375, 1.990478515625, 2.12255859375, 2.254638671875, 2.38671875, 2.518798828125, 2.65087890625, 2.782958984375, 2.9150390625, 3.047119140625, 3.17919921875, 3.311279296875, 3.443359375, 3.575439453125, 3.70751953125, 3.839599609375, 3.9716796875, 4.103759765625, 4.23583984375, 4.367919921875, 4.5]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 14.0, 15.0, 29.0, 40.0, 48.0, 76.0, 121.0, 173.0, 248.0, 354.0, 549.0, 791.0, 1125.0, 1668.0, 2643.0, 3829.0, 5846.0, 9214.0, 14151.0, 22713.0, 36307.0, 59143.0, 99594.0, 184623.0, 254161.0, 141169.0, 79476.0, 47775.0, 29510.0, 18582.0, 11897.0, 7558.0, 5022.0, 3310.0, 2219.0, 1484.0, 971.0, 693.0, 452.0, 287.0, 204.0, 161.0, 96.0, 57.0, 45.0, 46.0, 21.0, 13.0, 8.0, 6.0, 3.0, 5.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.0261688232421875, -0.02535843849182129, -0.024548053741455078, -0.023737668991088867, -0.022927284240722656, -0.022116899490356445, -0.021306514739990234, -0.020496129989624023, -0.019685745239257812, -0.0188753604888916, -0.01806497573852539, -0.01725459098815918, -0.01644420623779297, -0.015633821487426758, -0.014823436737060547, -0.014013051986694336, -0.013202667236328125, -0.012392282485961914, -0.011581897735595703, -0.010771512985229492, -0.009961128234863281, -0.00915074348449707, -0.00834035873413086, -0.0075299739837646484, -0.0067195892333984375, -0.0059092044830322266, -0.005098819732666016, -0.004288434982299805, -0.0034780502319335938, -0.002667665481567383, -0.0018572807312011719, -0.001046895980834961, -0.00023651123046875, 0.0005738735198974609, 0.0013842582702636719, 0.002194643020629883, 0.0030050277709960938, 0.0038154125213623047, 0.004625797271728516, 0.0054361820220947266, 0.0062465667724609375, 0.0070569515228271484, 0.00786733627319336, 0.00867772102355957, 0.009488105773925781, 0.010298490524291992, 0.011108875274658203, 0.011919260025024414, 0.012729644775390625, 0.013540029525756836, 0.014350414276123047, 0.015160799026489258, 0.01597118377685547, 0.01678156852722168, 0.01759195327758789, 0.0184023380279541, 0.019212722778320312, 0.020023107528686523, 0.020833492279052734, 0.021643877029418945, 0.022454261779785156, 0.023264646530151367, 0.024075031280517578, 0.02488541603088379, 0.02569580078125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 7.0, 8.0, 12.0, 16.0, 13.0, 19.0, 11.0, 20.0, 25.0, 41.0, 27.0, 31.0, 33.0, 43.0, 41.0, 33.0, 38.0, 31.0, 42.0, 1056.0, 28.0, 36.0, 44.0, 34.0, 29.0, 33.0, 37.0, 35.0, 25.0, 28.0, 21.0, 18.0, 18.0, 15.0, 15.0, 10.0, 13.0, 5.0, 4.0, 9.0, 6.0, 1.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0], "bins": [-4.46875, -4.342376708984375, -4.21600341796875, -4.089630126953125, -3.9632568359375, -3.836883544921875, -3.71051025390625, -3.584136962890625, -3.457763671875, -3.331390380859375, -3.20501708984375, -3.078643798828125, -2.9522705078125, -2.825897216796875, -2.69952392578125, -2.573150634765625, -2.44677734375, -2.320404052734375, -2.19403076171875, -2.067657470703125, -1.9412841796875, -1.814910888671875, -1.68853759765625, -1.562164306640625, -1.435791015625, -1.309417724609375, -1.18304443359375, -1.056671142578125, -0.9302978515625, -0.803924560546875, -0.67755126953125, -0.551177978515625, -0.4248046875, -0.298431396484375, -0.17205810546875, -0.045684814453125, 0.0806884765625, 0.207061767578125, 0.33343505859375, 0.459808349609375, 0.586181640625, 0.712554931640625, 0.83892822265625, 0.965301513671875, 1.0916748046875, 1.218048095703125, 1.34442138671875, 1.470794677734375, 1.59716796875, 1.723541259765625, 1.84991455078125, 1.976287841796875, 2.1026611328125, 2.229034423828125, 2.35540771484375, 2.481781005859375, 2.608154296875, 2.734527587890625, 2.86090087890625, 2.987274169921875, 3.1136474609375, 3.240020751953125, 3.36639404296875, 3.492767333984375, 3.619140625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 11.0, 16.0, 38.0, 34.0, 64.0, 91.0, 123.0, 185.0, 278.0, 412.0, 577.0, 886.0, 1267.0, 1857.0, 2843.0, 4306.0, 6483.0, 9964.0, 15560.0, 24412.0, 38519.0, 62383.0, 102196.0, 176130.0, 1276326.0, 143255.0, 85234.0, 52248.0, 32572.0, 20425.0, 13196.0, 8571.0, 5590.0, 3577.0, 2401.0, 1637.0, 1129.0, 757.0, 497.0, 344.0, 239.0, 154.0, 107.0, 68.0, 58.0, 41.0, 28.0, 21.0, 10.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0], "bins": [-0.01488494873046875, -0.014438152313232422, -0.013991355895996094, -0.013544559478759766, -0.013097763061523438, -0.01265096664428711, -0.012204170227050781, -0.011757373809814453, -0.011310577392578125, -0.010863780975341797, -0.010416984558105469, -0.00997018814086914, -0.009523391723632812, -0.009076595306396484, -0.008629798889160156, -0.008183002471923828, -0.0077362060546875, -0.007289409637451172, -0.006842613220214844, -0.006395816802978516, -0.0059490203857421875, -0.005502223968505859, -0.005055427551269531, -0.004608631134033203, -0.004161834716796875, -0.003715038299560547, -0.0032682418823242188, -0.0028214454650878906, -0.0023746490478515625, -0.0019278526306152344, -0.0014810562133789062, -0.0010342597961425781, -0.00058746337890625, -0.00014066696166992188, 0.00030612945556640625, 0.0007529258728027344, 0.0011997222900390625, 0.0016465187072753906, 0.0020933151245117188, 0.002540111541748047, 0.002986907958984375, 0.003433704376220703, 0.0038805007934570312, 0.004327297210693359, 0.0047740936279296875, 0.005220890045166016, 0.005667686462402344, 0.006114482879638672, 0.006561279296875, 0.007008075714111328, 0.007454872131347656, 0.007901668548583984, 0.008348464965820312, 0.00879526138305664, 0.009242057800292969, 0.009688854217529297, 0.010135650634765625, 0.010582447052001953, 0.011029243469238281, 0.01147603988647461, 0.011922836303710938, 0.012369632720947266, 0.012816429138183594, 0.013263225555419922, 0.01371002197265625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 4.0, 0.0, 3.0, 7.0, 0.0, 4.0, 8.0, 0.0, 16.0, 12.0, 0.0, 19.0, 31.0, 0.0, 46.0, 0.0, 77.0, 157.0, 0.0, 198.0, 144.0, 0.0, 91.0, 59.0, 0.0, 30.0, 0.0, 19.0, 17.0, 0.0, 8.0, 8.0, 0.0, 8.0, 5.0, 0.0, 6.0, 7.0, 0.0, 4.0, 0.0, 6.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-06, -1.1539086699485779e-06, -1.1157244443893433e-06, -1.0775402188301086e-06, -1.039355993270874e-06, -1.0011717677116394e-06, -9.629875421524048e-07, -9.248033165931702e-07, -8.866190910339355e-07, -8.484348654747009e-07, -8.102506399154663e-07, -7.720664143562317e-07, -7.338821887969971e-07, -6.956979632377625e-07, -6.575137376785278e-07, -6.193295121192932e-07, -5.811452865600586e-07, -5.42961061000824e-07, -5.047768354415894e-07, -4.6659260988235474e-07, -4.284083843231201e-07, -3.902241587638855e-07, -3.520399332046509e-07, -3.1385570764541626e-07, -2.7567148208618164e-07, -2.3748725652694702e-07, -1.993030309677124e-07, -1.6111880540847778e-07, -1.2293457984924316e-07, -8.475035429000854e-08, -4.6566128730773926e-08, -8.381903171539307e-09, 2.9802322387695312e-08, 6.798654794692993e-08, 1.0617077350616455e-07, 1.4435499906539917e-07, 1.825392246246338e-07, 2.207234501838684e-07, 2.5890767574310303e-07, 2.9709190130233765e-07, 3.3527612686157227e-07, 3.734603524208069e-07, 4.116445779800415e-07, 4.498288035392761e-07, 4.880130290985107e-07, 5.261972546577454e-07, 5.6438148021698e-07, 6.025657057762146e-07, 6.407499313354492e-07, 6.789341568946838e-07, 7.171183824539185e-07, 7.553026080131531e-07, 7.934868335723877e-07, 8.316710591316223e-07, 8.698552846908569e-07, 9.080395102500916e-07, 9.462237358093262e-07, 9.844079613685608e-07, 1.0225921869277954e-06, 1.06077641248703e-06, 1.0989606380462646e-06, 1.1371448636054993e-06, 1.1753290891647339e-06, 1.2135133147239685e-06, 1.2516975402832031e-06]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 4.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 4.0, 6.0, 7.0, 5.0, 5.0, 6.0, 9.0, 16.0, 27.0, 28.0, 38.0, 69.0, 112.0, 245.0, 712.0, 39768.0, 1002439.0, 4308.0, 299.0, 149.0, 89.0, 51.0, 25.0, 23.0, 18.0, 13.0, 10.0, 14.0, 4.0, 5.0, 5.0, 2.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-2.8252601623535156e-05, -2.7377158403396606e-05, -2.6501715183258057e-05, -2.5626271963119507e-05, -2.4750828742980957e-05, -2.3875385522842407e-05, -2.2999942302703857e-05, -2.2124499082565308e-05, -2.1249055862426758e-05, -2.0373612642288208e-05, -1.9498169422149658e-05, -1.862272620201111e-05, -1.774728298187256e-05, -1.687183976173401e-05, -1.599639654159546e-05, -1.512095332145691e-05, -1.424551010131836e-05, -1.337006688117981e-05, -1.249462366104126e-05, -1.161918044090271e-05, -1.074373722076416e-05, -9.86829400062561e-06, -8.99285078048706e-06, -8.11740756034851e-06, -7.241964340209961e-06, -6.366521120071411e-06, -5.491077899932861e-06, -4.6156346797943115e-06, -3.7401914596557617e-06, -2.864748239517212e-06, -1.989305019378662e-06, -1.1138617992401123e-06, -2.384185791015625e-07, 6.370246410369873e-07, 1.5124678611755371e-06, 2.387911081314087e-06, 3.2633543014526367e-06, 4.1387975215911865e-06, 5.014240741729736e-06, 5.889683961868286e-06, 6.765127182006836e-06, 7.640570402145386e-06, 8.516013622283936e-06, 9.391456842422485e-06, 1.0266900062561035e-05, 1.1142343282699585e-05, 1.2017786502838135e-05, 1.2893229722976685e-05, 1.3768672943115234e-05, 1.4644116163253784e-05, 1.5519559383392334e-05, 1.6395002603530884e-05, 1.7270445823669434e-05, 1.8145889043807983e-05, 1.9021332263946533e-05, 1.9896775484085083e-05, 2.0772218704223633e-05, 2.1647661924362183e-05, 2.2523105144500732e-05, 2.3398548364639282e-05, 2.4273991584777832e-05, 2.5149434804916382e-05, 2.602487802505493e-05, 2.690032124519348e-05, 2.777576446533203e-05]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [11.0, 51.0, 328.0, 505.0, 108.0, 16.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.076991615420411e-07, -2.7785171141658793e-07, -1.4800423286942532e-07, -1.8156782743972144e-08, 1.1169069580319047e-07, 2.415381743503531e-07, 3.713855960540968e-07, 5.012331030229689e-07, 6.310805247267126e-07, 7.609280032738752e-07, 8.907754818210378e-07, 1.0206229035247816e-06, 1.1504703252285253e-06, 1.2803178606191068e-06, 1.4101652823228505e-06, 1.540012817713432e-06, 1.6698602394171758e-06, 1.7997076611209195e-06, 1.9295550828246633e-06, 2.059402504528407e-06, 2.189250153605826e-06, 2.31909757530957e-06, 2.4489449970133137e-06, 2.5787924187170574e-06, 2.7086400677944766e-06, 2.8384874894982204e-06, 2.968334911201964e-06, 3.098182332905708e-06, 3.228029981983127e-06, 3.357877403686871e-06, 3.4877248253906146e-06, 3.6175722470943583e-06, 3.747419668798102e-06, 3.877267317875521e-06, 4.0071145122055896e-06, 4.136962161283009e-06, 4.266809355613077e-06, 4.396657004690496e-06, 4.5265041990205646e-06, 4.656351848097984e-06, 4.786199497175403e-06, 4.916047146252822e-06, 5.0458943405828904e-06, 5.17574198966031e-06, 5.305589183990378e-06, 5.435436833067797e-06, 5.565284482145216e-06, 5.695131676475285e-06, 5.824978870805353e-06, 5.954826519882772e-06, 6.08467371421284e-06, 6.21452136329026e-06, 6.344368557620328e-06, 6.474216206697747e-06, 6.604063855775166e-06, 6.733911050105235e-06, 6.863758699182654e-06, 6.993606348260073e-06, 7.123453542590141e-06, 7.2533011916675605e-06, 7.383148385997629e-06, 7.512996035075048e-06, 7.642843229405116e-06, 7.772690878482535e-06, 7.902538527559955e-06]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 25.0, 0.0, 0.0, 33.0, 0.0, 0.0, 74.0, 0.0, 0.0, 128.0, 0.0, 0.0, 176.0, 0.0, 0.0, 0.0, 178.0, 0.0, 0.0, 156.0, 0.0, 0.0, 112.0, 0.0, 0.0, 60.0, 0.0, 0.0, 42.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539062e-07, -5.774199962615967e-07, -5.587935447692871e-07, -5.401670932769775e-07, -5.21540641784668e-07, -5.029141902923584e-07, -4.842877388000488e-07, -4.6566128730773926e-07, -4.470348358154297e-07, -4.284083843231201e-07, -4.0978193283081055e-07, -3.91155481338501e-07, -3.725290298461914e-07, -3.5390257835388184e-07, -3.3527612686157227e-07, -3.166496753692627e-07, -2.980232238769531e-07, -2.7939677238464355e-07, -2.60770320892334e-07, -2.421438694000244e-07, -2.2351741790771484e-07, -2.0489096641540527e-07, -1.862645149230957e-07, -1.6763806343078613e-07, -1.4901161193847656e-07, -1.30385160446167e-07, -1.1175870895385742e-07, -9.313225746154785e-08, -7.450580596923828e-08, -5.587935447692871e-08, -3.725290298461914e-08, -1.862645149230957e-08, 0.0, 1.862645149230957e-08, 3.725290298461914e-08, 5.587935447692871e-08, 7.450580596923828e-08, 9.313225746154785e-08, 1.1175870895385742e-07, 1.30385160446167e-07, 1.4901161193847656e-07, 1.6763806343078613e-07, 1.862645149230957e-07, 2.0489096641540527e-07, 2.2351741790771484e-07, 2.421438694000244e-07, 2.60770320892334e-07, 2.7939677238464355e-07, 2.980232238769531e-07, 3.166496753692627e-07, 3.3527612686157227e-07, 3.5390257835388184e-07, 3.725290298461914e-07, 3.91155481338501e-07, 4.0978193283081055e-07, 4.284083843231201e-07, 4.470348358154297e-07, 4.6566128730773926e-07, 4.842877388000488e-07, 5.029141902923584e-07, 5.21540641784668e-07, 5.401670932769775e-07, 5.587935447692871e-07, 5.774199962615967e-07, 5.960464477539062e-07]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 3.0, 10.0, 6.0, 8.0, 9.0, 8.0, 11.0, 22.0, 24.0, 13.0, 25.0, 32.0, 29.0, 30.0, 32.0, 39.0, 33.0, 33.0, 35.0, 40.0, 38.0, 50.0, 49.0, 34.0, 33.0, 43.0, 35.0, 44.0, 26.0, 32.0, 25.0, 25.0, 28.0, 12.0, 22.0, 8.0, 13.0, 8.0, 7.0, 9.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.953125, -3.821044921875, -3.68896484375, -3.556884765625, -3.4248046875, -3.292724609375, -3.16064453125, -3.028564453125, -2.896484375, -2.764404296875, -2.63232421875, -2.500244140625, -2.3681640625, -2.236083984375, -2.10400390625, -1.971923828125, -1.83984375, -1.707763671875, -1.57568359375, -1.443603515625, -1.3115234375, -1.179443359375, -1.04736328125, -0.915283203125, -0.783203125, -0.651123046875, -0.51904296875, -0.386962890625, -0.2548828125, -0.122802734375, 0.00927734375, 0.141357421875, 0.2734375, 0.405517578125, 0.53759765625, 0.669677734375, 0.8017578125, 0.933837890625, 1.06591796875, 1.197998046875, 1.330078125, 1.462158203125, 1.59423828125, 1.726318359375, 1.8583984375, 1.990478515625, 2.12255859375, 2.254638671875, 2.38671875, 2.518798828125, 2.65087890625, 2.782958984375, 2.9150390625, 3.047119140625, 3.17919921875, 3.311279296875, 3.443359375, 3.575439453125, 3.70751953125, 3.839599609375, 3.9716796875, 4.103759765625, 4.23583984375, 4.367919921875, 4.5]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 6.0, 5.0, 5.0, 10.0, 13.0, 21.0, 26.0, 43.0, 49.0, 96.0, 121.0, 178.0, 256.0, 387.0, 589.0, 884.0, 1349.0, 2027.0, 3309.0, 5247.0, 8853.0, 14886.0, 24917.0, 42103.0, 72370.0, 140928.0, 313351.0, 197321.0, 90921.0, 51558.0, 30651.0, 17833.0, 10696.0, 6415.0, 3894.0, 2550.0, 1571.0, 1015.0, 675.0, 421.0, 324.0, 202.0, 151.0, 117.0, 75.0, 41.0, 31.0, 23.0, 16.0, 15.0, 2.0, 2.0, 4.0, 1.0, 4.0, 3.0], "bins": [-5.56640625, -5.40594482421875, -5.2454833984375, -5.08502197265625, -4.924560546875, -4.76409912109375, -4.6036376953125, -4.44317626953125, -4.28271484375, -4.12225341796875, -3.9617919921875, -3.80133056640625, -3.640869140625, -3.48040771484375, -3.3199462890625, -3.15948486328125, -2.9990234375, -2.83856201171875, -2.6781005859375, -2.51763916015625, -2.357177734375, -2.19671630859375, -2.0362548828125, -1.87579345703125, -1.71533203125, -1.55487060546875, -1.3944091796875, -1.23394775390625, -1.073486328125, -0.91302490234375, -0.7525634765625, -0.59210205078125, -0.431640625, -0.27117919921875, -0.1107177734375, 0.04974365234375, 0.210205078125, 0.37066650390625, 0.5311279296875, 0.69158935546875, 0.85205078125, 1.01251220703125, 1.1729736328125, 1.33343505859375, 1.493896484375, 1.65435791015625, 1.8148193359375, 1.97528076171875, 2.1357421875, 2.29620361328125, 2.4566650390625, 2.61712646484375, 2.777587890625, 2.93804931640625, 3.0985107421875, 3.25897216796875, 3.41943359375, 3.57989501953125, 3.7403564453125, 3.90081787109375, 4.061279296875, 4.22174072265625, 4.3822021484375, 4.54266357421875, 4.703125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 6.0, 4.0, 12.0, 10.0, 11.0, 11.0, 10.0, 21.0, 21.0, 20.0, 31.0, 32.0, 30.0, 37.0, 38.0, 50.0, 63.0, 74.0, 110.0, 171.0, 1440.0, 235.0, 113.0, 82.0, 49.0, 43.0, 43.0, 35.0, 29.0, 30.0, 25.0, 30.0, 26.0, 13.0, 12.0, 15.0, 10.0, 10.0, 9.0, 7.0, 6.0, 4.0, 4.0, 3.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.390625, -11.0302734375, -10.669921875, -10.3095703125, -9.94921875, -9.5888671875, -9.228515625, -8.8681640625, -8.5078125, -8.1474609375, -7.787109375, -7.4267578125, -7.06640625, -6.7060546875, -6.345703125, -5.9853515625, -5.625, -5.2646484375, -4.904296875, -4.5439453125, -4.18359375, -3.8232421875, -3.462890625, -3.1025390625, -2.7421875, -2.3818359375, -2.021484375, -1.6611328125, -1.30078125, -0.9404296875, -0.580078125, -0.2197265625, 0.140625, 0.5009765625, 0.861328125, 1.2216796875, 1.58203125, 1.9423828125, 2.302734375, 2.6630859375, 3.0234375, 3.3837890625, 3.744140625, 4.1044921875, 4.46484375, 4.8251953125, 5.185546875, 5.5458984375, 5.90625, 6.2666015625, 6.626953125, 6.9873046875, 7.34765625, 7.7080078125, 8.068359375, 8.4287109375, 8.7890625, 9.1494140625, 9.509765625, 9.8701171875, 10.23046875, 10.5908203125, 10.951171875, 11.3115234375, 11.671875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 8.0, 11.0, 12.0, 12.0, 13.0, 19.0, 29.0, 37.0, 59.0, 64.0, 88.0, 187.0, 354.0, 780.0, 2004.0, 6341.0, 23321.0, 126200.0, 1890579.0, 981782.0, 87736.0, 17908.0, 4923.0, 1743.0, 660.0, 322.0, 161.0, 107.0, 62.0, 43.0, 29.0, 28.0, 20.0, 13.0, 16.0, 5.0, 6.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.375, -10.99462890625, -10.6142578125, -10.23388671875, -9.853515625, -9.47314453125, -9.0927734375, -8.71240234375, -8.33203125, -7.95166015625, -7.5712890625, -7.19091796875, -6.810546875, -6.43017578125, -6.0498046875, -5.66943359375, -5.2890625, -4.90869140625, -4.5283203125, -4.14794921875, -3.767578125, -3.38720703125, -3.0068359375, -2.62646484375, -2.24609375, -1.86572265625, -1.4853515625, -1.10498046875, -0.724609375, -0.34423828125, 0.0361328125, 0.41650390625, 0.796875, 1.17724609375, 1.5576171875, 1.93798828125, 2.318359375, 2.69873046875, 3.0791015625, 3.45947265625, 3.83984375, 4.22021484375, 4.6005859375, 4.98095703125, 5.361328125, 5.74169921875, 6.1220703125, 6.50244140625, 6.8828125, 7.26318359375, 7.6435546875, 8.02392578125, 8.404296875, 8.78466796875, 9.1650390625, 9.54541015625, 9.92578125, 10.30615234375, 10.6865234375, 11.06689453125, 11.447265625, 11.82763671875, 12.2080078125, 12.58837890625, 12.96875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 35.0, 60.0, 128.0, 201.0, 234.0, 177.0, 100.0, 54.0, 15.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.812421798706055, -10.224956512451172, -8.637491226196289, -7.050025939941406, -5.462560653686523, -3.8750953674316406, -2.287630081176758, -0.700164794921875, 0.8873004913330078, 2.4747657775878906, 4.062231063842773, 5.649696350097656, 7.237161636352539, 8.824626922607422, 10.412092208862305, 11.999557495117188, 13.58702278137207, 15.174488067626953, 16.761953353881836, 18.34941864013672, 19.9368839263916, 21.524349212646484, 23.111814498901367, 24.69927978515625, 26.286745071411133, 27.874210357666016, 29.4616756439209, 31.04914093017578, 32.63660430908203, 34.22407150268555, 35.81153869628906, 37.39900207519531, 38.98646545410156, 40.57392883300781, 42.16139602661133, 43.748863220214844, 45.336326599121094, 46.923789978027344, 48.51125717163086, 50.098724365234375, 51.686187744140625, 53.273651123046875, 54.86111831665039, 56.448585510253906, 58.036048889160156, 59.623512268066406, 61.21097946166992, 62.79844665527344, 64.38591003417969, 65.97337341308594, 67.56083679199219, 69.14830780029297, 70.73577117919922, 72.32323455810547, 73.91070556640625, 75.4981689453125, 77.08563232421875, 78.673095703125, 80.26055908203125, 81.84803009033203, 83.43549346923828, 85.02295684814453, 86.61042785644531, 88.19789123535156, 89.78535461425781]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 0.0, 0.0, 1.0, 2.0, 7.0, 4.0, 10.0, 8.0, 10.0, 11.0, 11.0, 17.0, 13.0, 11.0, 24.0, 21.0, 21.0, 25.0, 24.0, 32.0, 33.0, 39.0, 39.0, 40.0, 48.0, 41.0, 44.0, 36.0, 26.0, 27.0, 36.0, 30.0, 29.0, 35.0, 29.0, 26.0, 26.0, 32.0, 30.0, 17.0, 15.0, 10.0, 14.0, 14.0, 11.0, 6.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-30.29950714111328, -29.36054229736328, -28.42157745361328, -27.48261260986328, -26.543649673461914, -25.604684829711914, -24.665719985961914, -23.726755142211914, -22.787792205810547, -21.848827362060547, -20.909862518310547, -19.970897674560547, -19.03193473815918, -18.09296989440918, -17.15400505065918, -16.21504020690918, -15.27607536315918, -14.33711051940918, -13.398146629333496, -12.459181785583496, -11.520217895507812, -10.581253051757812, -9.642288208007812, -8.703323364257812, -7.764359474182129, -6.825395107269287, -5.886430740356445, -4.947465896606445, -4.0085015296936035, -3.0695371627807617, -2.1305723190307617, -1.19160795211792, -0.2526435852050781, 0.6863209009170532, 1.6252853870391846, 2.5642499923706055, 3.5032143592834473, 4.442178726196289, 5.381143569946289, 6.320107936859131, 7.259072303771973, 8.198037147521973, 9.137001037597656, 10.075965881347656, 11.014930725097656, 11.95389461517334, 12.89285945892334, 13.831823348999023, 14.770788192749023, 15.709753036499023, 16.648717880249023, 17.58768081665039, 18.52664566040039, 19.46561050415039, 20.40457534790039, 21.34354019165039, 22.28250503540039, 23.22146987915039, 24.16043472290039, 25.09939956665039, 26.038362503051758, 26.977327346801758, 27.916292190551758, 28.855257034301758, 29.794219970703125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 7.0, 8.0, 12.0, 8.0, 9.0, 17.0, 15.0, 20.0, 26.0, 24.0, 31.0, 33.0, 31.0, 32.0, 35.0, 42.0, 35.0, 37.0, 30.0, 53.0, 51.0, 44.0, 35.0, 52.0, 42.0, 29.0, 32.0, 33.0, 31.0, 26.0, 27.0, 21.0, 13.0, 8.0, 10.0, 13.0, 6.0, 5.0, 5.0, 0.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01953125, -3.87762451171875, -3.7357177734375, -3.59381103515625, -3.451904296875, -3.30999755859375, -3.1680908203125, -3.02618408203125, -2.88427734375, -2.74237060546875, -2.6004638671875, -2.45855712890625, -2.316650390625, -2.17474365234375, -2.0328369140625, -1.89093017578125, -1.7490234375, -1.60711669921875, -1.4652099609375, -1.32330322265625, -1.181396484375, -1.03948974609375, -0.8975830078125, -0.75567626953125, -0.61376953125, -0.47186279296875, -0.3299560546875, -0.18804931640625, -0.046142578125, 0.09576416015625, 0.2376708984375, 0.37957763671875, 0.521484375, 0.66339111328125, 0.8052978515625, 0.94720458984375, 1.089111328125, 1.23101806640625, 1.3729248046875, 1.51483154296875, 1.65673828125, 1.79864501953125, 1.9405517578125, 2.08245849609375, 2.224365234375, 2.36627197265625, 2.5081787109375, 2.65008544921875, 2.7919921875, 2.93389892578125, 3.0758056640625, 3.21771240234375, 3.359619140625, 3.50152587890625, 3.6434326171875, 3.78533935546875, 3.92724609375, 4.06915283203125, 4.2110595703125, 4.35296630859375, 4.494873046875, 4.63677978515625, 4.7786865234375, 4.92059326171875, 5.0625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 10.0, 9.0, 11.0, 19.0, 24.0, 41.0, 64.0, 107.0, 142.0, 211.0, 360.0, 600.0, 1027.0, 1959.0, 4147.0, 9678.0, 26984.0, 101953.0, 682500.0, 2739272.0, 502834.0, 82923.0, 23163.0, 8374.0, 3667.0, 1846.0, 979.0, 529.0, 294.0, 195.0, 122.0, 77.0, 45.0, 33.0, 29.0, 16.0, 12.0, 7.0, 8.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.21875, -8.905517578125, -8.59228515625, -8.279052734375, -7.9658203125, -7.652587890625, -7.33935546875, -7.026123046875, -6.712890625, -6.399658203125, -6.08642578125, -5.773193359375, -5.4599609375, -5.146728515625, -4.83349609375, -4.520263671875, -4.20703125, -3.893798828125, -3.58056640625, -3.267333984375, -2.9541015625, -2.640869140625, -2.32763671875, -2.014404296875, -1.701171875, -1.387939453125, -1.07470703125, -0.761474609375, -0.4482421875, -0.135009765625, 0.17822265625, 0.491455078125, 0.8046875, 1.117919921875, 1.43115234375, 1.744384765625, 2.0576171875, 2.370849609375, 2.68408203125, 2.997314453125, 3.310546875, 3.623779296875, 3.93701171875, 4.250244140625, 4.5634765625, 4.876708984375, 5.18994140625, 5.503173828125, 5.81640625, 6.129638671875, 6.44287109375, 6.756103515625, 7.0693359375, 7.382568359375, 7.69580078125, 8.009033203125, 8.322265625, 8.635498046875, 8.94873046875, 9.261962890625, 9.5751953125, 9.888427734375, 10.20166015625, 10.514892578125, 10.828125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 4.0, 5.0, 9.0, 12.0, 14.0, 25.0, 24.0, 32.0, 47.0, 56.0, 69.0, 95.0, 121.0, 165.0, 256.0, 315.0, 459.0, 514.0, 432.0, 365.0, 241.0, 198.0, 139.0, 111.0, 100.0, 48.0, 46.0, 29.0, 28.0, 28.0, 20.0, 14.0, 14.0, 7.0, 14.0, 5.0, 6.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.265625, -5.0748291015625, -4.884033203125, -4.6932373046875, -4.50244140625, -4.3116455078125, -4.120849609375, -3.9300537109375, -3.7392578125, -3.5484619140625, -3.357666015625, -3.1668701171875, -2.97607421875, -2.7852783203125, -2.594482421875, -2.4036865234375, -2.212890625, -2.0220947265625, -1.831298828125, -1.6405029296875, -1.44970703125, -1.2589111328125, -1.068115234375, -0.8773193359375, -0.6865234375, -0.4957275390625, -0.304931640625, -0.1141357421875, 0.07666015625, 0.2674560546875, 0.458251953125, 0.6490478515625, 0.83984375, 1.0306396484375, 1.221435546875, 1.4122314453125, 1.60302734375, 1.7938232421875, 1.984619140625, 2.1754150390625, 2.3662109375, 2.5570068359375, 2.747802734375, 2.9385986328125, 3.12939453125, 3.3201904296875, 3.510986328125, 3.7017822265625, 3.892578125, 4.0833740234375, 4.274169921875, 4.4649658203125, 4.65576171875, 4.8465576171875, 5.037353515625, 5.2281494140625, 5.4189453125, 5.6097412109375, 5.800537109375, 5.9913330078125, 6.18212890625, 6.3729248046875, 6.563720703125, 6.7545166015625, 6.9453125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 7.0, 8.0, 15.0, 13.0, 34.0, 32.0, 52.0, 79.0, 108.0, 169.0, 266.0, 437.0, 716.0, 1310.0, 2560.0, 5203.0, 12172.0, 32731.0, 106639.0, 449253.0, 2337547.0, 965616.0, 191874.0, 53867.0, 18426.0, 7550.0, 3482.0, 1663.0, 1013.0, 542.0, 305.0, 194.0, 134.0, 95.0, 57.0, 37.0, 21.0, 15.0, 15.0, 8.0, 3.0, 4.0, 3.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.4122314453125, -8.129150390625, -7.8460693359375, -7.56298828125, -7.2799072265625, -6.996826171875, -6.7137451171875, -6.4306640625, -6.1475830078125, -5.864501953125, -5.5814208984375, -5.29833984375, -5.0152587890625, -4.732177734375, -4.4490966796875, -4.166015625, -3.8829345703125, -3.599853515625, -3.3167724609375, -3.03369140625, -2.7506103515625, -2.467529296875, -2.1844482421875, -1.9013671875, -1.6182861328125, -1.335205078125, -1.0521240234375, -0.76904296875, -0.4859619140625, -0.202880859375, 0.0802001953125, 0.36328125, 0.6463623046875, 0.929443359375, 1.2125244140625, 1.49560546875, 1.7786865234375, 2.061767578125, 2.3448486328125, 2.6279296875, 2.9110107421875, 3.194091796875, 3.4771728515625, 3.76025390625, 4.0433349609375, 4.326416015625, 4.6094970703125, 4.892578125, 5.1756591796875, 5.458740234375, 5.7418212890625, 6.02490234375, 6.3079833984375, 6.591064453125, 6.8741455078125, 7.1572265625, 7.4403076171875, 7.723388671875, 8.0064697265625, 8.28955078125, 8.5726318359375, 8.855712890625, 9.1387939453125, 9.421875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 23.0, 202.0, 437.0, 296.0, 51.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-228.0792236328125, -223.8254852294922, -219.57176208496094, -215.31802368164062, -211.0642852783203, -206.810546875, -202.55682373046875, -198.30308532714844, -194.04934692382812, -189.7956085205078, -185.54188537597656, -181.28814697265625, -177.03440856933594, -172.78067016601562, -168.52694702148438, -164.27320861816406, -160.01947021484375, -155.76573181152344, -151.5120086669922, -147.25827026367188, -143.00453186035156, -138.75079345703125, -134.4970703125, -130.2433319091797, -125.98960876464844, -121.73587799072266, -117.48213958740234, -113.22840881347656, -108.97467041015625, -104.72093963623047, -100.46720886230469, -96.21347045898438, -91.95973205566406, -87.70600128173828, -83.45226287841797, -79.19853210449219, -74.94479370117188, -70.6910629272461, -66.43733215332031, -62.18359375, -57.92985916137695, -53.676124572753906, -49.42238998413086, -45.16865539550781, -40.91492462158203, -36.66118621826172, -32.40745544433594, -28.15372085571289, -23.899986267089844, -19.646251678466797, -15.392518043518066, -11.138784408569336, -6.885049819946289, -2.631315231323242, 1.6224174499511719, 5.876152038574219, 10.129886627197266, 14.383621215820312, 18.63735580444336, 22.891088485717773, 27.14482307434082, 31.398557662963867, 35.65229034423828, 39.90602493286133, 44.159759521484375]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 12.0, 9.0, 14.0, 17.0, 15.0, 25.0, 27.0, 23.0, 23.0, 40.0, 40.0, 45.0, 41.0, 47.0, 33.0, 44.0, 42.0, 55.0, 53.0, 43.0, 47.0, 29.0, 32.0, 30.0, 34.0, 23.0, 28.0, 21.0, 20.0, 11.0, 8.0, 18.0, 10.0, 9.0, 9.0, 6.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.772537231445312, -26.928003311157227, -26.08346939086914, -25.238933563232422, -24.394399642944336, -23.54986572265625, -22.70532989501953, -21.860795974731445, -21.01626205444336, -20.171728134155273, -19.327194213867188, -18.48265838623047, -17.638124465942383, -16.793590545654297, -15.949055671691895, -15.104520797729492, -14.259986877441406, -13.41545295715332, -12.570918083190918, -11.726383209228516, -10.88184928894043, -10.037315368652344, -9.192780494689941, -8.348245620727539, -7.503711700439453, -6.659177303314209, -5.814642906188965, -4.970108509063721, -4.125574111938477, -3.2810397148132324, -2.4365053176879883, -1.5919709205627441, -0.7474365234375, 0.09709787368774414, 0.9416322708129883, 1.7861666679382324, 2.6307010650634766, 3.4752354621887207, 4.319769859313965, 5.164304256439209, 6.008838653564453, 6.853373050689697, 7.697907447814941, 8.542442321777344, 9.38697624206543, 10.231510162353516, 11.076045036315918, 11.92057991027832, 12.765113830566406, 13.609647750854492, 14.454182624816895, 15.298717498779297, 16.143251419067383, 16.98778533935547, 17.832321166992188, 18.676855087280273, 19.52138900756836, 20.365922927856445, 21.21045684814453, 22.05499267578125, 22.899526596069336, 23.744060516357422, 24.58859634399414, 25.433130264282227, 26.277664184570312]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 7.0, 4.0, 5.0, 10.0, 9.0, 14.0, 15.0, 16.0, 20.0, 20.0, 14.0, 27.0, 27.0, 31.0, 43.0, 27.0, 40.0, 39.0, 34.0, 47.0, 49.0, 39.0, 46.0, 26.0, 45.0, 35.0, 45.0, 43.0, 35.0, 36.0, 26.0, 22.0, 22.0, 13.0, 21.0, 12.0, 10.0, 13.0, 4.0, 3.0, 5.0, 3.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.77734375, -3.6337890625, -3.490234375, -3.3466796875, -3.203125, -3.0595703125, -2.916015625, -2.7724609375, -2.62890625, -2.4853515625, -2.341796875, -2.1982421875, -2.0546875, -1.9111328125, -1.767578125, -1.6240234375, -1.48046875, -1.3369140625, -1.193359375, -1.0498046875, -0.90625, -0.7626953125, -0.619140625, -0.4755859375, -0.33203125, -0.1884765625, -0.044921875, 0.0986328125, 0.2421875, 0.3857421875, 0.529296875, 0.6728515625, 0.81640625, 0.9599609375, 1.103515625, 1.2470703125, 1.390625, 1.5341796875, 1.677734375, 1.8212890625, 1.96484375, 2.1083984375, 2.251953125, 2.3955078125, 2.5390625, 2.6826171875, 2.826171875, 2.9697265625, 3.11328125, 3.2568359375, 3.400390625, 3.5439453125, 3.6875, 3.8310546875, 3.974609375, 4.1181640625, 4.26171875, 4.4052734375, 4.548828125, 4.6923828125, 4.8359375, 4.9794921875, 5.123046875, 5.2666015625, 5.41015625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 4.0, 4.0, 3.0, 7.0, 8.0, 11.0, 15.0, 27.0, 52.0, 64.0, 95.0, 147.0, 226.0, 328.0, 470.0, 716.0, 1140.0, 1751.0, 2745.0, 4109.0, 6326.0, 9837.0, 16274.0, 26956.0, 45675.0, 78398.0, 136040.0, 245950.0, 200151.0, 110109.0, 64070.0, 37222.0, 22286.0, 13550.0, 8259.0, 5364.0, 3403.0, 2374.0, 1487.0, 962.0, 649.0, 441.0, 283.0, 194.0, 137.0, 70.0, 49.0, 42.0, 22.0, 20.0, 15.0, 8.0, 6.0, 9.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.026519775390625, -0.02563023567199707, -0.02474069595336914, -0.02385115623474121, -0.02296161651611328, -0.02207207679748535, -0.021182537078857422, -0.020292997360229492, -0.019403457641601562, -0.018513917922973633, -0.017624378204345703, -0.016734838485717773, -0.015845298767089844, -0.014955759048461914, -0.014066219329833984, -0.013176679611206055, -0.012287139892578125, -0.011397600173950195, -0.010508060455322266, -0.009618520736694336, -0.008728981018066406, -0.007839441299438477, -0.006949901580810547, -0.006060361862182617, -0.0051708221435546875, -0.004281282424926758, -0.003391742706298828, -0.0025022029876708984, -0.0016126632690429688, -0.0007231235504150391, 0.00016641616821289062, 0.0010559558868408203, 0.00194549560546875, 0.0028350353240966797, 0.0037245750427246094, 0.004614114761352539, 0.005503654479980469, 0.0063931941986083984, 0.007282733917236328, 0.008172273635864258, 0.009061813354492188, 0.009951353073120117, 0.010840892791748047, 0.011730432510375977, 0.012619972229003906, 0.013509511947631836, 0.014399051666259766, 0.015288591384887695, 0.016178131103515625, 0.017067670822143555, 0.017957210540771484, 0.018846750259399414, 0.019736289978027344, 0.020625829696655273, 0.021515369415283203, 0.022404909133911133, 0.023294448852539062, 0.024183988571166992, 0.025073528289794922, 0.02596306800842285, 0.02685260772705078, 0.02774214744567871, 0.02863168716430664, 0.02952122688293457, 0.0304107666015625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 6.0, 1.0, 8.0, 5.0, 8.0, 9.0, 4.0, 11.0, 11.0, 13.0, 17.0, 13.0, 23.0, 21.0, 28.0, 20.0, 40.0, 26.0, 25.0, 33.0, 32.0, 29.0, 37.0, 32.0, 39.0, 1053.0, 39.0, 32.0, 44.0, 43.0, 31.0, 34.0, 26.0, 26.0, 28.0, 24.0, 19.0, 15.0, 12.0, 27.0, 15.0, 13.0, 13.0, 5.0, 9.0, 4.0, 8.0, 5.0, 5.0, 5.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-4.16015625, -4.0313720703125, -3.902587890625, -3.7738037109375, -3.64501953125, -3.5162353515625, -3.387451171875, -3.2586669921875, -3.1298828125, -3.0010986328125, -2.872314453125, -2.7435302734375, -2.61474609375, -2.4859619140625, -2.357177734375, -2.2283935546875, -2.099609375, -1.9708251953125, -1.842041015625, -1.7132568359375, -1.58447265625, -1.4556884765625, -1.326904296875, -1.1981201171875, -1.0693359375, -0.9405517578125, -0.811767578125, -0.6829833984375, -0.55419921875, -0.4254150390625, -0.296630859375, -0.1678466796875, -0.0390625, 0.0897216796875, 0.218505859375, 0.3472900390625, 0.47607421875, 0.6048583984375, 0.733642578125, 0.8624267578125, 0.9912109375, 1.1199951171875, 1.248779296875, 1.3775634765625, 1.50634765625, 1.6351318359375, 1.763916015625, 1.8927001953125, 2.021484375, 2.1502685546875, 2.279052734375, 2.4078369140625, 2.53662109375, 2.6654052734375, 2.794189453125, 2.9229736328125, 3.0517578125, 3.1805419921875, 3.309326171875, 3.4381103515625, 3.56689453125, 3.6956787109375, 3.824462890625, 3.9532470703125, 4.08203125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 9.0, 11.0, 19.0, 26.0, 33.0, 53.0, 62.0, 98.0, 124.0, 194.0, 244.0, 323.0, 472.0, 649.0, 943.0, 1339.0, 1790.0, 2588.0, 3590.0, 5094.0, 7336.0, 10543.0, 15321.0, 21905.0, 33232.0, 49156.0, 75730.0, 121485.0, 1240097.0, 179470.0, 110470.0, 69672.0, 45921.0, 30838.0, 20844.0, 13919.0, 10022.0, 6876.0, 4819.0, 3471.0, 2370.0, 1706.0, 1190.0, 876.0, 614.0, 445.0, 339.0, 226.0, 173.0, 133.0, 89.0, 60.0, 56.0, 32.0, 18.0, 18.0, 7.0, 2.0, 4.0, 0.0, 2.0], "bins": [-0.01357269287109375, -0.013147354125976562, -0.012722015380859375, -0.012296676635742188, -0.011871337890625, -0.011445999145507812, -0.011020660400390625, -0.010595321655273438, -0.01016998291015625, -0.009744644165039062, -0.009319305419921875, -0.008893966674804688, -0.0084686279296875, -0.008043289184570312, -0.007617950439453125, -0.0071926116943359375, -0.00676727294921875, -0.0063419342041015625, -0.005916595458984375, -0.0054912567138671875, -0.00506591796875, -0.0046405792236328125, -0.004215240478515625, -0.0037899017333984375, -0.00336456298828125, -0.0029392242431640625, -0.002513885498046875, -0.0020885467529296875, -0.0016632080078125, -0.0012378692626953125, -0.000812530517578125, -0.0003871917724609375, 3.814697265625e-05, 0.0004634857177734375, 0.000888824462890625, 0.0013141632080078125, 0.001739501953125, 0.0021648406982421875, 0.002590179443359375, 0.0030155181884765625, 0.00344085693359375, 0.0038661956787109375, 0.004291534423828125, 0.0047168731689453125, 0.0051422119140625, 0.0055675506591796875, 0.005992889404296875, 0.0064182281494140625, 0.00684356689453125, 0.0072689056396484375, 0.007694244384765625, 0.008119583129882812, 0.008544921875, 0.008970260620117188, 0.009395599365234375, 0.009820938110351562, 0.01024627685546875, 0.010671615600585938, 0.011096954345703125, 0.011522293090820312, 0.0119476318359375, 0.012372970581054688, 0.012798309326171875, 0.013223648071289062, 0.01364898681640625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 2.0, 4.0, 0.0, 6.0, 6.0, 10.0, 7.0, 13.0, 17.0, 15.0, 13.0, 22.0, 22.0, 20.0, 20.0, 38.0, 53.0, 79.0, 106.0, 118.0, 78.0, 72.0, 57.0, 31.0, 26.0, 22.0, 24.0, 20.0, 11.0, 10.0, 14.0, 4.0, 12.0, 8.0, 8.0, 3.0, 9.0, 3.0, 4.0, 2.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0265579223632812e-06, -1.9669532775878906e-06, -1.9073486328125e-06, -1.8477439880371094e-06, -1.7881393432617188e-06, -1.7285346984863281e-06, -1.6689300537109375e-06, -1.6093254089355469e-06, -1.5497207641601562e-06, -1.4901161193847656e-06, -1.430511474609375e-06, -1.3709068298339844e-06, -1.3113021850585938e-06, -1.2516975402832031e-06, -1.1920928955078125e-06, -1.1324882507324219e-06, -1.0728836059570312e-06, -1.0132789611816406e-06, -9.5367431640625e-07, -8.940696716308594e-07, -8.344650268554688e-07, -7.748603820800781e-07, -7.152557373046875e-07, -6.556510925292969e-07, -5.960464477539062e-07, -5.364418029785156e-07, -4.76837158203125e-07, -4.172325134277344e-07, -3.5762786865234375e-07, -2.980232238769531e-07, -2.384185791015625e-07, -1.7881393432617188e-07, -1.1920928955078125e-07, -5.960464477539063e-08, 0.0, 5.960464477539063e-08, 1.1920928955078125e-07, 1.7881393432617188e-07, 2.384185791015625e-07, 2.980232238769531e-07, 3.5762786865234375e-07, 4.172325134277344e-07, 4.76837158203125e-07, 5.364418029785156e-07, 5.960464477539062e-07, 6.556510925292969e-07, 7.152557373046875e-07, 7.748603820800781e-07, 8.344650268554688e-07, 8.940696716308594e-07, 9.5367431640625e-07, 1.0132789611816406e-06, 1.0728836059570312e-06, 1.1324882507324219e-06, 1.1920928955078125e-06, 1.2516975402832031e-06, 1.3113021850585938e-06, 1.3709068298339844e-06, 1.430511474609375e-06, 1.4901161193847656e-06, 1.5497207641601562e-06, 1.6093254089355469e-06, 1.6689300537109375e-06, 1.7285346984863281e-06, 1.7881393432617188e-06]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 5.0, 5.0, 5.0, 8.0, 6.0, 12.0, 10.0, 6.0, 13.0, 14.0, 19.0, 24.0, 33.0, 42.0, 69.0, 105.0, 241.0, 496.0, 8826.0, 1033589.0, 3968.0, 440.0, 213.0, 130.0, 56.0, 39.0, 23.0, 26.0, 21.0, 21.0, 18.0, 16.0, 8.0, 9.0, 7.0, 7.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.208087921142578e-05, -4.065129905939102e-05, -3.922171890735626e-05, -3.77921387553215e-05, -3.636255860328674e-05, -3.4932978451251984e-05, -3.3503398299217224e-05, -3.2073818147182465e-05, -3.0644237995147705e-05, -2.9214657843112946e-05, -2.7785077691078186e-05, -2.6355497539043427e-05, -2.4925917387008667e-05, -2.3496337234973907e-05, -2.2066757082939148e-05, -2.063717693090439e-05, -1.920759677886963e-05, -1.777801662683487e-05, -1.634843647480011e-05, -1.491885632276535e-05, -1.348927617073059e-05, -1.2059696018695831e-05, -1.0630115866661072e-05, -9.200535714626312e-06, -7.770955562591553e-06, -6.341375410556793e-06, -4.911795258522034e-06, -3.482215106487274e-06, -2.0526349544525146e-06, -6.230548024177551e-07, 8.065253496170044e-07, 2.236105501651764e-06, 3.6656856536865234e-06, 5.095265805721283e-06, 6.5248459577560425e-06, 7.954426109790802e-06, 9.384006261825562e-06, 1.0813586413860321e-05, 1.224316656589508e-05, 1.367274671792984e-05, 1.51023268699646e-05, 1.653190702199936e-05, 1.796148717403412e-05, 1.9391067326068878e-05, 2.0820647478103638e-05, 2.2250227630138397e-05, 2.3679807782173157e-05, 2.5109387934207916e-05, 2.6538968086242676e-05, 2.7968548238277435e-05, 2.9398128390312195e-05, 3.0827708542346954e-05, 3.2257288694381714e-05, 3.3686868846416473e-05, 3.511644899845123e-05, 3.654602915048599e-05, 3.797560930252075e-05, 3.940518945455551e-05, 4.083476960659027e-05, 4.226434975862503e-05, 4.369392991065979e-05, 4.512351006269455e-05, 4.655309021472931e-05, 4.798267036676407e-05, 4.941225051879883e-05]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [135.0, 852.0, 33.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.440404606815719e-07, -1.346054148143594e-07, 2.748296310528531e-07, 6.842646484983561e-07, 1.0936996659438591e-06, 1.5031348539196188e-06, 1.912569814521703e-06, 2.3220050024974626e-06, 2.7314399630995467e-06, 3.140874923701631e-06, 3.5503101116773905e-06, 3.95974529965315e-06, 4.369180260255234e-06, 4.7786152208573185e-06, 5.188050181459403e-06, 5.597485142061487e-06, 6.006920102663571e-06, 6.416355063265655e-06, 6.825790023867739e-06, 7.2352249844698235e-06, 7.644660399819259e-06, 8.054095815168694e-06, 8.463530321023427e-06, 8.872965736372862e-06, 9.282400242227595e-06, 9.69183565757703e-06, 1.0101270163431764e-05, 1.0510705578781199e-05, 1.0920140084635932e-05, 1.1329575499985367e-05, 1.17390100058401e-05, 1.2148445421189535e-05, 1.2557881746033672e-05, 1.2967317161383107e-05, 1.337675166723784e-05, 1.3786187082587276e-05, 1.4195621588442009e-05, 1.4605057003791444e-05, 1.5014491509646177e-05, 1.5423927834490314e-05, 1.5833362340345047e-05, 1.624279684619978e-05, 1.6652233171043918e-05, 1.706166767689865e-05, 1.7471102182753384e-05, 1.788053850759752e-05, 1.8289973013452254e-05, 1.8699407519306988e-05, 1.910884202516172e-05, 1.9518276531016454e-05, 1.992771285586059e-05, 2.0337147361715324e-05, 2.0746581867570058e-05, 2.1156018192414194e-05, 2.1565452698268928e-05, 2.197488720412366e-05, 2.2384323528967798e-05, 2.279375803482253e-05, 2.3203194359666668e-05, 2.36126288655214e-05, 2.4022063371376134e-05, 2.4431497877230868e-05, 2.4840934202075005e-05, 2.5250368707929738e-05, 2.565980321378447e-05]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 6.0, 0.0, 9.0, 0.0, 12.0, 0.0, 11.0, 13.0, 0.0, 23.0, 0.0, 33.0, 0.0, 41.0, 0.0, 53.0, 0.0, 76.0, 0.0, 81.0, 0.0, 109.0, 0.0, 102.0, 95.0, 0.0, 85.0, 0.0, 67.0, 0.0, 52.0, 0.0, 42.0, 0.0, 32.0, 0.0, 20.0, 0.0, 15.0, 13.0, 0.0, 8.0, 0.0, 6.0, 0.0, 6.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.0132789611816406e-06, -9.816139936447144e-07, -9.499490261077881e-07, -9.182840585708618e-07, -8.866190910339355e-07, -8.549541234970093e-07, -8.23289155960083e-07, -7.916241884231567e-07, -7.599592208862305e-07, -7.282942533493042e-07, -6.966292858123779e-07, -6.649643182754517e-07, -6.332993507385254e-07, -6.016343832015991e-07, -5.699694156646729e-07, -5.383044481277466e-07, -5.066394805908203e-07, -4.7497451305389404e-07, -4.4330954551696777e-07, -4.116445779800415e-07, -3.7997961044311523e-07, -3.4831464290618896e-07, -3.166496753692627e-07, -2.849847078323364e-07, -2.5331974029541016e-07, -2.2165477275848389e-07, -1.8998980522155762e-07, -1.5832483768463135e-07, -1.2665987014770508e-07, -9.499490261077881e-08, -6.332993507385254e-08, -3.166496753692627e-08, 0.0, 3.166496753692627e-08, 6.332993507385254e-08, 9.499490261077881e-08, 1.2665987014770508e-07, 1.5832483768463135e-07, 1.8998980522155762e-07, 2.2165477275848389e-07, 2.5331974029541016e-07, 2.849847078323364e-07, 3.166496753692627e-07, 3.4831464290618896e-07, 3.7997961044311523e-07, 4.116445779800415e-07, 4.4330954551696777e-07, 4.7497451305389404e-07, 5.066394805908203e-07, 5.383044481277466e-07, 5.699694156646729e-07, 6.016343832015991e-07, 6.332993507385254e-07, 6.649643182754517e-07, 6.966292858123779e-07, 7.282942533493042e-07, 7.599592208862305e-07, 7.916241884231567e-07, 8.23289155960083e-07, 8.549541234970093e-07, 8.866190910339355e-07, 9.182840585708618e-07, 9.499490261077881e-07, 9.816139936447144e-07, 1.0132789611816406e-06]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 7.0, 4.0, 5.0, 10.0, 9.0, 14.0, 15.0, 16.0, 20.0, 20.0, 14.0, 27.0, 27.0, 31.0, 43.0, 27.0, 40.0, 39.0, 34.0, 47.0, 49.0, 39.0, 46.0, 26.0, 45.0, 35.0, 45.0, 43.0, 35.0, 36.0, 26.0, 22.0, 22.0, 13.0, 21.0, 12.0, 10.0, 13.0, 4.0, 3.0, 5.0, 3.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.77734375, -3.6337890625, -3.490234375, -3.3466796875, -3.203125, -3.0595703125, -2.916015625, -2.7724609375, -2.62890625, -2.4853515625, -2.341796875, -2.1982421875, -2.0546875, -1.9111328125, -1.767578125, -1.6240234375, -1.48046875, -1.3369140625, -1.193359375, -1.0498046875, -0.90625, -0.7626953125, -0.619140625, -0.4755859375, -0.33203125, -0.1884765625, -0.044921875, 0.0986328125, 0.2421875, 0.3857421875, 0.529296875, 0.6728515625, 0.81640625, 0.9599609375, 1.103515625, 1.2470703125, 1.390625, 1.5341796875, 1.677734375, 1.8212890625, 1.96484375, 2.1083984375, 2.251953125, 2.3955078125, 2.5390625, 2.6826171875, 2.826171875, 2.9697265625, 3.11328125, 3.2568359375, 3.400390625, 3.5439453125, 3.6875, 3.8310546875, 3.974609375, 4.1181640625, 4.26171875, 4.4052734375, 4.548828125, 4.6923828125, 4.8359375, 4.9794921875, 5.123046875, 5.2666015625, 5.41015625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 5.0, 5.0, 13.0, 13.0, 20.0, 21.0, 33.0, 63.0, 73.0, 101.0, 136.0, 192.0, 307.0, 426.0, 701.0, 1008.0, 1549.0, 2288.0, 3599.0, 5671.0, 8651.0, 13540.0, 21440.0, 34932.0, 57832.0, 100797.0, 182807.0, 274526.0, 136405.0, 78568.0, 46082.0, 27662.0, 17400.0, 11204.0, 7150.0, 4594.0, 2989.0, 1918.0, 1248.0, 856.0, 538.0, 376.0, 250.0, 167.0, 121.0, 78.0, 61.0, 46.0, 29.0, 25.0, 14.0, 12.0, 5.0, 4.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.4921875, -4.34381103515625, -4.1954345703125, -4.04705810546875, -3.898681640625, -3.75030517578125, -3.6019287109375, -3.45355224609375, -3.30517578125, -3.15679931640625, -3.0084228515625, -2.86004638671875, -2.711669921875, -2.56329345703125, -2.4149169921875, -2.26654052734375, -2.1181640625, -1.96978759765625, -1.8214111328125, -1.67303466796875, -1.524658203125, -1.37628173828125, -1.2279052734375, -1.07952880859375, -0.93115234375, -0.78277587890625, -0.6343994140625, -0.48602294921875, -0.337646484375, -0.18927001953125, -0.0408935546875, 0.10748291015625, 0.255859375, 0.40423583984375, 0.5526123046875, 0.70098876953125, 0.849365234375, 0.99774169921875, 1.1461181640625, 1.29449462890625, 1.44287109375, 1.59124755859375, 1.7396240234375, 1.88800048828125, 2.036376953125, 2.18475341796875, 2.3331298828125, 2.48150634765625, 2.6298828125, 2.77825927734375, 2.9266357421875, 3.07501220703125, 3.223388671875, 3.37176513671875, 3.5201416015625, 3.66851806640625, 3.81689453125, 3.96527099609375, 4.1136474609375, 4.26202392578125, 4.410400390625, 4.55877685546875, 4.7071533203125, 4.85552978515625, 5.00390625]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 1.0, 5.0, 4.0, 8.0, 8.0, 7.0, 3.0, 8.0, 9.0, 10.0, 10.0, 11.0, 28.0, 14.0, 23.0, 22.0, 23.0, 32.0, 30.0, 34.0, 30.0, 62.0, 54.0, 87.0, 108.0, 190.0, 1350.0, 244.0, 129.0, 81.0, 67.0, 48.0, 28.0, 26.0, 40.0, 39.0, 24.0, 19.0, 31.0, 14.0, 16.0, 14.0, 9.0, 14.0, 8.0, 7.0, 10.0, 2.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.8046875, -9.4847412109375, -9.164794921875, -8.8448486328125, -8.52490234375, -8.2049560546875, -7.885009765625, -7.5650634765625, -7.2451171875, -6.9251708984375, -6.605224609375, -6.2852783203125, -5.96533203125, -5.6453857421875, -5.325439453125, -5.0054931640625, -4.685546875, -4.3656005859375, -4.045654296875, -3.7257080078125, -3.40576171875, -3.0858154296875, -2.765869140625, -2.4459228515625, -2.1259765625, -1.8060302734375, -1.486083984375, -1.1661376953125, -0.84619140625, -0.5262451171875, -0.206298828125, 0.1136474609375, 0.43359375, 0.7535400390625, 1.073486328125, 1.3934326171875, 1.71337890625, 2.0333251953125, 2.353271484375, 2.6732177734375, 2.9931640625, 3.3131103515625, 3.633056640625, 3.9530029296875, 4.27294921875, 4.5928955078125, 4.912841796875, 5.2327880859375, 5.552734375, 5.8726806640625, 6.192626953125, 6.5125732421875, 6.83251953125, 7.1524658203125, 7.472412109375, 7.7923583984375, 8.1123046875, 8.4322509765625, 8.752197265625, 9.0721435546875, 9.39208984375, 9.7120361328125, 10.031982421875, 10.3519287109375, 10.671875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 8.0, 9.0, 9.0, 8.0, 11.0, 15.0, 27.0, 29.0, 32.0, 42.0, 76.0, 69.0, 143.0, 188.0, 469.0, 1269.0, 4846.0, 23911.0, 164034.0, 2398536.0, 489662.0, 49519.0, 9188.0, 2107.0, 657.0, 275.0, 155.0, 94.0, 60.0, 51.0, 48.0, 40.0, 32.0, 15.0, 13.0, 15.0, 8.0, 6.0, 7.0, 8.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-13.90625, -13.4676513671875, -13.029052734375, -12.5904541015625, -12.15185546875, -11.7132568359375, -11.274658203125, -10.8360595703125, -10.3974609375, -9.9588623046875, -9.520263671875, -9.0816650390625, -8.64306640625, -8.2044677734375, -7.765869140625, -7.3272705078125, -6.888671875, -6.4500732421875, -6.011474609375, -5.5728759765625, -5.13427734375, -4.6956787109375, -4.257080078125, -3.8184814453125, -3.3798828125, -2.9412841796875, -2.502685546875, -2.0640869140625, -1.62548828125, -1.1868896484375, -0.748291015625, -0.3096923828125, 0.12890625, 0.5675048828125, 1.006103515625, 1.4447021484375, 1.88330078125, 2.3218994140625, 2.760498046875, 3.1990966796875, 3.6376953125, 4.0762939453125, 4.514892578125, 4.9534912109375, 5.39208984375, 5.8306884765625, 6.269287109375, 6.7078857421875, 7.146484375, 7.5850830078125, 8.023681640625, 8.4622802734375, 8.90087890625, 9.3394775390625, 9.778076171875, 10.2166748046875, 10.6552734375, 11.0938720703125, 11.532470703125, 11.9710693359375, 12.40966796875, 12.8482666015625, 13.286865234375, 13.7254638671875, 14.1640625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 17.0, 79.0, 310.0, 385.0, 180.0, 36.0, 6.0, 2.0, 1.0], "bins": [-177.2153778076172, -174.1724395751953, -171.12950134277344, -168.08656311035156, -165.0436248779297, -162.0006866455078, -158.95774841308594, -155.91481018066406, -152.8718719482422, -149.8289337158203, -146.78599548339844, -143.74305725097656, -140.7001190185547, -137.6571807861328, -134.61424255371094, -131.57130432128906, -128.52838134765625, -125.48544311523438, -122.4425048828125, -119.39956665039062, -116.35662841796875, -113.31369018554688, -110.270751953125, -107.22782135009766, -104.18487548828125, -101.14193725585938, -98.0989990234375, -95.05606079101562, -92.01312255859375, -88.97018432617188, -85.92724609375, -82.88431549072266, -79.84138488769531, -76.79844665527344, -73.75550842285156, -70.71257019042969, -67.66963195800781, -64.62669372558594, -61.58375930786133, -58.54082489013672, -55.49788284301758, -52.4549446105957, -49.41200637817383, -46.36907196044922, -43.326133728027344, -40.28319549560547, -37.240257263183594, -34.19731903076172, -31.154382705688477, -28.1114444732666, -25.06850814819336, -22.025569915771484, -18.98263168334961, -15.939695358276367, -12.896757125854492, -9.85382080078125, -6.810882568359375, -3.7679450511932373, -0.7250075340270996, 2.317930221557617, 5.360867500305176, 8.403804779052734, 11.44674301147461, 14.489679336547852, 17.532617568969727]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 2.0, 4.0, 2.0, 3.0, 7.0, 4.0, 8.0, 15.0, 13.0, 13.0, 24.0, 20.0, 23.0, 40.0, 49.0, 34.0, 44.0, 40.0, 41.0, 43.0, 41.0, 42.0, 44.0, 51.0, 54.0, 52.0, 42.0, 34.0, 38.0, 33.0, 24.0, 25.0, 18.0, 19.0, 8.0, 10.0, 11.0, 7.0, 13.0, 5.0, 5.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.805797576904297, -28.655921936035156, -27.506046295166016, -26.356168746948242, -25.2062931060791, -24.05641746520996, -22.906539916992188, -21.756664276123047, -20.606788635253906, -19.456912994384766, -18.307037353515625, -17.15715980529785, -16.00728416442871, -14.85740852355957, -13.707531929016113, -12.557655334472656, -11.407779693603516, -10.257904052734375, -9.108027458190918, -7.958151340484619, -6.80827522277832, -5.6583991050720215, -4.508522987365723, -3.3586463928222656, -2.208770751953125, -1.0588946342468262, 0.09098148345947266, 1.2408576011657715, 2.3907337188720703, 3.540609836578369, 4.690485954284668, 5.840362548828125, 6.990234375, 8.14011001586914, 9.289986610412598, 10.439863204956055, 11.589738845825195, 12.739614486694336, 13.889491081237793, 15.03936767578125, 16.18924331665039, 17.33911895751953, 18.488994598388672, 19.638872146606445, 20.788747787475586, 21.938623428344727, 23.0885009765625, 24.23837661743164, 25.38825225830078, 26.538127899169922, 27.688003540039062, 28.837881088256836, 29.987756729125977, 31.137632369995117, 32.28750991821289, 33.43738555908203, 34.58726119995117, 35.73713684082031, 36.88701248168945, 38.036888122558594, 39.186767578125, 40.33664321899414, 41.48651885986328, 42.63639450073242, 43.78627014160156]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 8.0, 11.0, 8.0, 21.0, 17.0, 22.0, 15.0, 23.0, 29.0, 35.0, 33.0, 31.0, 41.0, 40.0, 39.0, 53.0, 56.0, 39.0, 46.0, 43.0, 41.0, 53.0, 49.0, 40.0, 36.0, 33.0, 29.0, 18.0, 18.0, 16.0, 13.0, 13.0, 8.0, 5.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.51171875, -4.35260009765625, -4.1934814453125, -4.03436279296875, -3.875244140625, -3.71612548828125, -3.5570068359375, -3.39788818359375, -3.23876953125, -3.07965087890625, -2.9205322265625, -2.76141357421875, -2.602294921875, -2.44317626953125, -2.2840576171875, -2.12493896484375, -1.9658203125, -1.80670166015625, -1.6475830078125, -1.48846435546875, -1.329345703125, -1.17022705078125, -1.0111083984375, -0.85198974609375, -0.69287109375, -0.53375244140625, -0.3746337890625, -0.21551513671875, -0.056396484375, 0.10272216796875, 0.2618408203125, 0.42095947265625, 0.580078125, 0.73919677734375, 0.8983154296875, 1.05743408203125, 1.216552734375, 1.37567138671875, 1.5347900390625, 1.69390869140625, 1.85302734375, 2.01214599609375, 2.1712646484375, 2.33038330078125, 2.489501953125, 2.64862060546875, 2.8077392578125, 2.96685791015625, 3.1259765625, 3.28509521484375, 3.4442138671875, 3.60333251953125, 3.762451171875, 3.92156982421875, 4.0806884765625, 4.23980712890625, 4.39892578125, 4.55804443359375, 4.7171630859375, 4.87628173828125, 5.035400390625, 5.19451904296875, 5.3536376953125, 5.51275634765625, 5.671875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 11.0, 12.0, 14.0, 15.0, 24.0, 21.0, 31.0, 36.0, 61.0, 78.0, 78.0, 119.0, 219.0, 270.0, 444.0, 1688.0, 283132.0, 3902240.0, 4147.0, 509.0, 326.0, 202.0, 165.0, 94.0, 62.0, 62.0, 46.0, 37.0, 28.0, 23.0, 18.0, 13.0, 13.0, 11.0, 8.0, 5.0, 7.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.4375, -58.4326171875, -56.427734375, -54.4228515625, -52.41796875, -50.4130859375, -48.408203125, -46.4033203125, -44.3984375, -42.3935546875, -40.388671875, -38.3837890625, -36.37890625, -34.3740234375, -32.369140625, -30.3642578125, -28.359375, -26.3544921875, -24.349609375, -22.3447265625, -20.33984375, -18.3349609375, -16.330078125, -14.3251953125, -12.3203125, -10.3154296875, -8.310546875, -6.3056640625, -4.30078125, -2.2958984375, -0.291015625, 1.7138671875, 3.71875, 5.7236328125, 7.728515625, 9.7333984375, 11.73828125, 13.7431640625, 15.748046875, 17.7529296875, 19.7578125, 21.7626953125, 23.767578125, 25.7724609375, 27.77734375, 29.7822265625, 31.787109375, 33.7919921875, 35.796875, 37.8017578125, 39.806640625, 41.8115234375, 43.81640625, 45.8212890625, 47.826171875, 49.8310546875, 51.8359375, 53.8408203125, 55.845703125, 57.8505859375, 59.85546875, 61.8603515625, 63.865234375, 65.8701171875, 67.875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 6.0, 4.0, 7.0, 10.0, 9.0, 12.0, 22.0, 32.0, 26.0, 58.0, 64.0, 82.0, 151.0, 159.0, 225.0, 337.0, 497.0, 613.0, 521.0, 366.0, 223.0, 152.0, 133.0, 82.0, 72.0, 49.0, 42.0, 24.0, 20.0, 16.0, 21.0, 8.0, 9.0, 7.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3671875, -6.1583251953125, -5.949462890625, -5.7406005859375, -5.53173828125, -5.3228759765625, -5.114013671875, -4.9051513671875, -4.6962890625, -4.4874267578125, -4.278564453125, -4.0697021484375, -3.86083984375, -3.6519775390625, -3.443115234375, -3.2342529296875, -3.025390625, -2.8165283203125, -2.607666015625, -2.3988037109375, -2.18994140625, -1.9810791015625, -1.772216796875, -1.5633544921875, -1.3544921875, -1.1456298828125, -0.936767578125, -0.7279052734375, -0.51904296875, -0.3101806640625, -0.101318359375, 0.1075439453125, 0.31640625, 0.5252685546875, 0.734130859375, 0.9429931640625, 1.15185546875, 1.3607177734375, 1.569580078125, 1.7784423828125, 1.9873046875, 2.1961669921875, 2.405029296875, 2.6138916015625, 2.82275390625, 3.0316162109375, 3.240478515625, 3.4493408203125, 3.658203125, 3.8670654296875, 4.075927734375, 4.2847900390625, 4.49365234375, 4.7025146484375, 4.911376953125, 5.1202392578125, 5.3291015625, 5.5379638671875, 5.746826171875, 5.9556884765625, 6.16455078125, 6.3734130859375, 6.582275390625, 6.7911376953125, 7.0]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 7.0, 2.0, 9.0, 14.0, 13.0, 21.0, 20.0, 33.0, 51.0, 116.0, 280.0, 1128.0, 7638.0, 174921.0, 3908421.0, 94840.0, 5405.0, 918.0, 205.0, 97.0, 58.0, 31.0, 21.0, 14.0, 8.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.8125, -33.80126953125, -32.7900390625, -31.77880859375, -30.767578125, -29.75634765625, -28.7451171875, -27.73388671875, -26.72265625, -25.71142578125, -24.7001953125, -23.68896484375, -22.677734375, -21.66650390625, -20.6552734375, -19.64404296875, -18.6328125, -17.62158203125, -16.6103515625, -15.59912109375, -14.587890625, -13.57666015625, -12.5654296875, -11.55419921875, -10.54296875, -9.53173828125, -8.5205078125, -7.50927734375, -6.498046875, -5.48681640625, -4.4755859375, -3.46435546875, -2.453125, -1.44189453125, -0.4306640625, 0.58056640625, 1.591796875, 2.60302734375, 3.6142578125, 4.62548828125, 5.63671875, 6.64794921875, 7.6591796875, 8.67041015625, 9.681640625, 10.69287109375, 11.7041015625, 12.71533203125, 13.7265625, 14.73779296875, 15.7490234375, 16.76025390625, 17.771484375, 18.78271484375, 19.7939453125, 20.80517578125, 21.81640625, 22.82763671875, 23.8388671875, 24.85009765625, 25.861328125, 26.87255859375, 27.8837890625, 28.89501953125, 29.90625]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 9.0, 22.0, 104.0, 295.0, 369.0, 163.0, 39.0, 17.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-157.0868377685547, -154.0750732421875, -151.06329345703125, -148.05152893066406, -145.03976440429688, -142.02798461914062, -139.01622009277344, -136.00445556640625, -132.99267578125, -129.9809112548828, -126.9691390991211, -123.95736694335938, -120.94559478759766, -117.93382263183594, -114.92205810546875, -111.91028594970703, -108.89851379394531, -105.8867416381836, -102.8749771118164, -99.86320495605469, -96.85143280029297, -93.83966064453125, -90.82789611816406, -87.81612396240234, -84.80435943603516, -81.79258728027344, -78.78082275390625, -75.76905059814453, -72.75727844238281, -69.7455062866211, -66.7337417602539, -63.72196960449219, -60.71019744873047, -57.698429107666016, -54.6866569519043, -51.674888610839844, -48.663116455078125, -45.65134811401367, -42.63957977294922, -39.6278076171875, -36.61603546142578, -33.60426712036133, -30.59249496459961, -27.580726623535156, -24.568954467773438, -21.557186126708984, -18.5454158782959, -15.533645629882812, -12.52187728881836, -9.510107040405273, -6.498337268829346, -3.486567497253418, -0.47479724884033203, 2.536972999572754, 5.548742294311523, 8.56051254272461, 11.572282791137695, 14.584053039550781, 17.595823287963867, 20.607593536376953, 23.619361877441406, 26.631134033203125, 29.642902374267578, 32.65467071533203, 35.66644287109375]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 3.0, 4.0, 11.0, 5.0, 12.0, 8.0, 15.0, 13.0, 17.0, 18.0, 26.0, 22.0, 28.0, 24.0, 33.0, 34.0, 40.0, 44.0, 42.0, 33.0, 36.0, 39.0, 49.0, 39.0, 37.0, 37.0, 42.0, 29.0, 20.0, 37.0, 34.0, 34.0, 23.0, 17.0, 16.0, 16.0, 7.0, 7.0, 9.0, 8.0, 6.0, 4.0, 2.0, 6.0, 2.0, 1.0, 0.0, 4.0, 3.0, 1.0, 0.0, 2.0], "bins": [-21.501502990722656, -20.853721618652344, -20.20594024658203, -19.55815887451172, -18.910377502441406, -18.262596130371094, -17.61481475830078, -16.96703338623047, -16.319252014160156, -15.671470642089844, -15.023689270019531, -14.375907897949219, -13.728126525878906, -13.080345153808594, -12.432564735412598, -11.784783363342285, -11.137002944946289, -10.489221572875977, -9.841440200805664, -9.193658828735352, -8.545877456665039, -7.898096561431885, -7.2503156661987305, -6.602534294128418, -5.9547529220581055, -5.306971549987793, -4.6591901779174805, -4.011409282684326, -3.3636279106140137, -2.715846538543701, -2.0680654048919678, -1.4202842712402344, -0.7725028991699219, -0.12472164630889893, 0.523059606552124, 1.170840859413147, 1.81862211227417, 2.4664034843444824, 3.114184617996216, 3.761965751647949, 4.409747123718262, 5.057528495788574, 5.705309867858887, 6.353090763092041, 7.0008721351623535, 7.648653507232666, 8.29643440246582, 8.944215774536133, 9.591997146606445, 10.239778518676758, 10.88755989074707, 11.535341262817383, 12.183122634887695, 12.830904006958008, 13.478684425354004, 14.126465797424316, 14.774247169494629, 15.422028541564941, 16.069808959960938, 16.71759033203125, 17.365371704101562, 18.013153076171875, 18.660934448242188, 19.3087158203125, 19.956497192382812]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 11.0, 9.0, 4.0, 9.0, 12.0, 14.0, 15.0, 20.0, 22.0, 30.0, 23.0, 45.0, 34.0, 38.0, 41.0, 38.0, 39.0, 39.0, 42.0, 47.0, 36.0, 58.0, 55.0, 43.0, 45.0, 39.0, 22.0, 31.0, 28.0, 26.0, 14.0, 12.0, 18.0, 13.0, 7.0, 2.0, 9.0, 6.0, 2.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.55859375, -4.40673828125, -4.2548828125, -4.10302734375, -3.951171875, -3.79931640625, -3.6474609375, -3.49560546875, -3.34375, -3.19189453125, -3.0400390625, -2.88818359375, -2.736328125, -2.58447265625, -2.4326171875, -2.28076171875, -2.12890625, -1.97705078125, -1.8251953125, -1.67333984375, -1.521484375, -1.36962890625, -1.2177734375, -1.06591796875, -0.9140625, -0.76220703125, -0.6103515625, -0.45849609375, -0.306640625, -0.15478515625, -0.0029296875, 0.14892578125, 0.30078125, 0.45263671875, 0.6044921875, 0.75634765625, 0.908203125, 1.06005859375, 1.2119140625, 1.36376953125, 1.515625, 1.66748046875, 1.8193359375, 1.97119140625, 2.123046875, 2.27490234375, 2.4267578125, 2.57861328125, 2.73046875, 2.88232421875, 3.0341796875, 3.18603515625, 3.337890625, 3.48974609375, 3.6416015625, 3.79345703125, 3.9453125, 4.09716796875, 4.2490234375, 4.40087890625, 4.552734375, 4.70458984375, 4.8564453125, 5.00830078125, 5.16015625]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 13.0, 20.0, 9.0, 24.0, 44.0, 50.0, 75.0, 120.0, 169.0, 270.0, 404.0, 578.0, 881.0, 1270.0, 1945.0, 3017.0, 4546.0, 6918.0, 10764.0, 16554.0, 25736.0, 41536.0, 67785.0, 115162.0, 196834.0, 220348.0, 130470.0, 76498.0, 45798.0, 28449.0, 18214.0, 11709.0, 7494.0, 5018.0, 3235.0, 2176.0, 1397.0, 1040.0, 684.0, 432.0, 301.0, 181.0, 124.0, 91.0, 55.0, 29.0, 22.0, 28.0, 16.0, 7.0, 7.0, 1.0, 3.0, 2.0, 5.0], "bins": [-0.03131103515625, -0.030393123626708984, -0.02947521209716797, -0.028557300567626953, -0.027639389038085938, -0.026721477508544922, -0.025803565979003906, -0.02488565444946289, -0.023967742919921875, -0.02304983139038086, -0.022131919860839844, -0.021214008331298828, -0.020296096801757812, -0.019378185272216797, -0.01846027374267578, -0.017542362213134766, -0.01662445068359375, -0.015706539154052734, -0.014788627624511719, -0.013870716094970703, -0.012952804565429688, -0.012034893035888672, -0.011116981506347656, -0.01019906997680664, -0.009281158447265625, -0.00836324691772461, -0.007445335388183594, -0.006527423858642578, -0.0056095123291015625, -0.004691600799560547, -0.0037736892700195312, -0.0028557777404785156, -0.0019378662109375, -0.0010199546813964844, -0.00010204315185546875, 0.0008158683776855469, 0.0017337799072265625, 0.002651691436767578, 0.0035696029663085938, 0.004487514495849609, 0.005405426025390625, 0.006323337554931641, 0.007241249084472656, 0.008159160614013672, 0.009077072143554688, 0.009994983673095703, 0.010912895202636719, 0.011830806732177734, 0.01274871826171875, 0.013666629791259766, 0.014584541320800781, 0.015502452850341797, 0.016420364379882812, 0.017338275909423828, 0.018256187438964844, 0.01917409896850586, 0.020092010498046875, 0.02100992202758789, 0.021927833557128906, 0.022845745086669922, 0.023763656616210938, 0.024681568145751953, 0.02559947967529297, 0.026517391204833984, 0.027435302734375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 7.0, 4.0, 12.0, 8.0, 5.0, 12.0, 9.0, 9.0, 18.0, 17.0, 21.0, 16.0, 25.0, 24.0, 24.0, 38.0, 31.0, 38.0, 38.0, 26.0, 33.0, 28.0, 45.0, 1064.0, 43.0, 30.0, 34.0, 38.0, 43.0, 38.0, 29.0, 38.0, 21.0, 25.0, 20.0, 16.0, 17.0, 18.0, 12.0, 14.0, 7.0, 12.0, 5.0, 1.0, 4.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.455078125, -3.344146728515625, -3.23321533203125, -3.122283935546875, -3.0113525390625, -2.900421142578125, -2.78948974609375, -2.678558349609375, -2.567626953125, -2.456695556640625, -2.34576416015625, -2.234832763671875, -2.1239013671875, -2.012969970703125, -1.90203857421875, -1.791107177734375, -1.68017578125, -1.569244384765625, -1.45831298828125, -1.347381591796875, -1.2364501953125, -1.125518798828125, -1.01458740234375, -0.903656005859375, -0.792724609375, -0.681793212890625, -0.57086181640625, -0.459930419921875, -0.3489990234375, -0.238067626953125, -0.12713623046875, -0.016204833984375, 0.0947265625, 0.205657958984375, 0.31658935546875, 0.427520751953125, 0.5384521484375, 0.649383544921875, 0.76031494140625, 0.871246337890625, 0.982177734375, 1.093109130859375, 1.20404052734375, 1.314971923828125, 1.4259033203125, 1.536834716796875, 1.64776611328125, 1.758697509765625, 1.86962890625, 1.980560302734375, 2.09149169921875, 2.202423095703125, 2.3133544921875, 2.424285888671875, 2.53521728515625, 2.646148681640625, 2.757080078125, 2.868011474609375, 2.97894287109375, 3.089874267578125, 3.2008056640625, 3.311737060546875, 3.42266845703125, 3.533599853515625, 3.64453125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 4.0, 3.0, 10.0, 16.0, 8.0, 15.0, 20.0, 31.0, 57.0, 82.0, 129.0, 167.0, 226.0, 313.0, 460.0, 679.0, 936.0, 1324.0, 1967.0, 2946.0, 4105.0, 6119.0, 8909.0, 13251.0, 19582.0, 29283.0, 44892.0, 69324.0, 107847.0, 169693.0, 1240814.0, 130051.0, 82679.0, 53906.0, 34815.0, 23231.0, 15695.0, 10540.0, 7291.0, 4872.0, 3340.0, 2292.0, 1529.0, 1124.0, 753.0, 559.0, 393.0, 259.0, 183.0, 118.0, 110.0, 64.0, 41.0, 32.0, 20.0, 9.0, 11.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.01202392578125, -0.011638641357421875, -0.01125335693359375, -0.010868072509765625, -0.0104827880859375, -0.010097503662109375, -0.00971221923828125, -0.009326934814453125, -0.008941650390625, -0.008556365966796875, -0.00817108154296875, -0.007785797119140625, -0.0074005126953125, -0.007015228271484375, -0.00662994384765625, -0.006244659423828125, -0.005859375, -0.005474090576171875, -0.00508880615234375, -0.004703521728515625, -0.0043182373046875, -0.003932952880859375, -0.00354766845703125, -0.003162384033203125, -0.002777099609375, -0.002391815185546875, -0.00200653076171875, -0.001621246337890625, -0.0012359619140625, -0.000850677490234375, -0.00046539306640625, -8.0108642578125e-05, 0.00030517578125, 0.000690460205078125, 0.00107574462890625, 0.001461029052734375, 0.0018463134765625, 0.002231597900390625, 0.00261688232421875, 0.003002166748046875, 0.003387451171875, 0.003772735595703125, 0.00415802001953125, 0.004543304443359375, 0.0049285888671875, 0.005313873291015625, 0.00569915771484375, 0.006084442138671875, 0.0064697265625, 0.006855010986328125, 0.00724029541015625, 0.007625579833984375, 0.0080108642578125, 0.008396148681640625, 0.00878143310546875, 0.009166717529296875, 0.009552001953125, 0.009937286376953125, 0.01032257080078125, 0.010707855224609375, 0.0110931396484375, 0.011478424072265625, 0.01186370849609375, 0.012248992919921875, 0.01263427734375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 12.0, 0.0, 9.0, 3.0, 8.0, 0.0, 11.0, 20.0, 20.0, 0.0, 12.0, 13.0, 19.0, 0.0, 27.0, 52.0, 56.0, 84.0, 0.0, 107.0, 123.0, 106.0, 0.0, 83.0, 45.0, 45.0, 0.0, 30.0, 27.0, 23.0, 0.0, 14.0, 15.0, 8.0, 4.0, 0.0, 12.0, 8.0, 3.0, 0.0, 2.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.6689300537109375e-06, -1.623295247554779e-06, -1.5776604413986206e-06, -1.5320256352424622e-06, -1.4863908290863037e-06, -1.4407560229301453e-06, -1.3951212167739868e-06, -1.3494864106178284e-06, -1.30385160446167e-06, -1.2582167983055115e-06, -1.212581992149353e-06, -1.1669471859931946e-06, -1.1213123798370361e-06, -1.0756775736808777e-06, -1.0300427675247192e-06, -9.844079613685608e-07, -9.387731552124023e-07, -8.931383490562439e-07, -8.475035429000854e-07, -8.01868736743927e-07, -7.562339305877686e-07, -7.105991244316101e-07, -6.649643182754517e-07, -6.193295121192932e-07, -5.736947059631348e-07, -5.280598998069763e-07, -4.824250936508179e-07, -4.367902874946594e-07, -3.91155481338501e-07, -3.4552067518234253e-07, -2.998858690261841e-07, -2.5425106287002563e-07, -2.086162567138672e-07, -1.6298145055770874e-07, -1.1734664440155029e-07, -7.171183824539185e-08, -2.60770320892334e-08, 1.955777406692505e-08, 6.51925802230835e-08, 1.1082738637924194e-07, 1.564621925354004e-07, 2.0209699869155884e-07, 2.477318048477173e-07, 2.9336661100387573e-07, 3.390014171600342e-07, 3.8463622331619263e-07, 4.302710294723511e-07, 4.759058356285095e-07, 5.21540641784668e-07, 5.671754479408264e-07, 6.128102540969849e-07, 6.584450602531433e-07, 7.040798664093018e-07, 7.497146725654602e-07, 7.953494787216187e-07, 8.409842848777771e-07, 8.866190910339355e-07, 9.32253897190094e-07, 9.778887033462524e-07, 1.0235235095024109e-06, 1.0691583156585693e-06, 1.1147931218147278e-06, 1.1604279279708862e-06, 1.2060627341270447e-06, 1.2516975402832031e-06]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 5.0, 12.0, 5.0, 7.0, 7.0, 8.0, 15.0, 16.0, 26.0, 36.0, 39.0, 53.0, 99.0, 189.0, 419.0, 4292.0, 935321.0, 105947.0, 1243.0, 346.0, 134.0, 86.0, 49.0, 46.0, 30.0, 27.0, 12.0, 12.0, 18.0, 15.0, 8.0, 5.0, 4.0, 8.0, 9.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9802322387695312e-05, -2.864748239517212e-05, -2.7492642402648926e-05, -2.6337802410125732e-05, -2.518296241760254e-05, -2.4028122425079346e-05, -2.2873282432556152e-05, -2.171844244003296e-05, -2.0563602447509766e-05, -1.9408762454986572e-05, -1.825392246246338e-05, -1.7099082469940186e-05, -1.5944242477416992e-05, -1.4789402484893799e-05, -1.3634562492370605e-05, -1.2479722499847412e-05, -1.1324882507324219e-05, -1.0170042514801025e-05, -9.015202522277832e-06, -7.860362529754639e-06, -6.705522537231445e-06, -5.550682544708252e-06, -4.395842552185059e-06, -3.2410025596618652e-06, -2.086162567138672e-06, -9.313225746154785e-07, 2.2351741790771484e-07, 1.3783574104309082e-06, 2.5331974029541016e-06, 3.688037395477295e-06, 4.842877388000488e-06, 5.997717380523682e-06, 7.152557373046875e-06, 8.307397365570068e-06, 9.462237358093262e-06, 1.0617077350616455e-05, 1.1771917343139648e-05, 1.2926757335662842e-05, 1.4081597328186035e-05, 1.5236437320709229e-05, 1.6391277313232422e-05, 1.7546117305755615e-05, 1.870095729827881e-05, 1.9855797290802002e-05, 2.1010637283325195e-05, 2.216547727584839e-05, 2.3320317268371582e-05, 2.4475157260894775e-05, 2.562999725341797e-05, 2.6784837245941162e-05, 2.7939677238464355e-05, 2.909451723098755e-05, 3.0249357223510742e-05, 3.1404197216033936e-05, 3.255903720855713e-05, 3.371387720108032e-05, 3.4868717193603516e-05, 3.602355718612671e-05, 3.71783971786499e-05, 3.8333237171173096e-05, 3.948807716369629e-05, 4.064291715621948e-05, 4.1797757148742676e-05, 4.295259714126587e-05, 4.410743713378906e-05]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [136.0, 852.0, 32.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.463166985464341e-07, -1.3300893897394417e-07, 2.802988205985457e-07, 6.936065233276167e-07, 1.1069143965869443e-06, 1.520222213002853e-06, 1.9335298020450864e-06, 2.346837618460995e-06, 2.760145434876904e-06, 3.1734532512928126e-06, 3.5867610677087214e-06, 4.000068656750955e-06, 4.413376700540539e-06, 4.826684289582772e-06, 5.2399918786250055e-06, 5.65329992241459e-06, 6.066607511456823e-06, 6.479915100499056e-06, 6.8932231442886405e-06, 7.306530733330874e-06, 7.719838322373107e-06, 8.133146366162691e-06, 8.546454409952275e-06, 8.959761544247158e-06, 9.373069588036742e-06, 9.786377631826326e-06, 1.0199684766121209e-05, 1.0612992809910793e-05, 1.1026300853700377e-05, 1.143960798799526e-05, 1.1852916031784844e-05, 1.2266224075574428e-05, 1.267953120986931e-05, 1.3092839253658894e-05, 1.3506146387953777e-05, 1.3919454431743361e-05, 1.4332762475532945e-05, 1.474607051932253e-05, 1.5159377653617412e-05, 1.5572684787912294e-05, 1.598599374119658e-05, 1.6399300875491463e-05, 1.681260982877575e-05, 1.722591696307063e-05, 1.7639224097365513e-05, 1.80525330506498e-05, 1.8465840184944682e-05, 1.8879147319239564e-05, 1.929245627252385e-05, 1.9705763406818733e-05, 2.011907236010302e-05, 2.05323794943979e-05, 2.0945686628692783e-05, 2.135899558197707e-05, 2.1772302716271952e-05, 2.2185609850566834e-05, 2.2598916984861717e-05, 2.30122241191566e-05, 2.3425533072440885e-05, 2.3838840206735767e-05, 2.425214734103065e-05, 2.4665456294314936e-05, 2.5078763428609818e-05, 2.54920705629047e-05, 2.5905379516188987e-05]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 4.0, 0.0, 10.0, 0.0, 21.0, 0.0, 25.0, 0.0, 32.0, 0.0, 50.0, 0.0, 46.0, 0.0, 64.0, 0.0, 70.0, 0.0, 92.0, 113.0, 0.0, 99.0, 0.0, 82.0, 0.0, 88.0, 0.0, 66.0, 0.0, 44.0, 0.0, 43.0, 0.0, 18.0, 0.0, 17.0, 0.0, 16.0, 0.0, 4.0, 0.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0132789611816406e-06, -9.825453162193298e-07, -9.51811671257019e-07, -9.210780262947083e-07, -8.903443813323975e-07, -8.596107363700867e-07, -8.288770914077759e-07, -7.981434464454651e-07, -7.674098014831543e-07, -7.366761565208435e-07, -7.059425115585327e-07, -6.752088665962219e-07, -6.444752216339111e-07, -6.137415766716003e-07, -5.830079317092896e-07, -5.522742867469788e-07, -5.21540641784668e-07, -4.908069968223572e-07, -4.600733518600464e-07, -4.293397068977356e-07, -3.986060619354248e-07, -3.67872416973114e-07, -3.371387720108032e-07, -3.0640512704849243e-07, -2.7567148208618164e-07, -2.4493783712387085e-07, -2.1420419216156006e-07, -1.8347054719924927e-07, -1.5273690223693848e-07, -1.2200325727462769e-07, -9.12696123123169e-08, -6.05359673500061e-08, -2.9802322387695312e-08, 9.313225746154785e-10, 3.166496753692627e-08, 6.239861249923706e-08, 9.313225746154785e-08, 1.2386590242385864e-07, 1.5459954738616943e-07, 1.8533319234848022e-07, 2.1606683731079102e-07, 2.468004822731018e-07, 2.775341272354126e-07, 3.082677721977234e-07, 3.390014171600342e-07, 3.6973506212234497e-07, 4.0046870708465576e-07, 4.3120235204696655e-07, 4.6193599700927734e-07, 4.926696419715881e-07, 5.234032869338989e-07, 5.541369318962097e-07, 5.848705768585205e-07, 6.156042218208313e-07, 6.463378667831421e-07, 6.770715117454529e-07, 7.078051567077637e-07, 7.385388016700745e-07, 7.692724466323853e-07, 8.00006091594696e-07, 8.307397365570068e-07, 8.614733815193176e-07, 8.922070264816284e-07, 9.229406714439392e-07, 9.5367431640625e-07]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 11.0, 9.0, 4.0, 9.0, 12.0, 14.0, 15.0, 20.0, 22.0, 30.0, 23.0, 45.0, 34.0, 38.0, 41.0, 38.0, 39.0, 39.0, 42.0, 47.0, 36.0, 58.0, 55.0, 43.0, 45.0, 39.0, 22.0, 31.0, 28.0, 26.0, 14.0, 12.0, 18.0, 13.0, 7.0, 2.0, 9.0, 6.0, 2.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.55859375, -4.40673828125, -4.2548828125, -4.10302734375, -3.951171875, -3.79931640625, -3.6474609375, -3.49560546875, -3.34375, -3.19189453125, -3.0400390625, -2.88818359375, -2.736328125, -2.58447265625, -2.4326171875, -2.28076171875, -2.12890625, -1.97705078125, -1.8251953125, -1.67333984375, -1.521484375, -1.36962890625, -1.2177734375, -1.06591796875, -0.9140625, -0.76220703125, -0.6103515625, -0.45849609375, -0.306640625, -0.15478515625, -0.0029296875, 0.14892578125, 0.30078125, 0.45263671875, 0.6044921875, 0.75634765625, 0.908203125, 1.06005859375, 1.2119140625, 1.36376953125, 1.515625, 1.66748046875, 1.8193359375, 1.97119140625, 2.123046875, 2.27490234375, 2.4267578125, 2.57861328125, 2.73046875, 2.88232421875, 3.0341796875, 3.18603515625, 3.337890625, 3.48974609375, 3.6416015625, 3.79345703125, 3.9453125, 4.09716796875, 4.2490234375, 4.40087890625, 4.552734375, 4.70458984375, 4.8564453125, 5.00830078125, 5.16015625]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 7.0, 8.0, 18.0, 34.0, 27.0, 43.0, 59.0, 93.0, 137.0, 224.0, 274.0, 404.0, 631.0, 896.0, 1266.0, 2019.0, 3139.0, 4976.0, 8238.0, 13297.0, 22020.0, 37223.0, 63813.0, 110842.0, 188719.0, 225198.0, 151375.0, 86712.0, 50430.0, 29529.0, 17843.0, 10790.0, 6451.0, 4159.0, 2604.0, 1667.0, 1085.0, 706.0, 471.0, 329.0, 234.0, 176.0, 115.0, 83.0, 63.0, 36.0, 29.0, 19.0, 17.0, 5.0, 8.0, 5.0, 3.0, 3.0, 0.0, 5.0, 1.0, 2.0], "bins": [-4.5859375, -4.4393310546875, -4.292724609375, -4.1461181640625, -3.99951171875, -3.8529052734375, -3.706298828125, -3.5596923828125, -3.4130859375, -3.2664794921875, -3.119873046875, -2.9732666015625, -2.82666015625, -2.6800537109375, -2.533447265625, -2.3868408203125, -2.240234375, -2.0936279296875, -1.947021484375, -1.8004150390625, -1.65380859375, -1.5072021484375, -1.360595703125, -1.2139892578125, -1.0673828125, -0.9207763671875, -0.774169921875, -0.6275634765625, -0.48095703125, -0.3343505859375, -0.187744140625, -0.0411376953125, 0.10546875, 0.2520751953125, 0.398681640625, 0.5452880859375, 0.69189453125, 0.8385009765625, 0.985107421875, 1.1317138671875, 1.2783203125, 1.4249267578125, 1.571533203125, 1.7181396484375, 1.86474609375, 2.0113525390625, 2.157958984375, 2.3045654296875, 2.451171875, 2.5977783203125, 2.744384765625, 2.8909912109375, 3.03759765625, 3.1842041015625, 3.330810546875, 3.4774169921875, 3.6240234375, 3.7706298828125, 3.917236328125, 4.0638427734375, 4.21044921875, 4.3570556640625, 4.503662109375, 4.6502685546875, 4.796875]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 3.0, 4.0, 1.0, 4.0, 3.0, 4.0, 8.0, 9.0, 9.0, 9.0, 9.0, 12.0, 19.0, 22.0, 22.0, 17.0, 30.0, 32.0, 42.0, 27.0, 40.0, 67.0, 84.0, 129.0, 209.0, 1338.0, 219.0, 162.0, 89.0, 62.0, 51.0, 47.0, 37.0, 33.0, 34.0, 20.0, 17.0, 13.0, 20.0, 12.0, 19.0, 15.0, 13.0, 12.0, 6.0, 7.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.546875, -9.22607421875, -8.9052734375, -8.58447265625, -8.263671875, -7.94287109375, -7.6220703125, -7.30126953125, -6.98046875, -6.65966796875, -6.3388671875, -6.01806640625, -5.697265625, -5.37646484375, -5.0556640625, -4.73486328125, -4.4140625, -4.09326171875, -3.7724609375, -3.45166015625, -3.130859375, -2.81005859375, -2.4892578125, -2.16845703125, -1.84765625, -1.52685546875, -1.2060546875, -0.88525390625, -0.564453125, -0.24365234375, 0.0771484375, 0.39794921875, 0.71875, 1.03955078125, 1.3603515625, 1.68115234375, 2.001953125, 2.32275390625, 2.6435546875, 2.96435546875, 3.28515625, 3.60595703125, 3.9267578125, 4.24755859375, 4.568359375, 4.88916015625, 5.2099609375, 5.53076171875, 5.8515625, 6.17236328125, 6.4931640625, 6.81396484375, 7.134765625, 7.45556640625, 7.7763671875, 8.09716796875, 8.41796875, 8.73876953125, 9.0595703125, 9.38037109375, 9.701171875, 10.02197265625, 10.3427734375, 10.66357421875, 10.984375]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 2.0, 5.0, 3.0, 5.0, 7.0, 16.0, 13.0, 23.0, 17.0, 39.0, 38.0, 53.0, 97.0, 147.0, 269.0, 534.0, 1349.0, 22939.0, 2995740.0, 120322.0, 2483.0, 689.0, 358.0, 158.0, 112.0, 76.0, 44.0, 36.0, 32.0, 26.0, 18.0, 14.0, 8.0, 9.0, 3.0, 2.0, 2.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.9375, -26.962890625, -25.98828125, -25.013671875, -24.0390625, -23.064453125, -22.08984375, -21.115234375, -20.140625, -19.166015625, -18.19140625, -17.216796875, -16.2421875, -15.267578125, -14.29296875, -13.318359375, -12.34375, -11.369140625, -10.39453125, -9.419921875, -8.4453125, -7.470703125, -6.49609375, -5.521484375, -4.546875, -3.572265625, -2.59765625, -1.623046875, -0.6484375, 0.326171875, 1.30078125, 2.275390625, 3.25, 4.224609375, 5.19921875, 6.173828125, 7.1484375, 8.123046875, 9.09765625, 10.072265625, 11.046875, 12.021484375, 12.99609375, 13.970703125, 14.9453125, 15.919921875, 16.89453125, 17.869140625, 18.84375, 19.818359375, 20.79296875, 21.767578125, 22.7421875, 23.716796875, 24.69140625, 25.666015625, 26.640625, 27.615234375, 28.58984375, 29.564453125, 30.5390625, 31.513671875, 32.48828125, 33.462890625, 34.4375]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 8.0, 18.0, 64.0, 177.0, 258.0, 246.0, 151.0, 68.0, 18.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.480012893676758, -17.034095764160156, -14.588180541992188, -12.142264366149902, -9.696348190307617, -7.250432014465332, -4.804515838623047, -2.3585987091064453, 0.08731651306152344, 2.5332326889038086, 4.979148864746094, 7.425065040588379, 9.870981216430664, 12.31689739227295, 14.762813568115234, 17.208730697631836, 19.654645919799805, 22.100563049316406, 24.546478271484375, 26.992393493652344, 29.438310623168945, 31.884227752685547, 34.330142974853516, 36.77606201171875, 39.22197723388672, 41.66789245605469, 44.113807678222656, 46.55972671508789, 49.00564193725586, 51.45155715942383, 53.89747619628906, 56.34339141845703, 58.789306640625, 61.23522186279297, 63.68113708496094, 66.1270523071289, 68.57296752929688, 71.01889038085938, 73.46480560302734, 75.91072082519531, 78.35663604736328, 80.80255126953125, 83.24846649169922, 85.69438171386719, 88.14030456542969, 90.58621978759766, 93.03213500976562, 95.4780502319336, 97.92396545410156, 100.36988067626953, 102.8157958984375, 105.26171112060547, 107.70762634277344, 110.15354919433594, 112.5994644165039, 115.04537963867188, 117.49129486083984, 119.93721008300781, 122.38312530517578, 124.82904052734375, 127.27496337890625, 129.7208709716797, 132.1667938232422, 134.61270141601562, 137.05862426757812]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 5.0, 10.0, 10.0, 4.0, 9.0, 19.0, 24.0, 13.0, 19.0, 34.0, 25.0, 30.0, 21.0, 29.0, 32.0, 27.0, 49.0, 34.0, 47.0, 49.0, 36.0, 35.0, 34.0, 27.0, 33.0, 37.0, 30.0, 38.0, 36.0, 33.0, 21.0, 24.0, 28.0, 13.0, 10.0, 20.0, 12.0, 7.0, 8.0, 5.0, 4.0, 7.0, 1.0, 5.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-35.830047607421875, -34.75184631347656, -33.67364501953125, -32.59544372558594, -31.517240524291992, -30.43903923034668, -29.360836029052734, -28.282634735107422, -27.20443344116211, -26.126232147216797, -25.048030853271484, -23.96982765197754, -22.891626358032227, -21.813425064086914, -20.73522186279297, -19.657020568847656, -18.578819274902344, -17.50061798095703, -16.42241668701172, -15.344213485717773, -14.266012191772461, -13.187810897827148, -12.10960865020752, -11.03140640258789, -9.953205108642578, -8.875003814697266, -7.796801567077637, -6.718599796295166, -5.640398025512695, -4.562196254730225, -3.483994483947754, -2.405792713165283, -1.3275909423828125, -0.2493891716003418, 0.8288125991821289, 1.9070143699645996, 2.9852161407470703, 4.063417911529541, 5.141619682312012, 6.219821453094482, 7.298023223876953, 8.376224517822266, 9.454426765441895, 10.532629013061523, 11.610830307006836, 12.689031600952148, 13.767233848571777, 14.845436096191406, 15.923637390136719, 17.00183868408203, 18.080039978027344, 19.15824317932129, 20.2364444732666, 21.314645767211914, 22.39284896850586, 23.471050262451172, 24.549251556396484, 25.627452850341797, 26.70565414428711, 27.783857345581055, 28.862058639526367, 29.94025993347168, 31.018463134765625, 32.09666442871094, 33.17486572265625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 5.0, 5.0, 8.0, 4.0, 7.0, 9.0, 15.0, 11.0, 19.0, 19.0, 22.0, 28.0, 31.0, 36.0, 44.0, 33.0, 39.0, 48.0, 43.0, 42.0, 36.0, 47.0, 46.0, 52.0, 45.0, 42.0, 37.0, 37.0, 30.0, 26.0, 24.0, 20.0, 23.0, 16.0, 10.0, 9.0, 7.0, 11.0, 3.0, 4.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6640625, -4.51202392578125, -4.3599853515625, -4.20794677734375, -4.055908203125, -3.90386962890625, -3.7518310546875, -3.59979248046875, -3.44775390625, -3.29571533203125, -3.1436767578125, -2.99163818359375, -2.839599609375, -2.68756103515625, -2.5355224609375, -2.38348388671875, -2.2314453125, -2.07940673828125, -1.9273681640625, -1.77532958984375, -1.623291015625, -1.47125244140625, -1.3192138671875, -1.16717529296875, -1.01513671875, -0.86309814453125, -0.7110595703125, -0.55902099609375, -0.406982421875, -0.25494384765625, -0.1029052734375, 0.04913330078125, 0.201171875, 0.35321044921875, 0.5052490234375, 0.65728759765625, 0.809326171875, 0.96136474609375, 1.1134033203125, 1.26544189453125, 1.41748046875, 1.56951904296875, 1.7215576171875, 1.87359619140625, 2.025634765625, 2.17767333984375, 2.3297119140625, 2.48175048828125, 2.6337890625, 2.78582763671875, 2.9378662109375, 3.08990478515625, 3.241943359375, 3.39398193359375, 3.5460205078125, 3.69805908203125, 3.85009765625, 4.00213623046875, 4.1541748046875, 4.30621337890625, 4.458251953125, 4.61029052734375, 4.7623291015625, 4.91436767578125, 5.06640625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 2.0, 5.0, 7.0, 4.0, 9.0, 13.0, 15.0, 14.0, 22.0, 36.0, 48.0, 56.0, 89.0, 128.0, 196.0, 285.0, 450.0, 767.0, 1373.0, 2873.0, 6042.0, 15533.0, 54168.0, 422949.0, 2687621.0, 872569.0, 91348.0, 22022.0, 7962.0, 3534.0, 1656.0, 866.0, 552.0, 323.0, 223.0, 156.0, 95.0, 69.0, 52.0, 40.0, 31.0, 19.0, 19.0, 11.0, 11.0, 5.0, 5.0, 6.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3046875, -9.968505859375, -9.63232421875, -9.296142578125, -8.9599609375, -8.623779296875, -8.28759765625, -7.951416015625, -7.615234375, -7.279052734375, -6.94287109375, -6.606689453125, -6.2705078125, -5.934326171875, -5.59814453125, -5.261962890625, -4.92578125, -4.589599609375, -4.25341796875, -3.917236328125, -3.5810546875, -3.244873046875, -2.90869140625, -2.572509765625, -2.236328125, -1.900146484375, -1.56396484375, -1.227783203125, -0.8916015625, -0.555419921875, -0.21923828125, 0.116943359375, 0.453125, 0.789306640625, 1.12548828125, 1.461669921875, 1.7978515625, 2.134033203125, 2.47021484375, 2.806396484375, 3.142578125, 3.478759765625, 3.81494140625, 4.151123046875, 4.4873046875, 4.823486328125, 5.15966796875, 5.495849609375, 5.83203125, 6.168212890625, 6.50439453125, 6.840576171875, 7.1767578125, 7.512939453125, 7.84912109375, 8.185302734375, 8.521484375, 8.857666015625, 9.19384765625, 9.530029296875, 9.8662109375, 10.202392578125, 10.53857421875, 10.874755859375, 11.2109375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 9.0, 6.0, 14.0, 14.0, 22.0, 30.0, 35.0, 42.0, 66.0, 64.0, 110.0, 134.0, 192.0, 278.0, 337.0, 489.0, 530.0, 448.0, 303.0, 268.0, 159.0, 117.0, 104.0, 69.0, 55.0, 49.0, 40.0, 25.0, 16.0, 12.0, 6.0, 12.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.46875, -8.24114990234375, -8.0135498046875, -7.78594970703125, -7.558349609375, -7.33074951171875, -7.1031494140625, -6.87554931640625, -6.64794921875, -6.42034912109375, -6.1927490234375, -5.96514892578125, -5.737548828125, -5.50994873046875, -5.2823486328125, -5.05474853515625, -4.8271484375, -4.59954833984375, -4.3719482421875, -4.14434814453125, -3.916748046875, -3.68914794921875, -3.4615478515625, -3.23394775390625, -3.00634765625, -2.77874755859375, -2.5511474609375, -2.32354736328125, -2.095947265625, -1.86834716796875, -1.6407470703125, -1.41314697265625, -1.185546875, -0.95794677734375, -0.7303466796875, -0.50274658203125, -0.275146484375, -0.04754638671875, 0.1800537109375, 0.40765380859375, 0.63525390625, 0.86285400390625, 1.0904541015625, 1.31805419921875, 1.545654296875, 1.77325439453125, 2.0008544921875, 2.22845458984375, 2.4560546875, 2.68365478515625, 2.9112548828125, 3.13885498046875, 3.366455078125, 3.59405517578125, 3.8216552734375, 4.04925537109375, 4.27685546875, 4.50445556640625, 4.7320556640625, 4.95965576171875, 5.187255859375, 5.41485595703125, 5.6424560546875, 5.87005615234375, 6.09765625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 11.0, 10.0, 21.0, 31.0, 51.0, 64.0, 116.0, 197.0, 302.0, 536.0, 812.0, 1658.0, 3245.0, 7679.0, 21376.0, 77732.0, 408489.0, 2603189.0, 878950.0, 136713.0, 33311.0, 10853.0, 4352.0, 1979.0, 1060.0, 592.0, 359.0, 204.0, 125.0, 91.0, 66.0, 32.0, 24.0, 15.0, 10.0, 10.0, 5.0, 7.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.296875, -7.9859619140625, -7.675048828125, -7.3641357421875, -7.05322265625, -6.7423095703125, -6.431396484375, -6.1204833984375, -5.8095703125, -5.4986572265625, -5.187744140625, -4.8768310546875, -4.56591796875, -4.2550048828125, -3.944091796875, -3.6331787109375, -3.322265625, -3.0113525390625, -2.700439453125, -2.3895263671875, -2.07861328125, -1.7677001953125, -1.456787109375, -1.1458740234375, -0.8349609375, -0.5240478515625, -0.213134765625, 0.0977783203125, 0.40869140625, 0.7196044921875, 1.030517578125, 1.3414306640625, 1.65234375, 1.9632568359375, 2.274169921875, 2.5850830078125, 2.89599609375, 3.2069091796875, 3.517822265625, 3.8287353515625, 4.1396484375, 4.4505615234375, 4.761474609375, 5.0723876953125, 5.38330078125, 5.6942138671875, 6.005126953125, 6.3160400390625, 6.626953125, 6.9378662109375, 7.248779296875, 7.5596923828125, 7.87060546875, 8.1815185546875, 8.492431640625, 8.8033447265625, 9.1142578125, 9.4251708984375, 9.736083984375, 10.0469970703125, 10.35791015625, 10.6688232421875, 10.979736328125, 11.2906494140625, 11.6015625]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 28.0, 277.0, 544.0, 151.0, 15.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-268.76300048828125, -263.0848693847656, -257.4067077636719, -251.72857666015625, -246.05043029785156, -240.37228393554688, -234.69415283203125, -229.01600646972656, -223.33786010742188, -217.6597137451172, -211.98158264160156, -206.30343627929688, -200.6252899169922, -194.9471435546875, -189.26901245117188, -183.5908660888672, -177.91273498535156, -172.23458862304688, -166.55645751953125, -160.87831115722656, -155.20016479492188, -149.52203369140625, -143.84388732910156, -138.16574096679688, -132.48760986328125, -126.8094711303711, -121.1313247680664, -115.45318603515625, -109.77503967285156, -104.0969009399414, -98.41876220703125, -92.74061584472656, -87.06248474121094, -81.38434600830078, -75.7061996459961, -70.02806091308594, -64.34991455078125, -58.671775817871094, -52.99363708496094, -47.315494537353516, -41.637351989746094, -35.95920944213867, -30.281068801879883, -24.602928161621094, -18.924785614013672, -13.24664306640625, -7.568504333496094, -1.8903617858886719, 3.78778076171875, 9.465922355651855, 15.144063949584961, 20.82220458984375, 26.500347137451172, 32.178489685058594, 37.85662841796875, 43.53477096557617, 49.212913513183594, 54.891056060791016, 60.56919860839844, 66.2473373413086, 71.92547607421875, 77.60362243652344, 83.2817611694336, 88.95989990234375, 94.63804626464844]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 8.0, 4.0, 2.0, 4.0, 8.0, 14.0, 14.0, 16.0, 13.0, 19.0, 23.0, 23.0, 21.0, 23.0, 40.0, 31.0, 29.0, 47.0, 39.0, 42.0, 41.0, 50.0, 45.0, 31.0, 31.0, 37.0, 44.0, 37.0, 29.0, 21.0, 27.0, 27.0, 28.0, 31.0, 15.0, 23.0, 11.0, 17.0, 9.0, 4.0, 2.0, 10.0, 5.0, 5.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.735641479492188, -26.862028121948242, -25.98841667175293, -25.114803314208984, -24.241191864013672, -23.367578506469727, -22.49396514892578, -21.62035369873047, -20.746740341186523, -19.873126983642578, -18.999515533447266, -18.12590217590332, -17.252288818359375, -16.378677368164062, -15.505064010620117, -14.631451606750488, -13.75783920288086, -12.88422679901123, -12.010614395141602, -11.137001037597656, -10.263388633728027, -9.389776229858398, -8.516162872314453, -7.642550468444824, -6.768938064575195, -5.895325660705566, -5.021712779998779, -4.148099899291992, -3.2744874954223633, -2.4008750915527344, -1.5272622108459473, -0.6536493301391602, 0.21996307373046875, 1.0935757160186768, 1.9671883583068848, 2.8408010005950928, 3.714413642883301, 4.58802604675293, 5.461638927459717, 6.335251808166504, 7.208864212036133, 8.082476615905762, 8.95608901977539, 9.829702377319336, 10.703314781188965, 11.576927185058594, 12.450540542602539, 13.324152946472168, 14.197765350341797, 15.071377754211426, 15.944990158081055, 16.818603515625, 17.692214965820312, 18.565828323364258, 19.439441680908203, 20.313053131103516, 21.18666648864746, 22.060279846191406, 22.93389129638672, 23.807504653930664, 24.68111801147461, 25.554729461669922, 26.428342819213867, 27.301956176757812, 28.175567626953125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 5.0, 5.0, 2.0, 7.0, 8.0, 15.0, 8.0, 11.0, 15.0, 19.0, 19.0, 28.0, 27.0, 27.0, 40.0, 38.0, 36.0, 41.0, 48.0, 42.0, 40.0, 52.0, 37.0, 35.0, 56.0, 41.0, 48.0, 39.0, 33.0, 26.0, 33.0, 15.0, 22.0, 9.0, 15.0, 16.0, 8.0, 13.0, 11.0, 6.0, 6.0, 2.0, 5.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.484375, -4.34210205078125, -4.1998291015625, -4.05755615234375, -3.915283203125, -3.77301025390625, -3.6307373046875, -3.48846435546875, -3.34619140625, -3.20391845703125, -3.0616455078125, -2.91937255859375, -2.777099609375, -2.63482666015625, -2.4925537109375, -2.35028076171875, -2.2080078125, -2.06573486328125, -1.9234619140625, -1.78118896484375, -1.638916015625, -1.49664306640625, -1.3543701171875, -1.21209716796875, -1.06982421875, -0.92755126953125, -0.7852783203125, -0.64300537109375, -0.500732421875, -0.35845947265625, -0.2161865234375, -0.07391357421875, 0.068359375, 0.21063232421875, 0.3529052734375, 0.49517822265625, 0.637451171875, 0.77972412109375, 0.9219970703125, 1.06427001953125, 1.20654296875, 1.34881591796875, 1.4910888671875, 1.63336181640625, 1.775634765625, 1.91790771484375, 2.0601806640625, 2.20245361328125, 2.3447265625, 2.48699951171875, 2.6292724609375, 2.77154541015625, 2.913818359375, 3.05609130859375, 3.1983642578125, 3.34063720703125, 3.48291015625, 3.62518310546875, 3.7674560546875, 3.90972900390625, 4.052001953125, 4.19427490234375, 4.3365478515625, 4.47882080078125, 4.62109375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 9.0, 4.0, 12.0, 24.0, 18.0, 42.0, 50.0, 93.0, 124.0, 181.0, 305.0, 429.0, 669.0, 1059.0, 1634.0, 2546.0, 4067.0, 6642.0, 10913.0, 17853.0, 30575.0, 52344.0, 94638.0, 171384.0, 259714.0, 170164.0, 93918.0, 52434.0, 30262.0, 17849.0, 10698.0, 6593.0, 4056.0, 2627.0, 1605.0, 1034.0, 682.0, 464.0, 264.0, 167.0, 144.0, 97.0, 51.0, 31.0, 35.0, 15.0, 9.0, 12.0, 12.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.032318115234375, -0.031291961669921875, -0.03026580810546875, -0.029239654541015625, -0.0282135009765625, -0.027187347412109375, -0.02616119384765625, -0.025135040283203125, -0.02410888671875, -0.023082733154296875, -0.02205657958984375, -0.021030426025390625, -0.0200042724609375, -0.018978118896484375, -0.01795196533203125, -0.016925811767578125, -0.015899658203125, -0.014873504638671875, -0.01384735107421875, -0.012821197509765625, -0.0117950439453125, -0.010768890380859375, -0.00974273681640625, -0.008716583251953125, -0.0076904296875, -0.006664276123046875, -0.00563812255859375, -0.004611968994140625, -0.0035858154296875, -0.002559661865234375, -0.00153350830078125, -0.000507354736328125, 0.000518798828125, 0.001544952392578125, 0.00257110595703125, 0.003597259521484375, 0.0046234130859375, 0.005649566650390625, 0.00667572021484375, 0.007701873779296875, 0.00872802734375, 0.009754180908203125, 0.01078033447265625, 0.011806488037109375, 0.0128326416015625, 0.013858795166015625, 0.01488494873046875, 0.015911102294921875, 0.016937255859375, 0.017963409423828125, 0.01898956298828125, 0.020015716552734375, 0.0210418701171875, 0.022068023681640625, 0.02309417724609375, 0.024120330810546875, 0.025146484375, 0.026172637939453125, 0.02719879150390625, 0.028224945068359375, 0.0292510986328125, 0.030277252197265625, 0.03130340576171875, 0.032329559326171875, 0.033355712890625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 13.0, 15.0, 7.0, 17.0, 16.0, 13.0, 20.0, 20.0, 31.0, 33.0, 28.0, 32.0, 44.0, 30.0, 42.0, 36.0, 49.0, 43.0, 1074.0, 48.0, 50.0, 41.0, 39.0, 32.0, 30.0, 36.0, 30.0, 19.0, 27.0, 23.0, 14.0, 15.0, 16.0, 10.0, 10.0, 5.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.76953125, -3.6590576171875, -3.548583984375, -3.4381103515625, -3.32763671875, -3.2171630859375, -3.106689453125, -2.9962158203125, -2.8857421875, -2.7752685546875, -2.664794921875, -2.5543212890625, -2.44384765625, -2.3333740234375, -2.222900390625, -2.1124267578125, -2.001953125, -1.8914794921875, -1.781005859375, -1.6705322265625, -1.56005859375, -1.4495849609375, -1.339111328125, -1.2286376953125, -1.1181640625, -1.0076904296875, -0.897216796875, -0.7867431640625, -0.67626953125, -0.5657958984375, -0.455322265625, -0.3448486328125, -0.234375, -0.1239013671875, -0.013427734375, 0.0970458984375, 0.20751953125, 0.3179931640625, 0.428466796875, 0.5389404296875, 0.6494140625, 0.7598876953125, 0.870361328125, 0.9808349609375, 1.09130859375, 1.2017822265625, 1.312255859375, 1.4227294921875, 1.533203125, 1.6436767578125, 1.754150390625, 1.8646240234375, 1.97509765625, 2.0855712890625, 2.196044921875, 2.3065185546875, 2.4169921875, 2.5274658203125, 2.637939453125, 2.7484130859375, 2.85888671875, 2.9693603515625, 3.079833984375, 3.1903076171875, 3.30078125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 8.0, 11.0, 11.0, 30.0, 30.0, 34.0, 55.0, 63.0, 109.0, 142.0, 219.0, 321.0, 437.0, 691.0, 971.0, 1473.0, 2144.0, 3105.0, 4834.0, 7389.0, 11251.0, 17136.0, 26850.0, 41948.0, 65198.0, 105121.0, 171724.0, 1258321.0, 139409.0, 85390.0, 54248.0, 34534.0, 22130.0, 14152.0, 9211.0, 6086.0, 3923.0, 2737.0, 1808.0, 1218.0, 830.0, 543.0, 413.0, 265.0, 191.0, 120.0, 90.0, 60.0, 34.0, 39.0, 29.0, 20.0, 12.0, 7.0, 7.0, 3.0, 4.0, 2.0], "bins": [-0.01258087158203125, -0.012202858924865723, -0.011824846267700195, -0.011446833610534668, -0.01106882095336914, -0.010690808296203613, -0.010312795639038086, -0.009934782981872559, -0.009556770324707031, -0.009178757667541504, -0.008800745010375977, -0.00842273235321045, -0.008044719696044922, -0.0076667070388793945, -0.007288694381713867, -0.00691068172454834, -0.0065326690673828125, -0.006154656410217285, -0.005776643753051758, -0.0053986310958862305, -0.005020618438720703, -0.004642605781555176, -0.0042645931243896484, -0.003886580467224121, -0.0035085678100585938, -0.0031305551528930664, -0.002752542495727539, -0.0023745298385620117, -0.0019965171813964844, -0.001618504524230957, -0.0012404918670654297, -0.0008624792098999023, -0.000484466552734375, -0.00010645389556884766, 0.0002715587615966797, 0.000649571418762207, 0.0010275840759277344, 0.0014055967330932617, 0.001783609390258789, 0.0021616220474243164, 0.0025396347045898438, 0.002917647361755371, 0.0032956600189208984, 0.0036736726760864258, 0.004051685333251953, 0.0044296979904174805, 0.004807710647583008, 0.005185723304748535, 0.0055637359619140625, 0.00594174861907959, 0.006319761276245117, 0.0066977739334106445, 0.007075786590576172, 0.007453799247741699, 0.007831811904907227, 0.008209824562072754, 0.008587837219238281, 0.008965849876403809, 0.009343862533569336, 0.009721875190734863, 0.01009988784790039, 0.010477900505065918, 0.010855913162231445, 0.011233925819396973, 0.0116119384765625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 12.0, 5.0, 4.0, 10.0, 8.0, 15.0, 14.0, 20.0, 27.0, 46.0, 61.0, 92.0, 126.0, 124.0, 130.0, 85.0, 60.0, 31.0, 27.0, 24.0, 15.0, 16.0, 10.0, 7.0, 8.0, 1.0, 8.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.4437904357910156e-06, -2.3832544684410095e-06, -2.3227185010910034e-06, -2.2621825337409973e-06, -2.201646566390991e-06, -2.141110599040985e-06, -2.080574631690979e-06, -2.020038664340973e-06, -1.959502696990967e-06, -1.8989667296409607e-06, -1.8384307622909546e-06, -1.7778947949409485e-06, -1.7173588275909424e-06, -1.6568228602409363e-06, -1.5962868928909302e-06, -1.535750925540924e-06, -1.475214958190918e-06, -1.4146789908409119e-06, -1.3541430234909058e-06, -1.2936070561408997e-06, -1.2330710887908936e-06, -1.1725351214408875e-06, -1.1119991540908813e-06, -1.0514631867408752e-06, -9.909272193908691e-07, -9.30391252040863e-07, -8.698552846908569e-07, -8.093193173408508e-07, -7.487833499908447e-07, -6.882473826408386e-07, -6.277114152908325e-07, -5.671754479408264e-07, -5.066394805908203e-07, -4.461035132408142e-07, -3.855675458908081e-07, -3.25031578540802e-07, -2.644956111907959e-07, -2.039596438407898e-07, -1.434236764907837e-07, -8.288770914077759e-08, -2.2351741790771484e-08, 3.818422555923462e-08, 9.872019290924072e-08, 1.5925616025924683e-07, 2.1979212760925293e-07, 2.8032809495925903e-07, 3.4086406230926514e-07, 4.0140002965927124e-07, 4.6193599700927734e-07, 5.224719643592834e-07, 5.830079317092896e-07, 6.435438990592957e-07, 7.040798664093018e-07, 7.646158337593079e-07, 8.25151801109314e-07, 8.856877684593201e-07, 9.462237358093262e-07, 1.0067597031593323e-06, 1.0672956705093384e-06, 1.1278316378593445e-06, 1.1883676052093506e-06, 1.2489035725593567e-06, 1.3094395399093628e-06, 1.369975507259369e-06, 1.430511474609375e-06]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 8.0, 3.0, 2.0, 9.0, 5.0, 8.0, 10.0, 9.0, 17.0, 26.0, 25.0, 23.0, 47.0, 72.0, 163.0, 259.0, 1212.0, 122033.0, 920486.0, 3236.0, 401.0, 191.0, 104.0, 46.0, 47.0, 23.0, 19.0, 16.0, 16.0, 12.0, 7.0, 7.0, 10.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8967857360839844e-05, -2.7816742658615112e-05, -2.666562795639038e-05, -2.551451325416565e-05, -2.4363398551940918e-05, -2.3212283849716187e-05, -2.2061169147491455e-05, -2.0910054445266724e-05, -1.9758939743041992e-05, -1.860782504081726e-05, -1.745671033859253e-05, -1.6305595636367798e-05, -1.5154480934143066e-05, -1.4003366231918335e-05, -1.2852251529693604e-05, -1.1701136827468872e-05, -1.055002212524414e-05, -9.39890742301941e-06, -8.247792720794678e-06, -7.096678018569946e-06, -5.945563316345215e-06, -4.794448614120483e-06, -3.643333911895752e-06, -2.4922192096710205e-06, -1.341104507446289e-06, -1.8998980522155762e-07, 9.611248970031738e-07, 2.1122395992279053e-06, 3.2633543014526367e-06, 4.414469003677368e-06, 5.5655837059021e-06, 6.716698408126831e-06, 7.867813110351562e-06, 9.018927812576294e-06, 1.0170042514801025e-05, 1.1321157217025757e-05, 1.2472271919250488e-05, 1.362338662147522e-05, 1.4774501323699951e-05, 1.5925616025924683e-05, 1.7076730728149414e-05, 1.8227845430374146e-05, 1.9378960132598877e-05, 2.053007483482361e-05, 2.168118953704834e-05, 2.283230423927307e-05, 2.3983418941497803e-05, 2.5134533643722534e-05, 2.6285648345947266e-05, 2.7436763048171997e-05, 2.858787775039673e-05, 2.973899245262146e-05, 3.089010715484619e-05, 3.204122185707092e-05, 3.3192336559295654e-05, 3.4343451261520386e-05, 3.549456596374512e-05, 3.664568066596985e-05, 3.779679536819458e-05, 3.894791007041931e-05, 4.009902477264404e-05, 4.1250139474868774e-05, 4.2401254177093506e-05, 4.355236887931824e-05, 4.470348358154297e-05]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 10.0, 2.0, 12.0, 12.0, 12.0, 25.0, 46.0, 66.0, 140.0, 157.0, 174.0, 130.0, 89.0, 46.0, 39.0, 16.0, 13.0, 9.0, 3.0, 3.0, 4.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.810659556322207e-07, -6.328792210297252e-07, -5.846925432706485e-07, -5.365058086681529e-07, -4.883190740656573e-07, -4.401323678848712e-07, -3.9194566170408507e-07, -3.437589271015895e-07, -2.955722209208034e-07, -2.4738551474001724e-07, -1.9919878013752168e-07, -1.5101207395673555e-07, -1.028253535650947e-07, -5.4638633173453854e-08, -6.4519269926677225e-09, 4.173480760982784e-08, 8.992151379061397e-08, 1.3810823418225482e-07, 1.8629495457389567e-07, 2.344816607546818e-07, 2.8266839535717736e-07, 3.308551015379635e-07, 3.790418077187496e-07, 4.272285423212452e-07, 4.754152485020313e-07, 5.236019546828174e-07, 5.71788689285313e-07, 6.199753670443897e-07, 6.681621016468853e-07, 7.163488362493808e-07, 7.645355708518764e-07, 8.12722305454372e-07, 8.609089263700298e-07, 9.090956609725254e-07, 9.57282395575021e-07, 1.0054691301775165e-06, 1.0536557510931743e-06, 1.1018424856956699e-06, 1.1500292202981655e-06, 1.198215954900661e-06, 1.2464026895031566e-06, 1.2945894241056521e-06, 1.3427761587081477e-06, 1.3909627796238055e-06, 1.4391495142263011e-06, 1.4873362488287967e-06, 1.5355229834312922e-06, 1.5837097180337878e-06, 1.6318963389494456e-06, 1.6800830735519412e-06, 1.7282698081544368e-06, 1.7764564290700946e-06, 1.8246431636725902e-06, 1.8728298982750857e-06, 1.9210165191907436e-06, 1.969203367480077e-06, 2.01739021576941e-06, 2.065576836685068e-06, 2.1137636849744013e-06, 2.161950305890059e-06, 2.2101371541793924e-06, 2.2583237750950502e-06, 2.306510396010708e-06, 2.3546972443000413e-06, 2.402883865215699e-06]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 0.0, 16.0, 0.0, 27.0, 0.0, 0.0, 33.0, 0.0, 54.0, 0.0, 0.0, 85.0, 0.0, 110.0, 0.0, 106.0, 0.0, 0.0, 113.0, 0.0, 129.0, 0.0, 101.0, 0.0, 0.0, 73.0, 0.0, 66.0, 0.0, 0.0, 36.0, 0.0, 28.0, 0.0, 22.0, 0.0, 0.0, 5.0, 0.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.344650268554688e-07, -8.093193173408508e-07, -7.841736078262329e-07, -7.59027898311615e-07, -7.338821887969971e-07, -7.087364792823792e-07, -6.835907697677612e-07, -6.584450602531433e-07, -6.332993507385254e-07, -6.081536412239075e-07, -5.830079317092896e-07, -5.578622221946716e-07, -5.327165126800537e-07, -5.075708031654358e-07, -4.824250936508179e-07, -4.5727938413619995e-07, -4.3213367462158203e-07, -4.069879651069641e-07, -3.818422555923462e-07, -3.5669654607772827e-07, -3.3155083656311035e-07, -3.0640512704849243e-07, -2.812594175338745e-07, -2.561137080192566e-07, -2.3096799850463867e-07, -2.0582228899002075e-07, -1.8067657947540283e-07, -1.555308699607849e-07, -1.30385160446167e-07, -1.0523945093154907e-07, -8.009374141693115e-08, -5.494803190231323e-08, -2.9802322387695312e-08, -4.6566128730773926e-09, 2.0489096641540527e-08, 4.563480615615845e-08, 7.078051567077637e-08, 9.592622518539429e-08, 1.210719347000122e-07, 1.4621764421463013e-07, 1.7136335372924805e-07, 1.9650906324386597e-07, 2.2165477275848389e-07, 2.468004822731018e-07, 2.7194619178771973e-07, 2.9709190130233765e-07, 3.2223761081695557e-07, 3.473833203315735e-07, 3.725290298461914e-07, 3.976747393608093e-07, 4.2282044887542725e-07, 4.4796615839004517e-07, 4.731118679046631e-07, 4.98257577419281e-07, 5.234032869338989e-07, 5.485489964485168e-07, 5.736947059631348e-07, 5.988404154777527e-07, 6.239861249923706e-07, 6.491318345069885e-07, 6.742775440216064e-07, 6.994232535362244e-07, 7.245689630508423e-07, 7.497146725654602e-07, 7.748603820800781e-07]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 5.0, 5.0, 2.0, 7.0, 8.0, 15.0, 8.0, 11.0, 15.0, 19.0, 19.0, 28.0, 27.0, 27.0, 40.0, 38.0, 36.0, 41.0, 48.0, 42.0, 40.0, 52.0, 37.0, 35.0, 56.0, 41.0, 48.0, 39.0, 33.0, 26.0, 33.0, 15.0, 22.0, 9.0, 15.0, 16.0, 8.0, 13.0, 11.0, 6.0, 6.0, 2.0, 5.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.484375, -4.34210205078125, -4.1998291015625, -4.05755615234375, -3.915283203125, -3.77301025390625, -3.6307373046875, -3.48846435546875, -3.34619140625, -3.20391845703125, -3.0616455078125, -2.91937255859375, -2.777099609375, -2.63482666015625, -2.4925537109375, -2.35028076171875, -2.2080078125, -2.06573486328125, -1.9234619140625, -1.78118896484375, -1.638916015625, -1.49664306640625, -1.3543701171875, -1.21209716796875, -1.06982421875, -0.92755126953125, -0.7852783203125, -0.64300537109375, -0.500732421875, -0.35845947265625, -0.2161865234375, -0.07391357421875, 0.068359375, 0.21063232421875, 0.3529052734375, 0.49517822265625, 0.637451171875, 0.77972412109375, 0.9219970703125, 1.06427001953125, 1.20654296875, 1.34881591796875, 1.4910888671875, 1.63336181640625, 1.775634765625, 1.91790771484375, 2.0601806640625, 2.20245361328125, 2.3447265625, 2.48699951171875, 2.6292724609375, 2.77154541015625, 2.913818359375, 3.05609130859375, 3.1983642578125, 3.34063720703125, 3.48291015625, 3.62518310546875, 3.7674560546875, 3.90972900390625, 4.052001953125, 4.19427490234375, 4.3365478515625, 4.47882080078125, 4.62109375]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 2.0, 4.0, 10.0, 12.0, 25.0, 27.0, 50.0, 49.0, 98.0, 146.0, 215.0, 324.0, 542.0, 941.0, 1764.0, 3423.0, 6588.0, 14489.0, 33050.0, 87130.0, 286521.0, 409163.0, 123255.0, 44583.0, 18635.0, 8366.0, 4078.0, 2143.0, 1117.0, 655.0, 416.0, 261.0, 140.0, 114.0, 73.0, 40.0, 30.0, 21.0, 22.0, 13.0, 5.0, 8.0, 6.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-8.0859375, -7.8623046875, -7.638671875, -7.4150390625, -7.19140625, -6.9677734375, -6.744140625, -6.5205078125, -6.296875, -6.0732421875, -5.849609375, -5.6259765625, -5.40234375, -5.1787109375, -4.955078125, -4.7314453125, -4.5078125, -4.2841796875, -4.060546875, -3.8369140625, -3.61328125, -3.3896484375, -3.166015625, -2.9423828125, -2.71875, -2.4951171875, -2.271484375, -2.0478515625, -1.82421875, -1.6005859375, -1.376953125, -1.1533203125, -0.9296875, -0.7060546875, -0.482421875, -0.2587890625, -0.03515625, 0.1884765625, 0.412109375, 0.6357421875, 0.859375, 1.0830078125, 1.306640625, 1.5302734375, 1.75390625, 1.9775390625, 2.201171875, 2.4248046875, 2.6484375, 2.8720703125, 3.095703125, 3.3193359375, 3.54296875, 3.7666015625, 3.990234375, 4.2138671875, 4.4375, 4.6611328125, 4.884765625, 5.1083984375, 5.33203125, 5.5556640625, 5.779296875, 6.0029296875, 6.2265625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 3.0, 5.0, 6.0, 6.0, 6.0, 4.0, 8.0, 9.0, 11.0, 15.0, 20.0, 24.0, 19.0, 40.0, 39.0, 33.0, 48.0, 66.0, 97.0, 172.0, 245.0, 1440.0, 173.0, 131.0, 90.0, 51.0, 38.0, 45.0, 25.0, 30.0, 21.0, 27.0, 19.0, 15.0, 7.0, 17.0, 16.0, 11.0, 4.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-12.125, -11.7813720703125, -11.437744140625, -11.0941162109375, -10.75048828125, -10.4068603515625, -10.063232421875, -9.7196044921875, -9.3759765625, -9.0323486328125, -8.688720703125, -8.3450927734375, -8.00146484375, -7.6578369140625, -7.314208984375, -6.9705810546875, -6.626953125, -6.2833251953125, -5.939697265625, -5.5960693359375, -5.25244140625, -4.9088134765625, -4.565185546875, -4.2215576171875, -3.8779296875, -3.5343017578125, -3.190673828125, -2.8470458984375, -2.50341796875, -2.1597900390625, -1.816162109375, -1.4725341796875, -1.12890625, -0.7852783203125, -0.441650390625, -0.0980224609375, 0.24560546875, 0.5892333984375, 0.932861328125, 1.2764892578125, 1.6201171875, 1.9637451171875, 2.307373046875, 2.6510009765625, 2.99462890625, 3.3382568359375, 3.681884765625, 4.0255126953125, 4.369140625, 4.7127685546875, 5.056396484375, 5.4000244140625, 5.74365234375, 6.0872802734375, 6.430908203125, 6.7745361328125, 7.1181640625, 7.4617919921875, 7.805419921875, 8.1490478515625, 8.49267578125, 8.8363037109375, 9.179931640625, 9.5235595703125, 9.8671875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 4.0, 6.0, 10.0, 10.0, 10.0, 23.0, 27.0, 25.0, 31.0, 58.0, 77.0, 105.0, 199.0, 290.0, 476.0, 911.0, 5800.0, 1557229.0, 1572268.0, 5916.0, 932.0, 474.0, 265.0, 167.0, 98.0, 80.0, 47.0, 38.0, 23.0, 24.0, 15.0, 14.0, 8.0, 8.0, 9.0, 8.0, 4.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.515625, -24.742431640625, -23.96923828125, -23.196044921875, -22.4228515625, -21.649658203125, -20.87646484375, -20.103271484375, -19.330078125, -18.556884765625, -17.78369140625, -17.010498046875, -16.2373046875, -15.464111328125, -14.69091796875, -13.917724609375, -13.14453125, -12.371337890625, -11.59814453125, -10.824951171875, -10.0517578125, -9.278564453125, -8.50537109375, -7.732177734375, -6.958984375, -6.185791015625, -5.41259765625, -4.639404296875, -3.8662109375, -3.093017578125, -2.31982421875, -1.546630859375, -0.7734375, -0.000244140625, 0.77294921875, 1.546142578125, 2.3193359375, 3.092529296875, 3.86572265625, 4.638916015625, 5.412109375, 6.185302734375, 6.95849609375, 7.731689453125, 8.5048828125, 9.278076171875, 10.05126953125, 10.824462890625, 11.59765625, 12.370849609375, 13.14404296875, 13.917236328125, 14.6904296875, 15.463623046875, 16.23681640625, 17.010009765625, 17.783203125, 18.556396484375, 19.32958984375, 20.102783203125, 20.8759765625, 21.649169921875, 22.42236328125, 23.195556640625, 23.96875]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 14.0, 67.0, 218.0, 367.0, 253.0, 80.0, 10.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.10261917114258, -44.062416076660156, -41.022216796875, -37.98201370239258, -34.941810607910156, -31.901607513427734, -28.861406326293945, -25.821205139160156, -22.781002044677734, -19.740798950195312, -16.700597763061523, -13.660395622253418, -10.620193481445312, -7.579991340637207, -4.539789199829102, -1.4995880126953125, 1.5406150817871094, 4.580817222595215, 7.62101936340332, 10.661221504211426, 13.701423645019531, 16.741626739501953, 19.781827926635742, 22.82202911376953, 25.862232208251953, 28.902435302734375, 31.942636489868164, 34.98283767700195, 38.023040771484375, 41.0632438659668, 44.10344696044922, 47.143646240234375, 50.18385314941406, 53.224056243896484, 56.264259338378906, 59.30445861816406, 62.344661712646484, 65.3848648071289, 68.42506408691406, 71.46527099609375, 74.5054702758789, 77.54566955566406, 80.58587646484375, 83.6260757446289, 86.66627502441406, 89.70648193359375, 92.7466812133789, 95.78688049316406, 98.82708740234375, 101.8672866821289, 104.9074935913086, 107.94769287109375, 110.98789978027344, 114.0280990600586, 117.06829833984375, 120.10850524902344, 123.1487045288086, 126.18890380859375, 129.22911071777344, 132.26931762695312, 135.30950927734375, 138.34971618652344, 141.38992309570312, 144.43011474609375, 147.47032165527344]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 3.0, 8.0, 10.0, 5.0, 11.0, 7.0, 12.0, 17.0, 20.0, 15.0, 17.0, 32.0, 28.0, 20.0, 33.0, 34.0, 36.0, 44.0, 43.0, 36.0, 39.0, 49.0, 44.0, 44.0, 38.0, 40.0, 37.0, 39.0, 28.0, 28.0, 25.0, 20.0, 26.0, 18.0, 23.0, 10.0, 13.0, 14.0, 11.0, 8.0, 7.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-34.33778381347656, -33.19041442871094, -32.04304885864258, -30.895681381225586, -29.748313903808594, -28.6009464263916, -27.45357894897461, -26.306209564208984, -25.158843994140625, -24.011476516723633, -22.86410903930664, -21.71674156188965, -20.569374084472656, -19.422006607055664, -18.274639129638672, -17.127269744873047, -15.979902267456055, -14.832534790039062, -13.68516731262207, -12.537799835205078, -11.390432357788086, -10.243064880371094, -9.095696449279785, -7.948328971862793, -6.800961494445801, -5.653594017028809, -4.506226539611816, -3.358858585357666, -2.211491107940674, -1.0641236305236816, 0.08324432373046875, 1.230611801147461, 2.377979278564453, 3.5253467559814453, 4.6727142333984375, 5.820082187652588, 6.96744966506958, 8.114816665649414, 9.262185096740723, 10.409552574157715, 11.556920051574707, 12.7042875289917, 13.851655006408691, 14.9990234375, 16.146390914916992, 17.293758392333984, 18.441125869750977, 19.58849334716797, 20.73586082458496, 21.883228302001953, 23.030595779418945, 24.177963256835938, 25.32533073425293, 26.472698211669922, 27.620067596435547, 28.767433166503906, 29.91480255126953, 31.062170028686523, 32.209537506103516, 33.35690689086914, 34.5042724609375, 35.651641845703125, 36.799007415771484, 37.94637680053711, 39.09374237060547]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 6.0, 10.0, 4.0, 8.0, 14.0, 10.0, 17.0, 24.0, 20.0, 32.0, 37.0, 39.0, 19.0, 38.0, 30.0, 49.0, 42.0, 46.0, 45.0, 44.0, 51.0, 41.0, 39.0, 40.0, 42.0, 34.0, 30.0, 28.0, 32.0, 18.0, 19.0, 16.0, 16.0, 10.0, 14.0, 9.0, 7.0, 4.0, 6.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.9765625, -4.83026123046875, -4.6839599609375, -4.53765869140625, -4.391357421875, -4.24505615234375, -4.0987548828125, -3.95245361328125, -3.80615234375, -3.65985107421875, -3.5135498046875, -3.36724853515625, -3.220947265625, -3.07464599609375, -2.9283447265625, -2.78204345703125, -2.6357421875, -2.48944091796875, -2.3431396484375, -2.19683837890625, -2.050537109375, -1.90423583984375, -1.7579345703125, -1.61163330078125, -1.46533203125, -1.31903076171875, -1.1727294921875, -1.02642822265625, -0.880126953125, -0.73382568359375, -0.5875244140625, -0.44122314453125, -0.294921875, -0.14862060546875, -0.0023193359375, 0.14398193359375, 0.290283203125, 0.43658447265625, 0.5828857421875, 0.72918701171875, 0.87548828125, 1.02178955078125, 1.1680908203125, 1.31439208984375, 1.460693359375, 1.60699462890625, 1.7532958984375, 1.89959716796875, 2.0458984375, 2.19219970703125, 2.3385009765625, 2.48480224609375, 2.631103515625, 2.77740478515625, 2.9237060546875, 3.07000732421875, 3.21630859375, 3.36260986328125, 3.5089111328125, 3.65521240234375, 3.801513671875, 3.94781494140625, 4.0941162109375, 4.24041748046875, 4.38671875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 5.0, 5.0, 10.0, 12.0, 21.0, 30.0, 31.0, 60.0, 69.0, 124.0, 166.0, 242.0, 324.0, 479.0, 739.0, 1085.0, 1644.0, 2691.0, 4313.0, 7365.0, 13253.0, 27867.0, 99820.0, 619629.0, 2252770.0, 931467.0, 155070.0, 36962.0, 15763.0, 8626.0, 4911.0, 3020.0, 1919.0, 1235.0, 809.0, 565.0, 368.0, 235.0, 188.0, 117.0, 83.0, 59.0, 52.0, 25.0, 18.0, 17.0, 10.0, 7.0, 5.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.859375, -6.6197509765625, -6.380126953125, -6.1405029296875, -5.90087890625, -5.6612548828125, -5.421630859375, -5.1820068359375, -4.9423828125, -4.7027587890625, -4.463134765625, -4.2235107421875, -3.98388671875, -3.7442626953125, -3.504638671875, -3.2650146484375, -3.025390625, -2.7857666015625, -2.546142578125, -2.3065185546875, -2.06689453125, -1.8272705078125, -1.587646484375, -1.3480224609375, -1.1083984375, -0.8687744140625, -0.629150390625, -0.3895263671875, -0.14990234375, 0.0897216796875, 0.329345703125, 0.5689697265625, 0.80859375, 1.0482177734375, 1.287841796875, 1.5274658203125, 1.76708984375, 2.0067138671875, 2.246337890625, 2.4859619140625, 2.7255859375, 2.9652099609375, 3.204833984375, 3.4444580078125, 3.68408203125, 3.9237060546875, 4.163330078125, 4.4029541015625, 4.642578125, 4.8822021484375, 5.121826171875, 5.3614501953125, 5.60107421875, 5.8406982421875, 6.080322265625, 6.3199462890625, 6.5595703125, 6.7991943359375, 7.038818359375, 7.2784423828125, 7.51806640625, 7.7576904296875, 7.997314453125, 8.2369384765625, 8.4765625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 9.0, 5.0, 10.0, 11.0, 10.0, 28.0, 20.0, 38.0, 52.0, 66.0, 124.0, 151.0, 215.0, 322.0, 377.0, 561.0, 520.0, 436.0, 316.0, 236.0, 165.0, 104.0, 92.0, 72.0, 26.0, 30.0, 20.0, 15.0, 7.0, 6.0, 9.0, 10.0, 4.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-7.95703125, -7.7576904296875, -7.558349609375, -7.3590087890625, -7.15966796875, -6.9603271484375, -6.760986328125, -6.5616455078125, -6.3623046875, -6.1629638671875, -5.963623046875, -5.7642822265625, -5.56494140625, -5.3656005859375, -5.166259765625, -4.9669189453125, -4.767578125, -4.5682373046875, -4.368896484375, -4.1695556640625, -3.97021484375, -3.7708740234375, -3.571533203125, -3.3721923828125, -3.1728515625, -2.9735107421875, -2.774169921875, -2.5748291015625, -2.37548828125, -2.1761474609375, -1.976806640625, -1.7774658203125, -1.578125, -1.3787841796875, -1.179443359375, -0.9801025390625, -0.78076171875, -0.5814208984375, -0.382080078125, -0.1827392578125, 0.0166015625, 0.2159423828125, 0.415283203125, 0.6146240234375, 0.81396484375, 1.0133056640625, 1.212646484375, 1.4119873046875, 1.611328125, 1.8106689453125, 2.010009765625, 2.2093505859375, 2.40869140625, 2.6080322265625, 2.807373046875, 3.0067138671875, 3.2060546875, 3.4053955078125, 3.604736328125, 3.8040771484375, 4.00341796875, 4.2027587890625, 4.402099609375, 4.6014404296875, 4.80078125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 8.0, 7.0, 10.0, 17.0, 30.0, 25.0, 52.0, 82.0, 197.0, 355.0, 734.0, 1851.0, 5511.0, 28089.0, 379659.0, 3532465.0, 217866.0, 20124.0, 4423.0, 1486.0, 623.0, 292.0, 131.0, 79.0, 58.0, 31.0, 15.0, 12.0, 18.0, 6.0, 5.0, 6.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.1875, -10.747314453125, -10.30712890625, -9.866943359375, -9.4267578125, -8.986572265625, -8.54638671875, -8.106201171875, -7.666015625, -7.225830078125, -6.78564453125, -6.345458984375, -5.9052734375, -5.465087890625, -5.02490234375, -4.584716796875, -4.14453125, -3.704345703125, -3.26416015625, -2.823974609375, -2.3837890625, -1.943603515625, -1.50341796875, -1.063232421875, -0.623046875, -0.182861328125, 0.25732421875, 0.697509765625, 1.1376953125, 1.577880859375, 2.01806640625, 2.458251953125, 2.8984375, 3.338623046875, 3.77880859375, 4.218994140625, 4.6591796875, 5.099365234375, 5.53955078125, 5.979736328125, 6.419921875, 6.860107421875, 7.30029296875, 7.740478515625, 8.1806640625, 8.620849609375, 9.06103515625, 9.501220703125, 9.94140625, 10.381591796875, 10.82177734375, 11.261962890625, 11.7021484375, 12.142333984375, 12.58251953125, 13.022705078125, 13.462890625, 13.903076171875, 14.34326171875, 14.783447265625, 15.2236328125, 15.663818359375, 16.10400390625, 16.544189453125, 16.984375]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 10.0, 111.0, 558.0, 301.0, 38.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.09686279296875, -135.38832092285156, -129.6797637939453, -123.97122192382812, -118.26268005371094, -112.55413055419922, -106.8455810546875, -101.13703918457031, -95.4284896850586, -89.71994018554688, -84.01139831542969, -78.30284881591797, -72.59429931640625, -66.88575744628906, -61.177207946777344, -55.46866226196289, -49.76011657714844, -44.051570892333984, -38.34302520751953, -32.63447570800781, -26.92593002319336, -21.217384338378906, -15.508834838867188, -9.800289154052734, -4.091743469238281, 1.6168031692504883, 7.325349807739258, 13.033897399902344, 18.742443084716797, 24.45098876953125, 30.15953826904297, 35.86808395385742, 41.576629638671875, 47.28517532348633, 52.99372100830078, 58.7022705078125, 64.41081237792969, 70.1193618774414, 75.82791137695312, 81.53645324707031, 87.24500274658203, 92.95355224609375, 98.66209411621094, 104.37064361572266, 110.07919311523438, 115.78773498535156, 121.49628448486328, 127.204833984375, 132.9133758544922, 138.62191772460938, 144.33047485351562, 150.0390167236328, 155.74755859375, 161.45611572265625, 167.16465759277344, 172.87319946289062, 178.58175659179688, 184.29029846191406, 189.9988555908203, 195.7073974609375, 201.4159393310547, 207.12448120117188, 212.83303833007812, 218.5415802001953, 224.2501220703125]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 4.0, 2.0, 0.0, 2.0, 6.0, 5.0, 4.0, 7.0, 16.0, 15.0, 13.0, 11.0, 18.0, 19.0, 22.0, 36.0, 30.0, 21.0, 23.0, 23.0, 32.0, 37.0, 37.0, 41.0, 33.0, 42.0, 37.0, 37.0, 38.0, 36.0, 43.0, 23.0, 36.0, 31.0, 31.0, 24.0, 25.0, 18.0, 15.0, 16.0, 19.0, 13.0, 12.0, 9.0, 9.0, 12.0, 7.0, 5.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.692291259765625, -20.019268035888672, -19.34624481201172, -18.673221588134766, -18.000200271606445, -17.327177047729492, -16.65415382385254, -15.981130599975586, -15.30810832977295, -14.635085105895996, -13.96206283569336, -13.289039611816406, -12.616016387939453, -11.942994117736816, -11.269970893859863, -10.596948623657227, -9.923925399780273, -9.25090217590332, -8.577879905700684, -7.9048566818237305, -7.2318339347839355, -6.558811187744141, -5.8857879638671875, -5.212765216827393, -4.539742469787598, -3.8667197227478027, -3.1936967372894287, -2.5206737518310547, -1.8476510047912598, -1.1746282577514648, -0.5016050338745117, 0.1714177131652832, 0.8444404602050781, 1.5174633264541626, 2.190486192703247, 2.863509178161621, 3.536531925201416, 4.209554672241211, 4.882577896118164, 5.555600643157959, 6.228623390197754, 6.901646137237549, 7.574668884277344, 8.247692108154297, 8.92071533203125, 9.593737602233887, 10.26676082611084, 10.939783096313477, 11.61280632019043, 12.285829544067383, 12.95885181427002, 13.631875038146973, 14.30489730834961, 14.977920532226562, 15.650943756103516, 16.32396697998047, 16.996990203857422, 17.670013427734375, 18.343036651611328, 19.01605987548828, 19.6890811920166, 20.362104415893555, 21.035127639770508, 21.70815086364746, 22.38117218017578]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 7.0, 8.0, 4.0, 5.0, 16.0, 17.0, 13.0, 19.0, 14.0, 30.0, 38.0, 30.0, 30.0, 38.0, 32.0, 48.0, 35.0, 47.0, 44.0, 51.0, 58.0, 35.0, 31.0, 55.0, 32.0, 30.0, 37.0, 30.0, 26.0, 28.0, 17.0, 18.0, 22.0, 17.0, 9.0, 10.0, 4.0, 6.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5078125, -4.3638916015625, -4.219970703125, -4.0760498046875, -3.93212890625, -3.7882080078125, -3.644287109375, -3.5003662109375, -3.3564453125, -3.2125244140625, -3.068603515625, -2.9246826171875, -2.78076171875, -2.6368408203125, -2.492919921875, -2.3489990234375, -2.205078125, -2.0611572265625, -1.917236328125, -1.7733154296875, -1.62939453125, -1.4854736328125, -1.341552734375, -1.1976318359375, -1.0537109375, -0.9097900390625, -0.765869140625, -0.6219482421875, -0.47802734375, -0.3341064453125, -0.190185546875, -0.0462646484375, 0.09765625, 0.2415771484375, 0.385498046875, 0.5294189453125, 0.67333984375, 0.8172607421875, 0.961181640625, 1.1051025390625, 1.2490234375, 1.3929443359375, 1.536865234375, 1.6807861328125, 1.82470703125, 1.9686279296875, 2.112548828125, 2.2564697265625, 2.400390625, 2.5443115234375, 2.688232421875, 2.8321533203125, 2.97607421875, 3.1199951171875, 3.263916015625, 3.4078369140625, 3.5517578125, 3.6956787109375, 3.839599609375, 3.9835205078125, 4.12744140625, 4.2713623046875, 4.415283203125, 4.5592041015625, 4.703125]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 8.0, 16.0, 25.0, 27.0, 45.0, 66.0, 109.0, 155.0, 221.0, 340.0, 514.0, 798.0, 1220.0, 1931.0, 2817.0, 4399.0, 6983.0, 10900.0, 16688.0, 26005.0, 42043.0, 71067.0, 123548.0, 228950.0, 215311.0, 116715.0, 67490.0, 39912.0, 25046.0, 16214.0, 10247.0, 6624.0, 4256.0, 2783.0, 1713.0, 1172.0, 742.0, 509.0, 312.0, 206.0, 155.0, 88.0, 57.0, 40.0, 24.0, 24.0, 16.0, 13.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.039093017578125, -0.03786945343017578, -0.03664588928222656, -0.035422325134277344, -0.034198760986328125, -0.032975196838378906, -0.03175163269042969, -0.03052806854248047, -0.02930450439453125, -0.02808094024658203, -0.026857376098632812, -0.025633811950683594, -0.024410247802734375, -0.023186683654785156, -0.021963119506835938, -0.02073955535888672, -0.0195159912109375, -0.01829242706298828, -0.017068862915039062, -0.015845298767089844, -0.014621734619140625, -0.013398170471191406, -0.012174606323242188, -0.010951042175292969, -0.00972747802734375, -0.008503913879394531, -0.0072803497314453125, -0.006056785583496094, -0.004833221435546875, -0.0036096572875976562, -0.0023860931396484375, -0.0011625289916992188, 6.103515625e-05, 0.0012845993041992188, 0.0025081634521484375, 0.0037317276000976562, 0.004955291748046875, 0.006178855895996094, 0.0074024200439453125, 0.008625984191894531, 0.00984954833984375, 0.011073112487792969, 0.012296676635742188, 0.013520240783691406, 0.014743804931640625, 0.015967369079589844, 0.017190933227539062, 0.01841449737548828, 0.0196380615234375, 0.02086162567138672, 0.022085189819335938, 0.023308753967285156, 0.024532318115234375, 0.025755882263183594, 0.026979446411132812, 0.02820301055908203, 0.02942657470703125, 0.03065013885498047, 0.03187370300292969, 0.033097267150878906, 0.034320831298828125, 0.035544395446777344, 0.03676795959472656, 0.03799152374267578, 0.039215087890625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 7.0, 11.0, 11.0, 10.0, 16.0, 25.0, 18.0, 26.0, 31.0, 40.0, 40.0, 27.0, 49.0, 54.0, 41.0, 55.0, 1073.0, 47.0, 47.0, 48.0, 51.0, 39.0, 42.0, 35.0, 21.0, 33.0, 27.0, 18.0, 21.0, 14.0, 14.0, 9.0, 2.0, 9.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8125, -3.68292236328125, -3.5533447265625, -3.42376708984375, -3.294189453125, -3.16461181640625, -3.0350341796875, -2.90545654296875, -2.77587890625, -2.64630126953125, -2.5167236328125, -2.38714599609375, -2.257568359375, -2.12799072265625, -1.9984130859375, -1.86883544921875, -1.7392578125, -1.60968017578125, -1.4801025390625, -1.35052490234375, -1.220947265625, -1.09136962890625, -0.9617919921875, -0.83221435546875, -0.70263671875, -0.57305908203125, -0.4434814453125, -0.31390380859375, -0.184326171875, -0.05474853515625, 0.0748291015625, 0.20440673828125, 0.333984375, 0.46356201171875, 0.5931396484375, 0.72271728515625, 0.852294921875, 0.98187255859375, 1.1114501953125, 1.24102783203125, 1.37060546875, 1.50018310546875, 1.6297607421875, 1.75933837890625, 1.888916015625, 2.01849365234375, 2.1480712890625, 2.27764892578125, 2.4072265625, 2.53680419921875, 2.6663818359375, 2.79595947265625, 2.925537109375, 3.05511474609375, 3.1846923828125, 3.31427001953125, 3.44384765625, 3.57342529296875, 3.7030029296875, 3.83258056640625, 3.962158203125, 4.09173583984375, 4.2213134765625, 4.35089111328125, 4.48046875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 7.0, 15.0, 20.0, 26.0, 47.0, 58.0, 81.0, 117.0, 200.0, 317.0, 470.0, 651.0, 1062.0, 1704.0, 2637.0, 4221.0, 6925.0, 11275.0, 18662.0, 31243.0, 53491.0, 93087.0, 171965.0, 1303113.0, 169600.0, 93388.0, 53159.0, 30965.0, 18692.0, 11332.0, 6931.0, 4172.0, 2703.0, 1675.0, 1055.0, 709.0, 474.0, 286.0, 178.0, 136.0, 92.0, 55.0, 47.0, 15.0, 22.0, 13.0, 16.0, 9.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0142669677734375, -0.013799190521240234, -0.013331413269042969, -0.012863636016845703, -0.012395858764648438, -0.011928081512451172, -0.011460304260253906, -0.01099252700805664, -0.010524749755859375, -0.01005697250366211, -0.009589195251464844, -0.009121417999267578, -0.008653640747070312, -0.008185863494873047, -0.007718086242675781, -0.007250308990478516, -0.00678253173828125, -0.006314754486083984, -0.005846977233886719, -0.005379199981689453, -0.0049114227294921875, -0.004443645477294922, -0.003975868225097656, -0.0035080909729003906, -0.003040313720703125, -0.0025725364685058594, -0.0021047592163085938, -0.0016369819641113281, -0.0011692047119140625, -0.0007014274597167969, -0.00023365020751953125, 0.00023412704467773438, 0.000701904296875, 0.0011696815490722656, 0.0016374588012695312, 0.002105236053466797, 0.0025730133056640625, 0.003040790557861328, 0.0035085678100585938, 0.003976345062255859, 0.004444122314453125, 0.004911899566650391, 0.005379676818847656, 0.005847454071044922, 0.0063152313232421875, 0.006783008575439453, 0.007250785827636719, 0.007718563079833984, 0.00818634033203125, 0.008654117584228516, 0.009121894836425781, 0.009589672088623047, 0.010057449340820312, 0.010525226593017578, 0.010993003845214844, 0.01146078109741211, 0.011928558349609375, 0.01239633560180664, 0.012864112854003906, 0.013331890106201172, 0.013799667358398438, 0.014267444610595703, 0.014735221862792969, 0.015202999114990234, 0.0156707763671875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 7.0, 12.0, 0.0, 16.0, 25.0, 37.0, 48.0, 0.0, 65.0, 89.0, 121.0, 141.0, 0.0, 123.0, 88.0, 72.0, 52.0, 0.0, 28.0, 28.0, 20.0, 8.0, 0.0, 7.0, 8.0, 1.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6093254089355469e-06, -1.5618279576301575e-06, -1.514330506324768e-06, -1.4668330550193787e-06, -1.4193356037139893e-06, -1.3718381524085999e-06, -1.3243407011032104e-06, -1.276843249797821e-06, -1.2293457984924316e-06, -1.1818483471870422e-06, -1.1343508958816528e-06, -1.0868534445762634e-06, -1.039355993270874e-06, -9.918585419654846e-07, -9.443610906600952e-07, -8.968636393547058e-07, -8.493661880493164e-07, -8.01868736743927e-07, -7.543712854385376e-07, -7.068738341331482e-07, -6.593763828277588e-07, -6.118789315223694e-07, -5.6438148021698e-07, -5.168840289115906e-07, -4.6938657760620117e-07, -4.2188912630081177e-07, -3.7439167499542236e-07, -3.2689422369003296e-07, -2.7939677238464355e-07, -2.3189932107925415e-07, -1.8440186977386475e-07, -1.3690441846847534e-07, -8.940696716308594e-08, -4.190951585769653e-08, 5.587935447692871e-09, 5.3085386753082275e-08, 1.0058283805847168e-07, 1.4808028936386108e-07, 1.955777406692505e-07, 2.430751919746399e-07, 2.905726432800293e-07, 3.380700945854187e-07, 3.855675458908081e-07, 4.330649971961975e-07, 4.805624485015869e-07, 5.280598998069763e-07, 5.755573511123657e-07, 6.230548024177551e-07, 6.705522537231445e-07, 7.180497050285339e-07, 7.655471563339233e-07, 8.130446076393127e-07, 8.605420589447021e-07, 9.080395102500916e-07, 9.55536961555481e-07, 1.0030344128608704e-06, 1.0505318641662598e-06, 1.0980293154716492e-06, 1.1455267667770386e-06, 1.193024218082428e-06, 1.2405216693878174e-06, 1.2880191206932068e-06, 1.3355165719985962e-06, 1.3830140233039856e-06, 1.430511474609375e-06]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 4.0, 2.0, 5.0, 4.0, 4.0, 7.0, 10.0, 8.0, 14.0, 14.0, 28.0, 23.0, 61.0, 58.0, 70.0, 125.0, 273.0, 590.0, 2436.0, 9894.0, 73665.0, 703596.0, 227558.0, 23214.0, 4693.0, 1298.0, 387.0, 179.0, 83.0, 69.0, 49.0, 28.0, 24.0, 18.0, 18.0, 12.0, 10.0, 4.0, 7.0, 4.0, 5.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8596649169921875e-05, -1.797173172235489e-05, -1.7346814274787903e-05, -1.6721896827220917e-05, -1.609697937965393e-05, -1.5472061932086945e-05, -1.4847144484519958e-05, -1.4222227036952972e-05, -1.3597309589385986e-05, -1.2972392141819e-05, -1.2347474694252014e-05, -1.1722557246685028e-05, -1.1097639799118042e-05, -1.0472722351551056e-05, -9.84780490398407e-06, -9.222887456417084e-06, -8.597970008850098e-06, -7.973052561283112e-06, -7.3481351137161255e-06, -6.723217666149139e-06, -6.098300218582153e-06, -5.473382771015167e-06, -4.848465323448181e-06, -4.223547875881195e-06, -3.598630428314209e-06, -2.973712980747223e-06, -2.348795533180237e-06, -1.7238780856132507e-06, -1.0989606380462646e-06, -4.7404319047927856e-07, 1.5087425708770752e-07, 7.757917046546936e-07, 1.4007091522216797e-06, 2.0256265997886658e-06, 2.650544047355652e-06, 3.275461494922638e-06, 3.900378942489624e-06, 4.52529639005661e-06, 5.150213837623596e-06, 5.775131285190582e-06, 6.400048732757568e-06, 7.0249661803245544e-06, 7.64988362789154e-06, 8.274801075458527e-06, 8.899718523025513e-06, 9.524635970592499e-06, 1.0149553418159485e-05, 1.0774470865726471e-05, 1.1399388313293457e-05, 1.2024305760860443e-05, 1.264922320842743e-05, 1.3274140655994415e-05, 1.3899058103561401e-05, 1.4523975551128387e-05, 1.5148892998695374e-05, 1.577381044626236e-05, 1.6398727893829346e-05, 1.7023645341396332e-05, 1.7648562788963318e-05, 1.8273480236530304e-05, 1.889839768409729e-05, 1.9523315131664276e-05, 2.0148232579231262e-05, 2.0773150026798248e-05, 2.1398067474365234e-05]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 14.0, 39.0, 88.0, 229.0, 358.0, 170.0, 64.0, 28.0, 11.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.162233825714793e-06, -8.003089533303864e-06, -7.843946150387637e-06, -7.684801857976709e-06, -7.525658475060482e-06, -7.366514182649553e-06, -7.207370344985975e-06, -7.048226507322397e-06, -6.889082669658819e-06, -6.729938831995241e-06, -6.5707949943316635e-06, -6.411651156668086e-06, -6.252506864257157e-06, -6.093363026593579e-06, -5.934219188930001e-06, -5.775075351266423e-06, -5.615931513602845e-06, -5.4567876759392675e-06, -5.29764383827569e-06, -5.138500000612112e-06, -4.979356162948534e-06, -4.820211870537605e-06, -4.661068032874027e-06, -4.501924195210449e-06, -4.3427803575468715e-06, -4.183636519883294e-06, -4.024492682219716e-06, -3.865348844556138e-06, -3.7062047795188846e-06, -3.5470609418553067e-06, -3.3879168768180534e-06, -3.2287730391544756e-06, -3.0696289741172222e-06, -2.9104851364536444e-06, -2.751341071416391e-06, -2.592197233752813e-06, -2.4330533960892353e-06, -2.2739095584256575e-06, -2.1147657207620796e-06, -1.9556216557248263e-06, -1.7964778180612484e-06, -1.6373339803976705e-06, -1.478190029047255e-06, -1.3190460776968393e-06, -1.1599022400332615e-06, -1.0007584023696836e-06, -8.41614451019268e-07, -6.824704996688524e-07, -5.233266620052746e-07, -3.641827674982778e-07, -2.050388729912811e-07, -4.5894978484284366e-08, 1.1324891602271236e-07, 2.723928105297091e-07, 4.315367050367058e-07, 5.906806563871214e-07, 7.498244940506993e-07, 9.08968388557696e-07, 1.0681122830646927e-06, 1.2272562344151083e-06, 1.3864000720786862e-06, 1.545543909742264e-06, 1.7046878610926797e-06, 1.8638318124430953e-06, 2.022975650106673e-06]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 12.0, 0.0, 0.0, 13.0, 0.0, 0.0, 23.0, 0.0, 0.0, 47.0, 0.0, 0.0, 63.0, 0.0, 0.0, 72.0, 0.0, 0.0, 109.0, 0.0, 0.0, 117.0, 0.0, 0.0, 119.0, 0.0, 0.0, 119.0, 0.0, 0.0, 103.0, 0.0, 0.0, 72.0, 0.0, 0.0, 59.0, 0.0, 0.0, 40.0, 0.0, 0.0, 18.0, 0.0, 0.0, 16.0, 0.0, 0.0, 10.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0], "bins": [-6.556510925292969e-07, -6.360933184623718e-07, -6.165355443954468e-07, -5.969777703285217e-07, -5.774199962615967e-07, -5.578622221946716e-07, -5.383044481277466e-07, -5.187466740608215e-07, -4.991888999938965e-07, -4.796311259269714e-07, -4.600733518600464e-07, -4.4051557779312134e-07, -4.209578037261963e-07, -4.0140002965927124e-07, -3.818422555923462e-07, -3.6228448152542114e-07, -3.427267074584961e-07, -3.2316893339157104e-07, -3.03611159324646e-07, -2.8405338525772095e-07, -2.644956111907959e-07, -2.4493783712387085e-07, -2.253800630569458e-07, -2.0582228899002075e-07, -1.862645149230957e-07, -1.6670674085617065e-07, -1.471489667892456e-07, -1.2759119272232056e-07, -1.0803341865539551e-07, -8.847564458847046e-08, -6.891787052154541e-08, -4.936009645462036e-08, -2.9802322387695312e-08, -1.0244548320770264e-08, 9.313225746154785e-09, 2.8870999813079834e-08, 4.842877388000488e-08, 6.798654794692993e-08, 8.754432201385498e-08, 1.0710209608078003e-07, 1.2665987014770508e-07, 1.4621764421463013e-07, 1.6577541828155518e-07, 1.8533319234848022e-07, 2.0489096641540527e-07, 2.2444874048233032e-07, 2.4400651454925537e-07, 2.635642886161804e-07, 2.8312206268310547e-07, 3.026798367500305e-07, 3.2223761081695557e-07, 3.417953848838806e-07, 3.6135315895080566e-07, 3.809109330177307e-07, 4.0046870708465576e-07, 4.200264811515808e-07, 4.3958425521850586e-07, 4.591420292854309e-07, 4.78699803352356e-07, 4.98257577419281e-07, 5.178153514862061e-07, 5.373731255531311e-07, 5.569308996200562e-07, 5.764886736869812e-07, 5.960464477539062e-07]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 7.0, 8.0, 4.0, 5.0, 16.0, 17.0, 13.0, 19.0, 14.0, 30.0, 38.0, 30.0, 30.0, 38.0, 32.0, 48.0, 35.0, 47.0, 44.0, 51.0, 58.0, 35.0, 31.0, 55.0, 32.0, 30.0, 37.0, 30.0, 26.0, 28.0, 17.0, 18.0, 22.0, 17.0, 9.0, 10.0, 4.0, 6.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5078125, -4.3638916015625, -4.219970703125, -4.0760498046875, -3.93212890625, -3.7882080078125, -3.644287109375, -3.5003662109375, -3.3564453125, -3.2125244140625, -3.068603515625, -2.9246826171875, -2.78076171875, -2.6368408203125, -2.492919921875, -2.3489990234375, -2.205078125, -2.0611572265625, -1.917236328125, -1.7733154296875, -1.62939453125, -1.4854736328125, -1.341552734375, -1.1976318359375, -1.0537109375, -0.9097900390625, -0.765869140625, -0.6219482421875, -0.47802734375, -0.3341064453125, -0.190185546875, -0.0462646484375, 0.09765625, 0.2415771484375, 0.385498046875, 0.5294189453125, 0.67333984375, 0.8172607421875, 0.961181640625, 1.1051025390625, 1.2490234375, 1.3929443359375, 1.536865234375, 1.6807861328125, 1.82470703125, 1.9686279296875, 2.112548828125, 2.2564697265625, 2.400390625, 2.5443115234375, 2.688232421875, 2.8321533203125, 2.97607421875, 3.1199951171875, 3.263916015625, 3.4078369140625, 3.5517578125, 3.6956787109375, 3.839599609375, 3.9835205078125, 4.12744140625, 4.2713623046875, 4.415283203125, 4.5592041015625, 4.703125]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 7.0, 5.0, 7.0, 13.0, 15.0, 10.0, 20.0, 37.0, 47.0, 62.0, 117.0, 259.0, 398.0, 715.0, 1421.0, 2816.0, 5787.0, 12820.0, 32617.0, 100479.0, 311801.0, 376171.0, 131219.0, 42131.0, 15696.0, 6855.0, 3318.0, 1749.0, 828.0, 461.0, 258.0, 149.0, 71.0, 64.0, 39.0, 26.0, 26.0, 8.0, 9.0, 9.0, 8.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9453125, -4.786376953125, -4.62744140625, -4.468505859375, -4.3095703125, -4.150634765625, -3.99169921875, -3.832763671875, -3.673828125, -3.514892578125, -3.35595703125, -3.197021484375, -3.0380859375, -2.879150390625, -2.72021484375, -2.561279296875, -2.40234375, -2.243408203125, -2.08447265625, -1.925537109375, -1.7666015625, -1.607666015625, -1.44873046875, -1.289794921875, -1.130859375, -0.971923828125, -0.81298828125, -0.654052734375, -0.4951171875, -0.336181640625, -0.17724609375, -0.018310546875, 0.140625, 0.299560546875, 0.45849609375, 0.617431640625, 0.7763671875, 0.935302734375, 1.09423828125, 1.253173828125, 1.412109375, 1.571044921875, 1.72998046875, 1.888916015625, 2.0478515625, 2.206787109375, 2.36572265625, 2.524658203125, 2.68359375, 2.842529296875, 3.00146484375, 3.160400390625, 3.3193359375, 3.478271484375, 3.63720703125, 3.796142578125, 3.955078125, 4.114013671875, 4.27294921875, 4.431884765625, 4.5908203125, 4.749755859375, 4.90869140625, 5.067626953125, 5.2265625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 14.0, 14.0, 14.0, 18.0, 21.0, 24.0, 39.0, 38.0, 41.0, 59.0, 83.0, 126.0, 281.0, 1595.0, 198.0, 106.0, 67.0, 47.0, 65.0, 39.0, 32.0, 28.0, 22.0, 17.0, 18.0, 13.0, 10.0, 2.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.84375, -16.392822265625, -15.94189453125, -15.490966796875, -15.0400390625, -14.589111328125, -14.13818359375, -13.687255859375, -13.236328125, -12.785400390625, -12.33447265625, -11.883544921875, -11.4326171875, -10.981689453125, -10.53076171875, -10.079833984375, -9.62890625, -9.177978515625, -8.72705078125, -8.276123046875, -7.8251953125, -7.374267578125, -6.92333984375, -6.472412109375, -6.021484375, -5.570556640625, -5.11962890625, -4.668701171875, -4.2177734375, -3.766845703125, -3.31591796875, -2.864990234375, -2.4140625, -1.963134765625, -1.51220703125, -1.061279296875, -0.6103515625, -0.159423828125, 0.29150390625, 0.742431640625, 1.193359375, 1.644287109375, 2.09521484375, 2.546142578125, 2.9970703125, 3.447998046875, 3.89892578125, 4.349853515625, 4.80078125, 5.251708984375, 5.70263671875, 6.153564453125, 6.6044921875, 7.055419921875, 7.50634765625, 7.957275390625, 8.408203125, 8.859130859375, 9.31005859375, 9.760986328125, 10.2119140625, 10.662841796875, 11.11376953125, 11.564697265625, 12.015625]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 8.0, 7.0, 5.0, 15.0, 12.0, 20.0, 30.0, 45.0, 63.0, 69.0, 105.0, 158.0, 272.0, 560.0, 2842.0, 66301.0, 3049824.0, 22439.0, 1809.0, 434.0, 200.0, 137.0, 102.0, 46.0, 62.0, 43.0, 24.0, 21.0, 11.0, 8.0, 19.0, 6.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.140625, -16.490966796875, -15.84130859375, -15.191650390625, -14.5419921875, -13.892333984375, -13.24267578125, -12.593017578125, -11.943359375, -11.293701171875, -10.64404296875, -9.994384765625, -9.3447265625, -8.695068359375, -8.04541015625, -7.395751953125, -6.74609375, -6.096435546875, -5.44677734375, -4.797119140625, -4.1474609375, -3.497802734375, -2.84814453125, -2.198486328125, -1.548828125, -0.899169921875, -0.24951171875, 0.400146484375, 1.0498046875, 1.699462890625, 2.34912109375, 2.998779296875, 3.6484375, 4.298095703125, 4.94775390625, 5.597412109375, 6.2470703125, 6.896728515625, 7.54638671875, 8.196044921875, 8.845703125, 9.495361328125, 10.14501953125, 10.794677734375, 11.4443359375, 12.093994140625, 12.74365234375, 13.393310546875, 14.04296875, 14.692626953125, 15.34228515625, 15.991943359375, 16.6416015625, 17.291259765625, 17.94091796875, 18.590576171875, 19.240234375, 19.889892578125, 20.53955078125, 21.189208984375, 21.8388671875, 22.488525390625, 23.13818359375, 23.787841796875, 24.4375]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 18.0, 153.0, 471.0, 316.0, 49.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.64859771728516, -63.4387092590332, -60.228816986083984, -57.01892852783203, -53.80903625488281, -50.59914779663086, -47.389259338378906, -44.17936706542969, -40.969478607177734, -37.75959014892578, -34.54969787597656, -31.33980941772461, -28.129919052124023, -24.920028686523438, -21.710140228271484, -18.5002498626709, -15.290359497070312, -12.080469131469727, -8.870579719543457, -5.6606903076171875, -2.4507999420166016, 0.7590904235839844, 3.9689788818359375, 7.178869247436523, 10.38875961303711, 13.598649978637695, 16.80854034423828, 20.018428802490234, 23.22831916809082, 26.438209533691406, 29.64809799194336, 32.85798645019531, 36.06787109375, 39.27775955200195, 42.48765182495117, 45.697540283203125, 48.907432556152344, 52.1173210144043, 55.32720947265625, 58.53710174560547, 61.74699020385742, 64.95687866210938, 68.1667709350586, 71.37666320800781, 74.5865478515625, 77.79644012451172, 81.00633239746094, 84.21621704101562, 87.42610931396484, 90.63600158691406, 93.84588623046875, 97.05577850341797, 100.26567077636719, 103.47555541992188, 106.6854476928711, 109.89533996582031, 113.105224609375, 116.31511688232422, 119.5250015258789, 122.73489379882812, 125.94478607177734, 129.15467834472656, 132.36456298828125, 135.57444763183594, 138.7843475341797]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 7.0, 3.0, 3.0, 9.0, 9.0, 13.0, 11.0, 12.0, 11.0, 19.0, 19.0, 24.0, 23.0, 24.0, 25.0, 27.0, 44.0, 39.0, 36.0, 49.0, 52.0, 35.0, 43.0, 43.0, 47.0, 28.0, 38.0, 41.0, 29.0, 34.0, 34.0, 24.0, 16.0, 13.0, 11.0, 26.0, 12.0, 16.0, 10.0, 12.0, 2.0, 8.0, 9.0, 6.0, 1.0, 7.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-29.55046844482422, -28.6372127532959, -27.723957061767578, -26.81070327758789, -25.89744758605957, -24.98419189453125, -24.07093620300293, -23.15768051147461, -22.24442481994629, -21.33116912841797, -20.41791343688965, -19.504657745361328, -18.59140396118164, -17.67814826965332, -16.764892578125, -15.85163688659668, -14.938382148742676, -14.025126457214355, -13.111871719360352, -12.198616027832031, -11.285360336303711, -10.37210464477539, -9.458849906921387, -8.545594215393066, -7.632339000701904, -6.719083786010742, -5.805828094482422, -4.89257287979126, -3.9793174266815186, -3.0660619735717773, -2.1528067588806152, -1.239551067352295, -0.3262958526611328, 0.5869595408439636, 1.50021493434906, 2.4134702682495117, 3.326725721359253, 4.239981174468994, 5.153236389160156, 6.066492080688477, 6.979747295379639, 7.893002510070801, 8.806258201599121, 9.719512939453125, 10.632768630981445, 11.546024322509766, 12.459280014038086, 13.372535705566406, 14.28579044342041, 15.19904613494873, 16.112300872802734, 17.025556564331055, 17.938812255859375, 18.852067947387695, 19.765323638916016, 20.678577423095703, 21.591833114624023, 22.505088806152344, 23.418344497680664, 24.331600189208984, 25.244853973388672, 26.158109664916992, 27.071365356445312, 27.984621047973633, 28.897876739501953]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 8.0, 5.0, 13.0, 7.0, 14.0, 20.0, 14.0, 15.0, 33.0, 23.0, 28.0, 29.0, 32.0, 35.0, 32.0, 47.0, 45.0, 46.0, 53.0, 47.0, 56.0, 38.0, 43.0, 36.0, 37.0, 30.0, 36.0, 35.0, 22.0, 28.0, 18.0, 13.0, 22.0, 8.0, 11.0, 7.0, 4.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.61328125, -4.45977783203125, -4.3062744140625, -4.15277099609375, -3.999267578125, -3.84576416015625, -3.6922607421875, -3.53875732421875, -3.38525390625, -3.23175048828125, -3.0782470703125, -2.92474365234375, -2.771240234375, -2.61773681640625, -2.4642333984375, -2.31072998046875, -2.1572265625, -2.00372314453125, -1.8502197265625, -1.69671630859375, -1.543212890625, -1.38970947265625, -1.2362060546875, -1.08270263671875, -0.92919921875, -0.77569580078125, -0.6221923828125, -0.46868896484375, -0.315185546875, -0.16168212890625, -0.0081787109375, 0.14532470703125, 0.298828125, 0.45233154296875, 0.6058349609375, 0.75933837890625, 0.912841796875, 1.06634521484375, 1.2198486328125, 1.37335205078125, 1.52685546875, 1.68035888671875, 1.8338623046875, 1.98736572265625, 2.140869140625, 2.29437255859375, 2.4478759765625, 2.60137939453125, 2.7548828125, 2.90838623046875, 3.0618896484375, 3.21539306640625, 3.368896484375, 3.52239990234375, 3.6759033203125, 3.82940673828125, 3.98291015625, 4.13641357421875, 4.2899169921875, 4.44342041015625, 4.596923828125, 4.75042724609375, 4.9039306640625, 5.05743408203125, 5.2109375]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 7.0, 13.0, 12.0, 25.0, 28.0, 46.0, 58.0, 62.0, 105.0, 133.0, 156.0, 200.0, 310.0, 419.0, 608.0, 1053.0, 2207.0, 7007.0, 40785.0, 456043.0, 3256467.0, 379664.0, 36889.0, 6758.0, 2089.0, 1019.0, 597.0, 370.0, 301.0, 209.0, 174.0, 112.0, 88.0, 64.0, 57.0, 53.0, 25.0, 23.0, 11.0, 14.0, 8.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-25.1875, -24.36083984375, -23.5341796875, -22.70751953125, -21.880859375, -21.05419921875, -20.2275390625, -19.40087890625, -18.57421875, -17.74755859375, -16.9208984375, -16.09423828125, -15.267578125, -14.44091796875, -13.6142578125, -12.78759765625, -11.9609375, -11.13427734375, -10.3076171875, -9.48095703125, -8.654296875, -7.82763671875, -7.0009765625, -6.17431640625, -5.34765625, -4.52099609375, -3.6943359375, -2.86767578125, -2.041015625, -1.21435546875, -0.3876953125, 0.43896484375, 1.265625, 2.09228515625, 2.9189453125, 3.74560546875, 4.572265625, 5.39892578125, 6.2255859375, 7.05224609375, 7.87890625, 8.70556640625, 9.5322265625, 10.35888671875, 11.185546875, 12.01220703125, 12.8388671875, 13.66552734375, 14.4921875, 15.31884765625, 16.1455078125, 16.97216796875, 17.798828125, 18.62548828125, 19.4521484375, 20.27880859375, 21.10546875, 21.93212890625, 22.7587890625, 23.58544921875, 24.412109375, 25.23876953125, 26.0654296875, 26.89208984375, 27.71875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 5.0, 4.0, 7.0, 11.0, 13.0, 4.0, 7.0, 15.0, 19.0, 23.0, 30.0, 52.0, 62.0, 76.0, 102.0, 122.0, 138.0, 150.0, 216.0, 229.0, 295.0, 327.0, 320.0, 322.0, 265.0, 229.0, 185.0, 176.0, 116.0, 108.0, 87.0, 73.0, 60.0, 47.0, 39.0, 36.0, 25.0, 16.0, 12.0, 15.0, 6.0, 12.0, 6.0, 4.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-8.6796875, -8.42718505859375, -8.1746826171875, -7.92218017578125, -7.669677734375, -7.41717529296875, -7.1646728515625, -6.91217041015625, -6.65966796875, -6.40716552734375, -6.1546630859375, -5.90216064453125, -5.649658203125, -5.39715576171875, -5.1446533203125, -4.89215087890625, -4.6396484375, -4.38714599609375, -4.1346435546875, -3.88214111328125, -3.629638671875, -3.37713623046875, -3.1246337890625, -2.87213134765625, -2.61962890625, -2.36712646484375, -2.1146240234375, -1.86212158203125, -1.609619140625, -1.35711669921875, -1.1046142578125, -0.85211181640625, -0.599609375, -0.34710693359375, -0.0946044921875, 0.15789794921875, 0.410400390625, 0.66290283203125, 0.9154052734375, 1.16790771484375, 1.42041015625, 1.67291259765625, 1.9254150390625, 2.17791748046875, 2.430419921875, 2.68292236328125, 2.9354248046875, 3.18792724609375, 3.4404296875, 3.69293212890625, 3.9454345703125, 4.19793701171875, 4.450439453125, 4.70294189453125, 4.9554443359375, 5.20794677734375, 5.46044921875, 5.71295166015625, 5.9654541015625, 6.21795654296875, 6.470458984375, 6.72296142578125, 6.9754638671875, 7.22796630859375, 7.48046875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 8.0, 4.0, 3.0, 8.0, 17.0, 13.0, 20.0, 25.0, 28.0, 76.0, 80.0, 132.0, 198.0, 317.0, 604.0, 1188.0, 2807.0, 7981.0, 24980.0, 94661.0, 419560.0, 1923423.0, 1347639.0, 276983.0, 65304.0, 17897.0, 5835.0, 2194.0, 944.0, 494.0, 287.0, 184.0, 121.0, 85.0, 59.0, 37.0, 26.0, 17.0, 16.0, 10.0, 8.0, 6.0, 5.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.546875, -11.1468505859375, -10.746826171875, -10.3468017578125, -9.94677734375, -9.5467529296875, -9.146728515625, -8.7467041015625, -8.3466796875, -7.9466552734375, -7.546630859375, -7.1466064453125, -6.74658203125, -6.3465576171875, -5.946533203125, -5.5465087890625, -5.146484375, -4.7464599609375, -4.346435546875, -3.9464111328125, -3.54638671875, -3.1463623046875, -2.746337890625, -2.3463134765625, -1.9462890625, -1.5462646484375, -1.146240234375, -0.7462158203125, -0.34619140625, 0.0538330078125, 0.453857421875, 0.8538818359375, 1.25390625, 1.6539306640625, 2.053955078125, 2.4539794921875, 2.85400390625, 3.2540283203125, 3.654052734375, 4.0540771484375, 4.4541015625, 4.8541259765625, 5.254150390625, 5.6541748046875, 6.05419921875, 6.4542236328125, 6.854248046875, 7.2542724609375, 7.654296875, 8.0543212890625, 8.454345703125, 8.8543701171875, 9.25439453125, 9.6544189453125, 10.054443359375, 10.4544677734375, 10.8544921875, 11.2545166015625, 11.654541015625, 12.0545654296875, 12.45458984375, 12.8546142578125, 13.254638671875, 13.6546630859375, 14.0546875]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 9.0, 7.0, 4.0, 14.0, 22.0, 32.0, 36.0, 58.0, 76.0, 72.0, 87.0, 100.0, 92.0, 88.0, 83.0, 66.0, 39.0, 35.0, 32.0, 18.0, 17.0, 5.0, 9.0, 4.0, 0.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.0766830444336, -71.915283203125, -68.75387573242188, -65.59247589111328, -62.43107604980469, -59.269676208496094, -56.108272552490234, -52.946868896484375, -49.78546905517578, -46.62406921386719, -43.46266555786133, -40.30126190185547, -37.139862060546875, -33.97846221923828, -30.817058563232422, -27.655656814575195, -24.49425506591797, -21.332853317260742, -18.171451568603516, -15.010049819946289, -11.848648071289062, -8.687246322631836, -5.525844573974609, -2.364442825317383, 0.7969589233398438, 3.9583606719970703, 7.119762420654297, 10.281164169311523, 13.44256591796875, 16.603967666625977, 19.765369415283203, 22.92677116394043, 26.088165283203125, 29.24956703186035, 32.41096878051758, 35.57237243652344, 38.73377227783203, 41.895172119140625, 45.056575775146484, 48.217979431152344, 51.37937927246094, 54.54077911376953, 57.70218276977539, 60.86358642578125, 64.02498626708984, 67.18638610839844, 70.34779357910156, 73.50919342041016, 76.67059326171875, 79.83199310302734, 82.99339294433594, 86.15480041503906, 89.31620025634766, 92.47760009765625, 95.63900756835938, 98.80040740966797, 101.96180725097656, 105.12320709228516, 108.28460693359375, 111.44601440429688, 114.60741424560547, 117.76881408691406, 120.93022155761719, 124.09162139892578, 127.25302124023438]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 8.0, 8.0, 10.0, 15.0, 13.0, 8.0, 19.0, 21.0, 28.0, 27.0, 24.0, 30.0, 36.0, 28.0, 39.0, 45.0, 41.0, 47.0, 41.0, 50.0, 39.0, 50.0, 45.0, 31.0, 34.0, 34.0, 39.0, 23.0, 27.0, 27.0, 24.0, 16.0, 13.0, 10.0, 16.0, 9.0, 8.0, 2.0, 2.0, 4.0, 5.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.72960662841797, -56.040584564208984, -54.351566314697266, -52.66254425048828, -50.97352600097656, -49.28450393676758, -47.595481872558594, -45.906463623046875, -44.217445373535156, -42.52842330932617, -40.83940505981445, -39.15038299560547, -37.46136474609375, -35.772342681884766, -34.08332061767578, -32.39430236816406, -30.705280303955078, -29.016260147094727, -27.327239990234375, -25.63821792602539, -23.949199676513672, -22.260177612304688, -20.571157455444336, -18.882137298583984, -17.193117141723633, -15.504096984863281, -13.81507682800293, -12.126055717468262, -10.43703556060791, -8.748015403747559, -7.058994293212891, -5.369974136352539, -3.680950164794922, -1.9919297695159912, -0.30290937423706055, 1.3861112594604492, 3.075131416320801, 4.764151573181152, 6.45317268371582, 8.142192840576172, 9.831212997436523, 11.520233154296875, 13.209253311157227, 14.898274421691895, 16.587295532226562, 18.27631378173828, 19.965335845947266, 21.654356002807617, 23.34337615966797, 25.03239631652832, 26.721416473388672, 28.410438537597656, 30.099456787109375, 31.78847885131836, 33.477500915527344, 35.16651916503906, 36.85553741455078, 38.544559478759766, 40.233577728271484, 41.92259979248047, 43.61161804199219, 45.30064010620117, 46.989662170410156, 48.678680419921875, 50.36770248413086]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 5.0, 9.0, 8.0, 8.0, 16.0, 11.0, 13.0, 26.0, 30.0, 10.0, 24.0, 25.0, 29.0, 27.0, 33.0, 34.0, 31.0, 29.0, 35.0, 48.0, 50.0, 53.0, 49.0, 40.0, 36.0, 32.0, 26.0, 31.0, 29.0, 27.0, 19.0, 23.0, 19.0, 19.0, 10.0, 8.0, 17.0, 12.0, 3.0, 7.0, 4.0, 6.0, 8.0, 5.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-106.125, -103.0478515625, -99.970703125, -96.8935546875, -93.81640625, -90.7392578125, -87.662109375, -84.5849609375, -81.5078125, -78.4306640625, -75.353515625, -72.2763671875, -69.19921875, -66.1220703125, -63.044921875, -59.9677734375, -56.890625, -53.8134765625, -50.736328125, -47.6591796875, -44.58203125, -41.5048828125, -38.427734375, -35.3505859375, -32.2734375, -29.1962890625, -26.119140625, -23.0419921875, -19.96484375, -16.8876953125, -13.810546875, -10.7333984375, -7.65625, -4.5791015625, -1.501953125, 1.5751953125, 4.65234375, 7.7294921875, 10.806640625, 13.8837890625, 16.9609375, 20.0380859375, 23.115234375, 26.1923828125, 29.26953125, 32.3466796875, 35.423828125, 38.5009765625, 41.578125, 44.6552734375, 47.732421875, 50.8095703125, 53.88671875, 56.9638671875, 60.041015625, 63.1181640625, 66.1953125, 69.2724609375, 72.349609375, 75.4267578125, 78.50390625, 81.5810546875, 84.658203125, 87.7353515625, 90.8125]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 15.0, 30.0, 24.0, 51.0, 82.0, 128.0, 177.0, 269.0, 386.0, 589.0, 901.0, 1329.0, 1982.0, 2930.0, 4662.0, 7123.0, 10850.0, 17072.0, 27874.0, 45557.0, 79389.0, 147418.0, 273679.0, 185027.0, 96785.0, 54991.0, 32703.0, 20158.0, 12701.0, 8074.0, 5243.0, 3413.0, 2326.0, 1513.0, 1037.0, 698.0, 492.0, 290.0, 217.0, 136.0, 80.0, 47.0, 35.0, 16.0, 20.0, 10.0, 11.0, 10.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.86279296875, -0.8379058837890625, -0.813018798828125, -0.7881317138671875, -0.76324462890625, -0.7383575439453125, -0.713470458984375, -0.6885833740234375, -0.6636962890625, -0.6388092041015625, -0.613922119140625, -0.5890350341796875, -0.56414794921875, -0.5392608642578125, -0.514373779296875, -0.4894866943359375, -0.464599609375, -0.4397125244140625, -0.414825439453125, -0.3899383544921875, -0.36505126953125, -0.3401641845703125, -0.315277099609375, -0.2903900146484375, -0.2655029296875, -0.2406158447265625, -0.215728759765625, -0.1908416748046875, -0.16595458984375, -0.1410675048828125, -0.116180419921875, -0.0912933349609375, -0.06640625, -0.0415191650390625, -0.016632080078125, 0.0082550048828125, 0.03314208984375, 0.0580291748046875, 0.082916259765625, 0.1078033447265625, 0.1326904296875, 0.1575775146484375, 0.182464599609375, 0.2073516845703125, 0.23223876953125, 0.2571258544921875, 0.282012939453125, 0.3069000244140625, 0.331787109375, 0.3566741943359375, 0.381561279296875, 0.4064483642578125, 0.43133544921875, 0.4562225341796875, 0.481109619140625, 0.5059967041015625, 0.5308837890625, 0.5557708740234375, 0.580657958984375, 0.6055450439453125, 0.63043212890625, 0.6553192138671875, 0.680206298828125, 0.7050933837890625, 0.72998046875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 6.0, 3.0, 1.0, 2.0, 7.0, 4.0, 6.0, 5.0, 5.0, 7.0, 5.0, 12.0, 13.0, 15.0, 16.0, 17.0, 25.0, 20.0, 19.0, 25.0, 25.0, 25.0, 39.0, 39.0, 41.0, 38.0, 35.0, 30.0, 1071.0, 39.0, 34.0, 34.0, 57.0, 36.0, 39.0, 26.0, 25.0, 20.0, 28.0, 17.0, 17.0, 17.0, 13.0, 11.0, 10.0, 12.0, 11.0, 6.0, 5.0, 6.0, 9.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-77.8125, -75.3857421875, -72.958984375, -70.5322265625, -68.10546875, -65.6787109375, -63.251953125, -60.8251953125, -58.3984375, -55.9716796875, -53.544921875, -51.1181640625, -48.69140625, -46.2646484375, -43.837890625, -41.4111328125, -38.984375, -36.5576171875, -34.130859375, -31.7041015625, -29.27734375, -26.8505859375, -24.423828125, -21.9970703125, -19.5703125, -17.1435546875, -14.716796875, -12.2900390625, -9.86328125, -7.4365234375, -5.009765625, -2.5830078125, -0.15625, 2.2705078125, 4.697265625, 7.1240234375, 9.55078125, 11.9775390625, 14.404296875, 16.8310546875, 19.2578125, 21.6845703125, 24.111328125, 26.5380859375, 28.96484375, 31.3916015625, 33.818359375, 36.2451171875, 38.671875, 41.0986328125, 43.525390625, 45.9521484375, 48.37890625, 50.8056640625, 53.232421875, 55.6591796875, 58.0859375, 60.5126953125, 62.939453125, 65.3662109375, 67.79296875, 70.2197265625, 72.646484375, 75.0732421875, 77.5]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 6.0, 8.0, 6.0, 19.0, 14.0, 35.0, 32.0, 53.0, 73.0, 105.0, 137.0, 209.0, 308.0, 431.0, 650.0, 864.0, 1328.0, 1807.0, 2683.0, 3904.0, 5834.0, 8495.0, 12922.0, 19395.0, 29934.0, 46309.0, 74722.0, 123994.0, 1248216.0, 193282.0, 118305.0, 71673.0, 44827.0, 29048.0, 18859.0, 12301.0, 8484.0, 5582.0, 3898.0, 2517.0, 1716.0, 1219.0, 846.0, 645.0, 456.0, 302.0, 200.0, 159.0, 116.0, 65.0, 45.0, 32.0, 18.0, 18.0, 21.0, 9.0, 6.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.298095703125, -0.2884674072265625, -0.278839111328125, -0.2692108154296875, -0.25958251953125, -0.2499542236328125, -0.240325927734375, -0.2306976318359375, -0.2210693359375, -0.2114410400390625, -0.201812744140625, -0.1921844482421875, -0.18255615234375, -0.1729278564453125, -0.163299560546875, -0.1536712646484375, -0.14404296875, -0.1344146728515625, -0.124786376953125, -0.1151580810546875, -0.10552978515625, -0.0959014892578125, -0.086273193359375, -0.0766448974609375, -0.0670166015625, -0.0573883056640625, -0.047760009765625, -0.0381317138671875, -0.02850341796875, -0.0188751220703125, -0.009246826171875, 0.0003814697265625, 0.010009765625, 0.0196380615234375, 0.029266357421875, 0.0388946533203125, 0.04852294921875, 0.0581512451171875, 0.067779541015625, 0.0774078369140625, 0.0870361328125, 0.0966644287109375, 0.106292724609375, 0.1159210205078125, 0.12554931640625, 0.1351776123046875, 0.144805908203125, 0.1544342041015625, 0.1640625, 0.1736907958984375, 0.183319091796875, 0.1929473876953125, 0.20257568359375, 0.2122039794921875, 0.221832275390625, 0.2314605712890625, 0.2410888671875, 0.2507171630859375, 0.260345458984375, 0.2699737548828125, 0.27960205078125, 0.2892303466796875, 0.298858642578125, 0.3084869384765625, 0.318115234375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 6.0, 5.0, 7.0, 6.0, 7.0, 9.0, 8.0, 10.0, 15.0, 26.0, 41.0, 32.0, 58.0, 100.0, 143.0, 134.0, 119.0, 66.0, 54.0, 34.0, 28.0, 23.0, 11.0, 12.0, 9.0, 6.0, 7.0, 5.0, 5.0, 7.0, 0.0, 3.0, 2.0, 1.0, 7.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.796815872192383e-05, -3.645848482847214e-05, -3.494881093502045e-05, -3.3439137041568756e-05, -3.1929463148117065e-05, -3.0419789254665375e-05, -2.8910115361213684e-05, -2.7400441467761993e-05, -2.5890767574310303e-05, -2.4381093680858612e-05, -2.287141978740692e-05, -2.136174589395523e-05, -1.985207200050354e-05, -1.834239810705185e-05, -1.683272421360016e-05, -1.5323050320148468e-05, -1.3813376426696777e-05, -1.2303702533245087e-05, -1.0794028639793396e-05, -9.284354746341705e-06, -7.774680852890015e-06, -6.265006959438324e-06, -4.755333065986633e-06, -3.2456591725349426e-06, -1.735985279083252e-06, -2.2631138563156128e-07, 1.2833625078201294e-06, 2.79303640127182e-06, 4.302710294723511e-06, 5.812384188175201e-06, 7.322058081626892e-06, 8.831731975078583e-06, 1.0341405868530273e-05, 1.1851079761981964e-05, 1.3360753655433655e-05, 1.4870427548885345e-05, 1.6380101442337036e-05, 1.7889775335788727e-05, 1.9399449229240417e-05, 2.0909123122692108e-05, 2.24187970161438e-05, 2.392847090959549e-05, 2.543814480304718e-05, 2.694781869649887e-05, 2.845749258995056e-05, 2.9967166483402252e-05, 3.147684037685394e-05, 3.2986514270305634e-05, 3.4496188163757324e-05, 3.6005862057209015e-05, 3.7515535950660706e-05, 3.9025209844112396e-05, 4.053488373756409e-05, 4.204455763101578e-05, 4.355423152446747e-05, 4.506390541791916e-05, 4.657357931137085e-05, 4.808325320482254e-05, 4.959292709827423e-05, 5.110260099172592e-05, 5.261227488517761e-05, 5.41219487786293e-05, 5.5631622672080994e-05, 5.7141296565532684e-05, 5.8650970458984375e-05]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 3.0, 6.0, 11.0, 11.0, 19.0, 22.0, 46.0, 48.0, 66.0, 112.0, 189.0, 290.0, 500.0, 924.0, 1772.0, 3345.0, 6469.0, 13784.0, 31265.0, 77119.0, 242696.0, 435466.0, 141036.0, 51176.0, 21837.0, 9830.0, 4858.0, 2459.0, 1337.0, 737.0, 396.0, 248.0, 159.0, 97.0, 71.0, 44.0, 38.0, 19.0, 13.0, 6.0, 10.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00021970272064208984, -0.00021310150623321533, -0.00020650029182434082, -0.0001998990774154663, -0.0001932978630065918, -0.00018669664859771729, -0.00018009543418884277, -0.00017349421977996826, -0.00016689300537109375, -0.00016029179096221924, -0.00015369057655334473, -0.00014708936214447021, -0.0001404881477355957, -0.0001338869333267212, -0.00012728571891784668, -0.00012068450450897217, -0.00011408329010009766, -0.00010748207569122314, -0.00010088086128234863, -9.427964687347412e-05, -8.767843246459961e-05, -8.10772180557251e-05, -7.447600364685059e-05, -6.787478923797607e-05, -6.127357482910156e-05, -5.467236042022705e-05, -4.807114601135254e-05, -4.146993160247803e-05, -3.4868717193603516e-05, -2.8267502784729004e-05, -2.1666288375854492e-05, -1.506507396697998e-05, -8.463859558105469e-06, -1.862645149230957e-06, 4.738569259643555e-06, 1.1339783668518066e-05, 1.7940998077392578e-05, 2.454221248626709e-05, 3.11434268951416e-05, 3.774464130401611e-05, 4.4345855712890625e-05, 5.094707012176514e-05, 5.754828453063965e-05, 6.414949893951416e-05, 7.075071334838867e-05, 7.735192775726318e-05, 8.39531421661377e-05, 9.055435657501221e-05, 9.715557098388672e-05, 0.00010375678539276123, 0.00011035799980163574, 0.00011695921421051025, 0.00012356042861938477, 0.00013016164302825928, 0.0001367628574371338, 0.0001433640718460083, 0.0001499652862548828, 0.00015656650066375732, 0.00016316771507263184, 0.00016976892948150635, 0.00017637014389038086, 0.00018297135829925537, 0.00018957257270812988, 0.0001961737871170044, 0.0002027750015258789]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 12.0, 8.0, 12.0, 20.0, 32.0, 56.0, 90.0, 109.0, 127.0, 132.0, 98.0, 91.0, 46.0, 54.0, 32.0, 27.0, 14.0, 13.0, 7.0, 10.0, 1.0, 6.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5547399824718013e-05, -5.274198701954447e-05, -4.9936570576392114e-05, -4.713115777121857e-05, -4.432574496604502e-05, -4.1520332160871476e-05, -3.871491935569793e-05, -3.590950291254558e-05, -3.310409010737203e-05, -3.0298677302198485e-05, -2.7493262678035535e-05, -2.4687848053872585e-05, -2.188243524869904e-05, -1.9077022443525493e-05, -1.6271607819362544e-05, -1.3466193195199594e-05, -1.0660780390026048e-05, -7.8553666753578e-06, -5.049952960689552e-06, -2.2445392460213043e-06, 5.608744686469436e-07, 3.3662881833151914e-06, 6.171701897983439e-06, 8.977116522146389e-06, 1.1782529327319935e-05, 1.4587943041988183e-05, 1.739335675665643e-05, 2.019877138081938e-05, 2.3004184185992926e-05, 2.5809596991166472e-05, 2.8615011615329422e-05, 3.142042623949237e-05, 3.4225842682644725e-05, 3.703125548781827e-05, 3.983666829299182e-05, 4.264208473614417e-05, 4.5447497541317716e-05, 4.825291034649126e-05, 5.1058326789643615e-05, 5.386373959481716e-05, 5.666915239999071e-05, 5.9474565205164254e-05, 6.22799780103378e-05, 6.508539081551135e-05, 6.78908108966425e-05, 7.069622370181605e-05, 7.35016365069896e-05, 7.630704931216314e-05, 7.911246211733669e-05, 8.191787492251024e-05, 8.472328772768378e-05, 8.752870053285733e-05, 9.033411333803087e-05, 9.313953341916203e-05, 9.594494622433558e-05, 9.875035902950913e-05, 0.00010155577183468267, 0.00010436118463985622, 0.00010716659744502977, 0.00010997201025020331, 0.00011277743033133447, 0.00011558284313650802, 0.00011838825594168156, 0.00012119366874685511, 0.00012399908155202866]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 7.0, 8.0, 10.0, 5.0, 13.0, 9.0, 9.0, 22.0, 14.0, 17.0, 34.0, 17.0, 26.0, 39.0, 27.0, 43.0, 33.0, 40.0, 36.0, 28.0, 33.0, 41.0, 34.0, 41.0, 29.0, 29.0, 35.0, 27.0, 33.0, 31.0, 32.0, 29.0, 21.0, 21.0, 16.0, 18.0, 12.0, 13.0, 13.0, 8.0, 5.0, 6.0, 4.0, 4.0, 8.0, 11.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-2.4020671844482422e-05, -2.329424023628235e-05, -2.2567808628082275e-05, -2.1841377019882202e-05, -2.111494541168213e-05, -2.0388513803482056e-05, -1.9662082195281982e-05, -1.893565058708191e-05, -1.8209218978881836e-05, -1.7482787370681763e-05, -1.675635576248169e-05, -1.6029924154281616e-05, -1.5303492546081543e-05, -1.457706093788147e-05, -1.3850629329681396e-05, -1.3124197721481323e-05, -1.239776611328125e-05, -1.1671334505081177e-05, -1.0944902896881104e-05, -1.021847128868103e-05, -9.492039680480957e-06, -8.765608072280884e-06, -8.03917646408081e-06, -7.312744855880737e-06, -6.586313247680664e-06, -5.859881639480591e-06, -5.133450031280518e-06, -4.407018423080444e-06, -3.680586814880371e-06, -2.954155206680298e-06, -2.2277235984802246e-06, -1.5012919902801514e-06, -7.748603820800781e-07, -4.842877388000488e-08, 6.780028343200684e-07, 1.4044344425201416e-06, 2.130866050720215e-06, 2.857297658920288e-06, 3.5837292671203613e-06, 4.3101608753204346e-06, 5.036592483520508e-06, 5.763024091720581e-06, 6.489455699920654e-06, 7.2158873081207275e-06, 7.9423189163208e-06, 8.668750524520874e-06, 9.395182132720947e-06, 1.012161374092102e-05, 1.0848045349121094e-05, 1.1574476957321167e-05, 1.230090856552124e-05, 1.3027340173721313e-05, 1.3753771781921387e-05, 1.448020339012146e-05, 1.5206634998321533e-05, 1.5933066606521606e-05, 1.665949821472168e-05, 1.7385929822921753e-05, 1.8112361431121826e-05, 1.88387930393219e-05, 1.9565224647521973e-05, 2.0291656255722046e-05, 2.101808786392212e-05, 2.1744519472122192e-05, 2.2470951080322266e-05]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 5.0, 9.0, 8.0, 8.0, 16.0, 11.0, 13.0, 26.0, 30.0, 10.0, 24.0, 25.0, 29.0, 27.0, 33.0, 34.0, 31.0, 29.0, 35.0, 48.0, 50.0, 53.0, 49.0, 40.0, 36.0, 32.0, 26.0, 31.0, 29.0, 27.0, 19.0, 23.0, 19.0, 19.0, 10.0, 8.0, 17.0, 12.0, 3.0, 7.0, 4.0, 6.0, 8.0, 5.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-106.125, -103.0478515625, -99.970703125, -96.8935546875, -93.81640625, -90.7392578125, -87.662109375, -84.5849609375, -81.5078125, -78.4306640625, -75.353515625, -72.2763671875, -69.19921875, -66.1220703125, -63.044921875, -59.9677734375, -56.890625, -53.8134765625, -50.736328125, -47.6591796875, -44.58203125, -41.5048828125, -38.427734375, -35.3505859375, -32.2734375, -29.1962890625, -26.119140625, -23.0419921875, -19.96484375, -16.8876953125, -13.810546875, -10.7333984375, -7.65625, -4.5791015625, -1.501953125, 1.5751953125, 4.65234375, 7.7294921875, 10.806640625, 13.8837890625, 16.9609375, 20.0380859375, 23.115234375, 26.1923828125, 29.26953125, 32.3466796875, 35.423828125, 38.5009765625, 41.578125, 44.6552734375, 47.732421875, 50.8095703125, 53.88671875, 56.9638671875, 60.041015625, 63.1181640625, 66.1953125, 69.2724609375, 72.349609375, 75.4267578125, 78.50390625, 81.5810546875, 84.658203125, 87.7353515625, 90.8125]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 4.0, 3.0, 8.0, 9.0, 7.0, 11.0, 15.0, 14.0, 31.0, 33.0, 40.0, 31.0, 42.0, 57.0, 87.0, 158.0, 295.0, 571.0, 1509.0, 8218.0, 79967.0, 574036.0, 342415.0, 34497.0, 4308.0, 1037.0, 418.0, 221.0, 143.0, 90.0, 63.0, 41.0, 30.0, 29.0, 24.0, 14.0, 13.0, 10.0, 12.0, 7.0, 3.0, 5.0, 8.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-19.078125, -18.5302734375, -17.982421875, -17.4345703125, -16.88671875, -16.3388671875, -15.791015625, -15.2431640625, -14.6953125, -14.1474609375, -13.599609375, -13.0517578125, -12.50390625, -11.9560546875, -11.408203125, -10.8603515625, -10.3125, -9.7646484375, -9.216796875, -8.6689453125, -8.12109375, -7.5732421875, -7.025390625, -6.4775390625, -5.9296875, -5.3818359375, -4.833984375, -4.2861328125, -3.73828125, -3.1904296875, -2.642578125, -2.0947265625, -1.546875, -0.9990234375, -0.451171875, 0.0966796875, 0.64453125, 1.1923828125, 1.740234375, 2.2880859375, 2.8359375, 3.3837890625, 3.931640625, 4.4794921875, 5.02734375, 5.5751953125, 6.123046875, 6.6708984375, 7.21875, 7.7666015625, 8.314453125, 8.8623046875, 9.41015625, 9.9580078125, 10.505859375, 11.0537109375, 11.6015625, 12.1494140625, 12.697265625, 13.2451171875, 13.79296875, 14.3408203125, 14.888671875, 15.4365234375, 15.984375]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 4.0, 4.0, 11.0, 10.0, 10.0, 17.0, 19.0, 22.0, 24.0, 33.0, 37.0, 37.0, 34.0, 54.0, 44.0, 44.0, 46.0, 55.0, 2092.0, 45.0, 45.0, 47.0, 31.0, 39.0, 34.0, 45.0, 28.0, 21.0, 25.0, 17.0, 14.0, 12.0, 8.0, 11.0, 7.0, 9.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-171.5, -166.658203125, -161.81640625, -156.974609375, -152.1328125, -147.291015625, -142.44921875, -137.607421875, -132.765625, -127.923828125, -123.08203125, -118.240234375, -113.3984375, -108.556640625, -103.71484375, -98.873046875, -94.03125, -89.189453125, -84.34765625, -79.505859375, -74.6640625, -69.822265625, -64.98046875, -60.138671875, -55.296875, -50.455078125, -45.61328125, -40.771484375, -35.9296875, -31.087890625, -26.24609375, -21.404296875, -16.5625, -11.720703125, -6.87890625, -2.037109375, 2.8046875, 7.646484375, 12.48828125, 17.330078125, 22.171875, 27.013671875, 31.85546875, 36.697265625, 41.5390625, 46.380859375, 51.22265625, 56.064453125, 60.90625, 65.748046875, 70.58984375, 75.431640625, 80.2734375, 85.115234375, 89.95703125, 94.798828125, 99.640625, 104.482421875, 109.32421875, 114.166015625, 119.0078125, 123.849609375, 128.69140625, 133.533203125, 138.375]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 7.0, 10.0, 7.0, 15.0, 16.0, 32.0, 73.0, 99.0, 188.0, 371.0, 757.0, 1908.0, 9557.0, 184799.0, 2894731.0, 46445.0, 4298.0, 1197.0, 562.0, 272.0, 152.0, 82.0, 49.0, 29.0, 17.0, 17.0, 6.0, 7.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5234375, -14.8843994140625, -14.245361328125, -13.6063232421875, -12.96728515625, -12.3282470703125, -11.689208984375, -11.0501708984375, -10.4111328125, -9.7720947265625, -9.133056640625, -8.4940185546875, -7.85498046875, -7.2159423828125, -6.576904296875, -5.9378662109375, -5.298828125, -4.6597900390625, -4.020751953125, -3.3817138671875, -2.74267578125, -2.1036376953125, -1.464599609375, -0.8255615234375, -0.1865234375, 0.4525146484375, 1.091552734375, 1.7305908203125, 2.36962890625, 3.0086669921875, 3.647705078125, 4.2867431640625, 4.92578125, 5.5648193359375, 6.203857421875, 6.8428955078125, 7.48193359375, 8.1209716796875, 8.760009765625, 9.3990478515625, 10.0380859375, 10.6771240234375, 11.316162109375, 11.9552001953125, 12.59423828125, 13.2332763671875, 13.872314453125, 14.5113525390625, 15.150390625, 15.7894287109375, 16.428466796875, 17.0675048828125, 17.70654296875, 18.3455810546875, 18.984619140625, 19.6236572265625, 20.2626953125, 20.9017333984375, 21.540771484375, 22.1798095703125, 22.81884765625, 23.4578857421875, 24.096923828125, 24.7359619140625, 25.375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 9.0, 12.0, 11.0, 22.0, 45.0, 93.0, 115.0, 163.0, 166.0, 142.0, 90.0, 56.0, 27.0, 16.0, 12.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-231.48439025878906, -220.6607666015625, -209.837158203125, -199.01353454589844, -188.18991088867188, -177.3662872314453, -166.54266357421875, -155.71905517578125, -144.8954315185547, -134.07180786132812, -123.2481918334961, -112.42457580566406, -101.6009521484375, -90.77732849121094, -79.9537124633789, -69.13009643554688, -58.30647277832031, -47.482852935791016, -36.65923309326172, -25.835613250732422, -15.011993408203125, -4.188373565673828, 6.635246276855469, 17.4588623046875, 28.282485961914062, 39.10610580444336, 49.929725646972656, 60.75334548950195, 71.57696533203125, 82.40058898925781, 93.22420501708984, 104.04782104492188, 114.87142944335938, 125.69505310058594, 136.5186767578125, 147.34228515625, 158.16590881347656, 168.98953247070312, 179.81314086914062, 190.6367645263672, 201.46038818359375, 212.2840118408203, 223.10763549804688, 233.93124389648438, 244.75486755371094, 255.5784912109375, 266.402099609375, 277.2257080078125, 288.0493469238281, 298.8729553222656, 309.69659423828125, 320.52020263671875, 331.34381103515625, 342.1674499511719, 352.9910583496094, 363.814697265625, 374.6383056640625, 385.4619140625, 396.2855529785156, 407.1091613769531, 417.93280029296875, 428.75640869140625, 439.58001708984375, 450.40362548828125, 461.2272644042969]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 9.0, 6.0, 12.0, 13.0, 12.0, 16.0, 13.0, 12.0, 18.0, 19.0, 21.0, 29.0, 30.0, 30.0, 25.0, 30.0, 45.0, 42.0, 37.0, 41.0, 41.0, 42.0, 33.0, 36.0, 43.0, 30.0, 30.0, 39.0, 27.0, 29.0, 24.0, 16.0, 28.0, 24.0, 13.0, 10.0, 9.0, 13.0, 9.0, 10.0, 9.0, 6.0, 4.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-218.80093383789062, -211.5113983154297, -204.2218780517578, -196.93234252929688, -189.642822265625, -182.35328674316406, -175.06375122070312, -167.77423095703125, -160.48471069335938, -153.19517517089844, -145.90565490722656, -138.61611938476562, -131.32659912109375, -124.03706359863281, -116.7475357055664, -109.4580078125, -102.16847229003906, -94.87894439697266, -87.58941650390625, -80.29988098144531, -73.01036071777344, -65.7208251953125, -58.431297302246094, -51.14176940917969, -43.85224151611328, -36.562713623046875, -29.273183822631836, -21.983654022216797, -14.69412612915039, -7.404598236083984, -0.1150665283203125, 7.174461364746094, 14.464004516601562, 21.75353240966797, 29.043062210083008, 36.33259201049805, 43.62211990356445, 50.91164779663086, 58.20117950439453, 65.49070739746094, 72.78023529052734, 80.06976318359375, 87.35929107666016, 94.64881896972656, 101.9383544921875, 109.22787475585938, 116.51741027832031, 123.80693817138672, 131.09646606445312, 138.38600158691406, 145.67552185058594, 152.96505737304688, 160.25457763671875, 167.5441131591797, 174.83364868164062, 182.1231689453125, 189.41268920898438, 196.7022247314453, 203.9917449951172, 211.28128051757812, 218.57080078125, 225.86033630371094, 233.14987182617188, 240.43939208984375, 247.7289276123047]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 15.0, 7.0, 21.0, 20.0, 33.0, 31.0, 55.0, 64.0, 99.0, 120.0, 159.0, 224.0, 233.0, 335.0, 441.0, 519.0, 686.0, 1079.0, 1040564.0, 938.0, 632.0, 524.0, 402.0, 329.0, 252.0, 210.0, 132.0, 97.0, 86.0, 62.0, 60.0, 49.0, 21.0, 12.0, 16.0, 5.0, 12.0, 5.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.50636672973633, -58.374576568603516, -56.2427864074707, -54.11099624633789, -51.97920608520508, -49.847415924072266, -47.71562957763672, -45.583839416503906, -43.452049255371094, -41.32025909423828, -39.18846893310547, -37.056678771972656, -34.924888610839844, -32.79309844970703, -30.66131019592285, -28.52952003479004, -26.397727966308594, -24.26593780517578, -22.13414764404297, -20.002357482910156, -17.870567321777344, -15.738778114318848, -13.606988906860352, -11.475198745727539, -9.343408584594727, -7.211618423461914, -5.07982873916626, -2.9480390548706055, -0.816248893737793, 1.3155412673950195, 3.4473304748535156, 5.579120635986328, 7.710906982421875, 9.842697143554688, 11.9744873046875, 14.106276512145996, 16.238067626953125, 18.369857788085938, 20.501646041870117, 22.63343620300293, 24.765226364135742, 26.897016525268555, 29.028806686401367, 31.160594940185547, 33.29238510131836, 35.42417526245117, 37.555965423583984, 39.6877555847168, 41.81954574584961, 43.95133590698242, 46.083126068115234, 48.21491622924805, 50.34670639038086, 52.47849655151367, 54.61028289794922, 56.74207305908203, 58.873863220214844, 61.005653381347656, 63.13744354248047, 65.26923370361328, 67.4010238647461, 69.5328140258789, 71.66460418701172, 73.79639434814453, 75.92818450927734]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 12.0, 3.0, 9.0, 6.0, 11.0, 25.0, 50.0, 73.0, 115.0, 187.0, 1657.0, 51435812.0, 24197.0, 674.0, 141.0, 72.0, 40.0, 18.0, 14.0, 9.0, 4.0, 9.0, 5.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1009.6558837890625, -973.3961181640625, -937.1363525390625, -900.8765869140625, -864.6168212890625, -828.3570556640625, -792.0973510742188, -755.8375854492188, -719.5778198242188, -683.3180541992188, -647.0582885742188, -610.7985229492188, -574.538818359375, -538.279052734375, -502.019287109375, -465.759521484375, -429.499755859375, -393.239990234375, -356.980224609375, -320.7204895019531, -284.4607238769531, -248.20095825195312, -211.9412078857422, -175.68145751953125, -139.42169189453125, -103.16193389892578, -66.90217590332031, -30.642417907714844, 5.617340087890625, 41.877105712890625, 78.13685607910156, 114.3966064453125, 150.6563720703125, 186.9161376953125, 223.17588806152344, 259.4356384277344, 295.6954040527344, 331.9551696777344, 368.21490478515625, 404.47467041015625, 440.73443603515625, 476.99420166015625, 513.2539672851562, 549.5137329101562, 585.7734375, 622.033203125, 658.29296875, 694.552734375, 730.8125, 767.072265625, 803.33203125, 839.591796875, 875.8515625, 912.111328125, 948.3710327148438, 984.6307983398438, 1020.8905639648438, 1057.1502685546875, 1093.4100341796875, 1129.6697998046875, 1165.9295654296875, 1202.1893310546875, 1238.4490966796875, 1274.7088623046875, 1310.9686279296875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 9.0, 12.0, 23.0, 32.0, 35.0, 62.0, 94.0, 160.0, 254.0, 395.0, 531.0, 845.0, 1320.0, 1960.0, 3012.0, 4577.0, 6914.0, 10934.0, 16889.0, 26845.0, 42673.0, 69498.0, 114709.0, 191176.0, 327152.0, 531196.0, 3783744.0, 460198.0, 275487.0, 162428.0, 97433.0, 59325.0, 36633.0, 23232.0, 14458.0, 9534.0, 6095.0, 3905.0, 2718.0, 1718.0, 1061.0, 676.0, 497.0, 313.0, 202.0, 166.0, 112.0, 74.0, 32.0, 30.0, 24.0, 8.0, 11.0, 7.0, 10.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1298828125, -0.1254558563232422, -0.12102890014648438, -0.11660194396972656, -0.11217498779296875, -0.10774803161621094, -0.10332107543945312, -0.09889411926269531, -0.0944671630859375, -0.09004020690917969, -0.08561325073242188, -0.08118629455566406, -0.07675933837890625, -0.07233238220214844, -0.06790542602539062, -0.06347846984863281, -0.059051513671875, -0.05462455749511719, -0.050197601318359375, -0.04577064514160156, -0.04134368896484375, -0.03691673278808594, -0.032489776611328125, -0.028062820434570312, -0.0236358642578125, -0.019208908081054688, -0.014781951904296875, -0.010354995727539062, -0.00592803955078125, -0.0015010833740234375, 0.002925872802734375, 0.0073528289794921875, 0.01177978515625, 0.016206741333007812, 0.020633697509765625, 0.025060653686523438, 0.02948760986328125, 0.03391456604003906, 0.038341522216796875, 0.04276847839355469, 0.0471954345703125, 0.05162239074707031, 0.056049346923828125, 0.06047630310058594, 0.06490325927734375, 0.06933021545410156, 0.07375717163085938, 0.07818412780761719, 0.082611083984375, 0.08703804016113281, 0.09146499633789062, 0.09589195251464844, 0.10031890869140625, 0.10474586486816406, 0.10917282104492188, 0.11359977722167969, 0.1180267333984375, 0.12245368957519531, 0.12688064575195312, 0.13130760192871094, 0.13573455810546875, 0.14016151428222656, 0.14458847045898438, 0.1490154266357422, 0.1534423828125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 9.0, 7.0, 6.0, 6.0, 12.0, 13.0, 17.0, 23.0, 20.0, 22.0, 22.0, 32.0, 30.0, 24.0, 34.0, 30.0, 26.0, 36.0, 50.0, 37.0, 109.0, 996.0, 44.0, 42.0, 29.0, 22.0, 39.0, 31.0, 38.0, 30.0, 20.0, 24.0, 20.0, 17.0, 23.0, 10.0, 11.0, 18.0, 5.0, 6.0, 7.0, 9.0, 6.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-48.5625, -47.17578125, -45.7890625, -44.40234375, -43.015625, -41.62890625, -40.2421875, -38.85546875, -37.46875, -36.08203125, -34.6953125, -33.30859375, -31.921875, -30.53515625, -29.1484375, -27.76171875, -26.375, -24.98828125, -23.6015625, -22.21484375, -20.828125, -19.44140625, -18.0546875, -16.66796875, -15.28125, -13.89453125, -12.5078125, -11.12109375, -9.734375, -8.34765625, -6.9609375, -5.57421875, -4.1875, -2.80078125, -1.4140625, -0.02734375, 1.359375, 2.74609375, 4.1328125, 5.51953125, 6.90625, 8.29296875, 9.6796875, 11.06640625, 12.453125, 13.83984375, 15.2265625, 16.61328125, 18.0, 19.38671875, 20.7734375, 22.16015625, 23.546875, 24.93359375, 26.3203125, 27.70703125, 29.09375, 30.48046875, 31.8671875, 33.25390625, 34.640625, 36.02734375, 37.4140625, 38.80078125, 40.1875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [6.0, 5.0, 8.0, 11.0, 16.0, 19.0, 26.0, 32.0, 52.0, 77.0, 110.0, 174.0, 243.0, 365.0, 476.0, 734.0, 1050.0, 1617.0, 2465.0, 3703.0, 5842.0, 8940.0, 14045.0, 21850.0, 35297.0, 57644.0, 93337.0, 152964.0, 256885.0, 426407.0, 3758659.0, 551751.0, 351975.0, 210411.0, 126797.0, 77120.0, 47843.0, 30044.0, 18838.0, 11667.0, 7451.0, 4948.0, 3072.0, 2103.0, 1434.0, 967.0, 630.0, 425.0, 263.0, 202.0, 140.0, 97.0, 73.0, 44.0, 38.0, 25.0, 10.0, 10.0, 8.0, 3.0, 0.0, 3.0, 2.0, 3.0], "bins": [-0.12384033203125, -0.11982059478759766, -0.11580085754394531, -0.11178112030029297, -0.10776138305664062, -0.10374164581298828, -0.09972190856933594, -0.0957021713256836, -0.09168243408203125, -0.0876626968383789, -0.08364295959472656, -0.07962322235107422, -0.07560348510742188, -0.07158374786376953, -0.06756401062011719, -0.06354427337646484, -0.0595245361328125, -0.055504798889160156, -0.05148506164550781, -0.04746532440185547, -0.043445587158203125, -0.03942584991455078, -0.03540611267089844, -0.031386375427246094, -0.02736663818359375, -0.023346900939941406, -0.019327163696289062, -0.015307426452636719, -0.011287689208984375, -0.007267951965332031, -0.0032482147216796875, 0.0007715225219726562, 0.004791259765625, 0.008810997009277344, 0.012830734252929688, 0.01685047149658203, 0.020870208740234375, 0.02488994598388672, 0.028909683227539062, 0.032929420471191406, 0.03694915771484375, 0.040968894958496094, 0.04498863220214844, 0.04900836944580078, 0.053028106689453125, 0.05704784393310547, 0.06106758117675781, 0.06508731842041016, 0.0691070556640625, 0.07312679290771484, 0.07714653015136719, 0.08116626739501953, 0.08518600463867188, 0.08920574188232422, 0.09322547912597656, 0.0972452163696289, 0.10126495361328125, 0.1052846908569336, 0.10930442810058594, 0.11332416534423828, 0.11734390258789062, 0.12136363983154297, 0.1253833770751953, 0.12940311431884766, 0.1334228515625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 2.0, 3.0, 5.0, 11.0, 9.0, 9.0, 18.0, 15.0, 17.0, 21.0, 20.0, 31.0, 29.0, 40.0, 29.0, 47.0, 39.0, 51.0, 42.0, 27.0, 1068.0, 49.0, 38.0, 35.0, 40.0, 35.0, 38.0, 33.0, 27.0, 36.0, 20.0, 31.0, 19.0, 20.0, 10.0, 14.0, 13.0, 7.0, 7.0, 7.0, 1.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-41.40625, -40.05029296875, -38.6943359375, -37.33837890625, -35.982421875, -34.62646484375, -33.2705078125, -31.91455078125, -30.55859375, -29.20263671875, -27.8466796875, -26.49072265625, -25.134765625, -23.77880859375, -22.4228515625, -21.06689453125, -19.7109375, -18.35498046875, -16.9990234375, -15.64306640625, -14.287109375, -12.93115234375, -11.5751953125, -10.21923828125, -8.86328125, -7.50732421875, -6.1513671875, -4.79541015625, -3.439453125, -2.08349609375, -0.7275390625, 0.62841796875, 1.984375, 3.34033203125, 4.6962890625, 6.05224609375, 7.408203125, 8.76416015625, 10.1201171875, 11.47607421875, 12.83203125, 14.18798828125, 15.5439453125, 16.89990234375, 18.255859375, 19.61181640625, 20.9677734375, 22.32373046875, 23.6796875, 25.03564453125, 26.3916015625, 27.74755859375, 29.103515625, 30.45947265625, 31.8154296875, 33.17138671875, 34.52734375, 35.88330078125, 37.2392578125, 38.59521484375, 39.951171875, 41.30712890625, 42.6630859375, 44.01904296875, 45.375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 5.0, 7.0, 15.0, 12.0, 19.0, 16.0, 30.0, 33.0, 55.0, 79.0, 81.0, 84.0, 123.0, 112.0, 220.0, 302.0, 494.0, 906.0, 2835.0, 14666.0, 103144.0, 6078680.0, 73373.0, 11474.0, 2382.0, 822.0, 425.0, 264.0, 176.0, 131.0, 114.0, 80.0, 61.0, 38.0, 47.0, 39.0, 26.0, 22.0, 10.0, 14.0, 7.0, 7.0, 4.0, 2.0, 0.0, 3.0], "bins": [-1.408203125, -1.3724822998046875, -1.336761474609375, -1.3010406494140625, -1.26531982421875, -1.2295989990234375, -1.193878173828125, -1.1581573486328125, -1.1224365234375, -1.0867156982421875, -1.050994873046875, -1.0152740478515625, -0.97955322265625, -0.9438323974609375, -0.908111572265625, -0.8723907470703125, -0.836669921875, -0.8009490966796875, -0.765228271484375, -0.7295074462890625, -0.69378662109375, -0.6580657958984375, -0.622344970703125, -0.5866241455078125, -0.5509033203125, -0.5151824951171875, -0.479461669921875, -0.4437408447265625, -0.40802001953125, -0.3722991943359375, -0.336578369140625, -0.3008575439453125, -0.26513671875, -0.2294158935546875, -0.193695068359375, -0.1579742431640625, -0.12225341796875, -0.0865325927734375, -0.050811767578125, -0.0150909423828125, 0.0206298828125, 0.0563507080078125, 0.092071533203125, 0.1277923583984375, 0.16351318359375, 0.1992340087890625, 0.234954833984375, 0.2706756591796875, 0.306396484375, 0.3421173095703125, 0.377838134765625, 0.4135589599609375, 0.44927978515625, 0.4850006103515625, 0.520721435546875, 0.5564422607421875, 0.5921630859375, 0.6278839111328125, 0.663604736328125, 0.6993255615234375, 0.73504638671875, 0.7707672119140625, 0.806488037109375, 0.8422088623046875, 0.8779296875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 5.0, 5.0, 7.0, 9.0, 17.0, 23.0, 20.0, 24.0, 32.0, 28.0, 27.0, 38.0, 41.0, 34.0, 57.0, 51.0, 47.0, 67.0, 1047.0, 59.0, 48.0, 37.0, 41.0, 36.0, 41.0, 21.0, 34.0, 26.0, 18.0, 17.0, 17.0, 12.0, 9.0, 13.0, 5.0, 4.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.96875, -40.864990234375, -39.76123046875, -38.657470703125, -37.5537109375, -36.449951171875, -35.34619140625, -34.242431640625, -33.138671875, -32.034912109375, -30.93115234375, -29.827392578125, -28.7236328125, -27.619873046875, -26.51611328125, -25.412353515625, -24.30859375, -23.204833984375, -22.10107421875, -20.997314453125, -19.8935546875, -18.789794921875, -17.68603515625, -16.582275390625, -15.478515625, -14.374755859375, -13.27099609375, -12.167236328125, -11.0634765625, -9.959716796875, -8.85595703125, -7.752197265625, -6.6484375, -5.544677734375, -4.44091796875, -3.337158203125, -2.2333984375, -1.129638671875, -0.02587890625, 1.077880859375, 2.181640625, 3.285400390625, 4.38916015625, 5.492919921875, 6.5966796875, 7.700439453125, 8.80419921875, 9.907958984375, 11.01171875, 12.115478515625, 13.21923828125, 14.322998046875, 15.4267578125, 16.530517578125, 17.63427734375, 18.738037109375, 19.841796875, 20.945556640625, 22.04931640625, 23.153076171875, 24.2568359375, 25.360595703125, 26.46435546875, 27.568115234375, 28.671875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [4.0, 6.0, 865.0, 130.0, 10.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.044088363647461, -7.142311096191406, -3.2405333518981934, 0.6612443923950195, 4.563021659851074, 8.464799880981445, 12.3665771484375, 16.268354415893555, 20.17013168334961, 24.071908950805664, 27.97368621826172, 31.875465393066406, 35.77724075317383, 39.679019927978516, 43.58079528808594, 47.482574462890625, 51.38435363769531, 55.2861328125, 59.18790817260742, 63.08968734741211, 66.99146270751953, 70.89324188232422, 74.7950210571289, 78.69679260253906, 82.59857177734375, 86.50035095214844, 90.40213012695312, 94.30390167236328, 98.20568084716797, 102.10746002197266, 106.00923919677734, 109.9110107421875, 113.81279754638672, 117.7145767211914, 121.6163558959961, 125.51812744140625, 129.41990661621094, 133.32168579101562, 137.2234649658203, 141.125244140625, 145.0270233154297, 148.92880249023438, 152.83058166503906, 156.73236083984375, 160.63414001464844, 164.53591918945312, 168.43768310546875, 172.33946228027344, 176.24124145507812, 180.1430206298828, 184.0447998046875, 187.9465789794922, 191.84835815429688, 195.7501220703125, 199.6519012451172, 203.55368041992188, 207.45545959472656, 211.35723876953125, 215.25901794433594, 219.16079711914062, 223.0625762939453, 226.96435546875, 230.86611938476562, 234.7678985595703, 238.669677734375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 5.0, 3.0, 4.0, 4.0, 5.0, 13.0, 5.0, 16.0, 9.0, 6.0, 26.0, 19.0, 18.0, 26.0, 25.0, 30.0, 25.0, 34.0, 21.0, 49.0, 41.0, 37.0, 47.0, 35.0, 37.0, 54.0, 41.0, 34.0, 41.0, 34.0, 32.0, 32.0, 33.0, 26.0, 20.0, 17.0, 15.0, 13.0, 10.0, 26.0, 3.0, 10.0, 7.0, 0.0, 2.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-44.79846954345703, -43.307960510253906, -41.81745529174805, -40.32694625854492, -38.83644104003906, -37.34593200683594, -35.85542297363281, -34.36491775512695, -32.87440872192383, -31.383901596069336, -29.893394470214844, -28.40288543701172, -26.912378311157227, -25.421871185302734, -23.931364059448242, -22.44085693359375, -20.950349807739258, -19.459842681884766, -17.969335556030273, -16.47882843017578, -14.988319396972656, -13.497812271118164, -12.007305145263672, -10.516797065734863, -9.026289939880371, -7.535782337188721, -6.04527473449707, -4.554767608642578, -3.0642600059509277, -1.5737524032592773, -0.08324527740478516, 1.4072628021240234, 2.8977699279785156, 4.388277530670166, 5.878785133361816, 7.369292259216309, 8.859800338745117, 10.35030746459961, 11.840814590454102, 13.33132266998291, 14.821829795837402, 16.31233787536621, 17.802845001220703, 19.293352127075195, 20.783859252929688, 22.274368286132812, 23.764873504638672, 25.255382537841797, 26.74588966369629, 28.23639678955078, 29.726903915405273, 31.217411041259766, 32.70792007446289, 34.19842529296875, 35.688934326171875, 37.179443359375, 38.66994857788086, 40.160457611083984, 41.650962829589844, 43.14147186279297, 44.63197708129883, 46.12248611450195, 47.61299133300781, 49.10350036621094, 50.59400939941406]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 4.0, 3.0, 6.0, 1.0, 13.0, 10.0, 3.0, 2.0, 12.0, 6.0, 13.0, 10.0, 19.0, 15.0, 18.0, 32.0, 33.0, 46.0, 59.0, 113.0, 146.0, 239.0, 949.0, 5480.0, 40906.0, 4125321.0, 14530.0, 4733.0, 843.0, 359.0, 89.0, 68.0, 42.0, 40.0, 21.0, 17.0, 18.0, 25.0, 7.0, 3.0, 6.0, 6.0, 9.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 6.0], "bins": [-0.05975341796875, -0.0581507682800293, -0.056548118591308594, -0.05494546890258789, -0.05334281921386719, -0.051740169525146484, -0.05013751983642578, -0.04853487014770508, -0.046932220458984375, -0.04532957077026367, -0.04372692108154297, -0.042124271392822266, -0.04052162170410156, -0.03891897201538086, -0.037316322326660156, -0.03571367263793945, -0.03411102294921875, -0.03250837326049805, -0.030905723571777344, -0.02930307388305664, -0.027700424194335938, -0.026097774505615234, -0.02449512481689453, -0.022892475128173828, -0.021289825439453125, -0.019687175750732422, -0.01808452606201172, -0.016481876373291016, -0.014879226684570312, -0.01327657699584961, -0.011673927307128906, -0.010071277618408203, -0.0084686279296875, -0.006865978240966797, -0.005263328552246094, -0.0036606788635253906, -0.0020580291748046875, -0.0004553794860839844, 0.0011472702026367188, 0.002749919891357422, 0.004352569580078125, 0.005955219268798828, 0.007557868957519531, 0.009160518646240234, 0.010763168334960938, 0.01236581802368164, 0.013968467712402344, 0.015571117401123047, 0.01717376708984375, 0.018776416778564453, 0.020379066467285156, 0.02198171615600586, 0.023584365844726562, 0.025187015533447266, 0.02678966522216797, 0.028392314910888672, 0.029994964599609375, 0.03159761428833008, 0.03320026397705078, 0.034802913665771484, 0.03640556335449219, 0.03800821304321289, 0.039610862731933594, 0.0412135124206543, 0.042816162109375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 4.0, 3.0, 6.0, 14.0, 5.0, 11.0, 14.0, 22.0, 784.0, 30.0, 16.0, 14.0, 11.0, 2.0, 11.0, 7.0, 4.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.039825439453125, -0.03876519203186035, -0.0377049446105957, -0.036644697189331055, -0.035584449768066406, -0.03452420234680176, -0.03346395492553711, -0.03240370750427246, -0.03134346008300781, -0.030283212661743164, -0.029222965240478516, -0.028162717819213867, -0.02710247039794922, -0.02604222297668457, -0.024981975555419922, -0.023921728134155273, -0.022861480712890625, -0.021801233291625977, -0.020740985870361328, -0.01968073844909668, -0.01862049102783203, -0.017560243606567383, -0.016499996185302734, -0.015439748764038086, -0.014379501342773438, -0.013319253921508789, -0.01225900650024414, -0.011198759078979492, -0.010138511657714844, -0.009078264236450195, -0.008018016815185547, -0.0069577693939208984, -0.00589752197265625, -0.0048372745513916016, -0.003777027130126953, -0.0027167797088623047, -0.0016565322875976562, -0.0005962848663330078, 0.0004639625549316406, 0.001524209976196289, 0.0025844573974609375, 0.003644704818725586, 0.004704952239990234, 0.005765199661254883, 0.006825447082519531, 0.00788569450378418, 0.008945941925048828, 0.010006189346313477, 0.011066436767578125, 0.012126684188842773, 0.013186931610107422, 0.01424717903137207, 0.015307426452636719, 0.016367673873901367, 0.017427921295166016, 0.018488168716430664, 0.019548416137695312, 0.02060866355895996, 0.02166891098022461, 0.022729158401489258, 0.023789405822753906, 0.024849653244018555, 0.025909900665283203, 0.02697014808654785, 0.0280303955078125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 2.0, 6.0, 7.0, 5.0, 17.0, 17.0, 20.0, 57.0, 125.0, 493.0, 3425.0, 4135649.0, 52308.0, 1633.0, 287.0, 92.0, 43.0, 32.0, 15.0, 8.0, 7.0, 5.0, 12.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.206298828125, -0.2000255584716797, -0.19375228881835938, -0.18747901916503906, -0.18120574951171875, -0.17493247985839844, -0.16865921020507812, -0.1623859405517578, -0.1561126708984375, -0.1498394012451172, -0.14356613159179688, -0.13729286193847656, -0.13101959228515625, -0.12474632263183594, -0.11847305297851562, -0.11219978332519531, -0.105926513671875, -0.09965324401855469, -0.09337997436523438, -0.08710670471191406, -0.08083343505859375, -0.07456016540527344, -0.06828689575195312, -0.06201362609863281, -0.0557403564453125, -0.04946708679199219, -0.043193817138671875, -0.03692054748535156, -0.03064727783203125, -0.024374008178710938, -0.018100738525390625, -0.011827468872070312, -0.00555419921875, 0.0007190704345703125, 0.006992340087890625, 0.013265609741210938, 0.01953887939453125, 0.025812149047851562, 0.032085418701171875, 0.03835868835449219, 0.0446319580078125, 0.05090522766113281, 0.057178497314453125, 0.06345176696777344, 0.06972503662109375, 0.07599830627441406, 0.08227157592773438, 0.08854484558105469, 0.094818115234375, 0.10109138488769531, 0.10736465454101562, 0.11363792419433594, 0.11991119384765625, 0.12618446350097656, 0.13245773315429688, 0.1387310028076172, 0.1450042724609375, 0.1512775421142578, 0.15755081176757812, 0.16382408142089844, 0.17009735107421875, 0.17637062072753906, 0.18264389038085938, 0.1889171600341797, 0.1951904296875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 8.0, 9.0, 6.0, 7.0, 16.0, 23.0, 117.0, 2959.0, 783.0, 76.0, 17.0, 7.0, 11.0, 10.0, 3.0, 1.0, 4.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0738525390625, -0.07160663604736328, -0.06936073303222656, -0.06711483001708984, -0.06486892700195312, -0.0626230239868164, -0.06037712097167969, -0.05813121795654297, -0.05588531494140625, -0.05363941192626953, -0.05139350891113281, -0.049147605895996094, -0.046901702880859375, -0.044655799865722656, -0.04240989685058594, -0.04016399383544922, -0.0379180908203125, -0.03567218780517578, -0.03342628479003906, -0.031180381774902344, -0.028934478759765625, -0.026688575744628906, -0.024442672729492188, -0.02219676971435547, -0.01995086669921875, -0.01770496368408203, -0.015459060668945312, -0.013213157653808594, -0.010967254638671875, -0.008721351623535156, -0.0064754486083984375, -0.004229545593261719, -0.001983642578125, 0.00026226043701171875, 0.0025081634521484375, 0.004754066467285156, 0.006999969482421875, 0.009245872497558594, 0.011491775512695312, 0.013737678527832031, 0.01598358154296875, 0.01822948455810547, 0.020475387573242188, 0.022721290588378906, 0.024967193603515625, 0.027213096618652344, 0.029458999633789062, 0.03170490264892578, 0.0339508056640625, 0.03619670867919922, 0.03844261169433594, 0.040688514709472656, 0.042934417724609375, 0.045180320739746094, 0.04742622375488281, 0.04967212677001953, 0.05191802978515625, 0.05416393280029297, 0.05640983581542969, 0.058655738830566406, 0.060901641845703125, 0.06314754486083984, 0.06539344787597656, 0.06763935089111328, 0.06988525390625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 199.0, 813.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10257516801357269, -0.08216091245412827, -0.06174665316939354, -0.041332393884658813, -0.020918138325214386, -0.0005038827657699585, 0.019910380244255066, 0.040324628353118896, 0.06073889136314392, 0.08115314692258835, 0.10156740248203278, 0.1219816654920578, 0.14239591360092163, 0.16281017661094666, 0.18322443962097168, 0.2036386877298355, 0.22405295073986053, 0.24446721374988556, 0.2648814618587494, 0.2852957248687744, 0.30570998787879944, 0.32612425088882446, 0.3465384840965271, 0.3669527471065521, 0.38736701011657715, 0.4077812731266022, 0.4281955361366272, 0.44860976934432983, 0.46902403235435486, 0.4894382953643799, 0.5098525285720825, 0.5302668213844299, 0.5506810545921326, 0.5710952877998352, 0.5915095806121826, 0.6119238138198853, 0.6323381066322327, 0.6527523398399353, 0.6731666326522827, 0.6935808658599854, 0.713995099067688, 0.7344093322753906, 0.754823625087738, 0.7752378582954407, 0.7956521511077881, 0.8160663843154907, 0.8364806175231934, 0.8568949103355408, 0.8773092031478882, 0.8977234363555908, 0.9181377291679382, 0.9385519623756409, 0.9589662551879883, 0.9793804883956909, 0.9997947216033936, 1.0202089548110962, 1.0406231880187988, 1.0610374212265015, 1.081451654434204, 1.1018660068511963, 1.122280240058899, 1.1426944732666016, 1.1631087064743042, 1.1835229396820068, 1.203937292098999]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 3.0, 3.0, 7.0, 7.0, 12.0, 14.0, 13.0, 27.0, 28.0, 45.0, 61.0, 73.0, 98.0, 96.0, 107.0, 77.0, 70.0, 51.0, 54.0, 27.0, 20.0, 19.0, 12.0, 12.0, 5.0, 3.0, 4.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1507476568222046, -0.14573675394058228, -0.14072585105895996, -0.13571494817733765, -0.13070404529571533, -0.12569314241409302, -0.1206822395324707, -0.11567133665084839, -0.11066043376922607, -0.10564953088760376, -0.10063862800598145, -0.09562772512435913, -0.09061682224273682, -0.0856059193611145, -0.08059501647949219, -0.07558411359786987, -0.07057321071624756, -0.06556230783462524, -0.06055140495300293, -0.055540502071380615, -0.0505295991897583, -0.045518696308135986, -0.04050779342651367, -0.03549689054489136, -0.030485987663269043, -0.02547508478164673, -0.020464181900024414, -0.0154532790184021, -0.010442376136779785, -0.005431473255157471, -0.00042057037353515625, 0.004590332508087158, 0.009601235389709473, 0.014612138271331787, 0.0196230411529541, 0.024633944034576416, 0.02964484691619873, 0.034655749797821045, 0.03966665267944336, 0.044677555561065674, 0.04968845844268799, 0.0546993613243103, 0.05971026420593262, 0.06472116708755493, 0.06973206996917725, 0.07474297285079956, 0.07975387573242188, 0.08476477861404419, 0.0897756814956665, 0.09478658437728882, 0.09979748725891113, 0.10480839014053345, 0.10981929302215576, 0.11483019590377808, 0.11984109878540039, 0.1248520016670227, 0.12986290454864502, 0.13487380743026733, 0.13988471031188965, 0.14489561319351196, 0.14990651607513428, 0.1549174189567566, 0.1599283218383789, 0.16493922472000122, 0.16995012760162354]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 7.0, 6.0, 12.0, 22.0, 28.0, 44.0, 41.0, 80.0, 93.0, 167.0, 255.0, 349.0, 504.0, 732.0, 1141.0, 1669.0, 2501.0, 4071.0, 7484.0, 16762.0, 82994.0, 887604.0, 20237.0, 8670.0, 4663.0, 2757.0, 1921.0, 1223.0, 806.0, 532.0, 360.0, 281.0, 171.0, 113.0, 76.0, 63.0, 29.0, 30.0, 20.0, 5.0, 11.0, 6.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052642822265625, -0.05100297927856445, -0.049363136291503906, -0.04772329330444336, -0.04608345031738281, -0.044443607330322266, -0.04280376434326172, -0.04116392135620117, -0.039524078369140625, -0.03788423538208008, -0.03624439239501953, -0.034604549407958984, -0.03296470642089844, -0.03132486343383789, -0.029685020446777344, -0.028045177459716797, -0.02640533447265625, -0.024765491485595703, -0.023125648498535156, -0.02148580551147461, -0.019845962524414062, -0.018206119537353516, -0.01656627655029297, -0.014926433563232422, -0.013286590576171875, -0.011646747589111328, -0.010006904602050781, -0.008367061614990234, -0.0067272186279296875, -0.005087375640869141, -0.0034475326538085938, -0.0018076896667480469, -0.0001678466796875, 0.0014719963073730469, 0.0031118392944335938, 0.004751682281494141, 0.0063915252685546875, 0.008031368255615234, 0.009671211242675781, 0.011311054229736328, 0.012950897216796875, 0.014590740203857422, 0.01623058319091797, 0.017870426177978516, 0.019510269165039062, 0.02115011215209961, 0.022789955139160156, 0.024429798126220703, 0.02606964111328125, 0.027709484100341797, 0.029349327087402344, 0.03098917007446289, 0.03262901306152344, 0.034268856048583984, 0.03590869903564453, 0.03754854202270508, 0.039188385009765625, 0.04082822799682617, 0.04246807098388672, 0.044107913970947266, 0.04574775695800781, 0.04738759994506836, 0.049027442932128906, 0.05066728591918945, 0.05230712890625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 8.0, 12.0, 6.0, 12.0, 14.0, 21.0, 777.0, 34.0, 19.0, 9.0, 16.0, 4.0, 10.0, 5.0, 5.0, 4.0, 3.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.039459228515625, -0.03840994834899902, -0.03736066818237305, -0.03631138801574707, -0.035262107849121094, -0.03421282768249512, -0.03316354751586914, -0.032114267349243164, -0.031064987182617188, -0.03001570701599121, -0.028966426849365234, -0.027917146682739258, -0.02686786651611328, -0.025818586349487305, -0.024769306182861328, -0.02372002601623535, -0.022670745849609375, -0.0216214656829834, -0.020572185516357422, -0.019522905349731445, -0.01847362518310547, -0.017424345016479492, -0.016375064849853516, -0.015325784683227539, -0.014276504516601562, -0.013227224349975586, -0.01217794418334961, -0.011128664016723633, -0.010079383850097656, -0.00903010368347168, -0.007980823516845703, -0.0069315433502197266, -0.00588226318359375, -0.0048329830169677734, -0.003783702850341797, -0.0027344226837158203, -0.0016851425170898438, -0.0006358623504638672, 0.0004134178161621094, 0.001462697982788086, 0.0025119781494140625, 0.003561258316040039, 0.004610538482666016, 0.005659818649291992, 0.006709098815917969, 0.007758378982543945, 0.008807659149169922, 0.009856939315795898, 0.010906219482421875, 0.011955499649047852, 0.013004779815673828, 0.014054059982299805, 0.015103340148925781, 0.016152620315551758, 0.017201900482177734, 0.01825118064880371, 0.019300460815429688, 0.020349740982055664, 0.02139902114868164, 0.022448301315307617, 0.023497581481933594, 0.02454686164855957, 0.025596141815185547, 0.026645421981811523, 0.0276947021484375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 3.0, 5.0, 2.0, 9.0, 12.0, 10.0, 17.0, 21.0, 21.0, 22.0, 24.0, 41.0, 46.0, 77.0, 89.0, 98.0, 137.0, 209.0, 353.0, 725.0, 1782.0, 6859.0, 49689.0, 875778.0, 97874.0, 10133.0, 2392.0, 808.0, 392.0, 242.0, 150.0, 118.0, 81.0, 73.0, 55.0, 35.0, 28.0, 29.0, 19.0, 24.0, 19.0, 6.0, 12.0, 12.0, 1.0, 5.0, 5.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.08428955078125, -0.08162403106689453, -0.07895851135253906, -0.0762929916381836, -0.07362747192382812, -0.07096195220947266, -0.06829643249511719, -0.06563091278076172, -0.06296539306640625, -0.06029987335205078, -0.05763435363769531, -0.054968833923339844, -0.052303314208984375, -0.049637794494628906, -0.04697227478027344, -0.04430675506591797, -0.0416412353515625, -0.03897571563720703, -0.03631019592285156, -0.033644676208496094, -0.030979156494140625, -0.028313636779785156, -0.025648117065429688, -0.02298259735107422, -0.02031707763671875, -0.01765155792236328, -0.014986038208007812, -0.012320518493652344, -0.009654998779296875, -0.006989479064941406, -0.0043239593505859375, -0.0016584396362304688, 0.001007080078125, 0.0036725997924804688, 0.0063381195068359375, 0.009003639221191406, 0.011669158935546875, 0.014334678649902344, 0.017000198364257812, 0.01966571807861328, 0.02233123779296875, 0.02499675750732422, 0.027662277221679688, 0.030327796936035156, 0.032993316650390625, 0.035658836364746094, 0.03832435607910156, 0.04098987579345703, 0.0436553955078125, 0.04632091522216797, 0.04898643493652344, 0.051651954650878906, 0.054317474365234375, 0.056982994079589844, 0.05964851379394531, 0.06231403350830078, 0.06497955322265625, 0.06764507293701172, 0.07031059265136719, 0.07297611236572266, 0.07564163208007812, 0.0783071517944336, 0.08097267150878906, 0.08363819122314453, 0.0863037109375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 3.0, 5.0, 2.0, 8.0, 10.0, 8.0, 11.0, 14.0, 14.0, 12.0, 13.0, 20.0, 21.0, 28.0, 28.0, 28.0, 23.0, 28.0, 33.0, 41.0, 30.0, 37.0, 45.0, 43.0, 39.0, 39.0, 36.0, 24.0, 31.0, 32.0, 37.0, 39.0, 23.0, 31.0, 27.0, 15.0, 14.0, 17.0, 11.0, 17.0, 15.0, 5.0, 10.0, 12.0, 1.0, 5.0, 5.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.11431884765625, -0.1107034683227539, -0.10708808898925781, -0.10347270965576172, -0.09985733032226562, -0.09624195098876953, -0.09262657165527344, -0.08901119232177734, -0.08539581298828125, -0.08178043365478516, -0.07816505432128906, -0.07454967498779297, -0.07093429565429688, -0.06731891632080078, -0.06370353698730469, -0.060088157653808594, -0.0564727783203125, -0.052857398986816406, -0.04924201965332031, -0.04562664031982422, -0.042011260986328125, -0.03839588165283203, -0.03478050231933594, -0.031165122985839844, -0.02754974365234375, -0.023934364318847656, -0.020318984985351562, -0.01670360565185547, -0.013088226318359375, -0.009472846984863281, -0.0058574676513671875, -0.0022420883178710938, 0.001373291015625, 0.004988670349121094, 0.008604049682617188, 0.012219429016113281, 0.015834808349609375, 0.01945018768310547, 0.023065567016601562, 0.026680946350097656, 0.03029632568359375, 0.033911705017089844, 0.03752708435058594, 0.04114246368408203, 0.044757843017578125, 0.04837322235107422, 0.05198860168457031, 0.055603981018066406, 0.0592193603515625, 0.0628347396850586, 0.06645011901855469, 0.07006549835205078, 0.07368087768554688, 0.07729625701904297, 0.08091163635253906, 0.08452701568603516, 0.08814239501953125, 0.09175777435302734, 0.09537315368652344, 0.09898853302001953, 0.10260391235351562, 0.10621929168701172, 0.10983467102050781, 0.1134500503540039, 0.1170654296875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 7.0, 8.0, 11.0, 18.0, 23.0, 38.0, 45.0, 88.0, 128.0, 212.0, 397.0, 657.0, 1463.0, 3299.0, 10731.0, 61425.0, 857913.0, 92147.0, 12658.0, 3900.0, 1633.0, 733.0, 399.0, 215.0, 149.0, 79.0, 48.0, 44.0, 21.0, 16.0, 15.0, 6.0, 4.0, 9.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.100271224975586e-05, -7.865950465202332e-05, -7.631629705429077e-05, -7.397308945655823e-05, -7.162988185882568e-05, -6.928667426109314e-05, -6.69434666633606e-05, -6.460025906562805e-05, -6.225705146789551e-05, -5.9913843870162964e-05, -5.757063627243042e-05, -5.5227428674697876e-05, -5.288422107696533e-05, -5.054101347923279e-05, -4.8197805881500244e-05, -4.58545982837677e-05, -4.3511390686035156e-05, -4.116818308830261e-05, -3.882497549057007e-05, -3.6481767892837524e-05, -3.413856029510498e-05, -3.1795352697372437e-05, -2.9452145099639893e-05, -2.710893750190735e-05, -2.4765729904174805e-05, -2.242252230644226e-05, -2.0079314708709717e-05, -1.7736107110977173e-05, -1.539289951324463e-05, -1.3049691915512085e-05, -1.0706484317779541e-05, -8.363276720046997e-06, -6.020069122314453e-06, -3.676861524581909e-06, -1.3336539268493652e-06, 1.0095536708831787e-06, 3.3527612686157227e-06, 5.695968866348267e-06, 8.03917646408081e-06, 1.0382384061813354e-05, 1.2725591659545898e-05, 1.5068799257278442e-05, 1.7412006855010986e-05, 1.975521445274353e-05, 2.2098422050476074e-05, 2.4441629648208618e-05, 2.6784837245941162e-05, 2.9128044843673706e-05, 3.147125244140625e-05, 3.3814460039138794e-05, 3.615766763687134e-05, 3.850087523460388e-05, 4.0844082832336426e-05, 4.318729043006897e-05, 4.5530498027801514e-05, 4.787370562553406e-05, 5.02169132232666e-05, 5.2560120820999146e-05, 5.490332841873169e-05, 5.7246536016464233e-05, 5.958974361419678e-05, 6.193295121192932e-05, 6.427615880966187e-05, 6.661936640739441e-05, 6.896257400512695e-05]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 9.0, 4.0, 2.0, 5.0, 3.0, 11.0, 11.0, 9.0, 9.0, 13.0, 12.0, 38.0, 15.0, 27.0, 19.0, 19.0, 55.0, 29.0, 22.0, 31.0, 34.0, 86.0, 40.0, 34.0, 38.0, 28.0, 19.0, 63.0, 27.0, 32.0, 33.0, 29.0, 53.0, 14.0, 15.0, 20.0, 19.0, 18.0, 9.0, 8.0, 6.0, 7.0, 4.0, 12.0, 3.0, 8.0, 1.0, 2.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.0265579223632812e-06, -1.955777406692505e-06, -1.8849968910217285e-06, -1.8142163753509521e-06, -1.7434358596801758e-06, -1.6726553440093994e-06, -1.601874828338623e-06, -1.5310943126678467e-06, -1.4603137969970703e-06, -1.389533281326294e-06, -1.3187527656555176e-06, -1.2479722499847412e-06, -1.1771917343139648e-06, -1.1064112186431885e-06, -1.0356307029724121e-06, -9.648501873016357e-07, -8.940696716308594e-07, -8.23289155960083e-07, -7.525086402893066e-07, -6.817281246185303e-07, -6.109476089477539e-07, -5.401670932769775e-07, -4.6938657760620117e-07, -3.986060619354248e-07, -3.2782554626464844e-07, -2.5704503059387207e-07, -1.862645149230957e-07, -1.1548399925231934e-07, -4.470348358154297e-08, 2.60770320892334e-08, 9.685754776000977e-08, 1.6763806343078613e-07, 2.384185791015625e-07, 3.0919909477233887e-07, 3.7997961044311523e-07, 4.507601261138916e-07, 5.21540641784668e-07, 5.923211574554443e-07, 6.631016731262207e-07, 7.338821887969971e-07, 8.046627044677734e-07, 8.754432201385498e-07, 9.462237358093262e-07, 1.0170042514801025e-06, 1.087784767150879e-06, 1.1585652828216553e-06, 1.2293457984924316e-06, 1.300126314163208e-06, 1.3709068298339844e-06, 1.4416873455047607e-06, 1.5124678611755371e-06, 1.5832483768463135e-06, 1.6540288925170898e-06, 1.7248094081878662e-06, 1.7955899238586426e-06, 1.866370439529419e-06, 1.9371509552001953e-06, 2.0079314708709717e-06, 2.078711986541748e-06, 2.1494925022125244e-06, 2.2202730178833008e-06, 2.291053533554077e-06, 2.3618340492248535e-06, 2.43261456489563e-06, 2.5033950805664062e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 10.0, 14.0, 17.0, 15.0, 36.0, 36.0, 60.0, 120.0, 197.0, 340.0, 971.0, 3924.0, 81564.0, 944430.0, 13864.0, 1800.0, 493.0, 238.0, 150.0, 73.0, 58.0, 38.0, 34.0, 16.0, 13.0, 5.0, 7.0, 6.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.967782974243164e-05, -6.721261888742447e-05, -6.47474080324173e-05, -6.228219717741013e-05, -5.9816986322402954e-05, -5.735177546739578e-05, -5.488656461238861e-05, -5.242135375738144e-05, -4.995614290237427e-05, -4.7490932047367096e-05, -4.5025721192359924e-05, -4.256051033735275e-05, -4.009529948234558e-05, -3.763008862733841e-05, -3.516487777233124e-05, -3.2699666917324066e-05, -3.0234456062316895e-05, -2.7769245207309723e-05, -2.530403435230255e-05, -2.283882349729538e-05, -2.0373612642288208e-05, -1.7908401787281036e-05, -1.5443190932273865e-05, -1.2977980077266693e-05, -1.0512769222259521e-05, -8.04755836725235e-06, -5.582347512245178e-06, -3.1171366572380066e-06, -6.51925802230835e-07, 1.8132850527763367e-06, 4.278495907783508e-06, 6.74370676279068e-06, 9.208917617797852e-06, 1.1674128472805023e-05, 1.4139339327812195e-05, 1.6604550182819366e-05, 1.9069761037826538e-05, 2.153497189283371e-05, 2.400018274784088e-05, 2.6465393602848053e-05, 2.8930604457855225e-05, 3.1395815312862396e-05, 3.386102616786957e-05, 3.632623702287674e-05, 3.879144787788391e-05, 4.125665873289108e-05, 4.3721869587898254e-05, 4.6187080442905426e-05, 4.86522912979126e-05, 5.111750215291977e-05, 5.358271300792694e-05, 5.604792386293411e-05, 5.8513134717941284e-05, 6.0978345572948456e-05, 6.344355642795563e-05, 6.59087672829628e-05, 6.837397813796997e-05, 7.083918899297714e-05, 7.330439984798431e-05, 7.576961070299149e-05, 7.823482155799866e-05, 8.070003241300583e-05, 8.3165243268013e-05, 8.563045412302017e-05, 8.809566497802734e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 5.0, 9.0, 11.0, 9.0, 25.0, 18.0, 22.0, 46.0, 42.0, 54.0, 69.0, 76.0, 83.0, 74.0, 69.0, 81.0, 49.0, 45.0, 63.0, 27.0, 31.0, 20.0, 25.0, 9.0, 13.0, 4.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.429454803466797e-05, -9.09566879272461e-05, -8.761882781982422e-05, -8.428096771240234e-05, -8.094310760498047e-05, -7.76052474975586e-05, -7.426738739013672e-05, -7.092952728271484e-05, -6.759166717529297e-05, -6.42538070678711e-05, -6.091594696044922e-05, -5.7578086853027344e-05, -5.424022674560547e-05, -5.0902366638183594e-05, -4.756450653076172e-05, -4.4226646423339844e-05, -4.088878631591797e-05, -3.7550926208496094e-05, -3.421306610107422e-05, -3.0875205993652344e-05, -2.753734588623047e-05, -2.4199485778808594e-05, -2.086162567138672e-05, -1.7523765563964844e-05, -1.4185905456542969e-05, -1.0848045349121094e-05, -7.510185241699219e-06, -4.172325134277344e-06, -8.344650268554688e-07, 2.5033950805664062e-06, 5.841255187988281e-06, 9.179115295410156e-06, 1.2516975402832031e-05, 1.5854835510253906e-05, 1.919269561767578e-05, 2.2530555725097656e-05, 2.586841583251953e-05, 2.9206275939941406e-05, 3.254413604736328e-05, 3.5881996154785156e-05, 3.921985626220703e-05, 4.2557716369628906e-05, 4.589557647705078e-05, 4.9233436584472656e-05, 5.257129669189453e-05, 5.5909156799316406e-05, 5.924701690673828e-05, 6.258487701416016e-05, 6.592273712158203e-05, 6.92605972290039e-05, 7.259845733642578e-05, 7.593631744384766e-05, 7.927417755126953e-05, 8.26120376586914e-05, 8.594989776611328e-05, 8.928775787353516e-05, 9.262561798095703e-05, 9.59634780883789e-05, 9.930133819580078e-05, 0.00010263919830322266, 0.00010597705841064453, 0.0001093149185180664, 0.00011265277862548828, 0.00011599063873291016, 0.00011932849884033203]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 9.0, 992.0, 17.0, 2.0, 1.0], "bins": [-11.061187744140625, -10.87851619720459, -10.695844650268555, -10.51317310333252, -10.330501556396484, -10.147829055786133, -9.965157508850098, -9.782485961914062, -9.599814414978027, -9.417142868041992, -9.234471321105957, -9.051799774169922, -8.869128227233887, -8.686455726623535, -8.5037841796875, -8.321112632751465, -8.13844108581543, -7.9557695388793945, -7.773097991943359, -7.590425968170166, -7.407754421234131, -7.225082874298096, -7.0424113273620605, -6.859739303588867, -6.67706823348999, -6.494396686553955, -6.31172513961792, -6.129053115844727, -5.946381568908691, -5.763710021972656, -5.581038475036621, -5.398366928100586, -5.215694904327393, -5.033023357391357, -4.850351810455322, -4.667679786682129, -4.485008239746094, -4.302336692810059, -4.119665145874023, -3.936993360519409, -3.754321813583374, -3.571650266647339, -3.3889784812927246, -3.2063069343566895, -3.023635149002075, -2.84096360206604, -2.658291816711426, -2.4756202697753906, -2.2929487228393555, -2.1102771759033203, -1.927605390548706, -1.744933843612671, -1.5622620582580566, -1.3795905113220215, -1.1969188451766968, -1.014247179031372, -0.8315754532814026, -0.6489037871360779, -0.46623215079307556, -0.28356051445007324, -0.10088884830474854, 0.08178281784057617, 0.2644544243812561, 0.4471260905265808, 0.6297977566719055]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 6.0, 6.0, 5.0, 2.0, 7.0, 8.0, 15.0, 9.0, 29.0, 40.0, 59.0, 101.0, 146.0, 190.0, 134.0, 69.0, 48.0, 39.0, 13.0, 4.0, 14.0, 7.0, 5.0, 4.0, 4.0, 11.0, 4.0, 4.0, 4.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9148207902908325, -1.8361753225326538, -1.757529854774475, -1.6788843870162964, -1.6002390384674072, -1.5215935707092285, -1.4429481029510498, -1.364302635192871, -1.2856571674346924, -1.2070116996765137, -1.128366231918335, -1.0497207641601562, -0.9710753560066223, -0.8924298882484436, -0.8137844800949097, -0.735139012336731, -0.6564935445785522, -0.5778480768203735, -0.4992026388645172, -0.4205572009086609, -0.3419117331504822, -0.26326626539230347, -0.18462082743644714, -0.10597538948059082, -0.02732992172241211, 0.05131553113460541, 0.12996098399162292, 0.20860643684864044, 0.28725188970565796, 0.36589735746383667, 0.444542795419693, 0.5231882333755493, 0.6018338203430176, 0.6804792881011963, 0.759124755859375, 0.8377701640129089, 0.9164156317710876, 0.9950610995292664, 1.0737065076828003, 1.152351975440979, 1.2309974431991577, 1.3096429109573364, 1.3882883787155151, 1.4669338464736938, 1.545579195022583, 1.6242246627807617, 1.7028701305389404, 1.7815155982971191, 1.8601610660552979, 1.9388065338134766, 2.0174520015716553, 2.096097469329834, 2.1747429370880127, 2.2533884048461914, 2.33203387260437, 2.410679340362549, 2.4893245697021484, 2.567970037460327, 2.646615505218506, 2.7252609729766846, 2.8039064407348633, 2.882551908493042, 2.9611973762512207, 3.0398426055908203, 3.118488311767578]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 6.0, 9.0, 14.0, 16.0, 32.0, 62.0, 130.0, 387.0, 1254.0, 5322.0, 4175431.0, 9771.0, 1300.0, 306.0, 101.0, 41.0, 23.0, 14.0, 14.0, 6.0, 6.0, 4.0, 5.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.61669921875, -0.5998649597167969, -0.5830307006835938, -0.5661964416503906, -0.5493621826171875, -0.5325279235839844, -0.5156936645507812, -0.4988594055175781, -0.482025146484375, -0.4651908874511719, -0.44835662841796875, -0.4315223693847656, -0.4146881103515625, -0.3978538513183594, -0.38101959228515625, -0.3641853332519531, -0.34735107421875, -0.3305168151855469, -0.31368255615234375, -0.2968482971191406, -0.2800140380859375, -0.2631797790527344, -0.24634552001953125, -0.22951126098632812, -0.212677001953125, -0.19584274291992188, -0.17900848388671875, -0.16217422485351562, -0.1453399658203125, -0.12850570678710938, -0.11167144775390625, -0.09483718872070312, -0.0780029296875, -0.061168670654296875, -0.04433441162109375, -0.027500152587890625, -0.0106658935546875, 0.006168365478515625, 0.02300262451171875, 0.039836883544921875, 0.056671142578125, 0.07350540161132812, 0.09033966064453125, 0.10717391967773438, 0.1240081787109375, 0.14084243774414062, 0.15767669677734375, 0.17451095581054688, 0.19134521484375, 0.20817947387695312, 0.22501373291015625, 0.24184799194335938, 0.2586822509765625, 0.2755165100097656, 0.29235076904296875, 0.3091850280761719, 0.326019287109375, 0.3428535461425781, 0.35968780517578125, 0.3765220642089844, 0.3933563232421875, 0.4101905822753906, 0.42702484130859375, 0.4438591003417969, 0.460693359375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 2.0, 4.0, 5.0, 3.0, 6.0, 11.0, 17.0, 11.0, 15.0, 15.0, 649.0, 151.0, 18.0, 10.0, 13.0, 10.0, 5.0, 6.0, 8.0, 7.0, 3.0, 3.0, 5.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0313720703125, -0.030516386032104492, -0.029660701751708984, -0.028805017471313477, -0.02794933319091797, -0.02709364891052246, -0.026237964630126953, -0.025382280349731445, -0.024526596069335938, -0.02367091178894043, -0.022815227508544922, -0.021959543228149414, -0.021103858947753906, -0.0202481746673584, -0.01939249038696289, -0.018536806106567383, -0.017681121826171875, -0.016825437545776367, -0.01596975326538086, -0.015114068984985352, -0.014258384704589844, -0.013402700424194336, -0.012547016143798828, -0.01169133186340332, -0.010835647583007812, -0.009979963302612305, -0.009124279022216797, -0.008268594741821289, -0.007412910461425781, -0.0065572261810302734, -0.005701541900634766, -0.004845857620239258, -0.00399017333984375, -0.003134489059448242, -0.0022788047790527344, -0.0014231204986572266, -0.0005674362182617188, 0.00028824806213378906, 0.0011439323425292969, 0.0019996166229248047, 0.0028553009033203125, 0.0037109851837158203, 0.004566669464111328, 0.005422353744506836, 0.006278038024902344, 0.0071337223052978516, 0.00798940658569336, 0.008845090866088867, 0.009700775146484375, 0.010556459426879883, 0.01141214370727539, 0.012267827987670898, 0.013123512268066406, 0.013979196548461914, 0.014834880828857422, 0.01569056510925293, 0.016546249389648438, 0.017401933670043945, 0.018257617950439453, 0.01911330223083496, 0.01996898651123047, 0.020824670791625977, 0.021680355072021484, 0.022536039352416992, 0.0233917236328125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 3.0, 6.0, 4.0, 6.0, 8.0, 12.0, 16.0, 10.0, 15.0, 24.0, 26.0, 45.0, 40.0, 72.0, 123.0, 246.0, 635.0, 2255.0, 14783.0, 4102724.0, 65823.0, 5350.0, 1143.0, 372.0, 181.0, 96.0, 57.0, 36.0, 35.0, 23.0, 26.0, 19.0, 12.0, 7.0, 9.0, 7.0, 3.0, 8.0, 5.0, 2.0, 3.0, 2.0, 0.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.265869140625, -0.25722503662109375, -0.2485809326171875, -0.23993682861328125, -0.231292724609375, -0.22264862060546875, -0.2140045166015625, -0.20536041259765625, -0.19671630859375, -0.18807220458984375, -0.1794281005859375, -0.17078399658203125, -0.162139892578125, -0.15349578857421875, -0.1448516845703125, -0.13620758056640625, -0.1275634765625, -0.11891937255859375, -0.1102752685546875, -0.10163116455078125, -0.092987060546875, -0.08434295654296875, -0.0756988525390625, -0.06705474853515625, -0.05841064453125, -0.04976654052734375, -0.0411224365234375, -0.03247833251953125, -0.023834228515625, -0.01519012451171875, -0.0065460205078125, 0.00209808349609375, 0.0107421875, 0.01938629150390625, 0.0280303955078125, 0.03667449951171875, 0.045318603515625, 0.05396270751953125, 0.0626068115234375, 0.07125091552734375, 0.07989501953125, 0.08853912353515625, 0.0971832275390625, 0.10582733154296875, 0.114471435546875, 0.12311553955078125, 0.1317596435546875, 0.14040374755859375, 0.1490478515625, 0.15769195556640625, 0.1663360595703125, 0.17498016357421875, 0.183624267578125, 0.19226837158203125, 0.2009124755859375, 0.20955657958984375, 0.21820068359375, 0.22684478759765625, 0.2354888916015625, 0.24413299560546875, 0.252777099609375, 0.26142120361328125, 0.2700653076171875, 0.27870941162109375, 0.287353515625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 6.0, 2.0, 3.0, 6.0, 7.0, 8.0, 5.0, 9.0, 11.0, 9.0, 11.0, 10.0, 11.0, 13.0, 19.0, 21.0, 28.0, 33.0, 3615.0, 40.0, 21.0, 30.0, 22.0, 21.0, 14.0, 8.0, 15.0, 11.0, 8.0, 15.0, 8.0, 7.0, 4.0, 2.0, 7.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.039306640625, -0.038028717041015625, -0.03675079345703125, -0.035472869873046875, -0.0341949462890625, -0.032917022705078125, -0.03163909912109375, -0.030361175537109375, -0.029083251953125, -0.027805328369140625, -0.02652740478515625, -0.025249481201171875, -0.0239715576171875, -0.022693634033203125, -0.02141571044921875, -0.020137786865234375, -0.01885986328125, -0.017581939697265625, -0.01630401611328125, -0.015026092529296875, -0.0137481689453125, -0.012470245361328125, -0.01119232177734375, -0.009914398193359375, -0.008636474609375, -0.007358551025390625, -0.00608062744140625, -0.004802703857421875, -0.0035247802734375, -0.002246856689453125, -0.00096893310546875, 0.000308990478515625, 0.0015869140625, 0.002864837646484375, 0.00414276123046875, 0.005420684814453125, 0.0066986083984375, 0.007976531982421875, 0.00925445556640625, 0.010532379150390625, 0.011810302734375, 0.013088226318359375, 0.01436614990234375, 0.015644073486328125, 0.0169219970703125, 0.018199920654296875, 0.01947784423828125, 0.020755767822265625, 0.02203369140625, 0.023311614990234375, 0.02458953857421875, 0.025867462158203125, 0.0271453857421875, 0.028423309326171875, 0.02970123291015625, 0.030979156494140625, 0.032257080078125, 0.033535003662109375, 0.03481292724609375, 0.036090850830078125, 0.0373687744140625, 0.038646697998046875, 0.03992462158203125, 0.041202545166015625, 0.04248046875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 25.0, 901.0, 79.0, 10.0, 3.0], "bins": [-0.5195388793945312, -0.5109933018684387, -0.5024476647377014, -0.4939020872116089, -0.48535650968551636, -0.47681090235710144, -0.4682652950286865, -0.459719717502594, -0.4511741101741791, -0.44262850284576416, -0.43408292531967163, -0.4255373179912567, -0.4169917106628418, -0.40844613313674927, -0.39990052580833435, -0.3913549482822418, -0.3828093409538269, -0.374263733625412, -0.36571815609931946, -0.35717254877090454, -0.348626971244812, -0.3400813639163971, -0.3315357565879822, -0.32299017906188965, -0.31444457173347473, -0.3058989644050598, -0.2973533868789673, -0.28880777955055237, -0.28026217222213745, -0.2717165946960449, -0.26317098736763, -0.2546254098415375, -0.24607977271080017, -0.23753418028354645, -0.22898858785629272, -0.2204429805278778, -0.21189738810062408, -0.20335179567337036, -0.19480618834495544, -0.18626059591770172, -0.177715003490448, -0.16916941106319427, -0.16062381863594055, -0.15207821130752563, -0.1435326188802719, -0.1349870264530182, -0.12644141912460327, -0.11789582669734955, -0.10935023427009583, -0.1008046418428421, -0.09225904196500778, -0.08371344208717346, -0.07516784965991974, -0.06662225723266602, -0.058076657354831696, -0.049531061202287674, -0.04098546504974365, -0.03243986889719963, -0.02389427274465561, -0.015348676592111588, -0.006803080439567566, 0.0017425157129764557, 0.010288111865520477, 0.0188337080180645, 0.02737930417060852]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 2.0, 4.0, 1.0, 3.0, 8.0, 7.0, 6.0, 24.0, 20.0, 24.0, 59.0, 107.0, 146.0, 167.0, 157.0, 95.0, 59.0, 28.0, 20.0, 8.0, 10.0, 6.0, 5.0, 5.0, 6.0, 5.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2094680666923523, -0.20156686007976532, -0.19366565346717834, -0.18576443195343018, -0.1778632253408432, -0.16996201872825623, -0.16206081211566925, -0.15415960550308228, -0.1462583839893341, -0.13835717737674713, -0.13045597076416016, -0.12255475670099258, -0.11465354263782501, -0.10675233602523804, -0.09885112941265106, -0.09094992280006409, -0.08304871618747711, -0.07514750957489014, -0.06724629551172256, -0.05934508889913559, -0.051443878561258316, -0.04354266822338104, -0.03564146161079407, -0.027740251272916794, -0.01983904093503952, -0.011937831528484821, -0.004036622121930122, 0.003864586353302002, 0.011765796691179276, 0.01966700702905655, 0.027568213641643524, 0.0354694239795208, 0.04337063431739807, 0.051271844655275345, 0.05917305499315262, 0.0670742616057396, 0.07497547566890717, 0.08287668228149414, 0.09077788889408112, 0.09867909550666809, 0.10658030956983566, 0.11448151618242264, 0.12238273024559021, 0.13028393685817719, 0.13818514347076416, 0.14608636498451233, 0.1539875566959381, 0.16188877820968628, 0.16978998482227325, 0.17769119143486023, 0.1855923980474472, 0.19349360466003418, 0.20139482617378235, 0.20929603278636932, 0.2171972393989563, 0.22509844601154327, 0.23299965262413025, 0.24090085923671722, 0.2488020658493042, 0.25670328736305237, 0.26460447907447815, 0.2725057005882263, 0.2804068922996521, 0.28830811381340027, 0.29620933532714844]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 11.0, 8.0, 17.0, 10.0, 21.0, 28.0, 53.0, 55.0, 71.0, 102.0, 163.0, 222.0, 321.0, 427.0, 633.0, 920.0, 1329.0, 1959.0, 3185.0, 5099.0, 9826.0, 22235.0, 806959.0, 152364.0, 19653.0, 8843.0, 4976.0, 2878.0, 1910.0, 1322.0, 855.0, 638.0, 412.0, 293.0, 211.0, 151.0, 103.0, 72.0, 46.0, 47.0, 36.0, 25.0, 17.0, 13.0, 11.0, 11.0, 6.0, 2.0, 4.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.07537841796875, -0.07294178009033203, -0.07050514221191406, -0.0680685043334961, -0.06563186645507812, -0.06319522857666016, -0.06075859069824219, -0.05832195281982422, -0.05588531494140625, -0.05344867706298828, -0.05101203918457031, -0.048575401306152344, -0.046138763427734375, -0.043702125549316406, -0.04126548767089844, -0.03882884979248047, -0.0363922119140625, -0.03395557403564453, -0.03151893615722656, -0.029082298278808594, -0.026645660400390625, -0.024209022521972656, -0.021772384643554688, -0.01933574676513672, -0.01689910888671875, -0.014462471008300781, -0.012025833129882812, -0.009589195251464844, -0.007152557373046875, -0.004715919494628906, -0.0022792816162109375, 0.00015735626220703125, 0.002593994140625, 0.005030632019042969, 0.0074672698974609375, 0.009903907775878906, 0.012340545654296875, 0.014777183532714844, 0.017213821411132812, 0.01965045928955078, 0.02208709716796875, 0.02452373504638672, 0.026960372924804688, 0.029397010803222656, 0.031833648681640625, 0.034270286560058594, 0.03670692443847656, 0.03914356231689453, 0.0415802001953125, 0.04401683807373047, 0.04645347595214844, 0.048890113830566406, 0.051326751708984375, 0.053763389587402344, 0.05620002746582031, 0.05863666534423828, 0.06107330322265625, 0.06350994110107422, 0.06594657897949219, 0.06838321685791016, 0.07081985473632812, 0.0732564926147461, 0.07569313049316406, 0.07812976837158203, 0.08056640625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 5.0, 11.0, 15.0, 16.0, 11.0, 13.0, 112.0, 674.0, 29.0, 17.0, 6.0, 11.0, 6.0, 4.0, 11.0, 8.0, 5.0, 2.0, 6.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0281524658203125, -0.027372121810913086, -0.026591777801513672, -0.025811433792114258, -0.025031089782714844, -0.02425074577331543, -0.023470401763916016, -0.0226900577545166, -0.021909713745117188, -0.021129369735717773, -0.02034902572631836, -0.019568681716918945, -0.01878833770751953, -0.018007993698120117, -0.017227649688720703, -0.01644730567932129, -0.015666961669921875, -0.014886617660522461, -0.014106273651123047, -0.013325929641723633, -0.012545585632324219, -0.011765241622924805, -0.01098489761352539, -0.010204553604125977, -0.009424209594726562, -0.008643865585327148, -0.007863521575927734, -0.00708317756652832, -0.006302833557128906, -0.005522489547729492, -0.004742145538330078, -0.003961801528930664, -0.00318145751953125, -0.002401113510131836, -0.0016207695007324219, -0.0008404254913330078, -6.008148193359375e-05, 0.0007202625274658203, 0.0015006065368652344, 0.0022809505462646484, 0.0030612945556640625, 0.0038416385650634766, 0.004621982574462891, 0.005402326583862305, 0.006182670593261719, 0.006963014602661133, 0.007743358612060547, 0.008523702621459961, 0.009304046630859375, 0.010084390640258789, 0.010864734649658203, 0.011645078659057617, 0.012425422668457031, 0.013205766677856445, 0.01398611068725586, 0.014766454696655273, 0.015546798706054688, 0.0163271427154541, 0.017107486724853516, 0.01788783073425293, 0.018668174743652344, 0.019448518753051758, 0.020228862762451172, 0.021009206771850586, 0.02178955078125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 4.0, 4.0, 3.0, 6.0, 9.0, 14.0, 16.0, 29.0, 18.0, 37.0, 34.0, 39.0, 54.0, 79.0, 87.0, 111.0, 155.0, 170.0, 285.0, 633.0, 2936.0, 147910.0, 887293.0, 6462.0, 888.0, 334.0, 230.0, 152.0, 108.0, 93.0, 90.0, 55.0, 47.0, 43.0, 30.0, 18.0, 24.0, 12.0, 15.0, 8.0, 6.0, 4.0, 2.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.18115234375, -0.17584991455078125, -0.1705474853515625, -0.16524505615234375, -0.159942626953125, -0.15464019775390625, -0.1493377685546875, -0.14403533935546875, -0.13873291015625, -0.13343048095703125, -0.1281280517578125, -0.12282562255859375, -0.117523193359375, -0.11222076416015625, -0.1069183349609375, -0.10161590576171875, -0.0963134765625, -0.09101104736328125, -0.0857086181640625, -0.08040618896484375, -0.075103759765625, -0.06980133056640625, -0.0644989013671875, -0.05919647216796875, -0.05389404296875, -0.04859161376953125, -0.0432891845703125, -0.03798675537109375, -0.032684326171875, -0.02738189697265625, -0.0220794677734375, -0.01677703857421875, -0.011474609375, -0.00617218017578125, -0.0008697509765625, 0.00443267822265625, 0.009735107421875, 0.01503753662109375, 0.0203399658203125, 0.02564239501953125, 0.03094482421875, 0.03624725341796875, 0.0415496826171875, 0.04685211181640625, 0.052154541015625, 0.05745697021484375, 0.0627593994140625, 0.06806182861328125, 0.0733642578125, 0.07866668701171875, 0.0839691162109375, 0.08927154541015625, 0.094573974609375, 0.09987640380859375, 0.1051788330078125, 0.11048126220703125, 0.11578369140625, 0.12108612060546875, 0.1263885498046875, 0.13169097900390625, 0.136993408203125, 0.14229583740234375, 0.1475982666015625, 0.15290069580078125, 0.158203125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 0.0, 4.0, 4.0, 2.0, 4.0, 8.0, 14.0, 10.0, 20.0, 15.0, 25.0, 21.0, 21.0, 20.0, 28.0, 27.0, 30.0, 40.0, 31.0, 45.0, 40.0, 53.0, 50.0, 43.0, 40.0, 49.0, 44.0, 45.0, 33.0, 32.0, 21.0, 37.0, 18.0, 22.0, 17.0, 17.0, 15.0, 16.0, 9.0, 10.0, 7.0, 5.0, 4.0, 0.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.08526611328125, -0.08277225494384766, -0.08027839660644531, -0.07778453826904297, -0.07529067993164062, -0.07279682159423828, -0.07030296325683594, -0.0678091049194336, -0.06531524658203125, -0.0628213882446289, -0.06032752990722656, -0.05783367156982422, -0.055339813232421875, -0.05284595489501953, -0.05035209655761719, -0.047858238220214844, -0.0453643798828125, -0.042870521545410156, -0.04037666320800781, -0.03788280487060547, -0.035388946533203125, -0.03289508819580078, -0.030401229858398438, -0.027907371520996094, -0.02541351318359375, -0.022919654846191406, -0.020425796508789062, -0.01793193817138672, -0.015438079833984375, -0.012944221496582031, -0.010450363159179688, -0.007956504821777344, -0.005462646484375, -0.0029687881469726562, -0.0004749298095703125, 0.0020189285278320312, 0.004512786865234375, 0.007006645202636719, 0.009500503540039062, 0.011994361877441406, 0.01448822021484375, 0.016982078552246094, 0.019475936889648438, 0.02196979522705078, 0.024463653564453125, 0.02695751190185547, 0.029451370239257812, 0.031945228576660156, 0.0344390869140625, 0.036932945251464844, 0.03942680358886719, 0.04192066192626953, 0.044414520263671875, 0.04690837860107422, 0.04940223693847656, 0.051896095275878906, 0.05438995361328125, 0.056883811950683594, 0.05937767028808594, 0.06187152862548828, 0.06436538696289062, 0.06685924530029297, 0.06935310363769531, 0.07184696197509766, 0.0743408203125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 3.0, 5.0, 6.0, 11.0, 24.0, 23.0, 42.0, 64.0, 119.0, 260.0, 495.0, 1342.0, 5193.0, 63765.0, 953984.0, 18498.0, 2913.0, 986.0, 383.0, 183.0, 97.0, 67.0, 40.0, 18.0, 11.0, 2.0, 7.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002181529998779297, -0.00021095573902130127, -0.00020375847816467285, -0.00019656121730804443, -0.00018936395645141602, -0.0001821666955947876, -0.00017496943473815918, -0.00016777217388153076, -0.00016057491302490234, -0.00015337765216827393, -0.0001461803913116455, -0.0001389831304550171, -0.00013178586959838867, -0.00012458860874176025, -0.00011739134788513184, -0.00011019408702850342, -0.000102996826171875, -9.579956531524658e-05, -8.860230445861816e-05, -8.140504360198975e-05, -7.420778274536133e-05, -6.701052188873291e-05, -5.981326103210449e-05, -5.2616000175476074e-05, -4.5418739318847656e-05, -3.822147846221924e-05, -3.102421760559082e-05, -2.3826956748962402e-05, -1.6629695892333984e-05, -9.432435035705566e-06, -2.2351741790771484e-06, 4.9620866775512695e-06, 1.2159347534179688e-05, 1.9356608390808105e-05, 2.6553869247436523e-05, 3.375113010406494e-05, 4.094839096069336e-05, 4.814565181732178e-05, 5.5342912673950195e-05, 6.254017353057861e-05, 6.973743438720703e-05, 7.693469524383545e-05, 8.413195610046387e-05, 9.132921695709229e-05, 9.85264778137207e-05, 0.00010572373867034912, 0.00011292099952697754, 0.00012011826038360596, 0.00012731552124023438, 0.0001345127820968628, 0.0001417100429534912, 0.00014890730381011963, 0.00015610456466674805, 0.00016330182552337646, 0.00017049908638000488, 0.0001776963472366333, 0.00018489360809326172, 0.00019209086894989014, 0.00019928812980651855, 0.00020648539066314697, 0.0002136826515197754, 0.0002208799123764038, 0.00022807717323303223, 0.00023527443408966064, 0.00024247169494628906]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 7.0, 3.0, 16.0, 25.0, 37.0, 52.0, 71.0, 105.0, 92.0, 131.0, 91.0, 114.0, 55.0, 67.0, 36.0, 45.0, 24.0, 16.0, 10.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.331371307373047e-06, -7.119961082935333e-06, -6.90855085849762e-06, -6.697140634059906e-06, -6.485730409622192e-06, -6.274320185184479e-06, -6.062909960746765e-06, -5.8514997363090515e-06, -5.640089511871338e-06, -5.428679287433624e-06, -5.217269062995911e-06, -5.005858838558197e-06, -4.794448614120483e-06, -4.58303838968277e-06, -4.371628165245056e-06, -4.1602179408073425e-06, -3.948807716369629e-06, -3.7373974919319153e-06, -3.5259872674942017e-06, -3.314577043056488e-06, -3.1031668186187744e-06, -2.891756594181061e-06, -2.680346369743347e-06, -2.4689361453056335e-06, -2.25752592086792e-06, -2.0461156964302063e-06, -1.8347054719924927e-06, -1.623295247554779e-06, -1.4118850231170654e-06, -1.2004747986793518e-06, -9.890645742416382e-07, -7.776543498039246e-07, -5.662441253662109e-07, -3.548339009284973e-07, -1.434236764907837e-07, 6.798654794692993e-08, 2.7939677238464355e-07, 4.908069968223572e-07, 7.022172212600708e-07, 9.136274456977844e-07, 1.125037670135498e-06, 1.3364478945732117e-06, 1.5478581190109253e-06, 1.759268343448639e-06, 1.9706785678863525e-06, 2.182088792324066e-06, 2.3934990167617798e-06, 2.6049092411994934e-06, 2.816319465637207e-06, 3.0277296900749207e-06, 3.2391399145126343e-06, 3.450550138950348e-06, 3.6619603633880615e-06, 3.873370587825775e-06, 4.084780812263489e-06, 4.296191036701202e-06, 4.507601261138916e-06, 4.71901148557663e-06, 4.930421710014343e-06, 5.141831934452057e-06, 5.3532421588897705e-06, 5.564652383327484e-06, 5.776062607765198e-06, 5.987472832202911e-06, 6.198883056640625e-06]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 4.0, 5.0, 9.0, 14.0, 19.0, 17.0, 23.0, 39.0, 41.0, 84.0, 102.0, 173.0, 285.0, 627.0, 4735.0, 1010626.0, 29736.0, 1038.0, 350.0, 191.0, 131.0, 85.0, 64.0, 40.0, 43.0, 18.0, 10.0, 15.0, 8.0, 8.0, 3.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001894235610961914, -0.00018282420933246613, -0.00017622485756874084, -0.00016962550580501556, -0.00016302615404129028, -0.000156426802277565, -0.00014982745051383972, -0.00014322809875011444, -0.00013662874698638916, -0.00013002939522266388, -0.0001234300434589386, -0.00011683069169521332, -0.00011023133993148804, -0.00010363198816776276, -9.703263640403748e-05, -9.04332846403122e-05, -8.383393287658691e-05, -7.723458111286163e-05, -7.063522934913635e-05, -6.403587758541107e-05, -5.743652582168579e-05, -5.083717405796051e-05, -4.423782229423523e-05, -3.763847053050995e-05, -3.103911876678467e-05, -2.4439767003059387e-05, -1.7840415239334106e-05, -1.1241063475608826e-05, -4.641711711883545e-06, 1.957640051841736e-06, 8.556991815567017e-06, 1.5156343579292297e-05, 2.1755695343017578e-05, 2.835504710674286e-05, 3.495439887046814e-05, 4.155375063419342e-05, 4.81531023979187e-05, 5.475245416164398e-05, 6.135180592536926e-05, 6.795115768909454e-05, 7.455050945281982e-05, 8.11498612165451e-05, 8.774921298027039e-05, 9.434856474399567e-05, 0.00010094791650772095, 0.00010754726827144623, 0.00011414662003517151, 0.00012074597179889679, 0.00012734532356262207, 0.00013394467532634735, 0.00014054402709007263, 0.0001471433788537979, 0.0001537427306175232, 0.00016034208238124847, 0.00016694143414497375, 0.00017354078590869904, 0.00018014013767242432, 0.0001867394894361496, 0.00019333884119987488, 0.00019993819296360016, 0.00020653754472732544, 0.00021313689649105072, 0.000219736248254776, 0.00022633560001850128, 0.00023293495178222656]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 4.0, 3.0, 4.0, 7.0, 10.0, 14.0, 11.0, 11.0, 19.0, 22.0, 32.0, 45.0, 53.0, 63.0, 82.0, 68.0, 83.0, 86.0, 63.0, 74.0, 51.0, 41.0, 41.0, 34.0, 14.0, 26.0, 11.0, 6.0, 9.0, 6.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.916854858398438e-05, -8.606258779764175e-05, -8.295662701129913e-05, -7.985066622495651e-05, -7.674470543861389e-05, -7.363874465227127e-05, -7.053278386592865e-05, -6.742682307958603e-05, -6.432086229324341e-05, -6.121490150690079e-05, -5.8108940720558167e-05, -5.5002979934215546e-05, -5.1897019147872925e-05, -4.8791058361530304e-05, -4.568509757518768e-05, -4.257913678884506e-05, -3.947317600250244e-05, -3.636721521615982e-05, -3.32612544298172e-05, -3.015529364347458e-05, -2.7049332857131958e-05, -2.3943372070789337e-05, -2.0837411284446716e-05, -1.7731450498104095e-05, -1.4625489711761475e-05, -1.1519528925418854e-05, -8.413568139076233e-06, -5.307607352733612e-06, -2.201646566390991e-06, 9.043142199516296e-07, 4.0102750062942505e-06, 7.116235792636871e-06, 1.0222196578979492e-05, 1.3328157365322113e-05, 1.6434118151664734e-05, 1.9540078938007355e-05, 2.2646039724349976e-05, 2.5752000510692596e-05, 2.8857961297035217e-05, 3.196392208337784e-05, 3.506988286972046e-05, 3.817584365606308e-05, 4.12818044424057e-05, 4.438776522874832e-05, 4.749372601509094e-05, 5.059968680143356e-05, 5.3705647587776184e-05, 5.6811608374118805e-05, 5.9917569160461426e-05, 6.302352994680405e-05, 6.612949073314667e-05, 6.923545151948929e-05, 7.234141230583191e-05, 7.544737309217453e-05, 7.855333387851715e-05, 8.165929466485977e-05, 8.476525545120239e-05, 8.787121623754501e-05, 9.097717702388763e-05, 9.408313781023026e-05, 9.718909859657288e-05, 0.0001002950593829155, 0.00010340102016925812, 0.00010650698095560074, 0.00010961294174194336]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 36.0, 967.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22593055665493011, -0.1744968444108963, -0.12306312471628189, -0.07162940502166748, -0.020195692777633667, 0.03123803436756134, 0.08267174661159515, 0.13410545885562897, 0.18553917109966278, 0.2369728833436966, 0.2884066104888916, 0.3398403227329254, 0.39127403497695923, 0.44270777702331543, 0.49414145946502686, 0.5455752015113831, 0.5970088839530945, 0.6484426259994507, 0.6998763084411621, 0.7513100504875183, 0.8027437329292297, 0.8541774749755859, 0.9056111574172974, 0.9570448994636536, 1.0084786415100098, 1.0599123239517212, 1.1113461256027222, 1.1627798080444336, 1.214213490486145, 1.2656471729278564, 1.3170809745788574, 1.3685146570205688, 1.4199484586715698, 1.4713821411132812, 1.5228159427642822, 1.5742496252059937, 1.625683307647705, 1.677117109298706, 1.7285507917404175, 1.779984474182129, 1.8314181566238403, 1.8828518390655518, 1.9342856407165527, 1.9857193231582642, 2.0371530055999756, 2.0885868072509766, 2.1400203704833984, 2.1914541721343994, 2.2428879737854004, 2.2943217754364014, 2.3457553386688232, 2.397189140319824, 2.448622941970825, 2.500056505203247, 2.551490306854248, 2.60292387008667, 2.654357671737671, 2.705791473388672, 2.7572250366210938, 2.8086588382720947, 2.8600926399230957, 2.9115262031555176, 2.9629600048065186, 3.0143938064575195, 3.0658273696899414]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 0.0, 0.0, 6.0, 13.0, 12.0, 6.0, 8.0, 15.0, 22.0, 32.0, 33.0, 53.0, 56.0, 60.0, 78.0, 70.0, 83.0, 71.0, 55.0, 70.0, 50.0, 53.0, 36.0, 33.0, 12.0, 12.0, 12.0, 4.0, 6.0, 6.0, 2.0, 1.0, 5.0, 2.0, 0.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.7773054242134094, -0.7545614838600159, -0.7318175435066223, -0.7090736031532288, -0.6863296031951904, -0.6635856628417969, -0.6408417224884033, -0.6180977821350098, -0.5953538417816162, -0.5726099014282227, -0.5498659610748291, -0.5271220207214355, -0.504378080368042, -0.48163411021232605, -0.4588901400566101, -0.43614619970321655, -0.413402259349823, -0.39065831899642944, -0.3679143786430359, -0.34517040848731995, -0.3224264681339264, -0.29968252778053284, -0.2769385576248169, -0.25419461727142334, -0.23145067691802979, -0.20870673656463623, -0.18596278131008148, -0.16321882605552673, -0.14047488570213318, -0.11773093789815903, -0.09498699009418488, -0.07224303483963013, -0.0494990348815918, -0.026755087077617645, -0.004011139273643494, 0.018732808530330658, 0.04147675633430481, 0.06422070413827896, 0.08696465194225311, 0.10970860719680786, 0.13245254755020142, 0.15519648790359497, 0.17794044315814972, 0.20068439841270447, 0.22342833876609802, 0.24617227911949158, 0.2689162492752075, 0.2916601896286011, 0.31440412998199463, 0.3371480703353882, 0.35989201068878174, 0.3826359808444977, 0.40537992119789124, 0.4281238615512848, 0.45086783170700073, 0.4736117720603943, 0.49635571241378784, 0.5190996527671814, 0.541843593120575, 0.5645875334739685, 0.5873315334320068, 0.6100754737854004, 0.632819414138794, 0.6555633544921875, 0.678307294845581]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 5.0, 3.0, 7.0, 14.0, 11.0, 15.0, 31.0, 34.0, 63.0, 84.0, 139.0, 228.0, 397.0, 669.0, 1349.0, 2939.0, 8716.0, 4119184.0, 51205.0, 5617.0, 1867.0, 794.0, 389.0, 213.0, 103.0, 70.0, 51.0, 18.0, 20.0, 9.0, 10.0, 6.0, 5.0, 1.0, 4.0, 0.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.264404296875, -0.25702667236328125, -0.2496490478515625, -0.24227142333984375, -0.234893798828125, -0.22751617431640625, -0.2201385498046875, -0.21276092529296875, -0.20538330078125, -0.19800567626953125, -0.1906280517578125, -0.18325042724609375, -0.175872802734375, -0.16849517822265625, -0.1611175537109375, -0.15373992919921875, -0.1463623046875, -0.13898468017578125, -0.1316070556640625, -0.12422943115234375, -0.116851806640625, -0.10947418212890625, -0.1020965576171875, -0.09471893310546875, -0.08734130859375, -0.07996368408203125, -0.0725860595703125, -0.06520843505859375, -0.057830810546875, -0.05045318603515625, -0.0430755615234375, -0.03569793701171875, -0.0283203125, -0.02094268798828125, -0.0135650634765625, -0.00618743896484375, 0.001190185546875, 0.00856781005859375, 0.0159454345703125, 0.02332305908203125, 0.03070068359375, 0.03807830810546875, 0.0454559326171875, 0.05283355712890625, 0.060211181640625, 0.06758880615234375, 0.0749664306640625, 0.08234405517578125, 0.0897216796875, 0.09709930419921875, 0.1044769287109375, 0.11185455322265625, 0.119232177734375, 0.12660980224609375, 0.1339874267578125, 0.14136505126953125, 0.14874267578125, 0.15612030029296875, 0.1634979248046875, 0.17087554931640625, 0.178253173828125, 0.18563079833984375, 0.1930084228515625, 0.20038604736328125, 0.207763671875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 3.0, 2.0, 3.0, 6.0, 10.0, 17.0, 14.0, 16.0, 9.0, 272.0, 509.0, 29.0, 18.0, 9.0, 12.0, 4.0, 9.0, 8.0, 9.0, 2.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0264892578125, -0.02575230598449707, -0.02501535415649414, -0.02427840232849121, -0.02354145050048828, -0.02280449867248535, -0.022067546844482422, -0.021330595016479492, -0.020593643188476562, -0.019856691360473633, -0.019119739532470703, -0.018382787704467773, -0.017645835876464844, -0.016908884048461914, -0.016171932220458984, -0.015434980392456055, -0.014698028564453125, -0.013961076736450195, -0.013224124908447266, -0.012487173080444336, -0.011750221252441406, -0.011013269424438477, -0.010276317596435547, -0.009539365768432617, -0.008802413940429688, -0.008065462112426758, -0.007328510284423828, -0.0065915584564208984, -0.005854606628417969, -0.005117654800415039, -0.004380702972412109, -0.0036437511444091797, -0.00290679931640625, -0.0021698474884033203, -0.0014328956604003906, -0.0006959438323974609, 4.100799560546875e-05, 0.0007779598236083984, 0.0015149116516113281, 0.002251863479614258, 0.0029888153076171875, 0.003725767135620117, 0.004462718963623047, 0.0051996707916259766, 0.005936622619628906, 0.006673574447631836, 0.007410526275634766, 0.008147478103637695, 0.008884429931640625, 0.009621381759643555, 0.010358333587646484, 0.011095285415649414, 0.011832237243652344, 0.012569189071655273, 0.013306140899658203, 0.014043092727661133, 0.014780044555664062, 0.015516996383666992, 0.016253948211669922, 0.01699090003967285, 0.01772785186767578, 0.01846480369567871, 0.01920175552368164, 0.01993870735168457, 0.0206756591796875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 14.0, 10.0, 7.0, 18.0, 38.0, 54.0, 86.0, 123.0, 324.0, 1283.0, 115543.0, 4074336.0, 1686.0, 372.0, 127.0, 90.0, 62.0, 29.0, 22.0, 14.0, 11.0, 7.0, 6.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.65576171875, -0.6365127563476562, -0.6172637939453125, -0.5980148315429688, -0.578765869140625, -0.5595169067382812, -0.5402679443359375, -0.5210189819335938, -0.50177001953125, -0.48252105712890625, -0.4632720947265625, -0.44402313232421875, -0.424774169921875, -0.40552520751953125, -0.3862762451171875, -0.36702728271484375, -0.3477783203125, -0.32852935791015625, -0.3092803955078125, -0.29003143310546875, -0.270782470703125, -0.25153350830078125, -0.2322845458984375, -0.21303558349609375, -0.19378662109375, -0.17453765869140625, -0.1552886962890625, -0.13603973388671875, -0.116790771484375, -0.09754180908203125, -0.0782928466796875, -0.05904388427734375, -0.039794921875, -0.02054595947265625, -0.0012969970703125, 0.01795196533203125, 0.037200927734375, 0.05644989013671875, 0.0756988525390625, 0.09494781494140625, 0.11419677734375, 0.13344573974609375, 0.1526947021484375, 0.17194366455078125, 0.191192626953125, 0.21044158935546875, 0.2296905517578125, 0.24893951416015625, 0.2681884765625, 0.28743743896484375, 0.3066864013671875, 0.32593536376953125, 0.345184326171875, 0.36443328857421875, 0.3836822509765625, 0.40293121337890625, 0.42218017578125, 0.44142913818359375, 0.4606781005859375, 0.47992706298828125, 0.499176025390625, 0.5184249877929688, 0.5376739501953125, 0.5569229125976562, 0.576171875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 3.0, 7.0, 9.0, 17.0, 23.0, 23.0, 21.0, 51.0, 85.0, 132.0, 3050.0, 316.0, 101.0, 65.0, 37.0, 37.0, 25.0, 17.0, 8.0, 12.0, 8.0, 4.0, 2.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.10040283203125, -0.09794187545776367, -0.09548091888427734, -0.09301996231079102, -0.09055900573730469, -0.08809804916381836, -0.08563709259033203, -0.0831761360168457, -0.08071517944335938, -0.07825422286987305, -0.07579326629638672, -0.07333230972290039, -0.07087135314941406, -0.06841039657592773, -0.0659494400024414, -0.06348848342895508, -0.06102752685546875, -0.05856657028198242, -0.056105613708496094, -0.053644657135009766, -0.05118370056152344, -0.04872274398803711, -0.04626178741455078, -0.04380083084106445, -0.041339874267578125, -0.0388789176940918, -0.03641796112060547, -0.03395700454711914, -0.03149604797363281, -0.029035091400146484, -0.026574134826660156, -0.024113178253173828, -0.0216522216796875, -0.019191265106201172, -0.016730308532714844, -0.014269351959228516, -0.011808395385742188, -0.00934743881225586, -0.006886482238769531, -0.004425525665283203, -0.001964569091796875, 0.0004963874816894531, 0.0029573440551757812, 0.005418300628662109, 0.007879257202148438, 0.010340213775634766, 0.012801170349121094, 0.015262126922607422, 0.01772308349609375, 0.020184040069580078, 0.022644996643066406, 0.025105953216552734, 0.027566909790039062, 0.03002786636352539, 0.03248882293701172, 0.03494977951049805, 0.037410736083984375, 0.0398716926574707, 0.04233264923095703, 0.04479360580444336, 0.04725456237792969, 0.049715518951416016, 0.052176475524902344, 0.05463743209838867, 0.057098388671875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 5.0, 6.0, 29.0, 90.0, 610.0, 205.0, 36.0, 12.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1501970887184143, -0.14717577397823334, -0.14415445923805237, -0.1411331295967102, -0.13811181485652924, -0.13509050011634827, -0.1320691853761673, -0.12904787063598633, -0.12602655589580536, -0.12300524115562439, -0.11998391896486282, -0.11696260422468185, -0.11394128948450089, -0.11091996729373932, -0.10789865255355835, -0.10487733781337738, -0.10185600817203522, -0.09883469343185425, -0.09581337124109268, -0.09279205650091171, -0.08977074176073074, -0.08674941956996918, -0.08372810482978821, -0.08070679008960724, -0.07768547534942627, -0.0746641606092453, -0.07164283841848373, -0.06862152367830276, -0.0656002089381218, -0.06257888674736023, -0.05955757200717926, -0.05653625354170799, -0.053514935076236725, -0.05049361661076546, -0.04747230187058449, -0.04445098340511322, -0.04142966493964195, -0.038408346474170685, -0.035387031733989716, -0.03236571326851845, -0.02934439666569233, -0.02632308006286621, -0.023301761597394943, -0.020280444994568825, -0.017259128391742706, -0.014237809926271439, -0.01121649332344532, -0.008195174857974052, -0.005173858255147934, -0.0021525409538298845, 0.0008687763474881649, 0.0038900934159755707, 0.006911410950124264, 0.009932728484272957, 0.012954045087099075, 0.015975363552570343, 0.01899668015539646, 0.02201799675822258, 0.025039315223693848, 0.028060631826519966, 0.031081948429346085, 0.03410326689481735, 0.03712458163499832, 0.04014590382575989, 0.04316721856594086]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 2.0, 4.0, 4.0, 2.0, 4.0, 5.0, 7.0, 9.0, 21.0, 35.0, 43.0, 81.0, 83.0, 112.0, 112.0, 113.0, 84.0, 81.0, 68.0, 38.0, 29.0, 18.0, 7.0, 7.0, 7.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.28254222869873047, -0.2722442150115967, -0.2619462013244629, -0.2516481876373291, -0.2413501888513565, -0.23105217516422272, -0.22075417637825012, -0.21045616269111633, -0.20015814900398254, -0.18986013531684875, -0.17956212162971497, -0.16926412284374237, -0.15896610915660858, -0.1486680954694748, -0.1383700966835022, -0.1280720829963684, -0.11777406930923462, -0.10747605562210083, -0.09717804938554764, -0.08688004314899445, -0.07658202946186066, -0.06628401577472687, -0.055986009538173676, -0.04568800330162048, -0.035389989614486694, -0.025091979652643204, -0.014793969690799713, -0.0044959597289562225, 0.005802050232887268, 0.01610006019473076, 0.02639807015657425, 0.03669607639312744, 0.04699409008026123, 0.05729210004210472, 0.06759011000394821, 0.0778881162405014, 0.08818612992763519, 0.09848414361476898, 0.10878214985132217, 0.11908015608787537, 0.12937816977500916, 0.13967618346214294, 0.14997419714927673, 0.16027219593524933, 0.17057020962238312, 0.1808682233095169, 0.1911662220954895, 0.2014642357826233, 0.21176224946975708, 0.22206026315689087, 0.23235827684402466, 0.24265627562999725, 0.25295430421829224, 0.26325228810310364, 0.2735503017902374, 0.2838483154773712, 0.294146329164505, 0.3044443428516388, 0.3147423565387726, 0.32504037022590637, 0.3353383541107178, 0.34563636779785156, 0.35593438148498535, 0.36623239517211914, 0.37653040885925293]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 8.0, 3.0, 15.0, 12.0, 10.0, 23.0, 25.0, 27.0, 34.0, 54.0, 63.0, 84.0, 104.0, 141.0, 151.0, 228.0, 292.0, 381.0, 537.0, 742.0, 1141.0, 1592.0, 2605.0, 4664.0, 8837.0, 20527.0, 805958.0, 162476.0, 18022.0, 7606.0, 4170.0, 2543.0, 1638.0, 1072.0, 762.0, 506.0, 369.0, 279.0, 226.0, 148.0, 122.0, 76.0, 70.0, 63.0, 39.0, 29.0, 16.0, 13.0, 12.0, 15.0, 5.0, 10.0, 6.0, 5.0, 4.0, 4.0, 0.0, 2.0], "bins": [-0.06182861328125, -0.059950828552246094, -0.05807304382324219, -0.05619525909423828, -0.054317474365234375, -0.05243968963623047, -0.05056190490722656, -0.048684120178222656, -0.04680633544921875, -0.044928550720214844, -0.04305076599121094, -0.04117298126220703, -0.039295196533203125, -0.03741741180419922, -0.03553962707519531, -0.033661842346191406, -0.0317840576171875, -0.029906272888183594, -0.028028488159179688, -0.02615070343017578, -0.024272918701171875, -0.02239513397216797, -0.020517349243164062, -0.018639564514160156, -0.01676177978515625, -0.014883995056152344, -0.013006210327148438, -0.011128425598144531, -0.009250640869140625, -0.007372856140136719, -0.0054950714111328125, -0.0036172866821289062, -0.001739501953125, 0.00013828277587890625, 0.0020160675048828125, 0.0038938522338867188, 0.005771636962890625, 0.007649421691894531, 0.009527206420898438, 0.011404991149902344, 0.01328277587890625, 0.015160560607910156, 0.017038345336914062, 0.01891613006591797, 0.020793914794921875, 0.02267169952392578, 0.024549484252929688, 0.026427268981933594, 0.0283050537109375, 0.030182838439941406, 0.03206062316894531, 0.03393840789794922, 0.035816192626953125, 0.03769397735595703, 0.03957176208496094, 0.041449546813964844, 0.04332733154296875, 0.045205116271972656, 0.04708290100097656, 0.04896068572998047, 0.050838470458984375, 0.05271625518798828, 0.05459403991699219, 0.056471824645996094, 0.058349609375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 4.0, 4.0, 2.0, 4.0, 2.0, 7.0, 10.0, 16.0, 14.0, 13.0, 7.0, 103.0, 620.0, 82.0, 24.0, 13.0, 8.0, 8.0, 4.0, 12.0, 7.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0231781005859375, -0.022502422332763672, -0.021826744079589844, -0.021151065826416016, -0.020475387573242188, -0.01979970932006836, -0.01912403106689453, -0.018448352813720703, -0.017772674560546875, -0.017096996307373047, -0.01642131805419922, -0.01574563980102539, -0.015069961547851562, -0.014394283294677734, -0.013718605041503906, -0.013042926788330078, -0.01236724853515625, -0.011691570281982422, -0.011015892028808594, -0.010340213775634766, -0.009664535522460938, -0.00898885726928711, -0.008313179016113281, -0.007637500762939453, -0.006961822509765625, -0.006286144256591797, -0.005610466003417969, -0.004934787750244141, -0.0042591094970703125, -0.0035834312438964844, -0.0029077529907226562, -0.002232074737548828, -0.001556396484375, -0.0008807182312011719, -0.00020503997802734375, 0.0004706382751464844, 0.0011463165283203125, 0.0018219947814941406, 0.0024976730346679688, 0.003173351287841797, 0.003849029541015625, 0.004524707794189453, 0.005200386047363281, 0.005876064300537109, 0.0065517425537109375, 0.007227420806884766, 0.007903099060058594, 0.008578777313232422, 0.00925445556640625, 0.009930133819580078, 0.010605812072753906, 0.011281490325927734, 0.011957168579101562, 0.01263284683227539, 0.013308525085449219, 0.013984203338623047, 0.014659881591796875, 0.015335559844970703, 0.01601123809814453, 0.01668691635131836, 0.017362594604492188, 0.018038272857666016, 0.018713951110839844, 0.019389629364013672, 0.0200653076171875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 5.0, 5.0, 9.0, 12.0, 16.0, 24.0, 22.0, 36.0, 40.0, 42.0, 60.0, 81.0, 86.0, 110.0, 125.0, 188.0, 234.0, 516.0, 2499.0, 256256.0, 782890.0, 3481.0, 593.0, 296.0, 208.0, 140.0, 114.0, 89.0, 86.0, 54.0, 50.0, 36.0, 33.0, 27.0, 18.0, 11.0, 19.0, 9.0, 13.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16162109375, -0.15586090087890625, -0.1501007080078125, -0.14434051513671875, -0.138580322265625, -0.13282012939453125, -0.1270599365234375, -0.12129974365234375, -0.11553955078125, -0.10977935791015625, -0.1040191650390625, -0.09825897216796875, -0.092498779296875, -0.08673858642578125, -0.0809783935546875, -0.07521820068359375, -0.0694580078125, -0.06369781494140625, -0.0579376220703125, -0.05217742919921875, -0.046417236328125, -0.04065704345703125, -0.0348968505859375, -0.02913665771484375, -0.02337646484375, -0.01761627197265625, -0.0118560791015625, -0.00609588623046875, -0.000335693359375, 0.00542449951171875, 0.0111846923828125, 0.01694488525390625, 0.022705078125, 0.02846527099609375, 0.0342254638671875, 0.03998565673828125, 0.045745849609375, 0.05150604248046875, 0.0572662353515625, 0.06302642822265625, 0.06878662109375, 0.07454681396484375, 0.0803070068359375, 0.08606719970703125, 0.091827392578125, 0.09758758544921875, 0.1033477783203125, 0.10910797119140625, 0.1148681640625, 0.12062835693359375, 0.1263885498046875, 0.13214874267578125, 0.137908935546875, 0.14366912841796875, 0.1494293212890625, 0.15518951416015625, 0.16094970703125, 0.16670989990234375, 0.1724700927734375, 0.17823028564453125, 0.183990478515625, 0.18975067138671875, 0.1955108642578125, 0.20127105712890625, 0.20703125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 3.0, 4.0, 3.0, 9.0, 11.0, 16.0, 10.0, 19.0, 25.0, 14.0, 26.0, 29.0, 27.0, 37.0, 29.0, 36.0, 34.0, 55.0, 43.0, 52.0, 39.0, 43.0, 46.0, 43.0, 50.0, 42.0, 42.0, 34.0, 30.0, 20.0, 18.0, 17.0, 19.0, 16.0, 9.0, 5.0, 13.0, 6.0, 10.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0538330078125, -0.05191230773925781, -0.049991607666015625, -0.04807090759277344, -0.04615020751953125, -0.04422950744628906, -0.042308807373046875, -0.04038810729980469, -0.0384674072265625, -0.03654670715332031, -0.034626007080078125, -0.03270530700683594, -0.03078460693359375, -0.028863906860351562, -0.026943206787109375, -0.025022506713867188, -0.023101806640625, -0.021181106567382812, -0.019260406494140625, -0.017339706420898438, -0.01541900634765625, -0.013498306274414062, -0.011577606201171875, -0.009656906127929688, -0.0077362060546875, -0.0058155059814453125, -0.003894805908203125, -0.0019741058349609375, -5.340576171875e-05, 0.0018672943115234375, 0.003787994384765625, 0.0057086944580078125, 0.00762939453125, 0.009550094604492188, 0.011470794677734375, 0.013391494750976562, 0.01531219482421875, 0.017232894897460938, 0.019153594970703125, 0.021074295043945312, 0.0229949951171875, 0.024915695190429688, 0.026836395263671875, 0.028757095336914062, 0.03067779541015625, 0.03259849548339844, 0.034519195556640625, 0.03643989562988281, 0.038360595703125, 0.04028129577636719, 0.042201995849609375, 0.04412269592285156, 0.04604339599609375, 0.04796409606933594, 0.049884796142578125, 0.05180549621582031, 0.0537261962890625, 0.05564689636230469, 0.057567596435546875, 0.05948829650878906, 0.06140899658203125, 0.06332969665527344, 0.06525039672851562, 0.06717109680175781, 0.069091796875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 4.0, 8.0, 22.0, 21.0, 40.0, 61.0, 74.0, 159.0, 262.0, 446.0, 986.0, 2383.0, 10972.0, 313018.0, 701596.0, 13679.0, 2581.0, 1025.0, 511.0, 262.0, 159.0, 107.0, 54.0, 44.0, 25.0, 11.0, 16.0, 4.0, 7.0, 0.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002498626708984375, -0.00024273432791233063, -0.00023560598492622375, -0.00022847764194011688, -0.00022134929895401, -0.00021422095596790314, -0.00020709261298179626, -0.0001999642699956894, -0.00019283592700958252, -0.00018570758402347565, -0.00017857924103736877, -0.0001714508980512619, -0.00016432255506515503, -0.00015719421207904816, -0.00015006586909294128, -0.0001429375261068344, -0.00013580918312072754, -0.00012868084013462067, -0.0001215524971485138, -0.00011442415416240692, -0.00010729581117630005, -0.00010016746819019318, -9.30391252040863e-05, -8.591078221797943e-05, -7.878243923187256e-05, -7.165409624576569e-05, -6.452575325965881e-05, -5.739741027355194e-05, -5.026906728744507e-05, -4.3140724301338196e-05, -3.601238131523132e-05, -2.888403832912445e-05, -2.1755695343017578e-05, -1.4627352356910706e-05, -7.499009370803833e-06, -3.7066638469696045e-07, 6.757676601409912e-06, 1.3886019587516785e-05, 2.1014362573623657e-05, 2.814270555973053e-05, 3.52710485458374e-05, 4.2399391531944275e-05, 4.952773451805115e-05, 5.665607750415802e-05, 6.378442049026489e-05, 7.091276347637177e-05, 7.804110646247864e-05, 8.516944944858551e-05, 9.229779243469238e-05, 9.942613542079926e-05, 0.00010655447840690613, 0.000113682821393013, 0.00012081116437911987, 0.00012793950736522675, 0.00013506785035133362, 0.0001421961933374405, 0.00014932453632354736, 0.00015645287930965424, 0.0001635812222957611, 0.00017070956528186798, 0.00017783790826797485, 0.00018496625125408173, 0.0001920945942401886, 0.00019922293722629547, 0.00020635128021240234]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 8.0, 4.0, 6.0, 4.0, 11.0, 8.0, 22.0, 18.0, 22.0, 40.0, 38.0, 62.0, 51.0, 75.0, 93.0, 78.0, 70.0, 80.0, 80.0, 46.0, 47.0, 28.0, 23.0, 27.0, 13.0, 18.0, 11.0, 7.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.092952728271484e-06, -6.86105340719223e-06, -6.629154086112976e-06, -6.397254765033722e-06, -6.165355443954468e-06, -5.933456122875214e-06, -5.7015568017959595e-06, -5.469657480716705e-06, -5.237758159637451e-06, -5.005858838558197e-06, -4.773959517478943e-06, -4.542060196399689e-06, -4.3101608753204346e-06, -4.07826155424118e-06, -3.846362233161926e-06, -3.614462912082672e-06, -3.382563591003418e-06, -3.150664269924164e-06, -2.9187649488449097e-06, -2.6868656277656555e-06, -2.4549663066864014e-06, -2.2230669856071472e-06, -1.991167664527893e-06, -1.759268343448639e-06, -1.5273690223693848e-06, -1.2954697012901306e-06, -1.0635703802108765e-06, -8.316710591316223e-07, -5.997717380523682e-07, -3.67872416973114e-07, -1.3597309589385986e-07, 9.592622518539429e-08, 3.2782554626464844e-07, 5.597248673439026e-07, 7.916241884231567e-07, 1.0235235095024109e-06, 1.255422830581665e-06, 1.4873221516609192e-06, 1.7192214727401733e-06, 1.9511207938194275e-06, 2.1830201148986816e-06, 2.414919435977936e-06, 2.64681875705719e-06, 2.878718078136444e-06, 3.1106173992156982e-06, 3.3425167202949524e-06, 3.5744160413742065e-06, 3.8063153624534607e-06, 4.038214683532715e-06, 4.270114004611969e-06, 4.502013325691223e-06, 4.733912646770477e-06, 4.9658119678497314e-06, 5.197711288928986e-06, 5.42961061000824e-06, 5.661509931087494e-06, 5.893409252166748e-06, 6.125308573246002e-06, 6.357207894325256e-06, 6.5891072154045105e-06, 6.821006536483765e-06, 7.052905857563019e-06, 7.284805178642273e-06, 7.516704499721527e-06, 7.748603820800781e-06]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 13.0, 10.0, 11.0, 17.0, 24.0, 34.0, 40.0, 76.0, 92.0, 134.0, 212.0, 372.0, 1125.0, 69410.0, 973671.0, 2114.0, 449.0, 244.0, 139.0, 99.0, 61.0, 51.0, 33.0, 30.0, 13.0, 20.0, 12.0, 8.0, 7.0, 3.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0004417896270751953, -0.00042956694960594177, -0.00041734427213668823, -0.0004051215946674347, -0.00039289891719818115, -0.0003806762397289276, -0.00036845356225967407, -0.00035623088479042053, -0.000344008207321167, -0.00033178552985191345, -0.0003195628523826599, -0.00030734017491340637, -0.00029511749744415283, -0.0002828948199748993, -0.00027067214250564575, -0.0002584494650363922, -0.00024622678756713867, -0.00023400411009788513, -0.0002217814326286316, -0.00020955875515937805, -0.0001973360776901245, -0.00018511340022087097, -0.00017289072275161743, -0.0001606680452823639, -0.00014844536781311035, -0.0001362226903438568, -0.00012400001287460327, -0.00011177733540534973, -9.955465793609619e-05, -8.733198046684265e-05, -7.510930299758911e-05, -6.288662552833557e-05, -5.066394805908203e-05, -3.844127058982849e-05, -2.621859312057495e-05, -1.3995915651321411e-05, -1.773238182067871e-06, 1.0449439287185669e-05, 2.267211675643921e-05, 3.489479422569275e-05, 4.711747169494629e-05, 5.934014916419983e-05, 7.156282663345337e-05, 8.378550410270691e-05, 9.600818157196045e-05, 0.00010823085904121399, 0.00012045353651046753, 0.00013267621397972107, 0.0001448988914489746, 0.00015712156891822815, 0.0001693442463874817, 0.00018156692385673523, 0.00019378960132598877, 0.0002060122787952423, 0.00021823495626449585, 0.0002304576337337494, 0.00024268031120300293, 0.00025490298867225647, 0.00026712566614151, 0.00027934834361076355, 0.0002915710210800171, 0.00030379369854927063, 0.00031601637601852417, 0.0003282390534877777, 0.00034046173095703125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 7.0, 4.0, 5.0, 14.0, 14.0, 16.0, 18.0, 34.0, 31.0, 55.0, 63.0, 60.0, 89.0, 80.0, 90.0, 85.0, 64.0, 64.0, 51.0, 36.0, 20.0, 19.0, 19.0, 17.0, 5.0, 13.0, 5.0, 6.0, 3.0, 0.0, 1.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00014710426330566406, -0.0001430325210094452, -0.00013896077871322632, -0.00013488903641700745, -0.00013081729412078857, -0.0001267455518245697, -0.00012267380952835083, -0.00011860206723213196, -0.00011453032493591309, -0.00011045858263969421, -0.00010638684034347534, -0.00010231509804725647, -9.82433557510376e-05, -9.417161345481873e-05, -9.009987115859985e-05, -8.602812886238098e-05, -8.195638656616211e-05, -7.788464426994324e-05, -7.381290197372437e-05, -6.974115967750549e-05, -6.566941738128662e-05, -6.159767508506775e-05, -5.752593278884888e-05, -5.3454190492630005e-05, -4.938244819641113e-05, -4.531070590019226e-05, -4.123896360397339e-05, -3.7167221307754517e-05, -3.3095479011535645e-05, -2.9023736715316772e-05, -2.49519944190979e-05, -2.088025212287903e-05, -1.6808509826660156e-05, -1.2736767530441284e-05, -8.665025234222412e-06, -4.59328293800354e-06, -5.21540641784668e-07, 3.550201654434204e-06, 7.621943950653076e-06, 1.1693686246871948e-05, 1.576542854309082e-05, 1.9837170839309692e-05, 2.3908913135528564e-05, 2.7980655431747437e-05, 3.205239772796631e-05, 3.612414002418518e-05, 4.019588232040405e-05, 4.4267624616622925e-05, 4.83393669128418e-05, 5.241110920906067e-05, 5.648285150527954e-05, 6.055459380149841e-05, 6.462633609771729e-05, 6.869807839393616e-05, 7.276982069015503e-05, 7.68415629863739e-05, 8.091330528259277e-05, 8.498504757881165e-05, 8.905678987503052e-05, 9.312853217124939e-05, 9.720027446746826e-05, 0.00010127201676368713, 0.000105343759059906, 0.00010941550135612488, 0.00011348724365234375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 226.0, 782.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6853296756744385, -1.6479500532150269, -1.6105704307556152, -1.5731908082962036, -1.535811185836792, -1.4984315633773804, -1.4610519409179688, -1.4236721992492676, -1.3862926959991455, -1.3489130735397339, -1.3115334510803223, -1.2741538286209106, -1.236774206161499, -1.1993945837020874, -1.1620149612426758, -1.1246352195739746, -1.087255597114563, -1.0498759746551514, -1.0124963521957397, -0.9751167297363281, -0.9377371072769165, -0.9003574848175049, -0.8629778027534485, -0.8255981802940369, -0.7882185578346252, -0.7508389353752136, -0.713459312915802, -0.6760796904563904, -0.638700008392334, -0.6013203859329224, -0.5639407634735107, -0.5265611410140991, -0.48918139934539795, -0.45180177688598633, -0.4144221544265747, -0.3770425021648407, -0.3396628797054291, -0.30228325724601746, -0.26490360498428345, -0.22752398252487183, -0.1901443600654602, -0.15276473760604858, -0.11538510024547577, -0.07800547033548355, -0.04062584042549133, -0.003246217966079712, 0.0341334193944931, 0.07151305675506592, 0.10889267921447754, 0.14627230167388916, 0.18365193903446198, 0.2210315763950348, 0.2584111988544464, 0.29579082131385803, 0.33317047357559204, 0.37055009603500366, 0.4079297184944153, 0.4453093409538269, 0.4826889634132385, 0.5200685858726501, 0.5574482679367065, 0.5948278903961182, 0.6322075128555298, 0.6695871353149414, 0.706966757774353]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 9.0, 12.0, 14.0, 15.0, 12.0, 27.0, 30.0, 33.0, 47.0, 40.0, 55.0, 61.0, 61.0, 67.0, 80.0, 60.0, 59.0, 46.0, 54.0, 38.0, 47.0, 32.0, 28.0, 13.0, 18.0, 9.0, 8.0, 11.0, 4.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6014357805252075, -0.5824732780456543, -0.5635108351707458, -0.5445483922958374, -0.5255858898162842, -0.506623387336731, -0.4876609444618225, -0.4686984717845917, -0.44973599910736084, -0.43077352643013, -0.41181105375289917, -0.39284858107566833, -0.3738861083984375, -0.35492363572120667, -0.33596116304397583, -0.316998690366745, -0.29803621768951416, -0.2790737450122833, -0.2601112723350525, -0.24114879965782166, -0.22218632698059082, -0.20322385430335999, -0.18426138162612915, -0.16529890894889832, -0.14633643627166748, -0.12737396359443665, -0.10841149091720581, -0.08944901823997498, -0.07048654556274414, -0.051524072885513306, -0.03256160020828247, -0.013599127531051636, 0.005363285541534424, 0.02432575821876526, 0.043288230895996094, 0.06225070357322693, 0.08121317625045776, 0.1001756489276886, 0.11913812160491943, 0.13810059428215027, 0.1570630669593811, 0.17602553963661194, 0.19498801231384277, 0.2139504849910736, 0.23291295766830444, 0.2518754303455353, 0.2708379030227661, 0.28980037569999695, 0.3087628483772278, 0.3277253210544586, 0.34668779373168945, 0.3656502664089203, 0.3846127390861511, 0.40357521176338196, 0.4225376844406128, 0.44150015711784363, 0.46046262979507446, 0.4794251024723053, 0.49838757514953613, 0.5173500776290894, 0.5363125205039978, 0.5552749633789062, 0.5742374658584595, 0.5931999683380127, 0.6121624112129211]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 0.0, 4.0, 7.0, 5.0, 3.0, 5.0, 14.0, 27.0, 51.0, 90.0, 190.0, 505.0, 1989.0, 4182162.0, 8010.0, 803.0, 221.0, 74.0, 32.0, 21.0, 16.0, 9.0, 7.0, 10.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38818359375, -0.3766822814941406, -0.36518096923828125, -0.3536796569824219, -0.3421783447265625, -0.3306770324707031, -0.31917572021484375, -0.3076744079589844, -0.296173095703125, -0.2846717834472656, -0.27317047119140625, -0.2616691589355469, -0.2501678466796875, -0.23866653442382812, -0.22716522216796875, -0.21566390991210938, -0.20416259765625, -0.19266128540039062, -0.18115997314453125, -0.16965866088867188, -0.1581573486328125, -0.14665603637695312, -0.13515472412109375, -0.12365341186523438, -0.112152099609375, -0.10065078735351562, -0.08914947509765625, -0.07764816284179688, -0.0661468505859375, -0.054645538330078125, -0.04314422607421875, -0.031642913818359375, -0.0201416015625, -0.008640289306640625, 0.00286102294921875, 0.014362335205078125, 0.0258636474609375, 0.037364959716796875, 0.04886627197265625, 0.060367584228515625, 0.071868896484375, 0.08337020874023438, 0.09487152099609375, 0.10637283325195312, 0.1178741455078125, 0.12937545776367188, 0.14087677001953125, 0.15237808227539062, 0.16387939453125, 0.17538070678710938, 0.18688201904296875, 0.19838333129882812, 0.2098846435546875, 0.22138595581054688, 0.23288726806640625, 0.24438858032226562, 0.255889892578125, 0.2673912048339844, 0.27889251708984375, 0.2903938293457031, 0.3018951416015625, 0.3133964538574219, 0.32489776611328125, 0.3363990783691406, 0.347900390625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 0.0, 3.0, 6.0, 2.0, 2.0, 2.0, 4.0, 6.0, 15.0, 19.0, 11.0, 15.0, 27.0, 420.0, 335.0, 34.0, 20.0, 8.0, 9.0, 7.0, 8.0, 8.0, 6.0, 9.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0225830078125, -0.021914243698120117, -0.021245479583740234, -0.02057671546936035, -0.01990795135498047, -0.019239187240600586, -0.018570423126220703, -0.01790165901184082, -0.017232894897460938, -0.016564130783081055, -0.015895366668701172, -0.015226602554321289, -0.014557838439941406, -0.013889074325561523, -0.01322031021118164, -0.012551546096801758, -0.011882781982421875, -0.011214017868041992, -0.01054525375366211, -0.009876489639282227, -0.009207725524902344, -0.008538961410522461, -0.007870197296142578, -0.007201433181762695, -0.0065326690673828125, -0.00586390495300293, -0.005195140838623047, -0.004526376724243164, -0.0038576126098632812, -0.0031888484954833984, -0.0025200843811035156, -0.0018513202667236328, -0.00118255615234375, -0.0005137920379638672, 0.00015497207641601562, 0.0008237361907958984, 0.0014925003051757812, 0.002161264419555664, 0.002830028533935547, 0.0034987926483154297, 0.0041675567626953125, 0.004836320877075195, 0.005505084991455078, 0.006173849105834961, 0.006842613220214844, 0.0075113773345947266, 0.00818014144897461, 0.008848905563354492, 0.009517669677734375, 0.010186433792114258, 0.01085519790649414, 0.011523962020874023, 0.012192726135253906, 0.012861490249633789, 0.013530254364013672, 0.014199018478393555, 0.014867782592773438, 0.01553654670715332, 0.016205310821533203, 0.016874074935913086, 0.01754283905029297, 0.01821160316467285, 0.018880367279052734, 0.019549131393432617, 0.0202178955078125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 5.0, 2.0, 7.0, 12.0, 9.0, 8.0, 16.0, 25.0, 19.0, 47.0, 39.0, 69.0, 113.0, 204.0, 427.0, 2190.0, 4039359.0, 148879.0, 1856.0, 429.0, 189.0, 107.0, 59.0, 40.0, 36.0, 16.0, 28.0, 15.0, 8.0, 11.0, 13.0, 8.0, 3.0, 6.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.23388671875, -0.22699928283691406, -0.22011184692382812, -0.2132244110107422, -0.20633697509765625, -0.1994495391845703, -0.19256210327148438, -0.18567466735839844, -0.1787872314453125, -0.17189979553222656, -0.16501235961914062, -0.1581249237060547, -0.15123748779296875, -0.1443500518798828, -0.13746261596679688, -0.13057518005371094, -0.123687744140625, -0.11680030822753906, -0.10991287231445312, -0.10302543640136719, -0.09613800048828125, -0.08925056457519531, -0.08236312866210938, -0.07547569274902344, -0.0685882568359375, -0.06170082092285156, -0.054813385009765625, -0.04792594909667969, -0.04103851318359375, -0.03415107727050781, -0.027263641357421875, -0.020376205444335938, -0.01348876953125, -0.0066013336181640625, 0.000286102294921875, 0.0071735382080078125, 0.01406097412109375, 0.020948410034179688, 0.027835845947265625, 0.03472328186035156, 0.0416107177734375, 0.04849815368652344, 0.055385589599609375, 0.06227302551269531, 0.06916046142578125, 0.07604789733886719, 0.08293533325195312, 0.08982276916503906, 0.096710205078125, 0.10359764099121094, 0.11048507690429688, 0.11737251281738281, 0.12425994873046875, 0.1311473846435547, 0.13803482055664062, 0.14492225646972656, 0.1518096923828125, 0.15869712829589844, 0.16558456420898438, 0.1724720001220703, 0.17935943603515625, 0.1862468719482422, 0.19313430786132812, 0.20002174377441406, 0.2069091796875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 2.0, 8.0, 6.0, 5.0, 14.0, 8.0, 16.0, 19.0, 19.0, 24.0, 70.0, 3139.0, 496.0, 66.0, 31.0, 22.0, 26.0, 19.0, 14.0, 8.0, 6.0, 12.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0377197265625, -0.03660869598388672, -0.03549766540527344, -0.034386634826660156, -0.033275604248046875, -0.032164573669433594, -0.031053543090820312, -0.02994251251220703, -0.02883148193359375, -0.02772045135498047, -0.026609420776367188, -0.025498390197753906, -0.024387359619140625, -0.023276329040527344, -0.022165298461914062, -0.02105426788330078, -0.0199432373046875, -0.01883220672607422, -0.017721176147460938, -0.016610145568847656, -0.015499114990234375, -0.014388084411621094, -0.013277053833007812, -0.012166023254394531, -0.01105499267578125, -0.009943962097167969, -0.008832931518554688, -0.007721900939941406, -0.006610870361328125, -0.005499839782714844, -0.0043888092041015625, -0.0032777786254882812, -0.002166748046875, -0.0010557174682617188, 5.53131103515625e-05, 0.0011663436889648438, 0.002277374267578125, 0.0033884048461914062, 0.0044994354248046875, 0.005610466003417969, 0.00672149658203125, 0.007832527160644531, 0.008943557739257812, 0.010054588317871094, 0.011165618896484375, 0.012276649475097656, 0.013387680053710938, 0.014498710632324219, 0.0156097412109375, 0.01672077178955078, 0.017831802368164062, 0.018942832946777344, 0.020053863525390625, 0.021164894104003906, 0.022275924682617188, 0.02338695526123047, 0.02449798583984375, 0.02560901641845703, 0.026720046997070312, 0.027831077575683594, 0.028942108154296875, 0.030053138732910156, 0.031164169311523438, 0.03227519989013672, 0.03338623046875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 107.0, 910.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9734079837799072, -0.9554080963134766, -0.9374082088470459, -0.9194082617759705, -0.9014083743095398, -0.8834084868431091, -0.8654085397720337, -0.847408652305603, -0.8294087648391724, -0.8114088773727417, -0.793408989906311, -0.7754090428352356, -0.7574091553688049, -0.7394092679023743, -0.7214093208312988, -0.7034094333648682, -0.6854095458984375, -0.6674096584320068, -0.6494097709655762, -0.6314098238945007, -0.6134099364280701, -0.5954100489616394, -0.577410101890564, -0.5594102144241333, -0.5414103269577026, -0.523410439491272, -0.5054105520248413, -0.48741060495376587, -0.4694107174873352, -0.45141083002090454, -0.4334109127521515, -0.41541099548339844, -0.3974111080169678, -0.3794112205505371, -0.36141130328178406, -0.343411386013031, -0.32541149854660034, -0.3074116110801697, -0.2894116938114166, -0.2714117765426636, -0.2534118890762329, -0.23541198670864105, -0.2174120843410492, -0.19941218197345734, -0.18141227960586548, -0.16341237723827362, -0.14541247487068176, -0.1274125725030899, -0.10941268503665924, -0.09141278266906738, -0.07341288030147552, -0.05541297793388367, -0.03741307556629181, -0.01941317319869995, -0.0014132708311080933, 0.016586631536483765, 0.03458653390407562, 0.05258643627166748, 0.07058633863925934, 0.0885862410068512, 0.10658614337444305, 0.12458604574203491, 0.14258594810962677, 0.16058585047721863, 0.17858575284481049]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 9.0, 9.0, 6.0, 16.0, 30.0, 21.0, 34.0, 42.0, 59.0, 57.0, 71.0, 78.0, 77.0, 78.0, 77.0, 76.0, 65.0, 46.0, 38.0, 31.0, 28.0, 10.0, 11.0, 8.0, 8.0, 1.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11659932136535645, -0.1123775988817215, -0.10815587639808655, -0.1039341539144516, -0.09971243143081665, -0.0954907089471817, -0.09126899391412735, -0.0870472714304924, -0.08282554894685745, -0.0786038264632225, -0.07438210397958755, -0.0701603814959526, -0.06593866646289825, -0.06171694025397301, -0.05749522149562836, -0.05327349901199341, -0.04905177652835846, -0.04483005404472351, -0.04060833156108856, -0.03638661280274391, -0.03216489031910896, -0.027943167835474014, -0.023721447214484215, -0.019499726593494415, -0.015278004109859467, -0.011056282557547092, -0.006834561005234718, -0.002612839452922344, 0.00160888209939003, 0.005830604583024979, 0.010052325204014778, 0.014274045825004578, 0.018495768308639526, 0.022717490792274475, 0.026939211413264275, 0.031160932034254074, 0.03538265451788902, 0.03960437700152397, 0.04382609575986862, 0.04804781824350357, 0.05226954072713852, 0.05649126321077347, 0.06071298569440842, 0.06493470817804337, 0.06915642321109772, 0.07337814569473267, 0.07759986817836761, 0.08182159066200256, 0.08604331314563751, 0.09026503562927246, 0.09448675811290741, 0.09870848059654236, 0.10293020308017731, 0.10715192556381226, 0.11137364059686661, 0.11559536308050156, 0.1198170855641365, 0.12403880804777145, 0.1282605230808258, 0.13248224556446075, 0.1367039680480957, 0.14092569053173065, 0.1451474130153656, 0.14936913549900055, 0.1535908579826355]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 11.0, 3.0, 5.0, 7.0, 17.0, 25.0, 27.0, 53.0, 60.0, 96.0, 122.0, 148.0, 245.0, 342.0, 550.0, 857.0, 1300.0, 2229.0, 3990.0, 8308.0, 22522.0, 883313.0, 93734.0, 15604.0, 6545.0, 3429.0, 1803.0, 1071.0, 709.0, 451.0, 278.0, 198.0, 138.0, 94.0, 80.0, 63.0, 33.0, 27.0, 11.0, 10.0, 14.0, 8.0, 11.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.054718017578125, -0.05294370651245117, -0.051169395446777344, -0.049395084381103516, -0.04762077331542969, -0.04584646224975586, -0.04407215118408203, -0.0422978401184082, -0.040523529052734375, -0.03874921798706055, -0.03697490692138672, -0.03520059585571289, -0.03342628479003906, -0.031651973724365234, -0.029877662658691406, -0.028103351593017578, -0.02632904052734375, -0.024554729461669922, -0.022780418395996094, -0.021006107330322266, -0.019231796264648438, -0.01745748519897461, -0.01568317413330078, -0.013908863067626953, -0.012134552001953125, -0.010360240936279297, -0.008585929870605469, -0.006811618804931641, -0.0050373077392578125, -0.0032629966735839844, -0.0014886856079101562, 0.0002856254577636719, 0.0020599365234375, 0.003834247589111328, 0.005608558654785156, 0.007382869720458984, 0.009157180786132812, 0.01093149185180664, 0.012705802917480469, 0.014480113983154297, 0.016254425048828125, 0.018028736114501953, 0.01980304718017578, 0.02157735824584961, 0.023351669311523438, 0.025125980377197266, 0.026900291442871094, 0.028674602508544922, 0.03044891357421875, 0.03222322463989258, 0.033997535705566406, 0.035771846771240234, 0.03754615783691406, 0.03932046890258789, 0.04109477996826172, 0.04286909103393555, 0.044643402099609375, 0.0464177131652832, 0.04819202423095703, 0.04996633529663086, 0.05174064636230469, 0.053514957427978516, 0.055289268493652344, 0.05706357955932617, 0.058837890625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 3.0, 4.0, 0.0, 3.0, 2.0, 5.0, 2.0, 2.0, 4.0, 5.0, 12.0, 15.0, 17.0, 9.0, 18.0, 164.0, 545.0, 87.0, 23.0, 12.0, 9.0, 5.0, 6.0, 13.0, 8.0, 6.0, 4.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0216827392578125, -0.02102971076965332, -0.02037668228149414, -0.01972365379333496, -0.01907062530517578, -0.0184175968170166, -0.017764568328857422, -0.017111539840698242, -0.016458511352539062, -0.015805482864379883, -0.015152454376220703, -0.014499425888061523, -0.013846397399902344, -0.013193368911743164, -0.012540340423583984, -0.011887311935424805, -0.011234283447265625, -0.010581254959106445, -0.009928226470947266, -0.009275197982788086, -0.008622169494628906, -0.007969141006469727, -0.007316112518310547, -0.006663084030151367, -0.0060100555419921875, -0.005357027053833008, -0.004703998565673828, -0.0040509700775146484, -0.0033979415893554688, -0.002744913101196289, -0.0020918846130371094, -0.0014388561248779297, -0.00078582763671875, -0.0001327991485595703, 0.0005202293395996094, 0.001173257827758789, 0.0018262863159179688, 0.0024793148040771484, 0.003132343292236328, 0.003785371780395508, 0.0044384002685546875, 0.005091428756713867, 0.005744457244873047, 0.0063974857330322266, 0.007050514221191406, 0.007703542709350586, 0.008356571197509766, 0.009009599685668945, 0.009662628173828125, 0.010315656661987305, 0.010968685150146484, 0.011621713638305664, 0.012274742126464844, 0.012927770614624023, 0.013580799102783203, 0.014233827590942383, 0.014886856079101562, 0.015539884567260742, 0.016192913055419922, 0.0168459415435791, 0.01749897003173828, 0.01815199851989746, 0.01880502700805664, 0.01945805549621582, 0.020111083984375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 7.0, 7.0, 13.0, 13.0, 24.0, 24.0, 21.0, 27.0, 33.0, 45.0, 38.0, 46.0, 60.0, 85.0, 102.0, 105.0, 119.0, 187.0, 228.0, 373.0, 795.0, 4118.0, 292039.0, 741435.0, 5957.0, 966.0, 448.0, 215.0, 166.0, 130.0, 118.0, 101.0, 99.0, 58.0, 55.0, 50.0, 46.0, 36.0, 23.0, 28.0, 23.0, 20.0, 15.0, 16.0, 6.0, 10.0, 7.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.1275634765625, -0.12358474731445312, -0.11960601806640625, -0.11562728881835938, -0.1116485595703125, -0.10766983032226562, -0.10369110107421875, -0.09971237182617188, -0.095733642578125, -0.09175491333007812, -0.08777618408203125, -0.08379745483398438, -0.0798187255859375, -0.07583999633789062, -0.07186126708984375, -0.06788253784179688, -0.06390380859375, -0.059925079345703125, -0.05594635009765625, -0.051967620849609375, -0.0479888916015625, -0.044010162353515625, -0.04003143310546875, -0.036052703857421875, -0.032073974609375, -0.028095245361328125, -0.02411651611328125, -0.020137786865234375, -0.0161590576171875, -0.012180328369140625, -0.00820159912109375, -0.004222869873046875, -0.000244140625, 0.003734588623046875, 0.00771331787109375, 0.011692047119140625, 0.0156707763671875, 0.019649505615234375, 0.02362823486328125, 0.027606964111328125, 0.031585693359375, 0.035564422607421875, 0.03954315185546875, 0.043521881103515625, 0.0475006103515625, 0.051479339599609375, 0.05545806884765625, 0.059436798095703125, 0.06341552734375, 0.06739425659179688, 0.07137298583984375, 0.07535171508789062, 0.0793304443359375, 0.08330917358398438, 0.08728790283203125, 0.09126663208007812, 0.095245361328125, 0.09922409057617188, 0.10320281982421875, 0.10718154907226562, 0.1111602783203125, 0.11513900756835938, 0.11911773681640625, 0.12309646606445312, 0.1270751953125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 4.0, 8.0, 6.0, 9.0, 7.0, 8.0, 9.0, 13.0, 7.0, 15.0, 17.0, 29.0, 24.0, 22.0, 41.0, 33.0, 36.0, 47.0, 35.0, 47.0, 54.0, 45.0, 46.0, 39.0, 53.0, 36.0, 29.0, 28.0, 24.0, 34.0, 28.0, 28.0, 27.0, 11.0, 23.0, 15.0, 16.0, 3.0, 9.0, 8.0, 13.0, 5.0, 3.0, 2.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.058685302734375, -0.05681800842285156, -0.054950714111328125, -0.05308341979980469, -0.05121612548828125, -0.04934883117675781, -0.047481536865234375, -0.04561424255371094, -0.0437469482421875, -0.04187965393066406, -0.040012359619140625, -0.03814506530761719, -0.03627777099609375, -0.03441047668457031, -0.032543182373046875, -0.030675888061523438, -0.02880859375, -0.026941299438476562, -0.025074005126953125, -0.023206710815429688, -0.02133941650390625, -0.019472122192382812, -0.017604827880859375, -0.015737533569335938, -0.0138702392578125, -0.012002944946289062, -0.010135650634765625, -0.008268356323242188, -0.00640106201171875, -0.0045337677001953125, -0.002666473388671875, -0.0007991790771484375, 0.001068115234375, 0.0029354095458984375, 0.004802703857421875, 0.0066699981689453125, 0.00853729248046875, 0.010404586791992188, 0.012271881103515625, 0.014139175415039062, 0.0160064697265625, 0.017873764038085938, 0.019741058349609375, 0.021608352661132812, 0.02347564697265625, 0.025342941284179688, 0.027210235595703125, 0.029077529907226562, 0.03094482421875, 0.03281211853027344, 0.034679412841796875, 0.03654670715332031, 0.03841400146484375, 0.04028129577636719, 0.042148590087890625, 0.04401588439941406, 0.0458831787109375, 0.04775047302246094, 0.049617767333984375, 0.05148506164550781, 0.05335235595703125, 0.05521965026855469, 0.057086944580078125, 0.05895423889160156, 0.060821533203125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 8.0, 7.0, 10.0, 11.0, 22.0, 23.0, 31.0, 47.0, 82.0, 115.0, 170.0, 266.0, 462.0, 804.0, 1541.0, 3549.0, 9687.0, 38324.0, 697813.0, 254614.0, 27134.0, 7634.0, 2960.0, 1349.0, 724.0, 395.0, 265.0, 144.0, 111.0, 70.0, 47.0, 31.0, 33.0, 6.0, 15.0, 15.0, 10.0, 5.0, 6.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00010824203491210938, -0.00010514073073863983, -0.00010203942656517029, -9.893812239170074e-05, -9.58368182182312e-05, -9.273551404476166e-05, -8.963420987129211e-05, -8.653290569782257e-05, -8.343160152435303e-05, -8.033029735088348e-05, -7.722899317741394e-05, -7.41276890039444e-05, -7.102638483047485e-05, -6.792508065700531e-05, -6.482377648353577e-05, -6.172247231006622e-05, -5.862116813659668e-05, -5.5519863963127136e-05, -5.241855978965759e-05, -4.931725561618805e-05, -4.6215951442718506e-05, -4.311464726924896e-05, -4.001334309577942e-05, -3.6912038922309875e-05, -3.381073474884033e-05, -3.070943057537079e-05, -2.7608126401901245e-05, -2.45068222284317e-05, -2.1405518054962158e-05, -1.8304213881492615e-05, -1.5202909708023071e-05, -1.2101605534553528e-05, -9.000301361083984e-06, -5.898997187614441e-06, -2.7976930141448975e-06, 3.03611159324646e-07, 3.4049153327941895e-06, 6.506219506263733e-06, 9.607523679733276e-06, 1.270882785320282e-05, 1.5810132026672363e-05, 1.8911436200141907e-05, 2.201274037361145e-05, 2.5114044547080994e-05, 2.8215348720550537e-05, 3.131665289402008e-05, 3.4417957067489624e-05, 3.751926124095917e-05, 4.062056541442871e-05, 4.3721869587898254e-05, 4.68231737613678e-05, 4.992447793483734e-05, 5.3025782108306885e-05, 5.612708628177643e-05, 5.922839045524597e-05, 6.232969462871552e-05, 6.543099880218506e-05, 6.85323029756546e-05, 7.163360714912415e-05, 7.473491132259369e-05, 7.783621549606323e-05, 8.093751966953278e-05, 8.403882384300232e-05, 8.714012801647186e-05, 9.02414321899414e-05]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 3.0, 2.0, 6.0, 8.0, 3.0, 7.0, 24.0, 18.0, 17.0, 27.0, 51.0, 47.0, 70.0, 68.0, 85.0, 65.0, 88.0, 78.0, 49.0, 56.0, 43.0, 38.0, 32.0, 32.0, 21.0, 19.0, 8.0, 8.0, 7.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.649162292480469e-06, -4.4871121644973755e-06, -4.325062036514282e-06, -4.163011908531189e-06, -4.000961780548096e-06, -3.8389116525650024e-06, -3.676861524581909e-06, -3.514811396598816e-06, -3.3527612686157227e-06, -3.1907111406326294e-06, -3.028661012649536e-06, -2.866610884666443e-06, -2.7045607566833496e-06, -2.5425106287002563e-06, -2.380460500717163e-06, -2.21841037273407e-06, -2.0563602447509766e-06, -1.8943101167678833e-06, -1.73225998878479e-06, -1.5702098608016968e-06, -1.4081597328186035e-06, -1.2461096048355103e-06, -1.084059476852417e-06, -9.220093488693237e-07, -7.599592208862305e-07, -5.979090929031372e-07, -4.3585896492004395e-07, -2.738088369369507e-07, -1.1175870895385742e-07, 5.029141902923584e-08, 2.123415470123291e-07, 3.7439167499542236e-07, 5.364418029785156e-07, 6.984919309616089e-07, 8.605420589447021e-07, 1.0225921869277954e-06, 1.1846423149108887e-06, 1.346692442893982e-06, 1.5087425708770752e-06, 1.6707926988601685e-06, 1.8328428268432617e-06, 1.994892954826355e-06, 2.1569430828094482e-06, 2.3189932107925415e-06, 2.4810433387756348e-06, 2.643093466758728e-06, 2.8051435947418213e-06, 2.9671937227249146e-06, 3.129243850708008e-06, 3.291293978691101e-06, 3.4533441066741943e-06, 3.6153942346572876e-06, 3.777444362640381e-06, 3.939494490623474e-06, 4.101544618606567e-06, 4.263594746589661e-06, 4.425644874572754e-06, 4.587695002555847e-06, 4.7497451305389404e-06, 4.911795258522034e-06, 5.073845386505127e-06, 5.23589551448822e-06, 5.3979456424713135e-06, 5.559995770454407e-06, 5.7220458984375e-06]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 12.0, 17.0, 21.0, 48.0, 66.0, 109.0, 207.0, 332.0, 1157.0, 846193.0, 198523.0, 1043.0, 321.0, 199.0, 111.0, 68.0, 46.0, 22.0, 19.0, 11.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003566741943359375, -0.0003455132246017456, -0.0003343522548675537, -0.0003231912851333618, -0.0003120303153991699, -0.00030086934566497803, -0.00028970837593078613, -0.00027854740619659424, -0.00026738643646240234, -0.00025622546672821045, -0.00024506449699401855, -0.00023390352725982666, -0.00022274255752563477, -0.00021158158779144287, -0.00020042061805725098, -0.00018925964832305908, -0.0001780986785888672, -0.0001669377088546753, -0.0001557767391204834, -0.0001446157693862915, -0.0001334547996520996, -0.00012229382991790771, -0.00011113286018371582, -9.997189044952393e-05, -8.881092071533203e-05, -7.764995098114014e-05, -6.648898124694824e-05, -5.532801151275635e-05, -4.416704177856445e-05, -3.300607204437256e-05, -2.1845102310180664e-05, -1.068413257598877e-05, 4.76837158203125e-07, 1.163780689239502e-05, 2.2798776626586914e-05, 3.395974636077881e-05, 4.51207160949707e-05, 5.62816858291626e-05, 6.744265556335449e-05, 7.860362529754639e-05, 8.976459503173828e-05, 0.00010092556476593018, 0.00011208653450012207, 0.00012324750423431396, 0.00013440847396850586, 0.00014556944370269775, 0.00015673041343688965, 0.00016789138317108154, 0.00017905235290527344, 0.00019021332263946533, 0.00020137429237365723, 0.00021253526210784912, 0.00022369623184204102, 0.0002348572015762329, 0.0002460181713104248, 0.0002571791410446167, 0.0002683401107788086, 0.0002795010805130005, 0.0002906620502471924, 0.0003018230199813843, 0.00031298398971557617, 0.00032414495944976807, 0.00033530592918395996, 0.00034646689891815186, 0.00035762786865234375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 9.0, 10.0, 15.0, 15.0, 38.0, 53.0, 58.0, 103.0, 122.0, 136.0, 126.0, 107.0, 54.0, 58.0, 33.0, 23.0, 17.0, 7.0, 8.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00017142295837402344, -0.00016671046614646912, -0.0001619979739189148, -0.00015728548169136047, -0.00015257298946380615, -0.00014786049723625183, -0.0001431480050086975, -0.0001384355127811432, -0.00013372302055358887, -0.00012901052832603455, -0.00012429803609848022, -0.0001195855438709259, -0.00011487305164337158, -0.00011016055941581726, -0.00010544806718826294, -0.00010073557496070862, -9.60230827331543e-05, -9.131059050559998e-05, -8.659809827804565e-05, -8.188560605049133e-05, -7.717311382293701e-05, -7.246062159538269e-05, -6.774812936782837e-05, -6.303563714027405e-05, -5.8323144912719727e-05, -5.3610652685165405e-05, -4.8898160457611084e-05, -4.418566823005676e-05, -3.947317600250244e-05, -3.476068377494812e-05, -3.00481915473938e-05, -2.5335699319839478e-05, -2.0623207092285156e-05, -1.5910714864730835e-05, -1.1198222637176514e-05, -6.485730409622192e-06, -1.773238182067871e-06, 2.93925404548645e-06, 7.651746273040771e-06, 1.2364238500595093e-05, 1.7076730728149414e-05, 2.1789222955703735e-05, 2.6501715183258057e-05, 3.121420741081238e-05, 3.59266996383667e-05, 4.063919186592102e-05, 4.535168409347534e-05, 5.006417632102966e-05, 5.4776668548583984e-05, 5.9489160776138306e-05, 6.420165300369263e-05, 6.891414523124695e-05, 7.362663745880127e-05, 7.833912968635559e-05, 8.305162191390991e-05, 8.776411414146423e-05, 9.247660636901855e-05, 9.718909859657288e-05, 0.0001019015908241272, 0.00010661408305168152, 0.00011132657527923584, 0.00011603906750679016, 0.00012075155973434448, 0.0001254640519618988, 0.00013017654418945312]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 37.0, 964.0, 16.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.892841100692749, -0.8576000928878784, -0.822359025478363, -0.7871179580688477, -0.751876950263977, -0.7166359424591064, -0.6813948750495911, -0.6461538076400757, -0.6109127998352051, -0.5756717920303345, -0.5404307246208191, -0.5051896572113037, -0.4699486494064331, -0.4347076117992401, -0.3994665741920471, -0.3642255365848541, -0.32898449897766113, -0.29374346137046814, -0.25850242376327515, -0.22326138615608215, -0.18802034854888916, -0.15277931094169617, -0.11753827333450317, -0.08229723572731018, -0.04705619812011719, -0.011815160512924194, 0.0234258770942688, 0.05866691470146179, 0.09390795230865479, 0.12914898991584778, 0.16439002752304077, 0.19963106513023376, 0.23487210273742676, 0.27011314034461975, 0.30535417795181274, 0.34059521555900574, 0.37583625316619873, 0.4110772907733917, 0.4463183283805847, 0.4815593659877777, 0.5168004035949707, 0.5520414113998413, 0.5872824788093567, 0.6225235462188721, 0.6577645540237427, 0.6930055618286133, 0.7282466292381287, 0.763487696647644, 0.7987287044525146, 0.8339697122573853, 0.8692107796669006, 0.904451847076416, 0.9396928548812866, 0.9749338626861572, 1.0101749897003174, 1.045415997505188, 1.0806570053100586, 1.1158980131149292, 1.1511390209197998, 1.18638014793396, 1.2216211557388306, 1.2568621635437012, 1.2921032905578613, 1.327344298362732, 1.3625853061676025]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 2.0, 6.0, 10.0, 9.0, 17.0, 23.0, 27.0, 26.0, 20.0, 25.0, 26.0, 41.0, 38.0, 45.0, 43.0, 58.0, 49.0, 54.0, 42.0, 45.0, 40.0, 44.0, 47.0, 49.0, 38.0, 35.0, 34.0, 24.0, 16.0, 18.0, 15.0, 13.0, 2.0, 5.0, 7.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.48736441135406494, -0.4729677438735962, -0.45857110619544983, -0.4441744387149811, -0.4297778010368347, -0.41538113355636597, -0.4009844660758972, -0.38658782839775085, -0.3721911907196045, -0.35779452323913574, -0.3433978855609894, -0.32900121808052063, -0.31460458040237427, -0.3002079129219055, -0.28581124544143677, -0.2714146077632904, -0.25701794028282166, -0.2426212877035141, -0.22822463512420654, -0.2138279676437378, -0.19943132996559143, -0.18503466248512268, -0.17063800990581512, -0.15624135732650757, -0.1418447047472, -0.12744805216789246, -0.1130513995885849, -0.09865473955869675, -0.08425808697938919, -0.06986143440008163, -0.05546477437019348, -0.041068121790885925, -0.02667146921157837, -0.012274814769625664, 0.0021218396723270416, 0.016518495976924896, 0.030915148556232452, 0.04531180113554001, 0.05970846116542816, 0.07410511374473572, 0.08850176632404327, 0.10289841890335083, 0.11729507148265839, 0.13169172406196594, 0.1460883915424347, 0.16048502922058105, 0.1748816967010498, 0.18927834928035736, 0.20367500185966492, 0.21807165443897247, 0.23246830701828003, 0.24686497449874878, 0.26126161217689514, 0.2756582796573639, 0.29005491733551025, 0.304451584815979, 0.31884825229644775, 0.3332449197769165, 0.34764155745506287, 0.3620382249355316, 0.376434862613678, 0.39083153009414673, 0.4052281975746155, 0.41962483525276184, 0.4340214729309082]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 6.0, 1.0, 4.0, 10.0, 13.0, 9.0, 12.0, 24.0, 24.0, 23.0, 34.0, 46.0, 62.0, 93.0, 131.0, 204.0, 297.0, 571.0, 2567.0, 4171887.0, 16358.0, 815.0, 401.0, 220.0, 128.0, 96.0, 69.0, 49.0, 26.0, 26.0, 16.0, 10.0, 12.0, 11.0, 3.0, 3.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1055908203125, -0.10236167907714844, -0.09913253784179688, -0.09590339660644531, -0.09267425537109375, -0.08944511413574219, -0.08621597290039062, -0.08298683166503906, -0.0797576904296875, -0.07652854919433594, -0.07329940795898438, -0.07007026672363281, -0.06684112548828125, -0.06361198425292969, -0.060382843017578125, -0.05715370178222656, -0.053924560546875, -0.05069541931152344, -0.047466278076171875, -0.04423713684082031, -0.04100799560546875, -0.03777885437011719, -0.034549713134765625, -0.03132057189941406, -0.0280914306640625, -0.024862289428710938, -0.021633148193359375, -0.018404006958007812, -0.01517486572265625, -0.011945724487304688, -0.008716583251953125, -0.0054874420166015625, -0.00225830078125, 0.0009708404541015625, 0.004199981689453125, 0.0074291229248046875, 0.01065826416015625, 0.013887405395507812, 0.017116546630859375, 0.020345687866210938, 0.0235748291015625, 0.026803970336914062, 0.030033111572265625, 0.03326225280761719, 0.03649139404296875, 0.03972053527832031, 0.042949676513671875, 0.04617881774902344, 0.049407958984375, 0.05263710021972656, 0.055866241455078125, 0.05909538269042969, 0.06232452392578125, 0.06555366516113281, 0.06878280639648438, 0.07201194763183594, 0.0752410888671875, 0.07847023010253906, 0.08169937133789062, 0.08492851257324219, 0.08815765380859375, 0.09138679504394531, 0.09461593627929688, 0.09784507751464844, 0.10107421875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 4.0, 4.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 1.0, 3.0, 8.0, 16.0, 17.0, 12.0, 11.0, 51.0, 374.0, 337.0, 57.0, 19.0, 7.0, 9.0, 5.0, 7.0, 12.0, 7.0, 8.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02099609375, -0.020355939865112305, -0.01971578598022461, -0.019075632095336914, -0.01843547821044922, -0.017795324325561523, -0.017155170440673828, -0.016515016555786133, -0.015874862670898438, -0.015234708786010742, -0.014594554901123047, -0.013954401016235352, -0.013314247131347656, -0.012674093246459961, -0.012033939361572266, -0.01139378547668457, -0.010753631591796875, -0.01011347770690918, -0.009473323822021484, -0.008833169937133789, -0.008193016052246094, -0.0075528621673583984, -0.006912708282470703, -0.006272554397583008, -0.0056324005126953125, -0.004992246627807617, -0.004352092742919922, -0.0037119388580322266, -0.0030717849731445312, -0.002431631088256836, -0.0017914772033691406, -0.0011513233184814453, -0.00051116943359375, 0.0001289844512939453, 0.0007691383361816406, 0.001409292221069336, 0.0020494461059570312, 0.0026895999908447266, 0.003329753875732422, 0.003969907760620117, 0.0046100616455078125, 0.005250215530395508, 0.005890369415283203, 0.0065305233001708984, 0.007170677185058594, 0.007810831069946289, 0.008450984954833984, 0.00909113883972168, 0.009731292724609375, 0.01037144660949707, 0.011011600494384766, 0.011651754379272461, 0.012291908264160156, 0.012932062149047852, 0.013572216033935547, 0.014212369918823242, 0.014852523803710938, 0.015492677688598633, 0.016132831573486328, 0.016772985458374023, 0.01741313934326172, 0.018053293228149414, 0.01869344711303711, 0.019333600997924805, 0.0199737548828125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 5.0, 3.0, 9.0, 7.0, 15.0, 9.0, 21.0, 29.0, 59.0, 70.0, 213.0, 1460.0, 4174301.0, 16951.0, 774.0, 160.0, 63.0, 38.0, 22.0, 16.0, 14.0, 12.0, 8.0, 4.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.191650390625, -0.18580245971679688, -0.17995452880859375, -0.17410659790039062, -0.1682586669921875, -0.16241073608398438, -0.15656280517578125, -0.15071487426757812, -0.144866943359375, -0.13901901245117188, -0.13317108154296875, -0.12732315063476562, -0.1214752197265625, -0.11562728881835938, -0.10977935791015625, -0.10393142700195312, -0.09808349609375, -0.09223556518554688, -0.08638763427734375, -0.08053970336914062, -0.0746917724609375, -0.06884384155273438, -0.06299591064453125, -0.057147979736328125, -0.051300048828125, -0.045452117919921875, -0.03960418701171875, -0.033756256103515625, -0.0279083251953125, -0.022060394287109375, -0.01621246337890625, -0.010364532470703125, -0.0045166015625, 0.001331329345703125, 0.00717926025390625, 0.013027191162109375, 0.0188751220703125, 0.024723052978515625, 0.03057098388671875, 0.036418914794921875, 0.042266845703125, 0.048114776611328125, 0.05396270751953125, 0.059810638427734375, 0.0656585693359375, 0.07150650024414062, 0.07735443115234375, 0.08320236206054688, 0.08905029296875, 0.09489822387695312, 0.10074615478515625, 0.10659408569335938, 0.1124420166015625, 0.11828994750976562, 0.12413787841796875, 0.12998580932617188, 0.135833740234375, 0.14168167114257812, 0.14752960205078125, 0.15337753295898438, 0.1592254638671875, 0.16507339477539062, 0.17092132568359375, 0.17676925659179688, 0.1826171875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 6.0, 4.0, 6.0, 12.0, 26.0, 76.0, 3651.0, 189.0, 42.0, 15.0, 9.0, 8.0, 3.0, 4.0, 2.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033660888671875, -0.03252983093261719, -0.031398773193359375, -0.030267715454101562, -0.02913665771484375, -0.028005599975585938, -0.026874542236328125, -0.025743484497070312, -0.0246124267578125, -0.023481369018554688, -0.022350311279296875, -0.021219253540039062, -0.02008819580078125, -0.018957138061523438, -0.017826080322265625, -0.016695022583007812, -0.01556396484375, -0.014432907104492188, -0.013301849365234375, -0.012170791625976562, -0.01103973388671875, -0.009908676147460938, -0.008777618408203125, -0.0076465606689453125, -0.0065155029296875, -0.0053844451904296875, -0.004253387451171875, -0.0031223297119140625, -0.00199127197265625, -0.0008602142333984375, 0.000270843505859375, 0.0014019012451171875, 0.002532958984375, 0.0036640167236328125, 0.004795074462890625, 0.0059261322021484375, 0.00705718994140625, 0.008188247680664062, 0.009319305419921875, 0.010450363159179688, 0.0115814208984375, 0.012712478637695312, 0.013843536376953125, 0.014974594116210938, 0.01610565185546875, 0.017236709594726562, 0.018367767333984375, 0.019498825073242188, 0.0206298828125, 0.021760940551757812, 0.022891998291015625, 0.024023056030273438, 0.02515411376953125, 0.026285171508789062, 0.027416229248046875, 0.028547286987304688, 0.0296783447265625, 0.030809402465820312, 0.031940460205078125, 0.03307151794433594, 0.03420257568359375, 0.03533363342285156, 0.036464691162109375, 0.03759574890136719, 0.038726806640625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1016.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8144657015800476, -0.800572395324707, -0.7866790294647217, -0.7727857232093811, -0.7588924169540405, -0.7449990510940552, -0.7311057448387146, -0.717212438583374, -0.7033190727233887, -0.6894257664680481, -0.6755324006080627, -0.6616390943527222, -0.6477457880973816, -0.6338524222373962, -0.6199591159820557, -0.6060658097267151, -0.5921725034713745, -0.5782791972160339, -0.5643858313560486, -0.550492525100708, -0.5365992188453674, -0.5227058529853821, -0.5088125467300415, -0.4949192404747009, -0.4810258746147156, -0.4671325385570526, -0.45323923230171204, -0.4393458962440491, -0.4254525601863861, -0.41155925393104553, -0.39766591787338257, -0.383772611618042, -0.3698793053627014, -0.35598596930503845, -0.3420926630496979, -0.3281993269920349, -0.31430599093437195, -0.30041268467903137, -0.2865193486213684, -0.27262604236602783, -0.2587326765060425, -0.2448393553495407, -0.23094601929187775, -0.21705269813537598, -0.2031593769788742, -0.18926605582237244, -0.17537271976470947, -0.1614793986082077, -0.14758607745170593, -0.13369275629520416, -0.1197994276881218, -0.10590609908103943, -0.09201277792453766, -0.07811944931745529, -0.06422612071037292, -0.050332799553871155, -0.03643947094678879, -0.02254614606499672, -0.008652819320559502, 0.005240507423877716, 0.019133832305669785, 0.03302715718746185, 0.04692048579454422, 0.06081380695104599, 0.07470713555812836]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 0.0, 4.0, 4.0, 4.0, 9.0, 9.0, 10.0, 9.0, 17.0, 13.0, 21.0, 16.0, 24.0, 24.0, 28.0, 36.0, 41.0, 41.0, 40.0, 40.0, 62.0, 50.0, 51.0, 41.0, 51.0, 38.0, 44.0, 25.0, 44.0, 27.0, 23.0, 26.0, 21.0, 15.0, 22.0, 20.0, 9.0, 13.0, 9.0, 4.0, 7.0, 2.0, 1.0, 5.0, 1.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.047602951526641846, -0.04605260118842125, -0.04450225085020065, -0.04295190051198006, -0.04140155017375946, -0.039851199835538864, -0.03830084949731827, -0.03675049915909767, -0.035200148820877075, -0.03364979848265648, -0.03209944814443588, -0.030549097806215286, -0.02899874746799469, -0.027448397129774094, -0.025898046791553497, -0.0243476964533329, -0.022797346115112305, -0.02124699577689171, -0.019696645438671112, -0.018146295100450516, -0.01659594476222992, -0.015045594424009323, -0.013495244085788727, -0.01194489374756813, -0.010394543409347534, -0.008844193071126938, -0.0072938427329063416, -0.005743492394685745, -0.004193142056465149, -0.0026427917182445526, -0.0010924413800239563, 0.00045790895819664, 0.0020082592964172363, 0.0035586096346378326, 0.005108959972858429, 0.006659310311079025, 0.008209660649299622, 0.009760010987520218, 0.011310361325740814, 0.01286071166396141, 0.014411062002182007, 0.015961412340402603, 0.0175117626786232, 0.019062113016843796, 0.020612463355064392, 0.02216281369328499, 0.023713164031505585, 0.02526351436972618, 0.026813864707946777, 0.028364215046167374, 0.02991456538438797, 0.031464915722608566, 0.03301526606082916, 0.03456561639904976, 0.036115966737270355, 0.03766631707549095, 0.03921666741371155, 0.040767017751932144, 0.04231736809015274, 0.04386771842837334, 0.04541806876659393, 0.04696841910481453, 0.048518769443035126, 0.05006911978125572, 0.05161947011947632]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 6.0, 6.0, 11.0, 9.0, 12.0, 35.0, 33.0, 52.0, 78.0, 86.0, 160.0, 190.0, 281.0, 457.0, 638.0, 989.0, 1592.0, 2614.0, 4363.0, 9258.0, 26853.0, 910672.0, 61795.0, 13669.0, 6075.0, 3111.0, 1932.0, 1077.0, 791.0, 509.0, 368.0, 252.0, 144.0, 104.0, 91.0, 65.0, 51.0, 29.0, 32.0, 21.0, 15.0, 5.0, 6.0, 5.0, 0.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03955078125, -0.038341522216796875, -0.03713226318359375, -0.035923004150390625, -0.0347137451171875, -0.033504486083984375, -0.03229522705078125, -0.031085968017578125, -0.029876708984375, -0.028667449951171875, -0.02745819091796875, -0.026248931884765625, -0.0250396728515625, -0.023830413818359375, -0.02262115478515625, -0.021411895751953125, -0.02020263671875, -0.018993377685546875, -0.01778411865234375, -0.016574859619140625, -0.0153656005859375, -0.014156341552734375, -0.01294708251953125, -0.011737823486328125, -0.010528564453125, -0.009319305419921875, -0.00811004638671875, -0.006900787353515625, -0.0056915283203125, -0.004482269287109375, -0.00327301025390625, -0.002063751220703125, -0.0008544921875, 0.000354766845703125, 0.00156402587890625, 0.002773284912109375, 0.0039825439453125, 0.005191802978515625, 0.00640106201171875, 0.007610321044921875, 0.008819580078125, 0.010028839111328125, 0.01123809814453125, 0.012447357177734375, 0.0136566162109375, 0.014865875244140625, 0.01607513427734375, 0.017284393310546875, 0.01849365234375, 0.019702911376953125, 0.02091217041015625, 0.022121429443359375, 0.0233306884765625, 0.024539947509765625, 0.02574920654296875, 0.026958465576171875, 0.028167724609375, 0.029376983642578125, 0.03058624267578125, 0.031795501708984375, 0.0330047607421875, 0.034214019775390625, 0.03542327880859375, 0.036632537841796875, 0.037841796875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 1.0, 3.0, 10.0, 15.0, 16.0, 12.0, 10.0, 61.0, 388.0, 315.0, 57.0, 17.0, 11.0, 5.0, 6.0, 8.0, 11.0, 7.0, 9.0, 1.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0208740234375, -0.020236492156982422, -0.019598960876464844, -0.018961429595947266, -0.018323898315429688, -0.01768636703491211, -0.01704883575439453, -0.016411304473876953, -0.015773773193359375, -0.015136241912841797, -0.014498710632324219, -0.01386117935180664, -0.013223648071289062, -0.012586116790771484, -0.011948585510253906, -0.011311054229736328, -0.01067352294921875, -0.010035991668701172, -0.009398460388183594, -0.008760929107666016, -0.008123397827148438, -0.007485866546630859, -0.006848335266113281, -0.006210803985595703, -0.005573272705078125, -0.004935741424560547, -0.004298210144042969, -0.0036606788635253906, -0.0030231475830078125, -0.0023856163024902344, -0.0017480850219726562, -0.0011105537414550781, -0.0004730224609375, 0.00016450881958007812, 0.0008020401000976562, 0.0014395713806152344, 0.0020771026611328125, 0.0027146339416503906, 0.0033521652221679688, 0.003989696502685547, 0.004627227783203125, 0.005264759063720703, 0.005902290344238281, 0.006539821624755859, 0.0071773529052734375, 0.007814884185791016, 0.008452415466308594, 0.009089946746826172, 0.00972747802734375, 0.010365009307861328, 0.011002540588378906, 0.011640071868896484, 0.012277603149414062, 0.01291513442993164, 0.013552665710449219, 0.014190196990966797, 0.014827728271484375, 0.015465259552001953, 0.01610279083251953, 0.01674032211303711, 0.017377853393554688, 0.018015384674072266, 0.018652915954589844, 0.019290447235107422, 0.019927978515625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 0.0, 2.0, 7.0, 8.0, 5.0, 9.0, 12.0, 11.0, 29.0, 39.0, 30.0, 43.0, 62.0, 66.0, 95.0, 100.0, 112.0, 184.0, 220.0, 350.0, 678.0, 1819.0, 25732.0, 997098.0, 18239.0, 1595.0, 658.0, 321.0, 226.0, 161.0, 140.0, 99.0, 70.0, 73.0, 67.0, 51.0, 31.0, 21.0, 24.0, 19.0, 18.0, 7.0, 9.0, 5.0, 3.0, 7.0, 3.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09442138671875, -0.09132194519042969, -0.08822250366210938, -0.08512306213378906, -0.08202362060546875, -0.07892417907714844, -0.07582473754882812, -0.07272529602050781, -0.0696258544921875, -0.06652641296386719, -0.06342697143554688, -0.06032752990722656, -0.05722808837890625, -0.05412864685058594, -0.051029205322265625, -0.04792976379394531, -0.044830322265625, -0.04173088073730469, -0.038631439208984375, -0.03553199768066406, -0.03243255615234375, -0.029333114624023438, -0.026233673095703125, -0.023134231567382812, -0.0200347900390625, -0.016935348510742188, -0.013835906982421875, -0.010736465454101562, -0.00763702392578125, -0.0045375823974609375, -0.001438140869140625, 0.0016613006591796875, 0.0047607421875, 0.007860183715820312, 0.010959625244140625, 0.014059066772460938, 0.01715850830078125, 0.020257949829101562, 0.023357391357421875, 0.026456832885742188, 0.0295562744140625, 0.03265571594238281, 0.035755157470703125, 0.03885459899902344, 0.04195404052734375, 0.04505348205566406, 0.048152923583984375, 0.05125236511230469, 0.054351806640625, 0.05745124816894531, 0.060550689697265625, 0.06365013122558594, 0.06674957275390625, 0.06984901428222656, 0.07294845581054688, 0.07604789733886719, 0.0791473388671875, 0.08224678039550781, 0.08534622192382812, 0.08844566345214844, 0.09154510498046875, 0.09464454650878906, 0.09774398803710938, 0.10084342956542969, 0.10394287109375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 7.0, 6.0, 10.0, 14.0, 16.0, 19.0, 22.0, 20.0, 24.0, 27.0, 32.0, 38.0, 33.0, 35.0, 55.0, 46.0, 46.0, 50.0, 55.0, 45.0, 51.0, 37.0, 43.0, 38.0, 28.0, 18.0, 18.0, 26.0, 22.0, 24.0, 23.0, 11.0, 9.0, 10.0, 15.0, 5.0, 3.0, 4.0, 3.0, 2.0, 5.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.055206298828125, -0.05335378646850586, -0.05150127410888672, -0.04964876174926758, -0.04779624938964844, -0.0459437370300293, -0.044091224670410156, -0.042238712310791016, -0.040386199951171875, -0.038533687591552734, -0.036681175231933594, -0.03482866287231445, -0.03297615051269531, -0.031123638153076172, -0.02927112579345703, -0.02741861343383789, -0.02556610107421875, -0.02371358871459961, -0.02186107635498047, -0.020008563995361328, -0.018156051635742188, -0.016303539276123047, -0.014451026916503906, -0.012598514556884766, -0.010746002197265625, -0.008893489837646484, -0.007040977478027344, -0.005188465118408203, -0.0033359527587890625, -0.0014834403991699219, 0.00036907196044921875, 0.0022215843200683594, 0.0040740966796875, 0.005926609039306641, 0.007779121398925781, 0.009631633758544922, 0.011484146118164062, 0.013336658477783203, 0.015189170837402344, 0.017041683197021484, 0.018894195556640625, 0.020746707916259766, 0.022599220275878906, 0.024451732635498047, 0.026304244995117188, 0.028156757354736328, 0.03000926971435547, 0.03186178207397461, 0.03371429443359375, 0.03556680679321289, 0.03741931915283203, 0.03927183151245117, 0.04112434387207031, 0.04297685623168945, 0.044829368591308594, 0.046681880950927734, 0.048534393310546875, 0.050386905670166016, 0.052239418029785156, 0.0540919303894043, 0.05594444274902344, 0.05779695510864258, 0.05964946746826172, 0.06150197982788086, 0.0633544921875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 7.0, 6.0, 5.0, 7.0, 7.0, 22.0, 36.0, 43.0, 84.0, 147.0, 310.0, 682.0, 1830.0, 6690.0, 50846.0, 926746.0, 50960.0, 7018.0, 1756.0, 727.0, 272.0, 144.0, 78.0, 42.0, 28.0, 18.0, 12.0, 9.0, 6.0, 9.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.499622344970703e-05, -8.229818195104599e-05, -7.960014045238495e-05, -7.690209895372391e-05, -7.420405745506287e-05, -7.150601595640182e-05, -6.880797445774078e-05, -6.610993295907974e-05, -6.34118914604187e-05, -6.071384996175766e-05, -5.801580846309662e-05, -5.531776696443558e-05, -5.2619725465774536e-05, -4.9921683967113495e-05, -4.7223642468452454e-05, -4.452560096979141e-05, -4.182755947113037e-05, -3.912951797246933e-05, -3.643147647380829e-05, -3.373343497514725e-05, -3.1035393476486206e-05, -2.8337351977825165e-05, -2.5639310479164124e-05, -2.2941268980503082e-05, -2.024322748184204e-05, -1.7545185983181e-05, -1.4847144484519958e-05, -1.2149102985858917e-05, -9.451061487197876e-06, -6.753019988536835e-06, -4.0549784898757935e-06, -1.3569369912147522e-06, 1.341104507446289e-06, 4.03914600610733e-06, 6.737187504768372e-06, 9.435229003429413e-06, 1.2133270502090454e-05, 1.4831312000751495e-05, 1.7529353499412537e-05, 2.0227394998073578e-05, 2.292543649673462e-05, 2.562347799539566e-05, 2.83215194940567e-05, 3.101956099271774e-05, 3.3717602491378784e-05, 3.6415643990039825e-05, 3.911368548870087e-05, 4.181172698736191e-05, 4.450976848602295e-05, 4.720780998468399e-05, 4.990585148334503e-05, 5.260389298200607e-05, 5.5301934480667114e-05, 5.7999975979328156e-05, 6.06980174779892e-05, 6.339605897665024e-05, 6.609410047531128e-05, 6.879214197397232e-05, 7.149018347263336e-05, 7.41882249712944e-05, 7.688626646995544e-05, 7.958430796861649e-05, 8.228234946727753e-05, 8.498039096593857e-05, 8.767843246459961e-05]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 4.0, 9.0, 9.0, 11.0, 9.0, 17.0, 15.0, 21.0, 25.0, 23.0, 48.0, 50.0, 37.0, 65.0, 33.0, 78.0, 46.0, 67.0, 66.0, 38.0, 50.0, 28.0, 50.0, 24.0, 31.0, 32.0, 18.0, 25.0, 11.0, 16.0, 8.0, 3.0, 7.0, 1.0, 7.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.76837158203125e-06, -4.614703357219696e-06, -4.461035132408142e-06, -4.307366907596588e-06, -4.153698682785034e-06, -4.00003045797348e-06, -3.846362233161926e-06, -3.6926940083503723e-06, -3.5390257835388184e-06, -3.3853575587272644e-06, -3.2316893339157104e-06, -3.0780211091041565e-06, -2.9243528842926025e-06, -2.7706846594810486e-06, -2.6170164346694946e-06, -2.4633482098579407e-06, -2.3096799850463867e-06, -2.1560117602348328e-06, -2.002343535423279e-06, -1.8486753106117249e-06, -1.695007085800171e-06, -1.541338860988617e-06, -1.387670636177063e-06, -1.234002411365509e-06, -1.080334186553955e-06, -9.266659617424011e-07, -7.729977369308472e-07, -6.193295121192932e-07, -4.6566128730773926e-07, -3.119930624961853e-07, -1.5832483768463135e-07, -4.6566128730773926e-09, 1.4901161193847656e-07, 3.026798367500305e-07, 4.5634806156158447e-07, 6.100162863731384e-07, 7.636845111846924e-07, 9.173527359962463e-07, 1.0710209608078003e-06, 1.2246891856193542e-06, 1.3783574104309082e-06, 1.5320256352424622e-06, 1.6856938600540161e-06, 1.83936208486557e-06, 1.993030309677124e-06, 2.146698534488678e-06, 2.300366759300232e-06, 2.454034984111786e-06, 2.60770320892334e-06, 2.761371433734894e-06, 2.9150396585464478e-06, 3.0687078833580017e-06, 3.2223761081695557e-06, 3.3760443329811096e-06, 3.5297125577926636e-06, 3.6833807826042175e-06, 3.8370490074157715e-06, 3.9907172322273254e-06, 4.144385457038879e-06, 4.298053681850433e-06, 4.451721906661987e-06, 4.605390131473541e-06, 4.759058356285095e-06, 4.912726581096649e-06, 5.066394805908203e-06]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 5.0, 2.0, 8.0, 12.0, 23.0, 16.0, 21.0, 49.0, 74.0, 101.0, 151.0, 313.0, 673.0, 3927.0, 1029759.0, 11608.0, 902.0, 361.0, 206.0, 105.0, 79.0, 48.0, 35.0, 16.0, 17.0, 10.0, 7.0, 7.0, 3.0, 4.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001697540283203125, -0.0001647062599658966, -0.0001596584916114807, -0.00015461072325706482, -0.00014956295490264893, -0.00014451518654823303, -0.00013946741819381714, -0.00013441964983940125, -0.00012937188148498535, -0.00012432411313056946, -0.00011927634477615356, -0.00011422857642173767, -0.00010918080806732178, -0.00010413303971290588, -9.908527135848999e-05, -9.40375030040741e-05, -8.89897346496582e-05, -8.394196629524231e-05, -7.889419794082642e-05, -7.384642958641052e-05, -6.879866123199463e-05, -6.375089287757874e-05, -5.870312452316284e-05, -5.365535616874695e-05, -4.8607587814331055e-05, -4.355981945991516e-05, -3.851205110549927e-05, -3.3464282751083374e-05, -2.841651439666748e-05, -2.3368746042251587e-05, -1.8320977687835693e-05, -1.32732093334198e-05, -8.225440979003906e-06, -3.1776726245880127e-06, 1.8700957298278809e-06, 6.917864084243774e-06, 1.1965632438659668e-05, 1.701340079307556e-05, 2.2061169147491455e-05, 2.710893750190735e-05, 3.215670585632324e-05, 3.7204474210739136e-05, 4.225224256515503e-05, 4.730001091957092e-05, 5.2347779273986816e-05, 5.739554762840271e-05, 6.24433159828186e-05, 6.74910843372345e-05, 7.253885269165039e-05, 7.758662104606628e-05, 8.263438940048218e-05, 8.768215775489807e-05, 9.272992610931396e-05, 9.777769446372986e-05, 0.00010282546281814575, 0.00010787323117256165, 0.00011292099952697754, 0.00011796876788139343, 0.00012301653623580933, 0.00012806430459022522, 0.0001331120729446411, 0.000138159841299057, 0.0001432076096534729, 0.0001482553780078888, 0.0001533031463623047]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 7.0, 9.0, 8.0, 8.0, 18.0, 18.0, 24.0, 31.0, 36.0, 58.0, 71.0, 111.0, 115.0, 115.0, 87.0, 76.0, 56.0, 51.0, 23.0, 28.0, 18.0, 12.0, 6.0, 2.0, 2.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00010448694229125977, -0.00010173581540584564, -9.898468852043152e-05, -9.62335616350174e-05, -9.348243474960327e-05, -9.073130786418915e-05, -8.798018097877502e-05, -8.52290540933609e-05, -8.247792720794678e-05, -7.972680032253265e-05, -7.697567343711853e-05, -7.42245465517044e-05, -7.147341966629028e-05, -6.872229278087616e-05, -6.597116589546204e-05, -6.322003901004791e-05, -6.046891212463379e-05, -5.7717785239219666e-05, -5.496665835380554e-05, -5.221553146839142e-05, -4.9464404582977295e-05, -4.671327769756317e-05, -4.396215081214905e-05, -4.1211023926734924e-05, -3.84598970413208e-05, -3.570877015590668e-05, -3.2957643270492554e-05, -3.020651638507843e-05, -2.7455389499664307e-05, -2.4704262614250183e-05, -2.195313572883606e-05, -1.9202008843421936e-05, -1.6450881958007812e-05, -1.3699755072593689e-05, -1.0948628187179565e-05, -8.197501301765442e-06, -5.446374416351318e-06, -2.695247530937195e-06, 5.587935447692871e-08, 2.8070062398910522e-06, 5.558133125305176e-06, 8.3092600107193e-06, 1.1060386896133423e-05, 1.3811513781547546e-05, 1.656264066696167e-05, 1.9313767552375793e-05, 2.2064894437789917e-05, 2.481602132320404e-05, 2.7567148208618164e-05, 3.0318275094032288e-05, 3.306940197944641e-05, 3.5820528864860535e-05, 3.857165575027466e-05, 4.132278263568878e-05, 4.4073909521102905e-05, 4.682503640651703e-05, 4.957616329193115e-05, 5.2327290177345276e-05, 5.50784170627594e-05, 5.782954394817352e-05, 6.0580670833587646e-05, 6.333179771900177e-05, 6.60829246044159e-05, 6.883405148983002e-05, 7.158517837524414e-05]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 9.0, 58.0, 748.0, 173.0, 21.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.49996310472488403, -0.4876924157142639, -0.4754217565059662, -0.46315106749534607, -0.45088037848472595, -0.43860968947410583, -0.4263390302658081, -0.414068341255188, -0.40179765224456787, -0.38952696323394775, -0.37725630402565, -0.3649856150150299, -0.3527149260044098, -0.3404442369937897, -0.32817357778549194, -0.3159028887748718, -0.3036321997642517, -0.2913615107536316, -0.27909085154533386, -0.26682016253471375, -0.25454947352409363, -0.2422787994146347, -0.23000812530517578, -0.21773743629455566, -0.20546677708625793, -0.193196102976799, -0.1809254139661789, -0.16865473985671997, -0.15638405084609985, -0.14411337673664093, -0.131842702627182, -0.11957201361656189, -0.10730132460594177, -0.09503064304590225, -0.08275996148586273, -0.07048928737640381, -0.05821860209107399, -0.04594792053103447, -0.03367724269628525, -0.021406561136245728, -0.009135879576206207, 0.0031348010525107384, 0.015405481681227684, 0.027676161378622055, 0.039946842938661575, 0.052217524498701096, 0.06448820233345032, 0.07675888389348984, 0.08902956545352936, 0.10130024701356888, 0.1135709285736084, 0.12584160268306732, 0.13811229169368744, 0.15038296580314636, 0.16265365481376648, 0.1749243289232254, 0.18719500303268433, 0.19946567714214325, 0.21173636615276337, 0.2240070402622223, 0.2362777292728424, 0.24854840338230133, 0.26081907749176025, 0.27308976650238037, 0.2853604555130005]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 10.0, 10.0, 18.0, 19.0, 21.0, 26.0, 13.0, 39.0, 30.0, 36.0, 54.0, 42.0, 49.0, 46.0, 71.0, 65.0, 67.0, 51.0, 48.0, 43.0, 48.0, 29.0, 37.0, 25.0, 24.0, 16.0, 16.0, 21.0, 3.0, 7.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3970259428024292, -0.3834264278411865, -0.36982694268226624, -0.35622742772102356, -0.34262794256210327, -0.3290284276008606, -0.3154289126396179, -0.30182939767837524, -0.28822991251945496, -0.2746303975582123, -0.261030912399292, -0.24743139743804932, -0.23383189737796783, -0.22023239731788635, -0.20663288235664368, -0.1930333822965622, -0.1794338822364807, -0.16583438217639923, -0.15223488211631775, -0.13863536715507507, -0.1250358670949936, -0.11143636703491211, -0.09783685952425003, -0.08423735201358795, -0.07063785195350647, -0.05703834816813469, -0.04343884438276291, -0.02983934059739113, -0.016239836812019348, -0.002640336751937866, 0.010959170758724213, 0.02455867826938629, 0.03815817832946777, 0.051757682114839554, 0.06535718590021133, 0.07895669341087341, 0.0925561934709549, 0.10615569353103638, 0.11975520104169846, 0.13335470855236053, 0.14695420861244202, 0.1605537086725235, 0.17415320873260498, 0.18775272369384766, 0.20135222375392914, 0.21495172381401062, 0.2285512387752533, 0.24215073883533478, 0.25575023889541626, 0.26934975385665894, 0.2829492390155792, 0.2965487539768219, 0.3101482391357422, 0.32374775409698486, 0.33734726905822754, 0.3509467840194702, 0.3645462691783905, 0.3781457841396332, 0.39174526929855347, 0.40534478425979614, 0.4189442992210388, 0.4325437843799591, 0.4461432993412018, 0.45974278450012207, 0.47334229946136475]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 4.0, 6.0, 3.0, 5.0, 8.0, 8.0, 23.0, 18.0, 15.0, 18.0, 31.0, 46.0, 56.0, 84.0, 106.0, 221.0, 3370.0, 4188287.0, 1400.0, 171.0, 113.0, 71.0, 56.0, 41.0, 26.0, 21.0, 17.0, 11.0, 12.0, 6.0, 2.0, 7.0, 1.0, 2.0, 3.0, 5.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1282958984375, -0.12432861328125, -0.120361328125, -0.11639404296875, -0.1124267578125, -0.10845947265625, -0.1044921875, -0.10052490234375, -0.0965576171875, -0.09259033203125, -0.088623046875, -0.08465576171875, -0.0806884765625, -0.07672119140625, -0.07275390625, -0.06878662109375, -0.0648193359375, -0.06085205078125, -0.056884765625, -0.05291748046875, -0.0489501953125, -0.04498291015625, -0.041015625, -0.03704833984375, -0.0330810546875, -0.02911376953125, -0.025146484375, -0.02117919921875, -0.0172119140625, -0.01324462890625, -0.00927734375, -0.00531005859375, -0.0013427734375, 0.00262451171875, 0.006591796875, 0.01055908203125, 0.0145263671875, 0.01849365234375, 0.0224609375, 0.02642822265625, 0.0303955078125, 0.03436279296875, 0.038330078125, 0.04229736328125, 0.0462646484375, 0.05023193359375, 0.05419921875, 0.05816650390625, 0.0621337890625, 0.06610107421875, 0.070068359375, 0.07403564453125, 0.0780029296875, 0.08197021484375, 0.0859375, 0.08990478515625, 0.0938720703125, 0.09783935546875, 0.101806640625, 0.10577392578125, 0.1097412109375, 0.11370849609375, 0.11767578125, 0.12164306640625, 0.1256103515625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 3.0, 1.0, 3.0, 2.0, 6.0, 1.0, 3.0, 1.0, 4.0, 10.0, 15.0, 22.0, 7.0, 19.0, 138.0, 455.0, 183.0, 40.0, 13.0, 8.0, 8.0, 6.0, 10.0, 11.0, 7.0, 3.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0204925537109375, -0.01986098289489746, -0.019229412078857422, -0.018597841262817383, -0.017966270446777344, -0.017334699630737305, -0.016703128814697266, -0.016071557998657227, -0.015439987182617188, -0.014808416366577148, -0.01417684555053711, -0.01354527473449707, -0.012913703918457031, -0.012282133102416992, -0.011650562286376953, -0.011018991470336914, -0.010387420654296875, -0.009755849838256836, -0.009124279022216797, -0.008492708206176758, -0.007861137390136719, -0.00722956657409668, -0.006597995758056641, -0.0059664249420166016, -0.0053348541259765625, -0.0047032833099365234, -0.004071712493896484, -0.0034401416778564453, -0.0028085708618164062, -0.002177000045776367, -0.0015454292297363281, -0.0009138584136962891, -0.00028228759765625, 0.00034928321838378906, 0.0009808540344238281, 0.0016124248504638672, 0.0022439956665039062, 0.0028755664825439453, 0.0035071372985839844, 0.0041387081146240234, 0.0047702789306640625, 0.0054018497467041016, 0.006033420562744141, 0.00666499137878418, 0.007296562194824219, 0.007928133010864258, 0.008559703826904297, 0.009191274642944336, 0.009822845458984375, 0.010454416275024414, 0.011085987091064453, 0.011717557907104492, 0.012349128723144531, 0.01298069953918457, 0.01361227035522461, 0.014243841171264648, 0.014875411987304688, 0.015506982803344727, 0.016138553619384766, 0.016770124435424805, 0.017401695251464844, 0.018033266067504883, 0.018664836883544922, 0.01929640769958496, 0.019927978515625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 7.0, 21.0, 17.0, 38.0, 148.0, 527.0, 3281.0, 4187496.0, 2404.0, 193.0, 76.0, 30.0, 11.0, 12.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08441162109375, -0.0813302993774414, -0.07824897766113281, -0.07516765594482422, -0.07208633422851562, -0.06900501251220703, -0.06592369079589844, -0.06284236907958984, -0.05976104736328125, -0.056679725646972656, -0.05359840393066406, -0.05051708221435547, -0.047435760498046875, -0.04435443878173828, -0.04127311706542969, -0.038191795349121094, -0.0351104736328125, -0.032029151916503906, -0.028947830200195312, -0.02586650848388672, -0.022785186767578125, -0.01970386505126953, -0.016622543334960938, -0.013541221618652344, -0.01045989990234375, -0.007378578186035156, -0.0042972564697265625, -0.0012159347534179688, 0.001865386962890625, 0.004946708679199219, 0.008028030395507812, 0.011109352111816406, 0.014190673828125, 0.017271995544433594, 0.020353317260742188, 0.02343463897705078, 0.026515960693359375, 0.02959728240966797, 0.03267860412597656, 0.035759925842285156, 0.03884124755859375, 0.041922569274902344, 0.04500389099121094, 0.04808521270751953, 0.051166534423828125, 0.05424785614013672, 0.05732917785644531, 0.060410499572753906, 0.0634918212890625, 0.0665731430053711, 0.06965446472167969, 0.07273578643798828, 0.07581710815429688, 0.07889842987060547, 0.08197975158691406, 0.08506107330322266, 0.08814239501953125, 0.09122371673583984, 0.09430503845214844, 0.09738636016845703, 0.10046768188476562, 0.10354900360107422, 0.10663032531738281, 0.1097116470336914, 0.11279296875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 7.0, 4.0, 23.0, 64.0, 3755.0, 159.0, 32.0, 10.0, 7.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0250091552734375, -0.024379968643188477, -0.023750782012939453, -0.02312159538269043, -0.022492408752441406, -0.021863222122192383, -0.02123403549194336, -0.020604848861694336, -0.019975662231445312, -0.01934647560119629, -0.018717288970947266, -0.018088102340698242, -0.01745891571044922, -0.016829729080200195, -0.016200542449951172, -0.015571355819702148, -0.014942169189453125, -0.014312982559204102, -0.013683795928955078, -0.013054609298706055, -0.012425422668457031, -0.011796236038208008, -0.011167049407958984, -0.010537862777709961, -0.009908676147460938, -0.009279489517211914, -0.00865030288696289, -0.008021116256713867, -0.007391929626464844, -0.00676274299621582, -0.006133556365966797, -0.0055043697357177734, -0.00487518310546875, -0.0042459964752197266, -0.003616809844970703, -0.0029876232147216797, -0.0023584365844726562, -0.0017292499542236328, -0.0011000633239746094, -0.00047087669372558594, 0.0001583099365234375, 0.0007874965667724609, 0.0014166831970214844, 0.002045869827270508, 0.0026750564575195312, 0.0033042430877685547, 0.003933429718017578, 0.0045626163482666016, 0.005191802978515625, 0.0058209896087646484, 0.006450176239013672, 0.007079362869262695, 0.007708549499511719, 0.008337736129760742, 0.008966922760009766, 0.009596109390258789, 0.010225296020507812, 0.010854482650756836, 0.01148366928100586, 0.012112855911254883, 0.012742042541503906, 0.01337122917175293, 0.014000415802001953, 0.014629602432250977, 0.0152587890625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 998.0, 21.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5493103265762329, -0.5399830937385559, -0.5306558012962341, -0.5213285684585571, -0.5120012760162354, -0.5026740431785583, -0.49334678053855896, -0.48401951789855957, -0.4746922552585602, -0.4653649926185608, -0.4560377299785614, -0.446710467338562, -0.437383234500885, -0.4280559718608856, -0.41872870922088623, -0.40940144658088684, -0.40007418394088745, -0.39074692130088806, -0.38141965866088867, -0.3720923960208893, -0.3627651333808899, -0.3534379005432129, -0.3441106379032135, -0.3347833752632141, -0.3254561126232147, -0.31612884998321533, -0.30680158734321594, -0.29747432470321655, -0.28814709186553955, -0.27881982922554016, -0.26949256658554077, -0.2601653039455414, -0.250838041305542, -0.2415107786655426, -0.2321835160255432, -0.22285626828670502, -0.21352900564670563, -0.20420174300670624, -0.19487449526786804, -0.18554723262786865, -0.17621998488903046, -0.16689272224903107, -0.15756547451019287, -0.14823821187019348, -0.1389109492301941, -0.1295836865901947, -0.12025643140077591, -0.11092917621135712, -0.10160191357135773, -0.09227465093135834, -0.08294739574193954, -0.07362014055252075, -0.06429287791252136, -0.05496561899781227, -0.04563836008310318, -0.03631110489368439, -0.026983842253684998, -0.017656583338975906, -0.008329324424266815, 0.000997934490442276, 0.010325193405151367, 0.01965245231986046, 0.02897971123456955, 0.03830696642398834, 0.04763422906398773]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 12.0, 5.0, 17.0, 16.0, 26.0, 26.0, 31.0, 44.0, 45.0, 40.0, 54.0, 66.0, 64.0, 76.0, 66.0, 52.0, 57.0, 60.0, 41.0, 40.0, 33.0, 32.0, 32.0, 19.0, 11.0, 10.0, 7.0, 4.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023692727088928223, -0.022679012268781662, -0.021665295585989952, -0.020651578903198242, -0.01963786408305168, -0.01862414926290512, -0.01761043258011341, -0.0165967158973217, -0.01558300107717514, -0.014569285325706005, -0.01355556957423687, -0.012541853822767735, -0.0115281380712986, -0.010514422319829464, -0.009500706568360329, -0.008486990816891193, -0.007473275065422058, -0.006459559313952923, -0.0054458435624837875, -0.004432127811014652, -0.003418412059545517, -0.0024046963080763817, -0.0013909805566072464, -0.0003772648051381111, 0.0006364509463310242, 0.0016501666978001595, 0.0026638824492692947, 0.00367759820073843, 0.004691313952207565, 0.005705029703676701, 0.006718745455145836, 0.007732461206614971, 0.008746176958084106, 0.009759892709553242, 0.010773608461022377, 0.011787324212491512, 0.012801039963960648, 0.013814755715429783, 0.014828471466898918, 0.015842188149690628, 0.01685590296983719, 0.01786961778998375, 0.01888333447277546, 0.01989705115556717, 0.02091076597571373, 0.02192448079586029, 0.022938197478652, 0.02395191416144371, 0.02496562898159027, 0.02597934380173683, 0.02699306048452854, 0.02800677716732025, 0.029020491987466812, 0.030034206807613373, 0.031047923490405083, 0.03206164017319679, 0.03307535499334335, 0.034089069813489914, 0.035102784633636475, 0.036116503179073334, 0.037130217999219894, 0.038143932819366455, 0.039157651364803314, 0.040171366184949875, 0.041185081005096436]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 4.0, 4.0, 5.0, 8.0, 5.0, 5.0, 12.0, 10.0, 9.0, 13.0, 19.0, 31.0, 46.0, 53.0, 67.0, 97.0, 127.0, 155.0, 217.0, 307.0, 438.0, 631.0, 943.0, 1452.0, 2341.0, 4026.0, 7524.0, 18436.0, 261692.0, 709523.0, 20707.0, 8350.0, 4068.0, 2336.0, 1469.0, 1019.0, 677.0, 493.0, 333.0, 234.0, 167.0, 124.0, 110.0, 63.0, 56.0, 48.0, 31.0, 19.0, 13.0, 13.0, 6.0, 6.0, 7.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.0235137939453125, -0.02277994155883789, -0.02204608917236328, -0.021312236785888672, -0.020578384399414062, -0.019844532012939453, -0.019110679626464844, -0.018376827239990234, -0.017642974853515625, -0.016909122467041016, -0.016175270080566406, -0.015441417694091797, -0.014707565307617188, -0.013973712921142578, -0.013239860534667969, -0.01250600814819336, -0.01177215576171875, -0.01103830337524414, -0.010304450988769531, -0.009570598602294922, -0.008836746215820312, -0.008102893829345703, -0.007369041442871094, -0.006635189056396484, -0.005901336669921875, -0.005167484283447266, -0.004433631896972656, -0.003699779510498047, -0.0029659271240234375, -0.002232074737548828, -0.0014982223510742188, -0.0007643699645996094, -3.0517578125e-05, 0.0007033348083496094, 0.0014371871948242188, 0.002171039581298828, 0.0029048919677734375, 0.003638744354248047, 0.004372596740722656, 0.005106449127197266, 0.005840301513671875, 0.006574153900146484, 0.007308006286621094, 0.008041858673095703, 0.008775711059570312, 0.009509563446044922, 0.010243415832519531, 0.01097726821899414, 0.01171112060546875, 0.01244497299194336, 0.013178825378417969, 0.013912677764892578, 0.014646530151367188, 0.015380382537841797, 0.016114234924316406, 0.016848087310791016, 0.017581939697265625, 0.018315792083740234, 0.019049644470214844, 0.019783496856689453, 0.020517349243164062, 0.021251201629638672, 0.02198505401611328, 0.02271890640258789, 0.0234527587890625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 3.0, 2.0, 3.0, 2.0, 6.0, 1.0, 3.0, 1.0, 4.0, 10.0, 15.0, 22.0, 7.0, 17.0, 127.0, 458.0, 191.0, 40.0, 14.0, 9.0, 8.0, 6.0, 10.0, 10.0, 5.0, 6.0, 4.0, 4.0, 0.0, 4.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0204925537109375, -0.019861459732055664, -0.019230365753173828, -0.018599271774291992, -0.017968177795410156, -0.01733708381652832, -0.016705989837646484, -0.01607489585876465, -0.015443801879882812, -0.014812707901000977, -0.01418161392211914, -0.013550519943237305, -0.012919425964355469, -0.012288331985473633, -0.011657238006591797, -0.011026144027709961, -0.010395050048828125, -0.009763956069946289, -0.009132862091064453, -0.008501768112182617, -0.007870674133300781, -0.007239580154418945, -0.006608486175537109, -0.0059773921966552734, -0.0053462982177734375, -0.0047152042388916016, -0.004084110260009766, -0.0034530162811279297, -0.0028219223022460938, -0.002190828323364258, -0.0015597343444824219, -0.0009286403656005859, -0.00029754638671875, 0.00033354759216308594, 0.0009646415710449219, 0.0015957355499267578, 0.0022268295288085938, 0.0028579235076904297, 0.0034890174865722656, 0.0041201114654541016, 0.0047512054443359375, 0.0053822994232177734, 0.006013393402099609, 0.006644487380981445, 0.007275581359863281, 0.007906675338745117, 0.008537769317626953, 0.009168863296508789, 0.009799957275390625, 0.010431051254272461, 0.011062145233154297, 0.011693239212036133, 0.012324333190917969, 0.012955427169799805, 0.01358652114868164, 0.014217615127563477, 0.014848709106445312, 0.015479803085327148, 0.016110897064208984, 0.01674199104309082, 0.017373085021972656, 0.018004179000854492, 0.018635272979736328, 0.019266366958618164, 0.0198974609375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 6.0, 4.0, 2.0, 4.0, 7.0, 9.0, 12.0, 23.0, 15.0, 17.0, 27.0, 20.0, 26.0, 35.0, 50.0, 53.0, 62.0, 97.0, 110.0, 188.0, 249.0, 409.0, 688.0, 1462.0, 8608.0, 899537.0, 130456.0, 3513.0, 1117.0, 530.0, 318.0, 206.0, 128.0, 113.0, 88.0, 76.0, 67.0, 41.0, 35.0, 39.0, 15.0, 30.0, 15.0, 12.0, 9.0, 11.0, 3.0, 9.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.06378173828125, -0.06164264678955078, -0.05950355529785156, -0.057364463806152344, -0.055225372314453125, -0.053086280822753906, -0.05094718933105469, -0.04880809783935547, -0.04666900634765625, -0.04452991485595703, -0.04239082336425781, -0.040251731872558594, -0.038112640380859375, -0.035973548889160156, -0.03383445739746094, -0.03169536590576172, -0.0295562744140625, -0.02741718292236328, -0.025278091430664062, -0.023138999938964844, -0.020999908447265625, -0.018860816955566406, -0.016721725463867188, -0.014582633972167969, -0.01244354248046875, -0.010304450988769531, -0.008165359497070312, -0.006026268005371094, -0.003887176513671875, -0.0017480850219726562, 0.0003910064697265625, 0.0025300979614257812, 0.004669189453125, 0.006808280944824219, 0.008947372436523438, 0.011086463928222656, 0.013225555419921875, 0.015364646911621094, 0.017503738403320312, 0.01964282989501953, 0.02178192138671875, 0.02392101287841797, 0.026060104370117188, 0.028199195861816406, 0.030338287353515625, 0.032477378845214844, 0.03461647033691406, 0.03675556182861328, 0.0388946533203125, 0.04103374481201172, 0.04317283630371094, 0.045311927795410156, 0.047451019287109375, 0.049590110778808594, 0.05172920227050781, 0.05386829376220703, 0.05600738525390625, 0.05814647674560547, 0.06028556823730469, 0.062424659729003906, 0.06456375122070312, 0.06670284271240234, 0.06884193420410156, 0.07098102569580078, 0.0731201171875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 0.0, 8.0, 3.0, 4.0, 9.0, 15.0, 8.0, 19.0, 11.0, 8.0, 18.0, 14.0, 22.0, 23.0, 25.0, 28.0, 34.0, 39.0, 35.0, 38.0, 51.0, 27.0, 50.0, 43.0, 40.0, 41.0, 48.0, 39.0, 37.0, 32.0, 39.0, 25.0, 34.0, 25.0, 22.0, 16.0, 15.0, 12.0, 4.0, 9.0, 4.0, 6.0, 7.0, 5.0, 1.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.045745849609375, -0.04419136047363281, -0.042636871337890625, -0.04108238220214844, -0.03952789306640625, -0.03797340393066406, -0.036418914794921875, -0.03486442565917969, -0.0333099365234375, -0.03175544738769531, -0.030200958251953125, -0.028646469116210938, -0.02709197998046875, -0.025537490844726562, -0.023983001708984375, -0.022428512573242188, -0.0208740234375, -0.019319534301757812, -0.017765045166015625, -0.016210556030273438, -0.01465606689453125, -0.013101577758789062, -0.011547088623046875, -0.009992599487304688, -0.0084381103515625, -0.0068836212158203125, -0.005329132080078125, -0.0037746429443359375, -0.00222015380859375, -0.0006656646728515625, 0.000888824462890625, 0.0024433135986328125, 0.003997802734375, 0.0055522918701171875, 0.007106781005859375, 0.008661270141601562, 0.01021575927734375, 0.011770248413085938, 0.013324737548828125, 0.014879226684570312, 0.0164337158203125, 0.017988204956054688, 0.019542694091796875, 0.021097183227539062, 0.02265167236328125, 0.024206161499023438, 0.025760650634765625, 0.027315139770507812, 0.02886962890625, 0.030424118041992188, 0.031978607177734375, 0.03353309631347656, 0.03508758544921875, 0.03664207458496094, 0.038196563720703125, 0.03975105285644531, 0.0413055419921875, 0.04286003112792969, 0.044414520263671875, 0.04596900939941406, 0.04752349853515625, 0.04907798767089844, 0.050632476806640625, 0.05218696594238281, 0.053741455078125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 10.0, 3.0, 12.0, 17.0, 18.0, 33.0, 51.0, 66.0, 137.0, 277.0, 714.0, 2829.0, 19488.0, 960456.0, 57580.0, 4869.0, 1195.0, 370.0, 163.0, 99.0, 55.0, 30.0, 18.0, 17.0, 17.0, 3.0, 6.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.16312026977539e-05, -5.878787487745285e-05, -5.5944547057151794e-05, -5.310121923685074e-05, -5.025789141654968e-05, -4.741456359624863e-05, -4.457123577594757e-05, -4.1727907955646515e-05, -3.888458013534546e-05, -3.60412523150444e-05, -3.319792449474335e-05, -3.035459667444229e-05, -2.7511268854141235e-05, -2.466794103384018e-05, -2.1824613213539124e-05, -1.8981285393238068e-05, -1.6137957572937012e-05, -1.3294629752635956e-05, -1.04513019323349e-05, -7.607974112033844e-06, -4.764646291732788e-06, -1.921318471431732e-06, 9.220093488693237e-07, 3.7653371691703796e-06, 6.6086649894714355e-06, 9.451992809772491e-06, 1.2295320630073547e-05, 1.5138648450374603e-05, 1.798197627067566e-05, 2.0825304090976715e-05, 2.366863191127777e-05, 2.6511959731578827e-05, 2.9355287551879883e-05, 3.219861537218094e-05, 3.5041943192481995e-05, 3.788527101278305e-05, 4.0728598833084106e-05, 4.357192665338516e-05, 4.641525447368622e-05, 4.9258582293987274e-05, 5.210191011428833e-05, 5.4945237934589386e-05, 5.778856575489044e-05, 6.06318935751915e-05, 6.347522139549255e-05, 6.631854921579361e-05, 6.916187703609467e-05, 7.200520485639572e-05, 7.484853267669678e-05, 7.769186049699783e-05, 8.053518831729889e-05, 8.337851613759995e-05, 8.6221843957901e-05, 8.906517177820206e-05, 9.190849959850311e-05, 9.475182741880417e-05, 9.759515523910522e-05, 0.00010043848305940628, 0.00010328181087970734, 0.00010612513870000839, 0.00010896846652030945, 0.0001118117943406105, 0.00011465512216091156, 0.00011749844998121262, 0.00012034177780151367]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 8.0, 2.0, 11.0, 13.0, 14.0, 20.0, 26.0, 31.0, 32.0, 54.0, 35.0, 35.0, 90.0, 40.0, 75.0, 52.0, 71.0, 56.0, 60.0, 42.0, 40.0, 36.0, 27.0, 29.0, 11.0, 20.0, 8.0, 8.0, 9.0, 4.0, 6.0, 7.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.066394805908203e-06, -4.9211084842681885e-06, -4.775822162628174e-06, -4.630535840988159e-06, -4.4852495193481445e-06, -4.33996319770813e-06, -4.194676876068115e-06, -4.049390554428101e-06, -3.904104232788086e-06, -3.7588179111480713e-06, -3.6135315895080566e-06, -3.468245267868042e-06, -3.3229589462280273e-06, -3.1776726245880127e-06, -3.032386302947998e-06, -2.8870999813079834e-06, -2.7418136596679688e-06, -2.596527338027954e-06, -2.4512410163879395e-06, -2.305954694747925e-06, -2.16066837310791e-06, -2.0153820514678955e-06, -1.8700957298278809e-06, -1.7248094081878662e-06, -1.5795230865478516e-06, -1.434236764907837e-06, -1.2889504432678223e-06, -1.1436641216278076e-06, -9.98377799987793e-07, -8.530914783477783e-07, -7.078051567077637e-07, -5.62518835067749e-07, -4.172325134277344e-07, -2.7194619178771973e-07, -1.2665987014770508e-07, 1.862645149230957e-08, 1.6391277313232422e-07, 3.0919909477233887e-07, 4.544854164123535e-07, 5.997717380523682e-07, 7.450580596923828e-07, 8.903443813323975e-07, 1.0356307029724121e-06, 1.1809170246124268e-06, 1.3262033462524414e-06, 1.471489667892456e-06, 1.6167759895324707e-06, 1.7620623111724854e-06, 1.9073486328125e-06, 2.0526349544525146e-06, 2.1979212760925293e-06, 2.343207597732544e-06, 2.4884939193725586e-06, 2.6337802410125732e-06, 2.779066562652588e-06, 2.9243528842926025e-06, 3.069639205932617e-06, 3.214925527572632e-06, 3.3602118492126465e-06, 3.505498170852661e-06, 3.6507844924926758e-06, 3.7960708141326904e-06, 3.941357135772705e-06, 4.08664345741272e-06, 4.231929779052734e-06]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 8.0, 7.0, 7.0, 10.0, 19.0, 17.0, 13.0, 21.0, 18.0, 45.0, 28.0, 47.0, 71.0, 89.0, 182.0, 254.0, 521.0, 1303.0, 16911.0, 1012063.0, 14229.0, 1312.0, 515.0, 276.0, 174.0, 106.0, 66.0, 48.0, 33.0, 18.0, 31.0, 24.0, 8.0, 10.0, 10.0, 15.0, 12.0, 8.0, 3.0, 4.0, 2.0, 7.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.949901580810547e-05, -6.722006946802139e-05, -6.494112312793732e-05, -6.266217678785324e-05, -6.0383230447769165e-05, -5.810428410768509e-05, -5.582533776760101e-05, -5.354639142751694e-05, -5.126744508743286e-05, -4.8988498747348785e-05, -4.670955240726471e-05, -4.4430606067180634e-05, -4.215165972709656e-05, -3.987271338701248e-05, -3.7593767046928406e-05, -3.531482070684433e-05, -3.3035874366760254e-05, -3.075692802667618e-05, -2.8477981686592102e-05, -2.6199035346508026e-05, -2.392008900642395e-05, -2.1641142666339874e-05, -1.93621963262558e-05, -1.7083249986171722e-05, -1.4804303646087646e-05, -1.252535730600357e-05, -1.0246410965919495e-05, -7.967464625835419e-06, -5.688518285751343e-06, -3.409571945667267e-06, -1.130625605583191e-06, 1.148320734500885e-06, 3.427267074584961e-06, 5.706213414669037e-06, 7.985159754753113e-06, 1.0264106094837189e-05, 1.2543052434921265e-05, 1.482199877500534e-05, 1.7100945115089417e-05, 1.9379891455173492e-05, 2.165883779525757e-05, 2.3937784135341644e-05, 2.621673047542572e-05, 2.8495676815509796e-05, 3.077462315559387e-05, 3.305356949567795e-05, 3.5332515835762024e-05, 3.76114621758461e-05, 3.9890408515930176e-05, 4.216935485601425e-05, 4.444830119609833e-05, 4.6727247536182404e-05, 4.900619387626648e-05, 5.1285140216350555e-05, 5.356408655643463e-05, 5.584303289651871e-05, 5.812197923660278e-05, 6.040092557668686e-05, 6.267987191677094e-05, 6.495881825685501e-05, 6.723776459693909e-05, 6.951671093702316e-05, 7.179565727710724e-05, 7.407460361719131e-05, 7.635354995727539e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 3.0, 5.0, 5.0, 6.0, 5.0, 10.0, 4.0, 5.0, 12.0, 21.0, 14.0, 18.0, 36.0, 39.0, 65.0, 85.0, 99.0, 94.0, 79.0, 97.0, 65.0, 44.0, 40.0, 31.0, 15.0, 13.0, 12.0, 8.0, 12.0, 12.0, 4.0, 4.0, 3.0, 11.0, 7.0, 7.0, 1.0, 4.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.161762237548828e-05, -4.9930065870285034e-05, -4.824250936508179e-05, -4.655495285987854e-05, -4.486739635467529e-05, -4.3179839849472046e-05, -4.14922833442688e-05, -3.980472683906555e-05, -3.8117170333862305e-05, -3.642961382865906e-05, -3.474205732345581e-05, -3.3054500818252563e-05, -3.1366944313049316e-05, -2.967938780784607e-05, -2.7991831302642822e-05, -2.6304274797439575e-05, -2.4616718292236328e-05, -2.292916178703308e-05, -2.1241605281829834e-05, -1.9554048776626587e-05, -1.786649227142334e-05, -1.6178935766220093e-05, -1.4491379261016846e-05, -1.2803822755813599e-05, -1.1116266250610352e-05, -9.428709745407104e-06, -7.741153240203857e-06, -6.05359673500061e-06, -4.366040229797363e-06, -2.678483724594116e-06, -9.909272193908691e-07, 6.966292858123779e-07, 2.384185791015625e-06, 4.071742296218872e-06, 5.759298801422119e-06, 7.446855306625366e-06, 9.134411811828613e-06, 1.082196831703186e-05, 1.2509524822235107e-05, 1.4197081327438354e-05, 1.58846378326416e-05, 1.757219433784485e-05, 1.9259750843048096e-05, 2.0947307348251343e-05, 2.263486385345459e-05, 2.4322420358657837e-05, 2.6009976863861084e-05, 2.769753336906433e-05, 2.9385089874267578e-05, 3.1072646379470825e-05, 3.276020288467407e-05, 3.444775938987732e-05, 3.6135315895080566e-05, 3.7822872400283813e-05, 3.951042890548706e-05, 4.119798541069031e-05, 4.2885541915893555e-05, 4.45730984210968e-05, 4.626065492630005e-05, 4.7948211431503296e-05, 4.963576793670654e-05, 5.132332444190979e-05, 5.301088094711304e-05, 5.4698437452316284e-05, 5.638599395751953e-05]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 48.0, 914.0, 46.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21399924159049988, -0.1953517198562622, -0.17670419812202454, -0.15805667638778687, -0.1394091546535492, -0.12076162546873093, -0.10211409628391266, -0.08346657454967499, -0.06481905281543732, -0.046171531081199646, -0.027524005621671677, -0.008876480162143707, 0.009771041572093964, 0.028418563306331635, 0.0470660924911499, 0.06571361422538757, 0.08436113595962524, 0.10300865769386292, 0.12165617942810059, 0.14030370116233826, 0.15895122289657593, 0.1775987446308136, 0.19624628126621246, 0.21489380300045013, 0.2335413247346878, 0.25218886137008667, 0.27083638310432434, 0.289483904838562, 0.3081314265727997, 0.32677894830703735, 0.345426470041275, 0.3640739917755127, 0.382721483707428, 0.40136900544166565, 0.4200165271759033, 0.438664048910141, 0.45731157064437866, 0.47595909237861633, 0.494606614112854, 0.5132541656494141, 0.5319016575813293, 0.5505492091178894, 0.5691967010498047, 0.5878442525863647, 0.60649174451828, 0.6251392960548401, 0.6437867879867554, 0.6624343395233154, 0.6810818910598755, 0.6997294425964355, 0.7183769345283508, 0.7370244860649109, 0.7556719779968262, 0.7743195295333862, 0.7929670214653015, 0.8116145730018616, 0.8302620649337769, 0.8489096164703369, 0.8675571084022522, 0.8862046599388123, 0.9048521518707275, 0.9234997034072876, 0.9421471953392029, 0.9607947468757629, 0.9794422388076782]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 7.0, 9.0, 12.0, 11.0, 31.0, 38.0, 36.0, 54.0, 69.0, 82.0, 106.0, 82.0, 98.0, 77.0, 65.0, 56.0, 47.0, 35.0, 24.0, 11.0, 15.0, 10.0, 6.0, 9.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4558250308036804, -0.43731236457824707, -0.4187996983528137, -0.40028703212738037, -0.3817743957042694, -0.36326172947883606, -0.3447490632534027, -0.32623642683029175, -0.3077237606048584, -0.28921109437942505, -0.2706984281539917, -0.25218576192855835, -0.2336731255054474, -0.21516045928001404, -0.1966477930545807, -0.17813514173030853, -0.159622460603714, -0.14110979437828064, -0.12259714305400848, -0.10408447682857513, -0.08557181805372238, -0.06705915927886963, -0.04854649305343628, -0.030033841729164124, -0.011521175503730774, 0.006991485133767128, 0.02550414577126503, 0.04401680827140808, 0.06252946704626083, 0.08104212582111359, 0.09955479204654694, 0.11806744337081909, 0.13658010959625244, 0.1550927758216858, 0.17360542714595795, 0.1921180933713913, 0.21063074469566345, 0.2291434109210968, 0.24765607714653015, 0.2661687135696411, 0.28468137979507446, 0.3031940460205078, 0.32170671224594116, 0.3402193784713745, 0.3587320148944855, 0.3772446811199188, 0.3957573473453522, 0.41426998376846313, 0.43278267979621887, 0.4512953460216522, 0.46980801224708557, 0.48832064867019653, 0.5068333148956299, 0.5253459811210632, 0.5438586473464966, 0.5623713135719299, 0.5808839797973633, 0.5993966460227966, 0.61790931224823, 0.6364219784736633, 0.6549346446990967, 0.6734472513198853, 0.6919599771499634, 0.710472583770752, 0.7289852499961853]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 6.0, 10.0, 10.0, 12.0, 7.0, 10.0, 15.0, 21.0, 24.0, 39.0, 46.0, 56.0, 55.0, 108.0, 185.0, 352.0, 4836.0, 4091495.0, 91885.0, 4352.0, 228.0, 158.0, 123.0, 62.0, 42.0, 39.0, 26.0, 24.0, 10.0, 15.0, 4.0, 9.0, 3.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062744140625, -0.060776710510253906, -0.05880928039550781, -0.05684185028076172, -0.054874420166015625, -0.05290699005126953, -0.05093955993652344, -0.048972129821777344, -0.04700469970703125, -0.045037269592285156, -0.04306983947753906, -0.04110240936279297, -0.039134979248046875, -0.03716754913330078, -0.03520011901855469, -0.033232688903808594, -0.0312652587890625, -0.029297828674316406, -0.027330398559570312, -0.02536296844482422, -0.023395538330078125, -0.02142810821533203, -0.019460678100585938, -0.017493247985839844, -0.01552581787109375, -0.013558387756347656, -0.011590957641601562, -0.009623527526855469, -0.007656097412109375, -0.005688667297363281, -0.0037212371826171875, -0.0017538070678710938, 0.000213623046875, 0.0021810531616210938, 0.0041484832763671875, 0.006115913391113281, 0.008083343505859375, 0.010050773620605469, 0.012018203735351562, 0.013985633850097656, 0.01595306396484375, 0.017920494079589844, 0.019887924194335938, 0.02185535430908203, 0.023822784423828125, 0.02579021453857422, 0.027757644653320312, 0.029725074768066406, 0.0316925048828125, 0.033659934997558594, 0.03562736511230469, 0.03759479522705078, 0.039562225341796875, 0.04152965545654297, 0.04349708557128906, 0.045464515686035156, 0.04743194580078125, 0.049399375915527344, 0.05136680603027344, 0.05333423614501953, 0.055301666259765625, 0.05726909637451172, 0.05923652648925781, 0.061203956604003906, 0.06317138671875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 5.0, 9.0, 21.0, 18.0, 8.0, 24.0, 189.0, 442.0, 148.0, 27.0, 15.0, 11.0, 6.0, 7.0, 10.0, 12.0, 4.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020233154296875, -0.019606351852416992, -0.018979549407958984, -0.018352746963500977, -0.01772594451904297, -0.01709914207458496, -0.016472339630126953, -0.015845537185668945, -0.015218734741210938, -0.01459193229675293, -0.013965129852294922, -0.013338327407836914, -0.012711524963378906, -0.012084722518920898, -0.01145792007446289, -0.010831117630004883, -0.010204315185546875, -0.009577512741088867, -0.00895071029663086, -0.008323907852172852, -0.007697105407714844, -0.007070302963256836, -0.006443500518798828, -0.00581669807434082, -0.0051898956298828125, -0.004563093185424805, -0.003936290740966797, -0.003309488296508789, -0.0026826858520507812, -0.0020558834075927734, -0.0014290809631347656, -0.0008022785186767578, -0.00017547607421875, 0.0004513263702392578, 0.0010781288146972656, 0.0017049312591552734, 0.0023317337036132812, 0.002958536148071289, 0.003585338592529297, 0.004212141036987305, 0.0048389434814453125, 0.00546574592590332, 0.006092548370361328, 0.006719350814819336, 0.007346153259277344, 0.007972955703735352, 0.00859975814819336, 0.009226560592651367, 0.009853363037109375, 0.010480165481567383, 0.01110696792602539, 0.011733770370483398, 0.012360572814941406, 0.012987375259399414, 0.013614177703857422, 0.01424098014831543, 0.014867782592773438, 0.015494585037231445, 0.016121387481689453, 0.01674818992614746, 0.01737499237060547, 0.018001794815063477, 0.018628597259521484, 0.019255399703979492, 0.0198822021484375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 2.0, 0.0, 3.0, 1.0, 11.0, 14.0, 14.0, 33.0, 36.0, 89.0, 251.0, 1214.0, 28606.0, 4160928.0, 2345.0, 456.0, 116.0, 45.0, 41.0, 22.0, 18.0, 7.0, 8.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.085693359375, -0.08318614959716797, -0.08067893981933594, -0.0781717300415039, -0.07566452026367188, -0.07315731048583984, -0.07065010070800781, -0.06814289093017578, -0.06563568115234375, -0.06312847137451172, -0.06062126159667969, -0.058114051818847656, -0.055606842041015625, -0.053099632263183594, -0.05059242248535156, -0.04808521270751953, -0.0455780029296875, -0.04307079315185547, -0.04056358337402344, -0.038056373596191406, -0.035549163818359375, -0.033041954040527344, -0.030534744262695312, -0.02802753448486328, -0.02552032470703125, -0.02301311492919922, -0.020505905151367188, -0.017998695373535156, -0.015491485595703125, -0.012984275817871094, -0.010477066040039062, -0.007969856262207031, -0.005462646484375, -0.0029554367065429688, -0.0004482269287109375, 0.0020589828491210938, 0.004566192626953125, 0.007073402404785156, 0.009580612182617188, 0.012087821960449219, 0.01459503173828125, 0.01710224151611328, 0.019609451293945312, 0.022116661071777344, 0.024623870849609375, 0.027131080627441406, 0.029638290405273438, 0.03214550018310547, 0.0346527099609375, 0.03715991973876953, 0.03966712951660156, 0.042174339294433594, 0.044681549072265625, 0.047188758850097656, 0.04969596862792969, 0.05220317840576172, 0.05471038818359375, 0.05721759796142578, 0.05972480773925781, 0.062232017517089844, 0.06473922729492188, 0.0672464370727539, 0.06975364685058594, 0.07226085662841797, 0.07476806640625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 6.0, 11.0, 17.0, 41.0, 166.0, 2793.0, 850.0, 110.0, 38.0, 16.0, 6.0, 3.0, 4.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0249786376953125, -0.02411341667175293, -0.02324819564819336, -0.02238297462463379, -0.02151775360107422, -0.02065253257751465, -0.019787311553955078, -0.018922090530395508, -0.018056869506835938, -0.017191648483276367, -0.016326427459716797, -0.015461206436157227, -0.014595985412597656, -0.013730764389038086, -0.012865543365478516, -0.012000322341918945, -0.011135101318359375, -0.010269880294799805, -0.009404659271240234, -0.008539438247680664, -0.007674217224121094, -0.0068089962005615234, -0.005943775177001953, -0.005078554153442383, -0.0042133331298828125, -0.003348112106323242, -0.002482891082763672, -0.0016176700592041016, -0.0007524490356445312, 0.00011277198791503906, 0.0009779930114746094, 0.0018432140350341797, 0.00270843505859375, 0.0035736560821533203, 0.004438877105712891, 0.005304098129272461, 0.006169319152832031, 0.0070345401763916016, 0.007899761199951172, 0.008764982223510742, 0.009630203247070312, 0.010495424270629883, 0.011360645294189453, 0.012225866317749023, 0.013091087341308594, 0.013956308364868164, 0.014821529388427734, 0.015686750411987305, 0.016551971435546875, 0.017417192459106445, 0.018282413482666016, 0.019147634506225586, 0.020012855529785156, 0.020878076553344727, 0.021743297576904297, 0.022608518600463867, 0.023473739624023438, 0.024338960647583008, 0.025204181671142578, 0.02606940269470215, 0.02693462371826172, 0.02779984474182129, 0.02866506576538086, 0.02953028678894043, 0.0303955078125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 28.0, 983.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3283839225769043, -0.3226533532142639, -0.31692278385162354, -0.31119221448898315, -0.3054616451263428, -0.2997310757637024, -0.294000506401062, -0.28826993703842163, -0.28253936767578125, -0.27680879831314087, -0.2710782289505005, -0.2653476595878601, -0.2596170902252197, -0.25388652086257935, -0.24815595149993896, -0.24242539703845978, -0.2366948425769806, -0.2309642732143402, -0.22523370385169983, -0.21950313448905945, -0.21377256512641907, -0.2080419957637787, -0.2023114264011383, -0.19658087193965912, -0.19085028767585754, -0.18511971831321716, -0.17938914895057678, -0.1736585795879364, -0.16792801022529602, -0.16219744086265564, -0.15646687150001526, -0.15073631703853607, -0.14500576257705688, -0.1392751932144165, -0.13354462385177612, -0.12781405448913574, -0.12208349257707596, -0.11635292321443558, -0.1106223538517952, -0.10489179193973541, -0.09916120767593384, -0.09343063831329346, -0.08770006895065308, -0.0819694995880127, -0.07623893767595291, -0.07050836831331253, -0.06477779895067215, -0.05904723331332207, -0.053316667675971985, -0.047586098313331604, -0.04185553267598152, -0.03612496331334114, -0.03039439581334591, -0.024663828313350677, -0.018933258950710297, -0.013202693313360214, -0.007472123950719833, -0.0017415559850633144, 0.0039890119805932045, 0.00971958041191101, 0.015450147911906242, 0.021180715411901474, 0.026911284774541855, 0.03264185041189194, 0.03837241977453232]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 12.0, 7.0, 9.0, 12.0, 16.0, 17.0, 25.0, 34.0, 54.0, 48.0, 50.0, 69.0, 69.0, 72.0, 76.0, 65.0, 55.0, 58.0, 47.0, 50.0, 27.0, 36.0, 24.0, 21.0, 23.0, 7.0, 5.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06458860635757446, -0.06287883967161179, -0.061169080436229706, -0.05945931375026703, -0.05774955078959465, -0.05603978782892227, -0.054330021142959595, -0.052620258182287216, -0.05091049522161484, -0.04920073226094246, -0.04749096930027008, -0.045781202614307404, -0.044071439653635025, -0.042361676692962646, -0.04065191000699997, -0.03894214704632759, -0.03723238408565521, -0.035522621124982834, -0.033812858164310455, -0.03210309147834778, -0.0303933285176754, -0.02868356555700302, -0.026973800733685493, -0.025264035910367966, -0.023554272949695587, -0.02184450998902321, -0.02013474516570568, -0.018424980342388153, -0.016715217381715775, -0.015005453489720821, -0.013295689597725868, -0.011585925705730915, -0.009876161813735962, -0.008166397921741009, -0.006456634029746056, -0.0047468701377511024, -0.0030371062457561493, -0.0013273423537611961, 0.000382421538233757, 0.00209218543022871, 0.0038019493222236633, 0.0055117132142186165, 0.00722147710621357, 0.008931240998208523, 0.010641004890203476, 0.012350768782198429, 0.014060532674193382, 0.01577029749751091, 0.01748006045818329, 0.019189823418855667, 0.020899588242173195, 0.022609353065490723, 0.0243191160261631, 0.02602887898683548, 0.027738643810153008, 0.029448408633470535, 0.031158171594142914, 0.03286793455481529, 0.03457769751548767, 0.03628746420145035, 0.037997227162122726, 0.039706990122795105, 0.04141675680875778, 0.04312651976943016, 0.04483628273010254]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 0.0, 5.0, 5.0, 5.0, 9.0, 14.0, 22.0, 20.0, 31.0, 33.0, 55.0, 72.0, 102.0, 133.0, 179.0, 264.0, 337.0, 505.0, 729.0, 1086.0, 1550.0, 2321.0, 3967.0, 7346.0, 15966.0, 80262.0, 878518.0, 29435.0, 10862.0, 5255.0, 3143.0, 2021.0, 1295.0, 833.0, 599.0, 432.0, 309.0, 215.0, 157.0, 116.0, 84.0, 73.0, 50.0, 32.0, 28.0, 18.0, 12.0, 9.0, 9.0, 8.0, 8.0, 9.0, 2.0, 6.0, 2.0, 1.0, 2.0, 3.0], "bins": [-0.0200958251953125, -0.01947307586669922, -0.018850326538085938, -0.018227577209472656, -0.017604827880859375, -0.016982078552246094, -0.016359329223632812, -0.01573657989501953, -0.01511383056640625, -0.014491081237792969, -0.013868331909179688, -0.013245582580566406, -0.012622833251953125, -0.012000083923339844, -0.011377334594726562, -0.010754585266113281, -0.0101318359375, -0.009509086608886719, -0.008886337280273438, -0.008263587951660156, -0.007640838623046875, -0.007018089294433594, -0.0063953399658203125, -0.005772590637207031, -0.00514984130859375, -0.004527091979980469, -0.0039043426513671875, -0.0032815933227539062, -0.002658843994140625, -0.0020360946655273438, -0.0014133453369140625, -0.0007905960083007812, -0.0001678466796875, 0.00045490264892578125, 0.0010776519775390625, 0.0017004013061523438, 0.002323150634765625, 0.0029458999633789062, 0.0035686492919921875, 0.004191398620605469, 0.00481414794921875, 0.005436897277832031, 0.0060596466064453125, 0.006682395935058594, 0.007305145263671875, 0.007927894592285156, 0.008550643920898438, 0.009173393249511719, 0.009796142578125, 0.010418891906738281, 0.011041641235351562, 0.011664390563964844, 0.012287139892578125, 0.012909889221191406, 0.013532638549804688, 0.014155387878417969, 0.01477813720703125, 0.015400886535644531, 0.016023635864257812, 0.016646385192871094, 0.017269134521484375, 0.017891883850097656, 0.018514633178710938, 0.01913738250732422, 0.0197601318359375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 5.0, 9.0, 19.0, 19.0, 8.0, 21.0, 180.0, 452.0, 153.0, 25.0, 15.0, 11.0, 5.0, 7.0, 11.0, 12.0, 4.0, 3.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0202484130859375, -0.019621610641479492, -0.018994808197021484, -0.018368005752563477, -0.01774120330810547, -0.01711440086364746, -0.016487598419189453, -0.015860795974731445, -0.015233993530273438, -0.01460719108581543, -0.013980388641357422, -0.013353586196899414, -0.012726783752441406, -0.012099981307983398, -0.01147317886352539, -0.010846376419067383, -0.010219573974609375, -0.009592771530151367, -0.00896596908569336, -0.008339166641235352, -0.007712364196777344, -0.007085561752319336, -0.006458759307861328, -0.00583195686340332, -0.0052051544189453125, -0.004578351974487305, -0.003951549530029297, -0.003324747085571289, -0.0026979446411132812, -0.0020711421966552734, -0.0014443397521972656, -0.0008175373077392578, -0.00019073486328125, 0.0004360675811767578, 0.0010628700256347656, 0.0016896724700927734, 0.0023164749145507812, 0.002943277359008789, 0.003570079803466797, 0.004196882247924805, 0.0048236846923828125, 0.00545048713684082, 0.006077289581298828, 0.006704092025756836, 0.007330894470214844, 0.007957696914672852, 0.00858449935913086, 0.009211301803588867, 0.009838104248046875, 0.010464906692504883, 0.01109170913696289, 0.011718511581420898, 0.012345314025878906, 0.012972116470336914, 0.013598918914794922, 0.01422572135925293, 0.014852523803710938, 0.015479326248168945, 0.016106128692626953, 0.01673293113708496, 0.01735973358154297, 0.017986536026000977, 0.018613338470458984, 0.019240140914916992, 0.019866943359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 10.0, 6.0, 11.0, 8.0, 21.0, 20.0, 35.0, 38.0, 32.0, 37.0, 71.0, 79.0, 93.0, 106.0, 157.0, 209.0, 306.0, 493.0, 1115.0, 6020.0, 877122.0, 156931.0, 3177.0, 867.0, 449.0, 248.0, 194.0, 139.0, 119.0, 67.0, 79.0, 58.0, 45.0, 33.0, 40.0, 29.0, 25.0, 12.0, 13.0, 6.0, 7.0, 10.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.06329345703125, -0.06130695343017578, -0.05932044982910156, -0.057333946228027344, -0.055347442626953125, -0.053360939025878906, -0.05137443542480469, -0.04938793182373047, -0.04740142822265625, -0.04541492462158203, -0.04342842102050781, -0.041441917419433594, -0.039455413818359375, -0.037468910217285156, -0.03548240661621094, -0.03349590301513672, -0.0315093994140625, -0.02952289581298828, -0.027536392211914062, -0.025549888610839844, -0.023563385009765625, -0.021576881408691406, -0.019590377807617188, -0.01760387420654297, -0.01561737060546875, -0.013630867004394531, -0.011644363403320312, -0.009657859802246094, -0.007671356201171875, -0.005684852600097656, -0.0036983489990234375, -0.0017118453979492188, 0.000274658203125, 0.0022611618041992188, 0.0042476654052734375, 0.006234169006347656, 0.008220672607421875, 0.010207176208496094, 0.012193679809570312, 0.014180183410644531, 0.01616668701171875, 0.01815319061279297, 0.020139694213867188, 0.022126197814941406, 0.024112701416015625, 0.026099205017089844, 0.028085708618164062, 0.03007221221923828, 0.0320587158203125, 0.03404521942138672, 0.03603172302246094, 0.038018226623535156, 0.040004730224609375, 0.041991233825683594, 0.04397773742675781, 0.04596424102783203, 0.04795074462890625, 0.04993724822998047, 0.05192375183105469, 0.053910255432128906, 0.055896759033203125, 0.057883262634277344, 0.05986976623535156, 0.06185626983642578, 0.0638427734375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 3.0, 6.0, 4.0, 13.0, 4.0, 15.0, 18.0, 20.0, 15.0, 30.0, 20.0, 22.0, 37.0, 40.0, 37.0, 39.0, 38.0, 42.0, 47.0, 41.0, 58.0, 39.0, 42.0, 40.0, 38.0, 34.0, 31.0, 30.0, 32.0, 26.0, 29.0, 20.0, 14.0, 11.0, 17.0, 20.0, 6.0, 7.0, 4.0, 0.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0517578125, -0.05009174346923828, -0.04842567443847656, -0.046759605407714844, -0.045093536376953125, -0.043427467346191406, -0.04176139831542969, -0.04009532928466797, -0.03842926025390625, -0.03676319122314453, -0.03509712219238281, -0.033431053161621094, -0.031764984130859375, -0.030098915100097656, -0.028432846069335938, -0.02676677703857422, -0.0251007080078125, -0.02343463897705078, -0.021768569946289062, -0.020102500915527344, -0.018436431884765625, -0.016770362854003906, -0.015104293823242188, -0.013438224792480469, -0.01177215576171875, -0.010106086730957031, -0.008440017700195312, -0.006773948669433594, -0.005107879638671875, -0.0034418106079101562, -0.0017757415771484375, -0.00010967254638671875, 0.001556396484375, 0.0032224655151367188, 0.0048885345458984375, 0.006554603576660156, 0.008220672607421875, 0.009886741638183594, 0.011552810668945312, 0.013218879699707031, 0.01488494873046875, 0.01655101776123047, 0.018217086791992188, 0.019883155822753906, 0.021549224853515625, 0.023215293884277344, 0.024881362915039062, 0.02654743194580078, 0.0282135009765625, 0.02987957000732422, 0.03154563903808594, 0.033211708068847656, 0.034877777099609375, 0.036543846130371094, 0.03820991516113281, 0.03987598419189453, 0.04154205322265625, 0.04320812225341797, 0.04487419128417969, 0.046540260314941406, 0.048206329345703125, 0.049872398376464844, 0.05153846740722656, 0.05320453643798828, 0.05487060546875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 9.0, 6.0, 12.0, 19.0, 31.0, 31.0, 50.0, 59.0, 111.0, 165.0, 271.0, 535.0, 1030.0, 2296.0, 5325.0, 17407.0, 137635.0, 833159.0, 35474.0, 8436.0, 3419.0, 1389.0, 668.0, 379.0, 221.0, 136.0, 97.0, 71.0, 41.0, 22.0, 13.0, 9.0, 10.0, 6.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2961368560791016e-05, -3.187078982591629e-05, -3.0780211091041565e-05, -2.968963235616684e-05, -2.8599053621292114e-05, -2.750847488641739e-05, -2.6417896151542664e-05, -2.5327317416667938e-05, -2.4236738681793213e-05, -2.3146159946918488e-05, -2.2055581212043762e-05, -2.0965002477169037e-05, -1.987442374229431e-05, -1.8783845007419586e-05, -1.769326627254486e-05, -1.6602687537670135e-05, -1.551210880279541e-05, -1.4421530067920685e-05, -1.333095133304596e-05, -1.2240372598171234e-05, -1.1149793863296509e-05, -1.0059215128421783e-05, -8.968636393547058e-06, -7.878057658672333e-06, -6.787478923797607e-06, -5.696900188922882e-06, -4.606321454048157e-06, -3.5157427191734314e-06, -2.425163984298706e-06, -1.3345852494239807e-06, -2.4400651454925537e-07, 8.4657222032547e-07, 1.9371509552001953e-06, 3.0277296900749207e-06, 4.118308424949646e-06, 5.208887159824371e-06, 6.299465894699097e-06, 7.390044629573822e-06, 8.480623364448547e-06, 9.571202099323273e-06, 1.0661780834197998e-05, 1.1752359569072723e-05, 1.2842938303947449e-05, 1.3933517038822174e-05, 1.50240957736969e-05, 1.6114674508571625e-05, 1.720525324344635e-05, 1.8295831978321075e-05, 1.93864107131958e-05, 2.0476989448070526e-05, 2.156756818294525e-05, 2.2658146917819977e-05, 2.3748725652694702e-05, 2.4839304387569427e-05, 2.5929883122444153e-05, 2.7020461857318878e-05, 2.8111040592193604e-05, 2.920161932706833e-05, 3.0292198061943054e-05, 3.138277679681778e-05, 3.2473355531692505e-05, 3.356393426656723e-05, 3.4654513001441956e-05, 3.574509173631668e-05, 3.6835670471191406e-05]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 8.0, 5.0, 8.0, 8.0, 13.0, 21.0, 16.0, 35.0, 24.0, 38.0, 38.0, 61.0, 67.0, 48.0, 81.0, 59.0, 78.0, 43.0, 81.0, 59.0, 34.0, 46.0, 24.0, 23.0, 17.0, 16.0, 18.0, 9.0, 9.0, 4.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.4836273193359375e-06, -5.3299590945243835e-06, -5.17629086971283e-06, -5.022622644901276e-06, -4.868954420089722e-06, -4.715286195278168e-06, -4.561617970466614e-06, -4.40794974565506e-06, -4.254281520843506e-06, -4.100613296031952e-06, -3.946945071220398e-06, -3.793276846408844e-06, -3.63960862159729e-06, -3.485940396785736e-06, -3.332272171974182e-06, -3.178603947162628e-06, -3.0249357223510742e-06, -2.8712674975395203e-06, -2.7175992727279663e-06, -2.5639310479164124e-06, -2.4102628231048584e-06, -2.2565945982933044e-06, -2.1029263734817505e-06, -1.9492581486701965e-06, -1.7955899238586426e-06, -1.6419216990470886e-06, -1.4882534742355347e-06, -1.3345852494239807e-06, -1.1809170246124268e-06, -1.0272487998008728e-06, -8.735805749893188e-07, -7.199123501777649e-07, -5.662441253662109e-07, -4.12575900554657e-07, -2.5890767574310303e-07, -1.0523945093154907e-07, 4.842877388000488e-08, 2.0209699869155884e-07, 3.557652235031128e-07, 5.094334483146667e-07, 6.631016731262207e-07, 8.167698979377747e-07, 9.704381227493286e-07, 1.1241063475608826e-06, 1.2777745723724365e-06, 1.4314427971839905e-06, 1.5851110219955444e-06, 1.7387792468070984e-06, 1.8924474716186523e-06, 2.0461156964302063e-06, 2.1997839212417603e-06, 2.353452146053314e-06, 2.507120370864868e-06, 2.660788595676422e-06, 2.814456820487976e-06, 2.96812504529953e-06, 3.121793270111084e-06, 3.275461494922638e-06, 3.429129719734192e-06, 3.582797944545746e-06, 3.7364661693573e-06, 3.890134394168854e-06, 4.043802618980408e-06, 4.197470843791962e-06, 4.351139068603516e-06]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 4.0, 6.0, 2.0, 9.0, 11.0, 11.0, 13.0, 24.0, 38.0, 50.0, 59.0, 107.0, 188.0, 366.0, 1085.0, 26327.0, 1016132.0, 2882.0, 572.0, 252.0, 142.0, 77.0, 44.0, 43.0, 33.0, 15.0, 12.0, 11.0, 13.0, 4.0, 5.0, 4.0, 5.0, 1.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.796287536621094e-05, -7.554329931735992e-05, -7.312372326850891e-05, -7.07041472196579e-05, -6.828457117080688e-05, -6.586499512195587e-05, -6.344541907310486e-05, -6.1025843024253845e-05, -5.860626697540283e-05, -5.618669092655182e-05, -5.3767114877700806e-05, -5.134753882884979e-05, -4.892796277999878e-05, -4.6508386731147766e-05, -4.408881068229675e-05, -4.166923463344574e-05, -3.9249658584594727e-05, -3.683008253574371e-05, -3.44105064868927e-05, -3.199093043804169e-05, -2.9571354389190674e-05, -2.715177834033966e-05, -2.4732202291488647e-05, -2.2312626242637634e-05, -1.989305019378662e-05, -1.7473474144935608e-05, -1.5053898096084595e-05, -1.2634322047233582e-05, -1.0214745998382568e-05, -7.795169949531555e-06, -5.375593900680542e-06, -2.956017851829529e-06, -5.364418029785156e-07, 1.8831342458724976e-06, 4.302710294723511e-06, 6.722286343574524e-06, 9.141862392425537e-06, 1.156143844127655e-05, 1.3981014490127563e-05, 1.6400590538978577e-05, 1.882016658782959e-05, 2.1239742636680603e-05, 2.3659318685531616e-05, 2.607889473438263e-05, 2.8498470783233643e-05, 3.0918046832084656e-05, 3.333762288093567e-05, 3.575719892978668e-05, 3.8176774978637695e-05, 4.059635102748871e-05, 4.301592707633972e-05, 4.5435503125190735e-05, 4.785507917404175e-05, 5.027465522289276e-05, 5.2694231271743774e-05, 5.511380732059479e-05, 5.75333833694458e-05, 5.9952959418296814e-05, 6.237253546714783e-05, 6.479211151599884e-05, 6.721168756484985e-05, 6.963126361370087e-05, 7.205083966255188e-05, 7.447041571140289e-05, 7.68899917602539e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 11.0, 9.0, 19.0, 10.0, 24.0, 41.0, 48.0, 82.0, 86.0, 132.0, 135.0, 93.0, 82.0, 61.0, 51.0, 18.0, 16.0, 16.0, 14.0, 11.0, 5.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.747245788574219e-05, -6.5607950091362e-05, -6.374344229698181e-05, -6.187893450260162e-05, -6.0014426708221436e-05, -5.814991891384125e-05, -5.628541111946106e-05, -5.442090332508087e-05, -5.2556395530700684e-05, -5.0691887736320496e-05, -4.882737994194031e-05, -4.696287214756012e-05, -4.509836435317993e-05, -4.3233856558799744e-05, -4.1369348764419556e-05, -3.950484097003937e-05, -3.764033317565918e-05, -3.577582538127899e-05, -3.3911317586898804e-05, -3.2046809792518616e-05, -3.0182301998138428e-05, -2.831779420375824e-05, -2.6453286409378052e-05, -2.4588778614997864e-05, -2.2724270820617676e-05, -2.0859763026237488e-05, -1.89952552318573e-05, -1.7130747437477112e-05, -1.5266239643096924e-05, -1.3401731848716736e-05, -1.1537224054336548e-05, -9.67271625995636e-06, -7.808208465576172e-06, -5.943700671195984e-06, -4.079192876815796e-06, -2.214685082435608e-06, -3.501772880554199e-07, 1.514330506324768e-06, 3.378838300704956e-06, 5.243346095085144e-06, 7.107853889465332e-06, 8.97236168384552e-06, 1.0836869478225708e-05, 1.2701377272605896e-05, 1.4565885066986084e-05, 1.6430392861366272e-05, 1.829490065574646e-05, 2.0159408450126648e-05, 2.2023916244506836e-05, 2.3888424038887024e-05, 2.5752931833267212e-05, 2.76174396276474e-05, 2.9481947422027588e-05, 3.1346455216407776e-05, 3.3210963010787964e-05, 3.507547080516815e-05, 3.693997859954834e-05, 3.880448639392853e-05, 4.0668994188308716e-05, 4.2533501982688904e-05, 4.439800977706909e-05, 4.626251757144928e-05, 4.812702536582947e-05, 4.9991533160209656e-05, 5.1856040954589844e-05]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 18.0, 779.0, 203.0, 12.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18240585923194885, -0.1655949056148529, -0.14878395199775696, -0.1319730132818222, -0.11516205966472626, -0.09835110604763031, -0.08154015988111496, -0.06472921371459961, -0.04791826009750366, -0.031107310205698013, -0.014296360313892365, 0.0025145895779132843, 0.019325539469718933, 0.03613649308681488, 0.05294743925333023, 0.06975838541984558, 0.08656933903694153, 0.10338029265403748, 0.12019123882055283, 0.13700218498706818, 0.15381313860416412, 0.17062409222126007, 0.18743503093719482, 0.20424598455429077, 0.22105693817138672, 0.23786789178848267, 0.2546788454055786, 0.27148979902267456, 0.2883007526397705, 0.30511170625686646, 0.32192263007164, 0.33873358368873596, 0.3555445671081543, 0.37235552072525024, 0.3891664743423462, 0.40597742795944214, 0.4227883815765381, 0.43959933519363403, 0.4564102590084076, 0.47322121262550354, 0.4900321662425995, 0.506843090057373, 0.523654043674469, 0.5404649972915649, 0.5572759509086609, 0.5740869045257568, 0.5908978581428528, 0.6077088117599487, 0.6245197653770447, 0.6413307189941406, 0.6581416726112366, 0.6749526262283325, 0.6917635798454285, 0.7085745334625244, 0.7253854870796204, 0.7421964406967163, 0.7590073347091675, 0.7758182883262634, 0.7926292419433594, 0.8094401955604553, 0.8262511491775513, 0.8430621027946472, 0.8598730564117432, 0.8766839504241943, 0.8934949636459351]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 12.0, 16.0, 11.0, 19.0, 25.0, 33.0, 36.0, 44.0, 56.0, 51.0, 65.0, 77.0, 76.0, 77.0, 42.0, 56.0, 54.0, 47.0, 37.0, 44.0, 28.0, 24.0, 15.0, 15.0, 16.0, 12.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4224570393562317, -0.4082862138748169, -0.3941153883934021, -0.3799445629119873, -0.3657737374305725, -0.3516029119491577, -0.3374320864677429, -0.3232612609863281, -0.30909043550491333, -0.29491961002349854, -0.28074878454208374, -0.26657795906066895, -0.25240713357925415, -0.23823630809783936, -0.22406549751758575, -0.20989467203617096, -0.19572386145591736, -0.18155303597450256, -0.16738221049308777, -0.15321138501167297, -0.13904055953025818, -0.12486974149942398, -0.11069892346858978, -0.09652809798717499, -0.08235727250576019, -0.0681864470243454, -0.0540156252682209, -0.039844803512096405, -0.02567397803068161, -0.011503152549266815, 0.002667665481567383, 0.016838490962982178, 0.031009316444396973, 0.04518014192581177, 0.059350963681936264, 0.07352178543806076, 0.08769261091947556, 0.10186343640089035, 0.11603425443172455, 0.13020507991313934, 0.14437590539455414, 0.15854673087596893, 0.17271755635738373, 0.18688836693763733, 0.20105919241905212, 0.21523001790046692, 0.2294008433818817, 0.2435716688632965, 0.2577424943447113, 0.2719133198261261, 0.2860841453075409, 0.3002549707889557, 0.3144257962703705, 0.3285966217517853, 0.3427674174308777, 0.3569382429122925, 0.3711090683937073, 0.38527989387512207, 0.39945071935653687, 0.41362154483795166, 0.42779237031936646, 0.44196319580078125, 0.45613402128219604, 0.47030484676361084, 0.48447567224502563]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 5.0, 3.0, 3.0, 5.0, 4.0, 6.0, 9.0, 16.0, 12.0, 27.0, 41.0, 53.0, 69.0, 353.0, 10782.0, 4180510.0, 2067.0, 106.0, 61.0, 43.0, 21.0, 16.0, 15.0, 15.0, 9.0, 4.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.065185546875, -0.06315994262695312, -0.06113433837890625, -0.059108734130859375, -0.0570831298828125, -0.055057525634765625, -0.05303192138671875, -0.051006317138671875, -0.048980712890625, -0.046955108642578125, -0.04492950439453125, -0.042903900146484375, -0.0408782958984375, -0.038852691650390625, -0.03682708740234375, -0.034801483154296875, -0.03277587890625, -0.030750274658203125, -0.02872467041015625, -0.026699066162109375, -0.0246734619140625, -0.022647857666015625, -0.02062225341796875, -0.018596649169921875, -0.016571044921875, -0.014545440673828125, -0.01251983642578125, -0.010494232177734375, -0.0084686279296875, -0.006443023681640625, -0.00441741943359375, -0.002391815185546875, -0.0003662109375, 0.001659393310546875, 0.00368499755859375, 0.005710601806640625, 0.0077362060546875, 0.009761810302734375, 0.01178741455078125, 0.013813018798828125, 0.015838623046875, 0.017864227294921875, 0.01988983154296875, 0.021915435791015625, 0.0239410400390625, 0.025966644287109375, 0.02799224853515625, 0.030017852783203125, 0.03204345703125, 0.034069061279296875, 0.03609466552734375, 0.038120269775390625, 0.0401458740234375, 0.042171478271484375, 0.04419708251953125, 0.046222686767578125, 0.048248291015625, 0.050273895263671875, 0.05229949951171875, 0.054325103759765625, 0.0563507080078125, 0.058376312255859375, 0.06040191650390625, 0.062427520751953125, 0.064453125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 2.0, 1.0, 4.0, 4.0, 1.0, 2.0, 4.0, 5.0, 11.0, 17.0, 17.0, 10.0, 28.0, 218.0, 439.0, 120.0, 23.0, 16.0, 12.0, 4.0, 8.0, 11.0, 12.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0199737548828125, -0.019353151321411133, -0.018732547760009766, -0.0181119441986084, -0.01749134063720703, -0.016870737075805664, -0.016250133514404297, -0.01562952995300293, -0.015008926391601562, -0.014388322830200195, -0.013767719268798828, -0.013147115707397461, -0.012526512145996094, -0.011905908584594727, -0.01128530502319336, -0.010664701461791992, -0.010044097900390625, -0.009423494338989258, -0.00880289077758789, -0.008182287216186523, -0.007561683654785156, -0.006941080093383789, -0.006320476531982422, -0.005699872970581055, -0.0050792694091796875, -0.00445866584777832, -0.003838062286376953, -0.003217458724975586, -0.0025968551635742188, -0.0019762516021728516, -0.0013556480407714844, -0.0007350444793701172, -0.00011444091796875, 0.0005061626434326172, 0.0011267662048339844, 0.0017473697662353516, 0.0023679733276367188, 0.002988576889038086, 0.003609180450439453, 0.00422978401184082, 0.0048503875732421875, 0.005470991134643555, 0.006091594696044922, 0.006712198257446289, 0.007332801818847656, 0.007953405380249023, 0.00857400894165039, 0.009194612503051758, 0.009815216064453125, 0.010435819625854492, 0.01105642318725586, 0.011677026748657227, 0.012297630310058594, 0.012918233871459961, 0.013538837432861328, 0.014159440994262695, 0.014780044555664062, 0.01540064811706543, 0.016021251678466797, 0.016641855239868164, 0.01726245880126953, 0.0178830623626709, 0.018503665924072266, 0.019124269485473633, 0.019744873046875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 14.0, 14.0, 13.0, 54.0, 178.0, 543.0, 2682.0, 4185692.0, 4169.0, 622.0, 194.0, 42.0, 18.0, 18.0, 8.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04180908203125, -0.04034709930419922, -0.03888511657714844, -0.037423133850097656, -0.035961151123046875, -0.034499168395996094, -0.03303718566894531, -0.03157520294189453, -0.03011322021484375, -0.02865123748779297, -0.027189254760742188, -0.025727272033691406, -0.024265289306640625, -0.022803306579589844, -0.021341323852539062, -0.01987934112548828, -0.0184173583984375, -0.01695537567138672, -0.015493392944335938, -0.014031410217285156, -0.012569427490234375, -0.011107444763183594, -0.009645462036132812, -0.008183479309082031, -0.00672149658203125, -0.005259513854980469, -0.0037975311279296875, -0.0023355484008789062, -0.000873565673828125, 0.0005884170532226562, 0.0020503997802734375, 0.0035123825073242188, 0.004974365234375, 0.006436347961425781, 0.007898330688476562, 0.009360313415527344, 0.010822296142578125, 0.012284278869628906, 0.013746261596679688, 0.015208244323730469, 0.01667022705078125, 0.01813220977783203, 0.019594192504882812, 0.021056175231933594, 0.022518157958984375, 0.023980140686035156, 0.025442123413085938, 0.02690410614013672, 0.0283660888671875, 0.02982807159423828, 0.03129005432128906, 0.032752037048339844, 0.034214019775390625, 0.035676002502441406, 0.03713798522949219, 0.03859996795654297, 0.04006195068359375, 0.04152393341064453, 0.04298591613769531, 0.044447898864746094, 0.045909881591796875, 0.047371864318847656, 0.04883384704589844, 0.05029582977294922, 0.0517578125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 16.0, 35.0, 2938.0, 1014.0, 49.0, 14.0, 7.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0174407958984375, -0.016942381858825684, -0.016443967819213867, -0.01594555377960205, -0.015447139739990234, -0.014948725700378418, -0.014450311660766602, -0.013951897621154785, -0.013453483581542969, -0.012955069541931152, -0.012456655502319336, -0.01195824146270752, -0.011459827423095703, -0.010961413383483887, -0.01046299934387207, -0.009964585304260254, -0.009466171264648438, -0.008967757225036621, -0.008469343185424805, -0.007970929145812988, -0.007472515106201172, -0.0069741010665893555, -0.006475687026977539, -0.005977272987365723, -0.005478858947753906, -0.00498044490814209, -0.0044820308685302734, -0.003983616828918457, -0.0034852027893066406, -0.0029867887496948242, -0.002488374710083008, -0.0019899606704711914, -0.001491546630859375, -0.0009931325912475586, -0.0004947185516357422, 3.6954879760742188e-06, 0.0005021095275878906, 0.001000523567199707, 0.0014989376068115234, 0.00199735164642334, 0.0024957656860351562, 0.0029941797256469727, 0.003492593765258789, 0.0039910078048706055, 0.004489421844482422, 0.004987835884094238, 0.005486249923706055, 0.005984663963317871, 0.0064830780029296875, 0.006981492042541504, 0.00747990608215332, 0.007978320121765137, 0.008476734161376953, 0.00897514820098877, 0.009473562240600586, 0.009971976280212402, 0.010470390319824219, 0.010968804359436035, 0.011467218399047852, 0.011965632438659668, 0.012464046478271484, 0.0129624605178833, 0.013460874557495117, 0.013959288597106934, 0.01445770263671875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 1007.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05711958557367325, -0.0536467619240284, -0.050173938274383545, -0.04670111835002899, -0.04322829470038414, -0.03975547105073929, -0.036282651126384735, -0.03280982747673988, -0.029337003827095032, -0.02586418017745018, -0.022391358390450478, -0.018918536603450775, -0.015445712953805923, -0.011972889304161072, -0.00850006751716137, -0.005027245730161667, -0.0015544220805168152, 0.0019184006378054619, 0.005391223356127739, 0.008864046074450016, 0.012336868792772293, 0.015809692442417145, 0.019282514229416847, 0.02275533601641655, 0.0262281596660614, 0.029700983315706253, 0.033173806965351105, 0.03664662688970566, 0.04011945053935051, 0.04359227418899536, 0.047065094113349915, 0.050537917762994766, 0.05401073396205902, 0.05748355761170387, 0.060956381261348724, 0.06442920118570328, 0.06790202856063843, 0.07137484848499298, 0.07484766840934753, 0.07832048833370209, 0.08179331570863724, 0.08526613563299179, 0.08873896300792694, 0.0922117829322815, 0.09568460285663605, 0.0991574302315712, 0.10263025015592575, 0.1061030775308609, 0.10957589745521545, 0.11304871737957001, 0.11652154475450516, 0.11999436467885971, 0.12346719205379486, 0.12694001197814941, 0.13041283190250397, 0.13388565182685852, 0.13735848665237427, 0.14083130657672882, 0.14430412650108337, 0.14777696132659912, 0.15124978125095367, 0.15472260117530823, 0.15819542109966278, 0.16166824102401733, 0.1651410609483719]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 5.0, 15.0, 22.0, 34.0, 56.0, 73.0, 88.0, 116.0, 124.0, 117.0, 95.0, 76.0, 69.0, 54.0, 30.0, 9.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036485135555267334, -0.035463348031044006, -0.03444156050682068, -0.03341977670788765, -0.03239798918366432, -0.031376201659440994, -0.030354415997862816, -0.029332630336284637, -0.02831084281206131, -0.027289055287837982, -0.026267269626259804, -0.025245483964681625, -0.024223696440458298, -0.02320190891623497, -0.02218012325465679, -0.021158337593078613, -0.020136550068855286, -0.019114762544631958, -0.01809297688305378, -0.0170711912214756, -0.016049403697252274, -0.01502761710435152, -0.014005830511450768, -0.012984043918550014, -0.011962257325649261, -0.010940470732748508, -0.009918684139847755, -0.008896897546947002, -0.00787511095404625, -0.006853324361145496, -0.005831537768244743, -0.00480975117534399, -0.0037879645824432373, -0.0027661779895424843, -0.0017443913966417313, -0.0007226048037409782, 0.0002991817891597748, 0.0013209683820605278, 0.002342754974961281, 0.003364541567862034, 0.004386328160762787, 0.00540811475366354, 0.006429901346564293, 0.007451687939465046, 0.008473474532365799, 0.009495261125266552, 0.010517047718167305, 0.011538834311068058, 0.012560620903968811, 0.013582407496869564, 0.014604194089770317, 0.015625979751348495, 0.016647767275571823, 0.01766955479979515, 0.01869134046137333, 0.019713126122951508, 0.020734913647174835, 0.021756701171398163, 0.02277848683297634, 0.02380027249455452, 0.024822060018777847, 0.025843847543001175, 0.026865633204579353, 0.027887418866157532, 0.02890920639038086]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 3.0, 4.0, 6.0, 7.0, 10.0, 16.0, 11.0, 28.0, 27.0, 35.0, 46.0, 80.0, 84.0, 143.0, 181.0, 285.0, 486.0, 821.0, 1368.0, 2555.0, 5288.0, 14076.0, 98180.0, 888218.0, 21535.0, 7287.0, 3433.0, 1722.0, 912.0, 566.0, 343.0, 191.0, 151.0, 103.0, 92.0, 58.0, 46.0, 31.0, 27.0, 18.0, 20.0, 18.0, 2.0, 10.0, 10.0, 3.0, 5.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0230255126953125, -0.02230978012084961, -0.02159404754638672, -0.020878314971923828, -0.020162582397460938, -0.019446849822998047, -0.018731117248535156, -0.018015384674072266, -0.017299652099609375, -0.016583919525146484, -0.015868186950683594, -0.015152454376220703, -0.014436721801757812, -0.013720989227294922, -0.013005256652832031, -0.01228952407836914, -0.01157379150390625, -0.01085805892944336, -0.010142326354980469, -0.009426593780517578, -0.008710861206054688, -0.007995128631591797, -0.007279396057128906, -0.006563663482666016, -0.005847930908203125, -0.005132198333740234, -0.004416465759277344, -0.003700733184814453, -0.0029850006103515625, -0.002269268035888672, -0.0015535354614257812, -0.0008378028869628906, -0.0001220703125, 0.0005936622619628906, 0.0013093948364257812, 0.002025127410888672, 0.0027408599853515625, 0.003456592559814453, 0.004172325134277344, 0.004888057708740234, 0.005603790283203125, 0.006319522857666016, 0.007035255432128906, 0.007750988006591797, 0.008466720581054688, 0.009182453155517578, 0.009898185729980469, 0.01061391830444336, 0.01132965087890625, 0.01204538345336914, 0.012761116027832031, 0.013476848602294922, 0.014192581176757812, 0.014908313751220703, 0.015624046325683594, 0.016339778900146484, 0.017055511474609375, 0.017771244049072266, 0.018486976623535156, 0.019202709197998047, 0.019918441772460938, 0.020634174346923828, 0.02134990692138672, 0.02206563949584961, 0.0227813720703125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 2.0, 1.0, 4.0, 4.0, 1.0, 2.0, 4.0, 4.0, 12.0, 17.0, 17.0, 11.0, 27.0, 217.0, 439.0, 121.0, 23.0, 16.0, 12.0, 5.0, 7.0, 11.0, 12.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0199737548828125, -0.019353151321411133, -0.018732547760009766, -0.0181119441986084, -0.01749134063720703, -0.016870737075805664, -0.016250133514404297, -0.01562952995300293, -0.015008926391601562, -0.014388322830200195, -0.013767719268798828, -0.013147115707397461, -0.012526512145996094, -0.011905908584594727, -0.01128530502319336, -0.010664701461791992, -0.010044097900390625, -0.009423494338989258, -0.00880289077758789, -0.008182287216186523, -0.007561683654785156, -0.006941080093383789, -0.006320476531982422, -0.005699872970581055, -0.0050792694091796875, -0.00445866584777832, -0.003838062286376953, -0.003217458724975586, -0.0025968551635742188, -0.0019762516021728516, -0.0013556480407714844, -0.0007350444793701172, -0.00011444091796875, 0.0005061626434326172, 0.0011267662048339844, 0.0017473697662353516, 0.0023679733276367188, 0.002988576889038086, 0.003609180450439453, 0.00422978401184082, 0.0048503875732421875, 0.005470991134643555, 0.006091594696044922, 0.006712198257446289, 0.007332801818847656, 0.007953405380249023, 0.00857400894165039, 0.009194612503051758, 0.009815216064453125, 0.010435819625854492, 0.01105642318725586, 0.011677026748657227, 0.012297630310058594, 0.012918233871459961, 0.013538837432861328, 0.014159440994262695, 0.014780044555664062, 0.01540064811706543, 0.016021251678466797, 0.016641855239868164, 0.01726245880126953, 0.0178830623626709, 0.018503665924072266, 0.019124269485473633, 0.019744873046875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 5.0, 9.0, 6.0, 8.0, 11.0, 15.0, 24.0, 22.0, 34.0, 29.0, 45.0, 58.0, 59.0, 76.0, 119.0, 127.0, 164.0, 241.0, 429.0, 792.0, 1904.0, 39491.0, 995941.0, 5814.0, 1219.0, 644.0, 339.0, 218.0, 134.0, 93.0, 91.0, 69.0, 64.0, 57.0, 45.0, 34.0, 34.0, 22.0, 17.0, 15.0, 10.0, 13.0, 6.0, 2.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05609130859375, -0.05423927307128906, -0.052387237548828125, -0.05053520202636719, -0.04868316650390625, -0.04683113098144531, -0.044979095458984375, -0.04312705993652344, -0.0412750244140625, -0.03942298889160156, -0.037570953369140625, -0.03571891784667969, -0.03386688232421875, -0.03201484680175781, -0.030162811279296875, -0.028310775756835938, -0.026458740234375, -0.024606704711914062, -0.022754669189453125, -0.020902633666992188, -0.01905059814453125, -0.017198562622070312, -0.015346527099609375, -0.013494491577148438, -0.0116424560546875, -0.009790420532226562, -0.007938385009765625, -0.0060863494873046875, -0.00423431396484375, -0.0023822784423828125, -0.000530242919921875, 0.0013217926025390625, 0.003173828125, 0.0050258636474609375, 0.006877899169921875, 0.008729934692382812, 0.01058197021484375, 0.012434005737304688, 0.014286041259765625, 0.016138076782226562, 0.0179901123046875, 0.019842147827148438, 0.021694183349609375, 0.023546218872070312, 0.02539825439453125, 0.027250289916992188, 0.029102325439453125, 0.030954360961914062, 0.032806396484375, 0.03465843200683594, 0.036510467529296875, 0.03836250305175781, 0.04021453857421875, 0.04206657409667969, 0.043918609619140625, 0.04577064514160156, 0.0476226806640625, 0.04947471618652344, 0.051326751708984375, 0.05317878723144531, 0.05503082275390625, 0.05688285827636719, 0.058734893798828125, 0.06058692932128906, 0.06243896484375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 4.0, 3.0, 5.0, 4.0, 5.0, 6.0, 4.0, 12.0, 16.0, 10.0, 13.0, 14.0, 22.0, 16.0, 19.0, 22.0, 37.0, 36.0, 28.0, 32.0, 50.0, 52.0, 37.0, 44.0, 36.0, 34.0, 49.0, 52.0, 41.0, 38.0, 28.0, 24.0, 29.0, 38.0, 25.0, 15.0, 28.0, 20.0, 12.0, 9.0, 10.0, 9.0, 8.0, 3.0, 6.0, 3.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041778564453125, -0.04031705856323242, -0.038855552673339844, -0.037394046783447266, -0.03593254089355469, -0.03447103500366211, -0.03300952911376953, -0.03154802322387695, -0.030086517333984375, -0.028625011444091797, -0.02716350555419922, -0.02570199966430664, -0.024240493774414062, -0.022778987884521484, -0.021317481994628906, -0.019855976104736328, -0.01839447021484375, -0.016932964324951172, -0.015471458435058594, -0.014009952545166016, -0.012548446655273438, -0.01108694076538086, -0.009625434875488281, -0.008163928985595703, -0.006702423095703125, -0.005240917205810547, -0.0037794113159179688, -0.0023179054260253906, -0.0008563995361328125, 0.0006051063537597656, 0.0020666122436523438, 0.003528118133544922, 0.0049896240234375, 0.006451129913330078, 0.007912635803222656, 0.009374141693115234, 0.010835647583007812, 0.01229715347290039, 0.013758659362792969, 0.015220165252685547, 0.016681671142578125, 0.018143177032470703, 0.01960468292236328, 0.02106618881225586, 0.022527694702148438, 0.023989200592041016, 0.025450706481933594, 0.026912212371826172, 0.02837371826171875, 0.029835224151611328, 0.031296730041503906, 0.032758235931396484, 0.03421974182128906, 0.03568124771118164, 0.03714275360107422, 0.0386042594909668, 0.040065765380859375, 0.04152727127075195, 0.04298877716064453, 0.04445028305053711, 0.04591178894042969, 0.047373294830322266, 0.048834800720214844, 0.05029630661010742, 0.0517578125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 13.0, 4.0, 8.0, 8.0, 6.0, 18.0, 25.0, 30.0, 48.0, 60.0, 121.0, 117.0, 262.0, 388.0, 656.0, 1190.0, 2205.0, 5419.0, 12114.0, 43437.0, 245706.0, 649762.0, 56669.0, 17889.0, 6072.0, 2995.0, 1321.0, 806.0, 406.0, 280.0, 153.0, 113.0, 73.0, 50.0, 38.0, 30.0, 11.0, 14.0, 9.0, 10.0, 6.0, 3.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.09808349609375e-05, -2.0415522158145905e-05, -1.985020935535431e-05, -1.9284896552562714e-05, -1.8719583749771118e-05, -1.8154270946979523e-05, -1.7588958144187927e-05, -1.7023645341396332e-05, -1.6458332538604736e-05, -1.589301973581314e-05, -1.5327706933021545e-05, -1.476239413022995e-05, -1.4197081327438354e-05, -1.3631768524646759e-05, -1.3066455721855164e-05, -1.2501142919063568e-05, -1.1935830116271973e-05, -1.1370517313480377e-05, -1.0805204510688782e-05, -1.0239891707897186e-05, -9.67457890510559e-06, -9.109266102313995e-06, -8.5439532995224e-06, -7.978640496730804e-06, -7.413327693939209e-06, -6.8480148911476135e-06, -6.282702088356018e-06, -5.717389285564423e-06, -5.152076482772827e-06, -4.586763679981232e-06, -4.021450877189636e-06, -3.4561380743980408e-06, -2.8908252716064453e-06, -2.32551246881485e-06, -1.7601996660232544e-06, -1.194886863231659e-06, -6.295740604400635e-07, -6.426125764846802e-08, 5.010515451431274e-07, 1.066364347934723e-06, 1.6316771507263184e-06, 2.196989953517914e-06, 2.7623027563095093e-06, 3.3276155591011047e-06, 3.8929283618927e-06, 4.458241164684296e-06, 5.023553967475891e-06, 5.5888667702674866e-06, 6.154179573059082e-06, 6.7194923758506775e-06, 7.284805178642273e-06, 7.850117981433868e-06, 8.415430784225464e-06, 8.98074358701706e-06, 9.546056389808655e-06, 1.011136919260025e-05, 1.0676681995391846e-05, 1.1241994798183441e-05, 1.1807307600975037e-05, 1.2372620403766632e-05, 1.2937933206558228e-05, 1.3503246009349823e-05, 1.4068558812141418e-05, 1.4633871614933014e-05, 1.519918441772461e-05]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 7.0, 3.0, 8.0, 8.0, 16.0, 22.0, 20.0, 36.0, 29.0, 58.0, 55.0, 84.0, 67.0, 83.0, 94.0, 77.0, 78.0, 50.0, 52.0, 26.0, 36.0, 24.0, 16.0, 19.0, 9.0, 13.0, 3.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.616115570068359e-06, -6.411224603652954e-06, -6.206333637237549e-06, -6.0014426708221436e-06, -5.796551704406738e-06, -5.591660737991333e-06, -5.386769771575928e-06, -5.1818788051605225e-06, -4.976987838745117e-06, -4.772096872329712e-06, -4.567205905914307e-06, -4.362314939498901e-06, -4.157423973083496e-06, -3.952533006668091e-06, -3.7476420402526855e-06, -3.5427510738372803e-06, -3.337860107421875e-06, -3.1329691410064697e-06, -2.9280781745910645e-06, -2.723187208175659e-06, -2.518296241760254e-06, -2.3134052753448486e-06, -2.1085143089294434e-06, -1.903623342514038e-06, -1.6987323760986328e-06, -1.4938414096832275e-06, -1.2889504432678223e-06, -1.084059476852417e-06, -8.791685104370117e-07, -6.742775440216064e-07, -4.6938657760620117e-07, -2.644956111907959e-07, -5.960464477539063e-08, 1.4528632164001465e-07, 3.501772880554199e-07, 5.550682544708252e-07, 7.599592208862305e-07, 9.648501873016357e-07, 1.169741153717041e-06, 1.3746321201324463e-06, 1.5795230865478516e-06, 1.7844140529632568e-06, 1.989305019378662e-06, 2.1941959857940674e-06, 2.3990869522094727e-06, 2.603977918624878e-06, 2.808868885040283e-06, 3.0137598514556885e-06, 3.2186508178710938e-06, 3.423541784286499e-06, 3.6284327507019043e-06, 3.8333237171173096e-06, 4.038214683532715e-06, 4.24310564994812e-06, 4.447996616363525e-06, 4.652887582778931e-06, 4.857778549194336e-06, 5.062669515609741e-06, 5.2675604820251465e-06, 5.472451448440552e-06, 5.677342414855957e-06, 5.882233381271362e-06, 6.087124347686768e-06, 6.292015314102173e-06, 6.496906280517578e-06]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 9.0, 8.0, 16.0, 21.0, 28.0, 43.0, 75.0, 139.0, 258.0, 475.0, 1948.0, 1034484.0, 9509.0, 790.0, 313.0, 155.0, 112.0, 55.0, 33.0, 26.0, 19.0, 14.0, 5.0, 5.0, 2.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.112192153930664e-05, -7.871631532907486e-05, -7.631070911884308e-05, -7.39051029086113e-05, -7.149949669837952e-05, -6.909389048814774e-05, -6.668828427791595e-05, -6.428267806768417e-05, -6.187707185745239e-05, -5.947146564722061e-05, -5.706585943698883e-05, -5.466025322675705e-05, -5.225464701652527e-05, -4.984904080629349e-05, -4.7443434596061707e-05, -4.5037828385829926e-05, -4.2632222175598145e-05, -4.0226615965366364e-05, -3.782100975513458e-05, -3.54154035449028e-05, -3.300979733467102e-05, -3.060419112443924e-05, -2.819858491420746e-05, -2.5792978703975677e-05, -2.3387372493743896e-05, -2.0981766283512115e-05, -1.8576160073280334e-05, -1.6170553863048553e-05, -1.3764947652816772e-05, -1.1359341442584991e-05, -8.95373523235321e-06, -6.5481290221214294e-06, -4.1425228118896484e-06, -1.7369166016578674e-06, 6.686896085739136e-07, 3.0742958188056946e-06, 5.479902029037476e-06, 7.885508239269257e-06, 1.0291114449501038e-05, 1.2696720659732819e-05, 1.51023268699646e-05, 1.750793308019638e-05, 1.991353929042816e-05, 2.2319145500659943e-05, 2.4724751710891724e-05, 2.7130357921123505e-05, 2.9535964131355286e-05, 3.194157034158707e-05, 3.434717655181885e-05, 3.675278276205063e-05, 3.915838897228241e-05, 4.156399518251419e-05, 4.396960139274597e-05, 4.637520760297775e-05, 4.8780813813209534e-05, 5.1186420023441315e-05, 5.3592026233673096e-05, 5.599763244390488e-05, 5.840323865413666e-05, 6.080884486436844e-05, 6.321445107460022e-05, 6.5620057284832e-05, 6.802566349506378e-05, 7.043126970529556e-05, 7.283687591552734e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 7.0, 6.0, 13.0, 18.0, 22.0, 31.0, 43.0, 57.0, 76.0, 137.0, 142.0, 109.0, 91.0, 62.0, 50.0, 44.0, 38.0, 13.0, 7.0, 10.0, 8.0, 7.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.711483001708984e-05, -6.532948464155197e-05, -6.35441392660141e-05, -6.175879389047623e-05, -5.9973448514938354e-05, -5.818810313940048e-05, -5.640275776386261e-05, -5.461741238832474e-05, -5.2832067012786865e-05, -5.104672163724899e-05, -4.926137626171112e-05, -4.747603088617325e-05, -4.5690685510635376e-05, -4.3905340135097504e-05, -4.211999475955963e-05, -4.033464938402176e-05, -3.854930400848389e-05, -3.6763958632946014e-05, -3.497861325740814e-05, -3.319326788187027e-05, -3.14079225063324e-05, -2.9622577130794525e-05, -2.7837231755256653e-05, -2.605188637971878e-05, -2.4266541004180908e-05, -2.2481195628643036e-05, -2.0695850253105164e-05, -1.891050487756729e-05, -1.712515950202942e-05, -1.5339814126491547e-05, -1.3554468750953674e-05, -1.1769123375415802e-05, -9.98377799987793e-06, -8.198432624340057e-06, -6.413087248802185e-06, -4.627741873264313e-06, -2.8423964977264404e-06, -1.0570511221885681e-06, 7.282942533493042e-07, 2.5136396288871765e-06, 4.298985004425049e-06, 6.084330379962921e-06, 7.869675755500793e-06, 9.655021131038666e-06, 1.1440366506576538e-05, 1.322571188211441e-05, 1.5011057257652283e-05, 1.6796402633190155e-05, 1.8581748008728027e-05, 2.03670933842659e-05, 2.2152438759803772e-05, 2.3937784135341644e-05, 2.5723129510879517e-05, 2.750847488641739e-05, 2.929382026195526e-05, 3.1079165637493134e-05, 3.2864511013031006e-05, 3.464985638856888e-05, 3.643520176410675e-05, 3.822054713964462e-05, 4.0005892515182495e-05, 4.179123789072037e-05, 4.357658326625824e-05, 4.536192864179611e-05, 4.7147274017333984e-05]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 11.0, 52.0, 716.0, 201.0, 24.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4307551980018616, -0.4211329221725464, -0.4115106761455536, -0.4018884301185608, -0.3922661542892456, -0.3826438784599304, -0.3730216324329376, -0.3633993864059448, -0.35377711057662964, -0.34415483474731445, -0.33453258872032166, -0.32491034269332886, -0.31528806686401367, -0.3056657910346985, -0.2960435450077057, -0.2864212989807129, -0.2767990231513977, -0.2671767473220825, -0.2575545012950897, -0.24793224036693573, -0.23830997943878174, -0.22868771851062775, -0.21906545758247375, -0.20944319665431976, -0.19982093572616577, -0.19019867479801178, -0.1805764138698578, -0.1709541529417038, -0.1613318920135498, -0.1517096310853958, -0.14208737015724182, -0.13246510922908783, -0.12284283339977264, -0.11322057247161865, -0.10359831154346466, -0.09397605061531067, -0.08435378968715668, -0.07473152875900269, -0.0651092678308487, -0.0554870069026947, -0.04586474597454071, -0.03624248504638672, -0.026620224118232727, -0.016997963190078735, -0.007375702261924744, 0.002246558666229248, 0.01186881959438324, 0.02149108052253723, 0.031113341450691223, 0.040735602378845215, 0.05035786330699921, 0.0599801242351532, 0.06960238516330719, 0.07922464609146118, 0.08884690701961517, 0.09846916794776917, 0.10809142887592316, 0.11771368980407715, 0.12733595073223114, 0.13695821166038513, 0.14658047258853912, 0.15620273351669312, 0.1658249944448471, 0.1754472553730011, 0.1850695163011551]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 9.0, 9.0, 9.0, 17.0, 23.0, 25.0, 21.0, 25.0, 34.0, 23.0, 33.0, 41.0, 34.0, 41.0, 53.0, 57.0, 54.0, 49.0, 36.0, 52.0, 52.0, 28.0, 34.0, 33.0, 31.0, 24.0, 23.0, 11.0, 21.0, 23.0, 12.0, 21.0, 10.0, 15.0, 9.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23304694890975952, -0.223457932472229, -0.21386893093585968, -0.20427991449832916, -0.19469091296195984, -0.18510189652442932, -0.1755128800868988, -0.16592387855052948, -0.15633487701416016, -0.14674586057662964, -0.13715685904026031, -0.1275678426027298, -0.11797884106636047, -0.10838982462882996, -0.09880081564188004, -0.08921180665493011, -0.0796227902173996, -0.07003378123044968, -0.060444772243499756, -0.05085575953125954, -0.041266750544309616, -0.031677741557359695, -0.022088728845119476, -0.012499719858169556, -0.002910710871219635, 0.00667829904705286, 0.016267308965325356, 0.025856319814920425, 0.035445328801870346, 0.04503433778882027, 0.054623350501060486, 0.0642123594880104, 0.07380136847496033, 0.08339037746191025, 0.09297938644886017, 0.10256840288639069, 0.11215740442276001, 0.12174642086029053, 0.13133543729782104, 0.14092443883419037, 0.1505134403705597, 0.1601024568080902, 0.16969145834445953, 0.17928047478199005, 0.18886947631835938, 0.1984584927558899, 0.2080475091934204, 0.21763651072978973, 0.22722552716732025, 0.23681454360485077, 0.2464035451412201, 0.2559925615787506, 0.26558157801628113, 0.27517056465148926, 0.2847595810890198, 0.2943485975265503, 0.3039376139640808, 0.31352663040161133, 0.32311564683914185, 0.33270463347435, 0.3422936499118805, 0.351882666349411, 0.36147168278694153, 0.37106066942214966, 0.3806496858596802]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 4.0, 6.0, 7.0, 6.0, 4.0, 8.0, 6.0, 5.0, 9.0, 4.0, 15.0, 19.0, 41.0, 49.0, 49.0, 1063.0, 4180859.0, 11200.0, 711.0, 55.0, 28.0, 17.0, 19.0, 19.0, 16.0, 12.0, 9.0, 8.0, 5.0, 4.0, 7.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07177734375, -0.0695199966430664, -0.06726264953613281, -0.06500530242919922, -0.06274795532226562, -0.06049060821533203, -0.05823326110839844, -0.055975914001464844, -0.05371856689453125, -0.051461219787597656, -0.04920387268066406, -0.04694652557373047, -0.044689178466796875, -0.04243183135986328, -0.04017448425292969, -0.037917137145996094, -0.0356597900390625, -0.033402442932128906, -0.031145095825195312, -0.02888774871826172, -0.026630401611328125, -0.02437305450439453, -0.022115707397460938, -0.019858360290527344, -0.01760101318359375, -0.015343666076660156, -0.013086318969726562, -0.010828971862792969, -0.008571624755859375, -0.006314277648925781, -0.0040569305419921875, -0.0017995834350585938, 0.000457763671875, 0.0027151107788085938, 0.0049724578857421875, 0.007229804992675781, 0.009487152099609375, 0.011744499206542969, 0.014001846313476562, 0.016259193420410156, 0.01851654052734375, 0.020773887634277344, 0.023031234741210938, 0.02528858184814453, 0.027545928955078125, 0.02980327606201172, 0.03206062316894531, 0.034317970275878906, 0.0365753173828125, 0.038832664489746094, 0.04109001159667969, 0.04334735870361328, 0.045604705810546875, 0.04786205291748047, 0.05011940002441406, 0.052376747131347656, 0.05463409423828125, 0.056891441345214844, 0.05914878845214844, 0.06140613555908203, 0.06366348266601562, 0.06592082977294922, 0.06817817687988281, 0.0704355239868164, 0.07269287109375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 1.0, 1.0, 2.0, 6.0, 1.0, 3.0, 3.0, 6.0, 12.0, 17.0, 16.0, 10.0, 46.0, 250.0, 405.0, 105.0, 21.0, 18.0, 10.0, 5.0, 9.0, 11.0, 10.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019866943359375, -0.019247770309448242, -0.018628597259521484, -0.018009424209594727, -0.01739025115966797, -0.01677107810974121, -0.016151905059814453, -0.015532732009887695, -0.014913558959960938, -0.01429438591003418, -0.013675212860107422, -0.013056039810180664, -0.012436866760253906, -0.011817693710327148, -0.01119852066040039, -0.010579347610473633, -0.009960174560546875, -0.009341001510620117, -0.00872182846069336, -0.008102655410766602, -0.007483482360839844, -0.006864309310913086, -0.006245136260986328, -0.00562596321105957, -0.0050067901611328125, -0.004387617111206055, -0.003768444061279297, -0.003149271011352539, -0.0025300979614257812, -0.0019109249114990234, -0.0012917518615722656, -0.0006725788116455078, -5.340576171875e-05, 0.0005657672882080078, 0.0011849403381347656, 0.0018041133880615234, 0.0024232864379882812, 0.003042459487915039, 0.003661632537841797, 0.004280805587768555, 0.0048999786376953125, 0.00551915168762207, 0.006138324737548828, 0.006757497787475586, 0.007376670837402344, 0.007995843887329102, 0.00861501693725586, 0.009234189987182617, 0.009853363037109375, 0.010472536087036133, 0.01109170913696289, 0.011710882186889648, 0.012330055236816406, 0.012949228286743164, 0.013568401336669922, 0.01418757438659668, 0.014806747436523438, 0.015425920486450195, 0.016045093536376953, 0.01666426658630371, 0.01728343963623047, 0.017902612686157227, 0.018521785736083984, 0.019140958786010742, 0.0197601318359375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 6.0, 9.0, 20.0, 45.0, 95.0, 300.0, 1008.0, 4574.0, 4170601.0, 15512.0, 1431.0, 414.0, 132.0, 59.0, 30.0, 14.0, 6.0, 3.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0222015380859375, -0.021561384201049805, -0.02092123031616211, -0.020281076431274414, -0.01964092254638672, -0.019000768661499023, -0.018360614776611328, -0.017720460891723633, -0.017080307006835938, -0.016440153121948242, -0.015799999237060547, -0.015159845352172852, -0.014519691467285156, -0.013879537582397461, -0.013239383697509766, -0.01259922981262207, -0.011959075927734375, -0.01131892204284668, -0.010678768157958984, -0.010038614273071289, -0.009398460388183594, -0.008758306503295898, -0.008118152618408203, -0.007477998733520508, -0.0068378448486328125, -0.006197690963745117, -0.005557537078857422, -0.0049173831939697266, -0.004277229309082031, -0.003637075424194336, -0.0029969215393066406, -0.0023567676544189453, -0.00171661376953125, -0.0010764598846435547, -0.0004363059997558594, 0.00020384788513183594, 0.0008440017700195312, 0.0014841556549072266, 0.002124309539794922, 0.002764463424682617, 0.0034046173095703125, 0.004044771194458008, 0.004684925079345703, 0.0053250789642333984, 0.005965232849121094, 0.006605386734008789, 0.007245540618896484, 0.00788569450378418, 0.008525848388671875, 0.00916600227355957, 0.009806156158447266, 0.010446310043334961, 0.011086463928222656, 0.011726617813110352, 0.012366771697998047, 0.013006925582885742, 0.013647079467773438, 0.014287233352661133, 0.014927387237548828, 0.015567541122436523, 0.01620769500732422, 0.016847848892211914, 0.01748800277709961, 0.018128156661987305, 0.018768310546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 10.0, 15.0, 26.0, 64.0, 493.0, 3278.0, 119.0, 30.0, 21.0, 7.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00795745849609375, -0.007684588432312012, -0.0074117183685302734, -0.007138848304748535, -0.006865978240966797, -0.006593108177185059, -0.00632023811340332, -0.006047368049621582, -0.005774497985839844, -0.0055016279220581055, -0.005228757858276367, -0.004955887794494629, -0.004683017730712891, -0.004410147666931152, -0.004137277603149414, -0.0038644075393676758, -0.0035915374755859375, -0.0033186674118041992, -0.003045797348022461, -0.0027729272842407227, -0.0025000572204589844, -0.002227187156677246, -0.001954317092895508, -0.0016814470291137695, -0.0014085769653320312, -0.001135706901550293, -0.0008628368377685547, -0.0005899667739868164, -0.0003170967102050781, -4.4226646423339844e-05, 0.00022864341735839844, 0.0005015134811401367, 0.000774383544921875, 0.0010472536087036133, 0.0013201236724853516, 0.0015929937362670898, 0.0018658638000488281, 0.0021387338638305664, 0.0024116039276123047, 0.002684473991394043, 0.0029573440551757812, 0.0032302141189575195, 0.003503084182739258, 0.003775954246520996, 0.004048824310302734, 0.004321694374084473, 0.004594564437866211, 0.004867434501647949, 0.0051403045654296875, 0.005413174629211426, 0.005686044692993164, 0.005958914756774902, 0.006231784820556641, 0.006504654884338379, 0.006777524948120117, 0.0070503950119018555, 0.007323265075683594, 0.007596135139465332, 0.00786900520324707, 0.008141875267028809, 0.008414745330810547, 0.008687615394592285, 0.008960485458374023, 0.009233355522155762, 0.0095062255859375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1013.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016311002895236015, -0.006879863329231739, 0.0025512762367725372, 0.011982416734099388, 0.02141355536878109, 0.03084469400346279, 0.04027583450078964, 0.049706973135471344, 0.059138111770153046, 0.06856925040483475, 0.07800038903951645, 0.08743153512477875, 0.09686267375946045, 0.10629381239414215, 0.11572495102882385, 0.12515608966350555, 0.13458722829818726, 0.14401836693286896, 0.15344950556755066, 0.16288064420223236, 0.17231178283691406, 0.18174292147159576, 0.19117406010627747, 0.20060521364212036, 0.21003635227680206, 0.21946749091148376, 0.22889862954616547, 0.23832976818084717, 0.24776090681552887, 0.25719204545021057, 0.26662319898605347, 0.276054322719574, 0.28548547625541687, 0.29491662979125977, 0.3043477535247803, 0.31377890706062317, 0.3232100307941437, 0.3326411843299866, 0.3420723080635071, 0.35150346159935, 0.3609345853328705, 0.3703657388687134, 0.3797968626022339, 0.3892280161380768, 0.3986591398715973, 0.4080902934074402, 0.4175214171409607, 0.4269525706768036, 0.4363837242126465, 0.4458148777484894, 0.4552460014820099, 0.4646771550178528, 0.4741082787513733, 0.4835394322872162, 0.4929705560207367, 0.5024017095565796, 0.5118328332901001, 0.5212639570236206, 0.5306951403617859, 0.5401262640953064, 0.5495573878288269, 0.5589885115623474, 0.5684196949005127, 0.5778508186340332, 0.5872819423675537]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 0.0, 9.0, 6.0, 9.0, 15.0, 15.0, 22.0, 27.0, 37.0, 41.0, 33.0, 38.0, 65.0, 84.0, 81.0, 70.0, 72.0, 79.0, 50.0, 60.0, 42.0, 41.0, 34.0, 24.0, 21.0, 9.0, 8.0, 7.0, 6.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015378296375274658, -0.014831936918199062, -0.014285577461123466, -0.01373921800404787, -0.013192858546972275, -0.012646499089896679, -0.012100139632821083, -0.011553780175745487, -0.011007420718669891, -0.010461061261594296, -0.0099147018045187, -0.009368342347443104, -0.008821982890367508, -0.008275623433291912, -0.007729263976216316, -0.00718290451914072, -0.0066365450620651245, -0.006090185604989529, -0.005543826147913933, -0.004997466690838337, -0.004451107233762741, -0.0039047477766871452, -0.0033583883196115494, -0.0028120288625359535, -0.0022656694054603577, -0.0017193099483847618, -0.001172950491309166, -0.0006265910342335701, -8.023157715797424e-05, 0.0004661278799176216, 0.0010124873369932175, 0.0015588467940688133, 0.002105206251144409, 0.002651565708220005, 0.003197925165295601, 0.0037442846223711967, 0.004290644079446793, 0.0048370035365223885, 0.005383362993597984, 0.00592972245067358, 0.006476081907749176, 0.007022441364824772, 0.007568800821900368, 0.008115160278975964, 0.00866151973605156, 0.009207879193127155, 0.009754238650202751, 0.010300598107278347, 0.010846957564353943, 0.011393317021429539, 0.011939676478505135, 0.01248603593558073, 0.013032395392656326, 0.013578754849731922, 0.014125114306807518, 0.014671473763883114, 0.01521783322095871, 0.01576419174671173, 0.0163105521351099, 0.016856912523508072, 0.017403271049261093, 0.017949629575014114, 0.018495989963412285, 0.019042350351810455, 0.019588708877563477]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 8.0, 11.0, 4.0, 9.0, 14.0, 17.0, 20.0, 37.0, 42.0, 72.0, 87.0, 129.0, 187.0, 304.0, 547.0, 999.0, 1862.0, 4038.0, 11348.0, 96464.0, 904549.0, 17091.0, 5511.0, 2271.0, 1171.0, 652.0, 377.0, 234.0, 149.0, 94.0, 73.0, 45.0, 45.0, 22.0, 17.0, 12.0, 7.0, 10.0, 5.0, 3.0, 8.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019744873046875, -0.019130706787109375, -0.01851654052734375, -0.017902374267578125, -0.0172882080078125, -0.016674041748046875, -0.01605987548828125, -0.015445709228515625, -0.01483154296875, -0.014217376708984375, -0.01360321044921875, -0.012989044189453125, -0.0123748779296875, -0.011760711669921875, -0.01114654541015625, -0.010532379150390625, -0.009918212890625, -0.009304046630859375, -0.00868988037109375, -0.008075714111328125, -0.0074615478515625, -0.006847381591796875, -0.00623321533203125, -0.005619049072265625, -0.0050048828125, -0.004390716552734375, -0.00377655029296875, -0.003162384033203125, -0.0025482177734375, -0.001934051513671875, -0.00131988525390625, -0.000705718994140625, -9.1552734375e-05, 0.000522613525390625, 0.00113677978515625, 0.001750946044921875, 0.0023651123046875, 0.002979278564453125, 0.00359344482421875, 0.004207611083984375, 0.00482177734375, 0.005435943603515625, 0.00605010986328125, 0.006664276123046875, 0.0072784423828125, 0.007892608642578125, 0.00850677490234375, 0.009120941162109375, 0.009735107421875, 0.010349273681640625, 0.01096343994140625, 0.011577606201171875, 0.0121917724609375, 0.012805938720703125, 0.01342010498046875, 0.014034271240234375, 0.0146484375, 0.015262603759765625, 0.01587677001953125, 0.016490936279296875, 0.0171051025390625, 0.017719268798828125, 0.01833343505859375, 0.018947601318359375, 0.019561767578125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 1.0, 1.0, 2.0, 6.0, 1.0, 3.0, 3.0, 6.0, 12.0, 17.0, 16.0, 10.0, 46.0, 251.0, 404.0, 105.0, 21.0, 18.0, 10.0, 5.0, 9.0, 11.0, 10.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019866943359375, -0.019247770309448242, -0.018628597259521484, -0.018009424209594727, -0.01739025115966797, -0.01677107810974121, -0.016151905059814453, -0.015532732009887695, -0.014913558959960938, -0.01429438591003418, -0.013675212860107422, -0.013056039810180664, -0.012436866760253906, -0.011817693710327148, -0.01119852066040039, -0.010579347610473633, -0.009960174560546875, -0.009341001510620117, -0.00872182846069336, -0.008102655410766602, -0.007483482360839844, -0.006864309310913086, -0.006245136260986328, -0.00562596321105957, -0.0050067901611328125, -0.004387617111206055, -0.003768444061279297, -0.003149271011352539, -0.0025300979614257812, -0.0019109249114990234, -0.0012917518615722656, -0.0006725788116455078, -5.340576171875e-05, 0.0005657672882080078, 0.0011849403381347656, 0.0018041133880615234, 0.0024232864379882812, 0.003042459487915039, 0.003661632537841797, 0.004280805587768555, 0.0048999786376953125, 0.00551915168762207, 0.006138324737548828, 0.006757497787475586, 0.007376670837402344, 0.007995843887329102, 0.00861501693725586, 0.009234189987182617, 0.009853363037109375, 0.010472536087036133, 0.01109170913696289, 0.011710882186889648, 0.012330055236816406, 0.012949228286743164, 0.013568401336669922, 0.01418757438659668, 0.014806747436523438, 0.015425920486450195, 0.016045093536376953, 0.01666426658630371, 0.01728343963623047, 0.017902612686157227, 0.018521785736083984, 0.019140958786010742, 0.0197601318359375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 3.0, 5.0, 7.0, 3.0, 12.0, 15.0, 26.0, 16.0, 21.0, 32.0, 50.0, 55.0, 83.0, 89.0, 114.0, 134.0, 194.0, 315.0, 593.0, 1426.0, 25646.0, 1004707.0, 12175.0, 1152.0, 543.0, 308.0, 212.0, 145.0, 78.0, 87.0, 73.0, 39.0, 29.0, 36.0, 30.0, 18.0, 16.0, 18.0, 11.0, 10.0, 3.0, 6.0, 11.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.031524658203125, -0.030521392822265625, -0.02951812744140625, -0.028514862060546875, -0.0275115966796875, -0.026508331298828125, -0.02550506591796875, -0.024501800537109375, -0.02349853515625, -0.022495269775390625, -0.02149200439453125, -0.020488739013671875, -0.0194854736328125, -0.018482208251953125, -0.01747894287109375, -0.016475677490234375, -0.015472412109375, -0.014469146728515625, -0.01346588134765625, -0.012462615966796875, -0.0114593505859375, -0.010456085205078125, -0.00945281982421875, -0.008449554443359375, -0.0074462890625, -0.006443023681640625, -0.00543975830078125, -0.004436492919921875, -0.0034332275390625, -0.002429962158203125, -0.00142669677734375, -0.000423431396484375, 0.000579833984375, 0.001583099365234375, 0.00258636474609375, 0.003589630126953125, 0.0045928955078125, 0.005596160888671875, 0.00659942626953125, 0.007602691650390625, 0.00860595703125, 0.009609222412109375, 0.01061248779296875, 0.011615753173828125, 0.0126190185546875, 0.013622283935546875, 0.01462554931640625, 0.015628814697265625, 0.016632080078125, 0.017635345458984375, 0.01863861083984375, 0.019641876220703125, 0.0206451416015625, 0.021648406982421875, 0.02265167236328125, 0.023654937744140625, 0.024658203125, 0.025661468505859375, 0.02666473388671875, 0.027667999267578125, 0.0286712646484375, 0.029674530029296875, 0.03067779541015625, 0.031681060791015625, 0.032684326171875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 3.0, 5.0, 5.0, 2.0, 8.0, 12.0, 21.0, 12.0, 10.0, 15.0, 29.0, 30.0, 33.0, 35.0, 42.0, 39.0, 36.0, 37.0, 29.0, 43.0, 39.0, 35.0, 34.0, 35.0, 37.0, 47.0, 42.0, 33.0, 34.0, 27.0, 33.0, 19.0, 15.0, 21.0, 20.0, 15.0, 12.0, 14.0, 9.0, 6.0, 5.0, 5.0, 11.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.039886474609375, -0.038616180419921875, -0.03734588623046875, -0.036075592041015625, -0.0348052978515625, -0.033535003662109375, -0.03226470947265625, -0.030994415283203125, -0.02972412109375, -0.028453826904296875, -0.02718353271484375, -0.025913238525390625, -0.0246429443359375, -0.023372650146484375, -0.02210235595703125, -0.020832061767578125, -0.019561767578125, -0.018291473388671875, -0.01702117919921875, -0.015750885009765625, -0.0144805908203125, -0.013210296630859375, -0.01194000244140625, -0.010669708251953125, -0.0093994140625, -0.008129119873046875, -0.00685882568359375, -0.005588531494140625, -0.0043182373046875, -0.003047943115234375, -0.00177764892578125, -0.000507354736328125, 0.000762939453125, 0.002033233642578125, 0.00330352783203125, 0.004573822021484375, 0.0058441162109375, 0.007114410400390625, 0.00838470458984375, 0.009654998779296875, 0.01092529296875, 0.012195587158203125, 0.01346588134765625, 0.014736175537109375, 0.0160064697265625, 0.017276763916015625, 0.01854705810546875, 0.019817352294921875, 0.021087646484375, 0.022357940673828125, 0.02362823486328125, 0.024898529052734375, 0.0261688232421875, 0.027439117431640625, 0.02870941162109375, 0.029979705810546875, 0.03125, 0.032520294189453125, 0.03379058837890625, 0.035060882568359375, 0.0363311767578125, 0.037601470947265625, 0.03887176513671875, 0.040142059326171875, 0.041412353515625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 10.0, 5.0, 17.0, 21.0, 30.0, 49.0, 79.0, 113.0, 208.0, 425.0, 816.0, 1961.0, 7426.0, 47921.0, 930445.0, 48914.0, 6379.0, 2061.0, 741.0, 392.0, 216.0, 117.0, 67.0, 44.0, 26.0, 23.0, 13.0, 9.0, 7.0, 4.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1278858184814453e-05, -2.0602717995643616e-05, -1.992657780647278e-05, -1.925043761730194e-05, -1.8574297428131104e-05, -1.7898157238960266e-05, -1.722201704978943e-05, -1.654587686061859e-05, -1.5869736671447754e-05, -1.5193596482276917e-05, -1.4517456293106079e-05, -1.3841316103935242e-05, -1.3165175914764404e-05, -1.2489035725593567e-05, -1.181289553642273e-05, -1.1136755347251892e-05, -1.0460615158081055e-05, -9.784474968910217e-06, -9.10833477973938e-06, -8.432194590568542e-06, -7.756054401397705e-06, -7.079914212226868e-06, -6.40377402305603e-06, -5.727633833885193e-06, -5.0514936447143555e-06, -4.375353455543518e-06, -3.6992132663726807e-06, -3.0230730772018433e-06, -2.346932888031006e-06, -1.6707926988601685e-06, -9.94652509689331e-07, -3.1851232051849365e-07, 3.5762786865234375e-07, 1.0337680578231812e-06, 1.7099082469940186e-06, 2.386048436164856e-06, 3.0621886253356934e-06, 3.7383288145065308e-06, 4.414469003677368e-06, 5.0906091928482056e-06, 5.766749382019043e-06, 6.44288957118988e-06, 7.119029760360718e-06, 7.795169949531555e-06, 8.471310138702393e-06, 9.14745032787323e-06, 9.823590517044067e-06, 1.0499730706214905e-05, 1.1175870895385742e-05, 1.185201108455658e-05, 1.2528151273727417e-05, 1.3204291462898254e-05, 1.3880431652069092e-05, 1.455657184123993e-05, 1.5232712030410767e-05, 1.5908852219581604e-05, 1.658499240875244e-05, 1.726113259792328e-05, 1.7937272787094116e-05, 1.8613412976264954e-05, 1.928955316543579e-05, 1.996569335460663e-05, 2.0641833543777466e-05, 2.1317973732948303e-05, 2.199411392211914e-05]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 5.0, 3.0, 4.0, 5.0, 2.0, 2.0, 5.0, 4.0, 9.0, 13.0, 17.0, 23.0, 33.0, 46.0, 30.0, 71.0, 67.0, 75.0, 62.0, 71.0, 76.0, 79.0, 31.0, 63.0, 38.0, 29.0, 48.0, 28.0, 14.0, 6.0, 13.0, 7.0, 5.0, 1.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.470348358154297e-06, -4.307366907596588e-06, -4.144385457038879e-06, -3.981404006481171e-06, -3.818422555923462e-06, -3.655441105365753e-06, -3.4924596548080444e-06, -3.3294782042503357e-06, -3.166496753692627e-06, -3.0035153031349182e-06, -2.8405338525772095e-06, -2.6775524020195007e-06, -2.514570951461792e-06, -2.3515895009040833e-06, -2.1886080503463745e-06, -2.0256265997886658e-06, -1.862645149230957e-06, -1.6996636986732483e-06, -1.5366822481155396e-06, -1.3737007975578308e-06, -1.210719347000122e-06, -1.0477378964424133e-06, -8.847564458847046e-07, -7.217749953269958e-07, -5.587935447692871e-07, -3.9581209421157837e-07, -2.3283064365386963e-07, -6.984919309616089e-08, 9.313225746154785e-08, 2.561137080192566e-07, 4.1909515857696533e-07, 5.820766091346741e-07, 7.450580596923828e-07, 9.080395102500916e-07, 1.0710209608078003e-06, 1.234002411365509e-06, 1.3969838619232178e-06, 1.5599653124809265e-06, 1.7229467630386353e-06, 1.885928213596344e-06, 2.0489096641540527e-06, 2.2118911147117615e-06, 2.3748725652694702e-06, 2.537854015827179e-06, 2.7008354663848877e-06, 2.8638169169425964e-06, 3.026798367500305e-06, 3.189779818058014e-06, 3.3527612686157227e-06, 3.5157427191734314e-06, 3.67872416973114e-06, 3.841705620288849e-06, 4.004687070846558e-06, 4.167668521404266e-06, 4.330649971961975e-06, 4.493631422519684e-06, 4.656612873077393e-06, 4.819594323635101e-06, 4.98257577419281e-06, 5.145557224750519e-06, 5.3085386753082275e-06, 5.471520125865936e-06, 5.634501576423645e-06, 5.797483026981354e-06, 5.9604644775390625e-06]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 5.0, 10.0, 14.0, 21.0, 22.0, 47.0, 111.0, 315.0, 1516.0, 1042033.0, 3786.0, 393.0, 126.0, 53.0, 27.0, 33.0, 20.0, 6.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.589557647705078e-05, -4.395097494125366e-05, -4.200637340545654e-05, -4.0061771869659424e-05, -3.8117170333862305e-05, -3.6172568798065186e-05, -3.4227967262268066e-05, -3.228336572647095e-05, -3.0338764190673828e-05, -2.839416265487671e-05, -2.644956111907959e-05, -2.450495958328247e-05, -2.256035804748535e-05, -2.0615756511688232e-05, -1.8671154975891113e-05, -1.6726553440093994e-05, -1.4781951904296875e-05, -1.2837350368499756e-05, -1.0892748832702637e-05, -8.948147296905518e-06, -7.0035457611083984e-06, -5.058944225311279e-06, -3.11434268951416e-06, -1.169741153717041e-06, 7.748603820800781e-07, 2.7194619178771973e-06, 4.664063453674316e-06, 6.6086649894714355e-06, 8.553266525268555e-06, 1.0497868061065674e-05, 1.2442469596862793e-05, 1.4387071132659912e-05, 1.633167266845703e-05, 1.827627420425415e-05, 2.022087574005127e-05, 2.216547727584839e-05, 2.4110078811645508e-05, 2.6054680347442627e-05, 2.7999281883239746e-05, 2.9943883419036865e-05, 3.1888484954833984e-05, 3.3833086490631104e-05, 3.577768802642822e-05, 3.772228956222534e-05, 3.966689109802246e-05, 4.161149263381958e-05, 4.35560941696167e-05, 4.550069570541382e-05, 4.744529724121094e-05, 4.938989877700806e-05, 5.1334500312805176e-05, 5.3279101848602295e-05, 5.5223703384399414e-05, 5.716830492019653e-05, 5.911290645599365e-05, 6.105750799179077e-05, 6.300210952758789e-05, 6.494671106338501e-05, 6.689131259918213e-05, 6.883591413497925e-05, 7.078051567077637e-05, 7.272511720657349e-05, 7.46697187423706e-05, 7.661432027816772e-05, 7.855892181396484e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 6.0, 4.0, 4.0, 3.0, 3.0, 7.0, 5.0, 13.0, 12.0, 26.0, 45.0, 75.0, 104.0, 243.0, 203.0, 87.0, 63.0, 41.0, 20.0, 12.0, 10.0, 10.0, 4.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.319978713989258e-05, -3.1109899282455444e-05, -2.902001142501831e-05, -2.6930123567581177e-05, -2.4840235710144043e-05, -2.275034785270691e-05, -2.0660459995269775e-05, -1.857057213783264e-05, -1.6480684280395508e-05, -1.4390796422958374e-05, -1.230090856552124e-05, -1.0211020708084106e-05, -8.121132850646973e-06, -6.031244993209839e-06, -3.941357135772705e-06, -1.8514692783355713e-06, 2.384185791015625e-07, 2.3283064365386963e-06, 4.41819429397583e-06, 6.508082151412964e-06, 8.597970008850098e-06, 1.0687857866287231e-05, 1.2777745723724365e-05, 1.4867633581161499e-05, 1.6957521438598633e-05, 1.9047409296035767e-05, 2.11372971534729e-05, 2.3227185010910034e-05, 2.5317072868347168e-05, 2.7406960725784302e-05, 2.9496848583221436e-05, 3.158673644065857e-05, 3.36766242980957e-05, 3.576651215553284e-05, 3.785640001296997e-05, 3.9946287870407104e-05, 4.203617572784424e-05, 4.412606358528137e-05, 4.6215951442718506e-05, 4.830583930015564e-05, 5.0395727157592773e-05, 5.248561501502991e-05, 5.457550287246704e-05, 5.6665390729904175e-05, 5.875527858734131e-05, 6.084516644477844e-05, 6.293505430221558e-05, 6.502494215965271e-05, 6.711483001708984e-05, 6.920471787452698e-05, 7.129460573196411e-05, 7.338449358940125e-05, 7.547438144683838e-05, 7.756426930427551e-05, 7.965415716171265e-05, 8.174404501914978e-05, 8.383393287658691e-05, 8.592382073402405e-05, 8.801370859146118e-05, 9.010359644889832e-05, 9.219348430633545e-05, 9.428337216377258e-05, 9.637326002120972e-05, 9.846314787864685e-05, 0.00010055303573608398]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 44.0, 921.0, 45.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12164964526891708, -0.1073518842458725, -0.09305412322282791, -0.07875636219978333, -0.06445860862731934, -0.05016084760427475, -0.035863086581230164, -0.021565325558185577, -0.007267564535140991, 0.00703019555658102, 0.021327955648303032, 0.03562571480870247, 0.049923475831747055, 0.06422123312950134, 0.07851899415254593, 0.09281675517559052, 0.1071145161986351, 0.12141227722167969, 0.13571003079414368, 0.15000779926776886, 0.16430555284023285, 0.17860332131385803, 0.19290107488632202, 0.207198828458786, 0.2214965969324112, 0.23579435050487518, 0.25009211897850037, 0.26438987255096436, 0.27868762612342834, 0.29298537969589233, 0.3072831630706787, 0.3215809166431427, 0.3358787000179291, 0.35017645359039307, 0.36447420716285706, 0.37877199053764343, 0.3930697441101074, 0.4073674976825714, 0.4216652512550354, 0.4359630346298218, 0.45026078820228577, 0.46455854177474976, 0.47885629534721375, 0.4931540787220001, 0.5074518322944641, 0.5217496156692505, 0.5360473394393921, 0.5503451228141785, 0.5646428465843201, 0.5789406299591064, 0.593238353729248, 0.6075361371040344, 0.621833860874176, 0.6361316442489624, 0.6504294276237488, 0.6647271513938904, 0.6790249347686768, 0.6933227181434631, 0.7076204419136047, 0.7219182252883911, 0.7362159490585327, 0.7505137324333191, 0.7648115158081055, 0.7791092395782471, 0.7934070229530334]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 5.0, 0.0, 6.0, 7.0, 10.0, 15.0, 8.0, 16.0, 22.0, 23.0, 27.0, 27.0, 41.0, 38.0, 52.0, 50.0, 45.0, 59.0, 46.0, 58.0, 45.0, 57.0, 60.0, 40.0, 30.0, 35.0, 38.0, 24.0, 23.0, 26.0, 18.0, 11.0, 12.0, 12.0, 5.0, 4.0, 7.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.28734254837036133, -0.27920255064964294, -0.27106255292892456, -0.2629225552082062, -0.2547825574874878, -0.24664254486560822, -0.23850254714488983, -0.23036254942417145, -0.22222253680229187, -0.2140825390815735, -0.2059425413608551, -0.19780254364013672, -0.18966253101825714, -0.18152253329753876, -0.17338253557682037, -0.165242537856102, -0.1571025401353836, -0.14896254241466522, -0.14082254469394684, -0.13268253207206726, -0.12454253435134888, -0.1164025366306305, -0.10826253890991211, -0.10012254118919373, -0.09198253601789474, -0.08384253829717636, -0.07570253312587738, -0.067562535405159, -0.059422533959150314, -0.05128253251314163, -0.04314253479242325, -0.035002533346414566, -0.026862531900405884, -0.0187225304543972, -0.010582530871033669, -0.0024425312876701355, 0.005697470158338547, 0.013837471604347229, 0.021977469325065613, 0.030117470771074295, 0.03825747221708298, 0.04639747366309166, 0.05453747510910034, 0.06267747282981873, 0.07081747055053711, 0.07895747572183609, 0.08709747344255447, 0.09523747861385345, 0.10337747633457184, 0.11151747405529022, 0.1196574792265892, 0.12779748439788818, 0.13593748211860657, 0.14407747983932495, 0.15221747756004333, 0.16035747528076172, 0.1684974730014801, 0.1766374707221985, 0.18477746844291687, 0.19291746616363525, 0.20105747878551483, 0.20919747650623322, 0.2173374742269516, 0.22547747194766998, 0.23361748456954956]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 5.0, 1.0, 1.0, 4.0, 7.0, 3.0, 4.0, 6.0, 12.0, 23.0, 23.0, 25.0, 30.0, 111.0, 4189373.0, 4375.0, 112.0, 48.0, 29.0, 16.0, 7.0, 15.0, 12.0, 10.0, 4.0, 5.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.202392578125, -0.19605064392089844, -0.18970870971679688, -0.1833667755126953, -0.17702484130859375, -0.1706829071044922, -0.16434097290039062, -0.15799903869628906, -0.1516571044921875, -0.14531517028808594, -0.13897323608398438, -0.1326313018798828, -0.12628936767578125, -0.11994743347167969, -0.11360549926757812, -0.10726356506347656, -0.100921630859375, -0.09457969665527344, -0.08823776245117188, -0.08189582824707031, -0.07555389404296875, -0.06921195983886719, -0.06287002563476562, -0.05652809143066406, -0.0501861572265625, -0.04384422302246094, -0.037502288818359375, -0.031160354614257812, -0.02481842041015625, -0.018476486206054688, -0.012134552001953125, -0.0057926177978515625, 0.00054931640625, 0.0068912506103515625, 0.013233184814453125, 0.019575119018554688, 0.02591705322265625, 0.03225898742675781, 0.038600921630859375, 0.04494285583496094, 0.0512847900390625, 0.05762672424316406, 0.06396865844726562, 0.07031059265136719, 0.07665252685546875, 0.08299446105957031, 0.08933639526367188, 0.09567832946777344, 0.102020263671875, 0.10836219787597656, 0.11470413208007812, 0.12104606628417969, 0.12738800048828125, 0.1337299346923828, 0.14007186889648438, 0.14641380310058594, 0.1527557373046875, 0.15909767150878906, 0.16543960571289062, 0.1717815399169922, 0.17812347412109375, 0.1844654083251953, 0.19080734252929688, 0.19714927673339844, 0.2034912109375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 3.0, 5.0, 13.0, 19.0, 16.0, 10.0, 58.0, 290.0, 369.0, 91.0, 20.0, 17.0, 9.0, 4.0, 10.0, 11.0, 10.0, 3.0, 4.0, 5.0, 1.0, 4.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019775390625, -0.019156932830810547, -0.018538475036621094, -0.01792001724243164, -0.017301559448242188, -0.016683101654052734, -0.01606464385986328, -0.015446186065673828, -0.014827728271484375, -0.014209270477294922, -0.013590812683105469, -0.012972354888916016, -0.012353897094726562, -0.01173543930053711, -0.011116981506347656, -0.010498523712158203, -0.00988006591796875, -0.009261608123779297, -0.008643150329589844, -0.00802469253540039, -0.0074062347412109375, -0.006787776947021484, -0.006169319152832031, -0.005550861358642578, -0.004932403564453125, -0.004313945770263672, -0.0036954879760742188, -0.0030770301818847656, -0.0024585723876953125, -0.0018401145935058594, -0.0012216567993164062, -0.0006031990051269531, 1.52587890625e-05, 0.0006337165832519531, 0.0012521743774414062, 0.0018706321716308594, 0.0024890899658203125, 0.0031075477600097656, 0.0037260055541992188, 0.004344463348388672, 0.004962921142578125, 0.005581378936767578, 0.006199836730957031, 0.006818294525146484, 0.0074367523193359375, 0.00805521011352539, 0.008673667907714844, 0.009292125701904297, 0.00991058349609375, 0.010529041290283203, 0.011147499084472656, 0.01176595687866211, 0.012384414672851562, 0.013002872467041016, 0.013621330261230469, 0.014239788055419922, 0.014858245849609375, 0.015476703643798828, 0.01609516143798828, 0.016713619232177734, 0.017332077026367188, 0.01795053482055664, 0.018568992614746094, 0.019187450408935547, 0.019805908203125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 9.0, 21.0, 65.0, 226.0, 638.0, 12560.0, 4179228.0, 1078.0, 307.0, 98.0, 29.0, 11.0, 8.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0267791748046875, -0.025891542434692383, -0.025003910064697266, -0.02411627769470215, -0.02322864532470703, -0.022341012954711914, -0.021453380584716797, -0.02056574821472168, -0.019678115844726562, -0.018790483474731445, -0.017902851104736328, -0.01701521873474121, -0.016127586364746094, -0.015239953994750977, -0.01435232162475586, -0.013464689254760742, -0.012577056884765625, -0.011689424514770508, -0.01080179214477539, -0.009914159774780273, -0.009026527404785156, -0.008138895034790039, -0.007251262664794922, -0.006363630294799805, -0.0054759979248046875, -0.00458836555480957, -0.003700733184814453, -0.002813100814819336, -0.0019254684448242188, -0.0010378360748291016, -0.00015020370483398438, 0.0007374286651611328, 0.00162506103515625, 0.002512693405151367, 0.0034003257751464844, 0.0042879581451416016, 0.005175590515136719, 0.006063222885131836, 0.006950855255126953, 0.00783848762512207, 0.008726119995117188, 0.009613752365112305, 0.010501384735107422, 0.011389017105102539, 0.012276649475097656, 0.013164281845092773, 0.01405191421508789, 0.014939546585083008, 0.015827178955078125, 0.016714811325073242, 0.01760244369506836, 0.018490076065063477, 0.019377708435058594, 0.02026534080505371, 0.021152973175048828, 0.022040605545043945, 0.022928237915039062, 0.02381587028503418, 0.024703502655029297, 0.025591135025024414, 0.02647876739501953, 0.02736639976501465, 0.028254032135009766, 0.029141664505004883, 0.030029296875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 8.0, 8.0, 24.0, 448.0, 3553.0, 21.0, 13.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00959014892578125, -0.009308338165283203, -0.009026527404785156, -0.00874471664428711, -0.008462905883789062, -0.008181095123291016, -0.007899284362792969, -0.007617473602294922, -0.007335662841796875, -0.007053852081298828, -0.006772041320800781, -0.006490230560302734, -0.0062084197998046875, -0.005926609039306641, -0.005644798278808594, -0.005362987518310547, -0.0050811767578125, -0.004799365997314453, -0.004517555236816406, -0.004235744476318359, -0.0039539337158203125, -0.0036721229553222656, -0.0033903121948242188, -0.003108501434326172, -0.002826690673828125, -0.002544879913330078, -0.0022630691528320312, -0.0019812583923339844, -0.0016994476318359375, -0.0014176368713378906, -0.0011358261108398438, -0.0008540153503417969, -0.00057220458984375, -0.0002903938293457031, -8.58306884765625e-06, 0.0002732276916503906, 0.0005550384521484375, 0.0008368492126464844, 0.0011186599731445312, 0.0014004707336425781, 0.001682281494140625, 0.001964092254638672, 0.0022459030151367188, 0.0025277137756347656, 0.0028095245361328125, 0.0030913352966308594, 0.0033731460571289062, 0.003654956817626953, 0.003936767578125, 0.004218578338623047, 0.004500389099121094, 0.004782199859619141, 0.0050640106201171875, 0.005345821380615234, 0.005627632141113281, 0.005909442901611328, 0.006191253662109375, 0.006473064422607422, 0.006754875183105469, 0.007036685943603516, 0.0073184967041015625, 0.007600307464599609, 0.007882118225097656, 0.008163928985595703, 0.00844573974609375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 869.0, 147.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04307457059621811, -0.0419674776494503, -0.040860384702682495, -0.03975329548120499, -0.03864620253443718, -0.03753910958766937, -0.036432020366191864, -0.03532492741942406, -0.03421783447265625, -0.03311074152588844, -0.032003648579120636, -0.030896559357643127, -0.02978946641087532, -0.028682373464107513, -0.027575282379984856, -0.026468191295862198, -0.02536109834909439, -0.024254005402326584, -0.023146914318203926, -0.02203982323408127, -0.02093273028731346, -0.019825637340545654, -0.018718546256422997, -0.01761145517230034, -0.016504362225532532, -0.0153972702100873, -0.014290178194642067, -0.013183086179196835, -0.012075994163751602, -0.01096890214830637, -0.009861810132861137, -0.008754718117415905, -0.007647629827260971, -0.006540537811815739, -0.005433445796370506, -0.004326353780925274, -0.0032192617654800415, -0.002112169750034809, -0.0010050777345895767, 0.00010201428085565567, 0.001209106296300888, 0.0023161983117461205, 0.003423290327191353, 0.004530382342636585, 0.005637474358081818, 0.00674456637352705, 0.007851658388972282, 0.008958750404417515, 0.010065842419862747, 0.01117293443530798, 0.012280026450753212, 0.013387118466198444, 0.014494210481643677, 0.01560130249708891, 0.01670839451253414, 0.0178154855966568, 0.018922578543424606, 0.020029671490192413, 0.02113676257431507, 0.02224385365843773, 0.023350946605205536, 0.024458039551973343, 0.025565130636096, 0.02667222172021866, 0.027779314666986465]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 3.0, 6.0, 10.0, 8.0, 10.0, 13.0, 19.0, 18.0, 22.0, 20.0, 21.0, 32.0, 29.0, 42.0, 37.0, 40.0, 58.0, 46.0, 48.0, 38.0, 44.0, 38.0, 46.0, 47.0, 41.0, 41.0, 35.0, 27.0, 41.0, 19.0, 16.0, 15.0, 22.0, 8.0, 12.0, 9.0, 5.0, 9.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006440162658691406, -0.006217312067747116, -0.005994461476802826, -0.005771610885858536, -0.005548760294914246, -0.0053259097039699554, -0.005103059113025665, -0.004880208522081375, -0.004657357931137085, -0.004434507340192795, -0.004211656749248505, -0.0039888061583042145, -0.0037659555673599243, -0.003543104976415634, -0.003320254385471344, -0.003097403794527054, -0.0028745532035827637, -0.0026517026126384735, -0.0024288520216941833, -0.002206001430749893, -0.001983150839805603, -0.0017603002488613129, -0.0015374496579170227, -0.0013145990669727325, -0.0010917484760284424, -0.0008688978850841522, -0.0006460472941398621, -0.0004231967031955719, -0.00020034611225128174, 2.2504478693008423e-05, 0.0002453550696372986, 0.00046820566058158875, 0.0006910562515258789, 0.0009139068424701691, 0.0011367574334144592, 0.0013596080243587494, 0.0015824586153030396, 0.0018053092062473297, 0.00202815979719162, 0.00225101038813591, 0.0024738609790802, 0.0026967115700244904, 0.0029195621609687805, 0.0031424127519130707, 0.003365263342857361, 0.003588113933801651, 0.003810964524745941, 0.004033815115690231, 0.0042566657066345215, 0.004479516297578812, 0.004702366888523102, 0.004925217479467392, 0.005148068070411682, 0.005370918661355972, 0.0055937692523002625, 0.005816619843244553, 0.006039470434188843, 0.006262321025133133, 0.006485171616077423, 0.006708022207021713, 0.006930872797966003, 0.007153723388910294, 0.007376573979854584, 0.007599424570798874, 0.007822275161743164]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 2.0, 2.0, 10.0, 15.0, 6.0, 22.0, 28.0, 35.0, 52.0, 47.0, 78.0, 109.0, 146.0, 233.0, 339.0, 494.0, 721.0, 1142.0, 1999.0, 3581.0, 7202.0, 19055.0, 725012.0, 255535.0, 17310.0, 6669.0, 3318.0, 1896.0, 1136.0, 744.0, 498.0, 326.0, 215.0, 166.0, 102.0, 81.0, 60.0, 50.0, 28.0, 25.0, 21.0, 6.0, 11.0, 8.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0147705078125, -0.014308333396911621, -0.013846158981323242, -0.013383984565734863, -0.012921810150146484, -0.012459635734558105, -0.011997461318969727, -0.011535286903381348, -0.011073112487792969, -0.01061093807220459, -0.010148763656616211, -0.009686589241027832, -0.009224414825439453, -0.008762240409851074, -0.008300065994262695, -0.007837891578674316, -0.0073757171630859375, -0.006913542747497559, -0.00645136833190918, -0.005989193916320801, -0.005527019500732422, -0.005064845085144043, -0.004602670669555664, -0.004140496253967285, -0.0036783218383789062, -0.0032161474227905273, -0.0027539730072021484, -0.0022917985916137695, -0.0018296241760253906, -0.0013674497604370117, -0.0009052753448486328, -0.0004431009292602539, 1.9073486328125e-05, 0.0004812479019165039, 0.0009434223175048828, 0.0014055967330932617, 0.0018677711486816406, 0.0023299455642700195, 0.0027921199798583984, 0.0032542943954467773, 0.0037164688110351562, 0.004178643226623535, 0.004640817642211914, 0.005102992057800293, 0.005565166473388672, 0.006027340888977051, 0.00648951530456543, 0.006951689720153809, 0.0074138641357421875, 0.007876038551330566, 0.008338212966918945, 0.008800387382507324, 0.009262561798095703, 0.009724736213684082, 0.010186910629272461, 0.01064908504486084, 0.011111259460449219, 0.011573433876037598, 0.012035608291625977, 0.012497782707214355, 0.012959957122802734, 0.013422131538391113, 0.013884305953979492, 0.014346480369567871, 0.01480865478515625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 3.0, 5.0, 13.0, 19.0, 16.0, 10.0, 57.0, 291.0, 369.0, 91.0, 20.0, 17.0, 9.0, 4.0, 10.0, 11.0, 10.0, 3.0, 4.0, 5.0, 1.0, 4.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019775390625, -0.019156932830810547, -0.018538475036621094, -0.01792001724243164, -0.017301559448242188, -0.016683101654052734, -0.01606464385986328, -0.015446186065673828, -0.014827728271484375, -0.014209270477294922, -0.013590812683105469, -0.012972354888916016, -0.012353897094726562, -0.01173543930053711, -0.011116981506347656, -0.010498523712158203, -0.00988006591796875, -0.009261608123779297, -0.008643150329589844, -0.00802469253540039, -0.0074062347412109375, -0.006787776947021484, -0.006169319152832031, -0.005550861358642578, -0.004932403564453125, -0.004313945770263672, -0.0036954879760742188, -0.0030770301818847656, -0.0024585723876953125, -0.0018401145935058594, -0.0012216567993164062, -0.0006031990051269531, 1.52587890625e-05, 0.0006337165832519531, 0.0012521743774414062, 0.0018706321716308594, 0.0024890899658203125, 0.0031075477600097656, 0.0037260055541992188, 0.004344463348388672, 0.004962921142578125, 0.005581378936767578, 0.006199836730957031, 0.006818294525146484, 0.0074367523193359375, 0.00805521011352539, 0.008673667907714844, 0.009292125701904297, 0.00991058349609375, 0.010529041290283203, 0.011147499084472656, 0.01176595687866211, 0.012384414672851562, 0.013002872467041016, 0.013621330261230469, 0.014239788055419922, 0.014858245849609375, 0.015476703643798828, 0.01609516143798828, 0.016713619232177734, 0.017332077026367188, 0.01795053482055664, 0.018568992614746094, 0.019187450408935547, 0.019805908203125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 7.0, 8.0, 12.0, 10.0, 14.0, 21.0, 17.0, 25.0, 27.0, 41.0, 43.0, 46.0, 62.0, 59.0, 103.0, 131.0, 194.0, 319.0, 533.0, 1348.0, 11500.0, 929446.0, 99249.0, 3129.0, 830.0, 437.0, 227.0, 167.0, 109.0, 75.0, 64.0, 57.0, 46.0, 34.0, 33.0, 30.0, 23.0, 22.0, 17.0, 7.0, 7.0, 5.0, 7.0, 8.0, 4.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0274810791015625, -0.02661585807800293, -0.02575063705444336, -0.02488541603088379, -0.02402019500732422, -0.02315497398376465, -0.022289752960205078, -0.021424531936645508, -0.020559310913085938, -0.019694089889526367, -0.018828868865966797, -0.017963647842407227, -0.017098426818847656, -0.016233205795288086, -0.015367984771728516, -0.014502763748168945, -0.013637542724609375, -0.012772321701049805, -0.011907100677490234, -0.011041879653930664, -0.010176658630371094, -0.009311437606811523, -0.008446216583251953, -0.007580995559692383, -0.0067157745361328125, -0.005850553512573242, -0.004985332489013672, -0.0041201114654541016, -0.0032548904418945312, -0.002389669418334961, -0.0015244483947753906, -0.0006592273712158203, 0.00020599365234375, 0.0010712146759033203, 0.0019364356994628906, 0.002801656723022461, 0.0036668777465820312, 0.0045320987701416016, 0.005397319793701172, 0.006262540817260742, 0.0071277618408203125, 0.007992982864379883, 0.008858203887939453, 0.009723424911499023, 0.010588645935058594, 0.011453866958618164, 0.012319087982177734, 0.013184309005737305, 0.014049530029296875, 0.014914751052856445, 0.015779972076416016, 0.016645193099975586, 0.017510414123535156, 0.018375635147094727, 0.019240856170654297, 0.020106077194213867, 0.020971298217773438, 0.021836519241333008, 0.022701740264892578, 0.02356696128845215, 0.02443218231201172, 0.02529740333557129, 0.02616262435913086, 0.02702784538269043, 0.02789306640625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 6.0, 5.0, 10.0, 8.0, 12.0, 11.0, 11.0, 18.0, 16.0, 22.0, 23.0, 25.0, 23.0, 29.0, 34.0, 34.0, 44.0, 46.0, 39.0, 40.0, 38.0, 26.0, 45.0, 42.0, 49.0, 38.0, 27.0, 33.0, 26.0, 33.0, 23.0, 25.0, 22.0, 19.0, 16.0, 16.0, 13.0, 13.0, 17.0, 4.0, 6.0, 3.0, 5.0, 5.0, 5.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.03948974609375, -0.03824615478515625, -0.0370025634765625, -0.03575897216796875, -0.034515380859375, -0.03327178955078125, -0.0320281982421875, -0.03078460693359375, -0.029541015625, -0.02829742431640625, -0.0270538330078125, -0.02581024169921875, -0.024566650390625, -0.02332305908203125, -0.0220794677734375, -0.02083587646484375, -0.01959228515625, -0.01834869384765625, -0.0171051025390625, -0.01586151123046875, -0.014617919921875, -0.01337432861328125, -0.0121307373046875, -0.01088714599609375, -0.0096435546875, -0.00839996337890625, -0.0071563720703125, -0.00591278076171875, -0.004669189453125, -0.00342559814453125, -0.0021820068359375, -0.00093841552734375, 0.00030517578125, 0.00154876708984375, 0.0027923583984375, 0.00403594970703125, 0.005279541015625, 0.00652313232421875, 0.0077667236328125, 0.00901031494140625, 0.01025390625, 0.01149749755859375, 0.0127410888671875, 0.01398468017578125, 0.015228271484375, 0.01647186279296875, 0.0177154541015625, 0.01895904541015625, 0.02020263671875, 0.02144622802734375, 0.0226898193359375, 0.02393341064453125, 0.025177001953125, 0.02642059326171875, 0.0276641845703125, 0.02890777587890625, 0.0301513671875, 0.03139495849609375, 0.0326385498046875, 0.03388214111328125, 0.035125732421875, 0.03636932373046875, 0.0376129150390625, 0.03885650634765625, 0.04010009765625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 12.0, 10.0, 9.0, 9.0, 24.0, 34.0, 38.0, 52.0, 80.0, 156.0, 178.0, 271.0, 360.0, 670.0, 879.0, 1958.0, 2916.0, 7614.0, 15639.0, 88125.0, 810682.0, 80499.0, 22760.0, 6638.0, 4147.0, 1736.0, 1168.0, 580.0, 470.0, 227.0, 212.0, 133.0, 66.0, 62.0, 34.0, 41.0, 12.0, 12.0, 8.0, 11.0, 4.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.821487426757812e-06, -8.550472557544708e-06, -8.279457688331604e-06, -8.0084428191185e-06, -7.737427949905396e-06, -7.466413080692291e-06, -7.195398211479187e-06, -6.924383342266083e-06, -6.6533684730529785e-06, -6.382353603839874e-06, -6.11133873462677e-06, -5.840323865413666e-06, -5.5693089962005615e-06, -5.298294126987457e-06, -5.027279257774353e-06, -4.756264388561249e-06, -4.4852495193481445e-06, -4.21423465013504e-06, -3.943219780921936e-06, -3.6722049117088318e-06, -3.4011900424957275e-06, -3.1301751732826233e-06, -2.859160304069519e-06, -2.588145434856415e-06, -2.3171305656433105e-06, -2.0461156964302063e-06, -1.775100827217102e-06, -1.5040859580039978e-06, -1.2330710887908936e-06, -9.620562195777893e-07, -6.910413503646851e-07, -4.200264811515808e-07, -1.4901161193847656e-07, 1.2200325727462769e-07, 3.9301812648773193e-07, 6.640329957008362e-07, 9.350478649139404e-07, 1.2060627341270447e-06, 1.477077603340149e-06, 1.7480924725532532e-06, 2.0191073417663574e-06, 2.2901222109794617e-06, 2.561137080192566e-06, 2.83215194940567e-06, 3.1031668186187744e-06, 3.3741816878318787e-06, 3.645196557044983e-06, 3.916211426258087e-06, 4.187226295471191e-06, 4.458241164684296e-06, 4.7292560338974e-06, 5.000270903110504e-06, 5.271285772323608e-06, 5.542300641536713e-06, 5.813315510749817e-06, 6.084330379962921e-06, 6.355345249176025e-06, 6.62636011838913e-06, 6.897374987602234e-06, 7.168389856815338e-06, 7.439404726028442e-06, 7.710419595241547e-06, 7.981434464454651e-06, 8.252449333667755e-06, 8.52346420288086e-06]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 5.0, 7.0, 18.0, 15.0, 20.0, 27.0, 36.0, 39.0, 77.0, 46.0, 85.0, 77.0, 102.0, 58.0, 92.0, 62.0, 73.0, 45.0, 39.0, 14.0, 15.0, 12.0, 11.0, 5.0, 5.0, 4.0, 4.0, 1.0, 4.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.066394805908203e-06, -4.9173831939697266e-06, -4.76837158203125e-06, -4.6193599700927734e-06, -4.470348358154297e-06, -4.32133674621582e-06, -4.172325134277344e-06, -4.023313522338867e-06, -3.874301910400391e-06, -3.725290298461914e-06, -3.5762786865234375e-06, -3.427267074584961e-06, -3.2782554626464844e-06, -3.129243850708008e-06, -2.9802322387695312e-06, -2.8312206268310547e-06, -2.682209014892578e-06, -2.5331974029541016e-06, -2.384185791015625e-06, -2.2351741790771484e-06, -2.086162567138672e-06, -1.9371509552001953e-06, -1.7881393432617188e-06, -1.6391277313232422e-06, -1.4901161193847656e-06, -1.341104507446289e-06, -1.1920928955078125e-06, -1.043081283569336e-06, -8.940696716308594e-07, -7.450580596923828e-07, -5.960464477539062e-07, -4.470348358154297e-07, -2.980232238769531e-07, -1.4901161193847656e-07, 0.0, 1.4901161193847656e-07, 2.980232238769531e-07, 4.470348358154297e-07, 5.960464477539062e-07, 7.450580596923828e-07, 8.940696716308594e-07, 1.043081283569336e-06, 1.1920928955078125e-06, 1.341104507446289e-06, 1.4901161193847656e-06, 1.6391277313232422e-06, 1.7881393432617188e-06, 1.9371509552001953e-06, 2.086162567138672e-06, 2.2351741790771484e-06, 2.384185791015625e-06, 2.5331974029541016e-06, 2.682209014892578e-06, 2.8312206268310547e-06, 2.9802322387695312e-06, 3.129243850708008e-06, 3.2782554626464844e-06, 3.427267074584961e-06, 3.5762786865234375e-06, 3.725290298461914e-06, 3.874301910400391e-06, 4.023313522338867e-06, 4.172325134277344e-06, 4.32133674621582e-06, 4.470348358154297e-06]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 2.0, 7.0, 0.0, 9.0, 8.0, 8.0, 18.0, 28.0, 37.0, 64.0, 111.0, 215.0, 736.0, 11247.0, 1032216.0, 3011.0, 411.0, 175.0, 89.0, 62.0, 34.0, 21.0, 14.0, 10.0, 5.0, 2.0, 5.0, 7.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.0471553802490234e-05, -3.935769200325012e-05, -3.824383020401001e-05, -3.71299684047699e-05, -3.6016106605529785e-05, -3.490224480628967e-05, -3.378838300704956e-05, -3.267452120780945e-05, -3.1560659408569336e-05, -3.0446797609329224e-05, -2.933293581008911e-05, -2.8219074010849e-05, -2.7105212211608887e-05, -2.5991350412368774e-05, -2.4877488613128662e-05, -2.376362681388855e-05, -2.2649765014648438e-05, -2.1535903215408325e-05, -2.0422041416168213e-05, -1.93081796169281e-05, -1.8194317817687988e-05, -1.7080456018447876e-05, -1.5966594219207764e-05, -1.4852732419967651e-05, -1.3738870620727539e-05, -1.2625008821487427e-05, -1.1511147022247314e-05, -1.0397285223007202e-05, -9.28342342376709e-06, -8.169561624526978e-06, -7.055699825286865e-06, -5.941838026046753e-06, -4.827976226806641e-06, -3.7141144275665283e-06, -2.600252628326416e-06, -1.4863908290863037e-06, -3.725290298461914e-07, 7.413327693939209e-07, 1.8551945686340332e-06, 2.9690563678741455e-06, 4.082918167114258e-06, 5.19677996635437e-06, 6.310641765594482e-06, 7.424503564834595e-06, 8.538365364074707e-06, 9.65222716331482e-06, 1.0766088962554932e-05, 1.1879950761795044e-05, 1.2993812561035156e-05, 1.4107674360275269e-05, 1.5221536159515381e-05, 1.6335397958755493e-05, 1.7449259757995605e-05, 1.8563121557235718e-05, 1.967698335647583e-05, 2.0790845155715942e-05, 2.1904706954956055e-05, 2.3018568754196167e-05, 2.413243055343628e-05, 2.524629235267639e-05, 2.6360154151916504e-05, 2.7474015951156616e-05, 2.858787775039673e-05, 2.970173954963684e-05, 3.081560134887695e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 6.0, 3.0, 7.0, 9.0, 16.0, 16.0, 22.0, 28.0, 48.0, 71.0, 114.0, 238.0, 133.0, 87.0, 60.0, 39.0, 37.0, 21.0, 19.0, 7.0, 7.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.823373794555664e-05, -5.6692399084568024e-05, -5.515106022357941e-05, -5.360972136259079e-05, -5.206838250160217e-05, -5.0527043640613556e-05, -4.898570477962494e-05, -4.744436591863632e-05, -4.5903027057647705e-05, -4.436168819665909e-05, -4.282034933567047e-05, -4.1279010474681854e-05, -3.973767161369324e-05, -3.819633275270462e-05, -3.6654993891716003e-05, -3.5113655030727386e-05, -3.357231616973877e-05, -3.203097730875015e-05, -3.0489638447761536e-05, -2.894829958677292e-05, -2.7406960725784302e-05, -2.5865621864795685e-05, -2.4324283003807068e-05, -2.278294414281845e-05, -2.1241605281829834e-05, -1.9700266420841217e-05, -1.81589275598526e-05, -1.6617588698863983e-05, -1.5076249837875366e-05, -1.353491097688675e-05, -1.1993572115898132e-05, -1.0452233254909515e-05, -8.910894393920898e-06, -7.3695555329322815e-06, -5.8282166719436646e-06, -4.286877810955048e-06, -2.7455389499664307e-06, -1.2042000889778137e-06, 3.371387720108032e-07, 1.8784776329994202e-06, 3.419816493988037e-06, 4.961155354976654e-06, 6.502494215965271e-06, 8.043833076953888e-06, 9.585171937942505e-06, 1.1126510798931122e-05, 1.2667849659919739e-05, 1.4209188520908356e-05, 1.5750527381896973e-05, 1.729186624288559e-05, 1.8833205103874207e-05, 2.0374543964862823e-05, 2.191588282585144e-05, 2.3457221686840057e-05, 2.4998560547828674e-05, 2.653989940881729e-05, 2.8081238269805908e-05, 2.9622577130794525e-05, 3.116391599178314e-05, 3.270525485277176e-05, 3.4246593713760376e-05, 3.578793257474899e-05, 3.732927143573761e-05, 3.887061029672623e-05, 4.0411949157714844e-05]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 15.0, 77.0, 756.0, 146.0, 15.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07345671206712723, -0.06657340377569199, -0.059690095484256744, -0.0528067909181118, -0.04592348262667656, -0.03904017433524132, -0.032156869769096375, -0.025273561477661133, -0.01839025318622589, -0.011506945826113224, -0.004623638466000557, 0.0022596679627895355, 0.009142976254224777, 0.01602628454566002, 0.022909589111804962, 0.029792897403240204, 0.036676205694675446, 0.04355951398611069, 0.05044282227754593, 0.05732612684369087, 0.06420943140983582, 0.07109273970127106, 0.0779760479927063, 0.08485935628414154, 0.09174266457557678, 0.09862597286701202, 0.10550928115844727, 0.11239258944988251, 0.11927589774131775, 0.126159206032753, 0.13304251432418823, 0.13992580771446228, 0.14680913090705872, 0.15369243919849396, 0.1605757474899292, 0.16745905578136444, 0.17434236407279968, 0.18122567236423492, 0.18810898065567017, 0.1949922740459442, 0.20187559723854065, 0.2087589055299759, 0.21564221382141113, 0.22252552211284637, 0.22940883040428162, 0.23629213869571686, 0.2431754469871521, 0.25005874037742615, 0.2569420337677002, 0.26382532715797424, 0.2707086503505707, 0.2775919437408447, 0.28447526693344116, 0.2913585603237152, 0.29824188351631165, 0.3051251769065857, 0.31200850009918213, 0.3188917934894562, 0.3257751166820526, 0.33265841007232666, 0.3395417332649231, 0.34642502665519714, 0.3533083498477936, 0.3601916432380676, 0.36707496643066406]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 7.0, 8.0, 12.0, 20.0, 24.0, 9.0, 17.0, 23.0, 28.0, 30.0, 31.0, 31.0, 43.0, 35.0, 42.0, 52.0, 47.0, 48.0, 58.0, 60.0, 42.0, 51.0, 41.0, 35.0, 26.0, 24.0, 18.0, 17.0, 12.0, 18.0, 16.0, 14.0, 10.0, 8.0, 6.0, 5.0, 5.0, 7.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.17874622344970703, -0.1722867786884308, -0.16582733392715454, -0.1593678891658783, -0.15290844440460205, -0.1464489996433258, -0.13998955488204956, -0.13353011012077332, -0.12707066535949707, -0.12061122059822083, -0.11415177583694458, -0.10769233107566833, -0.10123288631439209, -0.09477344155311584, -0.088313989341259, -0.08185454457998276, -0.07539509236812592, -0.06893564760684967, -0.062476202845573425, -0.05601675435900688, -0.04955730959773064, -0.04309786483645439, -0.03663841634988785, -0.030178971588611603, -0.023719526827335358, -0.017260082066059113, -0.010800635442137718, -0.004341188818216324, 0.0021182559430599213, 0.008577700704336166, 0.01503714919090271, 0.021496593952178955, 0.0279560387134552, 0.034415483474731445, 0.04087492823600769, 0.047334376722574234, 0.05379382148385048, 0.060253266245126724, 0.06671271473169327, 0.07317215949296951, 0.07963160425424576, 0.086091049015522, 0.09255049377679825, 0.09900994598865509, 0.10546939074993134, 0.11192883551120758, 0.11838828027248383, 0.12484772503376007, 0.13130716979503632, 0.13776661455631256, 0.1442260593175888, 0.15068550407886505, 0.1571449488401413, 0.16360439360141754, 0.17006385326385498, 0.17652329802513123, 0.18298274278640747, 0.18944218754768372, 0.19590163230895996, 0.2023610770702362, 0.20882052183151245, 0.2152799665927887, 0.22173941135406494, 0.2281988561153412, 0.23465830087661743]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 6.0, 0.0, 1.0, 2.0, 6.0, 2.0, 3.0, 2.0, 7.0, 14.0, 19.0, 21.0, 21.0, 143.0, 4193415.0, 429.0, 88.0, 23.0, 11.0, 9.0, 2.0, 13.0, 9.0, 9.0, 3.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45068359375, -0.43648529052734375, -0.4222869873046875, -0.40808868408203125, -0.393890380859375, -0.37969207763671875, -0.3654937744140625, -0.35129547119140625, -0.33709716796875, -0.32289886474609375, -0.3087005615234375, -0.29450225830078125, -0.280303955078125, -0.26610565185546875, -0.2519073486328125, -0.23770904541015625, -0.2235107421875, -0.20931243896484375, -0.1951141357421875, -0.18091583251953125, -0.166717529296875, -0.15251922607421875, -0.1383209228515625, -0.12412261962890625, -0.10992431640625, -0.09572601318359375, -0.0815277099609375, -0.06732940673828125, -0.053131103515625, -0.03893280029296875, -0.0247344970703125, -0.01053619384765625, 0.003662109375, 0.01786041259765625, 0.0320587158203125, 0.04625701904296875, 0.060455322265625, 0.07465362548828125, 0.0888519287109375, 0.10305023193359375, 0.11724853515625, 0.13144683837890625, 0.1456451416015625, 0.15984344482421875, 0.174041748046875, 0.18824005126953125, 0.2024383544921875, 0.21663665771484375, 0.2308349609375, 0.24503326416015625, 0.2592315673828125, 0.27342987060546875, 0.287628173828125, 0.30182647705078125, 0.3160247802734375, 0.33022308349609375, 0.34442138671875, 0.35861968994140625, 0.3728179931640625, 0.38701629638671875, 0.401214599609375, 0.41541290283203125, 0.4296112060546875, 0.44380950927734375, 0.4580078125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 3.0, 7.0, 13.0, 20.0, 15.0, 13.0, 85.0, 342.0, 307.0, 75.0, 21.0, 12.0, 10.0, 2.0, 12.0, 8.0, 10.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0196075439453125, -0.018990755081176758, -0.018373966217041016, -0.017757177352905273, -0.01714038848876953, -0.01652359962463379, -0.015906810760498047, -0.015290021896362305, -0.014673233032226562, -0.01405644416809082, -0.013439655303955078, -0.012822866439819336, -0.012206077575683594, -0.011589288711547852, -0.01097249984741211, -0.010355710983276367, -0.009738922119140625, -0.009122133255004883, -0.00850534439086914, -0.007888555526733398, -0.007271766662597656, -0.006654977798461914, -0.006038188934326172, -0.00542140007019043, -0.0048046112060546875, -0.004187822341918945, -0.003571033477783203, -0.002954244613647461, -0.0023374557495117188, -0.0017206668853759766, -0.0011038780212402344, -0.0004870891571044922, 0.00012969970703125, 0.0007464885711669922, 0.0013632774353027344, 0.0019800662994384766, 0.0025968551635742188, 0.003213644027709961, 0.003830432891845703, 0.004447221755981445, 0.0050640106201171875, 0.00568079948425293, 0.006297588348388672, 0.006914377212524414, 0.007531166076660156, 0.008147954940795898, 0.00876474380493164, 0.009381532669067383, 0.009998321533203125, 0.010615110397338867, 0.01123189926147461, 0.011848688125610352, 0.012465476989746094, 0.013082265853881836, 0.013699054718017578, 0.01431584358215332, 0.014932632446289062, 0.015549421310424805, 0.016166210174560547, 0.01678299903869629, 0.01739978790283203, 0.018016576766967773, 0.018633365631103516, 0.019250154495239258, 0.019866943359375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 9.0, 57.0, 134.0, 229.0, 4188416.0, 5108.0, 175.0, 118.0, 41.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10382080078125, -0.10076045989990234, -0.09770011901855469, -0.09463977813720703, -0.09157943725585938, -0.08851909637451172, -0.08545875549316406, -0.0823984146118164, -0.07933807373046875, -0.0762777328491211, -0.07321739196777344, -0.07015705108642578, -0.06709671020507812, -0.06403636932373047, -0.06097602844238281, -0.057915687561035156, -0.0548553466796875, -0.051795005798339844, -0.04873466491699219, -0.04567432403564453, -0.042613983154296875, -0.03955364227294922, -0.03649330139160156, -0.033432960510253906, -0.03037261962890625, -0.027312278747558594, -0.024251937866210938, -0.02119159698486328, -0.018131256103515625, -0.015070915222167969, -0.012010574340820312, -0.008950233459472656, -0.005889892578125, -0.0028295516967773438, 0.0002307891845703125, 0.0032911300659179688, 0.006351470947265625, 0.009411811828613281, 0.012472152709960938, 0.015532493591308594, 0.01859283447265625, 0.021653175354003906, 0.024713516235351562, 0.02777385711669922, 0.030834197998046875, 0.03389453887939453, 0.03695487976074219, 0.040015220642089844, 0.0430755615234375, 0.046135902404785156, 0.04919624328613281, 0.05225658416748047, 0.055316925048828125, 0.05837726593017578, 0.06143760681152344, 0.0644979476928711, 0.06755828857421875, 0.0706186294555664, 0.07367897033691406, 0.07673931121826172, 0.07979965209960938, 0.08285999298095703, 0.08592033386230469, 0.08898067474365234, 0.092041015625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 40.0, 4023.0, 15.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.02752685546875, -0.02705511450767517, -0.026583373546600342, -0.026111632585525513, -0.025639891624450684, -0.025168150663375854, -0.024696409702301025, -0.024224668741226196, -0.023752927780151367, -0.023281186819076538, -0.02280944585800171, -0.02233770489692688, -0.02186596393585205, -0.02139422297477722, -0.020922482013702393, -0.020450741052627563, -0.019979000091552734, -0.019507259130477905, -0.019035518169403076, -0.018563777208328247, -0.018092036247253418, -0.01762029528617859, -0.01714855432510376, -0.01667681336402893, -0.0162050724029541, -0.015733331441879272, -0.015261590480804443, -0.014789849519729614, -0.014318108558654785, -0.013846367597579956, -0.013374626636505127, -0.012902885675430298, -0.012431144714355469, -0.01195940375328064, -0.01148766279220581, -0.011015921831130981, -0.010544180870056152, -0.010072439908981323, -0.009600698947906494, -0.009128957986831665, -0.008657217025756836, -0.008185476064682007, -0.007713735103607178, -0.007241994142532349, -0.0067702531814575195, -0.00629851222038269, -0.005826771259307861, -0.005355030298233032, -0.004883289337158203, -0.004411548376083374, -0.003939807415008545, -0.003468066453933716, -0.0029963254928588867, -0.0025245845317840576, -0.0020528435707092285, -0.0015811026096343994, -0.0011093616485595703, -0.0006376206874847412, -0.0001658797264099121, 0.000305861234664917, 0.0007776021957397461, 0.0012493431568145752, 0.0017210841178894043, 0.0021928250789642334, 0.0026645660400390625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1010.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.264337956905365, -0.2596517503261566, -0.25496554374694824, -0.25027933716773987, -0.2455931305885315, -0.24090690910816193, -0.23622070252895355, -0.23153449594974518, -0.2268482893705368, -0.22216208279132843, -0.21747587621212006, -0.21278966963291168, -0.20810344815254211, -0.20341724157333374, -0.19873103499412537, -0.194044828414917, -0.18935862183570862, -0.18467241525650024, -0.17998620867729187, -0.1753000020980835, -0.17061379551887512, -0.16592757403850555, -0.16124136745929718, -0.1565551608800888, -0.15186895430088043, -0.14718274772167206, -0.14249654114246368, -0.1378103345632553, -0.13312411308288574, -0.12843790650367737, -0.123751699924469, -0.11906549334526062, -0.11437928676605225, -0.10969308018684387, -0.1050068736076355, -0.10032065957784653, -0.09563445299863815, -0.09094824641942978, -0.08626203238964081, -0.08157582581043243, -0.07688961923122406, -0.07220341265201569, -0.06751720607280731, -0.06283099204301834, -0.05814478546380997, -0.05345857888460159, -0.04877236858010292, -0.04408615827560425, -0.039399951696395874, -0.0347137451171875, -0.030027534812688828, -0.025341326370835304, -0.02065511792898178, -0.015968909487128258, -0.011282701045274734, -0.006596490740776062, -0.001910284161567688, 0.0027759242802858353, 0.0074621327221393585, 0.012148341163992882, 0.016834549605846405, 0.02152075804769993, 0.02620696648955345, 0.030893176794052124, 0.0355793833732605]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 6.0, 2.0, 2.0, 4.0, 5.0, 7.0, 8.0, 13.0, 8.0, 15.0, 8.0, 23.0, 21.0, 28.0, 17.0, 39.0, 39.0, 40.0, 32.0, 39.0, 49.0, 39.0, 38.0, 47.0, 50.0, 41.0, 36.0, 33.0, 29.0, 36.0, 41.0, 28.0, 29.0, 18.0, 24.0, 21.0, 14.0, 13.0, 26.0, 10.0, 10.0, 5.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011171936988830566, -0.01081587839871645, -0.010459819808602333, -0.010103761218488216, -0.0097477026283741, -0.009391644038259983, -0.009035585448145866, -0.00867952685803175, -0.008323468267917633, -0.007967409677803516, -0.0076113510876894, -0.007255292497575283, -0.006899233907461166, -0.00654317531734705, -0.006187116727232933, -0.005831058137118816, -0.0054749995470047, -0.005118940956890583, -0.004762882366776466, -0.00440682377666235, -0.004050765186548233, -0.0036947065964341164, -0.0033386480063199997, -0.002982589416205883, -0.0026265308260917664, -0.0022704722359776497, -0.001914413645863533, -0.0015583550557494164, -0.0012022964656352997, -0.000846237875521183, -0.0004901792854070663, -0.00013412069529294968, 0.000221937894821167, 0.0005779964849352837, 0.0009340550750494003, 0.001290113665163517, 0.0016461722552776337, 0.0020022308453917503, 0.002358289435505867, 0.0027143480256199837, 0.0030704066157341003, 0.003426465205848217, 0.0037825237959623337, 0.00413858238607645, 0.004494640976190567, 0.004850699566304684, 0.0052067581564188, 0.005562816746532917, 0.005918875336647034, 0.00627493392676115, 0.006630992516875267, 0.006987051106989384, 0.0073431096971035, 0.007699168287217617, 0.008055226877331734, 0.00841128546744585, 0.008767344057559967, 0.009123402647674084, 0.0094794612377882, 0.009835519827902317, 0.010191578418016434, 0.01054763700813055, 0.010903695598244667, 0.011259754188358784, 0.0116158127784729]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 5.0, 11.0, 9.0, 13.0, 22.0, 54.0, 51.0, 82.0, 109.0, 133.0, 233.0, 338.0, 629.0, 890.0, 1554.0, 2896.0, 5653.0, 14042.0, 93113.0, 889195.0, 22922.0, 7657.0, 3739.0, 1982.0, 1178.0, 704.0, 453.0, 267.0, 195.0, 121.0, 92.0, 51.0, 40.0, 34.0, 18.0, 14.0, 16.0, 4.0, 10.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.028778076171875, -0.027884244918823242, -0.026990413665771484, -0.026096582412719727, -0.02520275115966797, -0.02430891990661621, -0.023415088653564453, -0.022521257400512695, -0.021627426147460938, -0.02073359489440918, -0.019839763641357422, -0.018945932388305664, -0.018052101135253906, -0.01715826988220215, -0.01626443862915039, -0.015370607376098633, -0.014476776123046875, -0.013582944869995117, -0.01268911361694336, -0.011795282363891602, -0.010901451110839844, -0.010007619857788086, -0.009113788604736328, -0.00821995735168457, -0.0073261260986328125, -0.006432294845581055, -0.005538463592529297, -0.004644632339477539, -0.0037508010864257812, -0.0028569698333740234, -0.0019631385803222656, -0.0010693073272705078, -0.00017547607421875, 0.0007183551788330078, 0.0016121864318847656, 0.0025060176849365234, 0.0033998489379882812, 0.004293680191040039, 0.005187511444091797, 0.006081342697143555, 0.0069751739501953125, 0.00786900520324707, 0.008762836456298828, 0.009656667709350586, 0.010550498962402344, 0.011444330215454102, 0.01233816146850586, 0.013231992721557617, 0.014125823974609375, 0.015019655227661133, 0.01591348648071289, 0.01680731773376465, 0.017701148986816406, 0.018594980239868164, 0.019488811492919922, 0.02038264274597168, 0.021276473999023438, 0.022170305252075195, 0.023064136505126953, 0.02395796775817871, 0.02485179901123047, 0.025745630264282227, 0.026639461517333984, 0.027533292770385742, 0.0284271240234375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 3.0, 7.0, 13.0, 20.0, 14.0, 14.0, 82.0, 342.0, 309.0, 76.0, 21.0, 12.0, 10.0, 2.0, 12.0, 8.0, 10.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0196075439453125, -0.01899099349975586, -0.01837444305419922, -0.017757892608642578, -0.017141342163085938, -0.016524791717529297, -0.015908241271972656, -0.015291690826416016, -0.014675140380859375, -0.014058589935302734, -0.013442039489746094, -0.012825489044189453, -0.012208938598632812, -0.011592388153076172, -0.010975837707519531, -0.01035928726196289, -0.00974273681640625, -0.00912618637084961, -0.008509635925292969, -0.007893085479736328, -0.0072765350341796875, -0.006659984588623047, -0.006043434143066406, -0.005426883697509766, -0.004810333251953125, -0.004193782806396484, -0.0035772323608398438, -0.002960681915283203, -0.0023441314697265625, -0.0017275810241699219, -0.0011110305786132812, -0.0004944801330566406, 0.0001220703125, 0.0007386207580566406, 0.0013551712036132812, 0.001971721649169922, 0.0025882720947265625, 0.003204822540283203, 0.0038213729858398438, 0.004437923431396484, 0.005054473876953125, 0.005671024322509766, 0.006287574768066406, 0.006904125213623047, 0.0075206756591796875, 0.008137226104736328, 0.008753776550292969, 0.00937032699584961, 0.00998687744140625, 0.01060342788696289, 0.011219978332519531, 0.011836528778076172, 0.012453079223632812, 0.013069629669189453, 0.013686180114746094, 0.014302730560302734, 0.014919281005859375, 0.015535831451416016, 0.016152381896972656, 0.016768932342529297, 0.017385482788085938, 0.018002033233642578, 0.01861858367919922, 0.01923513412475586, 0.0198516845703125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 8.0, 5.0, 4.0, 6.0, 7.0, 10.0, 9.0, 11.0, 11.0, 23.0, 25.0, 36.0, 49.0, 46.0, 68.0, 115.0, 154.0, 219.0, 341.0, 744.0, 1436.0, 14241.0, 1017728.0, 10064.0, 1381.0, 698.0, 351.0, 220.0, 145.0, 80.0, 69.0, 38.0, 51.0, 34.0, 21.0, 23.0, 21.0, 24.0, 9.0, 5.0, 8.0, 1.0, 9.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.051849365234375, -0.050201416015625, -0.048553466796875, -0.046905517578125, -0.045257568359375, -0.043609619140625, -0.041961669921875, -0.040313720703125, -0.038665771484375, -0.037017822265625, -0.035369873046875, -0.033721923828125, -0.032073974609375, -0.030426025390625, -0.028778076171875, -0.027130126953125, -0.025482177734375, -0.023834228515625, -0.022186279296875, -0.020538330078125, -0.018890380859375, -0.017242431640625, -0.015594482421875, -0.013946533203125, -0.012298583984375, -0.010650634765625, -0.009002685546875, -0.007354736328125, -0.005706787109375, -0.004058837890625, -0.002410888671875, -0.000762939453125, 0.000885009765625, 0.002532958984375, 0.004180908203125, 0.005828857421875, 0.007476806640625, 0.009124755859375, 0.010772705078125, 0.012420654296875, 0.014068603515625, 0.015716552734375, 0.017364501953125, 0.019012451171875, 0.020660400390625, 0.022308349609375, 0.023956298828125, 0.025604248046875, 0.027252197265625, 0.028900146484375, 0.030548095703125, 0.032196044921875, 0.033843994140625, 0.035491943359375, 0.037139892578125, 0.038787841796875, 0.040435791015625, 0.042083740234375, 0.043731689453125, 0.045379638671875, 0.047027587890625, 0.048675537109375, 0.050323486328125, 0.051971435546875, 0.053619384765625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 8.0, 4.0, 4.0, 6.0, 7.0, 10.0, 7.0, 11.0, 10.0, 20.0, 21.0, 22.0, 31.0, 23.0, 27.0, 41.0, 38.0, 39.0, 40.0, 42.0, 37.0, 36.0, 50.0, 41.0, 42.0, 45.0, 33.0, 34.0, 46.0, 23.0, 28.0, 14.0, 31.0, 20.0, 16.0, 18.0, 19.0, 21.0, 7.0, 5.0, 8.0, 1.0, 10.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.040008544921875, -0.03873395919799805, -0.037459373474121094, -0.03618478775024414, -0.03491020202636719, -0.033635616302490234, -0.03236103057861328, -0.031086444854736328, -0.029811859130859375, -0.028537273406982422, -0.02726268768310547, -0.025988101959228516, -0.024713516235351562, -0.02343893051147461, -0.022164344787597656, -0.020889759063720703, -0.01961517333984375, -0.018340587615966797, -0.017066001892089844, -0.01579141616821289, -0.014516830444335938, -0.013242244720458984, -0.011967658996582031, -0.010693073272705078, -0.009418487548828125, -0.008143901824951172, -0.006869316101074219, -0.005594730377197266, -0.0043201446533203125, -0.0030455589294433594, -0.0017709732055664062, -0.0004963874816894531, 0.0007781982421875, 0.002052783966064453, 0.0033273696899414062, 0.004601955413818359, 0.0058765411376953125, 0.007151126861572266, 0.008425712585449219, 0.009700298309326172, 0.010974884033203125, 0.012249469757080078, 0.013524055480957031, 0.014798641204833984, 0.016073226928710938, 0.01734781265258789, 0.018622398376464844, 0.019896984100341797, 0.02117156982421875, 0.022446155548095703, 0.023720741271972656, 0.02499532699584961, 0.026269912719726562, 0.027544498443603516, 0.02881908416748047, 0.030093669891357422, 0.031368255615234375, 0.03264284133911133, 0.03391742706298828, 0.035192012786865234, 0.03646659851074219, 0.03774118423461914, 0.039015769958496094, 0.04029035568237305, 0.04156494140625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 8.0, 13.0, 12.0, 18.0, 33.0, 31.0, 37.0, 64.0, 100.0, 129.0, 228.0, 391.0, 599.0, 1127.0, 2405.0, 4700.0, 11556.0, 37895.0, 348190.0, 574449.0, 43084.0, 12945.0, 5185.0, 2345.0, 1177.0, 673.0, 386.0, 294.0, 137.0, 96.0, 68.0, 52.0, 32.0, 18.0, 18.0, 16.0, 15.0, 3.0, 10.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.9848346710205078e-05, -1.9188039004802704e-05, -1.852773129940033e-05, -1.7867423593997955e-05, -1.720711588859558e-05, -1.6546808183193207e-05, -1.5886500477790833e-05, -1.5226192772388458e-05, -1.4565885066986084e-05, -1.390557736158371e-05, -1.3245269656181335e-05, -1.2584961950778961e-05, -1.1924654245376587e-05, -1.1264346539974213e-05, -1.0604038834571838e-05, -9.943731129169464e-06, -9.28342342376709e-06, -8.623115718364716e-06, -7.962808012962341e-06, -7.302500307559967e-06, -6.642192602157593e-06, -5.9818848967552185e-06, -5.321577191352844e-06, -4.66126948595047e-06, -4.000961780548096e-06, -3.3406540751457214e-06, -2.680346369743347e-06, -2.020038664340973e-06, -1.3597309589385986e-06, -6.994232535362244e-07, -3.91155481338501e-08, 6.211921572685242e-07, 1.2814998626708984e-06, 1.9418075680732727e-06, 2.602115273475647e-06, 3.2624229788780212e-06, 3.9227306842803955e-06, 4.58303838968277e-06, 5.243346095085144e-06, 5.903653800487518e-06, 6.563961505889893e-06, 7.224269211292267e-06, 7.884576916694641e-06, 8.544884622097015e-06, 9.20519232749939e-06, 9.865500032901764e-06, 1.0525807738304138e-05, 1.1186115443706512e-05, 1.1846423149108887e-05, 1.2506730854511261e-05, 1.3167038559913635e-05, 1.382734626531601e-05, 1.4487653970718384e-05, 1.5147961676120758e-05, 1.5808269381523132e-05, 1.6468577086925507e-05, 1.712888479232788e-05, 1.7789192497730255e-05, 1.844950020313263e-05, 1.9109807908535004e-05, 1.9770115613937378e-05, 2.0430423319339752e-05, 2.1090731024742126e-05, 2.17510387301445e-05, 2.2411346435546875e-05]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 9.0, 11.0, 19.0, 37.0, 33.0, 53.0, 86.0, 127.0, 176.0, 131.0, 109.0, 61.0, 52.0, 39.0, 21.0, 13.0, 9.0, 4.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.531839370727539e-05, -1.4865770936012268e-05, -1.4413148164749146e-05, -1.3960525393486023e-05, -1.35079026222229e-05, -1.3055279850959778e-05, -1.2602657079696655e-05, -1.2150034308433533e-05, -1.169741153717041e-05, -1.1244788765907288e-05, -1.0792165994644165e-05, -1.0339543223381042e-05, -9.88692045211792e-06, -9.434297680854797e-06, -8.981674909591675e-06, -8.529052138328552e-06, -8.07642936706543e-06, -7.623806595802307e-06, -7.1711838245391846e-06, -6.718561053276062e-06, -6.2659382820129395e-06, -5.813315510749817e-06, -5.360692739486694e-06, -4.908069968223572e-06, -4.455447196960449e-06, -4.002824425697327e-06, -3.550201654434204e-06, -3.0975788831710815e-06, -2.644956111907959e-06, -2.1923333406448364e-06, -1.7397105693817139e-06, -1.2870877981185913e-06, -8.344650268554688e-07, -3.818422555923462e-07, 7.078051567077637e-08, 5.234032869338989e-07, 9.760260581970215e-07, 1.428648829460144e-06, 1.8812716007232666e-06, 2.333894371986389e-06, 2.7865171432495117e-06, 3.2391399145126343e-06, 3.691762685775757e-06, 4.144385457038879e-06, 4.597008228302002e-06, 5.0496309995651245e-06, 5.502253770828247e-06, 5.95487654209137e-06, 6.407499313354492e-06, 6.860122084617615e-06, 7.312744855880737e-06, 7.76536762714386e-06, 8.217990398406982e-06, 8.670613169670105e-06, 9.123235940933228e-06, 9.57585871219635e-06, 1.0028481483459473e-05, 1.0481104254722595e-05, 1.0933727025985718e-05, 1.138634979724884e-05, 1.1838972568511963e-05, 1.2291595339775085e-05, 1.2744218111038208e-05, 1.319684088230133e-05, 1.3649463653564453e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 1.0, 4.0, 14.0, 17.0, 19.0, 29.0, 55.0, 78.0, 155.0, 392.0, 1531.0, 1034680.0, 10369.0, 714.0, 233.0, 102.0, 54.0, 30.0, 27.0, 19.0, 6.0, 11.0, 7.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.751319885253906e-05, -9.453482925891876e-05, -9.155645966529846e-05, -8.857809007167816e-05, -8.559972047805786e-05, -8.262135088443756e-05, -7.964298129081726e-05, -7.666461169719696e-05, -7.368624210357666e-05, -7.070787250995636e-05, -6.772950291633606e-05, -6.475113332271576e-05, -6.177276372909546e-05, -5.879439413547516e-05, -5.581602454185486e-05, -5.283765494823456e-05, -4.985928535461426e-05, -4.688091576099396e-05, -4.390254616737366e-05, -4.092417657375336e-05, -3.794580698013306e-05, -3.4967437386512756e-05, -3.1989067792892456e-05, -2.9010698199272156e-05, -2.6032328605651855e-05, -2.3053959012031555e-05, -2.0075589418411255e-05, -1.7097219824790955e-05, -1.4118850231170654e-05, -1.1140480637550354e-05, -8.162111043930054e-06, -5.183741450309753e-06, -2.205371856689453e-06, 7.729977369308472e-07, 3.7513673305511475e-06, 6.729736924171448e-06, 9.708106517791748e-06, 1.2686476111412048e-05, 1.566484570503235e-05, 1.864321529865265e-05, 2.162158489227295e-05, 2.459995448589325e-05, 2.757832407951355e-05, 3.055669367313385e-05, 3.353506326675415e-05, 3.651343286037445e-05, 3.949180245399475e-05, 4.247017204761505e-05, 4.544854164123535e-05, 4.842691123485565e-05, 5.140528082847595e-05, 5.438365042209625e-05, 5.736202001571655e-05, 6.034038960933685e-05, 6.331875920295715e-05, 6.629712879657745e-05, 6.927549839019775e-05, 7.225386798381805e-05, 7.523223757743835e-05, 7.821060717105865e-05, 8.118897676467896e-05, 8.416734635829926e-05, 8.714571595191956e-05, 9.012408554553986e-05, 9.310245513916016e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 12.0, 13.0, 10.0, 14.0, 27.0, 33.0, 39.0, 69.0, 102.0, 160.0, 207.0, 108.0, 60.0, 42.0, 24.0, 19.0, 13.0, 17.0, 10.0, 10.0, 7.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.539987564086914e-05, -7.31172040104866e-05, -7.083453238010406e-05, -6.855186074972153e-05, -6.626918911933899e-05, -6.398651748895645e-05, -6.170384585857391e-05, -5.9421174228191376e-05, -5.713850259780884e-05, -5.48558309674263e-05, -5.257315933704376e-05, -5.0290487706661224e-05, -4.8007816076278687e-05, -4.572514444589615e-05, -4.344247281551361e-05, -4.115980118513107e-05, -3.8877129554748535e-05, -3.6594457924366e-05, -3.431178629398346e-05, -3.202911466360092e-05, -2.9746443033218384e-05, -2.7463771402835846e-05, -2.5181099772453308e-05, -2.289842814207077e-05, -2.0615756511688232e-05, -1.8333084881305695e-05, -1.6050413250923157e-05, -1.3767741620540619e-05, -1.1485069990158081e-05, -9.202398359775543e-06, -6.919726729393005e-06, -4.6370550990104675e-06, -2.3543834686279297e-06, -7.171183824539185e-08, 2.210959792137146e-06, 4.493631422519684e-06, 6.776303052902222e-06, 9.05897468328476e-06, 1.1341646313667297e-05, 1.3624317944049835e-05, 1.5906989574432373e-05, 1.818966120481491e-05, 2.047233283519745e-05, 2.2755004465579987e-05, 2.5037676095962524e-05, 2.7320347726345062e-05, 2.96030193567276e-05, 3.188569098711014e-05, 3.4168362617492676e-05, 3.6451034247875214e-05, 3.873370587825775e-05, 4.101637750864029e-05, 4.329904913902283e-05, 4.5581720769405365e-05, 4.78643923997879e-05, 5.014706403017044e-05, 5.242973566055298e-05, 5.4712407290935516e-05, 5.6995078921318054e-05, 5.927775055170059e-05, 6.156042218208313e-05, 6.384309381246567e-05, 6.61257654428482e-05, 6.840843707323074e-05, 7.069110870361328e-05]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 44.0, 356.0, 570.0, 38.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3561144471168518, -0.3476490080356598, -0.3391835689544678, -0.33071815967559814, -0.32225272059440613, -0.3137872815132141, -0.3053218722343445, -0.29685643315315247, -0.28839099407196045, -0.27992555499076843, -0.2714601159095764, -0.2629947066307068, -0.25452926754951477, -0.24606382846832275, -0.23759840428829193, -0.2291329801082611, -0.2206675410270691, -0.21220210194587708, -0.20373667776584625, -0.19527125358581543, -0.1868058145046234, -0.1783403754234314, -0.16987495124340057, -0.16140952706336975, -0.15294408798217773, -0.14447864890098572, -0.1360132247209549, -0.12754780054092407, -0.11908236145973206, -0.11061692982912064, -0.10215149819850922, -0.0936860665678978, -0.08522063493728638, -0.07675520330667496, -0.06828977167606354, -0.05982434004545212, -0.0513589084148407, -0.04289347678422928, -0.03442804515361786, -0.02596261352300644, -0.01749718189239502, -0.0090317502617836, -0.0005663186311721802, 0.00789911299943924, 0.01636454463005066, 0.02482997626066208, 0.0332954078912735, 0.04176083952188492, 0.05022627115249634, 0.05869170278310776, 0.06715713441371918, 0.0756225660443306, 0.08408799767494202, 0.09255342930555344, 0.10101886093616486, 0.10948429256677628, 0.1179497241973877, 0.1264151632785797, 0.13488058745861053, 0.14334601163864136, 0.15181145071983337, 0.1602768898010254, 0.1687423139810562, 0.17720773816108704, 0.18567317724227905]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 5.0, 5.0, 8.0, 9.0, 8.0, 10.0, 11.0, 23.0, 24.0, 21.0, 27.0, 36.0, 24.0, 43.0, 31.0, 42.0, 41.0, 48.0, 36.0, 45.0, 43.0, 54.0, 44.0, 46.0, 41.0, 33.0, 29.0, 30.0, 31.0, 31.0, 27.0, 17.0, 12.0, 17.0, 9.0, 9.0, 4.0, 7.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.20078426599502563, -0.1936047375202179, -0.18642519414424896, -0.17924565076828003, -0.1720661222934723, -0.16488659381866455, -0.15770705044269562, -0.15052750706672668, -0.14334797859191895, -0.1361684501171112, -0.12898890674114227, -0.12180937081575394, -0.1146298348903656, -0.10745029896497726, -0.10027076303958893, -0.09309122711420059, -0.08591169118881226, -0.07873215526342392, -0.07155261933803558, -0.06437308341264725, -0.05719354748725891, -0.050014011561870575, -0.04283447563648224, -0.0356549397110939, -0.028475403785705566, -0.02129586786031723, -0.014116331934928894, -0.006936796009540558, 0.00024273991584777832, 0.0074222758412361145, 0.01460181176662445, 0.021781347692012787, 0.028960883617401123, 0.03614041954278946, 0.043319955468177795, 0.05049949139356613, 0.05767902731895447, 0.0648585632443428, 0.07203809916973114, 0.07921763509511948, 0.08639717102050781, 0.09357670694589615, 0.10075624287128448, 0.10793577879667282, 0.11511531472206116, 0.1222948506474495, 0.12947438657283783, 0.13665392994880676, 0.1438334584236145, 0.15101298689842224, 0.15819253027439117, 0.1653720736503601, 0.17255160212516785, 0.17973113059997559, 0.18691067397594452, 0.19409021735191345, 0.2012697458267212, 0.20844927430152893, 0.21562881767749786, 0.2228083610534668, 0.22998788952827454, 0.23716741800308228, 0.2443469613790512, 0.25152650475502014, 0.2587060332298279]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 6.0, 0.0, 4.0, 5.0, 3.0, 6.0, 4.0, 9.0, 8.0, 10.0, 5.0, 9.0, 9.0, 20.0, 28.0, 37.0, 47.0, 220.0, 2282.0, 4184046.0, 6318.0, 983.0, 62.0, 29.0, 26.0, 24.0, 19.0, 15.0, 14.0, 9.0, 9.0, 4.0, 6.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04644775390625, -0.044981956481933594, -0.04351615905761719, -0.04205036163330078, -0.040584564208984375, -0.03911876678466797, -0.03765296936035156, -0.036187171936035156, -0.03472137451171875, -0.033255577087402344, -0.03178977966308594, -0.03032398223876953, -0.028858184814453125, -0.02739238739013672, -0.025926589965820312, -0.024460792541503906, -0.0229949951171875, -0.021529197692871094, -0.020063400268554688, -0.01859760284423828, -0.017131805419921875, -0.01566600799560547, -0.014200210571289062, -0.012734413146972656, -0.01126861572265625, -0.009802818298339844, -0.008337020874023438, -0.006871223449707031, -0.005405426025390625, -0.003939628601074219, -0.0024738311767578125, -0.0010080337524414062, 0.000457763671875, 0.0019235610961914062, 0.0033893585205078125, 0.004855155944824219, 0.006320953369140625, 0.007786750793457031, 0.009252548217773438, 0.010718345642089844, 0.01218414306640625, 0.013649940490722656, 0.015115737915039062, 0.01658153533935547, 0.018047332763671875, 0.01951313018798828, 0.020978927612304688, 0.022444725036621094, 0.0239105224609375, 0.025376319885253906, 0.026842117309570312, 0.02830791473388672, 0.029773712158203125, 0.03123950958251953, 0.03270530700683594, 0.034171104431152344, 0.03563690185546875, 0.037102699279785156, 0.03856849670410156, 0.04003429412841797, 0.041500091552734375, 0.04296588897705078, 0.04443168640136719, 0.045897483825683594, 0.04736328125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 3.0, 6.0, 0.0, 2.0, 1.0, 6.0, 2.0, 3.0, 3.0, 11.0, 14.0, 18.0, 12.0, 19.0, 118.0, 411.0, 226.0, 49.0, 24.0, 9.0, 8.0, 3.0, 13.0, 9.0, 8.0, 3.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0193328857421875, -0.018720626831054688, -0.018108367919921875, -0.017496109008789062, -0.01688385009765625, -0.016271591186523438, -0.015659332275390625, -0.015047073364257812, -0.014434814453125, -0.013822555541992188, -0.013210296630859375, -0.012598037719726562, -0.01198577880859375, -0.011373519897460938, -0.010761260986328125, -0.010149002075195312, -0.0095367431640625, -0.008924484252929688, -0.008312225341796875, -0.0076999664306640625, -0.00708770751953125, -0.0064754486083984375, -0.005863189697265625, -0.0052509307861328125, -0.004638671875, -0.0040264129638671875, -0.003414154052734375, -0.0028018951416015625, -0.00218963623046875, -0.0015773773193359375, -0.000965118408203125, -0.0003528594970703125, 0.0002593994140625, 0.0008716583251953125, 0.001483917236328125, 0.0020961761474609375, 0.00270843505859375, 0.0033206939697265625, 0.003932952880859375, 0.0045452117919921875, 0.005157470703125, 0.0057697296142578125, 0.006381988525390625, 0.0069942474365234375, 0.00760650634765625, 0.008218765258789062, 0.008831024169921875, 0.009443283081054688, 0.0100555419921875, 0.010667800903320312, 0.011280059814453125, 0.011892318725585938, 0.01250457763671875, 0.013116836547851562, 0.013729095458984375, 0.014341354370117188, 0.01495361328125, 0.015565872192382812, 0.016178131103515625, 0.016790390014648438, 0.01740264892578125, 0.018014907836914062, 0.018627166748046875, 0.019239425659179688, 0.0198516845703125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 20.0, 53.0, 111.0, 179.0, 1071.0, 4186533.0, 5646.0, 424.0, 136.0, 64.0, 27.0, 11.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042266845703125, -0.04111671447753906, -0.039966583251953125, -0.03881645202636719, -0.03766632080078125, -0.03651618957519531, -0.035366058349609375, -0.03421592712402344, -0.0330657958984375, -0.03191566467285156, -0.030765533447265625, -0.029615402221679688, -0.02846527099609375, -0.027315139770507812, -0.026165008544921875, -0.025014877319335938, -0.02386474609375, -0.022714614868164062, -0.021564483642578125, -0.020414352416992188, -0.01926422119140625, -0.018114089965820312, -0.016963958740234375, -0.015813827514648438, -0.0146636962890625, -0.013513565063476562, -0.012363433837890625, -0.011213302612304688, -0.01006317138671875, -0.008913040161132812, -0.007762908935546875, -0.0066127777099609375, -0.005462646484375, -0.0043125152587890625, -0.003162384033203125, -0.0020122528076171875, -0.00086212158203125, 0.0002880096435546875, 0.001438140869140625, 0.0025882720947265625, 0.0037384033203125, 0.0048885345458984375, 0.006038665771484375, 0.0071887969970703125, 0.00833892822265625, 0.009489059448242188, 0.010639190673828125, 0.011789321899414062, 0.012939453125, 0.014089584350585938, 0.015239715576171875, 0.016389846801757812, 0.01753997802734375, 0.018690109252929688, 0.019840240478515625, 0.020990371704101562, 0.0221405029296875, 0.023290634155273438, 0.024440765380859375, 0.025590896606445312, 0.02674102783203125, 0.027891159057617188, 0.029041290283203125, 0.030191421508789062, 0.031341552734375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 18.0, 106.0, 3903.0, 32.0, 10.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0060882568359375, -0.005753874778747559, -0.005419492721557617, -0.005085110664367676, -0.004750728607177734, -0.004416346549987793, -0.0040819644927978516, -0.00374758243560791, -0.0034132003784179688, -0.0030788183212280273, -0.002744436264038086, -0.0024100542068481445, -0.002075672149658203, -0.0017412900924682617, -0.0014069080352783203, -0.001072525978088379, -0.0007381439208984375, -0.0004037618637084961, -6.937980651855469e-05, 0.0002650022506713867, 0.0005993843078613281, 0.0009337663650512695, 0.001268148422241211, 0.0016025304794311523, 0.0019369125366210938, 0.002271294593811035, 0.0026056766510009766, 0.002940058708190918, 0.0032744407653808594, 0.0036088228225708008, 0.003943204879760742, 0.004277586936950684, 0.004611968994140625, 0.004946351051330566, 0.005280733108520508, 0.005615115165710449, 0.005949497222900391, 0.006283879280090332, 0.0066182613372802734, 0.006952643394470215, 0.007287025451660156, 0.007621407508850098, 0.007955789566040039, 0.00829017162322998, 0.008624553680419922, 0.008958935737609863, 0.009293317794799805, 0.009627699851989746, 0.009962081909179688, 0.010296463966369629, 0.01063084602355957, 0.010965228080749512, 0.011299610137939453, 0.011633992195129395, 0.011968374252319336, 0.012302756309509277, 0.012637138366699219, 0.01297152042388916, 0.013305902481079102, 0.013640284538269043, 0.013974666595458984, 0.014309048652648926, 0.014643430709838867, 0.014977812767028809, 0.01531219482421875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 937.0, 79.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16899053752422333, -0.16585859656333923, -0.16272667050361633, -0.15959472954273224, -0.15646280348300934, -0.15333086252212524, -0.15019893646240234, -0.14706699550151825, -0.14393505454063416, -0.14080311357975006, -0.13767118752002716, -0.13453924655914307, -0.13140732049942017, -0.12827537953853607, -0.12514345347881317, -0.12201151251792908, -0.11887958645820618, -0.11574765294790268, -0.11261571943759918, -0.10948378592729568, -0.10635185241699219, -0.1032199114561081, -0.1000879779458046, -0.0969560444355011, -0.0938241109251976, -0.0906921774148941, -0.0875602439045906, -0.08442831039428711, -0.08129636943340302, -0.07816444337368011, -0.07503250241279602, -0.07190056890249252, -0.06876863539218903, -0.06563670188188553, -0.06250476837158203, -0.059372831135988235, -0.05624089762568474, -0.05310896411538124, -0.049977026879787445, -0.04684509336948395, -0.04371316358447075, -0.04058123007416725, -0.037449292838573456, -0.03431735932826996, -0.03118542581796646, -0.028053492307662964, -0.024921556934714317, -0.02178962156176567, -0.018657688051462173, -0.015525753609836102, -0.01239381916821003, -0.009261884726583958, -0.006129950284957886, -0.0029980167746543884, 0.00013391859829425812, 0.0032658539712429047, 0.006397787481546402, 0.009529721923172474, 0.012661656364798546, 0.015793591737747192, 0.01892552524805069, 0.022057458758354187, 0.025189394131302834, 0.02832132950425148, 0.03145326301455498]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 16.0, 28.0, 32.0, 53.0, 77.0, 83.0, 114.0, 107.0, 78.0, 102.0, 82.0, 61.0, 48.0, 39.0, 31.0, 15.0, 8.0, 6.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.018790721893310547, -0.01829395815730095, -0.01779719442129135, -0.017300430685281754, -0.016803666949272156, -0.016306903213262558, -0.01581013947725296, -0.015313375741243362, -0.014816612005233765, -0.014319848269224167, -0.013823084533214569, -0.013326320797204971, -0.012829557061195374, -0.012332793325185776, -0.011836029589176178, -0.01133926585316658, -0.010842502117156982, -0.010345738381147385, -0.009848974645137787, -0.009352210909128189, -0.008855447173118591, -0.008358683437108994, -0.007861919701099396, -0.007365155965089798, -0.0068683922290802, -0.006371628493070602, -0.005874864757061005, -0.005378101021051407, -0.004881337285041809, -0.004384573549032211, -0.0038878098130226135, -0.0033910460770130157, -0.002894282341003418, -0.00239751860499382, -0.0019007548689842224, -0.0014039911329746246, -0.0009072273969650269, -0.0004104636609554291, 8.63000750541687e-05, 0.0005830638110637665, 0.0010798275470733643, 0.001576591283082962, 0.00207335501909256, 0.0025701187551021576, 0.0030668824911117554, 0.003563646227121353, 0.004060409963130951, 0.004557173699140549, 0.0050539374351501465, 0.005550701171159744, 0.006047464907169342, 0.00654422864317894, 0.007040992379188538, 0.007537756115198135, 0.008034519851207733, 0.008531283587217331, 0.009028047323226929, 0.009524811059236526, 0.010021574795246124, 0.010518338531255722, 0.01101510226726532, 0.011511866003274918, 0.012008629739284515, 0.012505393475294113, 0.013002157211303711]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 10.0, 4.0, 15.0, 7.0, 14.0, 22.0, 37.0, 36.0, 69.0, 83.0, 133.0, 188.0, 350.0, 599.0, 1126.0, 2374.0, 6567.0, 31552.0, 967019.0, 27037.0, 6153.0, 2499.0, 1126.0, 585.0, 343.0, 191.0, 105.0, 80.0, 63.0, 44.0, 29.0, 13.0, 18.0, 6.0, 15.0, 7.0, 5.0, 8.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.02655029296875, -0.02573251724243164, -0.02491474151611328, -0.024096965789794922, -0.023279190063476562, -0.022461414337158203, -0.021643638610839844, -0.020825862884521484, -0.020008087158203125, -0.019190311431884766, -0.018372535705566406, -0.017554759979248047, -0.016736984252929688, -0.015919208526611328, -0.015101432800292969, -0.01428365707397461, -0.01346588134765625, -0.01264810562133789, -0.011830329895019531, -0.011012554168701172, -0.010194778442382812, -0.009377002716064453, -0.008559226989746094, -0.007741451263427734, -0.006923675537109375, -0.006105899810791016, -0.005288124084472656, -0.004470348358154297, -0.0036525726318359375, -0.002834796905517578, -0.0020170211791992188, -0.0011992454528808594, -0.0003814697265625, 0.0004363059997558594, 0.0012540817260742188, 0.002071857452392578, 0.0028896331787109375, 0.003707408905029297, 0.004525184631347656, 0.005342960357666016, 0.006160736083984375, 0.006978511810302734, 0.007796287536621094, 0.008614063262939453, 0.009431838989257812, 0.010249614715576172, 0.011067390441894531, 0.01188516616821289, 0.01270294189453125, 0.01352071762084961, 0.014338493347167969, 0.015156269073486328, 0.015974044799804688, 0.016791820526123047, 0.017609596252441406, 0.018427371978759766, 0.019245147705078125, 0.020062923431396484, 0.020880699157714844, 0.021698474884033203, 0.022516250610351562, 0.023334026336669922, 0.02415180206298828, 0.02496957778930664, 0.025787353515625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 3.0, 6.0, 0.0, 2.0, 1.0, 6.0, 2.0, 3.0, 3.0, 11.0, 14.0, 18.0, 13.0, 18.0, 118.0, 417.0, 223.0, 46.0, 24.0, 10.0, 7.0, 3.0, 13.0, 9.0, 8.0, 3.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0193328857421875, -0.018720388412475586, -0.018107891082763672, -0.017495393753051758, -0.016882896423339844, -0.01627039909362793, -0.015657901763916016, -0.015045404434204102, -0.014432907104492188, -0.013820409774780273, -0.01320791244506836, -0.012595415115356445, -0.011982917785644531, -0.011370420455932617, -0.010757923126220703, -0.010145425796508789, -0.009532928466796875, -0.008920431137084961, -0.008307933807373047, -0.007695436477661133, -0.007082939147949219, -0.006470441818237305, -0.005857944488525391, -0.0052454471588134766, -0.0046329498291015625, -0.0040204524993896484, -0.0034079551696777344, -0.0027954578399658203, -0.0021829605102539062, -0.0015704631805419922, -0.0009579658508300781, -0.00034546852111816406, 0.00026702880859375, 0.0008795261383056641, 0.0014920234680175781, 0.002104520797729492, 0.0027170181274414062, 0.0033295154571533203, 0.003942012786865234, 0.0045545101165771484, 0.0051670074462890625, 0.0057795047760009766, 0.006392002105712891, 0.007004499435424805, 0.007616996765136719, 0.008229494094848633, 0.008841991424560547, 0.009454488754272461, 0.010066986083984375, 0.010679483413696289, 0.011291980743408203, 0.011904478073120117, 0.012516975402832031, 0.013129472732543945, 0.01374197006225586, 0.014354467391967773, 0.014966964721679688, 0.015579462051391602, 0.016191959381103516, 0.01680445671081543, 0.017416954040527344, 0.018029451370239258, 0.018641948699951172, 0.019254446029663086, 0.019866943359375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 7.0, 5.0, 5.0, 9.0, 6.0, 9.0, 13.0, 15.0, 19.0, 33.0, 31.0, 32.0, 57.0, 50.0, 91.0, 110.0, 201.0, 436.0, 1162.0, 8989.0, 1025580.0, 9389.0, 1156.0, 438.0, 211.0, 124.0, 73.0, 55.0, 47.0, 37.0, 28.0, 22.0, 19.0, 18.0, 22.0, 13.0, 6.0, 8.0, 7.0, 5.0, 8.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.04315185546875, -0.04186391830444336, -0.04057598114013672, -0.03928804397583008, -0.03800010681152344, -0.0367121696472168, -0.035424232482910156, -0.034136295318603516, -0.032848358154296875, -0.031560420989990234, -0.030272483825683594, -0.028984546661376953, -0.027696609497070312, -0.026408672332763672, -0.02512073516845703, -0.02383279800415039, -0.02254486083984375, -0.02125692367553711, -0.01996898651123047, -0.018681049346923828, -0.017393112182617188, -0.016105175018310547, -0.014817237854003906, -0.013529300689697266, -0.012241363525390625, -0.010953426361083984, -0.009665489196777344, -0.008377552032470703, -0.0070896148681640625, -0.005801677703857422, -0.004513740539550781, -0.0032258033752441406, -0.0019378662109375, -0.0006499290466308594, 0.0006380081176757812, 0.0019259452819824219, 0.0032138824462890625, 0.004501819610595703, 0.005789756774902344, 0.007077693939208984, 0.008365631103515625, 0.009653568267822266, 0.010941505432128906, 0.012229442596435547, 0.013517379760742188, 0.014805316925048828, 0.01609325408935547, 0.01738119125366211, 0.01866912841796875, 0.01995706558227539, 0.02124500274658203, 0.022532939910888672, 0.023820877075195312, 0.025108814239501953, 0.026396751403808594, 0.027684688568115234, 0.028972625732421875, 0.030260562896728516, 0.031548500061035156, 0.0328364372253418, 0.03412437438964844, 0.03541231155395508, 0.03670024871826172, 0.03798818588256836, 0.039276123046875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 8.0, 4.0, 5.0, 9.0, 6.0, 10.0, 11.0, 13.0, 18.0, 30.0, 27.0, 22.0, 40.0, 24.0, 39.0, 36.0, 35.0, 50.0, 45.0, 36.0, 51.0, 51.0, 52.0, 36.0, 35.0, 39.0, 30.0, 37.0, 28.0, 27.0, 23.0, 17.0, 16.0, 18.0, 19.0, 13.0, 6.0, 8.0, 7.0, 5.0, 8.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.043975830078125, -0.042662620544433594, -0.04134941101074219, -0.04003620147705078, -0.038722991943359375, -0.03740978240966797, -0.03609657287597656, -0.034783363342285156, -0.03347015380859375, -0.032156944274902344, -0.030843734741210938, -0.02953052520751953, -0.028217315673828125, -0.02690410614013672, -0.025590896606445312, -0.024277687072753906, -0.0229644775390625, -0.021651268005371094, -0.020338058471679688, -0.01902484893798828, -0.017711639404296875, -0.01639842987060547, -0.015085220336914062, -0.013772010803222656, -0.01245880126953125, -0.011145591735839844, -0.009832382202148438, -0.008519172668457031, -0.007205963134765625, -0.005892753601074219, -0.0045795440673828125, -0.0032663345336914062, -0.001953125, -0.0006399154663085938, 0.0006732940673828125, 0.0019865036010742188, 0.003299713134765625, 0.004612922668457031, 0.0059261322021484375, 0.007239341735839844, 0.00855255126953125, 0.009865760803222656, 0.011178970336914062, 0.012492179870605469, 0.013805389404296875, 0.015118598937988281, 0.016431808471679688, 0.017745018005371094, 0.0190582275390625, 0.020371437072753906, 0.021684646606445312, 0.02299785614013672, 0.024311065673828125, 0.02562427520751953, 0.026937484741210938, 0.028250694274902344, 0.02956390380859375, 0.030877113342285156, 0.03219032287597656, 0.03350353240966797, 0.034816741943359375, 0.03612995147705078, 0.03744316101074219, 0.038756370544433594, 0.040069580078125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 6.0, 3.0, 8.0, 8.0, 19.0, 18.0, 32.0, 54.0, 78.0, 100.0, 184.0, 364.0, 522.0, 945.0, 1872.0, 4954.0, 12847.0, 49882.0, 798504.0, 140544.0, 23669.0, 7484.0, 3309.0, 1336.0, 745.0, 408.0, 240.0, 138.0, 90.0, 68.0, 35.0, 37.0, 15.0, 8.0, 9.0, 10.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6689300537109375e-05, -1.6194768249988556e-05, -1.5700235962867737e-05, -1.5205703675746918e-05, -1.4711171388626099e-05, -1.421663910150528e-05, -1.372210681438446e-05, -1.3227574527263641e-05, -1.2733042240142822e-05, -1.2238509953022003e-05, -1.1743977665901184e-05, -1.1249445378780365e-05, -1.0754913091659546e-05, -1.0260380804538727e-05, -9.765848517417908e-06, -9.271316230297089e-06, -8.77678394317627e-06, -8.28225165605545e-06, -7.787719368934631e-06, -7.293187081813812e-06, -6.798654794692993e-06, -6.304122507572174e-06, -5.809590220451355e-06, -5.315057933330536e-06, -4.820525646209717e-06, -4.325993359088898e-06, -3.831461071968079e-06, -3.3369287848472595e-06, -2.8423964977264404e-06, -2.3478642106056213e-06, -1.8533319234848022e-06, -1.3587996363639832e-06, -8.642673492431641e-07, -3.6973506212234497e-07, 1.2479722499847412e-07, 6.193295121192932e-07, 1.1138617992401123e-06, 1.6083940863609314e-06, 2.1029263734817505e-06, 2.5974586606025696e-06, 3.0919909477233887e-06, 3.5865232348442078e-06, 4.081055521965027e-06, 4.575587809085846e-06, 5.070120096206665e-06, 5.564652383327484e-06, 6.059184670448303e-06, 6.553716957569122e-06, 7.048249244689941e-06, 7.5427815318107605e-06, 8.03731381893158e-06, 8.531846106052399e-06, 9.026378393173218e-06, 9.520910680294037e-06, 1.0015442967414856e-05, 1.0509975254535675e-05, 1.1004507541656494e-05, 1.1499039828777313e-05, 1.1993572115898132e-05, 1.2488104403018951e-05, 1.298263669013977e-05, 1.347716897726059e-05, 1.3971701264381409e-05, 1.4466233551502228e-05, 1.4960765838623047e-05]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 5.0, 7.0, 12.0, 8.0, 24.0, 18.0, 30.0, 22.0, 52.0, 78.0, 48.0, 89.0, 55.0, 93.0, 59.0, 76.0, 50.0, 52.0, 45.0, 21.0, 39.0, 22.0, 21.0, 16.0, 11.0, 16.0, 4.0, 6.0, 2.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.351139068603516e-06, -4.198402166366577e-06, -4.045665264129639e-06, -3.8929283618927e-06, -3.7401914596557617e-06, -3.5874545574188232e-06, -3.4347176551818848e-06, -3.2819807529449463e-06, -3.129243850708008e-06, -2.9765069484710693e-06, -2.823770046234131e-06, -2.6710331439971924e-06, -2.518296241760254e-06, -2.3655593395233154e-06, -2.212822437286377e-06, -2.0600855350494385e-06, -1.9073486328125e-06, -1.7546117305755615e-06, -1.601874828338623e-06, -1.4491379261016846e-06, -1.296401023864746e-06, -1.1436641216278076e-06, -9.909272193908691e-07, -8.381903171539307e-07, -6.854534149169922e-07, -5.327165126800537e-07, -3.7997961044311523e-07, -2.2724270820617676e-07, -7.450580596923828e-08, 7.82310962677002e-08, 2.3096799850463867e-07, 3.8370490074157715e-07, 5.364418029785156e-07, 6.891787052154541e-07, 8.419156074523926e-07, 9.94652509689331e-07, 1.1473894119262695e-06, 1.300126314163208e-06, 1.4528632164001465e-06, 1.605600118637085e-06, 1.7583370208740234e-06, 1.911073923110962e-06, 2.0638108253479004e-06, 2.216547727584839e-06, 2.3692846298217773e-06, 2.522021532058716e-06, 2.6747584342956543e-06, 2.8274953365325928e-06, 2.9802322387695312e-06, 3.1329691410064697e-06, 3.285706043243408e-06, 3.4384429454803467e-06, 3.591179847717285e-06, 3.7439167499542236e-06, 3.896653652191162e-06, 4.049390554428101e-06, 4.202127456665039e-06, 4.3548643589019775e-06, 4.507601261138916e-06, 4.6603381633758545e-06, 4.813075065612793e-06, 4.9658119678497314e-06, 5.11854887008667e-06, 5.271285772323608e-06, 5.424022674560547e-06]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 11.0, 4.0, 8.0, 17.0, 18.0, 22.0, 23.0, 36.0, 46.0, 90.0, 159.0, 361.0, 1570.0, 999818.0, 44801.0, 899.0, 288.0, 123.0, 83.0, 40.0, 35.0, 30.0, 12.0, 18.0, 9.0, 9.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.1140785217285156e-05, -4.963018000125885e-05, -4.8119574785232544e-05, -4.660896956920624e-05, -4.509836435317993e-05, -4.3587759137153625e-05, -4.207715392112732e-05, -4.056654870510101e-05, -3.905594348907471e-05, -3.75453382730484e-05, -3.6034733057022095e-05, -3.452412784099579e-05, -3.301352262496948e-05, -3.1502917408943176e-05, -2.999231219291687e-05, -2.8481706976890564e-05, -2.6971101760864258e-05, -2.546049654483795e-05, -2.3949891328811646e-05, -2.243928611278534e-05, -2.0928680896759033e-05, -1.9418075680732727e-05, -1.790747046470642e-05, -1.6396865248680115e-05, -1.4886260032653809e-05, -1.3375654816627502e-05, -1.1865049600601196e-05, -1.035444438457489e-05, -8.843839168548584e-06, -7.333233952522278e-06, -5.822628736495972e-06, -4.3120235204696655e-06, -2.8014183044433594e-06, -1.2908130884170532e-06, 2.1979212760925293e-07, 1.730397343635559e-06, 3.2410025596618652e-06, 4.751607775688171e-06, 6.2622129917144775e-06, 7.772818207740784e-06, 9.28342342376709e-06, 1.0794028639793396e-05, 1.2304633855819702e-05, 1.3815239071846008e-05, 1.5325844287872314e-05, 1.683644950389862e-05, 1.8347054719924927e-05, 1.9857659935951233e-05, 2.136826515197754e-05, 2.2878870368003845e-05, 2.438947558403015e-05, 2.5900080800056458e-05, 2.7410686016082764e-05, 2.892129123210907e-05, 3.0431896448135376e-05, 3.194250166416168e-05, 3.345310688018799e-05, 3.4963712096214294e-05, 3.64743173122406e-05, 3.798492252826691e-05, 3.949552774429321e-05, 4.100613296031952e-05, 4.2516738176345825e-05, 4.402734339237213e-05, 4.553794860839844e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 10.0, 1.0, 9.0, 18.0, 15.0, 16.0, 18.0, 27.0, 24.0, 44.0, 50.0, 65.0, 89.0, 149.0, 114.0, 83.0, 60.0, 44.0, 30.0, 26.0, 23.0, 22.0, 11.0, 14.0, 11.0, 7.0, 4.0, 3.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.227327346801758e-05, -5.072541534900665e-05, -4.917755722999573e-05, -4.76296991109848e-05, -4.608184099197388e-05, -4.453398287296295e-05, -4.2986124753952026e-05, -4.14382666349411e-05, -3.9890408515930176e-05, -3.834255039691925e-05, -3.6794692277908325e-05, -3.52468341588974e-05, -3.3698976039886475e-05, -3.215111792087555e-05, -3.0603259801864624e-05, -2.90554016828537e-05, -2.7507543563842773e-05, -2.5959685444831848e-05, -2.4411827325820923e-05, -2.2863969206809998e-05, -2.1316111087799072e-05, -1.9768252968788147e-05, -1.822039484977722e-05, -1.6672536730766296e-05, -1.5124678611755371e-05, -1.3576820492744446e-05, -1.202896237373352e-05, -1.0481104254722595e-05, -8.93324613571167e-06, -7.385388016700745e-06, -5.837529897689819e-06, -4.289671778678894e-06, -2.7418136596679688e-06, -1.1939555406570435e-06, 3.5390257835388184e-07, 1.9017606973648071e-06, 3.4496188163757324e-06, 4.997476935386658e-06, 6.545335054397583e-06, 8.093193173408508e-06, 9.641051292419434e-06, 1.1188909411430359e-05, 1.2736767530441284e-05, 1.428462564945221e-05, 1.5832483768463135e-05, 1.738034188747406e-05, 1.8928200006484985e-05, 2.047605812549591e-05, 2.2023916244506836e-05, 2.357177436351776e-05, 2.5119632482528687e-05, 2.6667490601539612e-05, 2.8215348720550537e-05, 2.9763206839561462e-05, 3.131106495857239e-05, 3.285892307758331e-05, 3.440678119659424e-05, 3.5954639315605164e-05, 3.750249743461609e-05, 3.9050355553627014e-05, 4.059821367263794e-05, 4.2146071791648865e-05, 4.369392991065979e-05, 4.5241788029670715e-05, 4.678964614868164e-05]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 962.0, 55.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1434638798236847, -0.10585266351699829, -0.06824144721031189, -0.03063023090362549, 0.006980985403060913, 0.044592201709747314, 0.08220341801643372, 0.11981463432312012, 0.15742585062980652, 0.19503706693649292, 0.23264828324317932, 0.2702594995498657, 0.3078707158565521, 0.3454819321632385, 0.3830931484699249, 0.42070436477661133, 0.45831558108329773, 0.49592679738998413, 0.5335379838943481, 0.5711492300033569, 0.6087604761123657, 0.6463716626167297, 0.6839828491210938, 0.7215940952301025, 0.7592053413391113, 0.7968165874481201, 0.8344277739524841, 0.8720389604568481, 0.9096502065658569, 0.9472614526748657, 0.9848726391792297, 1.0224838256835938, 1.0600950717926025, 1.0977063179016113, 1.1353175640106201, 1.1729286909103394, 1.2105399370193481, 1.248151183128357, 1.2857623100280762, 1.323373556137085, 1.3609848022460938, 1.3985960483551025, 1.4362072944641113, 1.4738184213638306, 1.5114296674728394, 1.5490409135818481, 1.5866520404815674, 1.6242632865905762, 1.661874532699585, 1.6994857788085938, 1.7370970249176025, 1.7747081518173218, 1.8123193979263306, 1.8499306440353394, 1.8875417709350586, 1.9251530170440674, 1.9627642631530762, 2.000375509262085, 2.0379867553710938, 2.0755980014801025, 2.1132092475891113, 2.150820255279541, 2.18843150138855, 2.2260427474975586, 2.2636539936065674]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 6.0, 8.0, 6.0, 17.0, 20.0, 10.0, 11.0, 16.0, 21.0, 22.0, 21.0, 24.0, 31.0, 31.0, 42.0, 37.0, 38.0, 44.0, 42.0, 54.0, 34.0, 41.0, 47.0, 45.0, 35.0, 34.0, 24.0, 35.0, 32.0, 30.0, 16.0, 19.0, 20.0, 13.0, 14.0, 7.0, 9.0, 5.0, 8.0, 4.0, 4.0, 0.0, 4.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18014496564865112, -0.17396490275859833, -0.16778483986854553, -0.16160479187965393, -0.15542472898960114, -0.14924466609954834, -0.14306460320949554, -0.13688454031944275, -0.13070449233055115, -0.12452442944049835, -0.11834437400102615, -0.11216431111097336, -0.10598425567150116, -0.09980419278144836, -0.09362412989139557, -0.08744406700134277, -0.08126400411128998, -0.07508394122123718, -0.06890388578176498, -0.06272382289171219, -0.05654376372694969, -0.050363704562187195, -0.0441836416721344, -0.0380035825073719, -0.031823523342609406, -0.02564346417784691, -0.019463403150439262, -0.013283342123031616, -0.007103282958269119, -0.0009232237935066223, 0.005256839096546173, 0.01143689826130867, 0.017616957426071167, 0.023797016590833664, 0.02997707761824131, 0.036157138645648956, 0.04233719781041145, 0.04851725697517395, 0.054697319865226746, 0.06087737902998924, 0.06705743819475174, 0.07323750108480453, 0.07941755652427673, 0.08559761941432953, 0.09177768230438232, 0.09795773774385452, 0.10413780063390732, 0.11031785607337952, 0.11649791896343231, 0.12267798185348511, 0.1288580447435379, 0.1350381076335907, 0.1412181556224823, 0.1473982185125351, 0.1535782814025879, 0.15975834429264069, 0.16593840718269348, 0.17211847007274628, 0.17829853296279907, 0.18447858095169067, 0.19065864384174347, 0.19683870673179626, 0.20301876962184906, 0.20919883251190186, 0.21537888050079346]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 7.0, 4.0, 3.0, 7.0, 7.0, 10.0, 10.0, 9.0, 10.0, 24.0, 106.0, 4193696.0, 247.0, 44.0, 14.0, 15.0, 10.0, 13.0, 5.0, 4.0, 4.0, 4.0, 3.0, 2.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.00033211708068847656, -0.0003213733434677124, -0.00031062960624694824, -0.0002998858690261841, -0.0002891421318054199, -0.00027839839458465576, -0.0002676546573638916, -0.00025691092014312744, -0.0002461671829223633, -0.00023542344570159912, -0.00022467970848083496, -0.0002139359712600708, -0.00020319223403930664, -0.00019244849681854248, -0.00018170475959777832, -0.00017096102237701416, -0.00016021728515625, -0.00014947354793548584, -0.00013872981071472168, -0.00012798607349395752, -0.00011724233627319336, -0.0001064985990524292, -9.575486183166504e-05, -8.501112461090088e-05, -7.426738739013672e-05, -6.352365016937256e-05, -5.27799129486084e-05, -4.203617572784424e-05, -3.129243850708008e-05, -2.0548701286315918e-05, -9.804964065551758e-06, 9.387731552124023e-07, 1.1682510375976562e-05, 2.2426247596740723e-05, 3.316998481750488e-05, 4.391372203826904e-05, 5.46574592590332e-05, 6.540119647979736e-05, 7.614493370056152e-05, 8.688867092132568e-05, 9.763240814208984e-05, 0.000108376145362854, 0.00011911988258361816, 0.00012986361980438232, 0.00014060735702514648, 0.00015135109424591064, 0.0001620948314666748, 0.00017283856868743896, 0.00018358230590820312, 0.00019432604312896729, 0.00020506978034973145, 0.0002158135175704956, 0.00022655725479125977, 0.00023730099201202393, 0.0002480447292327881, 0.00025878846645355225, 0.0002695322036743164, 0.00028027594089508057, 0.0002910196781158447, 0.0003017634153366089, 0.00031250715255737305, 0.0003232508897781372, 0.00033399462699890137, 0.00034473836421966553, 0.0003554821014404297]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 4.0, 9.0, 15.0, 17.0, 15.0, 18.0, 119.0, 400.0, 239.0, 47.0, 23.0, 9.0, 8.0, 5.0, 12.0, 9.0, 7.0, 3.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0193634033203125, -0.01875019073486328, -0.018136978149414062, -0.017523765563964844, -0.016910552978515625, -0.016297340393066406, -0.015684127807617188, -0.015070915222167969, -0.01445770263671875, -0.013844490051269531, -0.013231277465820312, -0.012618064880371094, -0.012004852294921875, -0.011391639709472656, -0.010778427124023438, -0.010165214538574219, -0.009552001953125, -0.008938789367675781, -0.008325576782226562, -0.007712364196777344, -0.007099151611328125, -0.006485939025878906, -0.0058727264404296875, -0.005259513854980469, -0.00464630126953125, -0.004033088684082031, -0.0034198760986328125, -0.0028066635131835938, -0.002193450927734375, -0.0015802383422851562, -0.0009670257568359375, -0.00035381317138671875, 0.0002593994140625, 0.0008726119995117188, 0.0014858245849609375, 0.0020990371704101562, 0.002712249755859375, 0.0033254623413085938, 0.0039386749267578125, 0.004551887512207031, 0.00516510009765625, 0.005778312683105469, 0.0063915252685546875, 0.007004737854003906, 0.007617950439453125, 0.008231163024902344, 0.008844375610351562, 0.009457588195800781, 0.01007080078125, 0.010684013366699219, 0.011297225952148438, 0.011910438537597656, 0.012523651123046875, 0.013136863708496094, 0.013750076293945312, 0.014363288879394531, 0.01497650146484375, 0.015589714050292969, 0.016202926635742188, 0.016816139221191406, 0.017429351806640625, 0.018042564392089844, 0.018655776977539062, 0.01926898956298828, 0.0198822021484375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 22.0, 15.0, 34.0, 69.0, 84.0, 84.0, 90.0, 4193364.0, 87.0, 92.0, 112.0, 92.0, 64.0, 35.0, 32.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015115737915039062, -0.0014669299125671387, -0.001422286033630371, -0.0013776421546936035, -0.001332998275756836, -0.0012883543968200684, -0.0012437105178833008, -0.0011990666389465332, -0.0011544227600097656, -0.001109778881072998, -0.0010651350021362305, -0.0010204911231994629, -0.0009758472442626953, -0.0009312033653259277, -0.0008865594863891602, -0.0008419156074523926, -0.000797271728515625, -0.0007526278495788574, -0.0007079839706420898, -0.0006633400917053223, -0.0006186962127685547, -0.0005740523338317871, -0.0005294084548950195, -0.00048476457595825195, -0.0004401206970214844, -0.0003954768180847168, -0.0003508329391479492, -0.00030618906021118164, -0.00026154518127441406, -0.00021690130233764648, -0.0001722574234008789, -0.00012761354446411133, -8.296966552734375e-05, -3.832578659057617e-05, 6.318092346191406e-06, 5.0961971282958984e-05, 9.560585021972656e-05, 0.00014024972915649414, 0.00018489360809326172, 0.0002295374870300293, 0.0002741813659667969, 0.00031882524490356445, 0.00036346912384033203, 0.0004081130027770996, 0.0004527568817138672, 0.0004974007606506348, 0.0005420446395874023, 0.0005866885185241699, 0.0006313323974609375, 0.0006759762763977051, 0.0007206201553344727, 0.0007652640342712402, 0.0008099079132080078, 0.0008545517921447754, 0.000899195671081543, 0.0009438395500183105, 0.0009884834289550781, 0.0010331273078918457, 0.0010777711868286133, 0.0011224150657653809, 0.0011670589447021484, 0.001211702823638916, 0.0012563467025756836, 0.0013009905815124512, 0.0013456344604492188]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4095.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [0.0, 7.059425115585327e-06, 1.4118850231170654e-05, 2.117827534675598e-05, 2.823770046234131e-05, 3.5297125577926636e-05, 4.235655069351196e-05, 4.941597580909729e-05, 5.647540092468262e-05, 6.353482604026794e-05, 7.059425115585327e-05, 7.76536762714386e-05, 8.471310138702393e-05, 9.177252650260925e-05, 9.883195161819458e-05, 0.00010589137673377991, 0.00011295080184936523, 0.00012001022696495056, 0.0001270696520805359, 0.00013412907719612122, 0.00014118850231170654, 0.00014824792742729187, 0.0001553073525428772, 0.00016236677765846252, 0.00016942620277404785, 0.00017648562788963318, 0.0001835450530052185, 0.00019060447812080383, 0.00019766390323638916, 0.0002047233283519745, 0.00021178275346755981, 0.00021884217858314514, 0.00022590160369873047, 0.0002329610288143158, 0.00024002045392990112, 0.00024707987904548645, 0.0002541393041610718, 0.0002611987292766571, 0.00026825815439224243, 0.00027531757950782776, 0.0002823770046234131, 0.0002894364297389984, 0.00029649585485458374, 0.00030355527997016907, 0.0003106147050857544, 0.0003176741302013397, 0.00032473355531692505, 0.0003317929804325104, 0.0003388524055480957, 0.00034591183066368103, 0.00035297125577926636, 0.0003600306808948517, 0.000367090106010437, 0.00037414953112602234, 0.00038120895624160767, 0.000388268381357193, 0.0003953278064727783, 0.00040238723158836365, 0.000409446656703949, 0.0004165060818195343, 0.00042356550693511963, 0.00043062493205070496, 0.0004376843571662903, 0.0004447437822818756, 0.00045180320739746094]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1011.0, 7.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024557714350521564, -0.002335949568077922, -0.0022161277011036873, -0.0020963058341294527, -0.001976483967155218, -0.0018566621001809835, -0.001736840233206749, -0.0016170183662325144, -0.0014971964992582798, -0.0013773746322840452, -0.0012575527653098106, -0.001137730898335576, -0.0010179090313613415, -0.000898087106179446, -0.0007782652392052114, -0.0006584433722309768, -0.0005386214470490813, -0.00041879958007484674, -0.00029897771310061216, -0.00017915581702254713, -5.9333950048312545e-05, 6.048794602975249e-05, 0.00018030981300398707, 0.00030013167997822165, 0.00041995354695245624, 0.0005397754139266908, 0.0006595972809009254, 0.0007794192060828209, 0.0008992410730570555, 0.00101906294003129, 0.0011388848070055246, 0.0012587066739797592, 0.0013785285409539938, 0.0014983504079282284, 0.001618172274902463, 0.0017379941418766975, 0.0018578160088509321, 0.0019776378758251667, 0.0020974597427994013, 0.002217281609773636, 0.0023371034767478704, 0.002456925343722105, 0.0025767472106963396, 0.002696569077670574, 0.0028163909446448088, 0.0029362128116190434, 0.003056034678593278, 0.0031758565455675125, 0.0032956786453723907, 0.0034155005123466253, 0.00353532237932086, 0.0036551442462950945, 0.003774966113269329, 0.0038947879802435637, 0.004014609847217798, 0.0041344319470226765, 0.004254253581166267, 0.004374075680971146, 0.0044938973151147366, 0.004613719414919615, 0.004733541049063206, 0.004853363148868084, 0.004973184783011675, 0.005093006882816553, 0.005212828516960144]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 12.0, 16.0, 36.0, 86.0, 129.0, 210.0, 164.0, 136.0, 98.0, 53.0, 26.0, 16.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00039565563201904297, -0.0003751404583454132, -0.00035462528467178345, -0.0003341101109981537, -0.0003135949373245239, -0.00029307976365089417, -0.0002725645899772644, -0.00025204941630363464, -0.00023153424263000488, -0.00021101906895637512, -0.00019050389528274536, -0.0001699887216091156, -0.00014947354793548584, -0.00012895837426185608, -0.00010844320058822632, -8.792802691459656e-05, -6.74128532409668e-05, -4.6897679567337036e-05, -2.6382505893707275e-05, -5.867332220077515e-06, 1.4647841453552246e-05, 3.516301512718201e-05, 5.567818880081177e-05, 7.619336247444153e-05, 9.670853614807129e-05, 0.00011722370982170105, 0.0001377388834953308, 0.00015825405716896057, 0.00017876923084259033, 0.0001992844045162201, 0.00021979957818984985, 0.00024031475186347961, 0.0002608299255371094, 0.00028134509921073914, 0.0003018602728843689, 0.00032237544655799866, 0.0003428906202316284, 0.0003634057939052582, 0.00038392096757888794, 0.0004044361412525177, 0.00042495131492614746, 0.0004454664885997772, 0.000465981662273407, 0.00048649683594703674, 0.0005070120096206665, 0.0005275271832942963, 0.000548042356967926, 0.0005685575306415558, 0.0005890727043151855, 0.0006095878779888153, 0.0006301030516624451, 0.0006506182253360748, 0.0006711333990097046, 0.0006916485726833344, 0.0007121637463569641, 0.0007326789200305939, 0.0007531940937042236, 0.0007737092673778534, 0.0007942244410514832, 0.0008147396147251129, 0.0008352547883987427, 0.0008557699620723724, 0.0008762851357460022, 0.000896800309419632, 0.0009173154830932617]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 0.0, 4.0, 0.0, 4.0, 8.0, 3.0, 9.0, 11.0, 16.0, 19.0, 30.0, 26.0, 46.0, 67.0, 108.0, 136.0, 227.0, 368.0, 644.0, 1066.0, 2036.0, 5016.0, 20546.0, 964614.0, 40333.0, 7310.0, 2663.0, 1276.0, 728.0, 404.0, 242.0, 161.0, 110.0, 81.0, 55.0, 56.0, 23.0, 30.0, 15.0, 14.0, 16.0, 3.0, 6.0, 9.0, 1.0, 2.0, 7.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0295562744140625, -0.02862238883972168, -0.02768850326538086, -0.02675461769104004, -0.02582073211669922, -0.0248868465423584, -0.023952960968017578, -0.023019075393676758, -0.022085189819335938, -0.021151304244995117, -0.020217418670654297, -0.019283533096313477, -0.018349647521972656, -0.017415761947631836, -0.016481876373291016, -0.015547990798950195, -0.014614105224609375, -0.013680219650268555, -0.012746334075927734, -0.011812448501586914, -0.010878562927246094, -0.009944677352905273, -0.009010791778564453, -0.008076906204223633, -0.0071430206298828125, -0.006209135055541992, -0.005275249481201172, -0.0043413639068603516, -0.0034074783325195312, -0.002473592758178711, -0.0015397071838378906, -0.0006058216094970703, 0.00032806396484375, 0.0012619495391845703, 0.0021958351135253906, 0.003129720687866211, 0.004063606262207031, 0.0049974918365478516, 0.005931377410888672, 0.006865262985229492, 0.0077991485595703125, 0.008733034133911133, 0.009666919708251953, 0.010600805282592773, 0.011534690856933594, 0.012468576431274414, 0.013402462005615234, 0.014336347579956055, 0.015270233154296875, 0.016204118728637695, 0.017138004302978516, 0.018071889877319336, 0.019005775451660156, 0.019939661026000977, 0.020873546600341797, 0.021807432174682617, 0.022741317749023438, 0.023675203323364258, 0.024609088897705078, 0.0255429744720459, 0.02647686004638672, 0.02741074562072754, 0.02834463119506836, 0.02927851676940918, 0.03021240234375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 4.0, 9.0, 15.0, 17.0, 15.0, 18.0, 119.0, 400.0, 239.0, 47.0, 23.0, 9.0, 8.0, 5.0, 12.0, 9.0, 7.0, 3.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0193634033203125, -0.01875019073486328, -0.018136978149414062, -0.017523765563964844, -0.016910552978515625, -0.016297340393066406, -0.015684127807617188, -0.015070915222167969, -0.01445770263671875, -0.013844490051269531, -0.013231277465820312, -0.012618064880371094, -0.012004852294921875, -0.011391639709472656, -0.010778427124023438, -0.010165214538574219, -0.009552001953125, -0.008938789367675781, -0.008325576782226562, -0.007712364196777344, -0.007099151611328125, -0.006485939025878906, -0.0058727264404296875, -0.005259513854980469, -0.00464630126953125, -0.004033088684082031, -0.0034198760986328125, -0.0028066635131835938, -0.002193450927734375, -0.0015802383422851562, -0.0009670257568359375, -0.00035381317138671875, 0.0002593994140625, 0.0008726119995117188, 0.0014858245849609375, 0.0020990371704101562, 0.002712249755859375, 0.0033254623413085938, 0.0039386749267578125, 0.004551887512207031, 0.00516510009765625, 0.005778312683105469, 0.0063915252685546875, 0.007004737854003906, 0.007617950439453125, 0.008231163024902344, 0.008844375610351562, 0.009457588195800781, 0.01007080078125, 0.010684013366699219, 0.011297225952148438, 0.011910438537597656, 0.012523651123046875, 0.013136863708496094, 0.013750076293945312, 0.014363288879394531, 0.01497650146484375, 0.015589714050292969, 0.016202926635742188, 0.016816139221191406, 0.017429351806640625, 0.018042564392089844, 0.018655776977539062, 0.01926898956298828, 0.0198822021484375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 2.0, 6.0, 4.0, 8.0, 4.0, 8.0, 11.0, 12.0, 13.0, 17.0, 17.0, 20.0, 21.0, 35.0, 31.0, 41.0, 78.0, 75.0, 110.0, 140.0, 236.0, 423.0, 908.0, 2732.0, 916797.0, 122973.0, 1913.0, 727.0, 384.0, 197.0, 129.0, 91.0, 84.0, 54.0, 53.0, 39.0, 32.0, 20.0, 19.0, 10.0, 13.0, 15.0, 13.0, 11.0, 7.0, 3.0, 3.0, 5.0, 5.0, 1.0, 4.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03192138671875, -0.030776500701904297, -0.029631614685058594, -0.02848672866821289, -0.027341842651367188, -0.026196956634521484, -0.02505207061767578, -0.023907184600830078, -0.022762298583984375, -0.021617412567138672, -0.02047252655029297, -0.019327640533447266, -0.018182754516601562, -0.01703786849975586, -0.015892982482910156, -0.014748096466064453, -0.01360321044921875, -0.012458324432373047, -0.011313438415527344, -0.01016855239868164, -0.009023666381835938, -0.007878780364990234, -0.006733894348144531, -0.005589008331298828, -0.004444122314453125, -0.003299236297607422, -0.0021543502807617188, -0.0010094642639160156, 0.0001354217529296875, 0.0012803077697753906, 0.0024251937866210938, 0.003570079803466797, 0.0047149658203125, 0.005859851837158203, 0.007004737854003906, 0.00814962387084961, 0.009294509887695312, 0.010439395904541016, 0.011584281921386719, 0.012729167938232422, 0.013874053955078125, 0.015018939971923828, 0.01616382598876953, 0.017308712005615234, 0.018453598022460938, 0.01959848403930664, 0.020743370056152344, 0.021888256072998047, 0.02303314208984375, 0.024178028106689453, 0.025322914123535156, 0.02646780014038086, 0.027612686157226562, 0.028757572174072266, 0.02990245819091797, 0.031047344207763672, 0.032192230224609375, 0.03333711624145508, 0.03448200225830078, 0.035626888275146484, 0.03677177429199219, 0.03791666030883789, 0.039061546325683594, 0.0402064323425293, 0.041351318359375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 2.0, 5.0, 4.0, 8.0, 4.0, 9.0, 11.0, 8.0, 12.0, 19.0, 13.0, 16.0, 15.0, 20.0, 21.0, 20.0, 42.0, 24.0, 32.0, 41.0, 35.0, 24.0, 45.0, 40.0, 36.0, 29.0, 35.0, 33.0, 36.0, 33.0, 32.0, 31.0, 36.0, 19.0, 35.0, 26.0, 24.0, 18.0, 18.0, 9.0, 13.0, 16.0, 13.0, 12.0, 7.0, 3.0, 3.0, 5.0, 4.0, 2.0, 4.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03009033203125, -0.02901458740234375, -0.0279388427734375, -0.02686309814453125, -0.025787353515625, -0.02471160888671875, -0.0236358642578125, -0.02256011962890625, -0.021484375, -0.02040863037109375, -0.0193328857421875, -0.01825714111328125, -0.017181396484375, -0.01610565185546875, -0.0150299072265625, -0.01395416259765625, -0.01287841796875, -0.01180267333984375, -0.0107269287109375, -0.00965118408203125, -0.008575439453125, -0.00749969482421875, -0.0064239501953125, -0.00534820556640625, -0.0042724609375, -0.00319671630859375, -0.0021209716796875, -0.00104522705078125, 3.0517578125e-05, 0.00110626220703125, 0.0021820068359375, 0.00325775146484375, 0.00433349609375, 0.00540924072265625, 0.0064849853515625, 0.00756072998046875, 0.008636474609375, 0.00971221923828125, 0.0107879638671875, 0.01186370849609375, 0.012939453125, 0.01401519775390625, 0.0150909423828125, 0.01616668701171875, 0.017242431640625, 0.01831817626953125, 0.0193939208984375, 0.02046966552734375, 0.02154541015625, 0.02262115478515625, 0.0236968994140625, 0.02477264404296875, 0.025848388671875, 0.02692413330078125, 0.0279998779296875, 0.02907562255859375, 0.0301513671875, 0.03122711181640625, 0.0323028564453125, 0.03337860107421875, 0.034454345703125, 0.03553009033203125, 0.0366058349609375, 0.03768157958984375, 0.03875732421875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 8.0, 3.0, 3.0, 13.0, 12.0, 25.0, 32.0, 58.0, 92.0, 153.0, 337.0, 529.0, 984.0, 2886.0, 7178.0, 41365.0, 685606.0, 269217.0, 29712.0, 5947.0, 2469.0, 862.0, 440.0, 250.0, 118.0, 78.0, 60.0, 39.0, 31.0, 12.0, 16.0, 9.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-1.1861324310302734e-05, -1.1540018022060394e-05, -1.1218711733818054e-05, -1.0897405445575714e-05, -1.0576099157333374e-05, -1.0254792869091034e-05, -9.933486580848694e-06, -9.612180292606354e-06, -9.290874004364014e-06, -8.969567716121674e-06, -8.648261427879333e-06, -8.326955139636993e-06, -8.005648851394653e-06, -7.684342563152313e-06, -7.363036274909973e-06, -7.041729986667633e-06, -6.720423698425293e-06, -6.399117410182953e-06, -6.077811121940613e-06, -5.756504833698273e-06, -5.435198545455933e-06, -5.1138922572135925e-06, -4.7925859689712524e-06, -4.471279680728912e-06, -4.149973392486572e-06, -3.828667104244232e-06, -3.507360816001892e-06, -3.186054527759552e-06, -2.864748239517212e-06, -2.543441951274872e-06, -2.2221356630325317e-06, -1.9008293747901917e-06, -1.5795230865478516e-06, -1.2582167983055115e-06, -9.369105100631714e-07, -6.156042218208313e-07, -2.942979335784912e-07, 2.7008354663848877e-08, 3.4831464290618896e-07, 6.69620931148529e-07, 9.909272193908691e-07, 1.3122335076332092e-06, 1.6335397958755493e-06, 1.9548460841178894e-06, 2.2761523723602295e-06, 2.5974586606025696e-06, 2.9187649488449097e-06, 3.2400712370872498e-06, 3.56137752532959e-06, 3.88268381357193e-06, 4.20399010181427e-06, 4.52529639005661e-06, 4.84660267829895e-06, 5.16790896654129e-06, 5.48921525478363e-06, 5.8105215430259705e-06, 6.1318278312683105e-06, 6.453134119510651e-06, 6.774440407752991e-06, 7.095746695995331e-06, 7.417052984237671e-06, 7.738359272480011e-06, 8.059665560722351e-06, 8.380971848964691e-06, 8.702278137207031e-06]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 6.0, 6.0, 11.0, 19.0, 25.0, 34.0, 57.0, 78.0, 64.0, 128.0, 124.0, 88.0, 113.0, 55.0, 39.0, 39.0, 17.0, 22.0, 8.0, 8.0, 10.0, 9.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.68899917602539e-06, -7.472001016139984e-06, -7.255002856254578e-06, -7.038004696369171e-06, -6.821006536483765e-06, -6.604008376598358e-06, -6.387010216712952e-06, -6.170012056827545e-06, -5.953013896942139e-06, -5.736015737056732e-06, -5.519017577171326e-06, -5.302019417285919e-06, -5.085021257400513e-06, -4.868023097515106e-06, -4.6510249376297e-06, -4.434026777744293e-06, -4.217028617858887e-06, -4.00003045797348e-06, -3.7830322980880737e-06, -3.5660341382026672e-06, -3.3490359783172607e-06, -3.1320378184318542e-06, -2.9150396585464478e-06, -2.6980414986610413e-06, -2.4810433387756348e-06, -2.2640451788902283e-06, -2.0470470190048218e-06, -1.8300488591194153e-06, -1.6130506992340088e-06, -1.3960525393486023e-06, -1.1790543794631958e-06, -9.620562195777893e-07, -7.450580596923828e-07, -5.280598998069763e-07, -3.110617399215698e-07, -9.406358003616333e-08, 1.2293457984924316e-07, 3.3993273973464966e-07, 5.569308996200562e-07, 7.739290595054626e-07, 9.909272193908691e-07, 1.2079253792762756e-06, 1.4249235391616821e-06, 1.6419216990470886e-06, 1.8589198589324951e-06, 2.0759180188179016e-06, 2.292916178703308e-06, 2.5099143385887146e-06, 2.726912498474121e-06, 2.9439106583595276e-06, 3.160908818244934e-06, 3.3779069781303406e-06, 3.594905138015747e-06, 3.8119032979011536e-06, 4.02890145778656e-06, 4.2458996176719666e-06, 4.462897777557373e-06, 4.6798959374427795e-06, 4.896894097328186e-06, 5.1138922572135925e-06, 5.330890417098999e-06, 5.5478885769844055e-06, 5.764886736869812e-06, 5.9818848967552185e-06, 6.198883056640625e-06]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 9.0, 4.0, 8.0, 4.0, 12.0, 11.0, 20.0, 16.0, 32.0, 43.0, 64.0, 99.0, 181.0, 422.0, 1451.0, 977116.0, 67314.0, 905.0, 362.0, 152.0, 100.0, 61.0, 42.0, 32.0, 26.0, 20.0, 10.0, 8.0, 7.0, 5.0, 2.0, 7.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.49879264831543e-05, -3.406405448913574e-05, -3.314018249511719e-05, -3.221631050109863e-05, -3.129243850708008e-05, -3.0368566513061523e-05, -2.944469451904297e-05, -2.8520822525024414e-05, -2.759695053100586e-05, -2.6673078536987305e-05, -2.574920654296875e-05, -2.4825334548950195e-05, -2.390146255493164e-05, -2.2977590560913086e-05, -2.205371856689453e-05, -2.1129846572875977e-05, -2.0205974578857422e-05, -1.9282102584838867e-05, -1.8358230590820312e-05, -1.7434358596801758e-05, -1.6510486602783203e-05, -1.558661460876465e-05, -1.4662742614746094e-05, -1.3738870620727539e-05, -1.2814998626708984e-05, -1.189112663269043e-05, -1.0967254638671875e-05, -1.004338264465332e-05, -9.119510650634766e-06, -8.195638656616211e-06, -7.271766662597656e-06, -6.3478946685791016e-06, -5.424022674560547e-06, -4.500150680541992e-06, -3.5762786865234375e-06, -2.652406692504883e-06, -1.7285346984863281e-06, -8.046627044677734e-07, 1.1920928955078125e-07, 1.043081283569336e-06, 1.9669532775878906e-06, 2.8908252716064453e-06, 3.814697265625e-06, 4.738569259643555e-06, 5.662441253662109e-06, 6.586313247680664e-06, 7.510185241699219e-06, 8.434057235717773e-06, 9.357929229736328e-06, 1.0281801223754883e-05, 1.1205673217773438e-05, 1.2129545211791992e-05, 1.3053417205810547e-05, 1.3977289199829102e-05, 1.4901161193847656e-05, 1.582503318786621e-05, 1.6748905181884766e-05, 1.767277717590332e-05, 1.8596649169921875e-05, 1.952052116394043e-05, 2.0444393157958984e-05, 2.136826515197754e-05, 2.2292137145996094e-05, 2.321600914001465e-05, 2.4139881134033203e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 9.0, 5.0, 8.0, 7.0, 7.0, 12.0, 11.0, 15.0, 17.0, 30.0, 34.0, 34.0, 44.0, 66.0, 96.0, 132.0, 107.0, 76.0, 67.0, 43.0, 46.0, 20.0, 18.0, 19.0, 23.0, 14.0, 9.0, 6.0, 6.0, 5.0, 2.0, 5.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.266334533691406e-05, -3.17990779876709e-05, -3.0934810638427734e-05, -3.007054328918457e-05, -2.9206275939941406e-05, -2.8342008590698242e-05, -2.7477741241455078e-05, -2.6613473892211914e-05, -2.574920654296875e-05, -2.4884939193725586e-05, -2.4020671844482422e-05, -2.3156404495239258e-05, -2.2292137145996094e-05, -2.142786979675293e-05, -2.0563602447509766e-05, -1.96993350982666e-05, -1.8835067749023438e-05, -1.7970800399780273e-05, -1.710653305053711e-05, -1.6242265701293945e-05, -1.537799835205078e-05, -1.4513731002807617e-05, -1.3649463653564453e-05, -1.2785196304321289e-05, -1.1920928955078125e-05, -1.1056661605834961e-05, -1.0192394256591797e-05, -9.328126907348633e-06, -8.463859558105469e-06, -7.599592208862305e-06, -6.735324859619141e-06, -5.8710575103759766e-06, -5.0067901611328125e-06, -4.1425228118896484e-06, -3.2782554626464844e-06, -2.4139881134033203e-06, -1.5497207641601562e-06, -6.854534149169922e-07, 1.7881393432617188e-07, 1.043081283569336e-06, 1.9073486328125e-06, 2.771615982055664e-06, 3.635883331298828e-06, 4.500150680541992e-06, 5.364418029785156e-06, 6.22868537902832e-06, 7.092952728271484e-06, 7.957220077514648e-06, 8.821487426757812e-06, 9.685754776000977e-06, 1.055002212524414e-05, 1.1414289474487305e-05, 1.2278556823730469e-05, 1.3142824172973633e-05, 1.4007091522216797e-05, 1.4871358871459961e-05, 1.5735626220703125e-05, 1.659989356994629e-05, 1.7464160919189453e-05, 1.8328428268432617e-05, 1.919269561767578e-05, 2.0056962966918945e-05, 2.092123031616211e-05, 2.1785497665405273e-05, 2.2649765014648438e-05]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 27.0, 871.0, 115.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5965543985366821, -0.5840434432029724, -0.5715325474739075, -0.5590215921401978, -0.546510636806488, -0.5339996814727783, -0.5214887857437134, -0.5089778304100037, -0.49646687507629395, -0.4839559495449066, -0.4714449942111969, -0.45893406867980957, -0.44642311334609985, -0.4339121878147125, -0.4214012324810028, -0.4088903069496155, -0.39637935161590576, -0.38386842608451843, -0.3713574707508087, -0.3588465452194214, -0.34633558988571167, -0.33382466435432434, -0.3213137090206146, -0.3088027834892273, -0.29629185795783997, -0.28378093242645264, -0.2712699770927429, -0.2587590515613556, -0.24624809622764587, -0.23373717069625854, -0.22122621536254883, -0.2087152898311615, -0.19620433449745178, -0.18369339406490326, -0.17118245363235474, -0.1586715131998062, -0.1461605727672577, -0.13364964723587036, -0.12113869935274124, -0.10862775892019272, -0.0961168184876442, -0.08360587805509567, -0.07109493762254715, -0.058584000915288925, -0.0460730604827404, -0.03356212377548218, -0.021051183342933655, -0.008540242910385132, 0.003970697522163391, 0.016481637954711914, 0.028992576524615288, 0.04150351509451866, 0.054014455527067184, 0.06652539223432541, 0.07903633266687393, 0.09154727309942245, 0.10405821353197098, 0.1165691539645195, 0.12908008694648743, 0.14159102737903595, 0.15410196781158447, 0.166612908244133, 0.17912384867668152, 0.19163478910923004, 0.20414572954177856]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 7.0, 3.0, 3.0, 10.0, 8.0, 12.0, 11.0, 13.0, 22.0, 25.0, 33.0, 35.0, 45.0, 33.0, 45.0, 49.0, 47.0, 68.0, 69.0, 55.0, 46.0, 53.0, 39.0, 38.0, 30.0, 27.0, 23.0, 35.0, 23.0, 18.0, 14.0, 19.0, 12.0, 11.0, 4.0, 2.0, 4.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.25194251537323, -0.2448427826166153, -0.2377430647611618, -0.23064333200454712, -0.22354361414909363, -0.21644388139247894, -0.20934414863586426, -0.20224443078041077, -0.19514471292495728, -0.1880449801683426, -0.1809452623128891, -0.17384552955627441, -0.16674581170082092, -0.15964607894420624, -0.15254634618759155, -0.14544662833213806, -0.13834689557552338, -0.1312471628189087, -0.1241474449634552, -0.11704771220684052, -0.10994799435138702, -0.10284826159477234, -0.09574853628873825, -0.08864881098270416, -0.08154908567667007, -0.07444936037063599, -0.0673496350646019, -0.06024990603327751, -0.05315018072724342, -0.046050455421209335, -0.03895072638988495, -0.03185100108385086, -0.024751275777816772, -0.017651550471782684, -0.010551823303103447, -0.0034520961344242096, 0.0036476291716098785, 0.010747354477643967, 0.017847083508968353, 0.02494680881500244, 0.03204653412103653, 0.03914625942707062, 0.046245984733104706, 0.05334571376442909, 0.06044543907046318, 0.06754516065120697, 0.07464489340782166, 0.08174461871385574, 0.08884434401988983, 0.09594406932592392, 0.10304379463195801, 0.11014352738857269, 0.11724324524402618, 0.12434297800064087, 0.13144269585609436, 0.13854242861270905, 0.14564216136932373, 0.15274189412593842, 0.1598416119813919, 0.1669413447380066, 0.17404106259346008, 0.18114079535007477, 0.18824052810668945, 0.19534024596214294, 0.20243996381759644]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 4.0, 6.0, 10.0, 12.0, 4.0, 8.0, 10.0, 24.0, 53.0, 264.0, 4193670.0, 100.0, 14.0, 19.0, 16.0, 14.0, 8.0, 3.0, 2.0, 3.0, 5.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0033054351806640625, -0.003203153610229492, -0.003100872039794922, -0.0029985904693603516, -0.0028963088989257812, -0.002794027328491211, -0.0026917457580566406, -0.0025894641876220703, -0.0024871826171875, -0.0023849010467529297, -0.0022826194763183594, -0.002180337905883789, -0.0020780563354492188, -0.0019757747650146484, -0.0018734931945800781, -0.0017712116241455078, -0.0016689300537109375, -0.0015666484832763672, -0.0014643669128417969, -0.0013620853424072266, -0.0012598037719726562, -0.001157522201538086, -0.0010552406311035156, -0.0009529590606689453, -0.000850677490234375, -0.0007483959197998047, -0.0006461143493652344, -0.0005438327789306641, -0.00044155120849609375, -0.00033926963806152344, -0.00023698806762695312, -0.0001347064971923828, -3.24249267578125e-05, 6.985664367675781e-05, 0.00017213821411132812, 0.00027441978454589844, 0.00037670135498046875, 0.00047898292541503906, 0.0005812644958496094, 0.0006835460662841797, 0.00078582763671875, 0.0008881092071533203, 0.0009903907775878906, 0.001092672348022461, 0.0011949539184570312, 0.0012972354888916016, 0.0013995170593261719, 0.0015017986297607422, 0.0016040802001953125, 0.0017063617706298828, 0.0018086433410644531, 0.0019109249114990234, 0.0020132064819335938, 0.002115488052368164, 0.0022177696228027344, 0.0023200511932373047, 0.002422332763671875, 0.0025246143341064453, 0.0026268959045410156, 0.002729177474975586, 0.0028314590454101562, 0.0029337406158447266, 0.003036022186279297, 0.003138303756713867, 0.0032405853271484375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 4.0, 9.0, 15.0, 15.0, 17.0, 18.0, 116.0, 419.0, 225.0, 46.0, 22.0, 9.0, 8.0, 5.0, 12.0, 10.0, 6.0, 3.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0193634033203125, -0.01875019073486328, -0.018136978149414062, -0.017523765563964844, -0.016910552978515625, -0.016297340393066406, -0.015684127807617188, -0.015070915222167969, -0.01445770263671875, -0.013844490051269531, -0.013231277465820312, -0.012618064880371094, -0.012004852294921875, -0.011391639709472656, -0.010778427124023438, -0.010165214538574219, -0.009552001953125, -0.008938789367675781, -0.008325576782226562, -0.007712364196777344, -0.007099151611328125, -0.006485939025878906, -0.0058727264404296875, -0.005259513854980469, -0.00464630126953125, -0.004033088684082031, -0.0034198760986328125, -0.0028066635131835938, -0.002193450927734375, -0.0015802383422851562, -0.0009670257568359375, -0.00035381317138671875, 0.0002593994140625, 0.0008726119995117188, 0.0014858245849609375, 0.0020990371704101562, 0.002712249755859375, 0.0033254623413085938, 0.0039386749267578125, 0.004551887512207031, 0.00516510009765625, 0.005778312683105469, 0.0063915252685546875, 0.007004737854003906, 0.007617950439453125, 0.008231163024902344, 0.008844375610351562, 0.009457588195800781, 0.01007080078125, 0.010684013366699219, 0.011297225952148438, 0.011910438537597656, 0.012523651123046875, 0.013136863708496094, 0.013750076293945312, 0.014363288879394531, 0.01497650146484375, 0.015589714050292969, 0.016202926635742188, 0.016816139221191406, 0.017429351806640625, 0.018042564392089844, 0.018655776977539062, 0.01926898956298828, 0.0198822021484375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 8.0, 7.0, 33.0, 60.0, 99.0, 157.0, 282.0, 420.0, 4192347.0, 349.0, 231.0, 107.0, 93.0, 51.0, 24.0, 5.0, 12.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003685951232910156, -0.0003584921360015869, -0.0003483891487121582, -0.0003382861614227295, -0.0003281831741333008, -0.00031808018684387207, -0.00030797719955444336, -0.00029787421226501465, -0.00028777122497558594, -0.0002776682376861572, -0.0002675652503967285, -0.0002574622631072998, -0.0002473592758178711, -0.00023725628852844238, -0.00022715330123901367, -0.00021705031394958496, -0.00020694732666015625, -0.00019684433937072754, -0.00018674135208129883, -0.00017663836479187012, -0.0001665353775024414, -0.0001564323902130127, -0.00014632940292358398, -0.00013622641563415527, -0.00012612342834472656, -0.00011602044105529785, -0.00010591745376586914, -9.581446647644043e-05, -8.571147918701172e-05, -7.560849189758301e-05, -6.55055046081543e-05, -5.5402517318725586e-05, -4.5299530029296875e-05, -3.5196542739868164e-05, -2.5093555450439453e-05, -1.4990568161010742e-05, -4.887580871582031e-06, 5.21540641784668e-06, 1.531839370727539e-05, 2.54213809967041e-05, 3.552436828613281e-05, 4.5627355575561523e-05, 5.5730342864990234e-05, 6.583333015441895e-05, 7.593631744384766e-05, 8.603930473327637e-05, 9.614229202270508e-05, 0.00010624527931213379, 0.0001163482666015625, 0.0001264512538909912, 0.00013655424118041992, 0.00014665722846984863, 0.00015676021575927734, 0.00016686320304870605, 0.00017696619033813477, 0.00018706917762756348, 0.0001971721649169922, 0.0002072751522064209, 0.0002173781394958496, 0.00022748112678527832, 0.00023758411407470703, 0.00024768710136413574, 0.00025779008865356445, 0.00026789307594299316, 0.0002779960632324219]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4088.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.834766387939453e-06, -7.948838174343109e-06, -6.062909960746765e-06, -4.176981747150421e-06, -2.291053533554077e-06, -4.0512531995773315e-07, 1.4808028936386108e-06, 3.366731107234955e-06, 5.252659320831299e-06, 7.138587534427643e-06, 9.024515748023987e-06, 1.091044396162033e-05, 1.2796372175216675e-05, 1.4682300388813019e-05, 1.6568228602409363e-05, 1.8454156816005707e-05, 2.034008502960205e-05, 2.2226013243198395e-05, 2.411194145679474e-05, 2.5997869670391083e-05, 2.7883797883987427e-05, 2.976972609758377e-05, 3.1655654311180115e-05, 3.354158252477646e-05, 3.54275107383728e-05, 3.731343895196915e-05, 3.919936716556549e-05, 4.1085295379161835e-05, 4.297122359275818e-05, 4.485715180635452e-05, 4.674308001995087e-05, 4.862900823354721e-05, 5.0514936447143555e-05, 5.24008646607399e-05, 5.428679287433624e-05, 5.617272108793259e-05, 5.805864930152893e-05, 5.9944577515125275e-05, 6.183050572872162e-05, 6.371643394231796e-05, 6.56023621559143e-05, 6.748829036951065e-05, 6.9374218583107e-05, 7.126014679670334e-05, 7.314607501029968e-05, 7.503200322389603e-05, 7.691793143749237e-05, 7.880385965108871e-05, 8.068978786468506e-05, 8.25757160782814e-05, 8.446164429187775e-05, 8.634757250547409e-05, 8.823350071907043e-05, 9.011942893266678e-05, 9.200535714626312e-05, 9.389128535985947e-05, 9.577721357345581e-05, 9.766314178705215e-05, 9.95490700006485e-05, 0.00010143499821424484, 0.00010332092642784119, 0.00010520685464143753, 0.00010709278285503387, 0.00010897871106863022, 0.00011086463928222656]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 30.0, 977.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00040220562368631363, -0.0003933222615160048, -0.00038443889934569597, -0.0003755555080715567, -0.00036667214590124786, -0.00035778878373093903, -0.0003489054215606302, -0.0003400220593903214, -0.0003311386681161821, -0.00032225530594587326, -0.00031337194377556443, -0.00030448855250142515, -0.0002956051903311163, -0.0002867218281608075, -0.00027783846599049866, -0.00026895510382018983, -0.000260071741649881, -0.0002511883794795722, -0.00024230500275734812, -0.0002334216405870393, -0.00022453826386481524, -0.0002156549016945064, -0.00020677153952419758, -0.00019788817735388875, -0.0001890048006316647, -0.00018012143846135587, -0.0001712380617391318, -0.00016235469956882298, -0.00015347133739851415, -0.0001445879606762901, -0.00013570459850598127, -0.0001268212217837572, -0.00011793785961344838, -0.00010905449016718194, -0.0001001711207209155, -9.128775855060667e-05, -8.240438910434023e-05, -7.352101965807378e-05, -6.463765748776495e-05, -5.575428804149851e-05, -4.687091859523207e-05, -3.798754914896563e-05, -2.910418334067799e-05, -2.0220815713400953e-05, -1.1337448086123914e-05, -2.454078639857471e-06, 6.4292871684301645e-06, 1.53126529767178e-05, 2.4196022422984242e-05, 3.3079391869250685e-05, 4.196275767753832e-05, 5.0846123485825956e-05, 5.97294929320924e-05, 6.861286237835884e-05, 7.749622454866767e-05, 8.637959399493411e-05, 9.526296344120055e-05, 0.000104146332887467, 0.00011302970233373344, 0.00012191306450404227, 0.0001307964266743511, 0.00013967980339657515, 0.00014856316556688398, 0.00015744654228910804, 0.00016632990445941687]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 13.0, 14.0, 59.0, 111.0, 134.0, 160.0, 175.0, 137.0, 95.0, 41.0, 25.0, 15.0, 8.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010627508163452148, -0.00010160170495510101, -9.692832827568054e-05, -9.225495159626007e-05, -8.75815749168396e-05, -8.290819823741913e-05, -7.823482155799866e-05, -7.356144487857819e-05, -6.888806819915771e-05, -6.421469151973724e-05, -5.954131484031677e-05, -5.48679381608963e-05, -5.019456148147583e-05, -4.552118480205536e-05, -4.084780812263489e-05, -3.6174431443214417e-05, -3.1501054763793945e-05, -2.6827678084373474e-05, -2.2154301404953003e-05, -1.7480924725532532e-05, -1.280754804611206e-05, -8.13417136669159e-06, -3.460794687271118e-06, 1.212581992149353e-06, 5.885958671569824e-06, 1.0559335350990295e-05, 1.5232712030410767e-05, 1.9906088709831238e-05, 2.457946538925171e-05, 2.925284206867218e-05, 3.392621874809265e-05, 3.859959542751312e-05, 4.3272972106933594e-05, 4.7946348786354065e-05, 5.2619725465774536e-05, 5.729310214519501e-05, 6.196647882461548e-05, 6.663985550403595e-05, 7.131323218345642e-05, 7.598660886287689e-05, 8.065998554229736e-05, 8.533336222171783e-05, 9.00067389011383e-05, 9.468011558055878e-05, 9.935349225997925e-05, 0.00010402686893939972, 0.00010870024561882019, 0.00011337362229824066, 0.00011804699897766113, 0.0001227203756570816, 0.00012739375233650208, 0.00013206712901592255, 0.00013674050569534302, 0.0001414138823747635, 0.00014608725905418396, 0.00015076063573360443, 0.0001554340124130249, 0.00016010738909244537, 0.00016478076577186584, 0.00016945414245128632, 0.0001741275191307068, 0.00017880089581012726, 0.00018347427248954773, 0.0001881476491689682, 0.00019282102584838867]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 0.0, 0.0, 4.0, 7.0, 3.0, 0.0, 2.0, 6.0, 7.0, 5.0, 15.0, 12.0, 24.0, 24.0, 27.0, 59.0, 56.0, 79.0, 94.0, 143.0, 186.0, 312.0, 474.0, 699.0, 1198.0, 2262.0, 4935.0, 14597.0, 613614.0, 384787.0, 14249.0, 4947.0, 2429.0, 1228.0, 651.0, 389.0, 297.0, 181.0, 134.0, 81.0, 66.0, 54.0, 56.0, 30.0, 40.0, 25.0, 14.0, 12.0, 8.0, 5.0, 11.0, 2.0, 5.0, 8.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.0285797119140625, -0.027686357498168945, -0.02679300308227539, -0.025899648666381836, -0.02500629425048828, -0.024112939834594727, -0.023219585418701172, -0.022326231002807617, -0.021432876586914062, -0.020539522171020508, -0.019646167755126953, -0.0187528133392334, -0.017859458923339844, -0.01696610450744629, -0.016072750091552734, -0.01517939567565918, -0.014286041259765625, -0.01339268684387207, -0.012499332427978516, -0.011605978012084961, -0.010712623596191406, -0.009819269180297852, -0.008925914764404297, -0.008032560348510742, -0.0071392059326171875, -0.006245851516723633, -0.005352497100830078, -0.0044591426849365234, -0.0035657882690429688, -0.002672433853149414, -0.0017790794372558594, -0.0008857250213623047, 7.62939453125e-06, 0.0009009838104248047, 0.0017943382263183594, 0.002687692642211914, 0.0035810470581054688, 0.0044744014739990234, 0.005367755889892578, 0.006261110305786133, 0.0071544647216796875, 0.008047819137573242, 0.008941173553466797, 0.009834527969360352, 0.010727882385253906, 0.011621236801147461, 0.012514591217041016, 0.01340794563293457, 0.014301300048828125, 0.01519465446472168, 0.016088008880615234, 0.01698136329650879, 0.017874717712402344, 0.0187680721282959, 0.019661426544189453, 0.020554780960083008, 0.021448135375976562, 0.022341489791870117, 0.023234844207763672, 0.024128198623657227, 0.02502155303955078, 0.025914907455444336, 0.02680826187133789, 0.027701616287231445, 0.028594970703125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 4.0, 9.0, 15.0, 15.0, 17.0, 18.0, 116.0, 419.0, 225.0, 46.0, 22.0, 9.0, 8.0, 5.0, 12.0, 10.0, 6.0, 3.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0193634033203125, -0.01875019073486328, -0.018136978149414062, -0.017523765563964844, -0.016910552978515625, -0.016297340393066406, -0.015684127807617188, -0.015070915222167969, -0.01445770263671875, -0.013844490051269531, -0.013231277465820312, -0.012618064880371094, -0.012004852294921875, -0.011391639709472656, -0.010778427124023438, -0.010165214538574219, -0.009552001953125, -0.008938789367675781, -0.008325576782226562, -0.007712364196777344, -0.007099151611328125, -0.006485939025878906, -0.0058727264404296875, -0.005259513854980469, -0.00464630126953125, -0.004033088684082031, -0.0034198760986328125, -0.0028066635131835938, -0.002193450927734375, -0.0015802383422851562, -0.0009670257568359375, -0.00035381317138671875, 0.0002593994140625, 0.0008726119995117188, 0.0014858245849609375, 0.0020990371704101562, 0.002712249755859375, 0.0033254623413085938, 0.0039386749267578125, 0.004551887512207031, 0.00516510009765625, 0.005778312683105469, 0.0063915252685546875, 0.007004737854003906, 0.007617950439453125, 0.008231163024902344, 0.008844375610351562, 0.009457588195800781, 0.01007080078125, 0.010684013366699219, 0.011297225952148438, 0.011910438537597656, 0.012523651123046875, 0.013136863708496094, 0.013750076293945312, 0.014363288879394531, 0.01497650146484375, 0.015589714050292969, 0.016202926635742188, 0.016816139221191406, 0.017429351806640625, 0.018042564392089844, 0.018655776977539062, 0.01926898956298828, 0.0198822021484375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 5.0, 8.0, 10.0, 7.0, 12.0, 13.0, 11.0, 16.0, 19.0, 20.0, 27.0, 38.0, 45.0, 57.0, 98.0, 189.0, 405.0, 837.0, 2175.0, 123505.0, 916249.0, 2768.0, 943.0, 413.0, 190.0, 123.0, 80.0, 52.0, 43.0, 28.0, 30.0, 32.0, 15.0, 17.0, 13.0, 12.0, 10.0, 4.0, 13.0, 2.0, 3.0, 6.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04583740234375, -0.04436302185058594, -0.042888641357421875, -0.04141426086425781, -0.03993988037109375, -0.03846549987792969, -0.036991119384765625, -0.03551673889160156, -0.0340423583984375, -0.03256797790527344, -0.031093597412109375, -0.029619216918945312, -0.02814483642578125, -0.026670455932617188, -0.025196075439453125, -0.023721694946289062, -0.022247314453125, -0.020772933959960938, -0.019298553466796875, -0.017824172973632812, -0.01634979248046875, -0.014875411987304688, -0.013401031494140625, -0.011926651000976562, -0.0104522705078125, -0.008977890014648438, -0.007503509521484375, -0.0060291290283203125, -0.00455474853515625, -0.0030803680419921875, -0.001605987548828125, -0.0001316070556640625, 0.0013427734375, 0.0028171539306640625, 0.004291534423828125, 0.0057659149169921875, 0.00724029541015625, 0.008714675903320312, 0.010189056396484375, 0.011663436889648438, 0.0131378173828125, 0.014612197875976562, 0.016086578369140625, 0.017560958862304688, 0.01903533935546875, 0.020509719848632812, 0.021984100341796875, 0.023458480834960938, 0.024932861328125, 0.026407241821289062, 0.027881622314453125, 0.029356002807617188, 0.03083038330078125, 0.03230476379394531, 0.033779144287109375, 0.03525352478027344, 0.0367279052734375, 0.03820228576660156, 0.039676666259765625, 0.04115104675292969, 0.04262542724609375, 0.04409980773925781, 0.045574188232421875, 0.04704856872558594, 0.04852294921875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 8.0, 4.0, 8.0, 7.0, 11.0, 10.0, 15.0, 11.0, 16.0, 17.0, 19.0, 28.0, 31.0, 34.0, 30.0, 27.0, 42.0, 36.0, 38.0, 44.0, 46.0, 47.0, 51.0, 40.0, 36.0, 24.0, 34.0, 38.0, 34.0, 34.0, 25.0, 27.0, 29.0, 18.0, 17.0, 12.0, 12.0, 10.0, 5.0, 10.0, 5.0, 3.0, 6.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036407470703125, -0.035237789154052734, -0.03406810760498047, -0.0328984260559082, -0.03172874450683594, -0.030559062957763672, -0.029389381408691406, -0.02821969985961914, -0.027050018310546875, -0.02588033676147461, -0.024710655212402344, -0.023540973663330078, -0.022371292114257812, -0.021201610565185547, -0.02003192901611328, -0.018862247467041016, -0.01769256591796875, -0.016522884368896484, -0.015353202819824219, -0.014183521270751953, -0.013013839721679688, -0.011844158172607422, -0.010674476623535156, -0.00950479507446289, -0.008335113525390625, -0.007165431976318359, -0.005995750427246094, -0.004826068878173828, -0.0036563873291015625, -0.002486705780029297, -0.0013170242309570312, -0.00014734268188476562, 0.0010223388671875, 0.0021920204162597656, 0.0033617019653320312, 0.004531383514404297, 0.0057010650634765625, 0.006870746612548828, 0.008040428161621094, 0.00921010971069336, 0.010379791259765625, 0.01154947280883789, 0.012719154357910156, 0.013888835906982422, 0.015058517456054688, 0.016228199005126953, 0.01739788055419922, 0.018567562103271484, 0.01973724365234375, 0.020906925201416016, 0.02207660675048828, 0.023246288299560547, 0.024415969848632812, 0.025585651397705078, 0.026755332946777344, 0.02792501449584961, 0.029094696044921875, 0.03026437759399414, 0.031434059143066406, 0.03260374069213867, 0.03377342224121094, 0.0349431037902832, 0.03611278533935547, 0.037282466888427734, 0.0384521484375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 6.0, 0.0, 9.0, 5.0, 10.0, 9.0, 12.0, 22.0, 24.0, 34.0, 61.0, 87.0, 124.0, 203.0, 345.0, 645.0, 1607.0, 3932.0, 11807.0, 59239.0, 828121.0, 115763.0, 17397.0, 5036.0, 1948.0, 926.0, 434.0, 265.0, 178.0, 93.0, 50.0, 48.0, 43.0, 29.0, 16.0, 10.0, 6.0, 5.0, 2.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0], "bins": [-1.5437602996826172e-05, -1.5016645193099976e-05, -1.459568738937378e-05, -1.4174729585647583e-05, -1.3753771781921387e-05, -1.333281397819519e-05, -1.2911856174468994e-05, -1.2490898370742798e-05, -1.2069940567016602e-05, -1.1648982763290405e-05, -1.1228024959564209e-05, -1.0807067155838013e-05, -1.0386109352111816e-05, -9.96515154838562e-06, -9.544193744659424e-06, -9.123235940933228e-06, -8.702278137207031e-06, -8.281320333480835e-06, -7.860362529754639e-06, -7.439404726028442e-06, -7.018446922302246e-06, -6.59748911857605e-06, -6.1765313148498535e-06, -5.755573511123657e-06, -5.334615707397461e-06, -4.913657903671265e-06, -4.492700099945068e-06, -4.071742296218872e-06, -3.6507844924926758e-06, -3.2298266887664795e-06, -2.808868885040283e-06, -2.387911081314087e-06, -1.9669532775878906e-06, -1.5459954738616943e-06, -1.125037670135498e-06, -7.040798664093018e-07, -2.8312206268310547e-07, 1.3783574104309082e-07, 5.587935447692871e-07, 9.797513484954834e-07, 1.4007091522216797e-06, 1.821666955947876e-06, 2.2426247596740723e-06, 2.6635825634002686e-06, 3.084540367126465e-06, 3.505498170852661e-06, 3.926455974578857e-06, 4.347413778305054e-06, 4.76837158203125e-06, 5.189329385757446e-06, 5.610287189483643e-06, 6.031244993209839e-06, 6.452202796936035e-06, 6.8731606006622314e-06, 7.294118404388428e-06, 7.715076208114624e-06, 8.13603401184082e-06, 8.556991815567017e-06, 8.977949619293213e-06, 9.39890742301941e-06, 9.819865226745605e-06, 1.0240823030471802e-05, 1.0661780834197998e-05, 1.1082738637924194e-05, 1.150369644165039e-05]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 8.0, 7.0, 10.0, 16.0, 17.0, 17.0, 16.0, 36.0, 38.0, 52.0, 75.0, 84.0, 82.0, 93.0, 65.0, 106.0, 74.0, 53.0, 36.0, 26.0, 24.0, 14.0, 6.0, 6.0, 11.0, 9.0, 6.0, 7.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.794929504394531e-06, -6.61797821521759e-06, -6.441026926040649e-06, -6.2640756368637085e-06, -6.087124347686768e-06, -5.910173058509827e-06, -5.733221769332886e-06, -5.556270480155945e-06, -5.379319190979004e-06, -5.202367901802063e-06, -5.025416612625122e-06, -4.848465323448181e-06, -4.67151403427124e-06, -4.494562745094299e-06, -4.317611455917358e-06, -4.1406601667404175e-06, -3.9637088775634766e-06, -3.7867575883865356e-06, -3.6098062992095947e-06, -3.432855010032654e-06, -3.255903720855713e-06, -3.078952431678772e-06, -2.902001142501831e-06, -2.72504985332489e-06, -2.5480985641479492e-06, -2.3711472749710083e-06, -2.1941959857940674e-06, -2.0172446966171265e-06, -1.8402934074401855e-06, -1.6633421182632446e-06, -1.4863908290863037e-06, -1.3094395399093628e-06, -1.1324882507324219e-06, -9.55536961555481e-07, -7.7858567237854e-07, -6.016343832015991e-07, -4.246830940246582e-07, -2.477318048477173e-07, -7.078051567077637e-08, 1.0617077350616455e-07, 2.8312206268310547e-07, 4.600733518600464e-07, 6.370246410369873e-07, 8.139759302139282e-07, 9.909272193908691e-07, 1.16787850856781e-06, 1.344829797744751e-06, 1.521781086921692e-06, 1.6987323760986328e-06, 1.8756836652755737e-06, 2.0526349544525146e-06, 2.2295862436294556e-06, 2.4065375328063965e-06, 2.5834888219833374e-06, 2.7604401111602783e-06, 2.9373914003372192e-06, 3.11434268951416e-06, 3.291293978691101e-06, 3.468245267868042e-06, 3.645196557044983e-06, 3.822147846221924e-06, 3.999099135398865e-06, 4.176050424575806e-06, 4.353001713752747e-06, 4.5299530029296875e-06]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 4.0, 2.0, 2.0, 7.0, 8.0, 9.0, 14.0, 25.0, 37.0, 51.0, 78.0, 180.0, 603.0, 3417.0, 1040397.0, 2800.0, 491.0, 168.0, 86.0, 54.0, 36.0, 30.0, 24.0, 15.0, 10.0, 6.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.994340896606445e-05, -8.766446262598038e-05, -8.53855162858963e-05, -8.310656994581223e-05, -8.082762360572815e-05, -7.854867726564407e-05, -7.626973092556e-05, -7.399078458547592e-05, -7.171183824539185e-05, -6.943289190530777e-05, -6.71539455652237e-05, -6.487499922513962e-05, -6.259605288505554e-05, -6.0317106544971466e-05, -5.803816020488739e-05, -5.5759213864803314e-05, -5.348026752471924e-05, -5.120132118463516e-05, -4.8922374844551086e-05, -4.664342850446701e-05, -4.4364482164382935e-05, -4.208553582429886e-05, -3.980658948421478e-05, -3.752764314413071e-05, -3.524869680404663e-05, -3.2969750463962555e-05, -3.069080412387848e-05, -2.8411857783794403e-05, -2.6132911443710327e-05, -2.385396510362625e-05, -2.1575018763542175e-05, -1.92960724234581e-05, -1.7017126083374023e-05, -1.4738179743289948e-05, -1.2459233403205872e-05, -1.0180287063121796e-05, -7.90134072303772e-06, -5.622394382953644e-06, -3.343448042869568e-06, -1.064501702785492e-06, 1.214444637298584e-06, 3.49339097738266e-06, 5.772337317466736e-06, 8.051283657550812e-06, 1.0330229997634888e-05, 1.2609176337718964e-05, 1.488812267780304e-05, 1.7167069017887115e-05, 1.944601535797119e-05, 2.1724961698055267e-05, 2.4003908038139343e-05, 2.628285437822342e-05, 2.8561800718307495e-05, 3.084074705839157e-05, 3.311969339847565e-05, 3.539863973855972e-05, 3.76775860786438e-05, 3.9956532418727875e-05, 4.223547875881195e-05, 4.4514425098896027e-05, 4.67933714389801e-05, 4.907231777906418e-05, 5.1351264119148254e-05, 5.363021045923233e-05, 5.5909156799316406e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 0.0, 7.0, 4.0, 14.0, 8.0, 23.0, 30.0, 36.0, 48.0, 50.0, 75.0, 85.0, 161.0, 116.0, 61.0, 68.0, 49.0, 51.0, 29.0, 30.0, 19.0, 17.0, 10.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.265806198120117e-05, -7.082521915435791e-05, -6.899237632751465e-05, -6.715953350067139e-05, -6.532669067382812e-05, -6.349384784698486e-05, -6.16610050201416e-05, -5.982816219329834e-05, -5.799531936645508e-05, -5.6162476539611816e-05, -5.4329633712768555e-05, -5.249679088592529e-05, -5.066394805908203e-05, -4.883110523223877e-05, -4.699826240539551e-05, -4.5165419578552246e-05, -4.3332576751708984e-05, -4.149973392486572e-05, -3.966689109802246e-05, -3.78340482711792e-05, -3.600120544433594e-05, -3.4168362617492676e-05, -3.2335519790649414e-05, -3.0502676963806152e-05, -2.866983413696289e-05, -2.683699131011963e-05, -2.5004148483276367e-05, -2.3171305656433105e-05, -2.1338462829589844e-05, -1.9505620002746582e-05, -1.767277717590332e-05, -1.583993434906006e-05, -1.4007091522216797e-05, -1.2174248695373535e-05, -1.0341405868530273e-05, -8.508563041687012e-06, -6.67572021484375e-06, -4.842877388000488e-06, -3.0100345611572266e-06, -1.1771917343139648e-06, 6.556510925292969e-07, 2.4884939193725586e-06, 4.32133674621582e-06, 6.154179573059082e-06, 7.987022399902344e-06, 9.819865226745605e-06, 1.1652708053588867e-05, 1.3485550880432129e-05, 1.531839370727539e-05, 1.7151236534118652e-05, 1.8984079360961914e-05, 2.0816922187805176e-05, 2.2649765014648438e-05, 2.44826078414917e-05, 2.631545066833496e-05, 2.8148293495178223e-05, 2.9981136322021484e-05, 3.1813979148864746e-05, 3.364682197570801e-05, 3.547966480255127e-05, 3.731250762939453e-05, 3.914535045623779e-05, 4.0978193283081055e-05, 4.2811036109924316e-05, 4.464387893676758e-05]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 731.0, 274.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13766838610172272, -0.12499868124723434, -0.11232897639274597, -0.0996592789888382, -0.08698957413434982, -0.07431986927986145, -0.061650171875953674, -0.0489804670214653, -0.03631076216697693, -0.023641059175133705, -0.010971356183290482, 0.0016983449459075928, 0.014368049800395966, 0.02703775465488434, 0.039707452058792114, 0.05237715691328049, 0.06504686176776886, 0.07771656662225723, 0.0903862714767456, 0.10305596888065338, 0.11572567373514175, 0.12839537858963013, 0.1410650759935379, 0.15373477339744568, 0.16640448570251465, 0.17907418310642242, 0.1917438954114914, 0.20441359281539917, 0.21708330512046814, 0.22975300252437592, 0.2424226999282837, 0.25509241223335266, 0.26776212453842163, 0.2804318368434906, 0.2931015193462372, 0.30577123165130615, 0.3184409439563751, 0.3311106562614441, 0.3437803387641907, 0.35645005106925964, 0.3691197633743286, 0.3817894756793976, 0.39445915818214417, 0.40712887048721313, 0.4197985827922821, 0.4324682950973511, 0.44513797760009766, 0.4578076899051666, 0.4704773724079132, 0.4831470847129822, 0.49581676721572876, 0.5084865093231201, 0.5211561918258667, 0.5338258743286133, 0.5464955568313599, 0.5591652989387512, 0.5718349814414978, 0.5845046639442444, 0.5971744060516357, 0.6098440885543823, 0.6225137710571289, 0.6351835131645203, 0.6478531956672668, 0.6605228781700134, 0.6731926202774048]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 5.0, 4.0, 3.0, 8.0, 11.0, 11.0, 10.0, 22.0, 17.0, 19.0, 31.0, 29.0, 37.0, 45.0, 36.0, 50.0, 44.0, 48.0, 52.0, 48.0, 57.0, 62.0, 44.0, 28.0, 48.0, 38.0, 22.0, 42.0, 18.0, 20.0, 25.0, 12.0, 10.0, 7.0, 11.0, 3.0, 7.0, 3.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2037792205810547, -0.1968652904033661, -0.1899513602256775, -0.1830374300479889, -0.1761235147714615, -0.1692095845937729, -0.1622956544160843, -0.1553817242383957, -0.1484678089618683, -0.1415538787841797, -0.1346399486064911, -0.1277260184288025, -0.12081210315227509, -0.11389817297458649, -0.10698424279689789, -0.10007031261920929, -0.09315638244152069, -0.08624245226383209, -0.07932852953672409, -0.07241459935903549, -0.06550067663192749, -0.05858674645423889, -0.05167281627655029, -0.04475888982415199, -0.03784496337175369, -0.030931036919355392, -0.024017108604311943, -0.017103180289268494, -0.010189253836870193, -0.0032753273844718933, 0.0036386027932167053, 0.010552529245615005, 0.017466455698013306, 0.024380382150411606, 0.031294308602809906, 0.038208238780498505, 0.045122165232896805, 0.052036091685295105, 0.058950021862983704, 0.0658639520406723, 0.0727778747677803, 0.0796918049454689, 0.0866057276725769, 0.0935196578502655, 0.1004335880279541, 0.1073475107550621, 0.1142614409327507, 0.1211753636598587, 0.1280892938375473, 0.1350032240152359, 0.1419171541929245, 0.1488310694694519, 0.1557449996471405, 0.1626589298248291, 0.1695728600025177, 0.1764867901802063, 0.1834007203578949, 0.1903146505355835, 0.1972285807132721, 0.2041425108909607, 0.2110564261674881, 0.2179703563451767, 0.2248842865228653, 0.2317982167005539, 0.2387121319770813]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 8.0, 0.0, 9.0, 11.0, 7.0, 7.0, 9.0, 11.0, 20.0, 90.0, 512.0, 4193382.0, 103.0, 23.0, 14.0, 18.0, 13.0, 6.0, 2.0, 3.0, 4.0, 4.0, 1.0, 1.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0006060600280761719, -0.0005877837538719177, -0.0005695074796676636, -0.0005512312054634094, -0.0005329549312591553, -0.0005146786570549011, -0.000496402382850647, -0.0004781261086463928, -0.00045984983444213867, -0.0004415735602378845, -0.00042329728603363037, -0.0004050210118293762, -0.00038674473762512207, -0.0003684684634208679, -0.00035019218921661377, -0.0003319159150123596, -0.00031363964080810547, -0.0002953633666038513, -0.00027708709239959717, -0.000258810818195343, -0.00024053454399108887, -0.00022225826978683472, -0.00020398199558258057, -0.00018570572137832642, -0.00016742944717407227, -0.00014915317296981812, -0.00013087689876556396, -0.00011260062456130981, -9.432435035705566e-05, -7.604807615280151e-05, -5.777180194854736e-05, -3.949552774429321e-05, -2.1219253540039062e-05, -2.942979335784912e-06, 1.5333294868469238e-05, 3.360956907272339e-05, 5.188584327697754e-05, 7.016211748123169e-05, 8.843839168548584e-05, 0.00010671466588973999, 0.00012499094009399414, 0.0001432672142982483, 0.00016154348850250244, 0.0001798197627067566, 0.00019809603691101074, 0.0002163723111152649, 0.00023464858531951904, 0.0002529248595237732, 0.00027120113372802734, 0.0002894774079322815, 0.00030775368213653564, 0.0003260299563407898, 0.00034430623054504395, 0.0003625825047492981, 0.00038085877895355225, 0.0003991350531578064, 0.00041741132736206055, 0.0004356876015663147, 0.00045396387577056885, 0.000472240149974823, 0.0004905164241790771, 0.0005087926983833313, 0.0005270689725875854, 0.0005453452467918396, 0.0005636215209960938]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 5.0, 3.0, 2.0, 4.0, 8.0, 15.0, 15.0, 17.0, 19.0, 116.0, 413.0, 231.0, 46.0, 23.0, 9.0, 7.0, 7.0, 11.0, 10.0, 5.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0193634033203125, -0.01875019073486328, -0.018136978149414062, -0.017523765563964844, -0.016910552978515625, -0.016297340393066406, -0.015684127807617188, -0.015070915222167969, -0.01445770263671875, -0.013844490051269531, -0.013231277465820312, -0.012618064880371094, -0.012004852294921875, -0.011391639709472656, -0.010778427124023438, -0.010165214538574219, -0.009552001953125, -0.008938789367675781, -0.008325576782226562, -0.007712364196777344, -0.007099151611328125, -0.006485939025878906, -0.0058727264404296875, -0.005259513854980469, -0.00464630126953125, -0.004033088684082031, -0.0034198760986328125, -0.0028066635131835938, -0.002193450927734375, -0.0015802383422851562, -0.0009670257568359375, -0.00035381317138671875, 0.0002593994140625, 0.0008726119995117188, 0.0014858245849609375, 0.0020990371704101562, 0.002712249755859375, 0.0033254623413085938, 0.0039386749267578125, 0.004551887512207031, 0.00516510009765625, 0.005778312683105469, 0.0063915252685546875, 0.007004737854003906, 0.007617950439453125, 0.008231163024902344, 0.008844375610351562, 0.009457588195800781, 0.01007080078125, 0.010684013366699219, 0.011297225952148438, 0.011910438537597656, 0.012523651123046875, 0.013136863708496094, 0.013750076293945312, 0.014363288879394531, 0.01497650146484375, 0.015589714050292969, 0.016202926635742188, 0.016816139221191406, 0.017429351806640625, 0.018042564392089844, 0.018655776977539062, 0.01926898956298828, 0.0198822021484375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 6.0, 12.0, 27.0, 43.0, 85.0, 138.0, 222.0, 305.0, 4191970.0, 788.0, 244.0, 190.0, 100.0, 67.0, 42.0, 18.0, 11.0, 10.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00016355514526367188, -0.00015944987535476685, -0.00015534460544586182, -0.0001512393355369568, -0.00014713406562805176, -0.00014302879571914673, -0.0001389235258102417, -0.00013481825590133667, -0.00013071298599243164, -0.0001266077160835266, -0.00012250244617462158, -0.00011839717626571655, -0.00011429190635681152, -0.0001101866364479065, -0.00010608136653900146, -0.00010197609663009644, -9.78708267211914e-05, -9.376555681228638e-05, -8.966028690338135e-05, -8.555501699447632e-05, -8.144974708557129e-05, -7.734447717666626e-05, -7.323920726776123e-05, -6.91339373588562e-05, -6.502866744995117e-05, -6.092339754104614e-05, -5.681812763214111e-05, -5.2712857723236084e-05, -4.8607587814331055e-05, -4.4502317905426025e-05, -4.0397047996520996e-05, -3.629177808761597e-05, -3.218650817871094e-05, -2.8081238269805908e-05, -2.397596836090088e-05, -1.987069845199585e-05, -1.576542854309082e-05, -1.1660158634185791e-05, -7.554888725280762e-06, -3.4496188163757324e-06, 6.556510925292969e-07, 4.760921001434326e-06, 8.866190910339355e-06, 1.2971460819244385e-05, 1.7076730728149414e-05, 2.1182000637054443e-05, 2.5287270545959473e-05, 2.9392540454864502e-05, 3.349781036376953e-05, 3.760308027267456e-05, 4.170835018157959e-05, 4.581362009048462e-05, 4.991888999938965e-05, 5.402415990829468e-05, 5.812942981719971e-05, 6.223469972610474e-05, 6.633996963500977e-05, 7.04452395439148e-05, 7.455050945281982e-05, 7.865577936172485e-05, 8.276104927062988e-05, 8.686631917953491e-05, 9.097158908843994e-05, 9.507685899734497e-05, 9.918212890625e-05]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4088.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.245208740234375e-06, -4.484318196773529e-06, -3.723427653312683e-06, -2.962537109851837e-06, -2.201646566390991e-06, -1.4407560229301453e-06, -6.798654794692993e-07, 8.102506399154663e-08, 8.419156074523926e-07, 1.6028061509132385e-06, 2.3636966943740845e-06, 3.1245872378349304e-06, 3.885477781295776e-06, 4.646368324756622e-06, 5.407258868217468e-06, 6.168149411678314e-06, 6.92903995513916e-06, 7.689930498600006e-06, 8.450821042060852e-06, 9.211711585521698e-06, 9.972602128982544e-06, 1.073349267244339e-05, 1.1494383215904236e-05, 1.2255273759365082e-05, 1.3016164302825928e-05, 1.3777054846286774e-05, 1.453794538974762e-05, 1.5298835933208466e-05, 1.605972647666931e-05, 1.6820617020130157e-05, 1.7581507563591003e-05, 1.834239810705185e-05, 1.9103288650512695e-05, 1.986417919397354e-05, 2.0625069737434387e-05, 2.1385960280895233e-05, 2.214685082435608e-05, 2.2907741367816925e-05, 2.366863191127777e-05, 2.4429522454738617e-05, 2.5190412998199463e-05, 2.595130354166031e-05, 2.6712194085121155e-05, 2.7473084628582e-05, 2.8233975172042847e-05, 2.8994865715503693e-05, 2.975575625896454e-05, 3.0516646802425385e-05, 3.127753734588623e-05, 3.2038427889347076e-05, 3.279931843280792e-05, 3.356020897626877e-05, 3.4321099519729614e-05, 3.508199006319046e-05, 3.5842880606651306e-05, 3.660377115011215e-05, 3.7364661693573e-05, 3.8125552237033844e-05, 3.888644278049469e-05, 3.9647333323955536e-05, 4.040822386741638e-05, 4.116911441087723e-05, 4.1930004954338074e-05, 4.269089549779892e-05, 4.3451786041259766e-05]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 28.0, 972.0, 9.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013577780919149518, -0.0001312948443228379, -0.00012681189400609583, -0.00012232892913743854, -0.00011784596426878124, -0.00011336300667608157, -0.00010888004908338189, -0.0001043970842147246, -9.991412662202492e-05, -9.543116902932525e-05, -9.094820416066796e-05, -8.646524656796828e-05, -8.19822889752686e-05, -7.749932410661131e-05, -7.301636651391163e-05, -6.853340892121196e-05, -6.405044405255467e-05, -5.956748282187618e-05, -5.50845215911977e-05, -5.060156399849802e-05, -4.611860276781954e-05, -4.1635641537141055e-05, -3.715268394444138e-05, -3.2669722713762894e-05, -2.818676148308441e-05, -2.3703800252405927e-05, -1.9220840840716846e-05, -1.4737880519533064e-05, -1.0254920198349282e-05, -5.771958967670798e-06, -1.288999555981718e-06, 3.1939598557073623e-06, 7.676921086385846e-06, 1.2159881407569628e-05, 1.664284172875341e-05, 2.112580114044249e-05, 2.5608762371120974e-05, 3.0091723601799458e-05, 3.4574681194499135e-05, 3.905764242517762e-05, 4.35406036558561e-05, 4.8023564886534587e-05, 5.250652611721307e-05, 5.698948370991275e-05, 6.147244130261242e-05, 6.595540617126971e-05, 7.043836376396939e-05, 7.492132135666907e-05, 7.940428622532636e-05, 8.388724381802604e-05, 8.837020868668333e-05, 9.2853166279383e-05, 9.73361311480403e-05, 0.00010181908874073997, 0.00010630204633343965, 0.00011078501120209694, 0.00011526796879479662, 0.00011975092638749629, 0.00012423389125615358, 0.00012871685612481087, 0.00013319980644155294, 0.00013768277131021023, 0.00014216573617886752, 0.00014664868649560958, 0.00015113165136426687]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 6.0, 14.0, 19.0, 62.0, 151.0, 134.0, 132.0, 149.0, 142.0, 126.0, 29.0, 17.0, 13.0, 5.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7610530853271484e-05, -3.56016680598259e-05, -3.359280526638031e-05, -3.158394247293472e-05, -2.9575079679489136e-05, -2.756621688604355e-05, -2.555735409259796e-05, -2.3548491299152374e-05, -2.1539628505706787e-05, -1.95307657122612e-05, -1.7521902918815613e-05, -1.5513040125370026e-05, -1.3504177331924438e-05, -1.1495314538478851e-05, -9.486451745033264e-06, -7.477588951587677e-06, -5.46872615814209e-06, -3.4598633646965027e-06, -1.4510005712509155e-06, 5.578622221946716e-07, 2.566725015640259e-06, 4.575587809085846e-06, 6.584450602531433e-06, 8.59331339597702e-06, 1.0602176189422607e-05, 1.2611038982868195e-05, 1.4619901776313782e-05, 1.662876456975937e-05, 1.8637627363204956e-05, 2.0646490156650543e-05, 2.265535295009613e-05, 2.4664215743541718e-05, 2.6673078536987305e-05, 2.8681941330432892e-05, 3.069080412387848e-05, 3.2699666917324066e-05, 3.470852971076965e-05, 3.671739250421524e-05, 3.872625529766083e-05, 4.0735118091106415e-05, 4.2743980884552e-05, 4.475284367799759e-05, 4.6761706471443176e-05, 4.8770569264888763e-05, 5.077943205833435e-05, 5.278829485177994e-05, 5.4797157645225525e-05, 5.680602043867111e-05, 5.88148832321167e-05, 6.0823746025562286e-05, 6.283260881900787e-05, 6.484147161245346e-05, 6.685033440589905e-05, 6.885919719934464e-05, 7.086805999279022e-05, 7.287692278623581e-05, 7.48857855796814e-05, 7.689464837312698e-05, 7.890351116657257e-05, 8.091237396001816e-05, 8.292123675346375e-05, 8.493009954690933e-05, 8.693896234035492e-05, 8.89478251338005e-05, 9.09566879272461e-05]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 3.0, 6.0, 9.0, 13.0, 16.0, 31.0, 39.0, 56.0, 146.0, 292.0, 810.0, 2787.0, 18170.0, 1005833.0, 16279.0, 2530.0, 833.0, 345.0, 151.0, 78.0, 41.0, 28.0, 9.0, 11.0, 4.0, 3.0, 1.0, 4.0, 5.0, 6.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0684814453125, -0.06637287139892578, -0.06426429748535156, -0.062155723571777344, -0.060047149658203125, -0.057938575744628906, -0.05583000183105469, -0.05372142791748047, -0.05161285400390625, -0.04950428009033203, -0.04739570617675781, -0.045287132263183594, -0.043178558349609375, -0.041069984436035156, -0.03896141052246094, -0.03685283660888672, -0.0347442626953125, -0.03263568878173828, -0.030527114868164062, -0.028418540954589844, -0.026309967041015625, -0.024201393127441406, -0.022092819213867188, -0.01998424530029297, -0.01787567138671875, -0.01576709747314453, -0.013658523559570312, -0.011549949645996094, -0.009441375732421875, -0.007332801818847656, -0.0052242279052734375, -0.0031156539916992188, -0.001007080078125, 0.0011014938354492188, 0.0032100677490234375, 0.005318641662597656, 0.007427215576171875, 0.009535789489746094, 0.011644363403320312, 0.013752937316894531, 0.01586151123046875, 0.01797008514404297, 0.020078659057617188, 0.022187232971191406, 0.024295806884765625, 0.026404380798339844, 0.028512954711914062, 0.03062152862548828, 0.0327301025390625, 0.03483867645263672, 0.03694725036621094, 0.039055824279785156, 0.041164398193359375, 0.043272972106933594, 0.04538154602050781, 0.04749011993408203, 0.04959869384765625, 0.05170726776123047, 0.05381584167480469, 0.055924415588378906, 0.058032989501953125, 0.060141563415527344, 0.06225013732910156, 0.06435871124267578, 0.06646728515625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 5.0, 3.0, 2.0, 4.0, 8.0, 15.0, 15.0, 17.0, 19.0, 116.0, 413.0, 231.0, 46.0, 23.0, 9.0, 7.0, 7.0, 11.0, 10.0, 5.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0193634033203125, -0.01875019073486328, -0.018136978149414062, -0.017523765563964844, -0.016910552978515625, -0.016297340393066406, -0.015684127807617188, -0.015070915222167969, -0.01445770263671875, -0.013844490051269531, -0.013231277465820312, -0.012618064880371094, -0.012004852294921875, -0.011391639709472656, -0.010778427124023438, -0.010165214538574219, -0.009552001953125, -0.008938789367675781, -0.008325576782226562, -0.007712364196777344, -0.007099151611328125, -0.006485939025878906, -0.0058727264404296875, -0.005259513854980469, -0.00464630126953125, -0.004033088684082031, -0.0034198760986328125, -0.0028066635131835938, -0.002193450927734375, -0.0015802383422851562, -0.0009670257568359375, -0.00035381317138671875, 0.0002593994140625, 0.0008726119995117188, 0.0014858245849609375, 0.0020990371704101562, 0.002712249755859375, 0.0033254623413085938, 0.0039386749267578125, 0.004551887512207031, 0.00516510009765625, 0.005778312683105469, 0.0063915252685546875, 0.007004737854003906, 0.007617950439453125, 0.008231163024902344, 0.008844375610351562, 0.009457588195800781, 0.01007080078125, 0.010684013366699219, 0.011297225952148438, 0.011910438537597656, 0.012523651123046875, 0.013136863708496094, 0.013750076293945312, 0.014363288879394531, 0.01497650146484375, 0.015589714050292969, 0.016202926635742188, 0.016816139221191406, 0.017429351806640625, 0.018042564392089844, 0.018655776977539062, 0.01926898956298828, 0.0198822021484375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 4.0, 6.0, 5.0, 4.0, 5.0, 7.0, 4.0, 11.0, 13.0, 14.0, 18.0, 30.0, 27.0, 25.0, 35.0, 59.0, 79.0, 136.0, 292.0, 632.0, 1699.0, 114936.0, 926830.0, 2095.0, 758.0, 307.0, 158.0, 84.0, 54.0, 38.0, 29.0, 24.0, 20.0, 23.0, 21.0, 20.0, 8.0, 8.0, 6.0, 8.0, 3.0, 5.0, 9.0, 4.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049468994140625, -0.0479273796081543, -0.046385765075683594, -0.04484415054321289, -0.04330253601074219, -0.041760921478271484, -0.04021930694580078, -0.03867769241333008, -0.037136077880859375, -0.03559446334838867, -0.03405284881591797, -0.032511234283447266, -0.030969619750976562, -0.02942800521850586, -0.027886390686035156, -0.026344776153564453, -0.02480316162109375, -0.023261547088623047, -0.021719932556152344, -0.02017831802368164, -0.018636703491210938, -0.017095088958740234, -0.015553474426269531, -0.014011859893798828, -0.012470245361328125, -0.010928630828857422, -0.009387016296386719, -0.007845401763916016, -0.0063037872314453125, -0.004762172698974609, -0.0032205581665039062, -0.0016789436340332031, -0.0001373291015625, 0.0014042854309082031, 0.0029458999633789062, 0.004487514495849609, 0.0060291290283203125, 0.007570743560791016, 0.009112358093261719, 0.010653972625732422, 0.012195587158203125, 0.013737201690673828, 0.015278816223144531, 0.016820430755615234, 0.018362045288085938, 0.01990365982055664, 0.021445274353027344, 0.022986888885498047, 0.02452850341796875, 0.026070117950439453, 0.027611732482910156, 0.02915334701538086, 0.030694961547851562, 0.032236576080322266, 0.03377819061279297, 0.03531980514526367, 0.036861419677734375, 0.03840303421020508, 0.03994464874267578, 0.041486263275146484, 0.04302787780761719, 0.04456949234008789, 0.046111106872558594, 0.0476527214050293, 0.0491943359375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 4.0, 6.0, 5.0, 4.0, 5.0, 6.0, 5.0, 11.0, 13.0, 14.0, 20.0, 26.0, 29.0, 24.0, 34.0, 37.0, 33.0, 34.0, 31.0, 65.0, 46.0, 48.0, 55.0, 43.0, 42.0, 38.0, 38.0, 37.0, 32.0, 30.0, 28.0, 23.0, 19.0, 24.0, 21.0, 21.0, 6.0, 9.0, 5.0, 9.0, 3.0, 5.0, 9.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0382080078125, -0.037016868591308594, -0.03582572937011719, -0.03463459014892578, -0.033443450927734375, -0.03225231170654297, -0.031061172485351562, -0.029870033264160156, -0.02867889404296875, -0.027487754821777344, -0.026296615600585938, -0.02510547637939453, -0.023914337158203125, -0.02272319793701172, -0.021532058715820312, -0.020340919494628906, -0.0191497802734375, -0.017958641052246094, -0.016767501831054688, -0.015576362609863281, -0.014385223388671875, -0.013194084167480469, -0.012002944946289062, -0.010811805725097656, -0.00962066650390625, -0.008429527282714844, -0.0072383880615234375, -0.006047248840332031, -0.004856109619140625, -0.0036649703979492188, -0.0024738311767578125, -0.0012826919555664062, -9.1552734375e-05, 0.0010995864868164062, 0.0022907257080078125, 0.0034818649291992188, 0.004673004150390625, 0.005864143371582031, 0.0070552825927734375, 0.008246421813964844, 0.00943756103515625, 0.010628700256347656, 0.011819839477539062, 0.013010978698730469, 0.014202117919921875, 0.015393257141113281, 0.016584396362304688, 0.017775535583496094, 0.0189666748046875, 0.020157814025878906, 0.021348953247070312, 0.02254009246826172, 0.023731231689453125, 0.02492237091064453, 0.026113510131835938, 0.027304649353027344, 0.02849578857421875, 0.029686927795410156, 0.030878067016601562, 0.03206920623779297, 0.033260345458984375, 0.03445148468017578, 0.03564262390136719, 0.036833763122558594, 0.03802490234375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 13.0, 13.0, 21.0, 38.0, 69.0, 102.0, 175.0, 441.0, 1280.0, 5927.0, 194587.0, 835830.0, 7460.0, 1557.0, 525.0, 201.0, 129.0, 65.0, 30.0, 36.0, 17.0, 12.0, 7.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.066394805908203e-05, -4.9297697842121124e-05, -4.793144762516022e-05, -4.656519740819931e-05, -4.51989471912384e-05, -4.3832696974277496e-05, -4.246644675731659e-05, -4.110019654035568e-05, -3.9733946323394775e-05, -3.836769610643387e-05, -3.700144588947296e-05, -3.5635195672512054e-05, -3.426894545555115e-05, -3.290269523859024e-05, -3.1536445021629333e-05, -3.0170194804668427e-05, -2.880394458770752e-05, -2.7437694370746613e-05, -2.6071444153785706e-05, -2.47051939368248e-05, -2.333894371986389e-05, -2.1972693502902985e-05, -2.0606443285942078e-05, -1.924019306898117e-05, -1.7873942852020264e-05, -1.6507692635059357e-05, -1.514144241809845e-05, -1.3775192201137543e-05, -1.2408941984176636e-05, -1.1042691767215729e-05, -9.676441550254822e-06, -8.310191333293915e-06, -6.943941116333008e-06, -5.577690899372101e-06, -4.211440682411194e-06, -2.845190465450287e-06, -1.4789402484893799e-06, -1.126900315284729e-07, 1.253560185432434e-06, 2.619810402393341e-06, 3.986060619354248e-06, 5.352310836315155e-06, 6.718561053276062e-06, 8.084811270236969e-06, 9.451061487197876e-06, 1.0817311704158783e-05, 1.218356192111969e-05, 1.3549812138080597e-05, 1.4916062355041504e-05, 1.628231257200241e-05, 1.7648562788963318e-05, 1.9014813005924225e-05, 2.0381063222885132e-05, 2.174731343984604e-05, 2.3113563656806946e-05, 2.4479813873767853e-05, 2.584606409072876e-05, 2.7212314307689667e-05, 2.8578564524650574e-05, 2.994481474161148e-05, 3.131106495857239e-05, 3.2677315175533295e-05, 3.40435653924942e-05, 3.540981560945511e-05, 3.6776065826416016e-05]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1.0, 0.0, 5.0, 3.0, 5.0, 12.0, 7.0, 15.0, 17.0, 20.0, 19.0, 32.0, 53.0, 33.0, 62.0, 41.0, 81.0, 64.0, 48.0, 81.0, 49.0, 59.0, 47.0, 44.0, 39.0, 19.0, 36.0, 30.0, 25.0, 20.0, 12.0, 11.0, 7.0, 2.0, 3.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.139278411865234e-06, -5.984678864479065e-06, -5.8300793170928955e-06, -5.675479769706726e-06, -5.520880222320557e-06, -5.366280674934387e-06, -5.211681127548218e-06, -5.057081580162048e-06, -4.902482032775879e-06, -4.7478824853897095e-06, -4.59328293800354e-06, -4.438683390617371e-06, -4.284083843231201e-06, -4.129484295845032e-06, -3.974884748458862e-06, -3.820285201072693e-06, -3.6656856536865234e-06, -3.511086106300354e-06, -3.3564865589141846e-06, -3.201887011528015e-06, -3.0472874641418457e-06, -2.8926879167556763e-06, -2.738088369369507e-06, -2.5834888219833374e-06, -2.428889274597168e-06, -2.2742897272109985e-06, -2.119690179824829e-06, -1.9650906324386597e-06, -1.8104910850524902e-06, -1.6558915376663208e-06, -1.5012919902801514e-06, -1.346692442893982e-06, -1.1920928955078125e-06, -1.037493348121643e-06, -8.828938007354736e-07, -7.282942533493042e-07, -5.736947059631348e-07, -4.1909515857696533e-07, -2.644956111907959e-07, -1.0989606380462646e-07, 4.470348358154297e-08, 1.993030309677124e-07, 3.5390257835388184e-07, 5.085021257400513e-07, 6.631016731262207e-07, 8.177012205123901e-07, 9.723007678985596e-07, 1.126900315284729e-06, 1.2814998626708984e-06, 1.4360994100570679e-06, 1.5906989574432373e-06, 1.7452985048294067e-06, 1.8998980522155762e-06, 2.0544975996017456e-06, 2.209097146987915e-06, 2.3636966943740845e-06, 2.518296241760254e-06, 2.6728957891464233e-06, 2.8274953365325928e-06, 2.982094883918762e-06, 3.1366944313049316e-06, 3.291293978691101e-06, 3.4458935260772705e-06, 3.60049307346344e-06, 3.7550926208496094e-06]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 8.0, 3.0, 10.0, 12.0, 13.0, 11.0, 26.0, 63.0, 131.0, 343.0, 1993.0, 1043547.0, 1793.0, 314.0, 140.0, 52.0, 22.0, 11.0, 14.0, 17.0, 4.0, 11.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012612342834472656, -0.00012292899191379547, -0.00011973455548286438, -0.00011654011905193329, -0.0001133456826210022, -0.0001101512461900711, -0.00010695680975914001, -0.00010376237332820892, -0.00010056793689727783, -9.737350046634674e-05, -9.417906403541565e-05, -9.098462760448456e-05, -8.779019117355347e-05, -8.459575474262238e-05, -8.140131831169128e-05, -7.820688188076019e-05, -7.50124454498291e-05, -7.181800901889801e-05, -6.862357258796692e-05, -6.542913615703583e-05, -6.223469972610474e-05, -5.9040263295173645e-05, -5.5845826864242554e-05, -5.265139043331146e-05, -4.945695400238037e-05, -4.626251757144928e-05, -4.306808114051819e-05, -3.98736447095871e-05, -3.6679208278656006e-05, -3.3484771847724915e-05, -3.0290335416793823e-05, -2.7095898985862732e-05, -2.390146255493164e-05, -2.070702612400055e-05, -1.7512589693069458e-05, -1.4318153262138367e-05, -1.1123716831207275e-05, -7.929280400276184e-06, -4.734843969345093e-06, -1.5404075384140015e-06, 1.6540288925170898e-06, 4.848465323448181e-06, 8.042901754379272e-06, 1.1237338185310364e-05, 1.4431774616241455e-05, 1.7626211047172546e-05, 2.0820647478103638e-05, 2.401508390903473e-05, 2.720952033996582e-05, 3.040395677089691e-05, 3.3598393201828e-05, 3.6792829632759094e-05, 3.9987266063690186e-05, 4.318170249462128e-05, 4.637613892555237e-05, 4.957057535648346e-05, 5.276501178741455e-05, 5.595944821834564e-05, 5.9153884649276733e-05, 6.234832108020782e-05, 6.554275751113892e-05, 6.873719394207001e-05, 7.19316303730011e-05, 7.512606680393219e-05, 7.832050323486328e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 8.0, 2.0, 10.0, 12.0, 10.0, 9.0, 16.0, 28.0, 54.0, 63.0, 124.0, 308.0, 127.0, 76.0, 48.0, 28.0, 16.0, 6.0, 11.0, 15.0, 5.0, 11.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.810924530029297e-05, -9.562913328409195e-05, -9.314902126789093e-05, -9.066890925168991e-05, -8.818879723548889e-05, -8.570868521928787e-05, -8.322857320308685e-05, -8.074846118688583e-05, -7.826834917068481e-05, -7.57882371544838e-05, -7.330812513828278e-05, -7.082801312208176e-05, -6.834790110588074e-05, -6.586778908967972e-05, -6.33876770734787e-05, -6.090756505727768e-05, -5.842745304107666e-05, -5.594734102487564e-05, -5.346722900867462e-05, -5.09871169924736e-05, -4.850700497627258e-05, -4.6026892960071564e-05, -4.3546780943870544e-05, -4.1066668927669525e-05, -3.8586556911468506e-05, -3.6106444895267487e-05, -3.362633287906647e-05, -3.114622086286545e-05, -2.866610884666443e-05, -2.618599683046341e-05, -2.370588481426239e-05, -2.122577279806137e-05, -1.874566078186035e-05, -1.6265548765659332e-05, -1.3785436749458313e-05, -1.1305324733257294e-05, -8.825212717056274e-06, -6.345100700855255e-06, -3.864988684654236e-06, -1.3848766684532166e-06, 1.0952353477478027e-06, 3.575347363948822e-06, 6.055459380149841e-06, 8.53557139635086e-06, 1.101568341255188e-05, 1.34957954287529e-05, 1.597590744495392e-05, 1.8456019461154938e-05, 2.0936131477355957e-05, 2.3416243493556976e-05, 2.5896355509757996e-05, 2.8376467525959015e-05, 3.0856579542160034e-05, 3.3336691558361053e-05, 3.581680357456207e-05, 3.829691559076309e-05, 4.077702760696411e-05, 4.325713962316513e-05, 4.573725163936615e-05, 4.821736365556717e-05, 5.069747567176819e-05, 5.317758768796921e-05, 5.565769970417023e-05, 5.8137811720371246e-05, 6.0617923736572266e-05]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 849.0, 155.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15546324849128723, -0.1422867476940155, -0.12911024689674377, -0.11593374609947205, -0.10275724530220032, -0.08958074450492859, -0.07640424370765686, -0.06322774291038513, -0.0500512421131134, -0.036874741315841675, -0.023698240518569946, -0.010521739721298218, 0.0026547610759735107, 0.01583126187324524, 0.029007762670516968, 0.042184263467788696, 0.055360764265060425, 0.06853726506233215, 0.08171376585960388, 0.09489026665687561, 0.10806676745414734, 0.12124326825141907, 0.1344197690486908, 0.14759626984596252, 0.16077277064323425, 0.17394927144050598, 0.1871257722377777, 0.20030227303504944, 0.21347877383232117, 0.2266552746295929, 0.23983177542686462, 0.25300827622413635, 0.26618480682373047, 0.2793613076210022, 0.2925378084182739, 0.30571430921554565, 0.3188908100128174, 0.3320673108100891, 0.34524381160736084, 0.35842031240463257, 0.3715968132019043, 0.384773313999176, 0.39794981479644775, 0.4111263155937195, 0.4243028163909912, 0.43747931718826294, 0.45065581798553467, 0.4638323187828064, 0.4770088195800781, 0.49018532037734985, 0.5033618211746216, 0.5165383219718933, 0.529714822769165, 0.5428913235664368, 0.5560678243637085, 0.5692443251609802, 0.582420825958252, 0.5955973267555237, 0.6087738275527954, 0.6219503283500671, 0.6351268291473389, 0.6483033299446106, 0.6614798307418823, 0.674656331539154, 0.6878328323364258]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 14.0, 15.0, 12.0, 18.0, 20.0, 32.0, 34.0, 37.0, 49.0, 56.0, 55.0, 68.0, 76.0, 64.0, 69.0, 64.0, 61.0, 38.0, 37.0, 40.0, 37.0, 17.0, 17.0, 17.0, 20.0, 13.0, 2.0, 2.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24812549352645874, -0.2404186725616455, -0.23271186649799347, -0.22500504553318024, -0.2172982394695282, -0.20959141850471497, -0.20188459753990173, -0.1941777765750885, -0.18647097051143646, -0.17876414954662323, -0.1710573434829712, -0.16335052251815796, -0.15564370155334473, -0.1479368954896927, -0.14023007452487946, -0.13252326846122742, -0.12481644749641418, -0.11710963398218155, -0.10940282046794891, -0.10169599950313568, -0.09398918598890305, -0.08628237247467041, -0.07857555150985718, -0.07086873799562454, -0.0631619244813919, -0.05545511096715927, -0.04774829372763634, -0.0400414764881134, -0.03233466297388077, -0.024627849459648132, -0.0169210322201252, -0.009214214980602264, -0.001507401466369629, 0.006199413910508156, 0.01390622928738594, 0.021613044664263725, 0.02931986004114151, 0.037026673555374146, 0.04473349079489708, 0.05244030803442001, 0.06014712154865265, 0.06785393506288528, 0.07556074857711792, 0.08326756954193115, 0.09097438305616379, 0.09868119657039642, 0.10638801753520966, 0.11409483104944229, 0.12180164456367493, 0.12950846552848816, 0.1372152715921402, 0.14492209255695343, 0.15262889862060547, 0.1603357195854187, 0.16804254055023193, 0.17574936151504517, 0.1834561675786972, 0.19116298854351044, 0.19886979460716248, 0.2065766155719757, 0.21428343653678894, 0.22199024260044098, 0.2296970635652542, 0.23740386962890625, 0.24511069059371948]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 4.0, 5.0, 11.0, 9.0, 12.0, 14.0, 15.0, 25.0, 41.0, 31.0, 29.0, 53.0, 104.0, 214.0, 964.0, 4191612.0, 619.0, 121.0, 98.0, 69.0, 53.0, 31.0, 22.0, 10.0, 10.0, 15.0, 3.0, 10.0, 10.0, 11.0, 12.0, 12.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0], "bins": [-0.0033283233642578125, -0.003225773572921753, -0.0031232237815856934, -0.003020673990249634, -0.0029181241989135742, -0.0028155744075775146, -0.002713024616241455, -0.0026104748249053955, -0.002507925033569336, -0.0024053752422332764, -0.002302825450897217, -0.0022002756595611572, -0.0020977258682250977, -0.001995176076889038, -0.0018926262855529785, -0.001790076494216919, -0.0016875267028808594, -0.0015849769115447998, -0.0014824271202087402, -0.0013798773288726807, -0.001277327537536621, -0.0011747777462005615, -0.001072227954864502, -0.0009696781635284424, -0.0008671283721923828, -0.0007645785808563232, -0.0006620287895202637, -0.0005594789981842041, -0.00045692920684814453, -0.00035437941551208496, -0.0002518296241760254, -0.00014927983283996582, -4.673004150390625e-05, 5.581974983215332e-05, 0.0001583695411682129, 0.00026091933250427246, 0.00036346912384033203, 0.0004660189151763916, 0.0005685687065124512, 0.0006711184978485107, 0.0007736682891845703, 0.0008762180805206299, 0.0009787678718566895, 0.001081317663192749, 0.0011838674545288086, 0.0012864172458648682, 0.0013889670372009277, 0.0014915168285369873, 0.0015940666198730469, 0.0016966164112091064, 0.001799166202545166, 0.0019017159938812256, 0.002004265785217285, 0.0021068155765533447, 0.0022093653678894043, 0.002311915159225464, 0.0024144649505615234, 0.002517014741897583, 0.0026195645332336426, 0.002722114324569702, 0.0028246641159057617, 0.0029272139072418213, 0.003029763698577881, 0.0031323134899139404, 0.00323486328125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 5.0, 3.0, 2.0, 4.0, 8.0, 15.0, 15.0, 19.0, 21.0, 114.0, 413.0, 229.0, 46.0, 22.0, 9.0, 9.0, 5.0, 12.0, 10.0, 5.0, 5.0, 5.0, 2.0, 2.0, 4.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0193634033203125, -0.01875019073486328, -0.018136978149414062, -0.017523765563964844, -0.016910552978515625, -0.016297340393066406, -0.015684127807617188, -0.015070915222167969, -0.01445770263671875, -0.013844490051269531, -0.013231277465820312, -0.012618064880371094, -0.012004852294921875, -0.011391639709472656, -0.010778427124023438, -0.010165214538574219, -0.009552001953125, -0.008938789367675781, -0.008325576782226562, -0.007712364196777344, -0.007099151611328125, -0.006485939025878906, -0.0058727264404296875, -0.005259513854980469, -0.00464630126953125, -0.004033088684082031, -0.0034198760986328125, -0.0028066635131835938, -0.002193450927734375, -0.0015802383422851562, -0.0009670257568359375, -0.00035381317138671875, 0.0002593994140625, 0.0008726119995117188, 0.0014858245849609375, 0.0020990371704101562, 0.002712249755859375, 0.0033254623413085938, 0.0039386749267578125, 0.004551887512207031, 0.00516510009765625, 0.005778312683105469, 0.0063915252685546875, 0.007004737854003906, 0.007617950439453125, 0.008231163024902344, 0.008844375610351562, 0.009457588195800781, 0.01007080078125, 0.010684013366699219, 0.011297225952148438, 0.011910438537597656, 0.012523651123046875, 0.013136863708496094, 0.013750076293945312, 0.014363288879394531, 0.01497650146484375, 0.015589714050292969, 0.016202926635742188, 0.016816139221191406, 0.017429351806640625, 0.018042564392089844, 0.018655776977539062, 0.01926898956298828, 0.0198822021484375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 9.0, 45.0, 96.0, 221.0, 552.0, 1247.0, 3936.0, 4182354.0, 3698.0, 1182.0, 552.0, 226.0, 102.0, 52.0, 8.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0008339881896972656, -0.0008074939250946045, -0.0007809996604919434, -0.0007545053958892822, -0.0007280111312866211, -0.00070151686668396, -0.0006750226020812988, -0.0006485283374786377, -0.0006220340728759766, -0.0005955398082733154, -0.0005690455436706543, -0.0005425512790679932, -0.000516057014465332, -0.0004895627498626709, -0.00046306848526000977, -0.00043657422065734863, -0.0004100799560546875, -0.00038358569145202637, -0.00035709142684936523, -0.0003305971622467041, -0.00030410289764404297, -0.00027760863304138184, -0.0002511143684387207, -0.00022462010383605957, -0.00019812583923339844, -0.0001716315746307373, -0.00014513731002807617, -0.00011864304542541504, -9.21487808227539e-05, -6.565451622009277e-05, -3.916025161743164e-05, -1.2665987014770508e-05, 1.3828277587890625e-05, 4.032254219055176e-05, 6.681680679321289e-05, 9.331107139587402e-05, 0.00011980533599853516, 0.0001462996006011963, 0.00017279386520385742, 0.00019928812980651855, 0.0002257823944091797, 0.0002522766590118408, 0.00027877092361450195, 0.0003052651882171631, 0.0003317594528198242, 0.00035825371742248535, 0.0003847479820251465, 0.0004112422466278076, 0.00043773651123046875, 0.0004642307758331299, 0.000490725040435791, 0.0005172193050384521, 0.0005437135696411133, 0.0005702078342437744, 0.0005967020988464355, 0.0006231963634490967, 0.0006496906280517578, 0.0006761848926544189, 0.0007026791572570801, 0.0007291734218597412, 0.0007556676864624023, 0.0007821619510650635, 0.0008086562156677246, 0.0008351504802703857, 0.0008616447448730469]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4031.0, 34.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00035858154296875, -0.00034769997000694275, -0.0003368183970451355, -0.00032593682408332825, -0.000315055251121521, -0.00030417367815971375, -0.0002932921051979065, -0.00028241053223609924, -0.000271528959274292, -0.00026064738631248474, -0.0002497658133506775, -0.00023888424038887024, -0.000228002667427063, -0.00021712109446525574, -0.00020623952150344849, -0.00019535794854164124, -0.00018447637557983398, -0.00017359480261802673, -0.00016271322965621948, -0.00015183165669441223, -0.00014095008373260498, -0.00013006851077079773, -0.00011918693780899048, -0.00010830536484718323, -9.742379188537598e-05, -8.654221892356873e-05, -7.566064596176147e-05, -6.477907299995422e-05, -5.389750003814697e-05, -4.301592707633972e-05, -3.213435411453247e-05, -2.125278115272522e-05, -1.0371208190917969e-05, 5.103647708892822e-07, 1.1391937732696533e-05, 2.2273510694503784e-05, 3.3155083656311035e-05, 4.4036656618118286e-05, 5.491822957992554e-05, 6.579980254173279e-05, 7.668137550354004e-05, 8.756294846534729e-05, 9.844452142715454e-05, 0.00010932609438896179, 0.00012020766735076904, 0.0001310892403125763, 0.00014197081327438354, 0.0001528523862361908, 0.00016373395919799805, 0.0001746155321598053, 0.00018549710512161255, 0.0001963786780834198, 0.00020726025104522705, 0.0002181418240070343, 0.00022902339696884155, 0.0002399049699306488, 0.00025078654289245605, 0.0002616681158542633, 0.00027254968881607056, 0.0002834312617778778, 0.00029431283473968506, 0.0003051944077014923, 0.00031607598066329956, 0.0003269575536251068, 0.00033783912658691406]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 15.0, 703.0, 280.0, 12.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005295274313539267, -0.0004999681259505451, -0.0004704088205471635, -0.0004408495151437819, -0.0004112902097404003, -0.00038173090433701873, -0.0003521716280374676, -0.000322612322634086, -0.0002930530172307044, -0.00026349371182732284, -0.00023393440642394125, -0.0002043751155724749, -0.0001748158101690933, -0.00014525650476571172, -0.00011569721391424537, -8.613790851086378e-05, -5.6578603107482195e-05, -2.7019301342079416e-05, 2.540000423323363e-06, 3.2099298550747335e-05, 6.165860395412892e-05, 9.121790935751051e-05, 0.00012077720020897686, 0.00015033650561235845, 0.00017989581101574004, 0.00020945511641912162, 0.0002390144218225032, 0.00026857369812205434, 0.0002981330035254359, 0.0003276923089288175, 0.0003572516143321991, 0.0003868109197355807, 0.00041637022513896227, 0.00044592953054234385, 0.00047548883594572544, 0.000505048141349107, 0.0005346074467524886, 0.0005641667521558702, 0.0005937260575592518, 0.0006232853047549725, 0.000652844668366015, 0.0006824039737693965, 0.0007119632791727781, 0.0007415225845761597, 0.0007710818899795413, 0.0008006411953829229, 0.0008302005007863045, 0.0008597597479820251, 0.0008893190533854067, 0.0009188783587887883, 0.0009484376641921699, 0.0009779969695955515, 0.0010075562167912722, 0.0010371155804023147, 0.0010666748275980353, 0.0010962341912090778, 0.0011257934384047985, 0.0011553526856005192, 0.0011849120492115617, 0.0012144712964072824, 0.0012440306600183249, 0.0012735899072140455, 0.001303149270825088, 0.0013327085180208087, 0.0013622678816318512]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 5.0, 10.0, 26.0, 25.0, 25.0, 40.0, 51.0, 85.0, 93.0, 119.0, 114.0, 93.0, 77.0, 74.0, 53.0, 39.0, 28.0, 19.0, 8.0, 8.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000954747200012207, -0.0009284215047955513, -0.0009020958095788956, -0.0008757701143622398, -0.0008494444191455841, -0.0008231187239289284, -0.0007967930287122726, -0.0007704673334956169, -0.0007441416382789612, -0.0007178159430623055, -0.0006914902478456497, -0.000665164552628994, -0.0006388388574123383, -0.0006125131621956825, -0.0005861874669790268, -0.0005598617717623711, -0.0005335360765457153, -0.0005072103813290596, -0.00048088468611240387, -0.00045455899089574814, -0.0004282332956790924, -0.0004019076004624367, -0.00037558190524578094, -0.0003492562100291252, -0.0003229305148124695, -0.00029660481959581375, -0.000270279124379158, -0.0002439534291625023, -0.00021762773394584656, -0.00019130203872919083, -0.0001649763435125351, -0.00013865064829587936, -0.00011232495307922363, -8.59992578625679e-05, -5.967356264591217e-05, -3.334786742925644e-05, -7.022172212600708e-06, 1.9303523004055023e-05, 4.5629218220710754e-05, 7.195491343736649e-05, 9.828060865402222e-05, 0.00012460630387067795, 0.00015093199908733368, 0.0001772576943039894, 0.00020358338952064514, 0.00022990908473730087, 0.0002562347799539566, 0.00028256047517061234, 0.00030888617038726807, 0.0003352118656039238, 0.00036153756082057953, 0.00038786325603723526, 0.000414188951253891, 0.0004405146464705467, 0.00046684034168720245, 0.0004931660369038582, 0.0005194917321205139, 0.0005458174273371696, 0.0005721431225538254, 0.0005984688177704811, 0.0006247945129871368, 0.0006511202082037926, 0.0006774459034204483, 0.000703771598637104, 0.0007300972938537598]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 4.0, 7.0, 10.0, 5.0, 15.0, 11.0, 16.0, 17.0, 43.0, 44.0, 78.0, 128.0, 232.0, 546.0, 1262.0, 3896.0, 18872.0, 991451.0, 24983.0, 4271.0, 1389.0, 539.0, 271.0, 163.0, 92.0, 58.0, 53.0, 27.0, 15.0, 13.0, 8.0, 14.0, 1.0, 5.0, 10.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053009033203125, -0.05132913589477539, -0.04964923858642578, -0.04796934127807617, -0.04628944396972656, -0.04460954666137695, -0.042929649353027344, -0.041249752044677734, -0.039569854736328125, -0.037889957427978516, -0.036210060119628906, -0.0345301628112793, -0.03285026550292969, -0.031170368194580078, -0.02949047088623047, -0.02781057357788086, -0.02613067626953125, -0.02445077896118164, -0.02277088165283203, -0.021090984344482422, -0.019411087036132812, -0.017731189727783203, -0.016051292419433594, -0.014371395111083984, -0.012691497802734375, -0.011011600494384766, -0.009331703186035156, -0.007651805877685547, -0.0059719085693359375, -0.004292011260986328, -0.0026121139526367188, -0.0009322166442871094, 0.0007476806640625, 0.0024275779724121094, 0.004107475280761719, 0.005787372589111328, 0.0074672698974609375, 0.009147167205810547, 0.010827064514160156, 0.012506961822509766, 0.014186859130859375, 0.015866756439208984, 0.017546653747558594, 0.019226551055908203, 0.020906448364257812, 0.022586345672607422, 0.02426624298095703, 0.02594614028930664, 0.02762603759765625, 0.02930593490600586, 0.03098583221435547, 0.03266572952270508, 0.03434562683105469, 0.0360255241394043, 0.037705421447753906, 0.039385318756103516, 0.041065216064453125, 0.042745113372802734, 0.044425010681152344, 0.04610490798950195, 0.04778480529785156, 0.04946470260620117, 0.05114459991455078, 0.05282449722290039, 0.05450439453125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 5.0, 3.0, 2.0, 4.0, 8.0, 15.0, 15.0, 19.0, 21.0, 114.0, 413.0, 229.0, 46.0, 22.0, 9.0, 9.0, 5.0, 12.0, 10.0, 5.0, 5.0, 5.0, 2.0, 2.0, 4.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0193634033203125, -0.01875019073486328, -0.018136978149414062, -0.017523765563964844, -0.016910552978515625, -0.016297340393066406, -0.015684127807617188, -0.015070915222167969, -0.01445770263671875, -0.013844490051269531, -0.013231277465820312, -0.012618064880371094, -0.012004852294921875, -0.011391639709472656, -0.010778427124023438, -0.010165214538574219, -0.009552001953125, -0.008938789367675781, -0.008325576782226562, -0.007712364196777344, -0.007099151611328125, -0.006485939025878906, -0.0058727264404296875, -0.005259513854980469, -0.00464630126953125, -0.004033088684082031, -0.0034198760986328125, -0.0028066635131835938, -0.002193450927734375, -0.0015802383422851562, -0.0009670257568359375, -0.00035381317138671875, 0.0002593994140625, 0.0008726119995117188, 0.0014858245849609375, 0.0020990371704101562, 0.002712249755859375, 0.0033254623413085938, 0.0039386749267578125, 0.004551887512207031, 0.00516510009765625, 0.005778312683105469, 0.0063915252685546875, 0.007004737854003906, 0.007617950439453125, 0.008231163024902344, 0.008844375610351562, 0.009457588195800781, 0.01007080078125, 0.010684013366699219, 0.011297225952148438, 0.011910438537597656, 0.012523651123046875, 0.013136863708496094, 0.013750076293945312, 0.014363288879394531, 0.01497650146484375, 0.015589714050292969, 0.016202926635742188, 0.016816139221191406, 0.017429351806640625, 0.018042564392089844, 0.018655776977539062, 0.01926898956298828, 0.0198822021484375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 8.0, 6.0, 5.0, 5.0, 12.0, 10.0, 24.0, 12.0, 10.0, 17.0, 21.0, 27.0, 37.0, 27.0, 29.0, 59.0, 104.0, 187.0, 357.0, 823.0, 3203.0, 998589.0, 42075.0, 1538.0, 579.0, 280.0, 140.0, 68.0, 42.0, 35.0, 27.0, 20.0, 34.0, 23.0, 17.0, 17.0, 13.0, 20.0, 12.0, 10.0, 5.0, 4.0, 5.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.053497314453125, -0.051914215087890625, -0.05033111572265625, -0.048748016357421875, -0.0471649169921875, -0.045581817626953125, -0.04399871826171875, -0.042415618896484375, -0.04083251953125, -0.039249420166015625, -0.03766632080078125, -0.036083221435546875, -0.0345001220703125, -0.032917022705078125, -0.03133392333984375, -0.029750823974609375, -0.028167724609375, -0.026584625244140625, -0.02500152587890625, -0.023418426513671875, -0.0218353271484375, -0.020252227783203125, -0.01866912841796875, -0.017086029052734375, -0.0155029296875, -0.013919830322265625, -0.01233673095703125, -0.010753631591796875, -0.0091705322265625, -0.007587432861328125, -0.00600433349609375, -0.004421234130859375, -0.002838134765625, -0.001255035400390625, 0.00032806396484375, 0.001911163330078125, 0.0034942626953125, 0.005077362060546875, 0.00666046142578125, 0.008243560791015625, 0.00982666015625, 0.011409759521484375, 0.01299285888671875, 0.014575958251953125, 0.0161590576171875, 0.017742156982421875, 0.01932525634765625, 0.020908355712890625, 0.022491455078125, 0.024074554443359375, 0.02565765380859375, 0.027240753173828125, 0.0288238525390625, 0.030406951904296875, 0.03199005126953125, 0.033573150634765625, 0.03515625, 0.036739349365234375, 0.03832244873046875, 0.039905548095703125, 0.0414886474609375, 0.043071746826171875, 0.04465484619140625, 0.046237945556640625, 0.047821044921875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 8.0, 6.0, 5.0, 5.0, 13.0, 10.0, 22.0, 14.0, 9.0, 17.0, 21.0, 28.0, 38.0, 24.0, 23.0, 33.0, 41.0, 30.0, 31.0, 41.0, 40.0, 39.0, 35.0, 38.0, 41.0, 35.0, 46.0, 24.0, 30.0, 29.0, 29.0, 19.0, 35.0, 22.0, 16.0, 19.0, 11.0, 21.0, 12.0, 9.0, 6.0, 4.0, 5.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.03387451171875, -0.03287172317504883, -0.031868934631347656, -0.030866146087646484, -0.029863357543945312, -0.02886056900024414, -0.02785778045654297, -0.026854991912841797, -0.025852203369140625, -0.024849414825439453, -0.02384662628173828, -0.02284383773803711, -0.021841049194335938, -0.020838260650634766, -0.019835472106933594, -0.018832683563232422, -0.01782989501953125, -0.016827106475830078, -0.015824317932128906, -0.014821529388427734, -0.013818740844726562, -0.01281595230102539, -0.011813163757324219, -0.010810375213623047, -0.009807586669921875, -0.008804798126220703, -0.007802009582519531, -0.006799221038818359, -0.0057964324951171875, -0.004793643951416016, -0.0037908554077148438, -0.002788066864013672, -0.0017852783203125, -0.0007824897766113281, 0.00022029876708984375, 0.0012230873107910156, 0.0022258758544921875, 0.0032286643981933594, 0.004231452941894531, 0.005234241485595703, 0.006237030029296875, 0.007239818572998047, 0.008242607116699219, 0.00924539566040039, 0.010248184204101562, 0.011250972747802734, 0.012253761291503906, 0.013256549835205078, 0.01425933837890625, 0.015262126922607422, 0.016264915466308594, 0.017267704010009766, 0.018270492553710938, 0.01927328109741211, 0.02027606964111328, 0.021278858184814453, 0.022281646728515625, 0.023284435272216797, 0.02428722381591797, 0.02529001235961914, 0.026292800903320312, 0.027295589447021484, 0.028298377990722656, 0.029301166534423828, 0.030303955078125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 7.0, 8.0, 9.0, 13.0, 12.0, 16.0, 37.0, 37.0, 59.0, 87.0, 122.0, 203.0, 342.0, 609.0, 1686.0, 4201.0, 17952.0, 911409.0, 96681.0, 9688.0, 2832.0, 1227.0, 510.0, 257.0, 176.0, 126.0, 75.0, 39.0, 24.0, 32.0, 19.0, 21.0, 11.0, 3.0, 4.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0], "bins": [-2.2709369659423828e-05, -2.2037886083126068e-05, -2.1366402506828308e-05, -2.0694918930530548e-05, -2.0023435354232788e-05, -1.9351951777935028e-05, -1.8680468201637268e-05, -1.8008984625339508e-05, -1.7337501049041748e-05, -1.6666017472743988e-05, -1.5994533896446228e-05, -1.5323050320148468e-05, -1.4651566743850708e-05, -1.3980083167552948e-05, -1.3308599591255188e-05, -1.2637116014957428e-05, -1.1965632438659668e-05, -1.1294148862361908e-05, -1.0622665286064148e-05, -9.951181709766388e-06, -9.279698133468628e-06, -8.608214557170868e-06, -7.936730980873108e-06, -7.265247404575348e-06, -6.593763828277588e-06, -5.922280251979828e-06, -5.250796675682068e-06, -4.579313099384308e-06, -3.907829523086548e-06, -3.236345946788788e-06, -2.564862370491028e-06, -1.8933787941932678e-06, -1.2218952178955078e-06, -5.504116415977478e-07, 1.210719347000122e-07, 7.925555109977722e-07, 1.4640390872955322e-06, 2.1355226635932922e-06, 2.8070062398910522e-06, 3.4784898161888123e-06, 4.149973392486572e-06, 4.821456968784332e-06, 5.492940545082092e-06, 6.164424121379852e-06, 6.835907697677612e-06, 7.507391273975372e-06, 8.178874850273132e-06, 8.850358426570892e-06, 9.521842002868652e-06, 1.0193325579166412e-05, 1.0864809155464172e-05, 1.1536292731761932e-05, 1.2207776308059692e-05, 1.2879259884357452e-05, 1.3550743460655212e-05, 1.4222227036952972e-05, 1.4893710613250732e-05, 1.5565194189548492e-05, 1.6236677765846252e-05, 1.6908161342144012e-05, 1.7579644918441772e-05, 1.8251128494739532e-05, 1.8922612071037292e-05, 1.9594095647335052e-05, 2.0265579223632812e-05]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 2.0, 9.0, 10.0, 6.0, 10.0, 18.0, 15.0, 19.0, 15.0, 28.0, 44.0, 37.0, 40.0, 54.0, 48.0, 50.0, 49.0, 105.0, 60.0, 41.0, 55.0, 54.0, 33.0, 39.0, 25.0, 29.0, 15.0, 16.0, 13.0, 14.0, 6.0, 5.0, 7.0, 7.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.291534423828125e-06, -4.157423973083496e-06, -4.023313522338867e-06, -3.889203071594238e-06, -3.7550926208496094e-06, -3.6209821701049805e-06, -3.4868717193603516e-06, -3.3527612686157227e-06, -3.2186508178710938e-06, -3.084540367126465e-06, -2.950429916381836e-06, -2.816319465637207e-06, -2.682209014892578e-06, -2.5480985641479492e-06, -2.4139881134033203e-06, -2.2798776626586914e-06, -2.1457672119140625e-06, -2.0116567611694336e-06, -1.8775463104248047e-06, -1.7434358596801758e-06, -1.6093254089355469e-06, -1.475214958190918e-06, -1.341104507446289e-06, -1.2069940567016602e-06, -1.0728836059570312e-06, -9.387731552124023e-07, -8.046627044677734e-07, -6.705522537231445e-07, -5.364418029785156e-07, -4.023313522338867e-07, -2.682209014892578e-07, -1.341104507446289e-07, 0.0, 1.341104507446289e-07, 2.682209014892578e-07, 4.023313522338867e-07, 5.364418029785156e-07, 6.705522537231445e-07, 8.046627044677734e-07, 9.387731552124023e-07, 1.0728836059570312e-06, 1.2069940567016602e-06, 1.341104507446289e-06, 1.475214958190918e-06, 1.6093254089355469e-06, 1.7434358596801758e-06, 1.8775463104248047e-06, 2.0116567611694336e-06, 2.1457672119140625e-06, 2.2798776626586914e-06, 2.4139881134033203e-06, 2.5480985641479492e-06, 2.682209014892578e-06, 2.816319465637207e-06, 2.950429916381836e-06, 3.084540367126465e-06, 3.2186508178710938e-06, 3.3527612686157227e-06, 3.4868717193603516e-06, 3.6209821701049805e-06, 3.7550926208496094e-06, 3.889203071594238e-06, 4.023313522338867e-06, 4.157423973083496e-06, 4.291534423828125e-06]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 5.0, 8.0, 4.0, 4.0, 20.0, 16.0, 27.0, 41.0, 67.0, 90.0, 178.0, 569.0, 5291.0, 1038816.0, 2540.0, 412.0, 165.0, 91.0, 53.0, 40.0, 18.0, 17.0, 11.0, 13.0, 7.0, 7.0, 3.0, 3.0, 6.0, 9.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.0558319091796875e-05, -5.868915468454361e-05, -5.6819990277290344e-05, -5.495082587003708e-05, -5.3081661462783813e-05, -5.121249705553055e-05, -4.934333264827728e-05, -4.747416824102402e-05, -4.560500383377075e-05, -4.3735839426517487e-05, -4.186667501926422e-05, -3.9997510612010956e-05, -3.812834620475769e-05, -3.6259181797504425e-05, -3.439001739025116e-05, -3.2520852982997894e-05, -3.065168857574463e-05, -2.8782524168491364e-05, -2.6913359761238098e-05, -2.5044195353984833e-05, -2.3175030946731567e-05, -2.1305866539478302e-05, -1.9436702132225037e-05, -1.756753772497177e-05, -1.5698373317718506e-05, -1.382920891046524e-05, -1.1960044503211975e-05, -1.009088009595871e-05, -8.221715688705444e-06, -6.352551281452179e-06, -4.4833868741989136e-06, -2.614222466945648e-06, -7.450580596923828e-07, 1.1241063475608826e-06, 2.993270754814148e-06, 4.862435162067413e-06, 6.731599569320679e-06, 8.600763976573944e-06, 1.046992838382721e-05, 1.2339092791080475e-05, 1.420825719833374e-05, 1.6077421605587006e-05, 1.794658601284027e-05, 1.9815750420093536e-05, 2.1684914827346802e-05, 2.3554079234600067e-05, 2.5423243641853333e-05, 2.7292408049106598e-05, 2.9161572456359863e-05, 3.103073686361313e-05, 3.2899901270866394e-05, 3.476906567811966e-05, 3.6638230085372925e-05, 3.850739449262619e-05, 4.0376558899879456e-05, 4.224572330713272e-05, 4.4114887714385986e-05, 4.598405212163925e-05, 4.785321652889252e-05, 4.972238093614578e-05, 5.159154534339905e-05, 5.346070975065231e-05, 5.532987415790558e-05, 5.7199038565158844e-05, 5.906820297241211e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 5.0, 3.0, 4.0, 8.0, 5.0, 3.0, 21.0, 14.0, 23.0, 25.0, 36.0, 33.0, 47.0, 79.0, 104.0, 197.0, 95.0, 67.0, 45.0, 39.0, 22.0, 26.0, 11.0, 17.0, 11.0, 11.0, 7.0, 8.0, 5.0, 3.0, 5.0, 7.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.838539123535156e-05, -3.719702363014221e-05, -3.600865602493286e-05, -3.482028841972351e-05, -3.363192081451416e-05, -3.244355320930481e-05, -3.125518560409546e-05, -3.006681799888611e-05, -2.8878450393676758e-05, -2.7690082788467407e-05, -2.6501715183258057e-05, -2.5313347578048706e-05, -2.4124979972839355e-05, -2.2936612367630005e-05, -2.1748244762420654e-05, -2.0559877157211304e-05, -1.9371509552001953e-05, -1.8183141946792603e-05, -1.6994774341583252e-05, -1.58064067363739e-05, -1.461803913116455e-05, -1.34296715259552e-05, -1.224130392074585e-05, -1.1052936315536499e-05, -9.864568710327148e-06, -8.676201105117798e-06, -7.487833499908447e-06, -6.299465894699097e-06, -5.111098289489746e-06, -3.9227306842803955e-06, -2.734363079071045e-06, -1.5459954738616943e-06, -3.5762786865234375e-07, 8.307397365570068e-07, 2.0191073417663574e-06, 3.207474946975708e-06, 4.395842552185059e-06, 5.584210157394409e-06, 6.77257776260376e-06, 7.96094536781311e-06, 9.149312973022461e-06, 1.0337680578231812e-05, 1.1526048183441162e-05, 1.2714415788650513e-05, 1.3902783393859863e-05, 1.5091150999069214e-05, 1.6279518604278564e-05, 1.7467886209487915e-05, 1.8656253814697266e-05, 1.9844621419906616e-05, 2.1032989025115967e-05, 2.2221356630325317e-05, 2.3409724235534668e-05, 2.459809184074402e-05, 2.578645944595337e-05, 2.697482705116272e-05, 2.816319465637207e-05, 2.935156226158142e-05, 3.053992986679077e-05, 3.172829747200012e-05, 3.291666507720947e-05, 3.410503268241882e-05, 3.5293400287628174e-05, 3.6481767892837524e-05, 3.7670135498046875e-05]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 18.0, 851.0, 142.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08945082128047943, -0.07633531838655472, -0.06321981549263, -0.050104305148124695, -0.03698880225419998, -0.02387329936027527, -0.010757789015769958, 0.0023577138781547546, 0.015473216772079468, 0.02858872152864933, 0.04170422628521919, 0.054819732904434204, 0.06793523579835892, 0.08105073869228363, 0.09416624903678894, 0.10728175193071365, 0.12039725482463837, 0.13351276516914368, 0.1466282606124878, 0.1597437709569931, 0.1728592813014984, 0.18597477674484253, 0.19909028708934784, 0.21220579743385315, 0.22532129287719727, 0.23843680322170258, 0.2515523135662079, 0.264667809009552, 0.2777833044528961, 0.29089879989624023, 0.30401432514190674, 0.31712982058525085, 0.33024531602859497, 0.3433608114719391, 0.3564763367176056, 0.3695918321609497, 0.3827073276042938, 0.39582282304763794, 0.40893834829330444, 0.42205384373664856, 0.4351693391799927, 0.4482848346233368, 0.4614003598690033, 0.4745158553123474, 0.48763135075569153, 0.5007468461990356, 0.5138623714447021, 0.5269778966903687, 0.5400934219360352, 0.5532089471817017, 0.5663244128227234, 0.5794399380683899, 0.5925554633140564, 0.6056709289550781, 0.6187864542007446, 0.6319019794464111, 0.6450174450874329, 0.6581329703330994, 0.6712484359741211, 0.6843639612197876, 0.6974794864654541, 0.7105949521064758, 0.7237104773521423, 0.7368260025978088, 0.7499414682388306]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 8.0, 5.0, 8.0, 7.0, 18.0, 15.0, 11.0, 26.0, 21.0, 35.0, 31.0, 52.0, 50.0, 48.0, 61.0, 72.0, 68.0, 60.0, 69.0, 52.0, 53.0, 33.0, 42.0, 32.0, 27.0, 18.0, 18.0, 8.0, 15.0, 9.0, 7.0, 8.0, 9.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17363351583480835, -0.16735723614692688, -0.1610809564590454, -0.15480467677116394, -0.14852839708328247, -0.142252117395401, -0.13597583770751953, -0.12969955801963806, -0.12342328578233719, -0.11714700609445572, -0.11087072640657425, -0.10459445416927338, -0.0983181744813919, -0.09204189479351044, -0.08576561510562897, -0.0794893354177475, -0.07321305572986603, -0.06693677604198456, -0.06066049635410309, -0.05438422039151192, -0.04810794070363045, -0.04183166101574898, -0.035555385053157806, -0.029279105365276337, -0.023002825677394867, -0.016726545989513397, -0.010450268164277077, -0.004173990339040756, 0.0021022893488407135, 0.008378569036722183, 0.014654844999313354, 0.020931124687194824, 0.027207404375076294, 0.033483684062957764, 0.03975996375083923, 0.046036239713430405, 0.052312519401311874, 0.058588799089193344, 0.06486507505178452, 0.07114135473966599, 0.07741763442754745, 0.08369391411542892, 0.0899701938033104, 0.09624646604061127, 0.10252274572849274, 0.1087990254163742, 0.11507530510425568, 0.12135158479213715, 0.12762786448001862, 0.13390414416790009, 0.14018042385578156, 0.14645670354366302, 0.1527329832315445, 0.15900926291942596, 0.16528552770614624, 0.1715618073940277, 0.17783808708190918, 0.18411436676979065, 0.19039064645767212, 0.1966669261455536, 0.20294320583343506, 0.20921948552131653, 0.215495765209198, 0.22177204489707947, 0.22804832458496094]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 0.0, 4.0, 4.0, 4.0, 1.0, 8.0, 4.0, 1.0, 8.0, 11.0, 10.0, 25.0, 26.0, 31.0, 23.0, 19.0, 36.0, 54.0, 84.0, 111.0, 202.0, 309.0, 650.0, 2545.0, 4185075.0, 3494.0, 646.0, 329.0, 139.0, 125.0, 82.0, 68.0, 35.0, 27.0, 23.0, 15.0, 11.0, 15.0, 14.0, 4.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.348388671875, -0.3373374938964844, -0.32628631591796875, -0.3152351379394531, -0.3041839599609375, -0.2931327819824219, -0.28208160400390625, -0.2710304260253906, -0.259979248046875, -0.24892807006835938, -0.23787689208984375, -0.22682571411132812, -0.2157745361328125, -0.20472335815429688, -0.19367218017578125, -0.18262100219726562, -0.17156982421875, -0.16051864624023438, -0.14946746826171875, -0.13841629028320312, -0.1273651123046875, -0.11631393432617188, -0.10526275634765625, -0.09421157836914062, -0.083160400390625, -0.07210922241210938, -0.06105804443359375, -0.050006866455078125, -0.0389556884765625, -0.027904510498046875, -0.01685333251953125, -0.005802154541015625, 0.0052490234375, 0.016300201416015625, 0.02735137939453125, 0.038402557373046875, 0.0494537353515625, 0.060504913330078125, 0.07155609130859375, 0.08260726928710938, 0.093658447265625, 0.10470962524414062, 0.11576080322265625, 0.12681198120117188, 0.1378631591796875, 0.14891433715820312, 0.15996551513671875, 0.17101669311523438, 0.18206787109375, 0.19311904907226562, 0.20417022705078125, 0.21522140502929688, 0.2262725830078125, 0.23732376098632812, 0.24837493896484375, 0.2594261169433594, 0.270477294921875, 0.2815284729003906, 0.29257965087890625, 0.3036308288574219, 0.3146820068359375, 0.3257331848144531, 0.33678436279296875, 0.3478355407714844, 0.35888671875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 4.0, 3.0, 4.0, 3.0, 6.0, 16.0, 17.0, 17.0, 19.0, 118.0, 407.0, 233.0, 47.0, 22.0, 10.0, 8.0, 5.0, 14.0, 8.0, 5.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0193634033203125, -0.01875019073486328, -0.018136978149414062, -0.017523765563964844, -0.016910552978515625, -0.016297340393066406, -0.015684127807617188, -0.015070915222167969, -0.01445770263671875, -0.013844490051269531, -0.013231277465820312, -0.012618064880371094, -0.012004852294921875, -0.011391639709472656, -0.010778427124023438, -0.010165214538574219, -0.009552001953125, -0.008938789367675781, -0.008325576782226562, -0.007712364196777344, -0.007099151611328125, -0.006485939025878906, -0.0058727264404296875, -0.005259513854980469, -0.00464630126953125, -0.004033088684082031, -0.0034198760986328125, -0.0028066635131835938, -0.002193450927734375, -0.0015802383422851562, -0.0009670257568359375, -0.00035381317138671875, 0.0002593994140625, 0.0008726119995117188, 0.0014858245849609375, 0.0020990371704101562, 0.002712249755859375, 0.0033254623413085938, 0.0039386749267578125, 0.004551887512207031, 0.00516510009765625, 0.005778312683105469, 0.0063915252685546875, 0.007004737854003906, 0.007617950439453125, 0.008231163024902344, 0.008844375610351562, 0.009457588195800781, 0.01007080078125, 0.010684013366699219, 0.011297225952148438, 0.011910438537597656, 0.012523651123046875, 0.013136863708496094, 0.013750076293945312, 0.014363288879394531, 0.01497650146484375, 0.015589714050292969, 0.016202926635742188, 0.016816139221191406, 0.017429351806640625, 0.018042564392089844, 0.018655776977539062, 0.01926898956298828, 0.0198822021484375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 5.0, 8.0, 7.0, 5.0, 11.0, 11.0, 20.0, 17.0, 26.0, 29.0, 53.0, 91.0, 365.0, 6899.0, 4177356.0, 8592.0, 409.0, 126.0, 57.0, 48.0, 31.0, 16.0, 17.0, 16.0, 13.0, 11.0, 6.0, 7.0, 5.0, 1.0, 3.0, 2.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07476806640625, -0.07194995880126953, -0.06913185119628906, -0.0663137435913086, -0.06349563598632812, -0.060677528381347656, -0.05785942077636719, -0.05504131317138672, -0.05222320556640625, -0.04940509796142578, -0.04658699035644531, -0.043768882751464844, -0.040950775146484375, -0.038132667541503906, -0.03531455993652344, -0.03249645233154297, -0.0296783447265625, -0.02686023712158203, -0.024042129516601562, -0.021224021911621094, -0.018405914306640625, -0.015587806701660156, -0.012769699096679688, -0.009951591491699219, -0.00713348388671875, -0.004315376281738281, -0.0014972686767578125, 0.0013208389282226562, 0.004138946533203125, 0.006957054138183594, 0.009775161743164062, 0.012593269348144531, 0.015411376953125, 0.01822948455810547, 0.021047592163085938, 0.023865699768066406, 0.026683807373046875, 0.029501914978027344, 0.03232002258300781, 0.03513813018798828, 0.03795623779296875, 0.04077434539794922, 0.04359245300292969, 0.046410560607910156, 0.049228668212890625, 0.052046775817871094, 0.05486488342285156, 0.05768299102783203, 0.0605010986328125, 0.06331920623779297, 0.06613731384277344, 0.0689554214477539, 0.07177352905273438, 0.07459163665771484, 0.07740974426269531, 0.08022785186767578, 0.08304595947265625, 0.08586406707763672, 0.08868217468261719, 0.09150028228759766, 0.09431838989257812, 0.0971364974975586, 0.09995460510253906, 0.10277271270751953, 0.1055908203125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 6.0, 4.0, 4.0, 5.0, 14.0, 16.0, 24.0, 56.0, 170.0, 2866.0, 730.0, 94.0, 19.0, 12.0, 8.0, 3.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.033447265625, -0.03256368637084961, -0.03168010711669922, -0.030796527862548828, -0.029912948608398438, -0.029029369354248047, -0.028145790100097656, -0.027262210845947266, -0.026378631591796875, -0.025495052337646484, -0.024611473083496094, -0.023727893829345703, -0.022844314575195312, -0.021960735321044922, -0.02107715606689453, -0.02019357681274414, -0.01930999755859375, -0.01842641830444336, -0.01754283905029297, -0.016659259796142578, -0.015775680541992188, -0.014892101287841797, -0.014008522033691406, -0.013124942779541016, -0.012241363525390625, -0.011357784271240234, -0.010474205017089844, -0.009590625762939453, -0.008707046508789062, -0.007823467254638672, -0.006939888000488281, -0.006056308746337891, -0.0051727294921875, -0.004289150238037109, -0.0034055709838867188, -0.002521991729736328, -0.0016384124755859375, -0.0007548332214355469, 0.00012874603271484375, 0.0010123252868652344, 0.001895904541015625, 0.0027794837951660156, 0.0036630630493164062, 0.004546642303466797, 0.0054302215576171875, 0.006313800811767578, 0.007197380065917969, 0.00808095932006836, 0.00896453857421875, 0.00984811782836914, 0.010731697082519531, 0.011615276336669922, 0.012498855590820312, 0.013382434844970703, 0.014266014099121094, 0.015149593353271484, 0.016033172607421875, 0.016916751861572266, 0.017800331115722656, 0.018683910369873047, 0.019567489624023438, 0.020451068878173828, 0.02133464813232422, 0.02221822738647461, 0.023101806640625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 20.0, 998.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7024952173233032, -0.6819820404052734, -0.6614688038825989, -0.6409556269645691, -0.6204423904418945, -0.5999292135238647, -0.579416036605835, -0.5589028596878052, -0.5383896231651306, -0.5178764462471008, -0.49736320972442627, -0.4768500328063965, -0.4563368260860443, -0.43582361936569214, -0.41531044244766235, -0.3947972357273102, -0.374284029006958, -0.35377082228660583, -0.33325761556625366, -0.3127444386482239, -0.2922312319278717, -0.27171802520751953, -0.25120484828948975, -0.23069164156913757, -0.2101784348487854, -0.18966522812843323, -0.16915203630924225, -0.14863884449005127, -0.1281256377696991, -0.10761243849992752, -0.08709923923015594, -0.06658604741096497, -0.04607284069061279, -0.025559641420841217, -0.005046442151069641, 0.015466757118701935, 0.03597995638847351, 0.05649315565824509, 0.07700635492801666, 0.09751954674720764, 0.11803275346755981, 0.138545960187912, 0.15905915200710297, 0.17957234382629395, 0.20008555054664612, 0.2205987572669983, 0.24111194908618927, 0.26162514090538025, 0.2821383476257324, 0.3026515543460846, 0.32316476106643677, 0.34367793798446655, 0.3641911447048187, 0.3847043514251709, 0.4052175283432007, 0.42573073506355286, 0.44624394178390503, 0.4667571485042572, 0.4872703552246094, 0.5077835321426392, 0.528296709060669, 0.5488099455833435, 0.5693231225013733, 0.5898363590240479, 0.6103495359420776]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 6.0, 7.0, 13.0, 16.0, 13.0, 21.0, 33.0, 33.0, 37.0, 48.0, 60.0, 56.0, 46.0, 52.0, 58.0, 44.0, 50.0, 51.0, 62.0, 37.0, 51.0, 39.0, 35.0, 40.0, 22.0, 15.0, 13.0, 13.0, 9.0, 14.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09828883409500122, -0.09575214236974716, -0.0932154506444931, -0.09067875891923904, -0.08814206719398499, -0.08560537546873093, -0.08306868374347687, -0.08053199201822281, -0.07799530029296875, -0.07545860856771469, -0.07292191684246063, -0.07038522511720657, -0.06784853339195251, -0.06531184166669846, -0.0627751499414444, -0.06023845821619034, -0.05770176649093628, -0.05516507476568222, -0.05262838304042816, -0.0500916913151741, -0.047554999589920044, -0.045018307864665985, -0.042481616139411926, -0.03994492441415787, -0.03740823268890381, -0.03487154096364975, -0.03233484923839569, -0.029798157513141632, -0.027261465787887573, -0.024724774062633514, -0.022188082337379456, -0.019651390612125397, -0.017114698886871338, -0.014578007161617279, -0.01204131543636322, -0.009504623711109161, -0.0069679319858551025, -0.004431240260601044, -0.0018945485353469849, 0.000642143189907074, 0.003178834915161133, 0.005715526640415192, 0.00825221836566925, 0.01078891009092331, 0.013325601816177368, 0.015862293541431427, 0.018398985266685486, 0.020935676991939545, 0.023472368717193604, 0.026009060442447662, 0.02854575216770172, 0.03108244389295578, 0.03361913561820984, 0.0361558273434639, 0.03869251906871796, 0.041229210793972015, 0.043765902519226074, 0.04630259424448013, 0.04883928596973419, 0.05137597769498825, 0.05391266942024231, 0.05644936114549637, 0.05898605287075043, 0.061522744596004486, 0.06405943632125854]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 2.0, 6.0, 9.0, 9.0, 24.0, 19.0, 42.0, 33.0, 55.0, 68.0, 88.0, 118.0, 205.0, 255.0, 358.0, 507.0, 796.0, 1260.0, 2400.0, 5875.0, 27352.0, 977527.0, 20531.0, 4996.0, 2244.0, 1304.0, 815.0, 527.0, 314.0, 235.0, 156.0, 126.0, 60.0, 60.0, 42.0, 30.0, 25.0, 27.0, 10.0, 11.0, 11.0, 6.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0], "bins": [-0.1270751953125, -0.12315750122070312, -0.11923980712890625, -0.11532211303710938, -0.1114044189453125, -0.10748672485351562, -0.10356903076171875, -0.09965133666992188, -0.095733642578125, -0.09181594848632812, -0.08789825439453125, -0.08398056030273438, -0.0800628662109375, -0.07614517211914062, -0.07222747802734375, -0.06830978393554688, -0.06439208984375, -0.060474395751953125, -0.05655670166015625, -0.052639007568359375, -0.0487213134765625, -0.044803619384765625, -0.04088592529296875, -0.036968231201171875, -0.033050537109375, -0.029132843017578125, -0.02521514892578125, -0.021297454833984375, -0.0173797607421875, -0.013462066650390625, -0.00954437255859375, -0.005626678466796875, -0.001708984375, 0.002208709716796875, 0.00612640380859375, 0.010044097900390625, 0.0139617919921875, 0.017879486083984375, 0.02179718017578125, 0.025714874267578125, 0.029632568359375, 0.033550262451171875, 0.03746795654296875, 0.041385650634765625, 0.0453033447265625, 0.049221038818359375, 0.05313873291015625, 0.057056427001953125, 0.06097412109375, 0.06489181518554688, 0.06880950927734375, 0.07272720336914062, 0.0766448974609375, 0.08056259155273438, 0.08448028564453125, 0.08839797973632812, 0.092315673828125, 0.09623336791992188, 0.10015106201171875, 0.10406875610351562, 0.1079864501953125, 0.11190414428710938, 0.11582183837890625, 0.11973953247070312, 0.1236572265625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 16.0, 17.0, 16.0, 22.0, 122.0, 398.0, 238.0, 45.0, 23.0, 9.0, 8.0, 5.0, 14.0, 8.0, 5.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0193634033203125, -0.01875019073486328, -0.018136978149414062, -0.017523765563964844, -0.016910552978515625, -0.016297340393066406, -0.015684127807617188, -0.015070915222167969, -0.01445770263671875, -0.013844490051269531, -0.013231277465820312, -0.012618064880371094, -0.012004852294921875, -0.011391639709472656, -0.010778427124023438, -0.010165214538574219, -0.009552001953125, -0.008938789367675781, -0.008325576782226562, -0.007712364196777344, -0.007099151611328125, -0.006485939025878906, -0.0058727264404296875, -0.005259513854980469, -0.00464630126953125, -0.004033088684082031, -0.0034198760986328125, -0.0028066635131835938, -0.002193450927734375, -0.0015802383422851562, -0.0009670257568359375, -0.00035381317138671875, 0.0002593994140625, 0.0008726119995117188, 0.0014858245849609375, 0.0020990371704101562, 0.002712249755859375, 0.0033254623413085938, 0.0039386749267578125, 0.004551887512207031, 0.00516510009765625, 0.005778312683105469, 0.0063915252685546875, 0.007004737854003906, 0.007617950439453125, 0.008231163024902344, 0.008844375610351562, 0.009457588195800781, 0.01007080078125, 0.010684013366699219, 0.011297225952148438, 0.011910438537597656, 0.012523651123046875, 0.013136863708496094, 0.013750076293945312, 0.014363288879394531, 0.01497650146484375, 0.015589714050292969, 0.016202926635742188, 0.016816139221191406, 0.017429351806640625, 0.018042564392089844, 0.018655776977539062, 0.01926898956298828, 0.0198822021484375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 6.0, 8.0, 4.0, 13.0, 10.0, 17.0, 21.0, 26.0, 32.0, 43.0, 61.0, 53.0, 78.0, 89.0, 127.0, 143.0, 221.0, 355.0, 611.0, 1575.0, 76466.0, 963147.0, 3219.0, 793.0, 415.0, 243.0, 155.0, 122.0, 94.0, 97.0, 62.0, 50.0, 42.0, 37.0, 28.0, 16.0, 22.0, 14.0, 8.0, 7.0, 8.0, 2.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.09222412109375, -0.08960151672363281, -0.08697891235351562, -0.08435630798339844, -0.08173370361328125, -0.07911109924316406, -0.07648849487304688, -0.07386589050292969, -0.0712432861328125, -0.06862068176269531, -0.06599807739257812, -0.06337547302246094, -0.06075286865234375, -0.05813026428222656, -0.055507659912109375, -0.05288505554199219, -0.050262451171875, -0.04763984680175781, -0.045017242431640625, -0.04239463806152344, -0.03977203369140625, -0.03714942932128906, -0.034526824951171875, -0.03190422058105469, -0.0292816162109375, -0.026659011840820312, -0.024036407470703125, -0.021413803100585938, -0.01879119873046875, -0.016168594360351562, -0.013545989990234375, -0.010923385620117188, -0.00830078125, -0.0056781768798828125, -0.003055572509765625, -0.0004329681396484375, 0.00218963623046875, 0.0048122406005859375, 0.007434844970703125, 0.010057449340820312, 0.0126800537109375, 0.015302658081054688, 0.017925262451171875, 0.020547866821289062, 0.02317047119140625, 0.025793075561523438, 0.028415679931640625, 0.031038284301757812, 0.033660888671875, 0.03628349304199219, 0.038906097412109375, 0.04152870178222656, 0.04415130615234375, 0.04677391052246094, 0.049396514892578125, 0.05201911926269531, 0.0546417236328125, 0.05726432800292969, 0.059886932373046875, 0.06250953674316406, 0.06513214111328125, 0.06775474548339844, 0.07037734985351562, 0.07299995422363281, 0.07562255859375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 2.0, 7.0, 3.0, 10.0, 7.0, 11.0, 12.0, 16.0, 18.0, 20.0, 35.0, 16.0, 27.0, 25.0, 27.0, 29.0, 40.0, 43.0, 51.0, 49.0, 44.0, 48.0, 61.0, 39.0, 42.0, 39.0, 33.0, 30.0, 30.0, 30.0, 29.0, 17.0, 21.0, 21.0, 14.0, 11.0, 12.0, 7.0, 5.0, 5.0, 3.0, 2.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-0.03851318359375, -0.03741884231567383, -0.036324501037597656, -0.035230159759521484, -0.03413581848144531, -0.03304147720336914, -0.03194713592529297, -0.030852794647216797, -0.029758453369140625, -0.028664112091064453, -0.02756977081298828, -0.02647542953491211, -0.025381088256835938, -0.024286746978759766, -0.023192405700683594, -0.022098064422607422, -0.02100372314453125, -0.019909381866455078, -0.018815040588378906, -0.017720699310302734, -0.016626358032226562, -0.01553201675415039, -0.014437675476074219, -0.013343334197998047, -0.012248992919921875, -0.011154651641845703, -0.010060310363769531, -0.00896596908569336, -0.007871627807617188, -0.006777286529541016, -0.005682945251464844, -0.004588603973388672, -0.0034942626953125, -0.002399921417236328, -0.0013055801391601562, -0.00021123886108398438, 0.0008831024169921875, 0.0019774436950683594, 0.0030717849731445312, 0.004166126251220703, 0.005260467529296875, 0.006354808807373047, 0.007449150085449219, 0.00854349136352539, 0.009637832641601562, 0.010732173919677734, 0.011826515197753906, 0.012920856475830078, 0.01401519775390625, 0.015109539031982422, 0.016203880310058594, 0.017298221588134766, 0.018392562866210938, 0.01948690414428711, 0.02058124542236328, 0.021675586700439453, 0.022769927978515625, 0.023864269256591797, 0.02495861053466797, 0.02605295181274414, 0.027147293090820312, 0.028241634368896484, 0.029335975646972656, 0.030430316925048828, 0.031524658203125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 12.0, 13.0, 18.0, 24.0, 28.0, 48.0, 69.0, 138.0, 271.0, 570.0, 1549.0, 6624.0, 185614.0, 843126.0, 7508.0, 1697.0, 566.0, 275.0, 130.0, 88.0, 62.0, 37.0, 26.0, 14.0, 11.0, 9.0, 8.0, 5.0, 4.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002390146255493164, -0.0002313125878572464, -0.0002236105501651764, -0.00021590851247310638, -0.00020820647478103638, -0.00020050443708896637, -0.00019280239939689636, -0.00018510036170482635, -0.00017739832401275635, -0.00016969628632068634, -0.00016199424862861633, -0.00015429221093654633, -0.00014659017324447632, -0.0001388881355524063, -0.0001311860978603363, -0.0001234840601682663, -0.00011578202247619629, -0.00010807998478412628, -0.00010037794709205627, -9.267590939998627e-05, -8.497387170791626e-05, -7.727183401584625e-05, -6.956979632377625e-05, -6.186775863170624e-05, -5.416572093963623e-05, -4.646368324756622e-05, -3.8761645555496216e-05, -3.105960786342621e-05, -2.33575701713562e-05, -1.5655532479286194e-05, -7.953494787216187e-06, -2.514570951461792e-07, 7.450580596923828e-06, 1.5152618288993835e-05, 2.2854655981063843e-05, 3.055669367313385e-05, 3.825873136520386e-05, 4.5960769057273865e-05, 5.366280674934387e-05, 6.136484444141388e-05, 6.906688213348389e-05, 7.67689198255539e-05, 8.44709575176239e-05, 9.217299520969391e-05, 9.987503290176392e-05, 0.00010757707059383392, 0.00011527910828590393, 0.00012298114597797394, 0.00013068318367004395, 0.00013838522136211395, 0.00014608725905418396, 0.00015378929674625397, 0.00016149133443832397, 0.00016919337213039398, 0.000176895409822464, 0.000184597447514534, 0.000192299485206604, 0.000200001522898674, 0.00020770356059074402, 0.00021540559828281403, 0.00022310763597488403, 0.00023080967366695404, 0.00023851171135902405, 0.00024621374905109406, 0.00025391578674316406]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 7.0, 5.0, 8.0, 8.0, 11.0, 9.0, 20.0, 14.0, 26.0, 27.0, 45.0, 38.0, 76.0, 66.0, 112.0, 93.0, 81.0, 71.0, 57.0, 49.0, 36.0, 29.0, 32.0, 21.0, 16.0, 15.0, 9.0, 4.0, 5.0, 7.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.569789886474609e-06, -7.242895662784576e-06, -6.9160014390945435e-06, -6.5891072154045105e-06, -6.2622129917144775e-06, -5.935318768024445e-06, -5.608424544334412e-06, -5.281530320644379e-06, -4.954636096954346e-06, -4.627741873264313e-06, -4.30084764957428e-06, -3.973953425884247e-06, -3.647059202194214e-06, -3.320164978504181e-06, -2.993270754814148e-06, -2.666376531124115e-06, -2.339482307434082e-06, -2.012588083744049e-06, -1.6856938600540161e-06, -1.3587996363639832e-06, -1.0319054126739502e-06, -7.050111889839172e-07, -3.781169652938843e-07, -5.122274160385132e-08, 2.7567148208618164e-07, 6.025657057762146e-07, 9.294599294662476e-07, 1.2563541531562805e-06, 1.5832483768463135e-06, 1.9101426005363464e-06, 2.2370368242263794e-06, 2.5639310479164124e-06, 2.8908252716064453e-06, 3.2177194952964783e-06, 3.5446137189865112e-06, 3.871507942676544e-06, 4.198402166366577e-06, 4.52529639005661e-06, 4.852190613746643e-06, 5.179084837436676e-06, 5.505979061126709e-06, 5.832873284816742e-06, 6.159767508506775e-06, 6.486661732196808e-06, 6.813555955886841e-06, 7.140450179576874e-06, 7.467344403266907e-06, 7.79423862695694e-06, 8.121132850646973e-06, 8.448027074337006e-06, 8.774921298027039e-06, 9.101815521717072e-06, 9.428709745407104e-06, 9.755603969097137e-06, 1.008249819278717e-05, 1.0409392416477203e-05, 1.0736286640167236e-05, 1.106318086385727e-05, 1.1390075087547302e-05, 1.1716969311237335e-05, 1.2043863534927368e-05, 1.2370757758617401e-05, 1.2697651982307434e-05, 1.3024546205997467e-05, 1.33514404296875e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 6.0, 11.0, 5.0, 9.0, 14.0, 19.0, 29.0, 27.0, 52.0, 85.0, 139.0, 391.0, 2235.0, 1038831.0, 5708.0, 469.0, 190.0, 103.0, 63.0, 39.0, 28.0, 10.0, 14.0, 15.0, 11.0, 4.0, 4.0, 6.0, 4.0, 7.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003311634063720703, -0.000321313738822937, -0.0003114640712738037, -0.0003016144037246704, -0.0002917647361755371, -0.0002819150686264038, -0.0002720654010772705, -0.0002622157335281372, -0.0002523660659790039, -0.0002425163984298706, -0.0002326667308807373, -0.000222817063331604, -0.0002129673957824707, -0.0002031177282333374, -0.0001932680606842041, -0.0001834183931350708, -0.0001735687255859375, -0.0001637190580368042, -0.0001538693904876709, -0.0001440197229385376, -0.0001341700553894043, -0.000124320387840271, -0.0001144707202911377, -0.0001046210527420044, -9.47713851928711e-05, -8.492171764373779e-05, -7.507205009460449e-05, -6.522238254547119e-05, -5.537271499633789e-05, -4.552304744720459e-05, -3.567337989807129e-05, -2.5823712348937988e-05, -1.5974044799804688e-05, -6.124377250671387e-06, 3.725290298461914e-06, 1.3574957847595215e-05, 2.3424625396728516e-05, 3.3274292945861816e-05, 4.312396049499512e-05, 5.297362804412842e-05, 6.282329559326172e-05, 7.267296314239502e-05, 8.252263069152832e-05, 9.237229824066162e-05, 0.00010222196578979492, 0.00011207163333892822, 0.00012192130088806152, 0.00013177096843719482, 0.00014162063598632812, 0.00015147030353546143, 0.00016131997108459473, 0.00017116963863372803, 0.00018101930618286133, 0.00019086897373199463, 0.00020071864128112793, 0.00021056830883026123, 0.00022041797637939453, 0.00023026764392852783, 0.00024011731147766113, 0.00024996697902679443, 0.00025981664657592773, 0.00026966631412506104, 0.00027951598167419434, 0.00028936564922332764, 0.00029921531677246094]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 8.0, 7.0, 10.0, 10.0, 12.0, 20.0, 40.0, 79.0, 127.0, 298.0, 160.0, 77.0, 45.0, 25.0, 16.0, 12.0, 8.0, 2.0, 8.0, 5.0, 5.0, 4.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001385211944580078, -0.00013440102338790894, -0.00013028085231781006, -0.00012616068124771118, -0.0001220405101776123, -0.00011792033910751343, -0.00011380016803741455, -0.00010967999696731567, -0.0001055598258972168, -0.00010143965482711792, -9.731948375701904e-05, -9.319931268692017e-05, -8.907914161682129e-05, -8.495897054672241e-05, -8.083879947662354e-05, -7.671862840652466e-05, -7.259845733642578e-05, -6.84782862663269e-05, -6.435811519622803e-05, -6.023794412612915e-05, -5.6117773056030273e-05, -5.1997601985931396e-05, -4.787743091583252e-05, -4.375725984573364e-05, -3.9637088775634766e-05, -3.551691770553589e-05, -3.139674663543701e-05, -2.7276575565338135e-05, -2.3156404495239258e-05, -1.903623342514038e-05, -1.4916062355041504e-05, -1.0795891284942627e-05, -6.67572021484375e-06, -2.555549144744873e-06, 1.564621925354004e-06, 5.684792995452881e-06, 9.804964065551758e-06, 1.3925135135650635e-05, 1.8045306205749512e-05, 2.216547727584839e-05, 2.6285648345947266e-05, 3.0405819416046143e-05, 3.452599048614502e-05, 3.8646161556243896e-05, 4.2766332626342773e-05, 4.688650369644165e-05, 5.100667476654053e-05, 5.5126845836639404e-05, 5.924701690673828e-05, 6.336718797683716e-05, 6.748735904693604e-05, 7.160753011703491e-05, 7.572770118713379e-05, 7.984787225723267e-05, 8.396804332733154e-05, 8.808821439743042e-05, 9.22083854675293e-05, 9.632855653762817e-05, 0.00010044872760772705, 0.00010456889867782593, 0.0001086890697479248, 0.00011280924081802368, 0.00011692941188812256, 0.00012104958295822144, 0.0001251697540283203]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 29.0, 970.0, 16.0], "bins": [-1.6110010147094727, -1.5852724313735962, -1.5595438480377197, -1.5338152647018433, -1.5080865621566772, -1.4823579788208008, -1.4566293954849243, -1.4309008121490479, -1.4051722288131714, -1.379443645477295, -1.3537150621414185, -1.327986478805542, -1.302257776260376, -1.2765291929244995, -1.250800609588623, -1.2250720262527466, -1.1993434429168701, -1.1736148595809937, -1.1478862762451172, -1.1221576929092407, -1.0964289903640747, -1.0707004070281982, -1.0449718236923218, -1.0192432403564453, -0.9935145974159241, -0.9677860140800476, -0.9420573711395264, -0.9163287878036499, -0.8906002044677734, -0.864871621131897, -0.8391429781913757, -0.8134143948554993, -0.7876858711242676, -0.7619572877883911, -0.7362286448478699, -0.7105000615119934, -0.6847714781761169, -0.6590428352355957, -0.6333142518997192, -0.6075856685638428, -0.5818570256233215, -0.5561284422874451, -0.5303997993469238, -0.5046712160110474, -0.4789426326751709, -0.45321401953697205, -0.4274854063987732, -0.40175682306289673, -0.37602823972702026, -0.3502996265888214, -0.32457104325294495, -0.2988424301147461, -0.27311384677886963, -0.24738523364067078, -0.22165663540363312, -0.19592803716659546, -0.1701994389295578, -0.14447084069252014, -0.11874224245548248, -0.09301363676786423, -0.06728503853082657, -0.04155643284320831, -0.015827834606170654, 0.009900763630867004, 0.03562936186790466]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 4.0, 5.0, 5.0, 6.0, 8.0, 12.0, 13.0, 13.0, 14.0, 26.0, 31.0, 29.0, 34.0, 50.0, 42.0, 51.0, 49.0, 59.0, 46.0, 51.0, 57.0, 50.0, 43.0, 42.0, 39.0, 39.0, 32.0, 23.0, 21.0, 20.0, 15.0, 14.0, 12.0, 12.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14257240295410156, -0.13748376071453094, -0.13239511847496033, -0.1273064762353897, -0.12221783399581909, -0.11712919175624847, -0.11204054951667786, -0.10695190727710724, -0.10186326503753662, -0.096774622797966, -0.09168598055839539, -0.08659733831882477, -0.08150869607925415, -0.07642005383968353, -0.07133141160011292, -0.0662427693605423, -0.06115412712097168, -0.05606548488140106, -0.050976842641830444, -0.04588820040225983, -0.04079955816268921, -0.03571091592311859, -0.030622273683547974, -0.025533631443977356, -0.02044498920440674, -0.01535634696483612, -0.010267704725265503, -0.005179062485694885, -9.042024612426758e-05, 0.00499822199344635, 0.010086864233016968, 0.015175506472587585, 0.020264148712158203, 0.02535279095172882, 0.03044143319129944, 0.035530075430870056, 0.040618717670440674, 0.04570735991001129, 0.05079600214958191, 0.05588464438915253, 0.060973286628723145, 0.06606192886829376, 0.07115057110786438, 0.076239213347435, 0.08132785558700562, 0.08641649782657623, 0.09150514006614685, 0.09659378230571747, 0.10168242454528809, 0.1067710667848587, 0.11185970902442932, 0.11694835126399994, 0.12203699350357056, 0.12712563574314117, 0.1322142779827118, 0.1373029202222824, 0.14239156246185303, 0.14748020470142365, 0.15256884694099426, 0.15765748918056488, 0.1627461314201355, 0.16783477365970612, 0.17292341589927673, 0.17801205813884735, 0.18310070037841797]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 4.0, 2.0, 5.0, 6.0, 11.0, 11.0, 7.0, 7.0, 13.0, 22.0, 28.0, 38.0, 66.0, 142.0, 1198.0, 4191849.0, 554.0, 102.0, 57.0, 31.0, 27.0, 22.0, 16.0, 13.0, 13.0, 5.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.85546875, -6.63677978515625, -6.4180908203125, -6.19940185546875, -5.980712890625, -5.76202392578125, -5.5433349609375, -5.32464599609375, -5.10595703125, -4.88726806640625, -4.6685791015625, -4.44989013671875, -4.231201171875, -4.01251220703125, -3.7938232421875, -3.57513427734375, -3.3564453125, -3.13775634765625, -2.9190673828125, -2.70037841796875, -2.481689453125, -2.26300048828125, -2.0443115234375, -1.82562255859375, -1.60693359375, -1.38824462890625, -1.1695556640625, -0.95086669921875, -0.732177734375, -0.51348876953125, -0.2947998046875, -0.07611083984375, 0.142578125, 0.36126708984375, 0.5799560546875, 0.79864501953125, 1.017333984375, 1.23602294921875, 1.4547119140625, 1.67340087890625, 1.89208984375, 2.11077880859375, 2.3294677734375, 2.54815673828125, 2.766845703125, 2.98553466796875, 3.2042236328125, 3.42291259765625, 3.6416015625, 3.86029052734375, 4.0789794921875, 4.29766845703125, 4.516357421875, 4.73504638671875, 4.9537353515625, 5.17242431640625, 5.39111328125, 5.60980224609375, 5.8284912109375, 6.04718017578125, 6.265869140625, 6.48455810546875, 6.7032470703125, 6.92193603515625, 7.140625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 16.0, 17.0, 15.0, 20.0, 122.0, 407.0, 234.0, 43.0, 23.0, 9.0, 8.0, 6.0, 13.0, 8.0, 5.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0193634033203125, -0.01875019073486328, -0.018136978149414062, -0.017523765563964844, -0.016910552978515625, -0.016297340393066406, -0.015684127807617188, -0.015070915222167969, -0.01445770263671875, -0.013844490051269531, -0.013231277465820312, -0.012618064880371094, -0.012004852294921875, -0.011391639709472656, -0.010778427124023438, -0.010165214538574219, -0.009552001953125, -0.008938789367675781, -0.008325576782226562, -0.007712364196777344, -0.007099151611328125, -0.006485939025878906, -0.0058727264404296875, -0.005259513854980469, -0.00464630126953125, -0.004033088684082031, -0.0034198760986328125, -0.0028066635131835938, -0.002193450927734375, -0.0015802383422851562, -0.0009670257568359375, -0.00035381317138671875, 0.0002593994140625, 0.0008726119995117188, 0.0014858245849609375, 0.0020990371704101562, 0.002712249755859375, 0.0033254623413085938, 0.0039386749267578125, 0.004551887512207031, 0.00516510009765625, 0.005778312683105469, 0.0063915252685546875, 0.007004737854003906, 0.007617950439453125, 0.008231163024902344, 0.008844375610351562, 0.009457588195800781, 0.01007080078125, 0.010684013366699219, 0.011297225952148438, 0.011910438537597656, 0.012523651123046875, 0.013136863708496094, 0.013750076293945312, 0.014363288879394531, 0.01497650146484375, 0.015589714050292969, 0.016202926635742188, 0.016816139221191406, 0.017429351806640625, 0.018042564392089844, 0.018655776977539062, 0.01926898956298828, 0.0198822021484375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 5.0, 8.0, 6.0, 8.0, 13.0, 26.0, 46.0, 77.0, 125.0, 308.0, 697.0, 2257.0, 14334.0, 4165774.0, 7808.0, 1713.0, 553.0, 237.0, 127.0, 57.0, 39.0, 24.0, 7.0, 10.0, 3.0, 8.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.123779296875, -0.11995601654052734, -0.11613273620605469, -0.11230945587158203, -0.10848617553710938, -0.10466289520263672, -0.10083961486816406, -0.0970163345336914, -0.09319305419921875, -0.0893697738647461, -0.08554649353027344, -0.08172321319580078, -0.07789993286132812, -0.07407665252685547, -0.07025337219238281, -0.06643009185791016, -0.0626068115234375, -0.058783531188964844, -0.05496025085449219, -0.05113697052001953, -0.047313690185546875, -0.04349040985107422, -0.03966712951660156, -0.035843849182128906, -0.03202056884765625, -0.028197288513183594, -0.024374008178710938, -0.02055072784423828, -0.016727447509765625, -0.012904167175292969, -0.009080886840820312, -0.005257606506347656, -0.001434326171875, 0.0023889541625976562, 0.0062122344970703125, 0.010035514831542969, 0.013858795166015625, 0.01768207550048828, 0.021505355834960938, 0.025328636169433594, 0.02915191650390625, 0.032975196838378906, 0.03679847717285156, 0.04062175750732422, 0.044445037841796875, 0.04826831817626953, 0.05209159851074219, 0.055914878845214844, 0.0597381591796875, 0.06356143951416016, 0.06738471984863281, 0.07120800018310547, 0.07503128051757812, 0.07885456085205078, 0.08267784118652344, 0.0865011215209961, 0.09032440185546875, 0.0941476821899414, 0.09797096252441406, 0.10179424285888672, 0.10561752319335938, 0.10944080352783203, 0.11326408386230469, 0.11708736419677734, 0.12091064453125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 8.0, 40.0, 759.0, 3171.0, 41.0, 15.0, 3.0, 6.0, 5.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03204345703125, -0.031073331832885742, -0.030103206634521484, -0.029133081436157227, -0.02816295623779297, -0.02719283103942871, -0.026222705841064453, -0.025252580642700195, -0.024282455444335938, -0.02331233024597168, -0.022342205047607422, -0.021372079849243164, -0.020401954650878906, -0.01943182945251465, -0.01846170425415039, -0.017491579055786133, -0.016521453857421875, -0.015551328659057617, -0.01458120346069336, -0.013611078262329102, -0.012640953063964844, -0.011670827865600586, -0.010700702667236328, -0.00973057746887207, -0.008760452270507812, -0.007790327072143555, -0.006820201873779297, -0.005850076675415039, -0.004879951477050781, -0.0039098262786865234, -0.0029397010803222656, -0.001969575881958008, -0.00099945068359375, -2.9325485229492188e-05, 0.0009407997131347656, 0.0019109249114990234, 0.0028810501098632812, 0.003851175308227539, 0.004821300506591797, 0.005791425704956055, 0.0067615509033203125, 0.00773167610168457, 0.008701801300048828, 0.009671926498413086, 0.010642051696777344, 0.011612176895141602, 0.01258230209350586, 0.013552427291870117, 0.014522552490234375, 0.015492677688598633, 0.01646280288696289, 0.01743292808532715, 0.018403053283691406, 0.019373178482055664, 0.020343303680419922, 0.02131342887878418, 0.022283554077148438, 0.023253679275512695, 0.024223804473876953, 0.02519392967224121, 0.02616405487060547, 0.027134180068969727, 0.028104305267333984, 0.029074430465698242, 0.0300445556640625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 9.0, 199.0, 550.0, 117.0, 57.0, 25.0, 15.0, 10.0, 8.0, 9.0, 6.0, 1.0, 6.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07240816950798035, -0.062193647027015686, -0.051979128271341324, -0.04176460951566696, -0.0315500870347023, -0.02133556455373764, -0.011121045798063278, -0.000906527042388916, 0.009307995438575745, 0.019522516056895256, 0.029737036675214767, 0.03995155543088913, 0.05016607791185379, 0.06038060039281845, 0.07059511542320251, 0.08080963790416718, 0.09102416038513184, 0.1012386828660965, 0.11145320534706116, 0.12166772037744522, 0.13188225030899048, 0.14209675788879395, 0.1523112803697586, 0.16252580285072327, 0.17274032533168793, 0.1829548478126526, 0.19316937029361725, 0.2033838927745819, 0.21359840035438538, 0.22381293773651123, 0.2340274453163147, 0.24424196779727936, 0.25445646047592163, 0.2646709680557251, 0.27488550543785095, 0.2851000130176544, 0.2953145503997803, 0.30552905797958374, 0.3157435953617096, 0.32595810294151306, 0.3361726403236389, 0.3463871479034424, 0.35660168528556824, 0.3668161928653717, 0.37703073024749756, 0.387245237827301, 0.3974597752094269, 0.40767428278923035, 0.4178887903690338, 0.4281032979488373, 0.43831783533096313, 0.4485323429107666, 0.45874688029289246, 0.4689613878726959, 0.4791759252548218, 0.48939043283462524, 0.4996049404144287, 0.5098194479942322, 0.5200339555740356, 0.5302485227584839, 0.5404630303382874, 0.5506775379180908, 0.5608920454978943, 0.5711065530776978, 0.581321120262146]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 5.0, 3.0, 3.0, 6.0, 6.0, 11.0, 7.0, 10.0, 17.0, 11.0, 21.0, 28.0, 40.0, 32.0, 28.0, 37.0, 48.0, 51.0, 60.0, 67.0, 70.0, 63.0, 49.0, 48.0, 53.0, 41.0, 32.0, 28.0, 24.0, 14.0, 27.0, 13.0, 11.0, 4.0, 9.0, 10.0, 4.0, 5.0, 1.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07161343097686768, -0.06956803798675537, -0.06752265244722366, -0.06547726690769196, -0.06343187391757965, -0.061386484652757645, -0.05934109538793564, -0.05729570612311363, -0.055250316858291626, -0.05320492759346962, -0.051159538328647614, -0.04911414906382561, -0.0470687597990036, -0.045023370534181595, -0.04297798126935959, -0.04093259200453758, -0.038887202739715576, -0.03684181347489357, -0.034796424210071564, -0.03275103494524956, -0.03070564568042755, -0.028660256415605545, -0.02661486715078354, -0.024569477885961533, -0.022524088621139526, -0.02047869935631752, -0.018433310091495514, -0.016387920826673508, -0.014342531561851501, -0.012297142297029495, -0.010251753032207489, -0.008206363767385483, -0.0061609745025634766, -0.00411558523774147, -0.002070195972919464, -2.4806708097457886e-05, 0.0020205825567245483, 0.0040659718215465546, 0.006111361086368561, 0.008156750351190567, 0.010202139616012573, 0.01224752888083458, 0.014292918145656586, 0.016338307410478592, 0.018383696675300598, 0.020429085940122604, 0.02247447520494461, 0.024519864469766617, 0.026565253734588623, 0.02861064299941063, 0.030656032264232635, 0.03270142152905464, 0.03474681079387665, 0.036792200058698654, 0.03883758932352066, 0.04088297858834267, 0.04292836785316467, 0.04497375711798668, 0.047019146382808685, 0.04906453564763069, 0.0511099249124527, 0.053155314177274704, 0.05520070344209671, 0.057246092706918716, 0.05929148197174072]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 5.0, 5.0, 2.0, 7.0, 7.0, 14.0, 19.0, 37.0, 76.0, 121.0, 258.0, 517.0, 1114.0, 3099.0, 13235.0, 972705.0, 48272.0, 5960.0, 1690.0, 673.0, 276.0, 176.0, 110.0, 52.0, 35.0, 27.0, 15.0, 17.0, 13.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1387939453125, -0.13442230224609375, -0.1300506591796875, -0.12567901611328125, -0.121307373046875, -0.11693572998046875, -0.1125640869140625, -0.10819244384765625, -0.10382080078125, -0.09944915771484375, -0.0950775146484375, -0.09070587158203125, -0.086334228515625, -0.08196258544921875, -0.0775909423828125, -0.07321929931640625, -0.06884765625, -0.06447601318359375, -0.0601043701171875, -0.05573272705078125, -0.051361083984375, -0.04698944091796875, -0.0426177978515625, -0.03824615478515625, -0.03387451171875, -0.02950286865234375, -0.0251312255859375, -0.02075958251953125, -0.016387939453125, -0.01201629638671875, -0.0076446533203125, -0.00327301025390625, 0.0010986328125, 0.00547027587890625, 0.0098419189453125, 0.01421356201171875, 0.018585205078125, 0.02295684814453125, 0.0273284912109375, 0.03170013427734375, 0.03607177734375, 0.04044342041015625, 0.0448150634765625, 0.04918670654296875, 0.053558349609375, 0.05792999267578125, 0.0623016357421875, 0.06667327880859375, 0.071044921875, 0.07541656494140625, 0.0797882080078125, 0.08415985107421875, 0.088531494140625, 0.09290313720703125, 0.0972747802734375, 0.10164642333984375, 0.10601806640625, 0.11038970947265625, 0.1147613525390625, 0.11913299560546875, 0.123504638671875, 0.12787628173828125, 0.1322479248046875, 0.13661956787109375, 0.1409912109375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 4.0, 4.0, 3.0, 2.0, 9.0, 12.0, 15.0, 17.0, 27.0, 109.0, 363.0, 248.0, 80.0, 22.0, 10.0, 7.0, 5.0, 12.0, 10.0, 7.0, 4.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019256591796875, -0.018648624420166016, -0.01804065704345703, -0.017432689666748047, -0.016824722290039062, -0.016216754913330078, -0.015608787536621094, -0.01500082015991211, -0.014392852783203125, -0.01378488540649414, -0.013176918029785156, -0.012568950653076172, -0.011960983276367188, -0.011353015899658203, -0.010745048522949219, -0.010137081146240234, -0.00952911376953125, -0.008921146392822266, -0.008313179016113281, -0.007705211639404297, -0.0070972442626953125, -0.006489276885986328, -0.005881309509277344, -0.005273342132568359, -0.004665374755859375, -0.004057407379150391, -0.0034494400024414062, -0.002841472625732422, -0.0022335052490234375, -0.0016255378723144531, -0.0010175704956054688, -0.0004096031188964844, 0.0001983642578125, 0.0008063316345214844, 0.0014142990112304688, 0.002022266387939453, 0.0026302337646484375, 0.003238201141357422, 0.0038461685180664062, 0.004454135894775391, 0.005062103271484375, 0.005670070648193359, 0.006278038024902344, 0.006886005401611328, 0.0074939727783203125, 0.008101940155029297, 0.008709907531738281, 0.009317874908447266, 0.00992584228515625, 0.010533809661865234, 0.011141777038574219, 0.011749744415283203, 0.012357711791992188, 0.012965679168701172, 0.013573646545410156, 0.01418161392211914, 0.014789581298828125, 0.01539754867553711, 0.016005516052246094, 0.016613483428955078, 0.017221450805664062, 0.017829418182373047, 0.01843738555908203, 0.019045352935791016, 0.0196533203125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 5.0, 5.0, 7.0, 4.0, 16.0, 22.0, 21.0, 21.0, 48.0, 60.0, 66.0, 90.0, 147.0, 222.0, 331.0, 556.0, 904.0, 1862.0, 4268.0, 12179.0, 50620.0, 604855.0, 316746.0, 38003.0, 9960.0, 3596.0, 1607.0, 841.0, 432.0, 310.0, 228.0, 147.0, 86.0, 66.0, 54.0, 53.0, 25.0, 24.0, 18.0, 8.0, 6.0, 12.0, 9.0, 4.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0], "bins": [-0.053375244140625, -0.05188894271850586, -0.05040264129638672, -0.04891633987426758, -0.04743003845214844, -0.0459437370300293, -0.044457435607910156, -0.042971134185791016, -0.041484832763671875, -0.039998531341552734, -0.038512229919433594, -0.03702592849731445, -0.03553962707519531, -0.03405332565307617, -0.03256702423095703, -0.03108072280883789, -0.02959442138671875, -0.02810811996459961, -0.02662181854248047, -0.025135517120361328, -0.023649215698242188, -0.022162914276123047, -0.020676612854003906, -0.019190311431884766, -0.017704010009765625, -0.016217708587646484, -0.014731407165527344, -0.013245105743408203, -0.011758804321289062, -0.010272502899169922, -0.008786201477050781, -0.007299900054931641, -0.0058135986328125, -0.004327297210693359, -0.0028409957885742188, -0.0013546943664550781, 0.0001316070556640625, 0.0016179084777832031, 0.0031042098999023438, 0.004590511322021484, 0.006076812744140625, 0.007563114166259766, 0.009049415588378906, 0.010535717010498047, 0.012022018432617188, 0.013508319854736328, 0.014994621276855469, 0.01648092269897461, 0.01796722412109375, 0.01945352554321289, 0.02093982696533203, 0.022426128387451172, 0.023912429809570312, 0.025398731231689453, 0.026885032653808594, 0.028371334075927734, 0.029857635498046875, 0.031343936920166016, 0.032830238342285156, 0.0343165397644043, 0.03580284118652344, 0.03728914260864258, 0.03877544403076172, 0.04026174545288086, 0.041748046875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 4.0, 7.0, 7.0, 10.0, 15.0, 10.0, 11.0, 17.0, 18.0, 25.0, 34.0, 24.0, 41.0, 42.0, 39.0, 46.0, 56.0, 48.0, 52.0, 52.0, 48.0, 35.0, 38.0, 38.0, 31.0, 33.0, 35.0, 31.0, 25.0, 22.0, 23.0, 14.0, 11.0, 7.0, 13.0, 9.0, 6.0, 3.0, 5.0, 2.0, 5.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.038726806640625, -0.03764986991882324, -0.036572933197021484, -0.03549599647521973, -0.03441905975341797, -0.03334212303161621, -0.03226518630981445, -0.031188249588012695, -0.030111312866210938, -0.02903437614440918, -0.027957439422607422, -0.026880502700805664, -0.025803565979003906, -0.02472662925720215, -0.02364969253540039, -0.022572755813598633, -0.021495819091796875, -0.020418882369995117, -0.01934194564819336, -0.0182650089263916, -0.017188072204589844, -0.016111135482788086, -0.015034198760986328, -0.01395726203918457, -0.012880325317382812, -0.011803388595581055, -0.010726451873779297, -0.009649515151977539, -0.008572578430175781, -0.0074956417083740234, -0.006418704986572266, -0.005341768264770508, -0.00426483154296875, -0.003187894821166992, -0.0021109580993652344, -0.0010340213775634766, 4.291534423828125e-05, 0.001119852066040039, 0.002196788787841797, 0.0032737255096435547, 0.0043506622314453125, 0.00542759895324707, 0.006504535675048828, 0.007581472396850586, 0.008658409118652344, 0.009735345840454102, 0.01081228256225586, 0.011889219284057617, 0.012966156005859375, 0.014043092727661133, 0.01512002944946289, 0.01619696617126465, 0.017273902893066406, 0.018350839614868164, 0.019427776336669922, 0.02050471305847168, 0.021581649780273438, 0.022658586502075195, 0.023735523223876953, 0.02481245994567871, 0.02588939666748047, 0.026966333389282227, 0.028043270111083984, 0.029120206832885742, 0.0301971435546875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 4.0, 4.0, 6.0, 4.0, 16.0, 19.0, 26.0, 39.0, 41.0, 50.0, 82.0, 118.0, 226.0, 392.0, 630.0, 1185.0, 2633.0, 6712.0, 41891.0, 965899.0, 19262.0, 4921.0, 2073.0, 1001.0, 454.0, 280.0, 172.0, 124.0, 83.0, 62.0, 35.0, 26.0, 18.0, 14.0, 15.0, 12.0, 9.0, 8.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01226806640625, -0.011835336685180664, -0.011402606964111328, -0.010969877243041992, -0.010537147521972656, -0.01010441780090332, -0.009671688079833984, -0.009238958358764648, -0.008806228637695312, -0.008373498916625977, -0.00794076919555664, -0.007508039474487305, -0.007075309753417969, -0.006642580032348633, -0.006209850311279297, -0.005777120590209961, -0.005344390869140625, -0.004911661148071289, -0.004478931427001953, -0.004046201705932617, -0.0036134719848632812, -0.0031807422637939453, -0.0027480125427246094, -0.0023152828216552734, -0.0018825531005859375, -0.0014498233795166016, -0.0010170936584472656, -0.0005843639373779297, -0.00015163421630859375, 0.0002810955047607422, 0.0007138252258300781, 0.001146554946899414, 0.00157928466796875, 0.002012014389038086, 0.002444744110107422, 0.002877473831176758, 0.0033102035522460938, 0.0037429332733154297, 0.004175662994384766, 0.0046083927154541016, 0.0050411224365234375, 0.0054738521575927734, 0.005906581878662109, 0.006339311599731445, 0.006772041320800781, 0.007204771041870117, 0.007637500762939453, 0.008070230484008789, 0.008502960205078125, 0.008935689926147461, 0.009368419647216797, 0.009801149368286133, 0.010233879089355469, 0.010666608810424805, 0.01109933853149414, 0.011532068252563477, 0.011964797973632812, 0.012397527694702148, 0.012830257415771484, 0.01326298713684082, 0.013695716857910156, 0.014128446578979492, 0.014561176300048828, 0.014993906021118164, 0.0154266357421875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 4.0, 2.0, 14.0, 24.0, 48.0, 65.0, 114.0, 147.0, 171.0, 138.0, 87.0, 83.0, 36.0, 15.0, 9.0, 6.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3053417205810547e-05, -1.2650154531002045e-05, -1.2246891856193542e-05, -1.184362918138504e-05, -1.1440366506576538e-05, -1.1037103831768036e-05, -1.0633841156959534e-05, -1.0230578482151031e-05, -9.82731580734253e-06, -9.424053132534027e-06, -9.020790457725525e-06, -8.617527782917023e-06, -8.21426510810852e-06, -7.811002433300018e-06, -7.407739758491516e-06, -7.004477083683014e-06, -6.601214408874512e-06, -6.1979517340660095e-06, -5.794689059257507e-06, -5.391426384449005e-06, -4.988163709640503e-06, -4.584901034832001e-06, -4.1816383600234985e-06, -3.7783756852149963e-06, -3.375113010406494e-06, -2.971850335597992e-06, -2.5685876607894897e-06, -2.1653249859809875e-06, -1.7620623111724854e-06, -1.3587996363639832e-06, -9.55536961555481e-07, -5.522742867469788e-07, -1.4901161193847656e-07, 2.5425106287002563e-07, 6.575137376785278e-07, 1.06077641248703e-06, 1.4640390872955322e-06, 1.8673017621040344e-06, 2.2705644369125366e-06, 2.673827111721039e-06, 3.077089786529541e-06, 3.4803524613380432e-06, 3.883615136146545e-06, 4.286877810955048e-06, 4.69014048576355e-06, 5.093403160572052e-06, 5.496665835380554e-06, 5.899928510189056e-06, 6.303191184997559e-06, 6.706453859806061e-06, 7.109716534614563e-06, 7.512979209423065e-06, 7.916241884231567e-06, 8.31950455904007e-06, 8.722767233848572e-06, 9.126029908657074e-06, 9.529292583465576e-06, 9.932555258274078e-06, 1.033581793308258e-05, 1.0739080607891083e-05, 1.1142343282699585e-05, 1.1545605957508087e-05, 1.194886863231659e-05, 1.2352131307125092e-05, 1.2755393981933594e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 9.0, 7.0, 10.0, 4.0, 21.0, 19.0, 25.0, 28.0, 48.0, 87.0, 124.0, 172.0, 288.0, 557.0, 1148.0, 2920.0, 10164.0, 86482.0, 907990.0, 28854.0, 5644.0, 1978.0, 867.0, 427.0, 230.0, 140.0, 88.0, 63.0, 51.0, 23.0, 20.0, 11.0, 12.0, 6.0, 10.0, 6.0, 5.0, 6.0, 1.0, 1.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00806427001953125, -0.007779240608215332, -0.007494211196899414, -0.007209181785583496, -0.006924152374267578, -0.00663912296295166, -0.006354093551635742, -0.006069064140319824, -0.005784034729003906, -0.005499005317687988, -0.00521397590637207, -0.004928946495056152, -0.004643917083740234, -0.004358887672424316, -0.0040738582611083984, -0.0037888288497924805, -0.0035037994384765625, -0.0032187700271606445, -0.0029337406158447266, -0.0026487112045288086, -0.0023636817932128906, -0.0020786523818969727, -0.0017936229705810547, -0.0015085935592651367, -0.0012235641479492188, -0.0009385347366333008, -0.0006535053253173828, -0.00036847591400146484, -8.344650268554688e-05, 0.0002015829086303711, 0.00048661231994628906, 0.000771641731262207, 0.001056671142578125, 0.001341700553894043, 0.001626729965209961, 0.001911759376525879, 0.002196788787841797, 0.002481818199157715, 0.002766847610473633, 0.0030518770217895508, 0.0033369064331054688, 0.0036219358444213867, 0.003906965255737305, 0.004191994667053223, 0.004477024078369141, 0.004762053489685059, 0.0050470829010009766, 0.0053321123123168945, 0.0056171417236328125, 0.0059021711349487305, 0.0061872005462646484, 0.006472229957580566, 0.006757259368896484, 0.007042288780212402, 0.00732731819152832, 0.007612347602844238, 0.007897377014160156, 0.008182406425476074, 0.008467435836791992, 0.00875246524810791, 0.009037494659423828, 0.009322524070739746, 0.009607553482055664, 0.009892582893371582, 0.0101776123046875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 2.0, 3.0, 4.0, 3.0, 5.0, 9.0, 17.0, 16.0, 15.0, 24.0, 27.0, 31.0, 59.0, 96.0, 146.0, 123.0, 103.0, 76.0, 61.0, 45.0, 27.0, 26.0, 18.0, 14.0, 11.0, 9.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00530242919921875, -0.005108952522277832, -0.004915475845336914, -0.004721999168395996, -0.004528522491455078, -0.00433504581451416, -0.004141569137573242, -0.003948092460632324, -0.0037546157836914062, -0.0035611391067504883, -0.0033676624298095703, -0.0031741857528686523, -0.0029807090759277344, -0.0027872323989868164, -0.0025937557220458984, -0.0024002790451049805, -0.0022068023681640625, -0.0020133256912231445, -0.0018198490142822266, -0.0016263723373413086, -0.0014328956604003906, -0.0012394189834594727, -0.0010459423065185547, -0.0008524656295776367, -0.0006589889526367188, -0.0004655122756958008, -0.0002720355987548828, -7.855892181396484e-05, 0.00011491775512695312, 0.0003083944320678711, 0.0005018711090087891, 0.000695347785949707, 0.000888824462890625, 0.001082301139831543, 0.001275777816772461, 0.001469254493713379, 0.0016627311706542969, 0.0018562078475952148, 0.002049684524536133, 0.0022431612014770508, 0.0024366378784179688, 0.0026301145553588867, 0.0028235912322998047, 0.0030170679092407227, 0.0032105445861816406, 0.0034040212631225586, 0.0035974979400634766, 0.0037909746170043945, 0.0039844512939453125, 0.0041779279708862305, 0.0043714046478271484, 0.004564881324768066, 0.004758358001708984, 0.004951834678649902, 0.00514531135559082, 0.005338788032531738, 0.005532264709472656, 0.005725741386413574, 0.005919218063354492, 0.00611269474029541, 0.006306171417236328, 0.006499648094177246, 0.006693124771118164, 0.006886601448059082, 0.007080078125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 10.0, 30.0, 67.0, 213.0, 397.0, 173.0, 51.0, 30.0, 8.0, 10.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5540460348129272, -0.5379233360290527, -0.5218006372451782, -0.5056779384613037, -0.4895552694797516, -0.47343260049819946, -0.45730990171432495, -0.44118720293045044, -0.4250645041465759, -0.4089418053627014, -0.3928191363811493, -0.3766964375972748, -0.36057373881340027, -0.34445106983184814, -0.32832837104797363, -0.3122056722640991, -0.296083003282547, -0.2799603044986725, -0.26383763551712036, -0.24771493673324585, -0.23159223794937134, -0.21546955406665802, -0.1993468701839447, -0.1832241714000702, -0.16710148751735687, -0.15097880363464355, -0.13485610485076904, -0.11873342096805573, -0.10261072963476181, -0.0864880383014679, -0.07036535441875458, -0.05424266308546066, -0.03811994194984436, -0.021997252479195595, -0.005874563008546829, 0.010248124599456787, 0.026370815932750702, 0.04249350726604462, 0.058616191148757935, 0.07473888248205185, 0.09086157381534576, 0.10698426514863968, 0.1231069564819336, 0.1392296403646469, 0.15535232424736023, 0.17147502303123474, 0.18759770691394806, 0.20372039079666138, 0.2198430895805359, 0.2359657734632492, 0.2520884573459625, 0.26821115612983704, 0.28433385491371155, 0.30045652389526367, 0.3165792226791382, 0.3327019214630127, 0.3488246202468872, 0.3649473190307617, 0.38106998801231384, 0.39719268679618835, 0.41331538558006287, 0.429438054561615, 0.4455607533454895, 0.461683452129364, 0.47780612111091614]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 13.0, 10.0, 20.0, 27.0, 21.0, 25.0, 19.0, 32.0, 35.0, 46.0, 63.0, 51.0, 74.0, 81.0, 82.0, 69.0, 51.0, 53.0, 44.0, 27.0, 39.0, 21.0, 22.0, 13.0, 19.0, 8.0, 8.0, 9.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2035682201385498, -0.1978914737701416, -0.1922147274017334, -0.1865379810333252, -0.1808612197637558, -0.1751844733953476, -0.1695077270269394, -0.1638309806585312, -0.1581542193889618, -0.1524774730205536, -0.14680072665214539, -0.14112398028373718, -0.13544721901416779, -0.12977047264575958, -0.12409372627735138, -0.11841697990894318, -0.11274023354053497, -0.10706348717212677, -0.10138673335313797, -0.09570998698472977, -0.09003323316574097, -0.08435648679733276, -0.07867974042892456, -0.07300299406051636, -0.06732624024152756, -0.061649490147829056, -0.055972740054130554, -0.05029599368572235, -0.04461924359202385, -0.03894249349832535, -0.033265747129917145, -0.027588997036218643, -0.02191224694252014, -0.01623549684882164, -0.010558748617768288, -0.004882000386714935, 0.0007947497069835663, 0.006471499800682068, 0.012148246169090271, 0.017824996262788773, 0.023501746356487274, 0.029178496450185776, 0.03485524654388428, 0.04053199291229248, 0.04620874300599098, 0.051885493099689484, 0.05756223946809769, 0.06323899328708649, 0.06891573965549469, 0.0745924860239029, 0.0802692398428917, 0.0859459862112999, 0.0916227400302887, 0.0972994863986969, 0.1029762327671051, 0.1086529791355133, 0.1143297329545021, 0.12000647932291031, 0.1256832331418991, 0.1313599795103073, 0.13703672587871552, 0.1427134871482849, 0.14839023351669312, 0.15406697988510132, 0.15974372625350952]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 3.0, 5.0, 8.0, 7.0, 8.0, 14.0, 21.0, 48.0, 79.0, 129.0, 437.0, 4192348.0, 775.0, 206.0, 74.0, 33.0, 22.0, 16.0, 11.0, 4.0, 5.0, 7.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5947265625, -0.5764846801757812, -0.5582427978515625, -0.5400009155273438, -0.521759033203125, -0.5035171508789062, -0.4852752685546875, -0.46703338623046875, -0.44879150390625, -0.43054962158203125, -0.4123077392578125, -0.39406585693359375, -0.375823974609375, -0.35758209228515625, -0.3393402099609375, -0.32109832763671875, -0.3028564453125, -0.28461456298828125, -0.2663726806640625, -0.24813079833984375, -0.229888916015625, -0.21164703369140625, -0.1934051513671875, -0.17516326904296875, -0.15692138671875, -0.13867950439453125, -0.1204376220703125, -0.10219573974609375, -0.083953857421875, -0.06571197509765625, -0.0474700927734375, -0.02922821044921875, -0.010986328125, 0.00725555419921875, 0.0254974365234375, 0.04373931884765625, 0.061981201171875, 0.08022308349609375, 0.0984649658203125, 0.11670684814453125, 0.13494873046875, 0.15319061279296875, 0.1714324951171875, 0.18967437744140625, 0.207916259765625, 0.22615814208984375, 0.2444000244140625, 0.26264190673828125, 0.2808837890625, 0.29912567138671875, 0.3173675537109375, 0.33560943603515625, 0.353851318359375, 0.37209320068359375, 0.3903350830078125, 0.40857696533203125, 0.42681884765625, 0.44506072998046875, 0.4633026123046875, 0.48154449462890625, 0.499786376953125, 0.5180282592773438, 0.5362701416015625, 0.5545120239257812, 0.57275390625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 0.0, 8.0, 4.0, 5.0, 3.0, 9.0, 10.0, 15.0, 29.0, 52.0, 152.0, 262.0, 240.0, 94.0, 35.0, 19.0, 10.0, 5.0, 12.0, 9.0, 6.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0191802978515625, -0.018573760986328125, -0.01796722412109375, -0.017360687255859375, -0.016754150390625, -0.016147613525390625, -0.01554107666015625, -0.014934539794921875, -0.0143280029296875, -0.013721466064453125, -0.01311492919921875, -0.012508392333984375, -0.01190185546875, -0.011295318603515625, -0.01068878173828125, -0.010082244873046875, -0.0094757080078125, -0.008869171142578125, -0.00826263427734375, -0.007656097412109375, -0.007049560546875, -0.006443023681640625, -0.00583648681640625, -0.005229949951171875, -0.0046234130859375, -0.004016876220703125, -0.00341033935546875, -0.002803802490234375, -0.002197265625, -0.001590728759765625, -0.00098419189453125, -0.000377655029296875, 0.0002288818359375, 0.000835418701171875, 0.00144195556640625, 0.002048492431640625, 0.002655029296875, 0.003261566162109375, 0.00386810302734375, 0.004474639892578125, 0.0050811767578125, 0.005687713623046875, 0.00629425048828125, 0.006900787353515625, 0.00750732421875, 0.008113861083984375, 0.00872039794921875, 0.009326934814453125, 0.0099334716796875, 0.010540008544921875, 0.01114654541015625, 0.011753082275390625, 0.012359619140625, 0.012966156005859375, 0.01357269287109375, 0.014179229736328125, 0.0147857666015625, 0.015392303466796875, 0.01599884033203125, 0.016605377197265625, 0.0172119140625, 0.017818450927734375, 0.01842498779296875, 0.019031524658203125, 0.0196380615234375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 9.0, 2.0, 6.0, 3.0, 10.0, 16.0, 30.0, 43.0, 49.0, 90.0, 147.0, 262.0, 445.0, 881.0, 1872.0, 5632.0, 34491.0, 3817566.0, 305870.0, 19430.0, 4409.0, 1510.0, 655.0, 322.0, 206.0, 113.0, 73.0, 43.0, 32.0, 28.0, 20.0, 5.0, 7.0, 5.0, 3.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0262603759765625, -0.025546789169311523, -0.024833202362060547, -0.02411961555480957, -0.023406028747558594, -0.022692441940307617, -0.02197885513305664, -0.021265268325805664, -0.020551681518554688, -0.01983809471130371, -0.019124507904052734, -0.018410921096801758, -0.01769733428955078, -0.016983747482299805, -0.016270160675048828, -0.015556573867797852, -0.014842987060546875, -0.014129400253295898, -0.013415813446044922, -0.012702226638793945, -0.011988639831542969, -0.011275053024291992, -0.010561466217041016, -0.009847879409790039, -0.009134292602539062, -0.008420705795288086, -0.007707118988037109, -0.006993532180786133, -0.006279945373535156, -0.00556635856628418, -0.004852771759033203, -0.0041391849517822266, -0.00342559814453125, -0.0027120113372802734, -0.001998424530029297, -0.0012848377227783203, -0.0005712509155273438, 0.0001423358917236328, 0.0008559226989746094, 0.001569509506225586, 0.0022830963134765625, 0.002996683120727539, 0.0037102699279785156, 0.004423856735229492, 0.005137443542480469, 0.005851030349731445, 0.006564617156982422, 0.0072782039642333984, 0.007991790771484375, 0.008705377578735352, 0.009418964385986328, 0.010132551193237305, 0.010846138000488281, 0.011559724807739258, 0.012273311614990234, 0.012986898422241211, 0.013700485229492188, 0.014414072036743164, 0.01512765884399414, 0.015841245651245117, 0.016554832458496094, 0.01726841926574707, 0.017982006072998047, 0.018695592880249023, 0.0194091796875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 4.0, 14.0, 14.0, 23.0, 34.0, 70.0, 188.0, 703.0, 1956.0, 629.0, 187.0, 74.0, 42.0, 31.0, 23.0, 17.0, 13.0, 12.0, 15.0, 7.0, 4.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0218658447265625, -0.021325230598449707, -0.020784616470336914, -0.02024400234222412, -0.019703388214111328, -0.019162774085998535, -0.018622159957885742, -0.01808154582977295, -0.017540931701660156, -0.017000317573547363, -0.01645970344543457, -0.015919089317321777, -0.015378475189208984, -0.014837861061096191, -0.014297246932983398, -0.013756632804870605, -0.013216018676757812, -0.01267540454864502, -0.012134790420532227, -0.011594176292419434, -0.01105356216430664, -0.010512948036193848, -0.009972333908081055, -0.009431719779968262, -0.008891105651855469, -0.008350491523742676, -0.007809877395629883, -0.00726926326751709, -0.006728649139404297, -0.006188035011291504, -0.005647420883178711, -0.005106806755065918, -0.004566192626953125, -0.004025578498840332, -0.003484964370727539, -0.002944350242614746, -0.002403736114501953, -0.0018631219863891602, -0.0013225078582763672, -0.0007818937301635742, -0.00024127960205078125, 0.0002993345260620117, 0.0008399486541748047, 0.0013805627822875977, 0.0019211769104003906, 0.0024617910385131836, 0.0030024051666259766, 0.0035430192947387695, 0.0040836334228515625, 0.0046242475509643555, 0.0051648616790771484, 0.005705475807189941, 0.006246089935302734, 0.006786704063415527, 0.00732731819152832, 0.007867932319641113, 0.008408546447753906, 0.0089491605758667, 0.009489774703979492, 0.010030388832092285, 0.010571002960205078, 0.011111617088317871, 0.011652231216430664, 0.012192845344543457, 0.01273345947265625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 15.0, 17.0, 43.0, 93.0, 159.0, 251.0, 167.0, 83.0, 59.0, 37.0, 23.0, 12.0, 4.0, 11.0, 6.0, 8.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07211392372846603, -0.06743697077035904, -0.06276002526283264, -0.05808307230472565, -0.05340611934661865, -0.04872916638851166, -0.04405221715569496, -0.039375267922878265, -0.03469831496477127, -0.030021363869309425, -0.02534441277384758, -0.020667461678385735, -0.01599051058292389, -0.011313559487462044, -0.006636608392000198, -0.001959659159183502, 0.0027172937989234924, 0.007394244894385338, 0.012071195989847183, 0.01674814708530903, 0.021425098180770874, 0.02610204927623272, 0.030779000371694565, 0.03545594960451126, 0.040132902562618256, 0.04480985552072525, 0.049486804753541946, 0.05416375398635864, 0.05884070694446564, 0.06351765990257263, 0.06819461286067963, 0.07287155836820602, 0.07754851877689362, 0.08222547173500061, 0.0869024246931076, 0.091579370200634, 0.096256323158741, 0.10093327611684799, 0.10561022162437439, 0.11028717458248138, 0.11496412754058838, 0.11964108049869537, 0.12431803345680237, 0.12899498641490936, 0.13367193937301636, 0.13834887742996216, 0.14302583038806915, 0.14770278334617615, 0.15237973630428314, 0.15705668926239014, 0.16173364222049713, 0.16641059517860413, 0.17108753323554993, 0.17576448619365692, 0.18044143915176392, 0.1851183921098709, 0.1897953450679779, 0.1944722980260849, 0.1991492509841919, 0.2038262039422989, 0.20850315690040588, 0.21318009495735168, 0.21785704791545868, 0.22253400087356567, 0.22721095383167267]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 7.0, 6.0, 8.0, 10.0, 12.0, 18.0, 18.0, 25.0, 18.0, 25.0, 25.0, 37.0, 47.0, 35.0, 54.0, 31.0, 53.0, 35.0, 41.0, 51.0, 48.0, 38.0, 45.0, 47.0, 29.0, 40.0, 22.0, 27.0, 20.0, 26.0, 14.0, 13.0, 15.0, 17.0, 10.0, 10.0, 11.0, 5.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.045414865016937256, -0.043896742165088654, -0.04237861931324005, -0.04086049273610115, -0.03934236988425255, -0.037824247032403946, -0.036306120455265045, -0.03478799760341644, -0.03326987475156784, -0.03175175189971924, -0.030233627185225487, -0.028715502470731735, -0.027197379618883133, -0.02567925676703453, -0.02416113205254078, -0.022643007338047028, -0.021124884486198425, -0.019606761634349823, -0.01808863691985607, -0.01657051220536232, -0.015052389353513718, -0.01353426557034254, -0.012016141787171364, -0.010498018004000187, -0.00897989422082901, -0.007461770437657833, -0.005943646654486656, -0.004425522871315479, -0.0029073990881443024, -0.0013892753049731255, 0.00012884847819805145, 0.0016469722613692284, 0.0031650960445404053, 0.004683219827711582, 0.006201343610882759, 0.007719467394053936, 0.009237591177225113, 0.01075571496039629, 0.012273838743567467, 0.013791962526738644, 0.01531008630990982, 0.016828209161758423, 0.018346333876252174, 0.019864458590745926, 0.021382581442594528, 0.02290070429444313, 0.024418829008936882, 0.025936953723430634, 0.027455076575279236, 0.028973199427127838, 0.03049132414162159, 0.03200944885611534, 0.033527571707963943, 0.035045694559812546, 0.03656382113695145, 0.03808194398880005, 0.03960006684064865, 0.04111818969249725, 0.042636312544345856, 0.044154439121484756, 0.04567256197333336, 0.04719068482518196, 0.04870881140232086, 0.050226934254169464, 0.051745057106018066]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 8.0, 18.0, 8.0, 20.0, 25.0, 41.0, 66.0, 104.0, 139.0, 199.0, 304.0, 554.0, 854.0, 1535.0, 3164.0, 7040.0, 20571.0, 139274.0, 778100.0, 70024.0, 14837.0, 5573.0, 2582.0, 1420.0, 731.0, 507.0, 295.0, 174.0, 131.0, 75.0, 41.0, 39.0, 31.0, 11.0, 19.0, 7.0, 10.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03240966796875, -0.03137636184692383, -0.030343055725097656, -0.029309749603271484, -0.028276443481445312, -0.02724313735961914, -0.02620983123779297, -0.025176525115966797, -0.024143218994140625, -0.023109912872314453, -0.02207660675048828, -0.02104330062866211, -0.020009994506835938, -0.018976688385009766, -0.017943382263183594, -0.016910076141357422, -0.01587677001953125, -0.014843463897705078, -0.013810157775878906, -0.012776851654052734, -0.011743545532226562, -0.01071023941040039, -0.009676933288574219, -0.008643627166748047, -0.007610321044921875, -0.006577014923095703, -0.005543708801269531, -0.004510402679443359, -0.0034770965576171875, -0.0024437904357910156, -0.0014104843139648438, -0.0003771781921386719, 0.0006561279296875, 0.0016894340515136719, 0.0027227401733398438, 0.0037560462951660156, 0.0047893524169921875, 0.005822658538818359, 0.006855964660644531, 0.007889270782470703, 0.008922576904296875, 0.009955883026123047, 0.010989189147949219, 0.01202249526977539, 0.013055801391601562, 0.014089107513427734, 0.015122413635253906, 0.016155719757080078, 0.01718902587890625, 0.018222332000732422, 0.019255638122558594, 0.020288944244384766, 0.021322250366210938, 0.02235555648803711, 0.02338886260986328, 0.024422168731689453, 0.025455474853515625, 0.026488780975341797, 0.02752208709716797, 0.02855539321899414, 0.029588699340820312, 0.030622005462646484, 0.031655311584472656, 0.03268861770629883, 0.033721923828125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 2.0, 2.0, 5.0, 4.0, 3.0, 4.0, 9.0, 11.0, 15.0, 31.0, 69.0, 178.0, 266.0, 199.0, 89.0, 37.0, 16.0, 11.0, 7.0, 12.0, 5.0, 8.0, 3.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01885986328125, -0.018260955810546875, -0.01766204833984375, -0.017063140869140625, -0.0164642333984375, -0.015865325927734375, -0.01526641845703125, -0.014667510986328125, -0.014068603515625, -0.013469696044921875, -0.01287078857421875, -0.012271881103515625, -0.0116729736328125, -0.011074066162109375, -0.01047515869140625, -0.009876251220703125, -0.00927734375, -0.008678436279296875, -0.00807952880859375, -0.007480621337890625, -0.0068817138671875, -0.006282806396484375, -0.00568389892578125, -0.005084991455078125, -0.004486083984375, -0.003887176513671875, -0.00328826904296875, -0.002689361572265625, -0.0020904541015625, -0.001491546630859375, -0.00089263916015625, -0.000293731689453125, 0.00030517578125, 0.000904083251953125, 0.00150299072265625, 0.002101898193359375, 0.0027008056640625, 0.003299713134765625, 0.00389862060546875, 0.004497528076171875, 0.005096435546875, 0.005695343017578125, 0.00629425048828125, 0.006893157958984375, 0.0074920654296875, 0.008090972900390625, 0.00868988037109375, 0.009288787841796875, 0.0098876953125, 0.010486602783203125, 0.01108551025390625, 0.011684417724609375, 0.0122833251953125, 0.012882232666015625, 0.01348114013671875, 0.014080047607421875, 0.014678955078125, 0.015277862548828125, 0.01587677001953125, 0.016475677490234375, 0.0170745849609375, 0.017673492431640625, 0.01827239990234375, 0.018871307373046875, 0.01947021484375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 4.0, 9.0, 7.0, 8.0, 5.0, 12.0, 28.0, 26.0, 31.0, 35.0, 58.0, 85.0, 121.0, 139.0, 247.0, 320.0, 533.0, 864.0, 1603.0, 3561.0, 9350.0, 32708.0, 178791.0, 665786.0, 116259.0, 23941.0, 7422.0, 2943.0, 1382.0, 752.0, 464.0, 295.0, 221.0, 152.0, 119.0, 68.0, 51.0, 44.0, 33.0, 20.0, 14.0, 16.0, 13.0, 9.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0257568359375, -0.024780750274658203, -0.023804664611816406, -0.02282857894897461, -0.021852493286132812, -0.020876407623291016, -0.01990032196044922, -0.018924236297607422, -0.017948150634765625, -0.016972064971923828, -0.01599597930908203, -0.015019893646240234, -0.014043807983398438, -0.01306772232055664, -0.012091636657714844, -0.011115550994873047, -0.01013946533203125, -0.009163379669189453, -0.008187294006347656, -0.007211208343505859, -0.0062351226806640625, -0.005259037017822266, -0.004282951354980469, -0.003306865692138672, -0.002330780029296875, -0.0013546943664550781, -0.00037860870361328125, 0.0005974769592285156, 0.0015735626220703125, 0.0025496482849121094, 0.0035257339477539062, 0.004501819610595703, 0.0054779052734375, 0.006453990936279297, 0.007430076599121094, 0.00840616226196289, 0.009382247924804688, 0.010358333587646484, 0.011334419250488281, 0.012310504913330078, 0.013286590576171875, 0.014262676239013672, 0.015238761901855469, 0.016214847564697266, 0.017190933227539062, 0.01816701889038086, 0.019143104553222656, 0.020119190216064453, 0.02109527587890625, 0.022071361541748047, 0.023047447204589844, 0.02402353286743164, 0.024999618530273438, 0.025975704193115234, 0.02695178985595703, 0.027927875518798828, 0.028903961181640625, 0.029880046844482422, 0.03085613250732422, 0.031832218170166016, 0.03280830383300781, 0.03378438949584961, 0.034760475158691406, 0.0357365608215332, 0.036712646484375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 4.0, 8.0, 3.0, 4.0, 8.0, 12.0, 10.0, 15.0, 19.0, 18.0, 16.0, 16.0, 33.0, 37.0, 30.0, 47.0, 27.0, 43.0, 48.0, 40.0, 51.0, 45.0, 56.0, 55.0, 37.0, 34.0, 26.0, 25.0, 33.0, 37.0, 26.0, 19.0, 22.0, 10.0, 12.0, 11.0, 7.0, 11.0, 10.0, 9.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 5.0, 3.0, 0.0, 1.0], "bins": [-0.033233642578125, -0.03226876258850098, -0.03130388259887695, -0.03033900260925293, -0.029374122619628906, -0.028409242630004883, -0.02744436264038086, -0.026479482650756836, -0.025514602661132812, -0.02454972267150879, -0.023584842681884766, -0.022619962692260742, -0.02165508270263672, -0.020690202713012695, -0.019725322723388672, -0.01876044273376465, -0.017795562744140625, -0.0168306827545166, -0.015865802764892578, -0.014900922775268555, -0.013936042785644531, -0.012971162796020508, -0.012006282806396484, -0.011041402816772461, -0.010076522827148438, -0.009111642837524414, -0.00814676284790039, -0.007181882858276367, -0.006217002868652344, -0.00525212287902832, -0.004287242889404297, -0.0033223628997802734, -0.00235748291015625, -0.0013926029205322266, -0.0004277229309082031, 0.0005371570587158203, 0.0015020370483398438, 0.002466917037963867, 0.0034317970275878906, 0.004396677017211914, 0.0053615570068359375, 0.006326436996459961, 0.007291316986083984, 0.008256196975708008, 0.009221076965332031, 0.010185956954956055, 0.011150836944580078, 0.012115716934204102, 0.013080596923828125, 0.014045476913452148, 0.015010356903076172, 0.015975236892700195, 0.01694011688232422, 0.017904996871948242, 0.018869876861572266, 0.01983475685119629, 0.020799636840820312, 0.021764516830444336, 0.02272939682006836, 0.023694276809692383, 0.024659156799316406, 0.02562403678894043, 0.026588916778564453, 0.027553796768188477, 0.0285186767578125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 4.0, 10.0, 11.0, 21.0, 22.0, 36.0, 73.0, 179.0, 325.0, 679.0, 1713.0, 5350.0, 47308.0, 971538.0, 15670.0, 3340.0, 1184.0, 537.0, 253.0, 118.0, 60.0, 45.0, 16.0, 15.0, 9.0, 12.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0304412841796875, -0.02952742576599121, -0.028613567352294922, -0.027699708938598633, -0.026785850524902344, -0.025871992111206055, -0.024958133697509766, -0.024044275283813477, -0.023130416870117188, -0.0222165584564209, -0.02130270004272461, -0.02038884162902832, -0.01947498321533203, -0.018561124801635742, -0.017647266387939453, -0.016733407974243164, -0.015819549560546875, -0.014905691146850586, -0.013991832733154297, -0.013077974319458008, -0.012164115905761719, -0.01125025749206543, -0.01033639907836914, -0.009422540664672852, -0.008508682250976562, -0.0075948238372802734, -0.006680965423583984, -0.005767107009887695, -0.004853248596191406, -0.003939390182495117, -0.003025531768798828, -0.002111673355102539, -0.00119781494140625, -0.00028395652770996094, 0.0006299018859863281, 0.0015437602996826172, 0.0024576187133789062, 0.0033714771270751953, 0.004285335540771484, 0.0051991939544677734, 0.0061130523681640625, 0.0070269107818603516, 0.00794076919555664, 0.00885462760925293, 0.009768486022949219, 0.010682344436645508, 0.011596202850341797, 0.012510061264038086, 0.013423919677734375, 0.014337778091430664, 0.015251636505126953, 0.016165494918823242, 0.01707935333251953, 0.01799321174621582, 0.01890707015991211, 0.0198209285736084, 0.020734786987304688, 0.021648645401000977, 0.022562503814697266, 0.023476362228393555, 0.024390220642089844, 0.025304079055786133, 0.026217937469482422, 0.02713179588317871, 0.028045654296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 8.0, 3.0, 9.0, 10.0, 12.0, 26.0, 13.0, 23.0, 27.0, 32.0, 26.0, 60.0, 57.0, 62.0, 70.0, 63.0, 57.0, 75.0, 57.0, 58.0, 52.0, 39.0, 28.0, 21.0, 16.0, 17.0, 17.0, 7.0, 13.0, 5.0, 3.0, 4.0, 3.0, 3.0, 3.0, 5.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.271766662597656e-06, -7.038004696369171e-06, -6.804242730140686e-06, -6.570480763912201e-06, -6.336718797683716e-06, -6.102956831455231e-06, -5.869194865226746e-06, -5.6354328989982605e-06, -5.401670932769775e-06, -5.16790896654129e-06, -4.934147000312805e-06, -4.70038503408432e-06, -4.466623067855835e-06, -4.23286110162735e-06, -3.999099135398865e-06, -3.7653371691703796e-06, -3.5315752029418945e-06, -3.2978132367134094e-06, -3.0640512704849243e-06, -2.830289304256439e-06, -2.596527338027954e-06, -2.362765371799469e-06, -2.129003405570984e-06, -1.8952414393424988e-06, -1.6614794731140137e-06, -1.4277175068855286e-06, -1.1939555406570435e-06, -9.601935744285583e-07, -7.264316082000732e-07, -4.926696419715881e-07, -2.5890767574310303e-07, -2.514570951461792e-08, 2.086162567138672e-07, 4.423782229423523e-07, 6.761401891708374e-07, 9.099021553993225e-07, 1.1436641216278076e-06, 1.3774260878562927e-06, 1.6111880540847778e-06, 1.844950020313263e-06, 2.078711986541748e-06, 2.312473952770233e-06, 2.5462359189987183e-06, 2.7799978852272034e-06, 3.0137598514556885e-06, 3.2475218176841736e-06, 3.4812837839126587e-06, 3.715045750141144e-06, 3.948807716369629e-06, 4.182569682598114e-06, 4.416331648826599e-06, 4.650093615055084e-06, 4.883855581283569e-06, 5.1176175475120544e-06, 5.3513795137405396e-06, 5.585141479969025e-06, 5.81890344619751e-06, 6.052665412425995e-06, 6.28642737865448e-06, 6.520189344882965e-06, 6.75395131111145e-06, 6.987713277339935e-06, 7.22147524356842e-06, 7.4552372097969055e-06, 7.68899917602539e-06]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 7.0, 5.0, 1.0, 4.0, 2.0, 10.0, 13.0, 15.0, 20.0, 25.0, 30.0, 51.0, 59.0, 103.0, 180.0, 289.0, 529.0, 945.0, 1971.0, 5002.0, 26676.0, 977926.0, 25490.0, 4857.0, 2008.0, 987.0, 539.0, 264.0, 167.0, 115.0, 61.0, 53.0, 39.0, 30.0, 19.0, 13.0, 10.0, 9.0, 19.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.031402587890625, -0.0305178165435791, -0.029633045196533203, -0.028748273849487305, -0.027863502502441406, -0.026978731155395508, -0.02609395980834961, -0.02520918846130371, -0.024324417114257812, -0.023439645767211914, -0.022554874420166016, -0.021670103073120117, -0.02078533172607422, -0.01990056037902832, -0.019015789031982422, -0.018131017684936523, -0.017246246337890625, -0.016361474990844727, -0.015476703643798828, -0.01459193229675293, -0.013707160949707031, -0.012822389602661133, -0.011937618255615234, -0.011052846908569336, -0.010168075561523438, -0.009283304214477539, -0.00839853286743164, -0.007513761520385742, -0.006628990173339844, -0.005744218826293945, -0.004859447479248047, -0.0039746761322021484, -0.00308990478515625, -0.0022051334381103516, -0.0013203620910644531, -0.0004355907440185547, 0.00044918060302734375, 0.0013339519500732422, 0.0022187232971191406, 0.003103494644165039, 0.0039882659912109375, 0.004873037338256836, 0.005757808685302734, 0.006642580032348633, 0.007527351379394531, 0.00841212272644043, 0.009296894073486328, 0.010181665420532227, 0.011066436767578125, 0.011951208114624023, 0.012835979461669922, 0.01372075080871582, 0.014605522155761719, 0.015490293502807617, 0.016375064849853516, 0.017259836196899414, 0.018144607543945312, 0.01902937889099121, 0.01991415023803711, 0.020798921585083008, 0.021683692932128906, 0.022568464279174805, 0.023453235626220703, 0.0243380069732666, 0.0252227783203125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 2.0, 3.0, 6.0, 6.0, 14.0, 16.0, 50.0, 83.0, 237.0, 306.0, 142.0, 56.0, 24.0, 13.0, 10.0, 6.0, 6.0, 3.0, 0.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02752685546875, -0.026698827743530273, -0.025870800018310547, -0.02504277229309082, -0.024214744567871094, -0.023386716842651367, -0.02255868911743164, -0.021730661392211914, -0.020902633666992188, -0.02007460594177246, -0.019246578216552734, -0.018418550491333008, -0.01759052276611328, -0.016762495040893555, -0.015934467315673828, -0.015106439590454102, -0.014278411865234375, -0.013450384140014648, -0.012622356414794922, -0.011794328689575195, -0.010966300964355469, -0.010138273239135742, -0.009310245513916016, -0.008482217788696289, -0.0076541900634765625, -0.006826162338256836, -0.005998134613037109, -0.005170106887817383, -0.004342079162597656, -0.0035140514373779297, -0.002686023712158203, -0.0018579959869384766, -0.00102996826171875, -0.00020194053649902344, 0.0006260871887207031, 0.0014541149139404297, 0.0022821426391601562, 0.003110170364379883, 0.003938198089599609, 0.004766225814819336, 0.0055942535400390625, 0.006422281265258789, 0.007250308990478516, 0.008078336715698242, 0.008906364440917969, 0.009734392166137695, 0.010562419891357422, 0.011390447616577148, 0.012218475341796875, 0.013046503067016602, 0.013874530792236328, 0.014702558517456055, 0.015530586242675781, 0.016358613967895508, 0.017186641693115234, 0.01801466941833496, 0.018842697143554688, 0.019670724868774414, 0.02049875259399414, 0.021326780319213867, 0.022154808044433594, 0.02298283576965332, 0.023810863494873047, 0.024638891220092773, 0.0254669189453125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 1.0, 4.0, 1.0, 4.0, 9.0, 33.0, 52.0, 178.0, 371.0, 208.0, 90.0, 20.0, 17.0, 7.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6343634724617004, -0.616607129573822, -0.5988508462905884, -0.58109450340271, -0.5633381605148315, -0.5455818176269531, -0.5278254747390747, -0.5100691914558411, -0.49231284856796265, -0.47455650568008423, -0.4568001925945282, -0.43904387950897217, -0.42128753662109375, -0.40353119373321533, -0.3857748806476593, -0.36801856756210327, -0.35026222467422485, -0.33250588178634644, -0.3147495687007904, -0.2969932556152344, -0.27923691272735596, -0.26148056983947754, -0.2437242567539215, -0.22596792876720428, -0.20821160078048706, -0.19045527279376984, -0.1726989448070526, -0.1549426168203354, -0.13718628883361816, -0.11942996084690094, -0.10167363286018372, -0.08391730487346649, -0.06616097688674927, -0.04840464890003204, -0.03064832091331482, -0.012891992926597595, 0.004864335060119629, 0.022620663046836853, 0.04037699103355408, 0.0581333190202713, 0.07588964700698853, 0.09364597499370575, 0.11140230298042297, 0.1291586309671402, 0.14691495895385742, 0.16467128694057465, 0.18242761492729187, 0.2001839429140091, 0.21794027090072632, 0.23569659888744354, 0.25345292687416077, 0.2712092399597168, 0.2889655828475952, 0.30672192573547363, 0.32447823882102966, 0.3422345519065857, 0.3599908947944641, 0.37774723768234253, 0.39550355076789856, 0.4132598638534546, 0.431016206741333, 0.4487725496292114, 0.46652886271476746, 0.4842851758003235, 0.5020415186882019]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 9.0, 5.0, 6.0, 10.0, 7.0, 5.0, 5.0, 17.0, 15.0, 13.0, 24.0, 20.0, 23.0, 28.0, 30.0, 26.0, 35.0, 39.0, 45.0, 61.0, 62.0, 61.0, 61.0, 48.0, 41.0, 34.0, 27.0, 33.0, 24.0, 25.0, 20.0, 24.0, 11.0, 21.0, 19.0, 14.0, 8.0, 12.0, 11.0, 10.0, 6.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13028067350387573, -0.12612950801849365, -0.12197835743427277, -0.11782719939947128, -0.1136760413646698, -0.10952488332986832, -0.10537372529506683, -0.10122256726026535, -0.09707140922546387, -0.09292025119066238, -0.0887690931558609, -0.08461793512105942, -0.08046677708625793, -0.07631561905145645, -0.07216446101665497, -0.06801330298185349, -0.063862144947052, -0.05971098691225052, -0.055559828877449036, -0.05140867084264755, -0.04725751280784607, -0.043106354773044586, -0.0389551967382431, -0.03480403870344162, -0.030652880668640137, -0.026501722633838654, -0.02235056459903717, -0.018199406564235687, -0.014048248529434204, -0.009897090494632721, -0.005745932459831238, -0.0015947744250297546, 0.0025563836097717285, 0.006707541644573212, 0.010858699679374695, 0.015009857714176178, 0.01916101574897766, 0.023312173783779144, 0.027463331818580627, 0.03161448985338211, 0.035765647888183594, 0.03991680592298508, 0.04406796395778656, 0.04821912199258804, 0.052370280027389526, 0.05652143806219101, 0.06067259609699249, 0.06482375413179398, 0.06897491216659546, 0.07312607020139694, 0.07727722823619843, 0.08142838627099991, 0.08557954430580139, 0.08973070234060287, 0.09388186037540436, 0.09803301841020584, 0.10218417644500732, 0.10633533447980881, 0.11048649251461029, 0.11463765054941177, 0.11878880858421326, 0.12293996661901474, 0.12709112465381622, 0.1312422752380371, 0.1353934407234192]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 9.0, 10.0, 16.0, 8.0, 13.0, 24.0, 30.0, 54.0, 96.0, 245.0, 1013.0, 60016.0, 4127823.0, 4147.0, 410.0, 159.0, 83.0, 45.0, 31.0, 14.0, 8.0, 8.0, 5.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07965087890625, -0.07756757736206055, -0.0754842758178711, -0.07340097427368164, -0.07131767272949219, -0.06923437118530273, -0.06715106964111328, -0.06506776809692383, -0.06298446655273438, -0.06090116500854492, -0.05881786346435547, -0.056734561920166016, -0.05465126037597656, -0.05256795883178711, -0.050484657287597656, -0.0484013557434082, -0.04631805419921875, -0.0442347526550293, -0.042151451110839844, -0.04006814956665039, -0.03798484802246094, -0.035901546478271484, -0.03381824493408203, -0.03173494338989258, -0.029651641845703125, -0.027568340301513672, -0.02548503875732422, -0.023401737213134766, -0.021318435668945312, -0.01923513412475586, -0.017151832580566406, -0.015068531036376953, -0.0129852294921875, -0.010901927947998047, -0.008818626403808594, -0.006735324859619141, -0.0046520233154296875, -0.0025687217712402344, -0.00048542022705078125, 0.0015978813171386719, 0.003681182861328125, 0.005764484405517578, 0.007847785949707031, 0.009931087493896484, 0.012014389038085938, 0.01409769058227539, 0.016180992126464844, 0.018264293670654297, 0.02034759521484375, 0.022430896759033203, 0.024514198303222656, 0.02659749984741211, 0.028680801391601562, 0.030764102935791016, 0.03284740447998047, 0.03493070602416992, 0.037014007568359375, 0.03909730911254883, 0.04118061065673828, 0.043263912200927734, 0.04534721374511719, 0.04743051528930664, 0.049513816833496094, 0.05159711837768555, 0.053680419921875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 3.0, 3.0, 7.0, 11.0, 20.0, 32.0, 57.0, 79.0, 150.0, 158.0, 171.0, 124.0, 71.0, 31.0, 22.0, 17.0, 10.0, 7.0, 7.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0189666748046875, -0.018368005752563477, -0.017769336700439453, -0.01717066764831543, -0.016571998596191406, -0.015973329544067383, -0.01537466049194336, -0.014775991439819336, -0.014177322387695312, -0.013578653335571289, -0.012979984283447266, -0.012381315231323242, -0.011782646179199219, -0.011183977127075195, -0.010585308074951172, -0.009986639022827148, -0.009387969970703125, -0.008789300918579102, -0.008190631866455078, -0.007591962814331055, -0.006993293762207031, -0.006394624710083008, -0.005795955657958984, -0.005197286605834961, -0.0045986175537109375, -0.003999948501586914, -0.0034012794494628906, -0.002802610397338867, -0.0022039413452148438, -0.0016052722930908203, -0.0010066032409667969, -0.00040793418884277344, 0.00019073486328125, 0.0007894039154052734, 0.0013880729675292969, 0.0019867420196533203, 0.0025854110717773438, 0.003184080123901367, 0.0037827491760253906, 0.004381418228149414, 0.0049800872802734375, 0.005578756332397461, 0.006177425384521484, 0.006776094436645508, 0.007374763488769531, 0.007973432540893555, 0.008572101593017578, 0.009170770645141602, 0.009769439697265625, 0.010368108749389648, 0.010966777801513672, 0.011565446853637695, 0.012164115905761719, 0.012762784957885742, 0.013361454010009766, 0.013960123062133789, 0.014558792114257812, 0.015157461166381836, 0.01575613021850586, 0.016354799270629883, 0.016953468322753906, 0.01755213737487793, 0.018150806427001953, 0.018749475479125977, 0.01934814453125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 15.0, 35.0, 59.0, 118.0, 184.0, 569.0, 4109.0, 143041.0, 4024358.0, 18324.0, 2196.0, 534.0, 259.0, 176.0, 109.0, 73.0, 38.0, 27.0, 11.0, 13.0, 4.0, 9.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.047393798828125, -0.04592275619506836, -0.04445171356201172, -0.04298067092895508, -0.04150962829589844, -0.0400385856628418, -0.038567543029785156, -0.037096500396728516, -0.035625457763671875, -0.034154415130615234, -0.032683372497558594, -0.031212329864501953, -0.029741287231445312, -0.028270244598388672, -0.02679920196533203, -0.02532815933227539, -0.02385711669921875, -0.02238607406616211, -0.02091503143310547, -0.019443988800048828, -0.017972946166992188, -0.016501903533935547, -0.015030860900878906, -0.013559818267822266, -0.012088775634765625, -0.010617733001708984, -0.009146690368652344, -0.007675647735595703, -0.0062046051025390625, -0.004733562469482422, -0.0032625198364257812, -0.0017914772033691406, -0.0003204345703125, 0.0011506080627441406, 0.0026216506958007812, 0.004092693328857422, 0.0055637359619140625, 0.007034778594970703, 0.008505821228027344, 0.009976863861083984, 0.011447906494140625, 0.012918949127197266, 0.014389991760253906, 0.015861034393310547, 0.017332077026367188, 0.018803119659423828, 0.02027416229248047, 0.02174520492553711, 0.02321624755859375, 0.02468729019165039, 0.02615833282470703, 0.027629375457763672, 0.029100418090820312, 0.030571460723876953, 0.032042503356933594, 0.033513545989990234, 0.034984588623046875, 0.036455631256103516, 0.037926673889160156, 0.0393977165222168, 0.04086875915527344, 0.04233980178833008, 0.04381084442138672, 0.04528188705444336, 0.0467529296875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 7.0, 20.0, 32.0, 78.0, 278.0, 1510.0, 1567.0, 302.0, 107.0, 61.0, 32.0, 20.0, 20.0, 8.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0128021240234375, -0.011816740036010742, -0.010831356048583984, -0.009845972061157227, -0.008860588073730469, -0.007875204086303711, -0.006889820098876953, -0.005904436111450195, -0.0049190521240234375, -0.00393366813659668, -0.002948284149169922, -0.001962900161743164, -0.0009775161743164062, 7.867813110351562e-06, 0.0009932518005371094, 0.001978635787963867, 0.002964019775390625, 0.003949403762817383, 0.004934787750244141, 0.0059201717376708984, 0.006905555725097656, 0.007890939712524414, 0.008876323699951172, 0.00986170768737793, 0.010847091674804688, 0.011832475662231445, 0.012817859649658203, 0.013803243637084961, 0.014788627624511719, 0.015774011611938477, 0.016759395599365234, 0.017744779586791992, 0.01873016357421875, 0.019715547561645508, 0.020700931549072266, 0.021686315536499023, 0.02267169952392578, 0.02365708351135254, 0.024642467498779297, 0.025627851486206055, 0.026613235473632812, 0.02759861946105957, 0.028584003448486328, 0.029569387435913086, 0.030554771423339844, 0.0315401554107666, 0.03252553939819336, 0.03351092338562012, 0.034496307373046875, 0.03548169136047363, 0.03646707534790039, 0.03745245933532715, 0.038437843322753906, 0.039423227310180664, 0.04040861129760742, 0.04139399528503418, 0.04237937927246094, 0.043364763259887695, 0.04435014724731445, 0.04533553123474121, 0.04632091522216797, 0.04730629920959473, 0.048291683197021484, 0.04927706718444824, 0.050262451171875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 6.0, 10.0, 17.0, 63.0, 213.0, 304.0, 188.0, 100.0, 46.0, 22.0, 14.0, 5.0, 5.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11292285472154617, -0.10438553988933563, -0.09584823250770569, -0.08731091767549515, -0.0787736028432846, -0.07023629546165466, -0.06169898062944412, -0.05316166952252388, -0.04462435841560364, -0.036087047308683395, -0.027549734339118004, -0.019012421369552612, -0.01047511026263237, -0.0019377991557121277, 0.006599515676498413, 0.015136826783418655, 0.023674137890338898, 0.03221144899725914, 0.04074876010417938, 0.04928607493638992, 0.057823386043310165, 0.06636069715023041, 0.07489801198244095, 0.08343532681465149, 0.09197263419628143, 0.10050994902849197, 0.10904725641012192, 0.11758457124233246, 0.1261218786239624, 0.13465920090675354, 0.14319650828838348, 0.15173381567001343, 0.16027113795280457, 0.1688084453344345, 0.17734576761722565, 0.1858830749988556, 0.19442038238048553, 0.20295768976211548, 0.21149501204490662, 0.22003231942653656, 0.2285696268081665, 0.23710693418979645, 0.24564425647258759, 0.25418156385421753, 0.26271888613700867, 0.2712561786174774, 0.27979350090026855, 0.2883308231830597, 0.29686814546585083, 0.30540546774864197, 0.3139427602291107, 0.32248008251190186, 0.331017404794693, 0.33955469727516174, 0.3480920195579529, 0.356629341840744, 0.36516663432121277, 0.3737039566040039, 0.38224124908447266, 0.3907785713672638, 0.39931589365005493, 0.4078531861305237, 0.4163905084133148, 0.42492783069610596, 0.4334651231765747]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 7.0, 5.0, 8.0, 14.0, 13.0, 26.0, 19.0, 18.0, 23.0, 36.0, 39.0, 49.0, 38.0, 49.0, 41.0, 37.0, 48.0, 54.0, 53.0, 30.0, 46.0, 40.0, 46.0, 23.0, 26.0, 28.0, 36.0, 30.0, 23.0, 9.0, 12.0, 8.0, 14.0, 9.0, 10.0, 6.0, 8.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.11703497171401978, -0.11370910704135895, -0.11038324236869812, -0.10705737769603729, -0.10373151302337646, -0.10040564835071564, -0.0970797911286354, -0.09375392645597458, -0.09042806178331375, -0.08710219711065292, -0.0837763324379921, -0.08045046776533127, -0.07712461054325104, -0.07379874587059021, -0.07047288119792938, -0.06714701652526855, -0.06382115185260773, -0.0604952871799469, -0.05716942250728607, -0.05384356155991554, -0.050517696887254715, -0.04719183221459389, -0.04386597126722336, -0.04054010659456253, -0.0372142419219017, -0.033888377249240875, -0.030562514439225197, -0.02723665162920952, -0.02391078695654869, -0.020584922283887863, -0.017259059473872185, -0.013933196663856506, -0.010607331991195679, -0.007281468249857426, -0.003955604508519173, -0.0006297407671809196, 0.0026961229741573334, 0.006021987646818161, 0.00934785045683384, 0.012673713266849518, 0.015999577939510345, 0.019325442612171173, 0.02265130542218685, 0.02597716823220253, 0.029303032904863358, 0.032628897577524185, 0.035954758524894714, 0.03928062319755554, 0.04260648787021637, 0.0459323525428772, 0.049258217215538025, 0.052584078162908554, 0.05590994283556938, 0.05923580750823021, 0.06256166845560074, 0.06588753312826157, 0.0692133978009224, 0.07253926247358322, 0.07586512714624405, 0.07919099181890488, 0.08251684904098511, 0.08584271371364594, 0.08916857838630676, 0.09249444305896759, 0.09582030773162842]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 7.0, 11.0, 11.0, 13.0, 16.0, 30.0, 38.0, 45.0, 74.0, 108.0, 160.0, 216.0, 354.0, 678.0, 1233.0, 2574.0, 6017.0, 17338.0, 68595.0, 425799.0, 427004.0, 69015.0, 17572.0, 6042.0, 2589.0, 1236.0, 662.0, 362.0, 235.0, 156.0, 91.0, 72.0, 47.0, 32.0, 23.0, 32.0, 22.0, 13.0, 8.0, 6.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0259246826171875, -0.025162220001220703, -0.024399757385253906, -0.02363729476928711, -0.022874832153320312, -0.022112369537353516, -0.02134990692138672, -0.020587444305419922, -0.019824981689453125, -0.019062519073486328, -0.01830005645751953, -0.017537593841552734, -0.016775131225585938, -0.01601266860961914, -0.015250205993652344, -0.014487743377685547, -0.01372528076171875, -0.012962818145751953, -0.012200355529785156, -0.01143789291381836, -0.010675430297851562, -0.009912967681884766, -0.009150505065917969, -0.008388042449951172, -0.007625579833984375, -0.006863117218017578, -0.006100654602050781, -0.005338191986083984, -0.0045757293701171875, -0.0038132667541503906, -0.0030508041381835938, -0.002288341522216797, -0.00152587890625, -0.0007634162902832031, -9.5367431640625e-07, 0.0007615089416503906, 0.0015239715576171875, 0.0022864341735839844, 0.0030488967895507812, 0.003811359405517578, 0.004573822021484375, 0.005336284637451172, 0.006098747253417969, 0.006861209869384766, 0.0076236724853515625, 0.00838613510131836, 0.009148597717285156, 0.009911060333251953, 0.01067352294921875, 0.011435985565185547, 0.012198448181152344, 0.01296091079711914, 0.013723373413085938, 0.014485836029052734, 0.015248298645019531, 0.016010761260986328, 0.016773223876953125, 0.017535686492919922, 0.01829814910888672, 0.019060611724853516, 0.019823074340820312, 0.02058553695678711, 0.021347999572753906, 0.022110462188720703, 0.0228729248046875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 2.0, 4.0, 7.0, 4.0, 6.0, 18.0, 26.0, 34.0, 57.0, 112.0, 112.0, 163.0, 153.0, 100.0, 84.0, 40.0, 22.0, 13.0, 20.0, 5.0, 7.0, 2.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0179595947265625, -0.01737236976623535, -0.016785144805908203, -0.016197919845581055, -0.015610694885253906, -0.015023469924926758, -0.01443624496459961, -0.013849020004272461, -0.013261795043945312, -0.012674570083618164, -0.012087345123291016, -0.011500120162963867, -0.010912895202636719, -0.01032567024230957, -0.009738445281982422, -0.009151220321655273, -0.008563995361328125, -0.007976770401000977, -0.007389545440673828, -0.00680232048034668, -0.006215095520019531, -0.005627870559692383, -0.005040645599365234, -0.004453420639038086, -0.0038661956787109375, -0.003278970718383789, -0.0026917457580566406, -0.002104520797729492, -0.0015172958374023438, -0.0009300708770751953, -0.0003428459167480469, 0.00024437904357910156, 0.00083160400390625, 0.0014188289642333984, 0.002006053924560547, 0.0025932788848876953, 0.0031805038452148438, 0.003767728805541992, 0.004354953765869141, 0.004942178726196289, 0.0055294036865234375, 0.006116628646850586, 0.006703853607177734, 0.007291078567504883, 0.007878303527832031, 0.00846552848815918, 0.009052753448486328, 0.009639978408813477, 0.010227203369140625, 0.010814428329467773, 0.011401653289794922, 0.01198887825012207, 0.012576103210449219, 0.013163328170776367, 0.013750553131103516, 0.014337778091430664, 0.014925003051757812, 0.015512228012084961, 0.01609945297241211, 0.016686677932739258, 0.017273902893066406, 0.017861127853393555, 0.018448352813720703, 0.01903557777404785, 0.019622802734375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 6.0, 2.0, 5.0, 17.0, 14.0, 20.0, 15.0, 22.0, 42.0, 58.0, 72.0, 125.0, 165.0, 258.0, 404.0, 707.0, 1359.0, 2813.0, 7144.0, 23138.0, 105072.0, 645026.0, 204729.0, 38597.0, 10685.0, 3975.0, 1765.0, 871.0, 492.0, 315.0, 192.0, 127.0, 81.0, 75.0, 42.0, 34.0, 25.0, 18.0, 14.0, 6.0, 9.0, 8.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0289764404296875, -0.028061866760253906, -0.027147293090820312, -0.02623271942138672, -0.025318145751953125, -0.02440357208251953, -0.023488998413085938, -0.022574424743652344, -0.02165985107421875, -0.020745277404785156, -0.019830703735351562, -0.01891613006591797, -0.018001556396484375, -0.01708698272705078, -0.016172409057617188, -0.015257835388183594, -0.01434326171875, -0.013428688049316406, -0.012514114379882812, -0.011599540710449219, -0.010684967041015625, -0.009770393371582031, -0.008855819702148438, -0.007941246032714844, -0.00702667236328125, -0.006112098693847656, -0.0051975250244140625, -0.004282951354980469, -0.003368377685546875, -0.0024538040161132812, -0.0015392303466796875, -0.0006246566772460938, 0.0002899169921875, 0.0012044906616210938, 0.0021190643310546875, 0.0030336380004882812, 0.003948211669921875, 0.004862785339355469, 0.0057773590087890625, 0.006691932678222656, 0.00760650634765625, 0.008521080017089844, 0.009435653686523438, 0.010350227355957031, 0.011264801025390625, 0.012179374694824219, 0.013093948364257812, 0.014008522033691406, 0.014923095703125, 0.015837669372558594, 0.016752243041992188, 0.01766681671142578, 0.018581390380859375, 0.01949596405029297, 0.020410537719726562, 0.021325111389160156, 0.02223968505859375, 0.023154258728027344, 0.024068832397460938, 0.02498340606689453, 0.025897979736328125, 0.02681255340576172, 0.027727127075195312, 0.028641700744628906, 0.0295562744140625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 12.0, 11.0, 11.0, 12.0, 15.0, 15.0, 18.0, 30.0, 36.0, 59.0, 59.0, 43.0, 44.0, 60.0, 67.0, 54.0, 54.0, 68.0, 56.0, 38.0, 47.0, 29.0, 39.0, 30.0, 19.0, 20.0, 12.0, 8.0, 12.0, 3.0, 6.0, 5.0, 3.0, 1.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.047210693359375, -0.045955657958984375, -0.04470062255859375, -0.043445587158203125, -0.0421905517578125, -0.040935516357421875, -0.03968048095703125, -0.038425445556640625, -0.03717041015625, -0.035915374755859375, -0.03466033935546875, -0.033405303955078125, -0.0321502685546875, -0.030895233154296875, -0.02964019775390625, -0.028385162353515625, -0.027130126953125, -0.025875091552734375, -0.02462005615234375, -0.023365020751953125, -0.0221099853515625, -0.020854949951171875, -0.01959991455078125, -0.018344879150390625, -0.01708984375, -0.015834808349609375, -0.01457977294921875, -0.013324737548828125, -0.0120697021484375, -0.010814666748046875, -0.00955963134765625, -0.008304595947265625, -0.007049560546875, -0.005794525146484375, -0.00453948974609375, -0.003284454345703125, -0.0020294189453125, -0.000774383544921875, 0.00048065185546875, 0.001735687255859375, 0.00299072265625, 0.004245758056640625, 0.00550079345703125, 0.006755828857421875, 0.0080108642578125, 0.009265899658203125, 0.01052093505859375, 0.011775970458984375, 0.013031005859375, 0.014286041259765625, 0.01554107666015625, 0.016796112060546875, 0.0180511474609375, 0.019306182861328125, 0.02056121826171875, 0.021816253662109375, 0.0230712890625, 0.024326324462890625, 0.02558135986328125, 0.026836395263671875, 0.0280914306640625, 0.029346466064453125, 0.03060150146484375, 0.031856536865234375, 0.033111572265625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 8.0, 5.0, 11.0, 11.0, 17.0, 24.0, 24.0, 33.0, 35.0, 55.0, 94.0, 136.0, 221.0, 419.0, 849.0, 2004.0, 6021.0, 27192.0, 357440.0, 611269.0, 31925.0, 6597.0, 2135.0, 909.0, 422.0, 243.0, 116.0, 102.0, 62.0, 35.0, 36.0, 24.0, 25.0, 15.0, 10.0, 3.0, 3.0, 3.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.01200103759765625, -0.011601567268371582, -0.011202096939086914, -0.010802626609802246, -0.010403156280517578, -0.01000368595123291, -0.009604215621948242, -0.009204745292663574, -0.008805274963378906, -0.008405804634094238, -0.00800633430480957, -0.007606863975524902, -0.007207393646240234, -0.006807923316955566, -0.0064084529876708984, -0.0060089826583862305, -0.0056095123291015625, -0.0052100419998168945, -0.0048105716705322266, -0.004411101341247559, -0.004011631011962891, -0.0036121606826782227, -0.0032126903533935547, -0.0028132200241088867, -0.0024137496948242188, -0.0020142793655395508, -0.0016148090362548828, -0.0012153387069702148, -0.0008158683776855469, -0.0004163980484008789, -1.6927719116210938e-05, 0.00038254261016845703, 0.000782012939453125, 0.001181483268737793, 0.001580953598022461, 0.001980423927307129, 0.002379894256591797, 0.002779364585876465, 0.003178834915161133, 0.0035783052444458008, 0.003977775573730469, 0.004377245903015137, 0.004776716232299805, 0.005176186561584473, 0.005575656890869141, 0.005975127220153809, 0.0063745975494384766, 0.0067740678787231445, 0.0071735382080078125, 0.0075730085372924805, 0.007972478866577148, 0.008371949195861816, 0.008771419525146484, 0.009170889854431152, 0.00957036018371582, 0.009969830513000488, 0.010369300842285156, 0.010768771171569824, 0.011168241500854492, 0.01156771183013916, 0.011967182159423828, 0.012366652488708496, 0.012766122817993164, 0.013165593147277832, 0.0135650634765625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 4.0, 4.0, 11.0, 9.0, 8.0, 20.0, 14.0, 18.0, 34.0, 40.0, 42.0, 51.0, 61.0, 71.0, 100.0, 56.0, 81.0, 74.0, 46.0, 60.0, 33.0, 41.0, 34.0, 24.0, 10.0, 2.0, 15.0, 10.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.556510925292969e-06, -6.3320621848106384e-06, -6.107613444328308e-06, -5.883164703845978e-06, -5.6587159633636475e-06, -5.434267222881317e-06, -5.209818482398987e-06, -4.9853697419166565e-06, -4.760921001434326e-06, -4.536472260951996e-06, -4.3120235204696655e-06, -4.087574779987335e-06, -3.863126039505005e-06, -3.6386772990226746e-06, -3.4142285585403442e-06, -3.189779818058014e-06, -2.9653310775756836e-06, -2.7408823370933533e-06, -2.516433596611023e-06, -2.2919848561286926e-06, -2.0675361156463623e-06, -1.843087375164032e-06, -1.6186386346817017e-06, -1.3941898941993713e-06, -1.169741153717041e-06, -9.452924132347107e-07, -7.208436727523804e-07, -4.9639493227005e-07, -2.7194619178771973e-07, -4.7497451305389404e-08, 1.7695128917694092e-07, 4.0140002965927124e-07, 6.258487701416016e-07, 8.502975106239319e-07, 1.0747462511062622e-06, 1.2991949915885925e-06, 1.5236437320709229e-06, 1.7480924725532532e-06, 1.9725412130355835e-06, 2.196989953517914e-06, 2.421438694000244e-06, 2.6458874344825745e-06, 2.8703361749649048e-06, 3.094784915447235e-06, 3.3192336559295654e-06, 3.5436823964118958e-06, 3.768131136894226e-06, 3.992579877376556e-06, 4.217028617858887e-06, 4.441477358341217e-06, 4.665926098823547e-06, 4.890374839305878e-06, 5.114823579788208e-06, 5.339272320270538e-06, 5.563721060752869e-06, 5.788169801235199e-06, 6.012618541717529e-06, 6.23706728219986e-06, 6.46151602268219e-06, 6.68596476316452e-06, 6.910413503646851e-06, 7.134862244129181e-06, 7.359310984611511e-06, 7.5837597250938416e-06, 7.808208465576172e-06]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 2.0, 11.0, 11.0, 7.0, 15.0, 19.0, 12.0, 24.0, 42.0, 62.0, 83.0, 141.0, 243.0, 333.0, 657.0, 1248.0, 2705.0, 6763.0, 26000.0, 354292.0, 612108.0, 30520.0, 7498.0, 2716.0, 1309.0, 682.0, 364.0, 221.0, 137.0, 86.0, 65.0, 60.0, 30.0, 19.0, 21.0, 11.0, 9.0, 8.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.012542724609375, -0.012095451354980469, -0.011648178100585938, -0.011200904846191406, -0.010753631591796875, -0.010306358337402344, -0.009859085083007812, -0.009411811828613281, -0.00896453857421875, -0.008517265319824219, -0.008069992065429688, -0.007622718811035156, -0.007175445556640625, -0.006728172302246094, -0.0062808990478515625, -0.005833625793457031, -0.0053863525390625, -0.004939079284667969, -0.0044918060302734375, -0.004044532775878906, -0.003597259521484375, -0.0031499862670898438, -0.0027027130126953125, -0.0022554397583007812, -0.00180816650390625, -0.0013608932495117188, -0.0009136199951171875, -0.00046634674072265625, -1.9073486328125e-05, 0.00042819976806640625, 0.0008754730224609375, 0.0013227462768554688, 0.00177001953125, 0.0022172927856445312, 0.0026645660400390625, 0.0031118392944335938, 0.003559112548828125, 0.004006385803222656, 0.0044536590576171875, 0.004900932312011719, 0.00534820556640625, 0.005795478820800781, 0.0062427520751953125, 0.006690025329589844, 0.007137298583984375, 0.007584571838378906, 0.008031845092773438, 0.008479118347167969, 0.0089263916015625, 0.009373664855957031, 0.009820938110351562, 0.010268211364746094, 0.010715484619140625, 0.011162757873535156, 0.011610031127929688, 0.012057304382324219, 0.01250457763671875, 0.012951850891113281, 0.013399124145507812, 0.013846397399902344, 0.014293670654296875, 0.014740943908691406, 0.015188217163085938, 0.01563549041748047, 0.016082763671875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 8.0, 5.0, 9.0, 13.0, 13.0, 19.0, 32.0, 27.0, 52.0, 78.0, 103.0, 116.0, 118.0, 107.0, 83.0, 55.0, 36.0, 25.0, 24.0, 24.0, 7.0, 8.0, 4.0, 7.0, 3.0, 5.0, 3.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01313018798828125, -0.012662768363952637, -0.012195348739624023, -0.01172792911529541, -0.011260509490966797, -0.010793089866638184, -0.01032567024230957, -0.009858250617980957, -0.009390830993652344, -0.00892341136932373, -0.008455991744995117, -0.007988572120666504, -0.007521152496337891, -0.007053732872009277, -0.006586313247680664, -0.006118893623352051, -0.0056514739990234375, -0.005184054374694824, -0.004716634750366211, -0.004249215126037598, -0.0037817955017089844, -0.003314375877380371, -0.002846956253051758, -0.0023795366287231445, -0.0019121170043945312, -0.001444697380065918, -0.0009772777557373047, -0.0005098581314086914, -4.2438507080078125e-05, 0.00042498111724853516, 0.0008924007415771484, 0.0013598203659057617, 0.001827239990234375, 0.0022946596145629883, 0.0027620792388916016, 0.003229498863220215, 0.003696918487548828, 0.004164338111877441, 0.004631757736206055, 0.005099177360534668, 0.005566596984863281, 0.0060340166091918945, 0.006501436233520508, 0.006968855857849121, 0.007436275482177734, 0.007903695106506348, 0.008371114730834961, 0.008838534355163574, 0.009305953979492188, 0.0097733736038208, 0.010240793228149414, 0.010708212852478027, 0.01117563247680664, 0.011643052101135254, 0.012110471725463867, 0.01257789134979248, 0.013045310974121094, 0.013512730598449707, 0.01398015022277832, 0.014447569847106934, 0.014914989471435547, 0.01538240909576416, 0.015849828720092773, 0.016317248344421387, 0.01678466796875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 7.0, 0.0, 5.0, 14.0, 25.0, 51.0, 86.0, 205.0, 317.0, 184.0, 62.0, 17.0, 11.0, 1.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4073047637939453, -0.39484289288520813, -0.38238105177879333, -0.36991918087005615, -0.35745733976364136, -0.3449954688549042, -0.332533597946167, -0.3200717568397522, -0.3076099157333374, -0.2951480448246002, -0.2826862037181854, -0.27022433280944824, -0.25776249170303345, -0.24530062079429626, -0.23283876478672028, -0.2203769087791443, -0.2079150378704071, -0.19545318186283112, -0.18299132585525513, -0.17052945494651794, -0.15806761384010315, -0.14560574293136597, -0.13314388692378998, -0.12068203091621399, -0.108220174908638, -0.09575831890106201, -0.08329646289348602, -0.07083459943532944, -0.05837274342775345, -0.04591088742017746, -0.033449023962020874, -0.020987167954444885, -0.008525311946868896, 0.0039365459233522415, 0.01639840379357338, 0.028860263526439667, 0.041322119534015656, 0.053783975541591644, 0.06624583899974823, 0.07870769500732422, 0.09116955101490021, 0.1036314070224762, 0.11609326303005219, 0.12855511903762817, 0.14101698994636536, 0.15347883105278015, 0.16594070196151733, 0.17840255796909332, 0.1908644139766693, 0.2033262699842453, 0.2157881259918213, 0.22824999690055847, 0.24071183800697327, 0.25317370891571045, 0.26563555002212524, 0.2780974209308624, 0.2905592918395996, 0.3030211627483368, 0.3154830038547516, 0.32794487476348877, 0.34040671586990356, 0.35286858677864075, 0.36533045768737793, 0.3777922987937927, 0.3902541399002075]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 2.0, 2.0, 5.0, 9.0, 8.0, 10.0, 8.0, 17.0, 18.0, 9.0, 15.0, 25.0, 37.0, 27.0, 25.0, 26.0, 40.0, 52.0, 72.0, 72.0, 95.0, 49.0, 51.0, 49.0, 34.0, 40.0, 27.0, 18.0, 29.0, 14.0, 22.0, 21.0, 11.0, 14.0, 8.0, 20.0, 5.0, 4.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.16855734586715698, -0.1632978916168213, -0.1580384373664856, -0.1527789831161499, -0.1475195437669754, -0.1422600895166397, -0.13700063526630402, -0.13174118101596832, -0.12648174166679382, -0.12122228741645813, -0.11596284061670303, -0.11070338636636734, -0.10544393956661224, -0.10018448531627655, -0.09492503106594086, -0.08966557681560516, -0.08440612256526947, -0.07914666831493378, -0.07388722151517868, -0.06862776726484299, -0.06336832046508789, -0.0581088662147522, -0.052849411964416504, -0.04758996143937111, -0.042330510914325714, -0.03707106038928032, -0.031811609864234924, -0.02655215561389923, -0.021292705088853836, -0.01603325456380844, -0.010773800313472748, -0.005514349788427353, -0.000254899263381958, 0.0050045521929860115, 0.010264003649353981, 0.015523456037044525, 0.02078290656208992, 0.026042357087135315, 0.03130181133747101, 0.0365612618625164, 0.0418207123875618, 0.04708016291260719, 0.05233961343765259, 0.05759906768798828, 0.06285852193832397, 0.06811796873807907, 0.07337742298841476, 0.07863686978816986, 0.08389632403850555, 0.08915577828884125, 0.09441522508859634, 0.09967467933893204, 0.10493412613868713, 0.11019358038902283, 0.11545303463935852, 0.12071248888969421, 0.1259719431400299, 0.1312313973903656, 0.1364908516407013, 0.141750305891037, 0.1470097452402115, 0.15226919949054718, 0.15752865374088287, 0.16278810799121857, 0.16804754734039307]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 11.0, 15.0, 13.0, 24.0, 43.0, 90.0, 209.0, 658.0, 6316.0, 4079828.0, 104362.0, 2052.0, 371.0, 144.0, 51.0, 41.0, 18.0, 18.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06793212890625, -0.06618022918701172, -0.06442832946777344, -0.06267642974853516, -0.060924530029296875, -0.059172630310058594, -0.05742073059082031, -0.05566883087158203, -0.05391693115234375, -0.05216503143310547, -0.05041313171386719, -0.048661231994628906, -0.046909332275390625, -0.045157432556152344, -0.04340553283691406, -0.04165363311767578, -0.0399017333984375, -0.03814983367919922, -0.03639793395996094, -0.034646034240722656, -0.032894134521484375, -0.031142234802246094, -0.029390335083007812, -0.02763843536376953, -0.02588653564453125, -0.02413463592529297, -0.022382736206054688, -0.020630836486816406, -0.018878936767578125, -0.017127037048339844, -0.015375137329101562, -0.013623237609863281, -0.011871337890625, -0.010119438171386719, -0.008367538452148438, -0.006615638732910156, -0.004863739013671875, -0.0031118392944335938, -0.0013599395751953125, 0.00039196014404296875, 0.00214385986328125, 0.0038957595825195312, 0.0056476593017578125, 0.007399559020996094, 0.009151458740234375, 0.010903358459472656, 0.012655258178710938, 0.014407157897949219, 0.0161590576171875, 0.01791095733642578, 0.019662857055664062, 0.021414756774902344, 0.023166656494140625, 0.024918556213378906, 0.026670455932617188, 0.02842235565185547, 0.03017425537109375, 0.03192615509033203, 0.03367805480957031, 0.035429954528808594, 0.037181854248046875, 0.038933753967285156, 0.04068565368652344, 0.04243755340576172, 0.044189453125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 4.0, 7.0, 8.0, 16.0, 32.0, 37.0, 60.0, 88.0, 92.0, 157.0, 157.0, 116.0, 69.0, 43.0, 41.0, 26.0, 16.0, 10.0, 11.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0182647705078125, -0.017673254013061523, -0.017081737518310547, -0.01649022102355957, -0.015898704528808594, -0.015307188034057617, -0.01471567153930664, -0.014124155044555664, -0.013532638549804688, -0.012941122055053711, -0.012349605560302734, -0.011758089065551758, -0.011166572570800781, -0.010575056076049805, -0.009983539581298828, -0.009392023086547852, -0.008800506591796875, -0.008208990097045898, -0.007617473602294922, -0.007025957107543945, -0.006434440612792969, -0.005842924118041992, -0.005251407623291016, -0.004659891128540039, -0.0040683746337890625, -0.003476858139038086, -0.0028853416442871094, -0.002293825149536133, -0.0017023086547851562, -0.0011107921600341797, -0.0005192756652832031, 7.224082946777344e-05, 0.00066375732421875, 0.0012552738189697266, 0.0018467903137207031, 0.0024383068084716797, 0.0030298233032226562, 0.003621339797973633, 0.004212856292724609, 0.004804372787475586, 0.0053958892822265625, 0.005987405776977539, 0.006578922271728516, 0.007170438766479492, 0.007761955261230469, 0.008353471755981445, 0.008944988250732422, 0.009536504745483398, 0.010128021240234375, 0.010719537734985352, 0.011311054229736328, 0.011902570724487305, 0.012494087219238281, 0.013085603713989258, 0.013677120208740234, 0.014268636703491211, 0.014860153198242188, 0.015451669692993164, 0.01604318618774414, 0.016634702682495117, 0.017226219177246094, 0.01781773567199707, 0.018409252166748047, 0.019000768661499023, 0.01959228515625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 8.0, 4.0, 7.0, 11.0, 26.0, 42.0, 49.0, 94.0, 173.0, 321.0, 619.0, 1822.0, 10694.0, 1665126.0, 2499586.0, 12409.0, 2045.0, 633.0, 292.0, 145.0, 87.0, 39.0, 24.0, 9.0, 7.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0386962890625, -0.03736257553100586, -0.03602886199951172, -0.03469514846801758, -0.03336143493652344, -0.0320277214050293, -0.030694007873535156, -0.029360294342041016, -0.028026580810546875, -0.026692867279052734, -0.025359153747558594, -0.024025440216064453, -0.022691726684570312, -0.021358013153076172, -0.02002429962158203, -0.01869058609008789, -0.01735687255859375, -0.01602315902709961, -0.014689445495605469, -0.013355731964111328, -0.012022018432617188, -0.010688304901123047, -0.009354591369628906, -0.008020877838134766, -0.006687164306640625, -0.005353450775146484, -0.004019737243652344, -0.002686023712158203, -0.0013523101806640625, -1.8596649169921875e-05, 0.0013151168823242188, 0.0026488304138183594, 0.0039825439453125, 0.005316257476806641, 0.006649971008300781, 0.007983684539794922, 0.009317398071289062, 0.010651111602783203, 0.011984825134277344, 0.013318538665771484, 0.014652252197265625, 0.015985965728759766, 0.017319679260253906, 0.018653392791748047, 0.019987106323242188, 0.021320819854736328, 0.02265453338623047, 0.02398824691772461, 0.02532196044921875, 0.02665567398071289, 0.02798938751220703, 0.029323101043701172, 0.030656814575195312, 0.03199052810668945, 0.033324241638183594, 0.034657955169677734, 0.035991668701171875, 0.037325382232666016, 0.038659095764160156, 0.0399928092956543, 0.04132652282714844, 0.04266023635864258, 0.04399394989013672, 0.04532766342163086, 0.046661376953125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 9.0, 15.0, 13.0, 25.0, 42.0, 66.0, 189.0, 832.0, 1775.0, 732.0, 176.0, 65.0, 41.0, 25.0, 13.0, 14.0, 11.0, 7.0, 6.0, 8.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.034515380859375, -0.033682823181152344, -0.03285026550292969, -0.03201770782470703, -0.031185150146484375, -0.03035259246826172, -0.029520034790039062, -0.028687477111816406, -0.02785491943359375, -0.027022361755371094, -0.026189804077148438, -0.02535724639892578, -0.024524688720703125, -0.02369213104248047, -0.022859573364257812, -0.022027015686035156, -0.0211944580078125, -0.020361900329589844, -0.019529342651367188, -0.01869678497314453, -0.017864227294921875, -0.01703166961669922, -0.016199111938476562, -0.015366554260253906, -0.01453399658203125, -0.013701438903808594, -0.012868881225585938, -0.012036323547363281, -0.011203765869140625, -0.010371208190917969, -0.009538650512695312, -0.008706092834472656, -0.00787353515625, -0.007040977478027344, -0.0062084197998046875, -0.005375862121582031, -0.004543304443359375, -0.0037107467651367188, -0.0028781890869140625, -0.0020456314086914062, -0.00121307373046875, -0.00038051605224609375, 0.0004520416259765625, 0.0012845993041992188, 0.002117156982421875, 0.0029497146606445312, 0.0037822723388671875, 0.004614830017089844, 0.0054473876953125, 0.006279945373535156, 0.0071125030517578125, 0.007945060729980469, 0.008777618408203125, 0.009610176086425781, 0.010442733764648438, 0.011275291442871094, 0.01210784912109375, 0.012940406799316406, 0.013772964477539062, 0.014605522155761719, 0.015438079833984375, 0.01627063751220703, 0.017103195190429688, 0.017935752868652344, 0.018768310546875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 4.0, 20.0, 63.0, 170.0, 396.0, 232.0, 73.0, 17.0, 9.0, 8.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.37230390310287476, -0.36357614398002625, -0.35484838485717773, -0.3461206257343292, -0.3373928666114807, -0.3286651074886322, -0.3199373483657837, -0.3112095892429352, -0.30248183012008667, -0.29375407099723816, -0.28502631187438965, -0.27629855275154114, -0.2675707936286926, -0.2588430345058441, -0.2501152753829956, -0.2413875162601471, -0.2326597422361374, -0.22393198311328888, -0.21520422399044037, -0.20647646486759186, -0.19774870574474335, -0.18902094662189484, -0.18029317259788513, -0.17156541347503662, -0.1628376543521881, -0.1541098952293396, -0.1453821361064911, -0.13665437698364258, -0.12792661786079407, -0.11919885873794556, -0.11047109216451645, -0.10174333304166794, -0.09301559627056122, -0.08428783714771271, -0.0755600780248642, -0.06683231890201569, -0.05810455605387688, -0.049376796931028366, -0.04064903408288956, -0.031921274960041046, -0.023193515837192535, -0.01446575578302145, -0.005737995728850365, 0.0029897652566432953, 0.011717524379491806, 0.020445283502340317, 0.029173046350479126, 0.03790080547332764, 0.04662856459617615, 0.05535632371902466, 0.06408408284187317, 0.07281184196472168, 0.08153960108757019, 0.0902673602104187, 0.09899512678384781, 0.10772288590669632, 0.11645064502954483, 0.12517841160297394, 0.13390617072582245, 0.14263392984867096, 0.15136168897151947, 0.16008944809436798, 0.1688172072172165, 0.177544966340065, 0.1862727254629135]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 3.0, 7.0, 10.0, 8.0, 12.0, 20.0, 38.0, 33.0, 47.0, 67.0, 79.0, 75.0, 81.0, 82.0, 83.0, 77.0, 79.0, 47.0, 37.0, 42.0, 25.0, 20.0, 14.0, 11.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13930761814117432, -0.1355796456336975, -0.1318516731262207, -0.1281237006187439, -0.12439573556184769, -0.12066776305437088, -0.11693979799747467, -0.11321182548999786, -0.10948385298252106, -0.10575588047504425, -0.10202790796756744, -0.09829994291067123, -0.09457197040319443, -0.09084399789571762, -0.08711603283882141, -0.0833880603313446, -0.0796600878238678, -0.07593211531639099, -0.07220414280891418, -0.06847617775201797, -0.06474820524454117, -0.06102023273706436, -0.05729226395487785, -0.053564295172691345, -0.04983632266521454, -0.04610835015773773, -0.042380381375551224, -0.038652412593364716, -0.03492444008588791, -0.03119646944105625, -0.027468498796224594, -0.023740528151392937, -0.02001255750656128, -0.016284586861729622, -0.012556616216897964, -0.008828645572066307, -0.00510067492723465, -0.0013727042824029922, 0.002355266362428665, 0.006083237007260323, 0.00981120765209198, 0.013539178296923637, 0.017267148941755295, 0.020995119586586952, 0.02472309023141861, 0.028451060876250267, 0.032179031521081924, 0.03590700030326843, 0.03963497281074524, 0.043362945318222046, 0.047090914100408554, 0.05081888288259506, 0.05454685539007187, 0.058274827897548676, 0.062002796679735184, 0.06573076546192169, 0.0694587379693985, 0.0731867104768753, 0.07691468298435211, 0.08064264804124832, 0.08437062054872513, 0.08809859305620193, 0.09182655811309814, 0.09555453062057495, 0.09928250312805176]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 6.0, 4.0, 7.0, 16.0, 16.0, 25.0, 26.0, 47.0, 79.0, 117.0, 213.0, 380.0, 664.0, 1336.0, 3087.0, 9310.0, 41401.0, 302556.0, 584488.0, 81272.0, 15374.0, 4349.0, 1772.0, 837.0, 468.0, 257.0, 174.0, 94.0, 61.0, 43.0, 27.0, 18.0, 6.0, 9.0, 8.0, 6.0, 1.0, 7.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0255279541015625, -0.02455306053161621, -0.023578166961669922, -0.022603273391723633, -0.021628379821777344, -0.020653486251831055, -0.019678592681884766, -0.018703699111938477, -0.017728805541992188, -0.0167539119720459, -0.01577901840209961, -0.01480412483215332, -0.013829231262207031, -0.012854337692260742, -0.011879444122314453, -0.010904550552368164, -0.009929656982421875, -0.008954763412475586, -0.007979869842529297, -0.007004976272583008, -0.006030082702636719, -0.00505518913269043, -0.004080295562744141, -0.0031054019927978516, -0.0021305084228515625, -0.0011556148529052734, -0.00018072128295898438, 0.0007941722869873047, 0.0017690658569335938, 0.002743959426879883, 0.003718852996826172, 0.004693746566772461, 0.00566864013671875, 0.006643533706665039, 0.007618427276611328, 0.008593320846557617, 0.009568214416503906, 0.010543107986450195, 0.011518001556396484, 0.012492895126342773, 0.013467788696289062, 0.014442682266235352, 0.01541757583618164, 0.01639246940612793, 0.01736736297607422, 0.018342256546020508, 0.019317150115966797, 0.020292043685913086, 0.021266937255859375, 0.022241830825805664, 0.023216724395751953, 0.024191617965698242, 0.02516651153564453, 0.02614140510559082, 0.02711629867553711, 0.0280911922454834, 0.029066085815429688, 0.030040979385375977, 0.031015872955322266, 0.031990766525268555, 0.032965660095214844, 0.03394055366516113, 0.03491544723510742, 0.03589034080505371, 0.036865234375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 7.0, 4.0, 7.0, 7.0, 16.0, 27.0, 32.0, 66.0, 80.0, 129.0, 139.0, 146.0, 114.0, 74.0, 50.0, 37.0, 28.0, 15.0, 6.0, 11.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0182952880859375, -0.017702341079711914, -0.017109394073486328, -0.016516447067260742, -0.015923500061035156, -0.01533055305480957, -0.014737606048583984, -0.014144659042358398, -0.013551712036132812, -0.012958765029907227, -0.01236581802368164, -0.011772871017456055, -0.011179924011230469, -0.010586977005004883, -0.009994029998779297, -0.009401082992553711, -0.008808135986328125, -0.008215188980102539, -0.007622241973876953, -0.007029294967651367, -0.006436347961425781, -0.005843400955200195, -0.005250453948974609, -0.0046575069427490234, -0.0040645599365234375, -0.0034716129302978516, -0.0028786659240722656, -0.0022857189178466797, -0.0016927719116210938, -0.0010998249053955078, -0.0005068778991699219, 8.606910705566406e-05, 0.00067901611328125, 0.001271963119506836, 0.0018649101257324219, 0.002457857131958008, 0.0030508041381835938, 0.0036437511444091797, 0.004236698150634766, 0.0048296451568603516, 0.0054225921630859375, 0.0060155391693115234, 0.006608486175537109, 0.007201433181762695, 0.007794380187988281, 0.008387327194213867, 0.008980274200439453, 0.009573221206665039, 0.010166168212890625, 0.010759115219116211, 0.011352062225341797, 0.011945009231567383, 0.012537956237792969, 0.013130903244018555, 0.01372385025024414, 0.014316797256469727, 0.014909744262695312, 0.015502691268920898, 0.016095638275146484, 0.01668858528137207, 0.017281532287597656, 0.017874479293823242, 0.018467426300048828, 0.019060373306274414, 0.0196533203125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 6.0, 6.0, 13.0, 16.0, 34.0, 30.0, 65.0, 112.0, 123.0, 202.0, 378.0, 669.0, 1255.0, 2807.0, 6433.0, 17953.0, 60927.0, 249572.0, 551606.0, 109338.0, 29403.0, 9837.0, 3943.0, 1714.0, 878.0, 483.0, 264.0, 158.0, 89.0, 71.0, 43.0, 35.0, 27.0, 15.0, 10.0, 7.0, 9.0, 3.0, 4.0, 5.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0224151611328125, -0.021673202514648438, -0.020931243896484375, -0.020189285278320312, -0.01944732666015625, -0.018705368041992188, -0.017963409423828125, -0.017221450805664062, -0.0164794921875, -0.015737533569335938, -0.014995574951171875, -0.014253616333007812, -0.01351165771484375, -0.012769699096679688, -0.012027740478515625, -0.011285781860351562, -0.0105438232421875, -0.009801864624023438, -0.009059906005859375, -0.008317947387695312, -0.00757598876953125, -0.0068340301513671875, -0.006092071533203125, -0.0053501129150390625, -0.004608154296875, -0.0038661956787109375, -0.003124237060546875, -0.0023822784423828125, -0.00164031982421875, -0.0008983612060546875, -0.000156402587890625, 0.0005855560302734375, 0.0013275146484375, 0.0020694732666015625, 0.002811431884765625, 0.0035533905029296875, 0.00429534912109375, 0.0050373077392578125, 0.005779266357421875, 0.0065212249755859375, 0.00726318359375, 0.008005142211914062, 0.008747100830078125, 0.009489059448242188, 0.01023101806640625, 0.010972976684570312, 0.011714935302734375, 0.012456893920898438, 0.0131988525390625, 0.013940811157226562, 0.014682769775390625, 0.015424728393554688, 0.01616668701171875, 0.016908645629882812, 0.017650604248046875, 0.018392562866210938, 0.019134521484375, 0.019876480102539062, 0.020618438720703125, 0.021360397338867188, 0.02210235595703125, 0.022844314575195312, 0.023586273193359375, 0.024328231811523438, 0.0250701904296875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 5.0, 3.0, 8.0, 6.0, 12.0, 12.0, 17.0, 17.0, 15.0, 16.0, 27.0, 24.0, 30.0, 40.0, 24.0, 37.0, 32.0, 39.0, 37.0, 37.0, 34.0, 53.0, 35.0, 43.0, 32.0, 33.0, 40.0, 39.0, 30.0, 37.0, 35.0, 21.0, 24.0, 8.0, 12.0, 14.0, 14.0, 9.0, 4.0, 5.0, 6.0, 6.0, 4.0, 4.0, 3.0, 3.0, 1.0, 5.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.02728271484375, -0.02645087242126465, -0.025619029998779297, -0.024787187576293945, -0.023955345153808594, -0.023123502731323242, -0.02229166030883789, -0.02145981788635254, -0.020627975463867188, -0.019796133041381836, -0.018964290618896484, -0.018132448196411133, -0.01730060577392578, -0.01646876335144043, -0.015636920928955078, -0.014805078506469727, -0.013973236083984375, -0.013141393661499023, -0.012309551239013672, -0.01147770881652832, -0.010645866394042969, -0.009814023971557617, -0.008982181549072266, -0.008150339126586914, -0.0073184967041015625, -0.006486654281616211, -0.005654811859130859, -0.004822969436645508, -0.003991127014160156, -0.0031592845916748047, -0.002327442169189453, -0.0014955997467041016, -0.00066375732421875, 0.00016808509826660156, 0.0009999275207519531, 0.0018317699432373047, 0.0026636123657226562, 0.003495454788208008, 0.004327297210693359, 0.005159139633178711, 0.0059909820556640625, 0.006822824478149414, 0.007654666900634766, 0.008486509323120117, 0.009318351745605469, 0.01015019416809082, 0.010982036590576172, 0.011813879013061523, 0.012645721435546875, 0.013477563858032227, 0.014309406280517578, 0.01514124870300293, 0.01597309112548828, 0.016804933547973633, 0.017636775970458984, 0.018468618392944336, 0.019300460815429688, 0.02013230323791504, 0.02096414566040039, 0.021795988082885742, 0.022627830505371094, 0.023459672927856445, 0.024291515350341797, 0.02512335777282715, 0.0259552001953125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 6.0, 5.0, 11.0, 14.0, 16.0, 26.0, 41.0, 63.0, 127.0, 215.0, 395.0, 831.0, 1870.0, 5055.0, 18826.0, 117266.0, 747040.0, 127586.0, 20120.0, 5339.0, 1950.0, 797.0, 403.0, 233.0, 117.0, 69.0, 51.0, 27.0, 15.0, 13.0, 5.0, 6.0, 6.0, 6.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005924224853515625, -0.005716502666473389, -0.005508780479431152, -0.005301058292388916, -0.00509333610534668, -0.004885613918304443, -0.004677891731262207, -0.004470169544219971, -0.004262447357177734, -0.004054725170135498, -0.0038470029830932617, -0.0036392807960510254, -0.003431558609008789, -0.0032238364219665527, -0.0030161142349243164, -0.00280839204788208, -0.0026006698608398438, -0.0023929476737976074, -0.002185225486755371, -0.0019775032997131348, -0.0017697811126708984, -0.0015620589256286621, -0.0013543367385864258, -0.0011466145515441895, -0.0009388923645019531, -0.0007311701774597168, -0.0005234479904174805, -0.00031572580337524414, -0.00010800361633300781, 9.971857070922852e-05, 0.00030744075775146484, 0.0005151629447937012, 0.0007228851318359375, 0.0009306073188781738, 0.0011383295059204102, 0.0013460516929626465, 0.0015537738800048828, 0.0017614960670471191, 0.0019692182540893555, 0.002176940441131592, 0.002384662628173828, 0.0025923848152160645, 0.0028001070022583008, 0.003007829189300537, 0.0032155513763427734, 0.0034232735633850098, 0.003630995750427246, 0.0038387179374694824, 0.004046440124511719, 0.004254162311553955, 0.004461884498596191, 0.004669606685638428, 0.004877328872680664, 0.0050850510597229, 0.005292773246765137, 0.005500495433807373, 0.005708217620849609, 0.005915939807891846, 0.006123661994934082, 0.006331384181976318, 0.006539106369018555, 0.006746828556060791, 0.006954550743103027, 0.007162272930145264, 0.0073699951171875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 7.0, 4.0, 12.0, 17.0, 17.0, 24.0, 38.0, 56.0, 57.0, 81.0, 69.0, 83.0, 64.0, 69.0, 81.0, 63.0, 51.0, 39.0, 37.0, 40.0, 23.0, 14.0, 12.0, 11.0, 9.0, 4.0, 3.0, 6.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.735324859619141e-06, -6.545335054397583e-06, -6.355345249176025e-06, -6.165355443954468e-06, -5.97536563873291e-06, -5.7853758335113525e-06, -5.595386028289795e-06, -5.405396223068237e-06, -5.21540641784668e-06, -5.025416612625122e-06, -4.8354268074035645e-06, -4.645437002182007e-06, -4.455447196960449e-06, -4.265457391738892e-06, -4.075467586517334e-06, -3.885477781295776e-06, -3.6954879760742188e-06, -3.505498170852661e-06, -3.3155083656311035e-06, -3.125518560409546e-06, -2.9355287551879883e-06, -2.7455389499664307e-06, -2.555549144744873e-06, -2.3655593395233154e-06, -2.175569534301758e-06, -1.9855797290802e-06, -1.7955899238586426e-06, -1.605600118637085e-06, -1.4156103134155273e-06, -1.2256205081939697e-06, -1.0356307029724121e-06, -8.456408977508545e-07, -6.556510925292969e-07, -4.6566128730773926e-07, -2.7567148208618164e-07, -8.568167686462402e-08, 1.043081283569336e-07, 2.942979335784912e-07, 4.842877388000488e-07, 6.742775440216064e-07, 8.642673492431641e-07, 1.0542571544647217e-06, 1.2442469596862793e-06, 1.434236764907837e-06, 1.6242265701293945e-06, 1.8142163753509521e-06, 2.0042061805725098e-06, 2.1941959857940674e-06, 2.384185791015625e-06, 2.5741755962371826e-06, 2.7641654014587402e-06, 2.954155206680298e-06, 3.1441450119018555e-06, 3.334134817123413e-06, 3.5241246223449707e-06, 3.7141144275665283e-06, 3.904104232788086e-06, 4.0940940380096436e-06, 4.284083843231201e-06, 4.474073648452759e-06, 4.664063453674316e-06, 4.854053258895874e-06, 5.044043064117432e-06, 5.234032869338989e-06, 5.424022674560547e-06]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 4.0, 12.0, 4.0, 14.0, 23.0, 24.0, 24.0, 41.0, 76.0, 116.0, 199.0, 304.0, 562.0, 992.0, 2085.0, 5140.0, 15600.0, 65178.0, 527149.0, 349122.0, 58339.0, 14387.0, 4814.0, 2032.0, 958.0, 514.0, 289.0, 173.0, 125.0, 85.0, 34.0, 43.0, 23.0, 12.0, 10.0, 6.0, 8.0, 11.0, 3.0, 5.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.00551605224609375, -0.005343496799468994, -0.005170941352844238, -0.004998385906219482, -0.0048258304595947266, -0.004653275012969971, -0.004480719566345215, -0.004308164119720459, -0.004135608673095703, -0.003963053226470947, -0.0037904977798461914, -0.0036179423332214355, -0.0034453868865966797, -0.003272831439971924, -0.003100275993347168, -0.002927720546722412, -0.0027551651000976562, -0.0025826096534729004, -0.0024100542068481445, -0.0022374987602233887, -0.002064943313598633, -0.001892387866973877, -0.001719832420349121, -0.0015472769737243652, -0.0013747215270996094, -0.0012021660804748535, -0.0010296106338500977, -0.0008570551872253418, -0.0006844997406005859, -0.0005119442939758301, -0.0003393888473510742, -0.00016683340072631836, 5.7220458984375e-06, 0.00017827749252319336, 0.0003508329391479492, 0.0005233883857727051, 0.0006959438323974609, 0.0008684992790222168, 0.0010410547256469727, 0.0012136101722717285, 0.0013861656188964844, 0.0015587210655212402, 0.001731276512145996, 0.001903831958770752, 0.002076387405395508, 0.0022489428520202637, 0.0024214982986450195, 0.0025940537452697754, 0.0027666091918945312, 0.002939164638519287, 0.003111720085144043, 0.003284275531768799, 0.0034568309783935547, 0.0036293864250183105, 0.0038019418716430664, 0.003974497318267822, 0.004147052764892578, 0.004319608211517334, 0.00449216365814209, 0.004664719104766846, 0.0048372745513916016, 0.005009829998016357, 0.005182385444641113, 0.005354940891265869, 0.005527496337890625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 7.0, 9.0, 5.0, 16.0, 20.0, 14.0, 30.0, 38.0, 50.0, 59.0, 84.0, 94.0, 93.0, 104.0, 87.0, 68.0, 44.0, 48.0, 37.0, 24.0, 17.0, 15.0, 8.0, 5.0, 6.0, 8.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0081787109375, -0.007892131805419922, -0.007605552673339844, -0.007318973541259766, -0.0070323944091796875, -0.006745815277099609, -0.006459236145019531, -0.006172657012939453, -0.005886077880859375, -0.005599498748779297, -0.005312919616699219, -0.005026340484619141, -0.0047397613525390625, -0.004453182220458984, -0.004166603088378906, -0.003880023956298828, -0.00359344482421875, -0.003306865692138672, -0.0030202865600585938, -0.0027337074279785156, -0.0024471282958984375, -0.0021605491638183594, -0.0018739700317382812, -0.0015873908996582031, -0.001300811767578125, -0.0010142326354980469, -0.0007276535034179688, -0.0004410743713378906, -0.0001544952392578125, 0.00013208389282226562, 0.00041866302490234375, 0.0007052421569824219, 0.0009918212890625, 0.0012784004211425781, 0.0015649795532226562, 0.0018515586853027344, 0.0021381378173828125, 0.0024247169494628906, 0.0027112960815429688, 0.002997875213623047, 0.003284454345703125, 0.003571033477783203, 0.0038576126098632812, 0.004144191741943359, 0.0044307708740234375, 0.004717350006103516, 0.005003929138183594, 0.005290508270263672, 0.00557708740234375, 0.005863666534423828, 0.006150245666503906, 0.006436824798583984, 0.0067234039306640625, 0.007009983062744141, 0.007296562194824219, 0.007583141326904297, 0.007869720458984375, 0.008156299591064453, 0.008442878723144531, 0.00872945785522461, 0.009016036987304688, 0.009302616119384766, 0.009589195251464844, 0.009875774383544922, 0.010162353515625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 5.0, 3.0, 1.0, 10.0, 13.0, 12.0, 23.0, 50.0, 85.0, 133.0, 221.0, 197.0, 112.0, 66.0, 27.0, 14.0, 12.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26822367310523987, -0.2616836726665497, -0.2551436722278595, -0.2486036717891693, -0.24206367135047913, -0.23552367091178894, -0.22898367047309875, -0.22244367003440857, -0.21590366959571838, -0.2093636691570282, -0.202823668718338, -0.19628366827964783, -0.18974366784095764, -0.18320366740226746, -0.17666366696357727, -0.17012366652488708, -0.1635836660861969, -0.1570436656475067, -0.15050366520881653, -0.14396366477012634, -0.13742366433143616, -0.13088366389274597, -0.12434366345405579, -0.1178036630153656, -0.11126366257667542, -0.10472366213798523, -0.09818366169929504, -0.09164366126060486, -0.08510366082191467, -0.07856366038322449, -0.0720236599445343, -0.06548365950584412, -0.05894364416599274, -0.05240364372730255, -0.045863643288612366, -0.03932364284992218, -0.032783642411231995, -0.02624364197254181, -0.019703641533851624, -0.013163641095161438, -0.0066236406564712524, -8.36402177810669e-05, 0.006456360220909119, 0.012996360659599304, 0.01953636109828949, 0.026076361536979675, 0.03261636197566986, 0.039156362414360046, 0.04569636285305023, 0.05223636329174042, 0.0587763637304306, 0.06531636416912079, 0.07185636460781097, 0.07839636504650116, 0.08493636548519135, 0.09147636592388153, 0.09801636636257172, 0.1045563668012619, 0.11109636723995209, 0.11763636767864227, 0.12417636811733246, 0.13071636855602264, 0.13725636899471283, 0.14379636943340302, 0.1503363698720932]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 5.0, 1.0, 4.0, 12.0, 9.0, 12.0, 8.0, 12.0, 19.0, 19.0, 11.0, 16.0, 17.0, 19.0, 28.0, 33.0, 19.0, 33.0, 39.0, 49.0, 66.0, 73.0, 73.0, 62.0, 49.0, 43.0, 29.0, 38.0, 28.0, 19.0, 22.0, 19.0, 26.0, 15.0, 14.0, 15.0, 9.0, 7.0, 5.0, 5.0, 6.0, 7.0, 7.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.12892520427703857, -0.12518279254436493, -0.12144038826227188, -0.11769797652959824, -0.11395557224750519, -0.11021316051483154, -0.1064707487821579, -0.10272833704948425, -0.0989859327673912, -0.09524352103471756, -0.09150111675262451, -0.08775870501995087, -0.08401629328727722, -0.08027388900518417, -0.07653147727251053, -0.07278907299041748, -0.06904666125774384, -0.06530424952507019, -0.06156184524297714, -0.0578194335103035, -0.05407702550292015, -0.050334617495536804, -0.04659220576286316, -0.04284979775547981, -0.039107389748096466, -0.03536498174071312, -0.03162257373332977, -0.027880162000656128, -0.02413775399327278, -0.020395345985889435, -0.01665293611586094, -0.012910526245832443, -0.009168118238449097, -0.0054257092997431755, -0.0016833003610372543, 0.002059108577668667, 0.005801517516374588, 0.009543925523757935, 0.01328633539378643, 0.017028745263814926, 0.020771153271198273, 0.02451356127858162, 0.028255971148610115, 0.03199838101863861, 0.03574078902602196, 0.039483197033405304, 0.04322560876607895, 0.046968016773462296, 0.05071042478084564, 0.05445283278822899, 0.058195240795612335, 0.06193765252828598, 0.06568005681037903, 0.06942246854305267, 0.07316488027572632, 0.07690729200839996, 0.08064969629049301, 0.08439210802316666, 0.0881345123052597, 0.09187692403793335, 0.095619335770607, 0.09936174005270004, 0.10310415178537369, 0.10684655606746674, 0.11058896780014038]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 3.0, 8.0, 3.0, 11.0, 9.0, 18.0, 21.0, 41.0, 51.0, 103.0, 179.0, 363.0, 820.0, 2116.0, 6987.0, 42268.0, 2654113.0, 1440820.0, 35181.0, 7297.0, 2241.0, 847.0, 360.0, 189.0, 91.0, 46.0, 33.0, 19.0, 18.0, 10.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 6.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0201416015625, -0.019610881805419922, -0.019080162048339844, -0.018549442291259766, -0.018018722534179688, -0.01748800277709961, -0.01695728302001953, -0.016426563262939453, -0.015895843505859375, -0.015365123748779297, -0.014834403991699219, -0.01430368423461914, -0.013772964477539062, -0.013242244720458984, -0.012711524963378906, -0.012180805206298828, -0.01165008544921875, -0.011119365692138672, -0.010588645935058594, -0.010057926177978516, -0.009527206420898438, -0.00899648666381836, -0.008465766906738281, -0.007935047149658203, -0.007404327392578125, -0.006873607635498047, -0.006342887878417969, -0.005812168121337891, -0.0052814483642578125, -0.004750728607177734, -0.004220008850097656, -0.003689289093017578, -0.0031585693359375, -0.002627849578857422, -0.0020971298217773438, -0.0015664100646972656, -0.0010356903076171875, -0.0005049705505371094, 2.574920654296875e-05, 0.0005564689636230469, 0.001087188720703125, 0.0016179084777832031, 0.0021486282348632812, 0.0026793479919433594, 0.0032100677490234375, 0.0037407875061035156, 0.004271507263183594, 0.004802227020263672, 0.00533294677734375, 0.005863666534423828, 0.006394386291503906, 0.006925106048583984, 0.0074558258056640625, 0.00798654556274414, 0.008517265319824219, 0.009047985076904297, 0.009578704833984375, 0.010109424591064453, 0.010640144348144531, 0.01117086410522461, 0.011701583862304688, 0.012232303619384766, 0.012763023376464844, 0.013293743133544922, 0.013824462890625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 6.0, 18.0, 25.0, 42.0, 59.0, 86.0, 104.0, 151.0, 135.0, 119.0, 84.0, 55.0, 45.0, 22.0, 17.0, 16.0, 6.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0184326171875, -0.0178377628326416, -0.017242908477783203, -0.016648054122924805, -0.016053199768066406, -0.015458345413208008, -0.01486349105834961, -0.014268636703491211, -0.013673782348632812, -0.013078927993774414, -0.012484073638916016, -0.011889219284057617, -0.011294364929199219, -0.01069951057434082, -0.010104656219482422, -0.009509801864624023, -0.008914947509765625, -0.008320093154907227, -0.007725238800048828, -0.00713038444519043, -0.006535530090332031, -0.005940675735473633, -0.005345821380615234, -0.004750967025756836, -0.0041561126708984375, -0.003561258316040039, -0.0029664039611816406, -0.002371549606323242, -0.0017766952514648438, -0.0011818408966064453, -0.0005869865417480469, 7.867813110351562e-06, 0.00060272216796875, 0.0011975765228271484, 0.0017924308776855469, 0.0023872852325439453, 0.0029821395874023438, 0.003576993942260742, 0.004171848297119141, 0.004766702651977539, 0.0053615570068359375, 0.005956411361694336, 0.006551265716552734, 0.007146120071411133, 0.007740974426269531, 0.00833582878112793, 0.008930683135986328, 0.009525537490844727, 0.010120391845703125, 0.010715246200561523, 0.011310100555419922, 0.01190495491027832, 0.012499809265136719, 0.013094663619995117, 0.013689517974853516, 0.014284372329711914, 0.014879226684570312, 0.015474081039428711, 0.01606893539428711, 0.016663789749145508, 0.017258644104003906, 0.017853498458862305, 0.018448352813720703, 0.0190432071685791, 0.0196380615234375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 7.0, 9.0, 20.0, 19.0, 20.0, 50.0, 70.0, 177.0, 561.0, 1684.0, 5762.0, 35450.0, 3840756.0, 290430.0, 14257.0, 3331.0, 1038.0, 349.0, 121.0, 52.0, 39.0, 25.0, 13.0, 8.0, 7.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0242767333984375, -0.023402929306030273, -0.022529125213623047, -0.02165532112121582, -0.020781517028808594, -0.019907712936401367, -0.01903390884399414, -0.018160104751586914, -0.017286300659179688, -0.01641249656677246, -0.015538692474365234, -0.014664888381958008, -0.013791084289550781, -0.012917280197143555, -0.012043476104736328, -0.011169672012329102, -0.010295867919921875, -0.009422063827514648, -0.008548259735107422, -0.007674455642700195, -0.006800651550292969, -0.005926847457885742, -0.005053043365478516, -0.004179239273071289, -0.0033054351806640625, -0.002431631088256836, -0.0015578269958496094, -0.0006840229034423828, 0.00018978118896484375, 0.0010635852813720703, 0.0019373893737792969, 0.0028111934661865234, 0.00368499755859375, 0.0045588016510009766, 0.005432605743408203, 0.00630640983581543, 0.007180213928222656, 0.008054018020629883, 0.00892782211303711, 0.009801626205444336, 0.010675430297851562, 0.011549234390258789, 0.012423038482666016, 0.013296842575073242, 0.014170646667480469, 0.015044450759887695, 0.015918254852294922, 0.01679205894470215, 0.017665863037109375, 0.0185396671295166, 0.019413471221923828, 0.020287275314331055, 0.02116107940673828, 0.022034883499145508, 0.022908687591552734, 0.02378249168395996, 0.024656295776367188, 0.025530099868774414, 0.02640390396118164, 0.027277708053588867, 0.028151512145996094, 0.02902531623840332, 0.029899120330810547, 0.030772924423217773, 0.031646728515625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 5.0, 9.0, 13.0, 21.0, 25.0, 39.0, 64.0, 130.0, 329.0, 814.0, 1340.0, 659.0, 265.0, 135.0, 59.0, 36.0, 31.0, 28.0, 7.0, 10.0, 6.0, 4.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0178680419921875, -0.017348527908325195, -0.01682901382446289, -0.016309499740600586, -0.01578998565673828, -0.015270471572875977, -0.014750957489013672, -0.014231443405151367, -0.013711929321289062, -0.013192415237426758, -0.012672901153564453, -0.012153387069702148, -0.011633872985839844, -0.011114358901977539, -0.010594844818115234, -0.01007533073425293, -0.009555816650390625, -0.00903630256652832, -0.008516788482666016, -0.007997274398803711, -0.007477760314941406, -0.0069582462310791016, -0.006438732147216797, -0.005919218063354492, -0.0053997039794921875, -0.004880189895629883, -0.004360675811767578, -0.0038411617279052734, -0.0033216476440429688, -0.002802133560180664, -0.0022826194763183594, -0.0017631053924560547, -0.00124359130859375, -0.0007240772247314453, -0.00020456314086914062, 0.00031495094299316406, 0.0008344650268554688, 0.0013539791107177734, 0.0018734931945800781, 0.002393007278442383, 0.0029125213623046875, 0.003432035446166992, 0.003951549530029297, 0.0044710636138916016, 0.004990577697753906, 0.005510091781616211, 0.006029605865478516, 0.00654911994934082, 0.007068634033203125, 0.00758814811706543, 0.008107662200927734, 0.008627176284790039, 0.009146690368652344, 0.009666204452514648, 0.010185718536376953, 0.010705232620239258, 0.011224746704101562, 0.011744260787963867, 0.012263774871826172, 0.012783288955688477, 0.013302803039550781, 0.013822317123413086, 0.01434183120727539, 0.014861345291137695, 0.015380859375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 12.0, 37.0, 109.0, 327.0, 335.0, 116.0, 44.0, 13.0, 7.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1360357701778412, -0.12922190129756927, -0.12240803986787796, -0.11559417843818665, -0.10878030955791473, -0.10196644812822342, -0.0951525866985321, -0.08833871781826019, -0.08152485638856888, -0.07471099495887756, -0.06789712607860565, -0.06108326464891434, -0.054269399493932724, -0.04745553433895111, -0.040641672909259796, -0.03382780775427818, -0.02701394259929657, -0.020200077444314957, -0.013386214151978493, -0.006572350859642029, 0.00024151429533958435, 0.0070553794503211975, 0.013869240880012512, 0.020683106034994125, 0.02749697118997574, 0.03431083634495735, 0.041124701499938965, 0.04793856292963028, 0.05475242808461189, 0.061566293239593506, 0.06838015466928482, 0.07519401609897614, 0.08200788497924805, 0.08882174640893936, 0.09563561528921127, 0.10244947671890259, 0.1092633455991745, 0.11607720702886581, 0.12289106845855713, 0.12970493733882904, 0.13651880621910095, 0.14333267509937286, 0.15014652907848358, 0.1569603979587555, 0.1637742668390274, 0.17058813571929932, 0.17740198969841003, 0.18421585857868195, 0.19102971255779266, 0.19784358143806458, 0.2046574354171753, 0.2114713042974472, 0.21828517317771912, 0.22509902715682983, 0.23191289603710175, 0.23872676491737366, 0.24554061889648438, 0.2523544728755951, 0.2591683566570282, 0.2659822106361389, 0.27279606461524963, 0.27960994839668274, 0.28642380237579346, 0.2932376563549042, 0.3000515401363373]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 8.0, 5.0, 7.0, 8.0, 15.0, 9.0, 8.0, 17.0, 19.0, 23.0, 26.0, 34.0, 34.0, 28.0, 46.0, 42.0, 47.0, 48.0, 51.0, 50.0, 50.0, 42.0, 39.0, 47.0, 41.0, 35.0, 31.0, 35.0, 21.0, 29.0, 14.0, 18.0, 13.0, 9.0, 12.0, 9.0, 6.0, 3.0, 3.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.05185800790786743, -0.050297170877456665, -0.0487363338470459, -0.04717549681663513, -0.045614659786224365, -0.0440538227558136, -0.04249298572540283, -0.040932148694992065, -0.0393713116645813, -0.03781047463417053, -0.036249637603759766, -0.034688800573349, -0.03312796354293823, -0.031567126512527466, -0.0300062894821167, -0.028445452451705933, -0.026884615421295166, -0.0253237783908844, -0.023762941360473633, -0.022202104330062866, -0.0206412672996521, -0.019080430269241333, -0.017519593238830566, -0.0159587562084198, -0.014397919178009033, -0.012837082147598267, -0.0112762451171875, -0.009715408086776733, -0.008154571056365967, -0.0065937340259552, -0.005032896995544434, -0.003472059965133667, -0.0019112229347229004, -0.0003503859043121338, 0.0012104511260986328, 0.0027712881565093994, 0.004332125186920166, 0.005892962217330933, 0.007453799247741699, 0.009014636278152466, 0.010575473308563232, 0.012136310338973999, 0.013697147369384766, 0.015257984399795532, 0.0168188214302063, 0.018379658460617065, 0.019940495491027832, 0.0215013325214386, 0.023062169551849365, 0.024623006582260132, 0.0261838436126709, 0.027744680643081665, 0.02930551767349243, 0.030866354703903198, 0.032427191734313965, 0.03398802876472473, 0.0355488657951355, 0.037109702825546265, 0.03867053985595703, 0.0402313768863678, 0.041792213916778564, 0.04335305094718933, 0.0449138879776001, 0.046474725008010864, 0.04803556203842163]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 8.0, 6.0, 10.0, 23.0, 22.0, 21.0, 31.0, 36.0, 60.0, 92.0, 140.0, 213.0, 312.0, 511.0, 894.0, 1693.0, 3247.0, 7777.0, 21607.0, 74377.0, 357908.0, 443938.0, 92898.0, 25535.0, 9011.0, 3795.0, 1842.0, 970.0, 579.0, 303.0, 219.0, 147.0, 82.0, 68.0, 52.0, 34.0, 24.0, 16.0, 20.0, 6.0, 10.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0233612060546875, -0.022609472274780273, -0.021857738494873047, -0.02110600471496582, -0.020354270935058594, -0.019602537155151367, -0.01885080337524414, -0.018099069595336914, -0.017347335815429688, -0.01659560203552246, -0.015843868255615234, -0.015092134475708008, -0.014340400695800781, -0.013588666915893555, -0.012836933135986328, -0.012085199356079102, -0.011333465576171875, -0.010581731796264648, -0.009829998016357422, -0.009078264236450195, -0.008326530456542969, -0.007574796676635742, -0.006823062896728516, -0.006071329116821289, -0.0053195953369140625, -0.004567861557006836, -0.0038161277770996094, -0.003064393997192383, -0.0023126602172851562, -0.0015609264373779297, -0.0008091926574707031, -5.745887756347656e-05, 0.00069427490234375, 0.0014460086822509766, 0.002197742462158203, 0.0029494762420654297, 0.0037012100219726562, 0.004452943801879883, 0.005204677581787109, 0.005956411361694336, 0.0067081451416015625, 0.007459878921508789, 0.008211612701416016, 0.008963346481323242, 0.009715080261230469, 0.010466814041137695, 0.011218547821044922, 0.011970281600952148, 0.012722015380859375, 0.013473749160766602, 0.014225482940673828, 0.014977216720581055, 0.01572895050048828, 0.016480684280395508, 0.017232418060302734, 0.01798415184020996, 0.018735885620117188, 0.019487619400024414, 0.02023935317993164, 0.020991086959838867, 0.021742820739746094, 0.02249455451965332, 0.023246288299560547, 0.023998022079467773, 0.024749755859375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 2.0, 4.0, 6.0, 18.0, 26.0, 51.0, 59.0, 89.0, 108.0, 142.0, 139.0, 110.0, 82.0, 58.0, 38.0, 20.0, 18.0, 7.0, 18.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0183868408203125, -0.0177919864654541, -0.017197132110595703, -0.016602277755737305, -0.016007423400878906, -0.015412569046020508, -0.01481771469116211, -0.014222860336303711, -0.013628005981445312, -0.013033151626586914, -0.012438297271728516, -0.011843442916870117, -0.011248588562011719, -0.01065373420715332, -0.010058879852294922, -0.009464025497436523, -0.008869171142578125, -0.008274316787719727, -0.007679462432861328, -0.00708460807800293, -0.006489753723144531, -0.005894899368286133, -0.005300045013427734, -0.004705190658569336, -0.0041103363037109375, -0.003515481948852539, -0.0029206275939941406, -0.002325773239135742, -0.0017309188842773438, -0.0011360645294189453, -0.0005412101745605469, 5.364418029785156e-05, 0.00064849853515625, 0.0012433528900146484, 0.0018382072448730469, 0.0024330615997314453, 0.0030279159545898438, 0.003622770309448242, 0.004217624664306641, 0.004812479019165039, 0.0054073333740234375, 0.006002187728881836, 0.006597042083740234, 0.007191896438598633, 0.007786750793457031, 0.00838160514831543, 0.008976459503173828, 0.009571313858032227, 0.010166168212890625, 0.010761022567749023, 0.011355876922607422, 0.01195073127746582, 0.012545585632324219, 0.013140439987182617, 0.013735294342041016, 0.014330148696899414, 0.014925003051757812, 0.015519857406616211, 0.01611471176147461, 0.016709566116333008, 0.017304420471191406, 0.017899274826049805, 0.018494129180908203, 0.0190889835357666, 0.019683837890625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 8.0, 19.0, 14.0, 26.0, 45.0, 58.0, 102.0, 167.0, 243.0, 426.0, 780.0, 1463.0, 3122.0, 7500.0, 21376.0, 80477.0, 610545.0, 247701.0, 49111.0, 14711.0, 5575.0, 2374.0, 1120.0, 604.0, 336.0, 238.0, 144.0, 76.0, 54.0, 38.0, 31.0, 21.0, 13.0, 4.0, 7.0, 7.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0274200439453125, -0.026558637619018555, -0.02569723129272461, -0.024835824966430664, -0.02397441864013672, -0.023113012313842773, -0.022251605987548828, -0.021390199661254883, -0.020528793334960938, -0.019667387008666992, -0.018805980682373047, -0.0179445743560791, -0.017083168029785156, -0.01622176170349121, -0.015360355377197266, -0.01449894905090332, -0.013637542724609375, -0.01277613639831543, -0.011914730072021484, -0.011053323745727539, -0.010191917419433594, -0.009330511093139648, -0.008469104766845703, -0.007607698440551758, -0.0067462921142578125, -0.005884885787963867, -0.005023479461669922, -0.0041620731353759766, -0.0033006668090820312, -0.002439260482788086, -0.0015778541564941406, -0.0007164478302001953, 0.00014495849609375, 0.0010063648223876953, 0.0018677711486816406, 0.002729177474975586, 0.0035905838012695312, 0.0044519901275634766, 0.005313396453857422, 0.006174802780151367, 0.0070362091064453125, 0.007897615432739258, 0.008759021759033203, 0.009620428085327148, 0.010481834411621094, 0.011343240737915039, 0.012204647064208984, 0.01306605339050293, 0.013927459716796875, 0.01478886604309082, 0.015650272369384766, 0.01651167869567871, 0.017373085021972656, 0.0182344913482666, 0.019095897674560547, 0.019957304000854492, 0.020818710327148438, 0.021680116653442383, 0.022541522979736328, 0.023402929306030273, 0.02426433563232422, 0.025125741958618164, 0.02598714828491211, 0.026848554611206055, 0.0277099609375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 8.0, 3.0, 4.0, 2.0, 7.0, 10.0, 11.0, 21.0, 19.0, 22.0, 20.0, 30.0, 32.0, 40.0, 35.0, 44.0, 49.0, 42.0, 52.0, 52.0, 65.0, 68.0, 56.0, 47.0, 39.0, 35.0, 28.0, 39.0, 27.0, 25.0, 14.0, 8.0, 10.0, 11.0, 7.0, 4.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.033416748046875, -0.03235816955566406, -0.031299591064453125, -0.030241012573242188, -0.02918243408203125, -0.028123855590820312, -0.027065277099609375, -0.026006698608398438, -0.0249481201171875, -0.023889541625976562, -0.022830963134765625, -0.021772384643554688, -0.02071380615234375, -0.019655227661132812, -0.018596649169921875, -0.017538070678710938, -0.0164794921875, -0.015420913696289062, -0.014362335205078125, -0.013303756713867188, -0.01224517822265625, -0.011186599731445312, -0.010128021240234375, -0.009069442749023438, -0.0080108642578125, -0.0069522857666015625, -0.005893707275390625, -0.0048351287841796875, -0.00377655029296875, -0.0027179718017578125, -0.001659393310546875, -0.0006008148193359375, 0.000457763671875, 0.0015163421630859375, 0.002574920654296875, 0.0036334991455078125, 0.00469207763671875, 0.0057506561279296875, 0.006809234619140625, 0.007867813110351562, 0.0089263916015625, 0.009984970092773438, 0.011043548583984375, 0.012102127075195312, 0.01316070556640625, 0.014219284057617188, 0.015277862548828125, 0.016336441040039062, 0.01739501953125, 0.018453598022460938, 0.019512176513671875, 0.020570755004882812, 0.02162933349609375, 0.022687911987304688, 0.023746490478515625, 0.024805068969726562, 0.0258636474609375, 0.026922225952148438, 0.027980804443359375, 0.029039382934570312, 0.03009796142578125, 0.031156539916992188, 0.032215118408203125, 0.03327369689941406, 0.034332275390625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 1.0, 4.0, 8.0, 15.0, 18.0, 22.0, 34.0, 68.0, 106.0, 181.0, 367.0, 756.0, 1883.0, 5716.0, 26944.0, 310126.0, 657158.0, 34398.0, 6919.0, 2070.0, 845.0, 408.0, 189.0, 117.0, 63.0, 41.0, 20.0, 13.0, 14.0, 10.0, 9.0, 4.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0083465576171875, -0.008077859878540039, -0.007809162139892578, -0.007540464401245117, -0.007271766662597656, -0.007003068923950195, -0.006734371185302734, -0.0064656734466552734, -0.0061969757080078125, -0.0059282779693603516, -0.005659580230712891, -0.00539088249206543, -0.005122184753417969, -0.004853487014770508, -0.004584789276123047, -0.004316091537475586, -0.004047393798828125, -0.003778696060180664, -0.003509998321533203, -0.003241300582885742, -0.0029726028442382812, -0.0027039051055908203, -0.0024352073669433594, -0.0021665096282958984, -0.0018978118896484375, -0.0016291141510009766, -0.0013604164123535156, -0.0010917186737060547, -0.0008230209350585938, -0.0005543231964111328, -0.0002856254577636719, -1.6927719116210938e-05, 0.00025177001953125, 0.0005204677581787109, 0.0007891654968261719, 0.0010578632354736328, 0.0013265609741210938, 0.0015952587127685547, 0.0018639564514160156, 0.0021326541900634766, 0.0024013519287109375, 0.0026700496673583984, 0.0029387474060058594, 0.0032074451446533203, 0.0034761428833007812, 0.003744840621948242, 0.004013538360595703, 0.004282236099243164, 0.004550933837890625, 0.004819631576538086, 0.005088329315185547, 0.005357027053833008, 0.005625724792480469, 0.00589442253112793, 0.006163120269775391, 0.0064318180084228516, 0.0067005157470703125, 0.0069692134857177734, 0.007237911224365234, 0.007506608963012695, 0.007775306701660156, 0.008044004440307617, 0.008312702178955078, 0.008581399917602539, 0.00885009765625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 9.0, 7.0, 7.0, 9.0, 13.0, 15.0, 31.0, 26.0, 29.0, 46.0, 47.0, 41.0, 77.0, 48.0, 57.0, 82.0, 46.0, 56.0, 62.0, 47.0, 42.0, 68.0, 21.0, 25.0, 24.0, 10.0, 13.0, 16.0, 6.0, 2.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.231929779052734e-06, -4.093162715435028e-06, -3.954395651817322e-06, -3.8156285881996155e-06, -3.676861524581909e-06, -3.538094460964203e-06, -3.3993273973464966e-06, -3.2605603337287903e-06, -3.121793270111084e-06, -2.9830262064933777e-06, -2.8442591428756714e-06, -2.705492079257965e-06, -2.566725015640259e-06, -2.4279579520225525e-06, -2.289190888404846e-06, -2.15042382478714e-06, -2.0116567611694336e-06, -1.8728896975517273e-06, -1.734122633934021e-06, -1.5953555703163147e-06, -1.4565885066986084e-06, -1.317821443080902e-06, -1.1790543794631958e-06, -1.0402873158454895e-06, -9.015202522277832e-07, -7.627531886100769e-07, -6.239861249923706e-07, -4.852190613746643e-07, -3.46451997756958e-07, -2.076849341392517e-07, -6.891787052154541e-08, 6.984919309616089e-08, 2.086162567138672e-07, 3.473833203315735e-07, 4.861503839492798e-07, 6.249174475669861e-07, 7.636845111846924e-07, 9.024515748023987e-07, 1.041218638420105e-06, 1.1799857020378113e-06, 1.3187527656555176e-06, 1.4575198292732239e-06, 1.5962868928909302e-06, 1.7350539565086365e-06, 1.8738210201263428e-06, 2.012588083744049e-06, 2.1513551473617554e-06, 2.2901222109794617e-06, 2.428889274597168e-06, 2.5676563382148743e-06, 2.7064234018325806e-06, 2.845190465450287e-06, 2.983957529067993e-06, 3.1227245926856995e-06, 3.2614916563034058e-06, 3.400258719921112e-06, 3.5390257835388184e-06, 3.6777928471565247e-06, 3.816559910774231e-06, 3.955326974391937e-06, 4.0940940380096436e-06, 4.23286110162735e-06, 4.371628165245056e-06, 4.5103952288627625e-06, 4.649162292480469e-06]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 8.0, 13.0, 22.0, 27.0, 42.0, 41.0, 80.0, 134.0, 209.0, 377.0, 642.0, 1151.0, 2572.0, 6293.0, 18668.0, 76075.0, 652451.0, 227269.0, 42157.0, 11897.0, 4377.0, 1821.0, 901.0, 510.0, 284.0, 178.0, 114.0, 73.0, 47.0, 36.0, 27.0, 17.0, 8.0, 12.0, 6.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005596160888671875, -0.005425572395324707, -0.005254983901977539, -0.005084395408630371, -0.004913806915283203, -0.004743218421936035, -0.004572629928588867, -0.004402041435241699, -0.004231452941894531, -0.004060864448547363, -0.0038902759552001953, -0.0037196874618530273, -0.0035490989685058594, -0.0033785104751586914, -0.0032079219818115234, -0.0030373334884643555, -0.0028667449951171875, -0.0026961565017700195, -0.0025255680084228516, -0.0023549795150756836, -0.0021843910217285156, -0.0020138025283813477, -0.0018432140350341797, -0.0016726255416870117, -0.0015020370483398438, -0.0013314485549926758, -0.0011608600616455078, -0.0009902715682983398, -0.0008196830749511719, -0.0006490945816040039, -0.00047850608825683594, -0.00030791759490966797, -0.0001373291015625, 3.325939178466797e-05, 0.00020384788513183594, 0.0003744363784790039, 0.0005450248718261719, 0.0007156133651733398, 0.0008862018585205078, 0.0010567903518676758, 0.0012273788452148438, 0.0013979673385620117, 0.0015685558319091797, 0.0017391443252563477, 0.0019097328186035156, 0.0020803213119506836, 0.0022509098052978516, 0.0024214982986450195, 0.0025920867919921875, 0.0027626752853393555, 0.0029332637786865234, 0.0031038522720336914, 0.0032744407653808594, 0.0034450292587280273, 0.0036156177520751953, 0.0037862062454223633, 0.003956794738769531, 0.004127383232116699, 0.004297971725463867, 0.004468560218811035, 0.004639148712158203, 0.004809737205505371, 0.004980325698852539, 0.005150914192199707, 0.005321502685546875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 4.0, 5.0, 7.0, 5.0, 10.0, 18.0, 20.0, 23.0, 28.0, 41.0, 52.0, 89.0, 83.0, 108.0, 99.0, 92.0, 82.0, 59.0, 38.0, 32.0, 23.0, 16.0, 12.0, 8.0, 14.0, 7.0, 6.0, 3.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00861358642578125, -0.008326530456542969, -0.008039474487304688, -0.007752418518066406, -0.007465362548828125, -0.007178306579589844, -0.0068912506103515625, -0.006604194641113281, -0.006317138671875, -0.006030082702636719, -0.0057430267333984375, -0.005455970764160156, -0.005168914794921875, -0.004881858825683594, -0.0045948028564453125, -0.004307746887207031, -0.00402069091796875, -0.0037336349487304688, -0.0034465789794921875, -0.0031595230102539062, -0.002872467041015625, -0.0025854110717773438, -0.0022983551025390625, -0.0020112991333007812, -0.0017242431640625, -0.0014371871948242188, -0.0011501312255859375, -0.0008630752563476562, -0.000576019287109375, -0.00028896331787109375, -1.9073486328125e-06, 0.00028514862060546875, 0.00057220458984375, 0.0008592605590820312, 0.0011463165283203125, 0.0014333724975585938, 0.001720428466796875, 0.0020074844360351562, 0.0022945404052734375, 0.0025815963745117188, 0.00286865234375, 0.0031557083129882812, 0.0034427642822265625, 0.0037298202514648438, 0.004016876220703125, 0.004303932189941406, 0.0045909881591796875, 0.004878044128417969, 0.00516510009765625, 0.005452156066894531, 0.0057392120361328125, 0.006026268005371094, 0.006313323974609375, 0.006600379943847656, 0.0068874359130859375, 0.007174491882324219, 0.0074615478515625, 0.007748603820800781, 0.008035659790039062, 0.008322715759277344, 0.008609771728515625, 0.008896827697753906, 0.009183883666992188, 0.009470939636230469, 0.00975799560546875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 8.0, 4.0, 14.0, 13.0, 13.0, 37.0, 31.0, 58.0, 102.0, 130.0, 254.0, 141.0, 73.0, 47.0, 21.0, 12.0, 14.0, 9.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2625066637992859, -0.2566257417201996, -0.2507448196411133, -0.24486388266086578, -0.23898296058177948, -0.23310202360153198, -0.22722110152244568, -0.22134017944335938, -0.21545924246311188, -0.20957832038402557, -0.20369738340377808, -0.19781646132469177, -0.19193553924560547, -0.18605460226535797, -0.18017368018627167, -0.17429274320602417, -0.16841182112693787, -0.16253089904785156, -0.15664996206760406, -0.15076903998851776, -0.14488811790943146, -0.13900718092918396, -0.13312625885009766, -0.12724533677101135, -0.12136441469192505, -0.11548348516225815, -0.10960256308317184, -0.10372163355350494, -0.09784070402383804, -0.09195977449417114, -0.08607885241508484, -0.08019792288541794, -0.07431699335575104, -0.06843606382608414, -0.06255514174699783, -0.05667421221733093, -0.05079328268766403, -0.04491235688328743, -0.03903143107891083, -0.03315050154924393, -0.027269575744867325, -0.021388648077845573, -0.015507721342146397, -0.00962679460644722, -0.0037458669394254684, 0.002135060727596283, 0.008015986531972885, 0.013896916061639786, 0.019777841866016388, 0.02565876953303814, 0.03153969720005989, 0.03742062300443649, 0.043301552534103394, 0.049182478338479996, 0.0550634041428566, 0.0609443336725235, 0.0668252557516098, 0.0727061852812767, 0.078587107360363, 0.08446803689002991, 0.09034896641969681, 0.09622989594936371, 0.10211081802845001, 0.10799174755811691, 0.11387267708778381]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 6.0, 3.0, 9.0, 12.0, 6.0, 8.0, 11.0, 7.0, 12.0, 25.0, 8.0, 11.0, 23.0, 21.0, 27.0, 34.0, 37.0, 36.0, 52.0, 72.0, 66.0, 71.0, 58.0, 42.0, 45.0, 25.0, 27.0, 23.0, 29.0, 16.0, 14.0, 22.0, 17.0, 18.0, 15.0, 15.0, 13.0, 13.0, 8.0, 4.0, 10.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.09438371658325195, -0.091534823179245, -0.08868593722581863, -0.08583704382181168, -0.08298815786838531, -0.08013926446437836, -0.0772903710603714, -0.07444147765636444, -0.07159259170293808, -0.06874369829893112, -0.06589481234550476, -0.0630459189414978, -0.06019702926278114, -0.057348139584064484, -0.054499246180057526, -0.051650356501340866, -0.04880146682262421, -0.04595257714390755, -0.04310368746519089, -0.04025479406118393, -0.03740590438246727, -0.03455701470375061, -0.03170812129974365, -0.028859231621026993, -0.026010341942310333, -0.023161452263593674, -0.020312560722231865, -0.017463669180870056, -0.014614779502153397, -0.011765888892114162, -0.008916998282074928, -0.0060681067407131195, -0.00321921706199646, -0.0003703264519572258, 0.0024785641580820084, 0.0053274547681212425, 0.008176345378160477, 0.01102523598819971, 0.013874126598238945, 0.016723018139600754, 0.019571907818317413, 0.022420797497034073, 0.02526968903839588, 0.02811858057975769, 0.03096747025847435, 0.03381635993719101, 0.03666525334119797, 0.03951414301991463, 0.04236303269863129, 0.045211922377347946, 0.048060812056064606, 0.050909705460071564, 0.05375859513878822, 0.05660748481750488, 0.05945637822151184, 0.0623052679002285, 0.06515415757894516, 0.06800305098295212, 0.07085193693637848, 0.07370083034038544, 0.0765497237443924, 0.07939860969781876, 0.08224750310182571, 0.08509638905525208, 0.08794528245925903]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 6.0, 12.0, 7.0, 26.0, 30.0, 34.0, 55.0, 105.0, 211.0, 394.0, 863.0, 2140.0, 7024.0, 44198.0, 2409457.0, 1677919.0, 40288.0, 7580.0, 2169.0, 864.0, 401.0, 205.0, 117.0, 64.0, 48.0, 15.0, 16.0, 6.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0235137939453125, -0.022910356521606445, -0.02230691909790039, -0.021703481674194336, -0.02110004425048828, -0.020496606826782227, -0.019893169403076172, -0.019289731979370117, -0.018686294555664062, -0.018082857131958008, -0.017479419708251953, -0.0168759822845459, -0.016272544860839844, -0.01566910743713379, -0.015065670013427734, -0.01446223258972168, -0.013858795166015625, -0.01325535774230957, -0.012651920318603516, -0.012048482894897461, -0.011445045471191406, -0.010841608047485352, -0.010238170623779297, -0.009634733200073242, -0.009031295776367188, -0.008427858352661133, -0.007824420928955078, -0.0072209835052490234, -0.006617546081542969, -0.006014108657836914, -0.005410671234130859, -0.004807233810424805, -0.00420379638671875, -0.0036003589630126953, -0.0029969215393066406, -0.002393484115600586, -0.0017900466918945312, -0.0011866092681884766, -0.0005831718444824219, 2.0265579223632812e-05, 0.0006237030029296875, 0.0012271404266357422, 0.0018305778503417969, 0.0024340152740478516, 0.0030374526977539062, 0.003640890121459961, 0.004244327545166016, 0.00484776496887207, 0.005451202392578125, 0.00605463981628418, 0.006658077239990234, 0.007261514663696289, 0.007864952087402344, 0.008468389511108398, 0.009071826934814453, 0.009675264358520508, 0.010278701782226562, 0.010882139205932617, 0.011485576629638672, 0.012089014053344727, 0.012692451477050781, 0.013295888900756836, 0.01389932632446289, 0.014502763748168945, 0.015106201171875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 7.0, 7.0, 5.0, 19.0, 20.0, 33.0, 59.0, 98.0, 103.0, 131.0, 146.0, 106.0, 86.0, 55.0, 53.0, 31.0, 17.0, 12.0, 9.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0185089111328125, -0.017913341522216797, -0.017317771911621094, -0.01672220230102539, -0.016126632690429688, -0.015531063079833984, -0.014935493469238281, -0.014339923858642578, -0.013744354248046875, -0.013148784637451172, -0.012553215026855469, -0.011957645416259766, -0.011362075805664062, -0.01076650619506836, -0.010170936584472656, -0.009575366973876953, -0.00897979736328125, -0.008384227752685547, -0.007788658142089844, -0.007193088531494141, -0.0065975189208984375, -0.006001949310302734, -0.005406379699707031, -0.004810810089111328, -0.004215240478515625, -0.003619670867919922, -0.0030241012573242188, -0.0024285316467285156, -0.0018329620361328125, -0.0012373924255371094, -0.0006418228149414062, -4.6253204345703125e-05, 0.00054931640625, 0.0011448860168457031, 0.0017404556274414062, 0.0023360252380371094, 0.0029315948486328125, 0.0035271644592285156, 0.004122734069824219, 0.004718303680419922, 0.005313873291015625, 0.005909442901611328, 0.006505012512207031, 0.007100582122802734, 0.0076961517333984375, 0.00829172134399414, 0.008887290954589844, 0.009482860565185547, 0.01007843017578125, 0.010673999786376953, 0.011269569396972656, 0.01186513900756836, 0.012460708618164062, 0.013056278228759766, 0.013651847839355469, 0.014247417449951172, 0.014842987060546875, 0.015438556671142578, 0.01603412628173828, 0.016629695892333984, 0.017225265502929688, 0.01782083511352539, 0.018416404724121094, 0.019011974334716797, 0.0196075439453125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 5.0, 13.0, 15.0, 24.0, 33.0, 65.0, 137.0, 319.0, 943.0, 3456.0, 19323.0, 1973645.0, 2170640.0, 20482.0, 3522.0, 1003.0, 349.0, 145.0, 50.0, 37.0, 28.0, 15.0, 8.0, 4.0, 2.0, 4.0, 4.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031341552734375, -0.030180931091308594, -0.029020309448242188, -0.02785968780517578, -0.026699066162109375, -0.02553844451904297, -0.024377822875976562, -0.023217201232910156, -0.02205657958984375, -0.020895957946777344, -0.019735336303710938, -0.01857471466064453, -0.017414093017578125, -0.01625347137451172, -0.015092849731445312, -0.013932228088378906, -0.0127716064453125, -0.011610984802246094, -0.010450363159179688, -0.009289741516113281, -0.008129119873046875, -0.006968498229980469, -0.0058078765869140625, -0.004647254943847656, -0.00348663330078125, -0.0023260116577148438, -0.0011653900146484375, -4.76837158203125e-06, 0.001155853271484375, 0.0023164749145507812, 0.0034770965576171875, 0.004637718200683594, 0.00579833984375, 0.006958961486816406, 0.008119583129882812, 0.009280204772949219, 0.010440826416015625, 0.011601448059082031, 0.012762069702148438, 0.013922691345214844, 0.01508331298828125, 0.016243934631347656, 0.017404556274414062, 0.01856517791748047, 0.019725799560546875, 0.02088642120361328, 0.022047042846679688, 0.023207664489746094, 0.0243682861328125, 0.025528907775878906, 0.026689529418945312, 0.02785015106201172, 0.029010772705078125, 0.03017139434814453, 0.03133201599121094, 0.032492637634277344, 0.03365325927734375, 0.034813880920410156, 0.03597450256347656, 0.03713512420654297, 0.038295745849609375, 0.03945636749267578, 0.04061698913574219, 0.041777610778808594, 0.042938232421875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 6.0, 6.0, 13.0, 17.0, 18.0, 42.0, 73.0, 184.0, 565.0, 1461.0, 1051.0, 323.0, 125.0, 60.0, 25.0, 31.0, 17.0, 14.0, 10.0, 7.0, 4.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0308380126953125, -0.029950380325317383, -0.029062747955322266, -0.02817511558532715, -0.02728748321533203, -0.026399850845336914, -0.025512218475341797, -0.02462458610534668, -0.023736953735351562, -0.022849321365356445, -0.021961688995361328, -0.02107405662536621, -0.020186424255371094, -0.019298791885375977, -0.01841115951538086, -0.017523527145385742, -0.016635894775390625, -0.015748262405395508, -0.01486063003540039, -0.013972997665405273, -0.013085365295410156, -0.012197732925415039, -0.011310100555419922, -0.010422468185424805, -0.009534835815429688, -0.00864720344543457, -0.007759571075439453, -0.006871938705444336, -0.005984306335449219, -0.0050966739654541016, -0.004209041595458984, -0.003321409225463867, -0.00243377685546875, -0.0015461444854736328, -0.0006585121154785156, 0.00022912025451660156, 0.0011167526245117188, 0.002004384994506836, 0.002892017364501953, 0.0037796497344970703, 0.0046672821044921875, 0.005554914474487305, 0.006442546844482422, 0.007330179214477539, 0.008217811584472656, 0.009105443954467773, 0.00999307632446289, 0.010880708694458008, 0.011768341064453125, 0.012655973434448242, 0.01354360580444336, 0.014431238174438477, 0.015318870544433594, 0.01620650291442871, 0.017094135284423828, 0.017981767654418945, 0.018869400024414062, 0.01975703239440918, 0.020644664764404297, 0.021532297134399414, 0.02241992950439453, 0.02330756187438965, 0.024195194244384766, 0.025082826614379883, 0.025970458984375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 8.0, 6.0, 14.0, 25.0, 35.0, 94.0, 115.0, 192.0, 198.0, 141.0, 74.0, 40.0, 23.0, 12.0, 12.0, 7.0, 8.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08114591985940933, -0.07632295042276382, -0.07149998098611832, -0.06667700409889221, -0.061854034662246704, -0.057031065225601196, -0.05220809578895569, -0.04738512262701988, -0.042562153190374374, -0.03773918375372887, -0.03291621059179306, -0.028093241155147552, -0.023270269855856895, -0.01844729855656624, -0.01362432911992073, -0.008801355957984924, -0.0039783865213394165, 0.0008445843122899532, 0.005667555145919323, 0.010490525513887405, 0.015313496813178062, 0.02013646811246872, 0.024959437549114227, 0.029782410711050034, 0.03460538014769554, 0.03942834958434105, 0.044251322746276855, 0.04907429218292236, 0.05389726161956787, 0.05872023478150368, 0.06354320049285889, 0.06836617738008499, 0.0731891542673111, 0.0780121237039566, 0.08283509314060211, 0.08765806257724762, 0.09248103946447372, 0.09730400890111923, 0.10212697833776474, 0.10694995522499084, 0.11177292466163635, 0.11659589409828186, 0.12141886353492737, 0.12624183297157288, 0.13106480240821838, 0.1358877718448639, 0.1407107412815094, 0.1455337256193161, 0.15035668015480042, 0.15517964959144592, 0.16000261902809143, 0.16482558846473694, 0.16964855790138245, 0.17447152733802795, 0.17929449677467346, 0.18411748111248016, 0.18894045054912567, 0.19376341998577118, 0.1985863894224167, 0.2034093588590622, 0.2082323282957077, 0.2130553126335144, 0.2178782820701599, 0.22270125150680542, 0.22752422094345093]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 5.0, 4.0, 8.0, 7.0, 10.0, 5.0, 7.0, 17.0, 18.0, 21.0, 31.0, 22.0, 30.0, 43.0, 47.0, 37.0, 38.0, 53.0, 46.0, 46.0, 51.0, 36.0, 50.0, 48.0, 37.0, 42.0, 41.0, 40.0, 26.0, 28.0, 23.0, 22.0, 12.0, 5.0, 15.0, 6.0, 5.0, 7.0, 2.0, 1.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09113991260528564, -0.08831251412630081, -0.08548511564731598, -0.08265771716833115, -0.07983031868934631, -0.07700292766094208, -0.07417552918195724, -0.07134813070297241, -0.06852073222398758, -0.06569333374500275, -0.06286593526601791, -0.06003854051232338, -0.05721114203333855, -0.054383743554353714, -0.05155634880065918, -0.04872895032167435, -0.045901551842689514, -0.04307415336370468, -0.04024675488471985, -0.037419360131025314, -0.03459196165204048, -0.03176456317305565, -0.028937166556715965, -0.026109769940376282, -0.02328237146139145, -0.020454972982406616, -0.017627576366066933, -0.014800178818404675, -0.011972781270742416, -0.009145383723080158, -0.0063179861754179, -0.0034905895590782166, -0.0006631910800933838, 0.0021642064675688744, 0.0049916040152311325, 0.00781900156289339, 0.010646399110555649, 0.013473796658217907, 0.016301194205880165, 0.01912859082221985, 0.02195598930120468, 0.024783387780189514, 0.027610784396529198, 0.03043818101286888, 0.033265579491853714, 0.03609297797083855, 0.03892037272453308, 0.041747771203517914, 0.04457516968250275, 0.04740256816148758, 0.05022996664047241, 0.053057361394166946, 0.05588475987315178, 0.05871215835213661, 0.061539553105831146, 0.06436695158481598, 0.06719435006380081, 0.07002174854278564, 0.07284914702177048, 0.07567654550075531, 0.07850393652915955, 0.08133133500814438, 0.08415873348712921, 0.08698613196611404, 0.08981353044509888]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 0.0, 4.0, 4.0, 7.0, 6.0, 21.0, 18.0, 29.0, 55.0, 52.0, 85.0, 119.0, 198.0, 356.0, 576.0, 1063.0, 2113.0, 4179.0, 9616.0, 25827.0, 88883.0, 460747.0, 347137.0, 69994.0, 21488.0, 8136.0, 3597.0, 1798.0, 1013.0, 536.0, 324.0, 180.0, 131.0, 88.0, 57.0, 47.0, 14.0, 28.0, 15.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.032501220703125, -0.03144979476928711, -0.03039836883544922, -0.029346942901611328, -0.028295516967773438, -0.027244091033935547, -0.026192665100097656, -0.025141239166259766, -0.024089813232421875, -0.023038387298583984, -0.021986961364746094, -0.020935535430908203, -0.019884109497070312, -0.018832683563232422, -0.01778125762939453, -0.01672983169555664, -0.01567840576171875, -0.01462697982788086, -0.013575553894042969, -0.012524127960205078, -0.011472702026367188, -0.010421276092529297, -0.009369850158691406, -0.008318424224853516, -0.007266998291015625, -0.006215572357177734, -0.005164146423339844, -0.004112720489501953, -0.0030612945556640625, -0.002009868621826172, -0.0009584426879882812, 9.298324584960938e-05, 0.0011444091796875, 0.0021958351135253906, 0.0032472610473632812, 0.004298686981201172, 0.0053501129150390625, 0.006401538848876953, 0.007452964782714844, 0.008504390716552734, 0.009555816650390625, 0.010607242584228516, 0.011658668518066406, 0.012710094451904297, 0.013761520385742188, 0.014812946319580078, 0.01586437225341797, 0.01691579818725586, 0.01796722412109375, 0.01901865005493164, 0.02007007598876953, 0.021121501922607422, 0.022172927856445312, 0.023224353790283203, 0.024275779724121094, 0.025327205657958984, 0.026378631591796875, 0.027430057525634766, 0.028481483459472656, 0.029532909393310547, 0.030584335327148438, 0.03163576126098633, 0.03268718719482422, 0.03373861312866211, 0.0347900390625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 7.0, 5.0, 10.0, 16.0, 15.0, 30.0, 42.0, 67.0, 96.0, 104.0, 127.0, 108.0, 109.0, 75.0, 60.0, 47.0, 26.0, 28.0, 11.0, 10.0, 11.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018341064453125, -0.017747879028320312, -0.017154693603515625, -0.016561508178710938, -0.01596832275390625, -0.015375137329101562, -0.014781951904296875, -0.014188766479492188, -0.0135955810546875, -0.013002395629882812, -0.012409210205078125, -0.011816024780273438, -0.01122283935546875, -0.010629653930664062, -0.010036468505859375, -0.009443283081054688, -0.00885009765625, -0.008256912231445312, -0.007663726806640625, -0.0070705413818359375, -0.00647735595703125, -0.0058841705322265625, -0.005290985107421875, -0.0046977996826171875, -0.0041046142578125, -0.0035114288330078125, -0.002918243408203125, -0.0023250579833984375, -0.00173187255859375, -0.0011386871337890625, -0.000545501708984375, 4.76837158203125e-05, 0.000640869140625, 0.0012340545654296875, 0.001827239990234375, 0.0024204254150390625, 0.00301361083984375, 0.0036067962646484375, 0.004199981689453125, 0.0047931671142578125, 0.0053863525390625, 0.0059795379638671875, 0.006572723388671875, 0.0071659088134765625, 0.00775909423828125, 0.008352279663085938, 0.008945465087890625, 0.009538650512695312, 0.0101318359375, 0.010725021362304688, 0.011318206787109375, 0.011911392211914062, 0.01250457763671875, 0.013097763061523438, 0.013690948486328125, 0.014284133911132812, 0.0148773193359375, 0.015470504760742188, 0.016063690185546875, 0.016656875610351562, 0.01725006103515625, 0.017843246459960938, 0.018436431884765625, 0.019029617309570312, 0.019622802734375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 5.0, 10.0, 13.0, 15.0, 17.0, 31.0, 45.0, 65.0, 101.0, 143.0, 244.0, 359.0, 653.0, 1085.0, 2222.0, 4958.0, 13483.0, 49961.0, 596189.0, 314173.0, 43458.0, 12087.0, 4519.0, 2043.0, 1079.0, 568.0, 355.0, 201.0, 139.0, 94.0, 62.0, 51.0, 39.0, 25.0, 21.0, 7.0, 6.0, 7.0, 5.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042449951171875, -0.041121482849121094, -0.03979301452636719, -0.03846454620361328, -0.037136077880859375, -0.03580760955810547, -0.03447914123535156, -0.033150672912597656, -0.03182220458984375, -0.030493736267089844, -0.029165267944335938, -0.02783679962158203, -0.026508331298828125, -0.02517986297607422, -0.023851394653320312, -0.022522926330566406, -0.0211944580078125, -0.019865989685058594, -0.018537521362304688, -0.01720905303955078, -0.015880584716796875, -0.014552116394042969, -0.013223648071289062, -0.011895179748535156, -0.01056671142578125, -0.009238243103027344, -0.007909774780273438, -0.006581306457519531, -0.005252838134765625, -0.003924369812011719, -0.0025959014892578125, -0.0012674331665039062, 6.103515625e-05, 0.0013895034790039062, 0.0027179718017578125, 0.004046440124511719, 0.005374908447265625, 0.006703376770019531, 0.008031845092773438, 0.009360313415527344, 0.01068878173828125, 0.012017250061035156, 0.013345718383789062, 0.014674186706542969, 0.016002655029296875, 0.01733112335205078, 0.018659591674804688, 0.019988059997558594, 0.0213165283203125, 0.022644996643066406, 0.023973464965820312, 0.02530193328857422, 0.026630401611328125, 0.02795886993408203, 0.029287338256835938, 0.030615806579589844, 0.03194427490234375, 0.033272743225097656, 0.03460121154785156, 0.03592967987060547, 0.037258148193359375, 0.03858661651611328, 0.03991508483886719, 0.041243553161621094, 0.042572021484375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 11.0, 12.0, 12.0, 19.0, 21.0, 15.0, 30.0, 31.0, 34.0, 33.0, 64.0, 58.0, 73.0, 53.0, 57.0, 69.0, 54.0, 53.0, 51.0, 53.0, 36.0, 27.0, 32.0, 20.0, 10.0, 21.0, 9.0, 9.0, 9.0, 7.0, 5.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.048492431640625, -0.047118186950683594, -0.04574394226074219, -0.04436969757080078, -0.042995452880859375, -0.04162120819091797, -0.04024696350097656, -0.038872718811035156, -0.03749847412109375, -0.036124229431152344, -0.03474998474121094, -0.03337574005126953, -0.032001495361328125, -0.03062725067138672, -0.029253005981445312, -0.027878761291503906, -0.0265045166015625, -0.025130271911621094, -0.023756027221679688, -0.02238178253173828, -0.021007537841796875, -0.01963329315185547, -0.018259048461914062, -0.016884803771972656, -0.01551055908203125, -0.014136314392089844, -0.012762069702148438, -0.011387825012207031, -0.010013580322265625, -0.008639335632324219, -0.0072650909423828125, -0.005890846252441406, -0.0045166015625, -0.0031423568725585938, -0.0017681121826171875, -0.00039386749267578125, 0.000980377197265625, 0.0023546218872070312, 0.0037288665771484375, 0.005103111267089844, 0.00647735595703125, 0.007851600646972656, 0.009225845336914062, 0.010600090026855469, 0.011974334716796875, 0.013348579406738281, 0.014722824096679688, 0.016097068786621094, 0.0174713134765625, 0.018845558166503906, 0.020219802856445312, 0.02159404754638672, 0.022968292236328125, 0.02434253692626953, 0.025716781616210938, 0.027091026306152344, 0.02846527099609375, 0.029839515686035156, 0.031213760375976562, 0.03258800506591797, 0.033962249755859375, 0.03533649444580078, 0.03671073913574219, 0.038084983825683594, 0.039459228515625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 9.0, 3.0, 11.0, 12.0, 20.0, 43.0, 45.0, 78.0, 136.0, 233.0, 536.0, 1580.0, 6369.0, 39824.0, 826847.0, 153044.0, 14994.0, 3063.0, 885.0, 346.0, 176.0, 106.0, 54.0, 34.0, 27.0, 13.0, 15.0, 12.0, 14.0, 7.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0132598876953125, -0.012855052947998047, -0.012450218200683594, -0.01204538345336914, -0.011640548706054688, -0.011235713958740234, -0.010830879211425781, -0.010426044464111328, -0.010021209716796875, -0.009616374969482422, -0.009211540222167969, -0.008806705474853516, -0.008401870727539062, -0.00799703598022461, -0.007592201232910156, -0.007187366485595703, -0.00678253173828125, -0.006377696990966797, -0.005972862243652344, -0.005568027496337891, -0.0051631927490234375, -0.004758358001708984, -0.004353523254394531, -0.003948688507080078, -0.003543853759765625, -0.003139019012451172, -0.0027341842651367188, -0.0023293495178222656, -0.0019245147705078125, -0.0015196800231933594, -0.0011148452758789062, -0.0007100105285644531, -0.00030517578125, 9.965896606445312e-05, 0.0005044937133789062, 0.0009093284606933594, 0.0013141632080078125, 0.0017189979553222656, 0.0021238327026367188, 0.002528667449951172, 0.002933502197265625, 0.003338336944580078, 0.0037431716918945312, 0.004148006439208984, 0.0045528411865234375, 0.004957675933837891, 0.005362510681152344, 0.005767345428466797, 0.00617218017578125, 0.006577014923095703, 0.006981849670410156, 0.007386684417724609, 0.0077915191650390625, 0.008196353912353516, 0.008601188659667969, 0.009006023406982422, 0.009410858154296875, 0.009815692901611328, 0.010220527648925781, 0.010625362396240234, 0.011030197143554688, 0.01143503189086914, 0.011839866638183594, 0.012244701385498047, 0.0126495361328125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 0.0, 4.0, 4.0, 5.0, 5.0, 11.0, 2.0, 5.0, 14.0, 11.0, 9.0, 14.0, 23.0, 16.0, 38.0, 44.0, 32.0, 56.0, 68.0, 70.0, 49.0, 73.0, 66.0, 51.0, 60.0, 69.0, 47.0, 29.0, 44.0, 15.0, 15.0, 16.0, 5.0, 4.0, 6.0, 7.0, 7.0, 2.0, 2.0, 1.0, 1.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.066394805908203e-06, -4.905276000499725e-06, -4.7441571950912476e-06, -4.58303838968277e-06, -4.421919584274292e-06, -4.260800778865814e-06, -4.0996819734573364e-06, -3.938563168048859e-06, -3.777444362640381e-06, -3.616325557231903e-06, -3.4552067518234253e-06, -3.2940879464149475e-06, -3.1329691410064697e-06, -2.971850335597992e-06, -2.810731530189514e-06, -2.6496127247810364e-06, -2.4884939193725586e-06, -2.327375113964081e-06, -2.166256308555603e-06, -2.0051375031471252e-06, -1.8440186977386475e-06, -1.6828998923301697e-06, -1.521781086921692e-06, -1.3606622815132141e-06, -1.1995434761047363e-06, -1.0384246706962585e-06, -8.773058652877808e-07, -7.16187059879303e-07, -5.550682544708252e-07, -3.939494490623474e-07, -2.3283064365386963e-07, -7.171183824539185e-08, 8.940696716308594e-08, 2.505257725715637e-07, 4.116445779800415e-07, 5.727633833885193e-07, 7.338821887969971e-07, 8.950009942054749e-07, 1.0561197996139526e-06, 1.2172386050224304e-06, 1.3783574104309082e-06, 1.539476215839386e-06, 1.7005950212478638e-06, 1.8617138266563416e-06, 2.0228326320648193e-06, 2.183951437473297e-06, 2.345070242881775e-06, 2.5061890482902527e-06, 2.6673078536987305e-06, 2.8284266591072083e-06, 2.989545464515686e-06, 3.150664269924164e-06, 3.3117830753326416e-06, 3.4729018807411194e-06, 3.634020686149597e-06, 3.795139491558075e-06, 3.956258296966553e-06, 4.1173771023750305e-06, 4.278495907783508e-06, 4.439614713191986e-06, 4.600733518600464e-06, 4.761852324008942e-06, 4.9229711294174194e-06, 5.084089934825897e-06, 5.245208740234375e-06]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 3.0, 13.0, 9.0, 23.0, 29.0, 40.0, 65.0, 85.0, 114.0, 164.0, 284.0, 471.0, 790.0, 1414.0, 3084.0, 7706.0, 23491.0, 107738.0, 739355.0, 122895.0, 25836.0, 7972.0, 3209.0, 1540.0, 863.0, 482.0, 290.0, 187.0, 120.0, 78.0, 55.0, 42.0, 34.0, 10.0, 14.0, 12.0, 10.0, 8.0, 6.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.007781982421875, -0.007562994956970215, -0.00734400749206543, -0.0071250200271606445, -0.006906032562255859, -0.006687045097351074, -0.006468057632446289, -0.006249070167541504, -0.006030082702636719, -0.005811095237731934, -0.0055921077728271484, -0.005373120307922363, -0.005154132843017578, -0.004935145378112793, -0.004716157913208008, -0.004497170448303223, -0.0042781829833984375, -0.004059195518493652, -0.003840208053588867, -0.003621220588684082, -0.003402233123779297, -0.0031832456588745117, -0.0029642581939697266, -0.0027452707290649414, -0.0025262832641601562, -0.002307295799255371, -0.002088308334350586, -0.0018693208694458008, -0.0016503334045410156, -0.0014313459396362305, -0.0012123584747314453, -0.0009933710098266602, -0.000774383544921875, -0.0005553960800170898, -0.0003364086151123047, -0.00011742115020751953, 0.00010156631469726562, 0.0003205537796020508, 0.0005395412445068359, 0.0007585287094116211, 0.0009775161743164062, 0.0011965036392211914, 0.0014154911041259766, 0.0016344785690307617, 0.0018534660339355469, 0.002072453498840332, 0.002291440963745117, 0.0025104284286499023, 0.0027294158935546875, 0.0029484033584594727, 0.003167390823364258, 0.003386378288269043, 0.003605365753173828, 0.0038243532180786133, 0.0040433406829833984, 0.004262328147888184, 0.004481315612792969, 0.004700303077697754, 0.004919290542602539, 0.005138278007507324, 0.005357265472412109, 0.0055762529373168945, 0.00579524040222168, 0.006014227867126465, 0.00623321533203125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 3.0, 5.0, 11.0, 6.0, 14.0, 11.0, 25.0, 22.0, 32.0, 43.0, 52.0, 42.0, 54.0, 78.0, 84.0, 87.0, 79.0, 75.0, 58.0, 51.0, 29.0, 28.0, 18.0, 16.0, 7.0, 19.0, 15.0, 8.0, 6.0, 2.0, 2.0, 6.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0100250244140625, -0.00970911979675293, -0.00939321517944336, -0.009077310562133789, -0.008761405944824219, -0.008445501327514648, -0.008129596710205078, -0.007813692092895508, -0.0074977874755859375, -0.007181882858276367, -0.006865978240966797, -0.0065500736236572266, -0.006234169006347656, -0.005918264389038086, -0.005602359771728516, -0.005286455154418945, -0.004970550537109375, -0.004654645919799805, -0.004338741302490234, -0.004022836685180664, -0.0037069320678710938, -0.0033910274505615234, -0.003075122833251953, -0.002759218215942383, -0.0024433135986328125, -0.002127408981323242, -0.0018115043640136719, -0.0014955997467041016, -0.0011796951293945312, -0.0008637905120849609, -0.0005478858947753906, -0.0002319812774658203, 8.392333984375e-05, 0.0003998279571533203, 0.0007157325744628906, 0.001031637191772461, 0.0013475418090820312, 0.0016634464263916016, 0.001979351043701172, 0.002295255661010742, 0.0026111602783203125, 0.002927064895629883, 0.003242969512939453, 0.0035588741302490234, 0.0038747787475585938, 0.004190683364868164, 0.004506587982177734, 0.004822492599487305, 0.005138397216796875, 0.005454301834106445, 0.005770206451416016, 0.006086111068725586, 0.006402015686035156, 0.0067179203033447266, 0.007033824920654297, 0.007349729537963867, 0.0076656341552734375, 0.007981538772583008, 0.008297443389892578, 0.008613348007202148, 0.008929252624511719, 0.009245157241821289, 0.00956106185913086, 0.00987696647644043, 0.01019287109375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 10.0, 11.0, 12.0, 11.0, 43.0, 49.0, 139.0, 347.0, 278.0, 64.0, 20.0, 7.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5150738954544067, -0.4994322657585144, -0.48379063606262207, -0.46814897656440735, -0.452507346868515, -0.4368657171726227, -0.42122405767440796, -0.4055824279785156, -0.3899407982826233, -0.37429916858673096, -0.3586575388908386, -0.3430158793926239, -0.32737424969673157, -0.31173262000083923, -0.2960909605026245, -0.2804493308067322, -0.26480770111083984, -0.2491660714149475, -0.23352442681789398, -0.21788278222084045, -0.20224115252494812, -0.1865995228290558, -0.17095787823200226, -0.15531623363494873, -0.1396746039390564, -0.12403296679258347, -0.10839132964611053, -0.0927496924996376, -0.07710805535316467, -0.06146641820669174, -0.04582478106021881, -0.03018314391374588, -0.014541566371917725, 0.0011000707745552063, 0.016741707921028137, 0.03238334506750107, 0.048024982213974, 0.06366661936044693, 0.07930825650691986, 0.09494989365339279, 0.11059153079986572, 0.12623316049575806, 0.14187480509281158, 0.1575164496898651, 0.17315807938575745, 0.18879970908164978, 0.2044413536787033, 0.22008299827575684, 0.23572462797164917, 0.2513662576675415, 0.26700788736343384, 0.28264954686164856, 0.2982911765575409, 0.3139328062534332, 0.32957446575164795, 0.3452160954475403, 0.3608577251434326, 0.37649935483932495, 0.3921409845352173, 0.407782644033432, 0.42342427372932434, 0.4390659034252167, 0.4547075629234314, 0.47034919261932373, 0.48599082231521606]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 8.0, 5.0, 3.0, 6.0, 4.0, 3.0, 14.0, 11.0, 9.0, 17.0, 23.0, 15.0, 25.0, 15.0, 22.0, 26.0, 28.0, 32.0, 47.0, 88.0, 107.0, 106.0, 64.0, 49.0, 28.0, 30.0, 29.0, 26.0, 17.0, 19.0, 18.0, 20.0, 14.0, 15.0, 15.0, 11.0, 7.0, 4.0, 8.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.11476194858551025, -0.11114710569381714, -0.10753225535154343, -0.10391741245985031, -0.1003025621175766, -0.09668771922588348, -0.09307287633419037, -0.08945803344249725, -0.08584318310022354, -0.08222834020853043, -0.07861348986625671, -0.0749986469745636, -0.07138380408287048, -0.06776895374059677, -0.06415411084890366, -0.06053926423192024, -0.05692441761493683, -0.053309570997953415, -0.04969472438097, -0.046079881489276886, -0.04246503487229347, -0.03885018825531006, -0.03523534536361694, -0.03162049874663353, -0.028005652129650116, -0.024390805512666702, -0.020775960758328438, -0.017161116003990173, -0.01354626938700676, -0.009931422770023346, -0.0063165780156850815, -0.002701733261346817, 0.0009131133556365967, 0.004527959041297436, 0.008142804726958275, 0.011757650412619114, 0.015372496098279953, 0.018987342715263367, 0.02260218746960163, 0.026217032223939896, 0.02983187884092331, 0.03344672545790672, 0.03706157207489014, 0.04067641496658325, 0.044291261583566666, 0.04790610820055008, 0.051520951092243195, 0.05513579770922661, 0.05875064432621002, 0.062365490943193436, 0.06598033756017685, 0.06959518045186996, 0.07321003079414368, 0.07682487368583679, 0.08043971657752991, 0.08405455946922302, 0.08766940981149673, 0.09128425270318985, 0.09489910304546356, 0.09851394593715668, 0.10212878882884979, 0.1057436391711235, 0.10935848206281662, 0.11297333240509033, 0.11658817529678345]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 0.0, 7.0, 5.0, 8.0, 17.0, 12.0, 18.0, 32.0, 25.0, 49.0, 60.0, 107.0, 141.0, 212.0, 306.0, 430.0, 623.0, 1041.0, 1607.0, 2753.0, 5450.0, 12193.0, 36961.0, 198086.0, 2689070.0, 1103875.0, 97411.0, 24334.0, 9142.0, 4278.0, 2237.0, 1369.0, 816.0, 519.0, 352.0, 240.0, 146.0, 95.0, 78.0, 62.0, 44.0, 25.0, 14.0, 10.0, 10.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.027435302734375, -0.02657294273376465, -0.025710582733154297, -0.024848222732543945, -0.023985862731933594, -0.023123502731323242, -0.02226114273071289, -0.02139878273010254, -0.020536422729492188, -0.019674062728881836, -0.018811702728271484, -0.017949342727661133, -0.01708698272705078, -0.01622462272644043, -0.015362262725830078, -0.014499902725219727, -0.013637542724609375, -0.012775182723999023, -0.011912822723388672, -0.01105046272277832, -0.010188102722167969, -0.009325742721557617, -0.008463382720947266, -0.007601022720336914, -0.0067386627197265625, -0.005876302719116211, -0.005013942718505859, -0.004151582717895508, -0.0032892227172851562, -0.0024268627166748047, -0.0015645027160644531, -0.0007021427154541016, 0.00016021728515625, 0.0010225772857666016, 0.0018849372863769531, 0.0027472972869873047, 0.0036096572875976562, 0.004472017288208008, 0.005334377288818359, 0.006196737289428711, 0.0070590972900390625, 0.007921457290649414, 0.008783817291259766, 0.009646177291870117, 0.010508537292480469, 0.01137089729309082, 0.012233257293701172, 0.013095617294311523, 0.013957977294921875, 0.014820337295532227, 0.015682697296142578, 0.01654505729675293, 0.01740741729736328, 0.018269777297973633, 0.019132137298583984, 0.019994497299194336, 0.020856857299804688, 0.02171921730041504, 0.02258157730102539, 0.023443937301635742, 0.024306297302246094, 0.025168657302856445, 0.026031017303466797, 0.02689337730407715, 0.0277557373046875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 7.0, 11.0, 18.0, 23.0, 25.0, 65.0, 93.0, 114.0, 120.0, 120.0, 103.0, 88.0, 58.0, 51.0, 32.0, 33.0, 14.0, 7.0, 6.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0185546875, -0.0179598331451416, -0.017364978790283203, -0.016770124435424805, -0.016175270080566406, -0.015580415725708008, -0.01498556137084961, -0.014390707015991211, -0.013795852661132812, -0.013200998306274414, -0.012606143951416016, -0.012011289596557617, -0.011416435241699219, -0.01082158088684082, -0.010226726531982422, -0.009631872177124023, -0.009037017822265625, -0.008442163467407227, -0.007847309112548828, -0.00725245475769043, -0.006657600402832031, -0.006062746047973633, -0.005467891693115234, -0.004873037338256836, -0.0042781829833984375, -0.003683328628540039, -0.0030884742736816406, -0.002493619918823242, -0.0018987655639648438, -0.0013039112091064453, -0.0007090568542480469, -0.00011420249938964844, 0.00048065185546875, 0.0010755062103271484, 0.0016703605651855469, 0.0022652149200439453, 0.0028600692749023438, 0.003454923629760742, 0.004049777984619141, 0.004644632339477539, 0.0052394866943359375, 0.005834341049194336, 0.006429195404052734, 0.007024049758911133, 0.007618904113769531, 0.00821375846862793, 0.008808612823486328, 0.009403467178344727, 0.009998321533203125, 0.010593175888061523, 0.011188030242919922, 0.01178288459777832, 0.012377738952636719, 0.012972593307495117, 0.013567447662353516, 0.014162302017211914, 0.014757156372070312, 0.015352010726928711, 0.01594686508178711, 0.016541719436645508, 0.017136573791503906, 0.017731428146362305, 0.018326282501220703, 0.0189211368560791, 0.0195159912109375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 8.0, 10.0, 13.0, 33.0, 68.0, 147.0, 439.0, 2143.0, 74696.0, 4111088.0, 4555.0, 663.0, 217.0, 78.0, 43.0, 24.0, 17.0, 10.0, 6.0, 7.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.228759765625, -0.22034835815429688, -0.21193695068359375, -0.20352554321289062, -0.1951141357421875, -0.18670272827148438, -0.17829132080078125, -0.16987991333007812, -0.161468505859375, -0.15305709838867188, -0.14464569091796875, -0.13623428344726562, -0.1278228759765625, -0.11941146850585938, -0.11100006103515625, -0.10258865356445312, -0.09417724609375, -0.08576583862304688, -0.07735443115234375, -0.06894302368164062, -0.0605316162109375, -0.052120208740234375, -0.04370880126953125, -0.035297393798828125, -0.026885986328125, -0.018474578857421875, -0.01006317138671875, -0.001651763916015625, 0.0067596435546875, 0.015171051025390625, 0.02358245849609375, 0.031993865966796875, 0.0404052734375, 0.048816680908203125, 0.05722808837890625, 0.06563949584960938, 0.0740509033203125, 0.08246231079101562, 0.09087371826171875, 0.09928512573242188, 0.107696533203125, 0.11610794067382812, 0.12451934814453125, 0.13293075561523438, 0.1413421630859375, 0.14975357055664062, 0.15816497802734375, 0.16657638549804688, 0.17498779296875, 0.18339920043945312, 0.19181060791015625, 0.20022201538085938, 0.2086334228515625, 0.21704483032226562, 0.22545623779296875, 0.23386764526367188, 0.242279052734375, 0.2506904602050781, 0.25910186767578125, 0.2675132751464844, 0.2759246826171875, 0.2843360900878906, 0.29274749755859375, 0.3011589050292969, 0.3095703125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 6.0, 6.0, 1.0, 5.0, 7.0, 7.0, 12.0, 15.0, 19.0, 50.0, 74.0, 149.0, 299.0, 869.0, 1491.0, 607.0, 226.0, 116.0, 59.0, 28.0, 11.0, 12.0, 7.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1168212890625, -0.11351394653320312, -0.11020660400390625, -0.10689926147460938, -0.1035919189453125, -0.10028457641601562, -0.09697723388671875, -0.09366989135742188, -0.090362548828125, -0.08705520629882812, -0.08374786376953125, -0.08044052124023438, -0.0771331787109375, -0.07382583618164062, -0.07051849365234375, -0.06721115112304688, -0.06390380859375, -0.060596466064453125, -0.05728912353515625, -0.053981781005859375, -0.0506744384765625, -0.047367095947265625, -0.04405975341796875, -0.040752410888671875, -0.037445068359375, -0.034137725830078125, -0.03083038330078125, -0.027523040771484375, -0.0242156982421875, -0.020908355712890625, -0.01760101318359375, -0.014293670654296875, -0.010986328125, -0.007678985595703125, -0.00437164306640625, -0.001064300537109375, 0.0022430419921875, 0.005550384521484375, 0.00885772705078125, 0.012165069580078125, 0.015472412109375, 0.018779754638671875, 0.02208709716796875, 0.025394439697265625, 0.0287017822265625, 0.032009124755859375, 0.03531646728515625, 0.038623809814453125, 0.04193115234375, 0.045238494873046875, 0.04854583740234375, 0.051853179931640625, 0.0551605224609375, 0.058467864990234375, 0.06177520751953125, 0.06508255004882812, 0.068389892578125, 0.07169723510742188, 0.07500457763671875, 0.07831192016601562, 0.0816192626953125, 0.08492660522460938, 0.08823394775390625, 0.09154129028320312, 0.0948486328125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 10.0, 14.0, 21.0, 44.0, 43.0, 98.0, 161.0, 254.0, 165.0, 73.0, 39.0, 23.0, 18.0, 14.0, 7.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0], "bins": [-1.0359103679656982, -1.015360951423645, -0.994811475276947, -0.974261999130249, -0.9537125825881958, -0.9331631660461426, -0.9126136898994446, -0.8920642137527466, -0.8715147972106934, -0.8509653806686401, -0.8304159045219421, -0.8098664283752441, -0.7893170118331909, -0.7687675952911377, -0.7482181191444397, -0.7276686429977417, -0.7071192264556885, -0.6865698099136353, -0.6660203337669373, -0.6454708576202393, -0.624921441078186, -0.6043720245361328, -0.5838225483894348, -0.5632730722427368, -0.5427236557006836, -0.5221742391586304, -0.5016247630119324, -0.48107531666755676, -0.46052587032318115, -0.43997642397880554, -0.41942697763442993, -0.3988775312900543, -0.3783281147480011, -0.3577786684036255, -0.3372292220592499, -0.31667977571487427, -0.29613032937049866, -0.27558088302612305, -0.25503143668174744, -0.23448199033737183, -0.21393254399299622, -0.1933830976486206, -0.172833651304245, -0.15228420495986938, -0.13173475861549377, -0.11118531227111816, -0.09063586592674255, -0.07008641958236694, -0.04953697323799133, -0.028987526893615723, -0.008438080549240112, 0.012111365795135498, 0.03266081213951111, 0.05321025848388672, 0.07375970482826233, 0.09430915117263794, 0.11485859751701355, 0.13540804386138916, 0.15595749020576477, 0.17650693655014038, 0.197056382894516, 0.2176058292388916, 0.2381552755832672, 0.2587047219276428, 0.27925416827201843]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 4.0, 3.0, 4.0, 5.0, 9.0, 9.0, 17.0, 25.0, 26.0, 24.0, 37.0, 43.0, 57.0, 72.0, 80.0, 105.0, 77.0, 71.0, 64.0, 49.0, 64.0, 39.0, 32.0, 27.0, 21.0, 16.0, 8.0, 9.0, 3.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.566375195980072, -0.5489749312400818, -0.5315747261047363, -0.5141744613647461, -0.49677419662475586, -0.4793739318847656, -0.4619736969470978, -0.44457346200942993, -0.4271731972694397, -0.40977293252944946, -0.3923726975917816, -0.37497246265411377, -0.35757219791412354, -0.3401719331741333, -0.32277169823646545, -0.3053714632987976, -0.2879711985588074, -0.27057093381881714, -0.2531706988811493, -0.23577044904232025, -0.2183701992034912, -0.20096994936466217, -0.18356969952583313, -0.1661694496870041, -0.14876919984817505, -0.131368950009346, -0.11396870017051697, -0.09656845033168793, -0.07916820049285889, -0.061767950654029846, -0.044367700815200806, -0.026967450976371765, -0.0095672607421875, 0.00783298909664154, 0.02523323893547058, 0.04263348877429962, 0.06003373861312866, 0.0774339884519577, 0.09483423829078674, 0.11223448812961578, 0.12963473796844482, 0.14703498780727386, 0.1644352376461029, 0.18183548748493195, 0.199235737323761, 0.21663598716259003, 0.23403623700141907, 0.2514364719390869, 0.26883673667907715, 0.2862370014190674, 0.30363723635673523, 0.3210374712944031, 0.3384377360343933, 0.35583800077438354, 0.3732382357120514, 0.39063847064971924, 0.4080387353897095, 0.4254390001296997, 0.44283923506736755, 0.4602394700050354, 0.47763973474502563, 0.49503999948501587, 0.5124402046203613, 0.5298404693603516, 0.5472407341003418]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 7.0, 2.0, 2.0, 6.0, 12.0, 22.0, 33.0, 53.0, 96.0, 158.0, 373.0, 904.0, 3346.0, 19965.0, 757643.0, 250296.0, 11870.0, 2413.0, 736.0, 275.0, 139.0, 88.0, 46.0, 27.0, 13.0, 10.0, 4.0, 3.0, 3.0, 5.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1527099609375, -0.14806556701660156, -0.14342117309570312, -0.1387767791748047, -0.13413238525390625, -0.1294879913330078, -0.12484359741210938, -0.12019920349121094, -0.1155548095703125, -0.11091041564941406, -0.10626602172851562, -0.10162162780761719, -0.09697723388671875, -0.09233283996582031, -0.08768844604492188, -0.08304405212402344, -0.078399658203125, -0.07375526428222656, -0.06911087036132812, -0.06446647644042969, -0.05982208251953125, -0.05517768859863281, -0.050533294677734375, -0.04588890075683594, -0.0412445068359375, -0.03660011291503906, -0.031955718994140625, -0.027311325073242188, -0.02266693115234375, -0.018022537231445312, -0.013378143310546875, -0.008733749389648438, -0.00408935546875, 0.0005550384521484375, 0.005199432373046875, 0.009843826293945312, 0.01448822021484375, 0.019132614135742188, 0.023777008056640625, 0.028421401977539062, 0.0330657958984375, 0.03771018981933594, 0.042354583740234375, 0.04699897766113281, 0.05164337158203125, 0.05628776550292969, 0.060932159423828125, 0.06557655334472656, 0.070220947265625, 0.07486534118652344, 0.07950973510742188, 0.08415412902832031, 0.08879852294921875, 0.09344291687011719, 0.09808731079101562, 0.10273170471191406, 0.1073760986328125, 0.11202049255371094, 0.11666488647460938, 0.12130928039550781, 0.12595367431640625, 0.1305980682373047, 0.13524246215820312, 0.13988685607910156, 0.14453125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 7.0, 15.0, 20.0, 23.0, 33.0, 52.0, 50.0, 74.0, 99.0, 117.0, 111.0, 108.0, 83.0, 60.0, 39.0, 33.0, 26.0, 16.0, 13.0, 9.0, 6.0, 7.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04345703125, -0.042314767837524414, -0.04117250442504883, -0.04003024101257324, -0.038887977600097656, -0.03774571418762207, -0.036603450775146484, -0.0354611873626709, -0.03431892395019531, -0.03317666053771973, -0.03203439712524414, -0.030892133712768555, -0.02974987030029297, -0.028607606887817383, -0.027465343475341797, -0.02632308006286621, -0.025180816650390625, -0.02403855323791504, -0.022896289825439453, -0.021754026412963867, -0.02061176300048828, -0.019469499588012695, -0.01832723617553711, -0.017184972763061523, -0.016042709350585938, -0.014900445938110352, -0.013758182525634766, -0.01261591911315918, -0.011473655700683594, -0.010331392288208008, -0.009189128875732422, -0.008046865463256836, -0.00690460205078125, -0.005762338638305664, -0.004620075225830078, -0.003477811813354492, -0.0023355484008789062, -0.0011932849884033203, -5.1021575927734375e-05, 0.0010912418365478516, 0.0022335052490234375, 0.0033757686614990234, 0.004518032073974609, 0.005660295486450195, 0.006802558898925781, 0.007944822311401367, 0.009087085723876953, 0.010229349136352539, 0.011371612548828125, 0.012513875961303711, 0.013656139373779297, 0.014798402786254883, 0.01594066619873047, 0.017082929611206055, 0.01822519302368164, 0.019367456436157227, 0.020509719848632812, 0.0216519832611084, 0.022794246673583984, 0.02393651008605957, 0.025078773498535156, 0.026221036911010742, 0.027363300323486328, 0.028505563735961914, 0.0296478271484375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 7.0, 9.0, 6.0, 23.0, 36.0, 69.0, 119.0, 295.0, 695.0, 2842.0, 37206.0, 986371.0, 17721.0, 2026.0, 599.0, 236.0, 120.0, 66.0, 37.0, 23.0, 16.0, 11.0, 8.0, 3.0, 4.0, 5.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1195068359375, -0.11334419250488281, -0.10718154907226562, -0.10101890563964844, -0.09485626220703125, -0.08869361877441406, -0.08253097534179688, -0.07636833190917969, -0.0702056884765625, -0.06404304504394531, -0.057880401611328125, -0.05171775817871094, -0.04555511474609375, -0.03939247131347656, -0.033229827880859375, -0.027067184448242188, -0.020904541015625, -0.014741897583007812, -0.008579254150390625, -0.0024166107177734375, 0.00374603271484375, 0.009908676147460938, 0.016071319580078125, 0.022233963012695312, 0.0283966064453125, 0.03455924987792969, 0.040721893310546875, 0.04688453674316406, 0.05304718017578125, 0.05920982360839844, 0.06537246704101562, 0.07153511047363281, 0.07769775390625, 0.08386039733886719, 0.09002304077148438, 0.09618568420410156, 0.10234832763671875, 0.10851097106933594, 0.11467361450195312, 0.12083625793457031, 0.1269989013671875, 0.1331615447998047, 0.13932418823242188, 0.14548683166503906, 0.15164947509765625, 0.15781211853027344, 0.16397476196289062, 0.1701374053955078, 0.176300048828125, 0.1824626922607422, 0.18862533569335938, 0.19478797912597656, 0.20095062255859375, 0.20711326599121094, 0.21327590942382812, 0.2194385528564453, 0.2256011962890625, 0.2317638397216797, 0.23792648315429688, 0.24408912658691406, 0.25025177001953125, 0.25641441345214844, 0.2625770568847656, 0.2687397003173828, 0.27490234375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 2.0, 6.0, 17.0, 7.0, 20.0, 27.0, 31.0, 42.0, 60.0, 78.0, 128.0, 134.0, 120.0, 81.0, 60.0, 48.0, 32.0, 30.0, 23.0, 18.0, 12.0, 9.0, 6.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1607666015625, -0.15582275390625, -0.15087890625, -0.14593505859375, -0.1409912109375, -0.13604736328125, -0.131103515625, -0.12615966796875, -0.1212158203125, -0.11627197265625, -0.111328125, -0.10638427734375, -0.1014404296875, -0.09649658203125, -0.091552734375, -0.08660888671875, -0.0816650390625, -0.07672119140625, -0.07177734375, -0.06683349609375, -0.0618896484375, -0.05694580078125, -0.052001953125, -0.04705810546875, -0.0421142578125, -0.03717041015625, -0.0322265625, -0.02728271484375, -0.0223388671875, -0.01739501953125, -0.012451171875, -0.00750732421875, -0.0025634765625, 0.00238037109375, 0.00732421875, 0.01226806640625, 0.0172119140625, 0.02215576171875, 0.027099609375, 0.03204345703125, 0.0369873046875, 0.04193115234375, 0.046875, 0.05181884765625, 0.0567626953125, 0.06170654296875, 0.066650390625, 0.07159423828125, 0.0765380859375, 0.08148193359375, 0.08642578125, 0.09136962890625, 0.0963134765625, 0.10125732421875, 0.106201171875, 0.11114501953125, 0.1160888671875, 0.12103271484375, 0.1259765625, 0.13092041015625, 0.1358642578125, 0.14080810546875, 0.145751953125, 0.15069580078125, 0.1556396484375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 7.0, 5.0, 5.0, 12.0, 16.0, 9.0, 25.0, 34.0, 45.0, 62.0, 88.0, 157.0, 258.0, 532.0, 1228.0, 2930.0, 8880.0, 40186.0, 862049.0, 107795.0, 16326.0, 4539.0, 1731.0, 700.0, 352.0, 193.0, 128.0, 73.0, 54.0, 39.0, 21.0, 13.0, 12.0, 4.0, 9.0, 6.0, 4.0, 2.0, 6.0, 6.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0166168212890625, -0.016108989715576172, -0.015601158142089844, -0.015093326568603516, -0.014585494995117188, -0.01407766342163086, -0.013569831848144531, -0.013062000274658203, -0.012554168701171875, -0.012046337127685547, -0.011538505554199219, -0.01103067398071289, -0.010522842407226562, -0.010015010833740234, -0.009507179260253906, -0.008999347686767578, -0.00849151611328125, -0.007983684539794922, -0.007475852966308594, -0.006968021392822266, -0.0064601898193359375, -0.005952358245849609, -0.005444526672363281, -0.004936695098876953, -0.004428863525390625, -0.003921031951904297, -0.0034132003784179688, -0.0029053688049316406, -0.0023975372314453125, -0.0018897056579589844, -0.0013818740844726562, -0.0008740425109863281, -0.0003662109375, 0.00014162063598632812, 0.0006494522094726562, 0.0011572837829589844, 0.0016651153564453125, 0.0021729469299316406, 0.0026807785034179688, 0.003188610076904297, 0.003696441650390625, 0.004204273223876953, 0.004712104797363281, 0.005219936370849609, 0.0057277679443359375, 0.006235599517822266, 0.006743431091308594, 0.007251262664794922, 0.00775909423828125, 0.008266925811767578, 0.008774757385253906, 0.009282588958740234, 0.009790420532226562, 0.01029825210571289, 0.010806083679199219, 0.011313915252685547, 0.011821746826171875, 0.012329578399658203, 0.012837409973144531, 0.01334524154663086, 0.013853073120117188, 0.014360904693603516, 0.014868736267089844, 0.015376567840576172, 0.0158843994140625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 9.0, 5.0, 6.0, 11.0, 8.0, 18.0, 12.0, 16.0, 18.0, 36.0, 41.0, 45.0, 46.0, 70.0, 69.0, 81.0, 83.0, 60.0, 74.0, 61.0, 53.0, 45.0, 20.0, 25.0, 22.0, 14.0, 5.0, 8.0, 7.0, 12.0, 3.0, 4.0, 1.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.867813110351562e-06, -7.642433047294617e-06, -7.417052984237671e-06, -7.191672921180725e-06, -6.966292858123779e-06, -6.7409127950668335e-06, -6.515532732009888e-06, -6.290152668952942e-06, -6.064772605895996e-06, -5.83939254283905e-06, -5.6140124797821045e-06, -5.388632416725159e-06, -5.163252353668213e-06, -4.937872290611267e-06, -4.712492227554321e-06, -4.4871121644973755e-06, -4.26173210144043e-06, -4.036352038383484e-06, -3.810971975326538e-06, -3.5855919122695923e-06, -3.3602118492126465e-06, -3.1348317861557007e-06, -2.909451723098755e-06, -2.684071660041809e-06, -2.4586915969848633e-06, -2.2333115339279175e-06, -2.0079314708709717e-06, -1.7825514078140259e-06, -1.55717134475708e-06, -1.3317912817001343e-06, -1.1064112186431885e-06, -8.810311555862427e-07, -6.556510925292969e-07, -4.302710294723511e-07, -2.0489096641540527e-07, 2.0489096641540527e-08, 2.4586915969848633e-07, 4.7124922275543213e-07, 6.966292858123779e-07, 9.220093488693237e-07, 1.1473894119262695e-06, 1.3727694749832153e-06, 1.5981495380401611e-06, 1.823529601097107e-06, 2.0489096641540527e-06, 2.2742897272109985e-06, 2.4996697902679443e-06, 2.72504985332489e-06, 2.950429916381836e-06, 3.1758099794387817e-06, 3.4011900424957275e-06, 3.6265701055526733e-06, 3.851950168609619e-06, 4.077330231666565e-06, 4.302710294723511e-06, 4.5280903577804565e-06, 4.753470420837402e-06, 4.978850483894348e-06, 5.204230546951294e-06, 5.42961061000824e-06, 5.6549906730651855e-06, 5.880370736122131e-06, 6.105750799179077e-06, 6.331130862236023e-06, 6.556510925292969e-06]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 4.0, 6.0, 7.0, 6.0, 19.0, 15.0, 31.0, 43.0, 55.0, 92.0, 124.0, 215.0, 384.0, 711.0, 1496.0, 3978.0, 17798.0, 659033.0, 340635.0, 17040.0, 3909.0, 1378.0, 671.0, 343.0, 189.0, 138.0, 75.0, 57.0, 29.0, 26.0, 15.0, 11.0, 8.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.011077880859375, -0.010770082473754883, -0.010462284088134766, -0.010154485702514648, -0.009846687316894531, -0.009538888931274414, -0.009231090545654297, -0.00892329216003418, -0.008615493774414062, -0.008307695388793945, -0.007999897003173828, -0.007692098617553711, -0.007384300231933594, -0.0070765018463134766, -0.006768703460693359, -0.006460905075073242, -0.006153106689453125, -0.005845308303833008, -0.005537509918212891, -0.0052297115325927734, -0.004921913146972656, -0.004614114761352539, -0.004306316375732422, -0.003998517990112305, -0.0036907196044921875, -0.0033829212188720703, -0.003075122833251953, -0.002767324447631836, -0.0024595260620117188, -0.0021517276763916016, -0.0018439292907714844, -0.0015361309051513672, -0.00122833251953125, -0.0009205341339111328, -0.0006127357482910156, -0.00030493736267089844, 2.86102294921875e-06, 0.00031065940856933594, 0.0006184577941894531, 0.0009262561798095703, 0.0012340545654296875, 0.0015418529510498047, 0.0018496513366699219, 0.002157449722290039, 0.0024652481079101562, 0.0027730464935302734, 0.0030808448791503906, 0.003388643264770508, 0.003696441650390625, 0.004004240036010742, 0.004312038421630859, 0.0046198368072509766, 0.004927635192871094, 0.005235433578491211, 0.005543231964111328, 0.005851030349731445, 0.0061588287353515625, 0.00646662712097168, 0.006774425506591797, 0.007082223892211914, 0.007390022277832031, 0.0076978206634521484, 0.008005619049072266, 0.008313417434692383, 0.0086212158203125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 5.0, 6.0, 14.0, 21.0, 21.0, 38.0, 51.0, 91.0, 119.0, 138.0, 120.0, 100.0, 95.0, 61.0, 36.0, 21.0, 23.0, 8.0, 8.0, 7.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0209503173828125, -0.020254850387573242, -0.019559383392333984, -0.018863916397094727, -0.01816844940185547, -0.01747298240661621, -0.016777515411376953, -0.016082048416137695, -0.015386581420898438, -0.01469111442565918, -0.013995647430419922, -0.013300180435180664, -0.012604713439941406, -0.011909246444702148, -0.01121377944946289, -0.010518312454223633, -0.009822845458984375, -0.009127378463745117, -0.00843191146850586, -0.0077364444732666016, -0.007040977478027344, -0.006345510482788086, -0.005650043487548828, -0.00495457649230957, -0.0042591094970703125, -0.0035636425018310547, -0.002868175506591797, -0.002172708511352539, -0.0014772415161132812, -0.0007817745208740234, -8.630752563476562e-05, 0.0006091594696044922, 0.00130462646484375, 0.002000093460083008, 0.0026955604553222656, 0.0033910274505615234, 0.004086494445800781, 0.004781961441040039, 0.005477428436279297, 0.006172895431518555, 0.0068683624267578125, 0.00756382942199707, 0.008259296417236328, 0.008954763412475586, 0.009650230407714844, 0.010345697402954102, 0.01104116439819336, 0.011736631393432617, 0.012432098388671875, 0.013127565383911133, 0.01382303237915039, 0.014518499374389648, 0.015213966369628906, 0.015909433364868164, 0.016604900360107422, 0.01730036735534668, 0.017995834350585938, 0.018691301345825195, 0.019386768341064453, 0.02008223533630371, 0.02077770233154297, 0.021473169326782227, 0.022168636322021484, 0.022864103317260742, 0.0235595703125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 0.0, 10.0, 18.0, 35.0, 103.0, 511.0, 246.0, 46.0, 24.0, 10.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.8921020030975342, -1.8548486232757568, -1.81759512424469, -1.7803417444229126, -1.7430883646011353, -1.7058348655700684, -1.668581485748291, -1.6313281059265137, -1.5940747261047363, -1.556821346282959, -1.519567847251892, -1.4823144674301147, -1.4450610876083374, -1.4078075885772705, -1.3705542087554932, -1.3333008289337158, -1.296047329902649, -1.2587939500808716, -1.2215404510498047, -1.1842870712280273, -1.14703369140625, -1.1097803115844727, -1.0725268125534058, -1.0352734327316284, -0.9980199933052063, -0.9607665538787842, -0.9235131740570068, -0.8862597346305847, -0.8490062952041626, -0.8117529153823853, -0.7744994759559631, -0.737246036529541, -0.6999927759170532, -0.6627393364906311, -0.6254859566688538, -0.5882325172424316, -0.5509791374206543, -0.5137256979942322, -0.47647225856781006, -0.4392188489437103, -0.4019654393196106, -0.36471202969551086, -0.32745862007141113, -0.290205180644989, -0.2529517710208893, -0.21569836139678955, -0.17844493687152863, -0.1411915123462677, -0.10393810272216797, -0.06668468564748764, -0.029431268572807312, 0.007822148501873016, 0.045075565576553345, 0.08232897520065308, 0.119582399725914, 0.15683582425117493, 0.19408923387527466, 0.2313426434993744, 0.2685960531234741, 0.30584949254989624, 0.34310290217399597, 0.3803563117980957, 0.4176097512245178, 0.45486316084861755, 0.4921165704727173]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 4.0, 4.0, 7.0, 9.0, 5.0, 8.0, 12.0, 32.0, 22.0, 23.0, 28.0, 29.0, 36.0, 89.0, 103.0, 64.0, 48.0, 93.0, 108.0, 78.0, 39.0, 21.0, 19.0, 15.0, 17.0, 10.0, 10.0, 14.0, 11.0, 8.0, 4.0, 2.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 3.0, 2.0], "bins": [-0.3038482069969177, -0.2952592968940735, -0.28667035698890686, -0.27808141708374023, -0.269492506980896, -0.26090359687805176, -0.25231465697288513, -0.2437257319688797, -0.23513680696487427, -0.22654788196086884, -0.2179589569568634, -0.20937003195285797, -0.20078110694885254, -0.1921921819448471, -0.18360325694084167, -0.17501433193683624, -0.1664254069328308, -0.15783648192882538, -0.14924755692481995, -0.14065863192081451, -0.13206970691680908, -0.12348078191280365, -0.11489185690879822, -0.10630293190479279, -0.09771400690078735, -0.08912508189678192, -0.08053615689277649, -0.07194723188877106, -0.06335830688476562, -0.05476938188076019, -0.04618045687675476, -0.03759153187274933, -0.029002606868743896, -0.020413681864738464, -0.011824756860733032, -0.0032358318567276, 0.005353093147277832, 0.013942018151283264, 0.022530943155288696, 0.03111986815929413, 0.03970879316329956, 0.04829771816730499, 0.056886643171310425, 0.06547556817531586, 0.07406449317932129, 0.08265341818332672, 0.09124234318733215, 0.09983126819133759, 0.10842019319534302, 0.11700911819934845, 0.12559804320335388, 0.13418696820735931, 0.14277589321136475, 0.15136481821537018, 0.1599537432193756, 0.16854266822338104, 0.17713159322738647, 0.1857205182313919, 0.19430944323539734, 0.20289836823940277, 0.2114872932434082, 0.22007621824741364, 0.22866514325141907, 0.2372540682554245, 0.24584299325942993]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 2.0, 9.0, 9.0, 17.0, 16.0, 29.0, 39.0, 34.0, 62.0, 213.0, 284.0, 78.0, 48.0, 45.0, 33.0, 28.0, 11.0, 15.0, 11.0, 4.0, 6.0, 1.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031524658203125, -0.030510902404785156, -0.029497146606445312, -0.02848339080810547, -0.027469635009765625, -0.02645587921142578, -0.025442123413085938, -0.024428367614746094, -0.02341461181640625, -0.022400856018066406, -0.021387100219726562, -0.02037334442138672, -0.019359588623046875, -0.01834583282470703, -0.017332077026367188, -0.016318321228027344, -0.0153045654296875, -0.014290809631347656, -0.013277053833007812, -0.012263298034667969, -0.011249542236328125, -0.010235786437988281, -0.009222030639648438, -0.008208274841308594, -0.00719451904296875, -0.006180763244628906, -0.0051670074462890625, -0.004153251647949219, -0.003139495849609375, -0.0021257400512695312, -0.0011119842529296875, -9.822845458984375e-05, 0.00091552734375, 0.0019292831420898438, 0.0029430389404296875, 0.003956794738769531, 0.004970550537109375, 0.005984306335449219, 0.0069980621337890625, 0.008011817932128906, 0.00902557373046875, 0.010039329528808594, 0.011053085327148438, 0.012066841125488281, 0.013080596923828125, 0.014094352722167969, 0.015108108520507812, 0.016121864318847656, 0.0171356201171875, 0.018149375915527344, 0.019163131713867188, 0.02017688751220703, 0.021190643310546875, 0.02220439910888672, 0.023218154907226562, 0.024231910705566406, 0.02524566650390625, 0.026259422302246094, 0.027273178100585938, 0.02828693389892578, 0.029300689697265625, 0.03031444549560547, 0.03132820129394531, 0.032341957092285156, 0.033355712890625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 1.0, 1.0, 9.0, 0.0, 12.0, 3.0, 3.0, 12.0, 27.0, 18.0, 17.0, 30.0, 65.0, 76.0, 171.0, 420.0, 1627.0, 33356.0, 8348995.0, 2780.0, 522.0, 176.0, 90.0, 59.0, 45.0, 22.0, 15.0, 2.0, 7.0, 5.0, 5.0, 3.0, 4.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4398147165775299, -0.42886215448379517, -0.4179095923900604, -0.4069570302963257, -0.39600449800491333, -0.3850519359111786, -0.37409937381744385, -0.3631468117237091, -0.35219424962997437, -0.3412416875362396, -0.3302891254425049, -0.31933656334877014, -0.3083840012550354, -0.29743146896362305, -0.2864789068698883, -0.27552634477615356, -0.2645737826824188, -0.2536212205886841, -0.24266865849494934, -0.2317161113023758, -0.22076354920864105, -0.2098109871149063, -0.19885843992233276, -0.18790587782859802, -0.17695331573486328, -0.16600075364112854, -0.1550481915473938, -0.14409564435482025, -0.1331430822610855, -0.12219052016735077, -0.11123796552419662, -0.10028541088104248, -0.08933281898498535, -0.07838025689125061, -0.06742770224809647, -0.05647514387965202, -0.04552258551120758, -0.03457002714276314, -0.023617468774318695, -0.01266491413116455, -0.0017123520374298096, 0.009240206331014633, 0.020192764699459076, 0.03114532306790352, 0.04209788143634796, 0.053050439804792404, 0.06400299817323685, 0.07495555281639099, 0.08590811491012573, 0.09686067700386047, 0.10781323164701462, 0.11876578629016876, 0.1297183483839035, 0.14067091047763824, 0.1516234576702118, 0.16257601976394653, 0.17352858185768127, 0.18448114395141602, 0.19543370604515076, 0.2063862532377243, 0.21733881533145905, 0.2282913774251938, 0.23924392461776733, 0.2501964867115021, 0.2611490488052368]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 2.0, 1.0, 3.0, 5.0, 0.0, 3.0, 5.0, 2.0, 2.0, 7.0, 5.0, 8.0, 7.0, 2.0, 8.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.07983268797397614, -0.07632064074277878, -0.07280860096216202, -0.06929655373096466, -0.0657845139503479, -0.06227246671915054, -0.058760419487953186, -0.05524837598204613, -0.05173633247613907, -0.04822428897023201, -0.04471224546432495, -0.041200198233127594, -0.037688154727220535, -0.03417611122131348, -0.03066406585276127, -0.02715202048420906, -0.023639976978302002, -0.020127933472394943, -0.016615888103842735, -0.013103843666613102, -0.009591799229383469, -0.00607975572347641, -0.002567710354924202, 0.000944335013628006, 0.004456378519535065, 0.007968422956764698, 0.011480467393994331, 0.014992511831223965, 0.018504556268453598, 0.022016599774360657, 0.025528645142912865, 0.029040690511465073, 0.03255273401737213, 0.03606477752327919, 0.03957682102918625, 0.043088868260383606, 0.046600911766290665, 0.05011295527219772, 0.05362500250339508, 0.05713704600930214, 0.0606490895152092, 0.06416113674640656, 0.06767317652702332, 0.07118522375822067, 0.07469727098941803, 0.07820931077003479, 0.08172135800123215, 0.0852334052324295, 0.08874544501304626, 0.09225749224424362, 0.09576953202486038, 0.09928157925605774, 0.1027936190366745, 0.10630566626787186, 0.10981771349906921, 0.11332975327968597, 0.11684180051088333, 0.12035384774208069, 0.12386588752269745, 0.1273779273033142, 0.13088998198509216, 0.13440202176570892, 0.13791406154632568, 0.14142611622810364, 0.1449381560087204]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 3.0, 6.0, 9.0, 11.0, 19.0, 25.0, 19.0, 46.0, 55.0, 106.0, 140.0, 287.0, 516.0, 981.0, 2429.0, 6230.0, 19363.0, 73765.0, 243797.0, 128471.0, 31796.0, 9601.0, 3511.0, 1422.0, 710.0, 364.0, 230.0, 120.0, 75.0, 56.0, 37.0, 16.0, 10.0, 8.0, 10.0, 7.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1815185546875, -0.17670249938964844, -0.17188644409179688, -0.1670703887939453, -0.16225433349609375, -0.1574382781982422, -0.15262222290039062, -0.14780616760253906, -0.1429901123046875, -0.13817405700683594, -0.13335800170898438, -0.1285419464111328, -0.12372589111328125, -0.11890983581542969, -0.11409378051757812, -0.10927772521972656, -0.104461669921875, -0.09964561462402344, -0.09482955932617188, -0.09001350402832031, -0.08519744873046875, -0.08038139343261719, -0.07556533813476562, -0.07074928283691406, -0.0659332275390625, -0.06111717224121094, -0.056301116943359375, -0.05148506164550781, -0.04666900634765625, -0.04185295104980469, -0.037036895751953125, -0.03222084045410156, -0.02740478515625, -0.022588729858398438, -0.017772674560546875, -0.012956619262695312, -0.00814056396484375, -0.0033245086669921875, 0.001491546630859375, 0.0063076019287109375, 0.0111236572265625, 0.015939712524414062, 0.020755767822265625, 0.025571823120117188, 0.03038787841796875, 0.03520393371582031, 0.040019989013671875, 0.04483604431152344, 0.049652099609375, 0.05446815490722656, 0.059284210205078125, 0.06410026550292969, 0.06891632080078125, 0.07373237609863281, 0.07854843139648438, 0.08336448669433594, 0.0881805419921875, 0.09299659729003906, 0.09781265258789062, 0.10262870788574219, 0.10744476318359375, 0.11226081848144531, 0.11707687377929688, 0.12189292907714844, 0.126708984375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 7.0, 5.0, 3.0, 7.0, 9.0, 12.0, 11.0, 22.0, 26.0, 30.0, 44.0, 63.0, 74.0, 88.0, 99.0, 90.0, 102.0, 61.0, 54.0, 36.0, 40.0, 16.0, 28.0, 10.0, 17.0, 10.0, 11.0, 7.0, 8.0, 3.0, 5.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0380859375, -0.037030696868896484, -0.03597545623779297, -0.03492021560668945, -0.03386497497558594, -0.03280973434448242, -0.031754493713378906, -0.03069925308227539, -0.029644012451171875, -0.02858877182006836, -0.027533531188964844, -0.026478290557861328, -0.025423049926757812, -0.024367809295654297, -0.02331256866455078, -0.022257328033447266, -0.02120208740234375, -0.020146846771240234, -0.01909160614013672, -0.018036365509033203, -0.016981124877929688, -0.015925884246826172, -0.014870643615722656, -0.01381540298461914, -0.012760162353515625, -0.01170492172241211, -0.010649681091308594, -0.009594440460205078, -0.008539199829101562, -0.007483959197998047, -0.006428718566894531, -0.005373477935791016, -0.0043182373046875, -0.0032629966735839844, -0.0022077560424804688, -0.0011525154113769531, -9.72747802734375e-05, 0.0009579658508300781, 0.0020132064819335938, 0.0030684471130371094, 0.004123687744140625, 0.005178928375244141, 0.006234169006347656, 0.007289409637451172, 0.008344650268554688, 0.009399890899658203, 0.010455131530761719, 0.011510372161865234, 0.01256561279296875, 0.013620853424072266, 0.014676094055175781, 0.015731334686279297, 0.016786575317382812, 0.017841815948486328, 0.018897056579589844, 0.01995229721069336, 0.021007537841796875, 0.02206277847290039, 0.023118019104003906, 0.024173259735107422, 0.025228500366210938, 0.026283740997314453, 0.02733898162841797, 0.028394222259521484, 0.029449462890625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 18.0, 105.0, 197.0, 78.0, 41.0, 22.0, 10.0, 8.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8479621410369873, -0.8298379778862, -0.8117138743400574, -0.79358971118927, -0.7754656076431274, -0.7573414444923401, -0.7392173409461975, -0.7210931777954102, -0.7029690742492676, -0.6848449110984802, -0.6667208075523376, -0.6485966444015503, -0.6304725408554077, -0.6123483777046204, -0.5942242741584778, -0.5761001110076904, -0.5579760074615479, -0.5398518443107605, -0.5217277407646179, -0.5036035776138306, -0.485479474067688, -0.467355340719223, -0.44923120737075806, -0.4311070442199707, -0.41298288106918335, -0.3948587477207184, -0.3767346143722534, -0.35861048102378845, -0.3404863476753235, -0.3223622143268585, -0.30423808097839355, -0.2861139178276062, -0.267989844083786, -0.24986571073532104, -0.23174157738685608, -0.2136174440383911, -0.19549331068992615, -0.17736917734146118, -0.15924502909183502, -0.14112089574337006, -0.12299676239490509, -0.10487262904644012, -0.08674849569797516, -0.0686243548989296, -0.05050022155046463, -0.032376088201999664, -0.014251947402954102, 0.0038721859455108643, 0.02199631929397583, 0.040120452642440796, 0.05824458971619606, 0.07636872678995132, 0.09449286013841629, 0.11261699348688126, 0.13074113428592682, 0.14886526763439178, 0.16698940098285675, 0.18511353433132172, 0.20323766767978668, 0.22136181592941284, 0.2394859492778778, 0.2576100826263428, 0.27573421597480774, 0.2938583493232727, 0.31198248267173767]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 2.0, 9.0, 11.0, 10.0, 53.0, 113.0, 124.0, 85.0, 22.0, 19.0, 11.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1873171329498291, -0.1781158745288849, -0.16891461610794067, -0.15971335768699646, -0.15051209926605225, -0.14131084084510803, -0.132109597325325, -0.1229083389043808, -0.11370708048343658, -0.10450582206249237, -0.09530456364154816, -0.08610331267118454, -0.07690205425024033, -0.06770079582929611, -0.0584995411336422, -0.04929828643798828, -0.04009702801704407, -0.030895771458745003, -0.021694514900445938, -0.012493258342146873, -0.003292001783847809, 0.005909256637096405, 0.01511051133275032, 0.024311766028404236, 0.03351302444934845, 0.042714282870292664, 0.05191553756594658, 0.061116792261600494, 0.07031805068254471, 0.07951930910348892, 0.08872056007385254, 0.09792181849479675, 0.10712307691574097, 0.11632433533668518, 0.1255255937576294, 0.1347268521785736, 0.14392811059951782, 0.15312936902046204, 0.16233061254024506, 0.17153187096118927, 0.18073312938213348, 0.1899343878030777, 0.1991356462240219, 0.20833690464496613, 0.21753814816474915, 0.22673940658569336, 0.23594066500663757, 0.2451419234275818, 0.254343181848526, 0.2635444402694702, 0.27274569869041443, 0.28194695711135864, 0.29114821553230286, 0.30034947395324707, 0.3095507323741913, 0.3187519907951355, 0.3279532194137573, 0.33715447783470154, 0.34635573625564575, 0.35555699467658997, 0.3647582530975342, 0.3739595115184784, 0.3831607699394226, 0.39236199855804443, 0.40156328678131104]}, "eval/loss": 4.852334976196289, "eval/wer": 2.476675922253074, "eval/runtime": 935.2262, "eval/samples_per_second": 2.825, "eval/steps_per_second": 0.236, "train/train_runtime": 6750.5443, "train/train_samples_per_second": 4.228, "train/train_steps_per_second": 0.176, "train/total_flos": 0.0, "train/train_loss": 4.993681282832704} \ No newline at end of file