diff --git "a/wandb/run-20220322_163235-2yj5gh94/files/wandb-summary.json" "b/wandb/run-20220322_163235-2yj5gh94/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220322_163235-2yj5gh94/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 4.4678, "train/learning_rate": 0.0002982, "train/epoch": 1.12, "train/global_step": 500, "_runtime": 6103, "_timestamp": 1647972858, "_step": 500, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 94.0, 708.0, 200.0, 16.0], "bins": [-178.4449920654297, -175.54197692871094, -172.63894653320312, -169.73593139648438, -166.83291625976562, -163.92990112304688, -161.02687072753906, -158.1238555908203, -155.22084045410156, -152.3178253173828, -149.414794921875, -146.51177978515625, -143.6087646484375, -140.70574951171875, -137.80271911621094, -134.8997039794922, -131.99667358398438, -129.09365844726562, -126.19063568115234, -123.28761291503906, -120.38459777832031, -117.48157501220703, -114.57855224609375, -111.675537109375, -108.77252197265625, -105.86949920654297, -102.96648406982422, -100.06346130371094, -97.16044616699219, -94.2574234008789, -91.35440063476562, -88.45138549804688, -85.54837036132812, -82.64534759521484, -79.7423324584961, -76.83930969238281, -73.93629455566406, -71.03327178955078, -68.1302490234375, -65.22723388671875, -62.324214935302734, -59.42119598388672, -56.5181770324707, -53.61515808105469, -50.712135314941406, -47.809120178222656, -44.906097412109375, -42.00307846069336, -39.100059509277344, -36.19704055786133, -33.29402160644531, -30.391000747680664, -27.48798179626465, -24.584962844848633, -21.681941986083984, -18.77892303466797, -15.875904083251953, -12.972885131835938, -10.069865226745605, -7.166845321655273, -4.263826370239258, -1.3608074188232422, 1.5422134399414062, 4.445232391357422, 7.348250865936279]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 6.0, 5.0, 6.0, 6.0, 6.0, 14.0, 12.0, 10.0, 17.0, 22.0, 17.0, 35.0, 24.0, 23.0, 30.0, 24.0, 35.0, 42.0, 33.0, 46.0, 40.0, 49.0, 40.0, 42.0, 37.0, 34.0, 35.0, 44.0, 29.0, 31.0, 27.0, 26.0, 20.0, 23.0, 26.0, 17.0, 11.0, 18.0, 14.0, 8.0, 7.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.406150817871094, -11.98697566986084, -11.567801475524902, -11.148626327514648, -10.729452133178711, -10.310276985168457, -9.891101837158203, -9.471927642822266, -9.052753448486328, -8.633578300476074, -8.214404106140137, -7.795228958129883, -7.376054763793945, -6.956879615783691, -6.537704944610596, -6.1185302734375, -5.699355125427246, -5.28018045425415, -4.861005783081055, -4.441830635070801, -4.022656440734863, -3.6034815311431885, -3.1843066215515137, -2.765131950378418, -2.3459572792053223, -1.9267826080322266, -1.5076078176498413, -1.088433027267456, -0.6692583560943604, -0.25008368492126465, 0.16909122467041016, 0.5882658958435059, 1.0074405670166016, 1.4266152381896973, 1.8457900285720825, 2.2649648189544678, 2.6841394901275635, 3.103314161300659, 3.522489070892334, 3.9416637420654297, 4.360838413238525, 4.780013084411621, 5.199187755584717, 5.6183624267578125, 6.037537574768066, 6.456711769104004, 6.875886917114258, 7.2950615882873535, 7.714236259460449, 8.133411407470703, 8.55258560180664, 8.971760749816895, 9.390934944152832, 9.810110092163086, 10.229284286499023, 10.648459434509277, 11.067634582519531, 11.486809730529785, 11.905983924865723, 12.325159072875977, 12.744333267211914, 13.163508415222168, 13.582683563232422, 14.00185775756836, 14.421031951904297]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 3.0, 7.0, 14.0, 11.0, 24.0, 27.0, 33.0, 42.0, 73.0, 154.0, 286.0, 693.0, 1799.0, 6621.0, 32918.0, 190326.0, 930982.0, 2119213.0, 728323.0, 148403.0, 26366.0, 5318.0, 1451.0, 582.0, 256.0, 122.0, 74.0, 48.0, 28.0, 19.0, 16.0, 13.0, 12.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.9375, -21.281005859375, -20.62451171875, -19.968017578125, -19.3115234375, -18.655029296875, -17.99853515625, -17.342041015625, -16.685546875, -16.029052734375, -15.37255859375, -14.716064453125, -14.0595703125, -13.403076171875, -12.74658203125, -12.090087890625, -11.43359375, -10.777099609375, -10.12060546875, -9.464111328125, -8.8076171875, -8.151123046875, -7.49462890625, -6.838134765625, -6.181640625, -5.525146484375, -4.86865234375, -4.212158203125, -3.5556640625, -2.899169921875, -2.24267578125, -1.586181640625, -0.9296875, -0.273193359375, 0.38330078125, 1.039794921875, 1.6962890625, 2.352783203125, 3.00927734375, 3.665771484375, 4.322265625, 4.978759765625, 5.63525390625, 6.291748046875, 6.9482421875, 7.604736328125, 8.26123046875, 8.917724609375, 9.57421875, 10.230712890625, 10.88720703125, 11.543701171875, 12.2001953125, 12.856689453125, 13.51318359375, 14.169677734375, 14.826171875, 15.482666015625, 16.13916015625, 16.795654296875, 17.4521484375, 18.108642578125, 18.76513671875, 19.421630859375, 20.078125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 3.0, 8.0, 8.0, 9.0, 21.0, 14.0, 20.0, 21.0, 22.0, 33.0, 27.0, 23.0, 22.0, 33.0, 39.0, 45.0, 47.0, 42.0, 35.0, 49.0, 33.0, 49.0, 51.0, 40.0, 38.0, 30.0, 31.0, 21.0, 24.0, 20.0, 21.0, 23.0, 24.0, 10.0, 15.0, 10.0, 6.0, 10.0, 2.0, 2.0, 2.0, 1.0, 7.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.703125, -15.1982421875, -14.693359375, -14.1884765625, -13.68359375, -13.1787109375, -12.673828125, -12.1689453125, -11.6640625, -11.1591796875, -10.654296875, -10.1494140625, -9.64453125, -9.1396484375, -8.634765625, -8.1298828125, -7.625, -7.1201171875, -6.615234375, -6.1103515625, -5.60546875, -5.1005859375, -4.595703125, -4.0908203125, -3.5859375, -3.0810546875, -2.576171875, -2.0712890625, -1.56640625, -1.0615234375, -0.556640625, -0.0517578125, 0.453125, 0.9580078125, 1.462890625, 1.9677734375, 2.47265625, 2.9775390625, 3.482421875, 3.9873046875, 4.4921875, 4.9970703125, 5.501953125, 6.0068359375, 6.51171875, 7.0166015625, 7.521484375, 8.0263671875, 8.53125, 9.0361328125, 9.541015625, 10.0458984375, 10.55078125, 11.0556640625, 11.560546875, 12.0654296875, 12.5703125, 13.0751953125, 13.580078125, 14.0849609375, 14.58984375, 15.0947265625, 15.599609375, 16.1044921875, 16.609375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 8.0, 15.0, 28.0, 34.0, 86.0, 183.0, 561.0, 4167565.0, 25098.0, 395.0, 139.0, 83.0, 28.0, 24.0, 10.0, 4.0, 8.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-464.0, -447.375, -430.75, -414.125, -397.5, -380.875, -364.25, -347.625, -331.0, -314.375, -297.75, -281.125, -264.5, -247.875, -231.25, -214.625, -198.0, -181.375, -164.75, -148.125, -131.5, -114.875, -98.25, -81.625, -65.0, -48.375, -31.75, -15.125, 1.5, 18.125, 34.75, 51.375, 68.0, 84.625, 101.25, 117.875, 134.5, 151.125, 167.75, 184.375, 201.0, 217.625, 234.25, 250.875, 267.5, 284.125, 300.75, 317.375, 334.0, 350.625, 367.25, 383.875, 400.5, 417.125, 433.75, 450.375, 467.0, 483.625, 500.25, 516.875, 533.5, 550.125, 566.75, 583.375, 600.0]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 1.0, 8.0, 23.0, 26.0, 46.0, 103.0, 236.0, 635.0, 1505.0, 892.0, 304.0, 140.0, 67.0, 31.0, 19.0, 14.0, 6.0, 7.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3125, -11.8515625, -11.390625, -10.9296875, -10.46875, -10.0078125, -9.546875, -9.0859375, -8.625, -8.1640625, -7.703125, -7.2421875, -6.78125, -6.3203125, -5.859375, -5.3984375, -4.9375, -4.4765625, -4.015625, -3.5546875, -3.09375, -2.6328125, -2.171875, -1.7109375, -1.25, -0.7890625, -0.328125, 0.1328125, 0.59375, 1.0546875, 1.515625, 1.9765625, 2.4375, 2.8984375, 3.359375, 3.8203125, 4.28125, 4.7421875, 5.203125, 5.6640625, 6.125, 6.5859375, 7.046875, 7.5078125, 7.96875, 8.4296875, 8.890625, 9.3515625, 9.8125, 10.2734375, 10.734375, 11.1953125, 11.65625, 12.1171875, 12.578125, 13.0390625, 13.5, 13.9609375, 14.421875, 14.8828125, 15.34375, 15.8046875, 16.265625, 16.7265625, 17.1875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 12.0, 62.0, 231.0, 413.0, 216.0, 57.0, 20.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.77368927001953, -116.27946472167969, -112.78524017333984, -109.291015625, -105.79679107666016, -102.30256652832031, -98.808349609375, -95.31412506103516, -91.81990051269531, -88.32567596435547, -84.83145141601562, -81.33722686767578, -77.84300231933594, -74.34878540039062, -70.85455322265625, -67.36033630371094, -63.86610794067383, -60.371883392333984, -56.87765884399414, -53.38343811035156, -49.88921356201172, -46.394989013671875, -42.90076446533203, -39.40653991699219, -35.912315368652344, -32.4180908203125, -28.92386817932129, -25.429643630981445, -21.935420989990234, -18.44119644165039, -14.946971893310547, -11.452749252319336, -7.958526611328125, -4.464303016662598, -0.9700789451599121, 2.5241451263427734, 6.018368721008301, 9.512592315673828, 13.006816864013672, 16.501039505004883, 19.995264053344727, 23.48948860168457, 26.98371124267578, 30.477935791015625, 33.97216033935547, 37.46638488769531, 40.960609436035156, 44.454830169677734, 47.94905471801758, 51.44327926635742, 54.937503814697266, 58.431724548339844, 61.92594909667969, 65.42017364501953, 68.91439819335938, 72.40862274169922, 75.90284729003906, 79.3970718383789, 82.89129638671875, 86.3855209350586, 89.87974548339844, 93.37396240234375, 96.86819458007812, 100.36241149902344, 103.85663604736328]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 7.0, 6.0, 18.0, 13.0, 17.0, 24.0, 29.0, 37.0, 42.0, 44.0, 49.0, 53.0, 51.0, 64.0, 59.0, 53.0, 70.0, 46.0, 43.0, 59.0, 37.0, 34.0, 34.0, 22.0, 24.0, 21.0, 11.0, 9.0, 9.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0], "bins": [-28.967430114746094, -28.299497604370117, -27.631563186645508, -26.96363067626953, -26.295696258544922, -25.627763748168945, -24.95983123779297, -24.29189682006836, -23.62396240234375, -22.956029891967773, -22.288095474243164, -21.620162963867188, -20.952228546142578, -20.2842960357666, -19.616363525390625, -18.948429107666016, -18.28049659729004, -17.612564086914062, -16.944629669189453, -16.276697158813477, -15.608762741088867, -14.94083023071289, -14.272896766662598, -13.604963302612305, -12.937029838562012, -12.269096374511719, -11.601162910461426, -10.933229446411133, -10.265296936035156, -9.597362518310547, -8.92943000793457, -8.261496543884277, -7.593563079833984, -6.925629615783691, -6.257696151733398, -5.589763164520264, -4.921829700469971, -4.253896236419678, -3.585963249206543, -2.91802978515625, -2.250096321105957, -1.5821629762649536, -0.9142296314239502, -0.24629640579223633, 0.42163705825805664, 1.0895705223083496, 1.7575035095214844, 2.4254369735717773, 3.0933704376220703, 3.7613039016723633, 4.429237365722656, 5.097170352935791, 5.765103816986084, 6.433037281036377, 7.100970268249512, 7.768903732299805, 8.436837196350098, 9.10477066040039, 9.772704124450684, 10.440637588500977, 11.108570098876953, 11.776504516601562, 12.444437026977539, 13.112370491027832, 13.780303955078125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 9.0, 18.0, 21.0, 32.0, 55.0, 90.0, 142.0, 258.0, 550.0, 1125.0, 3085.0, 8553.0, 28911.0, 100630.0, 288343.0, 371338.0, 171757.0, 50806.0, 14696.0, 4676.0, 1850.0, 763.0, 370.0, 200.0, 106.0, 64.0, 37.0, 30.0, 13.0, 12.0, 5.0, 5.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.16015625, -4.98944091796875, -4.8187255859375, -4.64801025390625, -4.477294921875, -4.30657958984375, -4.1358642578125, -3.96514892578125, -3.79443359375, -3.62371826171875, -3.4530029296875, -3.28228759765625, -3.111572265625, -2.94085693359375, -2.7701416015625, -2.59942626953125, -2.4287109375, -2.25799560546875, -2.0872802734375, -1.91656494140625, -1.745849609375, -1.57513427734375, -1.4044189453125, -1.23370361328125, -1.06298828125, -0.89227294921875, -0.7215576171875, -0.55084228515625, -0.380126953125, -0.20941162109375, -0.0386962890625, 0.13201904296875, 0.302734375, 0.47344970703125, 0.6441650390625, 0.81488037109375, 0.985595703125, 1.15631103515625, 1.3270263671875, 1.49774169921875, 1.66845703125, 1.83917236328125, 2.0098876953125, 2.18060302734375, 2.351318359375, 2.52203369140625, 2.6927490234375, 2.86346435546875, 3.0341796875, 3.20489501953125, 3.3756103515625, 3.54632568359375, 3.717041015625, 3.88775634765625, 4.0584716796875, 4.22918701171875, 4.39990234375, 4.57061767578125, 4.7413330078125, 4.91204833984375, 5.082763671875, 5.25347900390625, 5.4241943359375, 5.59490966796875, 5.765625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 10.0, 14.0, 15.0, 23.0, 25.0, 33.0, 34.0, 40.0, 60.0, 66.0, 57.0, 72.0, 70.0, 59.0, 74.0, 69.0, 48.0, 61.0, 39.0, 31.0, 24.0, 14.0, 20.0, 11.0, 6.0, 5.0, 9.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-26.265625, -25.6181640625, -24.970703125, -24.3232421875, -23.67578125, -23.0283203125, -22.380859375, -21.7333984375, -21.0859375, -20.4384765625, -19.791015625, -19.1435546875, -18.49609375, -17.8486328125, -17.201171875, -16.5537109375, -15.90625, -15.2587890625, -14.611328125, -13.9638671875, -13.31640625, -12.6689453125, -12.021484375, -11.3740234375, -10.7265625, -10.0791015625, -9.431640625, -8.7841796875, -8.13671875, -7.4892578125, -6.841796875, -6.1943359375, -5.546875, -4.8994140625, -4.251953125, -3.6044921875, -2.95703125, -2.3095703125, -1.662109375, -1.0146484375, -0.3671875, 0.2802734375, 0.927734375, 1.5751953125, 2.22265625, 2.8701171875, 3.517578125, 4.1650390625, 4.8125, 5.4599609375, 6.107421875, 6.7548828125, 7.40234375, 8.0498046875, 8.697265625, 9.3447265625, 9.9921875, 10.6396484375, 11.287109375, 11.9345703125, 12.58203125, 13.2294921875, 13.876953125, 14.5244140625, 15.171875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 10.0, 20.0, 21.0, 30.0, 63.0, 109.0, 153.0, 260.0, 402.0, 672.0, 1189.0, 2335.0, 4663.0, 9570.0, 20165.0, 42235.0, 86610.0, 161797.0, 233970.0, 214363.0, 133742.0, 69079.0, 34237.0, 16287.0, 8002.0, 3968.0, 2038.0, 1098.0, 631.0, 305.0, 217.0, 121.0, 77.0, 39.0, 20.0, 13.0, 18.0, 4.0, 4.0, 8.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.185546875, -2.11468505859375, -2.0438232421875, -1.97296142578125, -1.902099609375, -1.83123779296875, -1.7603759765625, -1.68951416015625, -1.61865234375, -1.54779052734375, -1.4769287109375, -1.40606689453125, -1.335205078125, -1.26434326171875, -1.1934814453125, -1.12261962890625, -1.0517578125, -0.98089599609375, -0.9100341796875, -0.83917236328125, -0.768310546875, -0.69744873046875, -0.6265869140625, -0.55572509765625, -0.48486328125, -0.41400146484375, -0.3431396484375, -0.27227783203125, -0.201416015625, -0.13055419921875, -0.0596923828125, 0.01116943359375, 0.08203125, 0.15289306640625, 0.2237548828125, 0.29461669921875, 0.365478515625, 0.43634033203125, 0.5072021484375, 0.57806396484375, 0.64892578125, 0.71978759765625, 0.7906494140625, 0.86151123046875, 0.932373046875, 1.00323486328125, 1.0740966796875, 1.14495849609375, 1.2158203125, 1.28668212890625, 1.3575439453125, 1.42840576171875, 1.499267578125, 1.57012939453125, 1.6409912109375, 1.71185302734375, 1.78271484375, 1.85357666015625, 1.9244384765625, 1.99530029296875, 2.066162109375, 2.13702392578125, 2.2078857421875, 2.27874755859375, 2.349609375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 9.0, 10.0, 12.0, 10.0, 16.0, 7.0, 19.0, 26.0, 28.0, 37.0, 32.0, 33.0, 50.0, 37.0, 41.0, 42.0, 50.0, 43.0, 57.0, 38.0, 45.0, 43.0, 22.0, 32.0, 29.0, 26.0, 34.0, 24.0, 21.0, 17.0, 14.0, 16.0, 15.0, 12.0, 10.0, 5.0, 7.0, 4.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-28.828125, -27.968994140625, -27.10986328125, -26.250732421875, -25.3916015625, -24.532470703125, -23.67333984375, -22.814208984375, -21.955078125, -21.095947265625, -20.23681640625, -19.377685546875, -18.5185546875, -17.659423828125, -16.80029296875, -15.941162109375, -15.08203125, -14.222900390625, -13.36376953125, -12.504638671875, -11.6455078125, -10.786376953125, -9.92724609375, -9.068115234375, -8.208984375, -7.349853515625, -6.49072265625, -5.631591796875, -4.7724609375, -3.913330078125, -3.05419921875, -2.195068359375, -1.3359375, -0.476806640625, 0.38232421875, 1.241455078125, 2.1005859375, 2.959716796875, 3.81884765625, 4.677978515625, 5.537109375, 6.396240234375, 7.25537109375, 8.114501953125, 8.9736328125, 9.832763671875, 10.69189453125, 11.551025390625, 12.41015625, 13.269287109375, 14.12841796875, 14.987548828125, 15.8466796875, 16.705810546875, 17.56494140625, 18.424072265625, 19.283203125, 20.142333984375, 21.00146484375, 21.860595703125, 22.7197265625, 23.578857421875, 24.43798828125, 25.297119140625, 26.15625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 13.0, 10.0, 21.0, 18.0, 37.0, 29.0, 43.0, 54.0, 78.0, 131.0, 223.0, 316.0, 593.0, 1119.0, 2080.0, 4255.0, 10036.0, 30041.0, 148404.0, 568529.0, 219671.0, 40178.0, 12266.0, 4911.0, 2398.0, 1270.0, 718.0, 417.0, 233.0, 140.0, 117.0, 61.0, 37.0, 29.0, 23.0, 9.0, 20.0, 10.0, 4.0, 3.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.54638671875, -0.5279312133789062, -0.5094757080078125, -0.49102020263671875, -0.472564697265625, -0.45410919189453125, -0.4356536865234375, -0.41719818115234375, -0.39874267578125, -0.38028717041015625, -0.3618316650390625, -0.34337615966796875, -0.324920654296875, -0.30646514892578125, -0.2880096435546875, -0.26955413818359375, -0.2510986328125, -0.23264312744140625, -0.2141876220703125, -0.19573211669921875, -0.177276611328125, -0.15882110595703125, -0.1403656005859375, -0.12191009521484375, -0.10345458984375, -0.08499908447265625, -0.0665435791015625, -0.04808807373046875, -0.029632568359375, -0.01117706298828125, 0.0072784423828125, 0.02573394775390625, 0.044189453125, 0.06264495849609375, 0.0811004638671875, 0.09955596923828125, 0.118011474609375, 0.13646697998046875, 0.1549224853515625, 0.17337799072265625, 0.19183349609375, 0.21028900146484375, 0.2287445068359375, 0.24720001220703125, 0.265655517578125, 0.28411102294921875, 0.3025665283203125, 0.32102203369140625, 0.3394775390625, 0.35793304443359375, 0.3763885498046875, 0.39484405517578125, 0.413299560546875, 0.43175506591796875, 0.4502105712890625, 0.46866607666015625, 0.48712158203125, 0.5055770874023438, 0.5240325927734375, 0.5424880981445312, 0.560943603515625, 0.5793991088867188, 0.5978546142578125, 0.6163101196289062, 0.634765625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 11.0, 11.0, 15.0, 30.0, 42.0, 79.0, 113.0, 127.0, 158.0, 146.0, 89.0, 53.0, 38.0, 20.0, 24.0, 8.0, 5.0, 5.0, 1.0, 3.0, 2.0, 4.0, 1.0, 0.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005621910095214844, -0.0005442425608634949, -0.0005262941122055054, -0.0005083456635475159, -0.0004903972148895264, -0.00047244876623153687, -0.00045450031757354736, -0.00043655186891555786, -0.00041860342025756836, -0.00040065497159957886, -0.00038270652294158936, -0.00036475807428359985, -0.00034680962562561035, -0.00032886117696762085, -0.00031091272830963135, -0.00029296427965164185, -0.00027501583099365234, -0.00025706738233566284, -0.00023911893367767334, -0.00022117048501968384, -0.00020322203636169434, -0.00018527358770370483, -0.00016732513904571533, -0.00014937669038772583, -0.00013142824172973633, -0.00011347979307174683, -9.553134441375732e-05, -7.758289575576782e-05, -5.963444709777832e-05, -4.168599843978882e-05, -2.3737549781799316e-05, -5.7891011238098145e-06, 1.2159347534179688e-05, 3.010779619216919e-05, 4.805624485015869e-05, 6.60046935081482e-05, 8.39531421661377e-05, 0.0001019015908241272, 0.0001198500394821167, 0.0001377984881401062, 0.0001557469367980957, 0.0001736953854560852, 0.0001916438341140747, 0.0002095922827720642, 0.0002275407314300537, 0.0002454891800880432, 0.0002634376287460327, 0.0002813860774040222, 0.0002993345260620117, 0.0003172829747200012, 0.0003352314233779907, 0.0003531798720359802, 0.0003711283206939697, 0.00038907676935195923, 0.00040702521800994873, 0.00042497366666793823, 0.00044292211532592773, 0.00046087056398391724, 0.00047881901264190674, 0.0004967674612998962, 0.0005147159099578857, 0.0005326643586158752, 0.0005506128072738647, 0.0005685612559318542, 0.0005865097045898438]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 2.0, 3.0, 3.0, 9.0, 22.0, 25.0, 41.0, 91.0, 268.0, 1721.0, 118767.0, 922671.0, 4289.0, 397.0, 90.0, 55.0, 27.0, 15.0, 10.0, 9.0, 8.0, 5.0, 7.0, 6.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.275390625, -3.1822509765625, -3.089111328125, -2.9959716796875, -2.90283203125, -2.8096923828125, -2.716552734375, -2.6234130859375, -2.5302734375, -2.4371337890625, -2.343994140625, -2.2508544921875, -2.15771484375, -2.0645751953125, -1.971435546875, -1.8782958984375, -1.78515625, -1.6920166015625, -1.598876953125, -1.5057373046875, -1.41259765625, -1.3194580078125, -1.226318359375, -1.1331787109375, -1.0400390625, -0.9468994140625, -0.853759765625, -0.7606201171875, -0.66748046875, -0.5743408203125, -0.481201171875, -0.3880615234375, -0.294921875, -0.2017822265625, -0.108642578125, -0.0155029296875, 0.07763671875, 0.1707763671875, 0.263916015625, 0.3570556640625, 0.4501953125, 0.5433349609375, 0.636474609375, 0.7296142578125, 0.82275390625, 0.9158935546875, 1.009033203125, 1.1021728515625, 1.1953125, 1.2884521484375, 1.381591796875, 1.4747314453125, 1.56787109375, 1.6610107421875, 1.754150390625, 1.8472900390625, 1.9404296875, 2.0335693359375, 2.126708984375, 2.2198486328125, 2.31298828125, 2.4061279296875, 2.499267578125, 2.5924072265625, 2.685546875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 8.0, 11.0, 14.0, 22.0, 44.0, 60.0, 109.0, 150.0, 148.0, 149.0, 103.0, 66.0, 36.0, 24.0, 13.0, 5.0, 7.0, 3.0, 6.0, 4.0, 1.0, 8.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.290283203125, -0.28185272216796875, -0.2734222412109375, -0.26499176025390625, -0.256561279296875, -0.24813079833984375, -0.2397003173828125, -0.23126983642578125, -0.22283935546875, -0.21440887451171875, -0.2059783935546875, -0.19754791259765625, -0.189117431640625, -0.18068695068359375, -0.1722564697265625, -0.16382598876953125, -0.1553955078125, -0.14696502685546875, -0.1385345458984375, -0.13010406494140625, -0.121673583984375, -0.11324310302734375, -0.1048126220703125, -0.09638214111328125, -0.08795166015625, -0.07952117919921875, -0.0710906982421875, -0.06266021728515625, -0.054229736328125, -0.04579925537109375, -0.0373687744140625, -0.02893829345703125, -0.0205078125, -0.01207733154296875, -0.0036468505859375, 0.00478363037109375, 0.013214111328125, 0.02164459228515625, 0.0300750732421875, 0.03850555419921875, 0.04693603515625, 0.05536651611328125, 0.0637969970703125, 0.07222747802734375, 0.080657958984375, 0.08908843994140625, 0.0975189208984375, 0.10594940185546875, 0.1143798828125, 0.12281036376953125, 0.1312408447265625, 0.13967132568359375, 0.148101806640625, 0.15653228759765625, 0.1649627685546875, 0.17339324951171875, 0.18182373046875, 0.19025421142578125, 0.1986846923828125, 0.20711517333984375, 0.215545654296875, 0.22397613525390625, 0.2324066162109375, 0.24083709716796875, 0.249267578125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 93.0, 735.0, 175.0, 11.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-296.7721252441406, -291.2267761230469, -285.6814270019531, -280.1360778808594, -274.5906982421875, -269.04534912109375, -263.5, -257.95465087890625, -252.4093017578125, -246.86395263671875, -241.318603515625, -235.7732391357422, -230.22789001464844, -224.6825408935547, -219.13717651367188, -213.59182739257812, -208.04647827148438, -202.50112915039062, -196.95578002929688, -191.41041564941406, -185.8650665283203, -180.31971740722656, -174.77435302734375, -169.22900390625, -163.68365478515625, -158.1383056640625, -152.59295654296875, -147.04759216308594, -141.5022430419922, -135.95689392089844, -130.41152954101562, -124.86618041992188, -119.32081604003906, -113.77546691894531, -108.23011016845703, -102.68475341796875, -97.139404296875, -91.59405517578125, -86.04869842529297, -80.50334167480469, -74.95799255371094, -69.41264343261719, -63.867286682128906, -58.32193374633789, -52.776580810546875, -47.23122787475586, -41.685874938964844, -36.14052200317383, -30.595169067382812, -25.049816131591797, -19.50446319580078, -13.959110260009766, -8.41375732421875, -2.8684043884277344, 2.6769485473632812, 8.222301483154297, 13.767654418945312, 19.313007354736328, 24.858360290527344, 30.40371322631836, 35.949066162109375, 41.49441909790039, 47.039772033691406, 52.58512496948242, 58.13047790527344]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 3.0, 5.0, 12.0, 9.0, 21.0, 17.0, 26.0, 37.0, 45.0, 52.0, 57.0, 71.0, 58.0, 73.0, 68.0, 72.0, 60.0, 57.0, 64.0, 39.0, 36.0, 31.0, 30.0, 16.0, 14.0, 9.0, 3.0, 7.0, 4.0, 1.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0], "bins": [-26.025175094604492, -25.408254623413086, -24.79133415222168, -24.17441177368164, -23.557491302490234, -22.940570831298828, -22.323650360107422, -21.706729888916016, -21.089807510375977, -20.47288703918457, -19.855966567993164, -19.239044189453125, -18.62212371826172, -18.005203247070312, -17.388282775878906, -16.7713623046875, -16.154441833496094, -15.537521362304688, -14.920599937438965, -14.303679466247559, -13.686758041381836, -13.06983757019043, -12.452917098999023, -11.8359956741333, -11.219074249267578, -10.602153778076172, -9.98523235321045, -9.368311882019043, -8.75139045715332, -8.134469985961914, -7.51754903793335, -6.900628089904785, -6.283707618713379, -5.6667866706848145, -5.04986572265625, -4.432945251464844, -3.8160240650177, -3.1991031169891357, -2.5821824073791504, -1.965261459350586, -1.3483405113220215, -0.7314196228981018, -0.11449873447418213, 0.5024220943450928, 1.1193430423736572, 1.7362639904022217, 2.353184700012207, 2.9701056480407715, 3.587026596069336, 4.2039475440979, 4.820868492126465, 5.437788963317871, 6.054710388183594, 6.671630859375, 7.2885518074035645, 7.905472755432129, 8.522394180297852, 9.139314651489258, 9.75623607635498, 10.373156547546387, 10.99007797241211, 11.606998443603516, 12.223918914794922, 12.840840339660645, 13.45776081085205]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 9.0, 4.0, 22.0, 30.0, 31.0, 77.0, 152.0, 244.0, 431.0, 850.0, 1836.0, 4126.0, 9674.0, 24539.0, 63852.0, 175500.0, 399304.0, 231861.0, 82813.0, 31138.0, 12443.0, 5165.0, 2227.0, 1077.0, 483.0, 267.0, 135.0, 110.0, 67.0, 29.0, 21.0, 8.0, 12.0, 5.0, 8.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.853515625, -3.731689453125, -3.60986328125, -3.488037109375, -3.3662109375, -3.244384765625, -3.12255859375, -3.000732421875, -2.87890625, -2.757080078125, -2.63525390625, -2.513427734375, -2.3916015625, -2.269775390625, -2.14794921875, -2.026123046875, -1.904296875, -1.782470703125, -1.66064453125, -1.538818359375, -1.4169921875, -1.295166015625, -1.17333984375, -1.051513671875, -0.9296875, -0.807861328125, -0.68603515625, -0.564208984375, -0.4423828125, -0.320556640625, -0.19873046875, -0.076904296875, 0.044921875, 0.166748046875, 0.28857421875, 0.410400390625, 0.5322265625, 0.654052734375, 0.77587890625, 0.897705078125, 1.01953125, 1.141357421875, 1.26318359375, 1.385009765625, 1.5068359375, 1.628662109375, 1.75048828125, 1.872314453125, 1.994140625, 2.115966796875, 2.23779296875, 2.359619140625, 2.4814453125, 2.603271484375, 2.72509765625, 2.846923828125, 2.96875, 3.090576171875, 3.21240234375, 3.334228515625, 3.4560546875, 3.577880859375, 3.69970703125, 3.821533203125, 3.943359375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 13.0, 8.0, 11.0, 12.0, 15.0, 24.0, 23.0, 35.0, 44.0, 38.0, 46.0, 48.0, 45.0, 68.0, 68.0, 47.0, 45.0, 43.0, 50.0, 38.0, 37.0, 37.0, 34.0, 38.0, 22.0, 19.0, 15.0, 16.0, 13.0, 7.0, 5.0, 8.0, 2.0, 11.0, 6.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-33.71875, -32.762939453125, -31.80712890625, -30.851318359375, -29.8955078125, -28.939697265625, -27.98388671875, -27.028076171875, -26.072265625, -25.116455078125, -24.16064453125, -23.204833984375, -22.2490234375, -21.293212890625, -20.33740234375, -19.381591796875, -18.42578125, -17.469970703125, -16.51416015625, -15.558349609375, -14.6025390625, -13.646728515625, -12.69091796875, -11.735107421875, -10.779296875, -9.823486328125, -8.86767578125, -7.911865234375, -6.9560546875, -6.000244140625, -5.04443359375, -4.088623046875, -3.1328125, -2.177001953125, -1.22119140625, -0.265380859375, 0.6904296875, 1.646240234375, 2.60205078125, 3.557861328125, 4.513671875, 5.469482421875, 6.42529296875, 7.381103515625, 8.3369140625, 9.292724609375, 10.24853515625, 11.204345703125, 12.16015625, 13.115966796875, 14.07177734375, 15.027587890625, 15.9833984375, 16.939208984375, 17.89501953125, 18.850830078125, 19.806640625, 20.762451171875, 21.71826171875, 22.674072265625, 23.6298828125, 24.585693359375, 25.54150390625, 26.497314453125, 27.453125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 5.0, 2.0, 3.0, 3.0, 5.0, 5.0, 13.0, 4.0, 9.0, 10.0, 7.0, 16.0, 22.0, 24.0, 35.0, 24.0, 42.0, 43.0, 54.0, 59.0, 88.0, 115.0, 188.0, 317.0, 734.0, 2861.0, 48842.0, 933607.0, 56249.0, 3215.0, 804.0, 319.0, 167.0, 136.0, 98.0, 86.0, 63.0, 54.0, 49.0, 37.0, 30.0, 29.0, 18.0, 8.0, 13.0, 16.0, 5.0, 13.0, 9.0, 1.0, 1.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.25, -13.7830810546875, -13.316162109375, -12.8492431640625, -12.38232421875, -11.9154052734375, -11.448486328125, -10.9815673828125, -10.5146484375, -10.0477294921875, -9.580810546875, -9.1138916015625, -8.64697265625, -8.1800537109375, -7.713134765625, -7.2462158203125, -6.779296875, -6.3123779296875, -5.845458984375, -5.3785400390625, -4.91162109375, -4.4447021484375, -3.977783203125, -3.5108642578125, -3.0439453125, -2.5770263671875, -2.110107421875, -1.6431884765625, -1.17626953125, -0.7093505859375, -0.242431640625, 0.2244873046875, 0.69140625, 1.1583251953125, 1.625244140625, 2.0921630859375, 2.55908203125, 3.0260009765625, 3.492919921875, 3.9598388671875, 4.4267578125, 4.8936767578125, 5.360595703125, 5.8275146484375, 6.29443359375, 6.7613525390625, 7.228271484375, 7.6951904296875, 8.162109375, 8.6290283203125, 9.095947265625, 9.5628662109375, 10.02978515625, 10.4967041015625, 10.963623046875, 11.4305419921875, 11.8974609375, 12.3643798828125, 12.831298828125, 13.2982177734375, 13.76513671875, 14.2320556640625, 14.698974609375, 15.1658935546875, 15.6328125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 4.0, 3.0, 4.0, 1.0, 4.0, 5.0, 6.0, 15.0, 11.0, 16.0, 17.0, 20.0, 23.0, 19.0, 27.0, 37.0, 41.0, 40.0, 30.0, 47.0, 36.0, 54.0, 57.0, 38.0, 41.0, 36.0, 39.0, 39.0, 33.0, 44.0, 33.0, 28.0, 35.0, 23.0, 20.0, 13.0, 9.0, 13.0, 7.0, 7.0, 10.0, 8.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.390625, -24.5595703125, -23.728515625, -22.8974609375, -22.06640625, -21.2353515625, -20.404296875, -19.5732421875, -18.7421875, -17.9111328125, -17.080078125, -16.2490234375, -15.41796875, -14.5869140625, -13.755859375, -12.9248046875, -12.09375, -11.2626953125, -10.431640625, -9.6005859375, -8.76953125, -7.9384765625, -7.107421875, -6.2763671875, -5.4453125, -4.6142578125, -3.783203125, -2.9521484375, -2.12109375, -1.2900390625, -0.458984375, 0.3720703125, 1.203125, 2.0341796875, 2.865234375, 3.6962890625, 4.52734375, 5.3583984375, 6.189453125, 7.0205078125, 7.8515625, 8.6826171875, 9.513671875, 10.3447265625, 11.17578125, 12.0068359375, 12.837890625, 13.6689453125, 14.5, 15.3310546875, 16.162109375, 16.9931640625, 17.82421875, 18.6552734375, 19.486328125, 20.3173828125, 21.1484375, 21.9794921875, 22.810546875, 23.6416015625, 24.47265625, 25.3037109375, 26.134765625, 26.9658203125, 27.796875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 14.0, 16.0, 31.0, 40.0, 68.0, 148.0, 390.0, 1027.0, 4050.0, 35118.0, 916693.0, 82434.0, 6192.0, 1437.0, 455.0, 213.0, 85.0, 51.0, 25.0, 17.0, 9.0, 14.0, 7.0, 2.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-4.390625, -4.242431640625, -4.09423828125, -3.946044921875, -3.7978515625, -3.649658203125, -3.50146484375, -3.353271484375, -3.205078125, -3.056884765625, -2.90869140625, -2.760498046875, -2.6123046875, -2.464111328125, -2.31591796875, -2.167724609375, -2.01953125, -1.871337890625, -1.72314453125, -1.574951171875, -1.4267578125, -1.278564453125, -1.13037109375, -0.982177734375, -0.833984375, -0.685791015625, -0.53759765625, -0.389404296875, -0.2412109375, -0.093017578125, 0.05517578125, 0.203369140625, 0.3515625, 0.499755859375, 0.64794921875, 0.796142578125, 0.9443359375, 1.092529296875, 1.24072265625, 1.388916015625, 1.537109375, 1.685302734375, 1.83349609375, 1.981689453125, 2.1298828125, 2.278076171875, 2.42626953125, 2.574462890625, 2.72265625, 2.870849609375, 3.01904296875, 3.167236328125, 3.3154296875, 3.463623046875, 3.61181640625, 3.760009765625, 3.908203125, 4.056396484375, 4.20458984375, 4.352783203125, 4.5009765625, 4.649169921875, 4.79736328125, 4.945556640625, 5.09375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 9.0, 21.0, 36.0, 35.0, 76.0, 151.0, 326.0, 149.0, 85.0, 37.0, 26.0, 16.0, 9.0, 7.0, 6.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0009641647338867188, -0.0009434446692466736, -0.0009227246046066284, -0.0009020045399665833, -0.0008812844753265381, -0.0008605644106864929, -0.0008398443460464478, -0.0008191242814064026, -0.0007984042167663574, -0.0007776841521263123, -0.0007569640874862671, -0.0007362440228462219, -0.0007155239582061768, -0.0006948038935661316, -0.0006740838289260864, -0.0006533637642860413, -0.0006326436996459961, -0.0006119236350059509, -0.0005912035703659058, -0.0005704835057258606, -0.0005497634410858154, -0.0005290433764457703, -0.0005083233118057251, -0.00048760324716567993, -0.00046688318252563477, -0.0004461631178855896, -0.00042544305324554443, -0.00040472298860549927, -0.0003840029239654541, -0.00036328285932540894, -0.00034256279468536377, -0.0003218427300453186, -0.00030112266540527344, -0.00028040260076522827, -0.0002596825361251831, -0.00023896247148513794, -0.00021824240684509277, -0.0001975223422050476, -0.00017680227756500244, -0.00015608221292495728, -0.0001353621482849121, -0.00011464208364486694, -9.392201900482178e-05, -7.320195436477661e-05, -5.2481889724731445e-05, -3.176182508468628e-05, -1.1041760444641113e-05, 9.678304195404053e-06, 3.039836883544922e-05, 5.1118433475494385e-05, 7.183849811553955e-05, 9.255856275558472e-05, 0.00011327862739562988, 0.00013399869203567505, 0.00015471875667572021, 0.00017543882131576538, 0.00019615888595581055, 0.0002168789505958557, 0.00023759901523590088, 0.00025831907987594604, 0.0002790391445159912, 0.0002997592091560364, 0.00032047927379608154, 0.0003411993384361267, 0.0003619194030761719]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 4.0, 4.0, 7.0, 7.0, 6.0, 10.0, 22.0, 37.0, 46.0, 61.0, 114.0, 223.0, 537.0, 2028.0, 12839.0, 336343.0, 674713.0, 17875.0, 2422.0, 642.0, 263.0, 146.0, 51.0, 41.0, 31.0, 24.0, 14.0, 12.0, 9.0, 9.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.0078125, -3.86993408203125, -3.7320556640625, -3.59417724609375, -3.456298828125, -3.31842041015625, -3.1805419921875, -3.04266357421875, -2.90478515625, -2.76690673828125, -2.6290283203125, -2.49114990234375, -2.353271484375, -2.21539306640625, -2.0775146484375, -1.93963623046875, -1.8017578125, -1.66387939453125, -1.5260009765625, -1.38812255859375, -1.250244140625, -1.11236572265625, -0.9744873046875, -0.83660888671875, -0.69873046875, -0.56085205078125, -0.4229736328125, -0.28509521484375, -0.147216796875, -0.00933837890625, 0.1285400390625, 0.26641845703125, 0.404296875, 0.54217529296875, 0.6800537109375, 0.81793212890625, 0.955810546875, 1.09368896484375, 1.2315673828125, 1.36944580078125, 1.50732421875, 1.64520263671875, 1.7830810546875, 1.92095947265625, 2.058837890625, 2.19671630859375, 2.3345947265625, 2.47247314453125, 2.6103515625, 2.74822998046875, 2.8861083984375, 3.02398681640625, 3.161865234375, 3.29974365234375, 3.4376220703125, 3.57550048828125, 3.71337890625, 3.85125732421875, 3.9891357421875, 4.12701416015625, 4.264892578125, 4.40277099609375, 4.5406494140625, 4.67852783203125, 4.81640625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 7.0, 5.0, 1.0, 6.0, 10.0, 11.0, 11.0, 15.0, 13.0, 24.0, 27.0, 50.0, 62.0, 108.0, 166.0, 150.0, 80.0, 61.0, 48.0, 28.0, 23.0, 18.0, 13.0, 16.0, 12.0, 9.0, 6.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.72216796875, -0.6972274780273438, -0.6722869873046875, -0.6473464965820312, -0.622406005859375, -0.5974655151367188, -0.5725250244140625, -0.5475845336914062, -0.52264404296875, -0.49770355224609375, -0.4727630615234375, -0.44782257080078125, -0.422882080078125, -0.39794158935546875, -0.3730010986328125, -0.34806060791015625, -0.3231201171875, -0.29817962646484375, -0.2732391357421875, -0.24829864501953125, -0.223358154296875, -0.19841766357421875, -0.1734771728515625, -0.14853668212890625, -0.12359619140625, -0.09865570068359375, -0.0737152099609375, -0.04877471923828125, -0.023834228515625, 0.00110626220703125, 0.0260467529296875, 0.05098724365234375, 0.075927734375, 0.10086822509765625, 0.1258087158203125, 0.15074920654296875, 0.175689697265625, 0.20063018798828125, 0.2255706787109375, 0.25051116943359375, 0.27545166015625, 0.30039215087890625, 0.3253326416015625, 0.35027313232421875, 0.375213623046875, 0.40015411376953125, 0.4250946044921875, 0.45003509521484375, 0.4749755859375, 0.49991607666015625, 0.5248565673828125, 0.5497970581054688, 0.574737548828125, 0.5996780395507812, 0.6246185302734375, 0.6495590209960938, 0.67449951171875, 0.6994400024414062, 0.7243804931640625, 0.7493209838867188, 0.774261474609375, 0.7992019653320312, 0.8241424560546875, 0.8490829467773438, 0.8740234375]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 21.0, 531.0, 437.0, 25.0, 3.0], "bins": [-546.2600708007812, -537.2894287109375, -528.3187866210938, -519.34814453125, -510.3774719238281, -501.4068298339844, -492.4361572265625, -483.46551513671875, -474.494873046875, -465.52423095703125, -456.5535888671875, -447.5829162597656, -438.6122741699219, -429.6416320800781, -420.67095947265625, -411.7003173828125, -402.72967529296875, -393.759033203125, -384.78839111328125, -375.8177185058594, -366.8470764160156, -357.8764343261719, -348.90576171875, -339.93511962890625, -330.9644775390625, -321.99383544921875, -313.023193359375, -304.0525207519531, -295.0818786621094, -286.1112365722656, -277.14056396484375, -268.169921875, -259.19927978515625, -250.2286376953125, -241.2579803466797, -232.28732299804688, -223.31668090820312, -214.34603881835938, -205.37538146972656, -196.40472412109375, -187.43408203125, -178.46343994140625, -169.49278259277344, -160.52212524414062, -151.55148315429688, -142.58084106445312, -133.6101837158203, -124.63953399658203, -115.66888427734375, -106.69823455810547, -97.72758483886719, -88.7569351196289, -79.78628540039062, -70.81563568115234, -61.84498596191406, -52.87433624267578, -43.903682708740234, -34.93303298950195, -25.962383270263672, -16.99173355102539, -8.02108383178711, 0.9495658874511719, 9.920215606689453, 18.890865325927734, 27.861515045166016]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 10.0, 6.0, 10.0, 16.0, 15.0, 15.0, 25.0, 18.0, 32.0, 25.0, 34.0, 33.0, 41.0, 48.0, 44.0, 53.0, 44.0, 41.0, 45.0, 44.0, 40.0, 46.0, 48.0, 38.0, 27.0, 34.0, 25.0, 26.0, 20.0, 18.0, 12.0, 20.0, 8.0, 4.0, 7.0, 12.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.62749481201172, -43.26785659790039, -41.90821838378906, -40.548583984375, -39.18894577026367, -37.829307556152344, -36.469669342041016, -35.11003112792969, -33.750396728515625, -32.3907585144043, -31.0311222076416, -29.671483993530273, -28.311847686767578, -26.95220947265625, -25.592571258544922, -24.232934951782227, -22.8732967376709, -21.51365852355957, -20.154022216796875, -18.794384002685547, -17.43474769592285, -16.075109481811523, -14.715472221374512, -13.3558349609375, -11.996197700500488, -10.636560440063477, -9.276923179626465, -7.917285442352295, -6.557648181915283, -5.1980109214782715, -3.8383731842041016, -2.47873592376709, -1.1190986633300781, 0.24053871631622314, 1.6001760959625244, 2.9598135948181152, 4.319450855255127, 5.679088115692139, 7.038725852966309, 8.39836311340332, 9.758000373840332, 11.117637634277344, 12.477274894714355, 13.836912155151367, 15.196550369262695, 16.55618667602539, 17.91582489013672, 19.275463104248047, 20.635099411010742, 21.99473762512207, 23.354373931884766, 24.714012145996094, 26.07364845275879, 27.433286666870117, 28.792922973632812, 30.15256118774414, 31.51219940185547, 32.8718376159668, 34.231475830078125, 35.59111022949219, 36.950748443603516, 38.310386657714844, 39.67002487182617, 41.0296630859375, 42.38929748535156]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 10.0, 8.0, 14.0, 23.0, 47.0, 83.0, 195.0, 758.0, 8336.0, 532880.0, 3565196.0, 81474.0, 4057.0, 893.0, 163.0, 73.0, 35.0, 17.0, 9.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-77.875, -76.228759765625, -74.58251953125, -72.936279296875, -71.2900390625, -69.643798828125, -67.99755859375, -66.351318359375, -64.705078125, -63.058837890625, -61.41259765625, -59.766357421875, -58.1201171875, -56.473876953125, -54.82763671875, -53.181396484375, -51.53515625, -49.888916015625, -48.24267578125, -46.596435546875, -44.9501953125, -43.303955078125, -41.65771484375, -40.011474609375, -38.365234375, -36.718994140625, -35.07275390625, -33.426513671875, -31.7802734375, -30.134033203125, -28.48779296875, -26.841552734375, -25.1953125, -23.549072265625, -21.90283203125, -20.256591796875, -18.6103515625, -16.964111328125, -15.31787109375, -13.671630859375, -12.025390625, -10.379150390625, -8.73291015625, -7.086669921875, -5.4404296875, -3.794189453125, -2.14794921875, -0.501708984375, 1.14453125, 2.790771484375, 4.43701171875, 6.083251953125, 7.7294921875, 9.375732421875, 11.02197265625, 12.668212890625, 14.314453125, 15.960693359375, 17.60693359375, 19.253173828125, 20.8994140625, 22.545654296875, 24.19189453125, 25.838134765625, 27.484375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 7.0, 8.0, 9.0, 18.0, 24.0, 47.0, 44.0, 83.0, 86.0, 125.0, 107.0, 98.0, 88.0, 91.0, 52.0, 48.0, 32.0, 16.0, 6.0, 12.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-39.71875, -38.865478515625, -38.01220703125, -37.158935546875, -36.3056640625, -35.452392578125, -34.59912109375, -33.745849609375, -32.892578125, -32.039306640625, -31.18603515625, -30.332763671875, -29.4794921875, -28.626220703125, -27.77294921875, -26.919677734375, -26.06640625, -25.213134765625, -24.35986328125, -23.506591796875, -22.6533203125, -21.800048828125, -20.94677734375, -20.093505859375, -19.240234375, -18.386962890625, -17.53369140625, -16.680419921875, -15.8271484375, -14.973876953125, -14.12060546875, -13.267333984375, -12.4140625, -11.560791015625, -10.70751953125, -9.854248046875, -9.0009765625, -8.147705078125, -7.29443359375, -6.441162109375, -5.587890625, -4.734619140625, -3.88134765625, -3.028076171875, -2.1748046875, -1.321533203125, -0.46826171875, 0.385009765625, 1.23828125, 2.091552734375, 2.94482421875, 3.798095703125, 4.6513671875, 5.504638671875, 6.35791015625, 7.211181640625, 8.064453125, 8.917724609375, 9.77099609375, 10.624267578125, 11.4775390625, 12.330810546875, 13.18408203125, 14.037353515625, 14.890625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 3.0, 8.0, 5.0, 8.0, 14.0, 21.0, 33.0, 130.0, 403.0, 4089.0, 4138162.0, 50113.0, 947.0, 189.0, 66.0, 30.0, 20.0, 15.0, 7.0, 5.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-147.625, -143.9072265625, -140.189453125, -136.4716796875, -132.75390625, -129.0361328125, -125.318359375, -121.6005859375, -117.8828125, -114.1650390625, -110.447265625, -106.7294921875, -103.01171875, -99.2939453125, -95.576171875, -91.8583984375, -88.140625, -84.4228515625, -80.705078125, -76.9873046875, -73.26953125, -69.5517578125, -65.833984375, -62.1162109375, -58.3984375, -54.6806640625, -50.962890625, -47.2451171875, -43.52734375, -39.8095703125, -36.091796875, -32.3740234375, -28.65625, -24.9384765625, -21.220703125, -17.5029296875, -13.78515625, -10.0673828125, -6.349609375, -2.6318359375, 1.0859375, 4.8037109375, 8.521484375, 12.2392578125, 15.95703125, 19.6748046875, 23.392578125, 27.1103515625, 30.828125, 34.5458984375, 38.263671875, 41.9814453125, 45.69921875, 49.4169921875, 53.134765625, 56.8525390625, 60.5703125, 64.2880859375, 68.005859375, 71.7236328125, 75.44140625, 79.1591796875, 82.876953125, 86.5947265625, 90.3125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 12.0, 27.0, 47.0, 64.0, 150.0, 251.0, 560.0, 1009.0, 959.0, 495.0, 270.0, 112.0, 45.0, 32.0, 12.0, 7.0, 6.0, 6.0, 1.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.21484375, -5.82476806640625, -5.4346923828125, -5.04461669921875, -4.654541015625, -4.26446533203125, -3.8743896484375, -3.48431396484375, -3.09423828125, -2.70416259765625, -2.3140869140625, -1.92401123046875, -1.533935546875, -1.14385986328125, -0.7537841796875, -0.36370849609375, 0.0263671875, 0.41644287109375, 0.8065185546875, 1.19659423828125, 1.586669921875, 1.97674560546875, 2.3668212890625, 2.75689697265625, 3.14697265625, 3.53704833984375, 3.9271240234375, 4.31719970703125, 4.707275390625, 5.09735107421875, 5.4874267578125, 5.87750244140625, 6.267578125, 6.65765380859375, 7.0477294921875, 7.43780517578125, 7.827880859375, 8.21795654296875, 8.6080322265625, 8.99810791015625, 9.38818359375, 9.77825927734375, 10.1683349609375, 10.55841064453125, 10.948486328125, 11.33856201171875, 11.7286376953125, 12.11871337890625, 12.5087890625, 12.89886474609375, 13.2889404296875, 13.67901611328125, 14.069091796875, 14.45916748046875, 14.8492431640625, 15.23931884765625, 15.62939453125, 16.01947021484375, 16.4095458984375, 16.79962158203125, 17.189697265625, 17.57977294921875, 17.9698486328125, 18.35992431640625, 18.75]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 37.0, 200.0, 428.0, 265.0, 62.0, 11.0, 3.0, 2.0, 3.0], "bins": [-188.96583557128906, -185.68060302734375, -182.39537048339844, -179.11013793945312, -175.8249053955078, -172.5396728515625, -169.25442504882812, -165.96920776367188, -162.6839599609375, -159.3987274169922, -156.11349487304688, -152.82826232910156, -149.54302978515625, -146.25779724121094, -142.97256469726562, -139.68731689453125, -136.402099609375, -133.1168670654297, -129.83163452148438, -126.54640197753906, -123.26116180419922, -119.9759292602539, -116.6906967163086, -113.40546417236328, -110.12022399902344, -106.83499145507812, -103.54975891113281, -100.2645263671875, -96.97928619384766, -93.69405364990234, -90.40882110595703, -87.12358856201172, -83.83836364746094, -80.55313110351562, -77.26789855957031, -73.982666015625, -70.69742584228516, -67.41219329833984, -64.12696075439453, -60.84172821044922, -57.556488037109375, -54.27125549316406, -50.986019134521484, -47.70078659057617, -44.41555404663086, -41.13031768798828, -37.84508514404297, -34.559852600097656, -31.274620056152344, -27.9893856048584, -24.704153060913086, -21.41891860961914, -18.133686065673828, -14.848451614379883, -11.563217163085938, -8.277984619140625, -4.99275016784668, -1.7075164318084717, 1.5777173042297363, 4.862951278686523, 8.148184776306152, 11.433418273925781, 14.718652725219727, 18.00388526916504, 21.289119720458984]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 3.0, 18.0, 15.0, 13.0, 25.0, 35.0, 56.0, 59.0, 78.0, 68.0, 82.0, 83.0, 87.0, 79.0, 65.0, 55.0, 47.0, 45.0, 39.0, 13.0, 16.0, 9.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-35.95747756958008, -35.166969299316406, -34.376461029052734, -33.5859489440918, -32.795440673828125, -32.00493240356445, -31.21442413330078, -30.42391586303711, -29.633405685424805, -28.842897415161133, -28.052387237548828, -27.261878967285156, -26.471370697021484, -25.68086051940918, -24.890352249145508, -24.099842071533203, -23.30933380126953, -22.51882553100586, -21.728315353393555, -20.937807083129883, -20.147296905517578, -19.356788635253906, -18.566280364990234, -17.775772094726562, -16.985261917114258, -16.194753646850586, -15.404243469238281, -14.61373519897461, -13.823225975036621, -13.032716751098633, -12.242208480834961, -11.451699256896973, -10.661189079284668, -9.87067985534668, -9.080171585083008, -8.28966236114502, -7.499153137207031, -6.708643913269043, -5.918135166168213, -5.127626419067383, -4.3371171951293945, -3.5466082096099854, -2.756099224090576, -1.965590238571167, -1.1750812530517578, -0.38457226753234863, 0.40593671798706055, 1.1964454650878906, 1.986954689025879, 2.777463674545288, 3.5679726600646973, 4.358481407165527, 5.148990631103516, 5.939499855041504, 6.730008602142334, 7.520517349243164, 8.311026573181152, 9.10153579711914, 9.892044067382812, 10.6825532913208, 11.473062515258789, 12.263571739196777, 13.054080963134766, 13.844589233398438, 14.635098457336426]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 9.0, 14.0, 15.0, 24.0, 44.0, 97.0, 165.0, 413.0, 862.0, 2470.0, 10399.0, 108943.0, 726577.0, 178561.0, 15003.0, 2989.0, 1084.0, 456.0, 185.0, 96.0, 52.0, 36.0, 16.0, 15.0, 11.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.65234375, -7.41754150390625, -7.1827392578125, -6.94793701171875, -6.713134765625, -6.47833251953125, -6.2435302734375, -6.00872802734375, -5.77392578125, -5.53912353515625, -5.3043212890625, -5.06951904296875, -4.834716796875, -4.59991455078125, -4.3651123046875, -4.13031005859375, -3.8955078125, -3.66070556640625, -3.4259033203125, -3.19110107421875, -2.956298828125, -2.72149658203125, -2.4866943359375, -2.25189208984375, -2.01708984375, -1.78228759765625, -1.5474853515625, -1.31268310546875, -1.077880859375, -0.84307861328125, -0.6082763671875, -0.37347412109375, -0.138671875, 0.09613037109375, 0.3309326171875, 0.56573486328125, 0.800537109375, 1.03533935546875, 1.2701416015625, 1.50494384765625, 1.73974609375, 1.97454833984375, 2.2093505859375, 2.44415283203125, 2.678955078125, 2.91375732421875, 3.1485595703125, 3.38336181640625, 3.6181640625, 3.85296630859375, 4.0877685546875, 4.32257080078125, 4.557373046875, 4.79217529296875, 5.0269775390625, 5.26177978515625, 5.49658203125, 5.73138427734375, 5.9661865234375, 6.20098876953125, 6.435791015625, 6.67059326171875, 6.9053955078125, 7.14019775390625, 7.375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 9.0, 15.0, 28.0, 25.0, 50.0, 72.0, 78.0, 83.0, 81.0, 114.0, 106.0, 97.0, 54.0, 60.0, 39.0, 42.0, 23.0, 10.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-30.0625, -29.3836669921875, -28.704833984375, -28.0260009765625, -27.34716796875, -26.6683349609375, -25.989501953125, -25.3106689453125, -24.6318359375, -23.9530029296875, -23.274169921875, -22.5953369140625, -21.91650390625, -21.2376708984375, -20.558837890625, -19.8800048828125, -19.201171875, -18.5223388671875, -17.843505859375, -17.1646728515625, -16.48583984375, -15.8070068359375, -15.128173828125, -14.4493408203125, -13.7705078125, -13.0916748046875, -12.412841796875, -11.7340087890625, -11.05517578125, -10.3763427734375, -9.697509765625, -9.0186767578125, -8.33984375, -7.6610107421875, -6.982177734375, -6.3033447265625, -5.62451171875, -4.9456787109375, -4.266845703125, -3.5880126953125, -2.9091796875, -2.2303466796875, -1.551513671875, -0.8726806640625, -0.19384765625, 0.4849853515625, 1.163818359375, 1.8426513671875, 2.521484375, 3.2003173828125, 3.879150390625, 4.5579833984375, 5.23681640625, 5.9156494140625, 6.594482421875, 7.2733154296875, 7.9521484375, 8.6309814453125, 9.309814453125, 9.9886474609375, 10.66748046875, 11.3463134765625, 12.025146484375, 12.7039794921875, 13.3828125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 7.0, 12.0, 9.0, 15.0, 28.0, 28.0, 54.0, 61.0, 114.0, 166.0, 280.0, 402.0, 571.0, 974.0, 1545.0, 2389.0, 3754.0, 6192.0, 9748.0, 16179.0, 25236.0, 40428.0, 63263.0, 93080.0, 127268.0, 151507.0, 148765.0, 119606.0, 84471.0, 56052.0, 36384.0, 22486.0, 13952.0, 8655.0, 5564.0, 3453.0, 2078.0, 1310.0, 829.0, 573.0, 376.0, 207.0, 151.0, 112.0, 62.0, 59.0, 34.0, 14.0, 14.0, 14.0, 8.0, 7.0, 8.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.93994140625, -0.9104461669921875, -0.880950927734375, -0.8514556884765625, -0.82196044921875, -0.7924652099609375, -0.762969970703125, -0.7334747314453125, -0.7039794921875, -0.6744842529296875, -0.644989013671875, -0.6154937744140625, -0.58599853515625, -0.5565032958984375, -0.527008056640625, -0.4975128173828125, -0.468017578125, -0.4385223388671875, -0.409027099609375, -0.3795318603515625, -0.35003662109375, -0.3205413818359375, -0.291046142578125, -0.2615509033203125, -0.2320556640625, -0.2025604248046875, -0.173065185546875, -0.1435699462890625, -0.11407470703125, -0.0845794677734375, -0.055084228515625, -0.0255889892578125, 0.00390625, 0.0334014892578125, 0.062896728515625, 0.0923919677734375, 0.12188720703125, 0.1513824462890625, 0.180877685546875, 0.2103729248046875, 0.2398681640625, 0.2693634033203125, 0.298858642578125, 0.3283538818359375, 0.35784912109375, 0.3873443603515625, 0.416839599609375, 0.4463348388671875, 0.475830078125, 0.5053253173828125, 0.534820556640625, 0.5643157958984375, 0.59381103515625, 0.6233062744140625, 0.652801513671875, 0.6822967529296875, 0.7117919921875, 0.7412872314453125, 0.770782470703125, 0.8002777099609375, 0.82977294921875, 0.8592681884765625, 0.888763427734375, 0.9182586669921875, 0.94775390625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 9.0, 7.0, 2.0, 5.0, 15.0, 13.0, 13.0, 21.0, 11.0, 17.0, 26.0, 23.0, 29.0, 31.0, 27.0, 28.0, 35.0, 41.0, 49.0, 32.0, 48.0, 48.0, 47.0, 32.0, 33.0, 41.0, 31.0, 40.0, 39.0, 24.0, 33.0, 29.0, 20.0, 16.0, 16.0, 13.0, 11.0, 8.0, 8.0, 10.0, 5.0, 5.0, 7.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-18.8125, -18.2451171875, -17.677734375, -17.1103515625, -16.54296875, -15.9755859375, -15.408203125, -14.8408203125, -14.2734375, -13.7060546875, -13.138671875, -12.5712890625, -12.00390625, -11.4365234375, -10.869140625, -10.3017578125, -9.734375, -9.1669921875, -8.599609375, -8.0322265625, -7.46484375, -6.8974609375, -6.330078125, -5.7626953125, -5.1953125, -4.6279296875, -4.060546875, -3.4931640625, -2.92578125, -2.3583984375, -1.791015625, -1.2236328125, -0.65625, -0.0888671875, 0.478515625, 1.0458984375, 1.61328125, 2.1806640625, 2.748046875, 3.3154296875, 3.8828125, 4.4501953125, 5.017578125, 5.5849609375, 6.15234375, 6.7197265625, 7.287109375, 7.8544921875, 8.421875, 8.9892578125, 9.556640625, 10.1240234375, 10.69140625, 11.2587890625, 11.826171875, 12.3935546875, 12.9609375, 13.5283203125, 14.095703125, 14.6630859375, 15.23046875, 15.7978515625, 16.365234375, 16.9326171875, 17.5]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 7.0, 6.0, 5.0, 8.0, 15.0, 18.0, 31.0, 48.0, 50.0, 91.0, 164.0, 308.0, 534.0, 1018.0, 2160.0, 4572.0, 11540.0, 37692.0, 160450.0, 472749.0, 266893.0, 61482.0, 16841.0, 6227.0, 2743.0, 1317.0, 671.0, 377.0, 190.0, 121.0, 82.0, 51.0, 23.0, 17.0, 9.0, 16.0, 9.0, 5.0, 6.0, 1.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.306396484375, -0.2972984313964844, -0.28820037841796875, -0.2791023254394531, -0.2700042724609375, -0.2609062194824219, -0.25180816650390625, -0.24271011352539062, -0.233612060546875, -0.22451400756835938, -0.21541595458984375, -0.20631790161132812, -0.1972198486328125, -0.18812179565429688, -0.17902374267578125, -0.16992568969726562, -0.16082763671875, -0.15172958374023438, -0.14263153076171875, -0.13353347778320312, -0.1244354248046875, -0.11533737182617188, -0.10623931884765625, -0.09714126586914062, -0.088043212890625, -0.07894515991210938, -0.06984710693359375, -0.060749053955078125, -0.0516510009765625, -0.042552947998046875, -0.03345489501953125, -0.024356842041015625, -0.0152587890625, -0.006160736083984375, 0.00293731689453125, 0.012035369873046875, 0.0211334228515625, 0.030231475830078125, 0.03932952880859375, 0.048427581787109375, 0.057525634765625, 0.06662368774414062, 0.07572174072265625, 0.08481979370117188, 0.0939178466796875, 0.10301589965820312, 0.11211395263671875, 0.12121200561523438, 0.13031005859375, 0.13940811157226562, 0.14850616455078125, 0.15760421752929688, 0.1667022705078125, 0.17580032348632812, 0.18489837646484375, 0.19399642944335938, 0.203094482421875, 0.21219253540039062, 0.22129058837890625, 0.23038864135742188, 0.2394866943359375, 0.24858474731445312, 0.25768280029296875, 0.2667808532714844, 0.27587890625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 5.0, 3.0, 2.0, 3.0, 11.0, 7.0, 11.0, 16.0, 29.0, 52.0, 59.0, 101.0, 102.0, 124.0, 123.0, 117.0, 78.0, 48.0, 31.0, 35.0, 10.0, 12.0, 4.0, 8.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0003180503845214844, -0.0003094002604484558, -0.00030075013637542725, -0.0002921000123023987, -0.0002834498882293701, -0.00027479976415634155, -0.000266149640083313, -0.0002574995160102844, -0.00024884939193725586, -0.0002401992678642273, -0.00023154914379119873, -0.00022289901971817017, -0.0002142488956451416, -0.00020559877157211304, -0.00019694864749908447, -0.0001882985234260559, -0.00017964839935302734, -0.00017099827527999878, -0.00016234815120697021, -0.00015369802713394165, -0.00014504790306091309, -0.00013639777898788452, -0.00012774765491485596, -0.00011909753084182739, -0.00011044740676879883, -0.00010179728269577026, -9.31471586227417e-05, -8.449703454971313e-05, -7.584691047668457e-05, -6.7196786403656e-05, -5.854666233062744e-05, -4.989653825759888e-05, -4.124641418457031e-05, -3.259629011154175e-05, -2.3946166038513184e-05, -1.529604196548462e-05, -6.645917892456055e-06, 2.0042061805725098e-06, 1.0654330253601074e-05, 1.930445432662964e-05, 2.7954578399658203e-05, 3.660470247268677e-05, 4.525482654571533e-05, 5.3904950618743896e-05, 6.255507469177246e-05, 7.120519876480103e-05, 7.985532283782959e-05, 8.850544691085815e-05, 9.715557098388672e-05, 0.00010580569505691528, 0.00011445581912994385, 0.0001231059432029724, 0.00013175606727600098, 0.00014040619134902954, 0.0001490563154220581, 0.00015770643949508667, 0.00016635656356811523, 0.0001750066876411438, 0.00018365681171417236, 0.00019230693578720093, 0.0002009570598602295, 0.00020960718393325806, 0.00021825730800628662, 0.00022690743207931519, 0.00023555755615234375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 10.0, 10.0, 12.0, 18.0, 21.0, 31.0, 48.0, 81.0, 125.0, 209.0, 367.0, 706.0, 1590.0, 4026.0, 13903.0, 91616.0, 631482.0, 263758.0, 29566.0, 6451.0, 2302.0, 1007.0, 483.0, 294.0, 141.0, 86.0, 57.0, 41.0, 31.0, 24.0, 17.0, 4.0, 4.0, 11.0, 7.0, 3.0, 3.0, 2.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.481689453125, -0.4665069580078125, -0.451324462890625, -0.4361419677734375, -0.42095947265625, -0.4057769775390625, -0.390594482421875, -0.3754119873046875, -0.3602294921875, -0.3450469970703125, -0.329864501953125, -0.3146820068359375, -0.29949951171875, -0.2843170166015625, -0.269134521484375, -0.2539520263671875, -0.23876953125, -0.2235870361328125, -0.208404541015625, -0.1932220458984375, -0.17803955078125, -0.1628570556640625, -0.147674560546875, -0.1324920654296875, -0.1173095703125, -0.1021270751953125, -0.086944580078125, -0.0717620849609375, -0.05657958984375, -0.0413970947265625, -0.026214599609375, -0.0110321044921875, 0.004150390625, 0.0193328857421875, 0.034515380859375, 0.0496978759765625, 0.06488037109375, 0.0800628662109375, 0.095245361328125, 0.1104278564453125, 0.1256103515625, 0.1407928466796875, 0.155975341796875, 0.1711578369140625, 0.18634033203125, 0.2015228271484375, 0.216705322265625, 0.2318878173828125, 0.2470703125, 0.2622528076171875, 0.277435302734375, 0.2926177978515625, 0.30780029296875, 0.3229827880859375, 0.338165283203125, 0.3533477783203125, 0.3685302734375, 0.3837127685546875, 0.398895263671875, 0.4140777587890625, 0.42926025390625, 0.4444427490234375, 0.459625244140625, 0.4748077392578125, 0.489990234375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 5.0, 12.0, 10.0, 11.0, 7.0, 17.0, 12.0, 19.0, 21.0, 27.0, 41.0, 54.0, 45.0, 58.0, 73.0, 72.0, 83.0, 85.0, 63.0, 45.0, 47.0, 35.0, 23.0, 20.0, 22.0, 16.0, 17.0, 8.0, 7.0, 8.0, 6.0, 9.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07159423828125, -0.06919384002685547, -0.06679344177246094, -0.0643930435180664, -0.061992645263671875, -0.059592247009277344, -0.05719184875488281, -0.05479145050048828, -0.05239105224609375, -0.04999065399169922, -0.04759025573730469, -0.045189857482910156, -0.042789459228515625, -0.040389060974121094, -0.03798866271972656, -0.03558826446533203, -0.0331878662109375, -0.03078746795654297, -0.028387069702148438, -0.025986671447753906, -0.023586273193359375, -0.021185874938964844, -0.018785476684570312, -0.01638507843017578, -0.01398468017578125, -0.011584281921386719, -0.009183883666992188, -0.006783485412597656, -0.004383087158203125, -0.0019826889038085938, 0.0004177093505859375, 0.0028181076049804688, 0.005218505859375, 0.007618904113769531, 0.010019302368164062, 0.012419700622558594, 0.014820098876953125, 0.017220497131347656, 0.019620895385742188, 0.02202129364013672, 0.02442169189453125, 0.02682209014892578, 0.029222488403320312, 0.031622886657714844, 0.034023284912109375, 0.036423683166503906, 0.03882408142089844, 0.04122447967529297, 0.0436248779296875, 0.04602527618408203, 0.04842567443847656, 0.050826072692871094, 0.053226470947265625, 0.055626869201660156, 0.05802726745605469, 0.06042766571044922, 0.06282806396484375, 0.06522846221923828, 0.06762886047363281, 0.07002925872802734, 0.07242965698242188, 0.0748300552368164, 0.07723045349121094, 0.07963085174560547, 0.08203125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 12.0, 78.0, 382.0, 425.0, 100.0, 13.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-136.1502685546875, -133.67391967773438, -131.19757080078125, -128.7212371826172, -126.24488830566406, -123.76853942871094, -121.29219818115234, -118.81585693359375, -116.33950805664062, -113.8631591796875, -111.3868179321289, -108.91047668457031, -106.43412780761719, -103.95777893066406, -101.48143768310547, -99.00509643554688, -96.52874755859375, -94.05239868164062, -91.57605743408203, -89.09971618652344, -86.62336730957031, -84.14701843261719, -81.6706771850586, -79.1943359375, -76.71798706054688, -74.24163818359375, -71.76529693603516, -69.28895568847656, -66.81260681152344, -64.33625793457031, -61.85991668701172, -59.38357162475586, -56.90723419189453, -54.43088912963867, -51.95454406738281, -49.47819900512695, -47.001853942871094, -44.525508880615234, -42.049163818359375, -39.572818756103516, -37.096473693847656, -34.6201286315918, -32.14378356933594, -29.667438507080078, -27.19109344482422, -24.71474838256836, -22.2384033203125, -19.76205825805664, -17.28571319580078, -14.809368133544922, -12.333023071289062, -9.856678009033203, -7.380332946777344, -4.903987884521484, -2.427642822265625, 0.048702239990234375, 2.5250473022460938, 5.001392364501953, 7.4777374267578125, 9.954082489013672, 12.430427551269531, 14.90677261352539, 17.38311767578125, 19.85946273803711, 22.33580780029297]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 7.0, 5.0, 18.0, 15.0, 30.0, 47.0, 77.0, 79.0, 97.0, 100.0, 121.0, 99.0, 82.0, 70.0, 48.0, 56.0, 21.0, 17.0, 9.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.912860870361328, -30.212923049926758, -29.512985229492188, -28.813047409057617, -28.113109588623047, -27.413171768188477, -26.713233947753906, -26.013294219970703, -25.313358306884766, -24.613420486450195, -23.913482666015625, -23.213544845581055, -22.513607025146484, -21.813669204711914, -21.113731384277344, -20.41379165649414, -19.71385383605957, -19.013916015625, -18.31397819519043, -17.61404037475586, -16.91410255432129, -16.21416473388672, -15.514225959777832, -14.814288139343262, -14.114350318908691, -13.414412498474121, -12.71447467803955, -12.014535903930664, -11.314598083496094, -10.614660263061523, -9.914722442626953, -9.214784622192383, -8.514845848083496, -7.814908027648926, -7.1149702072143555, -6.415031909942627, -5.715094089508057, -5.015156269073486, -4.315217971801758, -3.6152801513671875, -2.915342330932617, -2.215404510498047, -1.5154664516448975, -0.815528392791748, -0.11559057235717773, 0.5843472480773926, 1.284285545349121, 1.9842233657836914, 2.6841611862182617, 3.384099006652832, 4.084036827087402, 4.783975124359131, 5.483912944793701, 6.1838507652282715, 6.8837890625, 7.58372688293457, 8.28366470336914, 8.983602523803711, 9.683540344238281, 10.383478164672852, 11.083415985107422, 11.783353805541992, 12.483292579650879, 13.18323040008545, 13.88316822052002]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 13.0, 11.0, 8.0, 20.0, 28.0, 43.0, 68.0, 122.0, 180.0, 302.0, 615.0, 1112.0, 2697.0, 6487.0, 19741.0, 79787.0, 398051.0, 420503.0, 85851.0, 20657.0, 6867.0, 2739.0, 1195.0, 610.0, 296.0, 201.0, 125.0, 59.0, 39.0, 41.0, 19.0, 15.0, 11.0, 8.0, 5.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.703125, -7.446533203125, -7.18994140625, -6.933349609375, -6.6767578125, -6.420166015625, -6.16357421875, -5.906982421875, -5.650390625, -5.393798828125, -5.13720703125, -4.880615234375, -4.6240234375, -4.367431640625, -4.11083984375, -3.854248046875, -3.59765625, -3.341064453125, -3.08447265625, -2.827880859375, -2.5712890625, -2.314697265625, -2.05810546875, -1.801513671875, -1.544921875, -1.288330078125, -1.03173828125, -0.775146484375, -0.5185546875, -0.261962890625, -0.00537109375, 0.251220703125, 0.5078125, 0.764404296875, 1.02099609375, 1.277587890625, 1.5341796875, 1.790771484375, 2.04736328125, 2.303955078125, 2.560546875, 2.817138671875, 3.07373046875, 3.330322265625, 3.5869140625, 3.843505859375, 4.10009765625, 4.356689453125, 4.61328125, 4.869873046875, 5.12646484375, 5.383056640625, 5.6396484375, 5.896240234375, 6.15283203125, 6.409423828125, 6.666015625, 6.922607421875, 7.17919921875, 7.435791015625, 7.6923828125, 7.948974609375, 8.20556640625, 8.462158203125, 8.71875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 6.0, 5.0, 6.0, 15.0, 14.0, 30.0, 30.0, 42.0, 52.0, 60.0, 72.0, 69.0, 105.0, 87.0, 82.0, 72.0, 56.0, 65.0, 39.0, 29.0, 30.0, 16.0, 8.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-49.90625, -48.81787109375, -47.7294921875, -46.64111328125, -45.552734375, -44.46435546875, -43.3759765625, -42.28759765625, -41.19921875, -40.11083984375, -39.0224609375, -37.93408203125, -36.845703125, -35.75732421875, -34.6689453125, -33.58056640625, -32.4921875, -31.40380859375, -30.3154296875, -29.22705078125, -28.138671875, -27.05029296875, -25.9619140625, -24.87353515625, -23.78515625, -22.69677734375, -21.6083984375, -20.52001953125, -19.431640625, -18.34326171875, -17.2548828125, -16.16650390625, -15.078125, -13.98974609375, -12.9013671875, -11.81298828125, -10.724609375, -9.63623046875, -8.5478515625, -7.45947265625, -6.37109375, -5.28271484375, -4.1943359375, -3.10595703125, -2.017578125, -0.92919921875, 0.1591796875, 1.24755859375, 2.3359375, 3.42431640625, 4.5126953125, 5.60107421875, 6.689453125, 7.77783203125, 8.8662109375, 9.95458984375, 11.04296875, 12.13134765625, 13.2197265625, 14.30810546875, 15.396484375, 16.48486328125, 17.5732421875, 18.66162109375, 19.75]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 6.0, 4.0, 11.0, 23.0, 22.0, 34.0, 13.0, 44.0, 62.0, 87.0, 102.0, 283.0, 6856.0, 1039502.0, 920.0, 185.0, 107.0, 76.0, 42.0, 37.0, 36.0, 28.0, 20.0, 13.0, 8.0, 7.0, 6.0, 1.0, 6.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.875, -67.1142578125, -64.353515625, -61.5927734375, -58.83203125, -56.0712890625, -53.310546875, -50.5498046875, -47.7890625, -45.0283203125, -42.267578125, -39.5068359375, -36.74609375, -33.9853515625, -31.224609375, -28.4638671875, -25.703125, -22.9423828125, -20.181640625, -17.4208984375, -14.66015625, -11.8994140625, -9.138671875, -6.3779296875, -3.6171875, -0.8564453125, 1.904296875, 4.6650390625, 7.42578125, 10.1865234375, 12.947265625, 15.7080078125, 18.46875, 21.2294921875, 23.990234375, 26.7509765625, 29.51171875, 32.2724609375, 35.033203125, 37.7939453125, 40.5546875, 43.3154296875, 46.076171875, 48.8369140625, 51.59765625, 54.3583984375, 57.119140625, 59.8798828125, 62.640625, 65.4013671875, 68.162109375, 70.9228515625, 73.68359375, 76.4443359375, 79.205078125, 81.9658203125, 84.7265625, 87.4873046875, 90.248046875, 93.0087890625, 95.76953125, 98.5302734375, 101.291015625, 104.0517578125, 106.8125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 5.0, 4.0, 7.0, 11.0, 23.0, 17.0, 28.0, 23.0, 40.0, 53.0, 48.0, 65.0, 64.0, 75.0, 76.0, 66.0, 67.0, 64.0, 63.0, 40.0, 26.0, 33.0, 29.0, 21.0, 15.0, 10.0, 5.0, 7.0, 2.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.71875, -29.5478515625, -28.376953125, -27.2060546875, -26.03515625, -24.8642578125, -23.693359375, -22.5224609375, -21.3515625, -20.1806640625, -19.009765625, -17.8388671875, -16.66796875, -15.4970703125, -14.326171875, -13.1552734375, -11.984375, -10.8134765625, -9.642578125, -8.4716796875, -7.30078125, -6.1298828125, -4.958984375, -3.7880859375, -2.6171875, -1.4462890625, -0.275390625, 0.8955078125, 2.06640625, 3.2373046875, 4.408203125, 5.5791015625, 6.75, 7.9208984375, 9.091796875, 10.2626953125, 11.43359375, 12.6044921875, 13.775390625, 14.9462890625, 16.1171875, 17.2880859375, 18.458984375, 19.6298828125, 20.80078125, 21.9716796875, 23.142578125, 24.3134765625, 25.484375, 26.6552734375, 27.826171875, 28.9970703125, 30.16796875, 31.3388671875, 32.509765625, 33.6806640625, 34.8515625, 36.0224609375, 37.193359375, 38.3642578125, 39.53515625, 40.7060546875, 41.876953125, 43.0478515625, 44.21875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 5.0, 1.0, 8.0, 9.0, 24.0, 42.0, 91.0, 351.0, 3011.0, 911305.0, 131563.0, 1712.0, 252.0, 92.0, 39.0, 18.0, 6.0, 5.0, 2.0, 6.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.921875, -24.140625, -23.359375, -22.578125, -21.796875, -21.015625, -20.234375, -19.453125, -18.671875, -17.890625, -17.109375, -16.328125, -15.546875, -14.765625, -13.984375, -13.203125, -12.421875, -11.640625, -10.859375, -10.078125, -9.296875, -8.515625, -7.734375, -6.953125, -6.171875, -5.390625, -4.609375, -3.828125, -3.046875, -2.265625, -1.484375, -0.703125, 0.078125, 0.859375, 1.640625, 2.421875, 3.203125, 3.984375, 4.765625, 5.546875, 6.328125, 7.109375, 7.890625, 8.671875, 9.453125, 10.234375, 11.015625, 11.796875, 12.578125, 13.359375, 14.140625, 14.921875, 15.703125, 16.484375, 17.265625, 18.046875, 18.828125, 19.609375, 20.390625, 21.171875, 21.953125, 22.734375, 23.515625, 24.296875, 25.078125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 5.0, 8.0, 19.0, 24.0, 43.0, 104.0, 213.0, 258.0, 163.0, 79.0, 35.0, 20.0, 14.0, 8.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014352798461914062, -0.0013935714960098267, -0.001351863145828247, -0.0013101547956466675, -0.0012684464454650879, -0.0012267380952835083, -0.0011850297451019287, -0.0011433213949203491, -0.0011016130447387695, -0.00105990469455719, -0.0010181963443756104, -0.0009764879941940308, -0.0009347796440124512, -0.0008930712938308716, -0.000851362943649292, -0.0008096545934677124, -0.0007679462432861328, -0.0007262378931045532, -0.0006845295429229736, -0.000642821192741394, -0.0006011128425598145, -0.0005594044923782349, -0.0005176961421966553, -0.0004759877920150757, -0.0004342794418334961, -0.0003925710916519165, -0.0003508627414703369, -0.0003091543912887573, -0.00026744604110717773, -0.00022573769092559814, -0.00018402934074401855, -0.00014232099056243896, -0.00010061264038085938, -5.8904290199279785e-05, -1.7195940017700195e-05, 2.4512410163879395e-05, 6.622076034545898e-05, 0.00010792911052703857, 0.00014963746070861816, 0.00019134581089019775, 0.00023305416107177734, 0.00027476251125335693, 0.0003164708614349365, 0.0003581792116165161, 0.0003998875617980957, 0.0004415959119796753, 0.0004833042621612549, 0.0005250126123428345, 0.0005667209625244141, 0.0006084293127059937, 0.0006501376628875732, 0.0006918460130691528, 0.0007335543632507324, 0.000775262713432312, 0.0008169710636138916, 0.0008586794137954712, 0.0009003877639770508, 0.0009420961141586304, 0.00098380446434021, 0.0010255128145217896, 0.0010672211647033691, 0.0011089295148849487, 0.0011506378650665283, 0.001192346215248108, 0.0012340545654296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 10.0, 8.0, 11.0, 19.0, 49.0, 100.0, 204.0, 803.0, 5997.0, 598260.0, 436715.0, 5155.0, 802.0, 230.0, 73.0, 59.0, 22.0, 11.0, 4.0, 7.0, 7.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.875, -17.4278564453125, -16.980712890625, -16.5335693359375, -16.08642578125, -15.6392822265625, -15.192138671875, -14.7449951171875, -14.2978515625, -13.8507080078125, -13.403564453125, -12.9564208984375, -12.50927734375, -12.0621337890625, -11.614990234375, -11.1678466796875, -10.720703125, -10.2735595703125, -9.826416015625, -9.3792724609375, -8.93212890625, -8.4849853515625, -8.037841796875, -7.5906982421875, -7.1435546875, -6.6964111328125, -6.249267578125, -5.8021240234375, -5.35498046875, -4.9078369140625, -4.460693359375, -4.0135498046875, -3.56640625, -3.1192626953125, -2.672119140625, -2.2249755859375, -1.77783203125, -1.3306884765625, -0.883544921875, -0.4364013671875, 0.0107421875, 0.4578857421875, 0.905029296875, 1.3521728515625, 1.79931640625, 2.2464599609375, 2.693603515625, 3.1407470703125, 3.587890625, 4.0350341796875, 4.482177734375, 4.9293212890625, 5.37646484375, 5.8236083984375, 6.270751953125, 6.7178955078125, 7.1650390625, 7.6121826171875, 8.059326171875, 8.5064697265625, 8.95361328125, 9.4007568359375, 9.847900390625, 10.2950439453125, 10.7421875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 4.0, 8.0, 5.0, 2.0, 11.0, 19.0, 36.0, 36.0, 52.0, 97.0, 132.0, 152.0, 141.0, 110.0, 69.0, 46.0, 28.0, 21.0, 11.0, 6.0, 5.0, 4.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5927734375, -1.5229949951171875, -1.453216552734375, -1.3834381103515625, -1.31365966796875, -1.2438812255859375, -1.174102783203125, -1.1043243408203125, -1.0345458984375, -0.9647674560546875, -0.894989013671875, -0.8252105712890625, -0.75543212890625, -0.6856536865234375, -0.615875244140625, -0.5460968017578125, -0.476318359375, -0.4065399169921875, -0.336761474609375, -0.2669830322265625, -0.19720458984375, -0.1274261474609375, -0.057647705078125, 0.0121307373046875, 0.0819091796875, 0.1516876220703125, 0.221466064453125, 0.2912445068359375, 0.36102294921875, 0.4308013916015625, 0.500579833984375, 0.5703582763671875, 0.64013671875, 0.7099151611328125, 0.779693603515625, 0.8494720458984375, 0.91925048828125, 0.9890289306640625, 1.058807373046875, 1.1285858154296875, 1.1983642578125, 1.2681427001953125, 1.337921142578125, 1.4076995849609375, 1.47747802734375, 1.5472564697265625, 1.617034912109375, 1.6868133544921875, 1.756591796875, 1.8263702392578125, 1.896148681640625, 1.9659271240234375, 2.03570556640625, 2.1054840087890625, 2.175262451171875, 2.2450408935546875, 2.3148193359375, 2.3845977783203125, 2.454376220703125, 2.5241546630859375, 2.59393310546875, 2.6637115478515625, 2.733489990234375, 2.8032684326171875, 2.873046875]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 17.0, 113.0, 361.0, 369.0, 124.0, 20.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-220.63658142089844, -216.4689178466797, -212.30125427246094, -208.1335906982422, -203.96592712402344, -199.79827880859375, -195.630615234375, -191.46295166015625, -187.2952880859375, -183.12762451171875, -178.9599609375, -174.79229736328125, -170.6246337890625, -166.45697021484375, -162.289306640625, -158.1216583251953, -153.9539794921875, -149.78631591796875, -145.61865234375, -141.45098876953125, -137.2833251953125, -133.11566162109375, -128.947998046875, -124.78034210205078, -120.61268615722656, -116.44502258300781, -112.27735900878906, -108.10969543457031, -103.9420394897461, -99.77437591552734, -95.6067123413086, -91.43904876708984, -87.27139282226562, -83.10372924804688, -78.93606567382812, -74.76840209960938, -70.60074615478516, -66.4330825805664, -62.265419006347656, -58.097755432128906, -53.930091857910156, -49.762428283691406, -45.59476852416992, -41.42710494995117, -37.25944519042969, -33.09178161621094, -28.924118041992188, -24.75645637512207, -20.588794708251953, -16.421133041381836, -12.253470420837402, -8.085807800292969, -3.9181461334228516, 0.24951553344726562, 4.417179107666016, 8.584840774536133, 12.75250244140625, 16.920164108276367, 21.087825775146484, 25.255489349365234, 29.42315101623535, 33.59081268310547, 37.75847625732422, 41.92613983154297, 46.09379959106445]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 3.0, 11.0, 12.0, 15.0, 11.0, 23.0, 21.0, 20.0, 23.0, 31.0, 35.0, 29.0, 30.0, 28.0, 55.0, 57.0, 46.0, 41.0, 40.0, 38.0, 43.0, 30.0, 41.0, 32.0, 40.0, 40.0, 42.0, 24.0, 20.0, 17.0, 15.0, 14.0, 18.0, 9.0, 6.0, 8.0, 6.0, 4.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-33.787109375, -32.79904556274414, -31.810983657836914, -30.822921752929688, -29.834857940673828, -28.8467960357666, -27.858732223510742, -26.870670318603516, -25.882606506347656, -24.89454460144043, -23.90648078918457, -22.918418884277344, -21.930355072021484, -20.942293167114258, -19.9542293548584, -18.966167449951172, -17.978103637695312, -16.990041732788086, -16.001977920532227, -15.013915061950684, -14.02585220336914, -13.037790298461914, -12.049726486206055, -11.061664581298828, -10.073602676391602, -9.085539817810059, -8.097476959228516, -7.109414100646973, -6.12135124206543, -5.133288860321045, -4.145226001739502, -3.157163143157959, -2.169099807739258, -1.1810369491577148, -0.19297420978546143, 0.795088529586792, 1.783151388168335, 2.771214008331299, 3.759276866912842, 4.747339725494385, 5.735402584075928, 6.723465442657471, 7.711528301239014, 8.699590682983398, 9.687653541564941, 10.675716400146484, 11.663779258728027, 12.65184211730957, 13.639904975891113, 14.627967834472656, 15.6160306930542, 16.604093551635742, 17.59215545654297, 18.580219268798828, 19.568281173706055, 20.556344985961914, 21.54440689086914, 22.532468795776367, 23.520532608032227, 24.508594512939453, 25.496658325195312, 26.48472023010254, 27.4727840423584, 28.460845947265625, 29.448909759521484]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 7.0, 6.0, 7.0, 15.0, 12.0, 16.0, 18.0, 25.0, 33.0, 36.0, 82.0, 114.0, 175.0, 454.0, 1296.0, 5151.0, 32454.0, 337130.0, 2527625.0, 1167023.0, 102783.0, 13401.0, 3266.0, 1443.0, 871.0, 403.0, 204.0, 81.0, 33.0, 22.0, 27.0, 12.0, 12.0, 9.0, 10.0, 10.0, 2.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.90625, -28.119873046875, -27.33349609375, -26.547119140625, -25.7607421875, -24.974365234375, -24.18798828125, -23.401611328125, -22.615234375, -21.828857421875, -21.04248046875, -20.256103515625, -19.4697265625, -18.683349609375, -17.89697265625, -17.110595703125, -16.32421875, -15.537841796875, -14.75146484375, -13.965087890625, -13.1787109375, -12.392333984375, -11.60595703125, -10.819580078125, -10.033203125, -9.246826171875, -8.46044921875, -7.674072265625, -6.8876953125, -6.101318359375, -5.31494140625, -4.528564453125, -3.7421875, -2.955810546875, -2.16943359375, -1.383056640625, -0.5966796875, 0.189697265625, 0.97607421875, 1.762451171875, 2.548828125, 3.335205078125, 4.12158203125, 4.907958984375, 5.6943359375, 6.480712890625, 7.26708984375, 8.053466796875, 8.83984375, 9.626220703125, 10.41259765625, 11.198974609375, 11.9853515625, 12.771728515625, 13.55810546875, 14.344482421875, 15.130859375, 15.917236328125, 16.70361328125, 17.489990234375, 18.2763671875, 19.062744140625, 19.84912109375, 20.635498046875, 21.421875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 7.0, 6.0, 14.0, 20.0, 44.0, 47.0, 95.0, 101.0, 110.0, 121.0, 104.0, 95.0, 82.0, 54.0, 44.0, 24.0, 19.0, 10.0, 7.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-41.71875, -40.8580322265625, -39.997314453125, -39.1365966796875, -38.27587890625, -37.4151611328125, -36.554443359375, -35.6937255859375, -34.8330078125, -33.9722900390625, -33.111572265625, -32.2508544921875, -31.39013671875, -30.5294189453125, -29.668701171875, -28.8079833984375, -27.947265625, -27.0865478515625, -26.225830078125, -25.3651123046875, -24.50439453125, -23.6436767578125, -22.782958984375, -21.9222412109375, -21.0615234375, -20.2008056640625, -19.340087890625, -18.4793701171875, -17.61865234375, -16.7579345703125, -15.897216796875, -15.0364990234375, -14.17578125, -13.3150634765625, -12.454345703125, -11.5936279296875, -10.73291015625, -9.8721923828125, -9.011474609375, -8.1507568359375, -7.2900390625, -6.4293212890625, -5.568603515625, -4.7078857421875, -3.84716796875, -2.9864501953125, -2.125732421875, -1.2650146484375, -0.404296875, 0.4564208984375, 1.317138671875, 2.1778564453125, 3.03857421875, 3.8992919921875, 4.760009765625, 5.6207275390625, 6.4814453125, 7.3421630859375, 8.202880859375, 9.0635986328125, 9.92431640625, 10.7850341796875, 11.645751953125, 12.5064697265625, 13.3671875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 6.0, 9.0, 5.0, 13.0, 30.0, 50.0, 113.0, 374.0, 2302.0, 3309730.0, 879663.0, 1532.0, 289.0, 90.0, 34.0, 23.0, 13.0, 9.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.3125, -78.8740234375, -75.435546875, -71.9970703125, -68.55859375, -65.1201171875, -61.681640625, -58.2431640625, -54.8046875, -51.3662109375, -47.927734375, -44.4892578125, -41.05078125, -37.6123046875, -34.173828125, -30.7353515625, -27.296875, -23.8583984375, -20.419921875, -16.9814453125, -13.54296875, -10.1044921875, -6.666015625, -3.2275390625, 0.2109375, 3.6494140625, 7.087890625, 10.5263671875, 13.96484375, 17.4033203125, 20.841796875, 24.2802734375, 27.71875, 31.1572265625, 34.595703125, 38.0341796875, 41.47265625, 44.9111328125, 48.349609375, 51.7880859375, 55.2265625, 58.6650390625, 62.103515625, 65.5419921875, 68.98046875, 72.4189453125, 75.857421875, 79.2958984375, 82.734375, 86.1728515625, 89.611328125, 93.0498046875, 96.48828125, 99.9267578125, 103.365234375, 106.8037109375, 110.2421875, 113.6806640625, 117.119140625, 120.5576171875, 123.99609375, 127.4345703125, 130.873046875, 134.3115234375, 137.75]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 2.0, 5.0, 8.0, 10.0, 18.0, 48.0, 40.0, 84.0, 139.0, 201.0, 353.0, 552.0, 706.0, 664.0, 464.0, 318.0, 163.0, 125.0, 56.0, 34.0, 20.0, 21.0, 16.0, 7.0, 4.0, 4.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.1484375, -6.88134765625, -6.6142578125, -6.34716796875, -6.080078125, -5.81298828125, -5.5458984375, -5.27880859375, -5.01171875, -4.74462890625, -4.4775390625, -4.21044921875, -3.943359375, -3.67626953125, -3.4091796875, -3.14208984375, -2.875, -2.60791015625, -2.3408203125, -2.07373046875, -1.806640625, -1.53955078125, -1.2724609375, -1.00537109375, -0.73828125, -0.47119140625, -0.2041015625, 0.06298828125, 0.330078125, 0.59716796875, 0.8642578125, 1.13134765625, 1.3984375, 1.66552734375, 1.9326171875, 2.19970703125, 2.466796875, 2.73388671875, 3.0009765625, 3.26806640625, 3.53515625, 3.80224609375, 4.0693359375, 4.33642578125, 4.603515625, 4.87060546875, 5.1376953125, 5.40478515625, 5.671875, 5.93896484375, 6.2060546875, 6.47314453125, 6.740234375, 7.00732421875, 7.2744140625, 7.54150390625, 7.80859375, 8.07568359375, 8.3427734375, 8.60986328125, 8.876953125, 9.14404296875, 9.4111328125, 9.67822265625, 9.9453125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 5.0, 18.0, 36.0, 81.0, 141.0, 194.0, 196.0, 151.0, 99.0, 35.0, 30.0, 11.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.2865219116211, -73.78534698486328, -72.2841796875, -70.78300476074219, -69.2818374633789, -67.7806625366211, -66.27949523925781, -64.7783203125, -63.27714920043945, -61.775978088378906, -60.27480697631836, -58.77363586425781, -57.2724609375, -55.77128982543945, -54.270118713378906, -52.76894760131836, -51.26777648925781, -49.766605377197266, -48.26543426513672, -46.76426315307617, -45.263092041015625, -43.76191711425781, -42.260746002197266, -40.75957489013672, -39.25840377807617, -37.757232666015625, -36.25606155395508, -34.75489044189453, -33.25371551513672, -31.752546310424805, -30.251373291015625, -28.750202178955078, -27.249034881591797, -25.74786376953125, -24.246692657470703, -22.745519638061523, -21.244348526000977, -19.74317741394043, -18.24200439453125, -16.740833282470703, -15.239662170410156, -13.73849105834961, -12.237318992614746, -10.736146926879883, -9.234975814819336, -7.733804225921631, -6.232632637023926, -4.7314605712890625, -3.2302894592285156, -1.7291178703308105, -0.22794628143310547, 1.2732253074645996, 2.7743968963623047, 4.27556848526001, 5.776740074157715, 7.277912139892578, 8.779083251953125, 10.280254364013672, 11.781426429748535, 13.282598495483398, 14.783769607543945, 16.284940719604492, 17.786113739013672, 19.28728485107422, 20.788455963134766]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 7.0, 7.0, 12.0, 20.0, 26.0, 25.0, 52.0, 54.0, 71.0, 64.0, 85.0, 100.0, 79.0, 85.0, 73.0, 72.0, 44.0, 31.0, 32.0, 25.0, 19.0, 15.0, 6.0, 8.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.36582946777344, -32.552520751953125, -31.739215850830078, -30.9259090423584, -30.11260223388672, -29.299293518066406, -28.485986709594727, -27.672679901123047, -26.859373092651367, -26.046066284179688, -25.232759475708008, -24.419452667236328, -23.606143951416016, -22.79283905029297, -21.979530334472656, -21.166223526000977, -20.352916717529297, -19.539609909057617, -18.726303100585938, -17.912996292114258, -17.099689483642578, -16.286380767822266, -15.473073959350586, -14.659767150878906, -13.846460342407227, -13.033153533935547, -12.219846725463867, -11.406538963317871, -10.593232154846191, -9.779925346374512, -8.966617584228516, -8.153310775756836, -7.340003967285156, -6.526697158813477, -5.713389873504639, -4.900082588195801, -4.086775779724121, -3.2734689712524414, -2.4601616859436035, -1.6468544006347656, -0.8335475921630859, -0.02024054527282715, 0.7930665016174316, 1.6063735485076904, 2.419680595397949, 3.232987403869629, 4.046294689178467, 4.859601974487305, 5.672908782958984, 6.486215591430664, 7.299522876739502, 8.11283016204834, 8.92613697052002, 9.7394437789917, 10.552751541137695, 11.366058349609375, 12.179365158081055, 12.992671966552734, 13.805978775024414, 14.61928653717041, 15.43259334564209, 16.245899200439453, 17.059207916259766, 17.872514724731445, 18.685821533203125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 5.0, 7.0, 7.0, 17.0, 28.0, 31.0, 75.0, 167.0, 361.0, 1021.0, 3311.0, 17096.0, 417710.0, 579764.0, 23284.0, 3746.0, 1147.0, 431.0, 160.0, 73.0, 35.0, 24.0, 15.0, 12.0, 9.0, 5.0, 6.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.51171875, -6.25189208984375, -5.9920654296875, -5.73223876953125, -5.472412109375, -5.21258544921875, -4.9527587890625, -4.69293212890625, -4.43310546875, -4.17327880859375, -3.9134521484375, -3.65362548828125, -3.393798828125, -3.13397216796875, -2.8741455078125, -2.61431884765625, -2.3544921875, -2.09466552734375, -1.8348388671875, -1.57501220703125, -1.315185546875, -1.05535888671875, -0.7955322265625, -0.53570556640625, -0.27587890625, -0.01605224609375, 0.2437744140625, 0.50360107421875, 0.763427734375, 1.02325439453125, 1.2830810546875, 1.54290771484375, 1.802734375, 2.06256103515625, 2.3223876953125, 2.58221435546875, 2.842041015625, 3.10186767578125, 3.3616943359375, 3.62152099609375, 3.88134765625, 4.14117431640625, 4.4010009765625, 4.66082763671875, 4.920654296875, 5.18048095703125, 5.4403076171875, 5.70013427734375, 5.9599609375, 6.21978759765625, 6.4796142578125, 6.73944091796875, 6.999267578125, 7.25909423828125, 7.5189208984375, 7.77874755859375, 8.03857421875, 8.29840087890625, 8.5582275390625, 8.81805419921875, 9.077880859375, 9.33770751953125, 9.5975341796875, 9.85736083984375, 10.1171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 5.0, 12.0, 14.0, 26.0, 45.0, 59.0, 78.0, 87.0, 123.0, 102.0, 114.0, 102.0, 82.0, 45.0, 34.0, 36.0, 20.0, 10.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.078125, -25.43505859375, -24.7919921875, -24.14892578125, -23.505859375, -22.86279296875, -22.2197265625, -21.57666015625, -20.93359375, -20.29052734375, -19.6474609375, -19.00439453125, -18.361328125, -17.71826171875, -17.0751953125, -16.43212890625, -15.7890625, -15.14599609375, -14.5029296875, -13.85986328125, -13.216796875, -12.57373046875, -11.9306640625, -11.28759765625, -10.64453125, -10.00146484375, -9.3583984375, -8.71533203125, -8.072265625, -7.42919921875, -6.7861328125, -6.14306640625, -5.5, -4.85693359375, -4.2138671875, -3.57080078125, -2.927734375, -2.28466796875, -1.6416015625, -0.99853515625, -0.35546875, 0.28759765625, 0.9306640625, 1.57373046875, 2.216796875, 2.85986328125, 3.5029296875, 4.14599609375, 4.7890625, 5.43212890625, 6.0751953125, 6.71826171875, 7.361328125, 8.00439453125, 8.6474609375, 9.29052734375, 9.93359375, 10.57666015625, 11.2197265625, 11.86279296875, 12.505859375, 13.14892578125, 13.7919921875, 14.43505859375, 15.078125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 10.0, 7.0, 14.0, 21.0, 30.0, 46.0, 75.0, 108.0, 146.0, 242.0, 353.0, 557.0, 884.0, 1508.0, 2604.0, 4910.0, 9267.0, 17937.0, 35106.0, 68445.0, 127558.0, 201401.0, 221749.0, 162271.0, 93088.0, 47981.0, 24585.0, 12416.0, 6483.0, 3522.0, 1999.0, 1176.0, 696.0, 459.0, 291.0, 184.0, 131.0, 93.0, 77.0, 46.0, 27.0, 13.0, 12.0, 11.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.9755859375, -0.9422149658203125, -0.908843994140625, -0.8754730224609375, -0.84210205078125, -0.8087310791015625, -0.775360107421875, -0.7419891357421875, -0.7086181640625, -0.6752471923828125, -0.641876220703125, -0.6085052490234375, -0.57513427734375, -0.5417633056640625, -0.508392333984375, -0.4750213623046875, -0.441650390625, -0.4082794189453125, -0.374908447265625, -0.3415374755859375, -0.30816650390625, -0.2747955322265625, -0.241424560546875, -0.2080535888671875, -0.1746826171875, -0.1413116455078125, -0.107940673828125, -0.0745697021484375, -0.04119873046875, -0.0078277587890625, 0.025543212890625, 0.0589141845703125, 0.09228515625, 0.1256561279296875, 0.159027099609375, 0.1923980712890625, 0.22576904296875, 0.2591400146484375, 0.292510986328125, 0.3258819580078125, 0.3592529296875, 0.3926239013671875, 0.425994873046875, 0.4593658447265625, 0.49273681640625, 0.5261077880859375, 0.559478759765625, 0.5928497314453125, 0.626220703125, 0.6595916748046875, 0.692962646484375, 0.7263336181640625, 0.75970458984375, 0.7930755615234375, 0.826446533203125, 0.8598175048828125, 0.8931884765625, 0.9265594482421875, 0.959930419921875, 0.9933013916015625, 1.02667236328125, 1.0600433349609375, 1.093414306640625, 1.1267852783203125, 1.16015625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 7.0, 5.0, 10.0, 12.0, 16.0, 18.0, 27.0, 38.0, 33.0, 37.0, 47.0, 55.0, 70.0, 62.0, 52.0, 60.0, 61.0, 53.0, 54.0, 49.0, 42.0, 41.0, 25.0, 36.0, 18.0, 18.0, 14.0, 11.0, 6.0, 12.0, 3.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-20.640625, -20.0166015625, -19.392578125, -18.7685546875, -18.14453125, -17.5205078125, -16.896484375, -16.2724609375, -15.6484375, -15.0244140625, -14.400390625, -13.7763671875, -13.15234375, -12.5283203125, -11.904296875, -11.2802734375, -10.65625, -10.0322265625, -9.408203125, -8.7841796875, -8.16015625, -7.5361328125, -6.912109375, -6.2880859375, -5.6640625, -5.0400390625, -4.416015625, -3.7919921875, -3.16796875, -2.5439453125, -1.919921875, -1.2958984375, -0.671875, -0.0478515625, 0.576171875, 1.2001953125, 1.82421875, 2.4482421875, 3.072265625, 3.6962890625, 4.3203125, 4.9443359375, 5.568359375, 6.1923828125, 6.81640625, 7.4404296875, 8.064453125, 8.6884765625, 9.3125, 9.9365234375, 10.560546875, 11.1845703125, 11.80859375, 12.4326171875, 13.056640625, 13.6806640625, 14.3046875, 14.9287109375, 15.552734375, 16.1767578125, 16.80078125, 17.4248046875, 18.048828125, 18.6728515625, 19.296875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 14.0, 24.0, 36.0, 66.0, 69.0, 151.0, 249.0, 432.0, 803.0, 1677.0, 3301.0, 7982.0, 22409.0, 96641.0, 493557.0, 336498.0, 57870.0, 15525.0, 5907.0, 2511.0, 1269.0, 642.0, 381.0, 209.0, 129.0, 65.0, 46.0, 24.0, 17.0, 11.0, 8.0, 4.0, 5.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.289306640625, -0.2796134948730469, -0.26992034912109375, -0.2602272033691406, -0.2505340576171875, -0.24084091186523438, -0.23114776611328125, -0.22145462036132812, -0.211761474609375, -0.20206832885742188, -0.19237518310546875, -0.18268203735351562, -0.1729888916015625, -0.16329574584960938, -0.15360260009765625, -0.14390945434570312, -0.13421630859375, -0.12452316284179688, -0.11483001708984375, -0.10513687133789062, -0.0954437255859375, -0.08575057983398438, -0.07605743408203125, -0.06636428833007812, -0.056671142578125, -0.046977996826171875, -0.03728485107421875, -0.027591705322265625, -0.0178985595703125, -0.008205413818359375, 0.00148773193359375, 0.011180877685546875, 0.0208740234375, 0.030567169189453125, 0.04026031494140625, 0.049953460693359375, 0.0596466064453125, 0.06933975219726562, 0.07903289794921875, 0.08872604370117188, 0.098419189453125, 0.10811233520507812, 0.11780548095703125, 0.12749862670898438, 0.1371917724609375, 0.14688491821289062, 0.15657806396484375, 0.16627120971679688, 0.17596435546875, 0.18565750122070312, 0.19535064697265625, 0.20504379272460938, 0.2147369384765625, 0.22443008422851562, 0.23412322998046875, 0.24381637573242188, 0.253509521484375, 0.2632026672363281, 0.27289581298828125, 0.2825889587402344, 0.2922821044921875, 0.3019752502441406, 0.31166839599609375, 0.3213615417480469, 0.3310546875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 2.0, 9.0, 7.0, 8.0, 4.0, 14.0, 11.0, 32.0, 47.0, 54.0, 113.0, 135.0, 169.0, 127.0, 81.0, 57.0, 43.0, 26.0, 23.0, 14.0, 12.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003018379211425781, -0.00029334239661693573, -0.00028484687209129333, -0.00027635134756565094, -0.00026785582304000854, -0.00025936029851436615, -0.00025086477398872375, -0.00024236924946308136, -0.00023387372493743896, -0.00022537820041179657, -0.00021688267588615417, -0.00020838715136051178, -0.00019989162683486938, -0.000191396102309227, -0.0001829005777835846, -0.0001744050532579422, -0.0001659095287322998, -0.0001574140042066574, -0.00014891847968101501, -0.00014042295515537262, -0.00013192743062973022, -0.00012343190610408783, -0.00011493638157844543, -0.00010644085705280304, -9.794533252716064e-05, -8.944980800151825e-05, -8.095428347587585e-05, -7.245875895023346e-05, -6.396323442459106e-05, -5.546770989894867e-05, -4.6972185373306274e-05, -3.847666084766388e-05, -2.9981136322021484e-05, -2.148561179637909e-05, -1.2990087270736694e-05, -4.494562745094299e-06, 4.000961780548096e-06, 1.249648630619049e-05, 2.0992010831832886e-05, 2.948753535747528e-05, 3.7983059883117676e-05, 4.647858440876007e-05, 5.4974108934402466e-05, 6.346963346004486e-05, 7.196515798568726e-05, 8.046068251132965e-05, 8.895620703697205e-05, 9.745173156261444e-05, 0.00010594725608825684, 0.00011444278061389923, 0.00012293830513954163, 0.00013143382966518402, 0.00013992935419082642, 0.0001484248787164688, 0.0001569204032421112, 0.0001654159277677536, 0.000173911452293396, 0.0001824069768190384, 0.00019090250134468079, 0.00019939802587032318, 0.00020789355039596558, 0.00021638907492160797, 0.00022488459944725037, 0.00023338012397289276, 0.00024187564849853516]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 6.0, 3.0, 6.0, 11.0, 16.0, 31.0, 43.0, 40.0, 75.0, 102.0, 140.0, 233.0, 331.0, 552.0, 880.0, 1376.0, 2276.0, 4112.0, 7864.0, 18476.0, 66679.0, 353047.0, 453081.0, 95335.0, 23242.0, 9073.0, 4566.0, 2656.0, 1556.0, 1004.0, 608.0, 339.0, 260.0, 188.0, 120.0, 70.0, 43.0, 38.0, 14.0, 16.0, 13.0, 9.0, 6.0, 4.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.29931640625, -0.29027557373046875, -0.2812347412109375, -0.27219390869140625, -0.263153076171875, -0.25411224365234375, -0.2450714111328125, -0.23603057861328125, -0.22698974609375, -0.21794891357421875, -0.2089080810546875, -0.19986724853515625, -0.190826416015625, -0.18178558349609375, -0.1727447509765625, -0.16370391845703125, -0.1546630859375, -0.14562225341796875, -0.1365814208984375, -0.12754058837890625, -0.118499755859375, -0.10945892333984375, -0.1004180908203125, -0.09137725830078125, -0.08233642578125, -0.07329559326171875, -0.0642547607421875, -0.05521392822265625, -0.046173095703125, -0.03713226318359375, -0.0280914306640625, -0.01905059814453125, -0.010009765625, -0.00096893310546875, 0.0080718994140625, 0.01711273193359375, 0.026153564453125, 0.03519439697265625, 0.0442352294921875, 0.05327606201171875, 0.06231689453125, 0.07135772705078125, 0.0803985595703125, 0.08943939208984375, 0.098480224609375, 0.10752105712890625, 0.1165618896484375, 0.12560272216796875, 0.1346435546875, 0.14368438720703125, 0.1527252197265625, 0.16176605224609375, 0.170806884765625, 0.17984771728515625, 0.1888885498046875, 0.19792938232421875, 0.20697021484375, 0.21601104736328125, 0.2250518798828125, 0.23409271240234375, 0.243133544921875, 0.25217437744140625, 0.2612152099609375, 0.27025604248046875, 0.279296875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 10.0, 4.0, 0.0, 4.0, 6.0, 5.0, 4.0, 15.0, 6.0, 7.0, 24.0, 29.0, 38.0, 80.0, 98.0, 129.0, 135.0, 139.0, 94.0, 67.0, 38.0, 25.0, 7.0, 13.0, 9.0, 6.0, 4.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11907958984375, -0.1158905029296875, -0.112701416015625, -0.1095123291015625, -0.1063232421875, -0.1031341552734375, -0.099945068359375, -0.0967559814453125, -0.09356689453125, -0.0903778076171875, -0.087188720703125, -0.0839996337890625, -0.080810546875, -0.0776214599609375, -0.074432373046875, -0.0712432861328125, -0.06805419921875, -0.0648651123046875, -0.061676025390625, -0.0584869384765625, -0.0552978515625, -0.0521087646484375, -0.048919677734375, -0.0457305908203125, -0.04254150390625, -0.0393524169921875, -0.036163330078125, -0.0329742431640625, -0.02978515625, -0.0265960693359375, -0.023406982421875, -0.0202178955078125, -0.01702880859375, -0.0138397216796875, -0.010650634765625, -0.0074615478515625, -0.0042724609375, -0.0010833740234375, 0.002105712890625, 0.0052947998046875, 0.00848388671875, 0.0116729736328125, 0.014862060546875, 0.0180511474609375, 0.021240234375, 0.0244293212890625, 0.027618408203125, 0.0308074951171875, 0.03399658203125, 0.0371856689453125, 0.040374755859375, 0.0435638427734375, 0.0467529296875, 0.0499420166015625, 0.053131103515625, 0.0563201904296875, 0.05950927734375, 0.0626983642578125, 0.065887451171875, 0.0690765380859375, 0.072265625, 0.0754547119140625, 0.078643798828125, 0.0818328857421875, 0.08502197265625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 8.0, 34.0, 55.0, 127.0, 191.0, 205.0, 168.0, 108.0, 49.0, 25.0, 17.0, 9.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.25265884399414, -41.35907745361328, -40.46549987792969, -39.571922302246094, -38.678340911865234, -37.784759521484375, -36.89118194580078, -35.99760437011719, -35.10402297973633, -34.21044158935547, -33.316864013671875, -32.42328643798828, -31.529705047607422, -30.636125564575195, -29.74254608154297, -28.848966598510742, -27.955387115478516, -27.06180763244629, -26.168228149414062, -25.274648666381836, -24.38106918334961, -23.487489700317383, -22.593910217285156, -21.70033073425293, -20.806751251220703, -19.913171768188477, -19.01959228515625, -18.126012802124023, -17.232433319091797, -16.33885383605957, -15.445274353027344, -14.551694869995117, -13.658116340637207, -12.76453685760498, -11.870957374572754, -10.977377891540527, -10.0837984085083, -9.190218925476074, -8.296639442443848, -7.403059959411621, -6.5094804763793945, -5.615900993347168, -4.722321510314941, -3.828742027282715, -2.9351625442504883, -2.0415830612182617, -1.1480035781860352, -0.2544240951538086, 0.639155387878418, 1.5327348709106445, 2.426314353942871, 3.3198938369750977, 4.213473320007324, 5.107052803039551, 6.000632286071777, 6.894211769104004, 7.7877912521362305, 8.681370735168457, 9.574950218200684, 10.46852970123291, 11.362109184265137, 12.255688667297363, 13.14926815032959, 14.042847633361816, 14.936427116394043]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 7.0, 12.0, 25.0, 28.0, 37.0, 73.0, 81.0, 90.0, 122.0, 118.0, 109.0, 100.0, 71.0, 35.0, 40.0, 26.0, 17.0, 13.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.878023147583008, -26.242292404174805, -25.60655975341797, -24.970829010009766, -24.335098266601562, -23.699365615844727, -23.063634872436523, -22.427902221679688, -21.792171478271484, -21.15644073486328, -20.520708084106445, -19.884977340698242, -19.249244689941406, -18.613513946533203, -17.977783203125, -17.342052459716797, -16.70631980895996, -16.070589065551758, -15.434856414794922, -14.799125671386719, -14.1633939743042, -13.52766227722168, -12.891931533813477, -12.256199836730957, -11.620468139648438, -10.984736442565918, -10.349004745483398, -9.713274002075195, -9.077542304992676, -8.441810607910156, -7.806079387664795, -7.170348167419434, -6.5346174240112305, -5.898885726928711, -5.26315450668335, -4.627423286437988, -3.9916915893554688, -3.3559601306915283, -2.720228672027588, -2.0844974517822266, -1.448765754699707, -0.8130342960357666, -0.17730283737182617, 0.45842862129211426, 1.0941600799560547, 1.7298915386199951, 2.3656229972839355, 3.001354217529297, 3.6370859146118164, 4.272817611694336, 4.908548831939697, 5.544280052185059, 6.180011749267578, 6.815743446350098, 7.451474666595459, 8.08720588684082, 8.72293758392334, 9.35866928100586, 9.994400024414062, 10.630131721496582, 11.265863418579102, 11.901595115661621, 12.53732681274414, 13.173057556152344, 13.808789253234863]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 6.0, 9.0, 15.0, 26.0, 30.0, 63.0, 145.0, 306.0, 716.0, 2039.0, 6820.0, 24181.0, 100812.0, 436202.0, 368243.0, 80450.0, 19901.0, 5658.0, 1763.0, 631.0, 269.0, 113.0, 60.0, 35.0, 20.0, 12.0, 8.0, 7.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.6015625, -10.2890625, -9.9765625, -9.6640625, -9.3515625, -9.0390625, -8.7265625, -8.4140625, -8.1015625, -7.7890625, -7.4765625, -7.1640625, -6.8515625, -6.5390625, -6.2265625, -5.9140625, -5.6015625, -5.2890625, -4.9765625, -4.6640625, -4.3515625, -4.0390625, -3.7265625, -3.4140625, -3.1015625, -2.7890625, -2.4765625, -2.1640625, -1.8515625, -1.5390625, -1.2265625, -0.9140625, -0.6015625, -0.2890625, 0.0234375, 0.3359375, 0.6484375, 0.9609375, 1.2734375, 1.5859375, 1.8984375, 2.2109375, 2.5234375, 2.8359375, 3.1484375, 3.4609375, 3.7734375, 4.0859375, 4.3984375, 4.7109375, 5.0234375, 5.3359375, 5.6484375, 5.9609375, 6.2734375, 6.5859375, 6.8984375, 7.2109375, 7.5234375, 7.8359375, 8.1484375, 8.4609375, 8.7734375, 9.0859375, 9.3984375]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 9.0, 10.0, 15.0, 30.0, 35.0, 42.0, 50.0, 52.0, 67.0, 72.0, 83.0, 91.0, 78.0, 87.0, 57.0, 47.0, 51.0, 30.0, 23.0, 19.0, 13.0, 15.0, 10.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.5, -29.63232421875, -28.7646484375, -27.89697265625, -27.029296875, -26.16162109375, -25.2939453125, -24.42626953125, -23.55859375, -22.69091796875, -21.8232421875, -20.95556640625, -20.087890625, -19.22021484375, -18.3525390625, -17.48486328125, -16.6171875, -15.74951171875, -14.8818359375, -14.01416015625, -13.146484375, -12.27880859375, -11.4111328125, -10.54345703125, -9.67578125, -8.80810546875, -7.9404296875, -7.07275390625, -6.205078125, -5.33740234375, -4.4697265625, -3.60205078125, -2.734375, -1.86669921875, -0.9990234375, -0.13134765625, 0.736328125, 1.60400390625, 2.4716796875, 3.33935546875, 4.20703125, 5.07470703125, 5.9423828125, 6.81005859375, 7.677734375, 8.54541015625, 9.4130859375, 10.28076171875, 11.1484375, 12.01611328125, 12.8837890625, 13.75146484375, 14.619140625, 15.48681640625, 16.3544921875, 17.22216796875, 18.08984375, 18.95751953125, 19.8251953125, 20.69287109375, 21.560546875, 22.42822265625, 23.2958984375, 24.16357421875, 25.03125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 1.0, 9.0, 7.0, 9.0, 12.0, 17.0, 12.0, 18.0, 26.0, 28.0, 28.0, 20.0, 26.0, 37.0, 30.0, 33.0, 55.0, 90.0, 183.0, 3714.0, 1034959.0, 8647.0, 203.0, 61.0, 40.0, 31.0, 42.0, 31.0, 26.0, 24.0, 21.0, 16.0, 17.0, 11.0, 13.0, 13.0, 7.0, 11.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-65.625, -63.5458984375, -61.466796875, -59.3876953125, -57.30859375, -55.2294921875, -53.150390625, -51.0712890625, -48.9921875, -46.9130859375, -44.833984375, -42.7548828125, -40.67578125, -38.5966796875, -36.517578125, -34.4384765625, -32.359375, -30.2802734375, -28.201171875, -26.1220703125, -24.04296875, -21.9638671875, -19.884765625, -17.8056640625, -15.7265625, -13.6474609375, -11.568359375, -9.4892578125, -7.41015625, -5.3310546875, -3.251953125, -1.1728515625, 0.90625, 2.9853515625, 5.064453125, 7.1435546875, 9.22265625, 11.3017578125, 13.380859375, 15.4599609375, 17.5390625, 19.6181640625, 21.697265625, 23.7763671875, 25.85546875, 27.9345703125, 30.013671875, 32.0927734375, 34.171875, 36.2509765625, 38.330078125, 40.4091796875, 42.48828125, 44.5673828125, 46.646484375, 48.7255859375, 50.8046875, 52.8837890625, 54.962890625, 57.0419921875, 59.12109375, 61.2001953125, 63.279296875, 65.3583984375, 67.4375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 3.0, 9.0, 4.0, 8.0, 13.0, 11.0, 8.0, 10.0, 21.0, 20.0, 17.0, 30.0, 34.0, 24.0, 22.0, 37.0, 37.0, 31.0, 46.0, 41.0, 44.0, 36.0, 39.0, 39.0, 41.0, 38.0, 35.0, 32.0, 26.0, 30.0, 33.0, 28.0, 25.0, 16.0, 18.0, 23.0, 10.0, 12.0, 7.0, 9.0, 7.0, 10.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-15.015625, -14.525634765625, -14.03564453125, -13.545654296875, -13.0556640625, -12.565673828125, -12.07568359375, -11.585693359375, -11.095703125, -10.605712890625, -10.11572265625, -9.625732421875, -9.1357421875, -8.645751953125, -8.15576171875, -7.665771484375, -7.17578125, -6.685791015625, -6.19580078125, -5.705810546875, -5.2158203125, -4.725830078125, -4.23583984375, -3.745849609375, -3.255859375, -2.765869140625, -2.27587890625, -1.785888671875, -1.2958984375, -0.805908203125, -0.31591796875, 0.174072265625, 0.6640625, 1.154052734375, 1.64404296875, 2.134033203125, 2.6240234375, 3.114013671875, 3.60400390625, 4.093994140625, 4.583984375, 5.073974609375, 5.56396484375, 6.053955078125, 6.5439453125, 7.033935546875, 7.52392578125, 8.013916015625, 8.50390625, 8.993896484375, 9.48388671875, 9.973876953125, 10.4638671875, 10.953857421875, 11.44384765625, 11.933837890625, 12.423828125, 12.913818359375, 13.40380859375, 13.893798828125, 14.3837890625, 14.873779296875, 15.36376953125, 15.853759765625, 16.34375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 5.0, 8.0, 21.0, 21.0, 28.0, 64.0, 160.0, 463.0, 1719.0, 13152.0, 704624.0, 318600.0, 7729.0, 1276.0, 388.0, 133.0, 72.0, 36.0, 18.0, 11.0, 10.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4765625, -11.147705078125, -10.81884765625, -10.489990234375, -10.1611328125, -9.832275390625, -9.50341796875, -9.174560546875, -8.845703125, -8.516845703125, -8.18798828125, -7.859130859375, -7.5302734375, -7.201416015625, -6.87255859375, -6.543701171875, -6.21484375, -5.885986328125, -5.55712890625, -5.228271484375, -4.8994140625, -4.570556640625, -4.24169921875, -3.912841796875, -3.583984375, -3.255126953125, -2.92626953125, -2.597412109375, -2.2685546875, -1.939697265625, -1.61083984375, -1.281982421875, -0.953125, -0.624267578125, -0.29541015625, 0.033447265625, 0.3623046875, 0.691162109375, 1.02001953125, 1.348876953125, 1.677734375, 2.006591796875, 2.33544921875, 2.664306640625, 2.9931640625, 3.322021484375, 3.65087890625, 3.979736328125, 4.30859375, 4.637451171875, 4.96630859375, 5.295166015625, 5.6240234375, 5.952880859375, 6.28173828125, 6.610595703125, 6.939453125, 7.268310546875, 7.59716796875, 7.926025390625, 8.2548828125, 8.583740234375, 8.91259765625, 9.241455078125, 9.5703125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 5.0, 8.0, 10.0, 23.0, 28.0, 39.0, 55.0, 102.0, 140.0, 152.0, 156.0, 105.0, 58.0, 39.0, 33.0, 20.0, 8.0, 7.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010709762573242188, -0.0010416507720947266, -0.0010123252868652344, -0.0009829998016357422, -0.00095367431640625, -0.0009243488311767578, -0.0008950233459472656, -0.0008656978607177734, -0.0008363723754882812, -0.0008070468902587891, -0.0007777214050292969, -0.0007483959197998047, -0.0007190704345703125, -0.0006897449493408203, -0.0006604194641113281, -0.0006310939788818359, -0.0006017684936523438, -0.0005724430084228516, -0.0005431175231933594, -0.0005137920379638672, -0.000484466552734375, -0.0004551410675048828, -0.0004258155822753906, -0.00039649009704589844, -0.00036716461181640625, -0.00033783912658691406, -0.0003085136413574219, -0.0002791881561279297, -0.0002498626708984375, -0.0002205371856689453, -0.00019121170043945312, -0.00016188621520996094, -0.00013256072998046875, -0.00010323524475097656, -7.390975952148438e-05, -4.458427429199219e-05, -1.52587890625e-05, 1.4066696166992188e-05, 4.3392181396484375e-05, 7.271766662597656e-05, 0.00010204315185546875, 0.00013136863708496094, 0.00016069412231445312, 0.0001900196075439453, 0.0002193450927734375, 0.0002486705780029297, 0.0002779960632324219, 0.00030732154846191406, 0.00033664703369140625, 0.00036597251892089844, 0.0003952980041503906, 0.0004246234893798828, 0.000453948974609375, 0.0004832744598388672, 0.0005125999450683594, 0.0005419254302978516, 0.0005712509155273438, 0.0006005764007568359, 0.0006299018859863281, 0.0006592273712158203, 0.0006885528564453125, 0.0007178783416748047, 0.0007472038269042969, 0.0007765293121337891, 0.0008058547973632812]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 9.0, 10.0, 13.0, 14.0, 26.0, 65.0, 81.0, 158.0, 256.0, 543.0, 1414.0, 5029.0, 27945.0, 266759.0, 650961.0, 80136.0, 10920.0, 2548.0, 826.0, 355.0, 213.0, 113.0, 61.0, 29.0, 21.0, 20.0, 5.0, 13.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.74609375, -5.58306884765625, -5.4200439453125, -5.25701904296875, -5.093994140625, -4.93096923828125, -4.7679443359375, -4.60491943359375, -4.44189453125, -4.27886962890625, -4.1158447265625, -3.95281982421875, -3.789794921875, -3.62677001953125, -3.4637451171875, -3.30072021484375, -3.1376953125, -2.97467041015625, -2.8116455078125, -2.64862060546875, -2.485595703125, -2.32257080078125, -2.1595458984375, -1.99652099609375, -1.83349609375, -1.67047119140625, -1.5074462890625, -1.34442138671875, -1.181396484375, -1.01837158203125, -0.8553466796875, -0.69232177734375, -0.529296875, -0.36627197265625, -0.2032470703125, -0.04022216796875, 0.122802734375, 0.28582763671875, 0.4488525390625, 0.61187744140625, 0.77490234375, 0.93792724609375, 1.1009521484375, 1.26397705078125, 1.427001953125, 1.59002685546875, 1.7530517578125, 1.91607666015625, 2.0791015625, 2.24212646484375, 2.4051513671875, 2.56817626953125, 2.731201171875, 2.89422607421875, 3.0572509765625, 3.22027587890625, 3.38330078125, 3.54632568359375, 3.7093505859375, 3.87237548828125, 4.035400390625, 4.19842529296875, 4.3614501953125, 4.52447509765625, 4.6875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 2.0, 7.0, 9.0, 15.0, 14.0, 22.0, 57.0, 51.0, 84.0, 129.0, 140.0, 108.0, 113.0, 78.0, 50.0, 32.0, 27.0, 18.0, 13.0, 11.0, 7.0, 6.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.46484375, -2.396087646484375, -2.32733154296875, -2.258575439453125, -2.1898193359375, -2.121063232421875, -2.05230712890625, -1.983551025390625, -1.914794921875, -1.846038818359375, -1.77728271484375, -1.708526611328125, -1.6397705078125, -1.571014404296875, -1.50225830078125, -1.433502197265625, -1.36474609375, -1.295989990234375, -1.22723388671875, -1.158477783203125, -1.0897216796875, -1.020965576171875, -0.95220947265625, -0.883453369140625, -0.814697265625, -0.745941162109375, -0.67718505859375, -0.608428955078125, -0.5396728515625, -0.470916748046875, -0.40216064453125, -0.333404541015625, -0.2646484375, -0.195892333984375, -0.12713623046875, -0.058380126953125, 0.0103759765625, 0.079132080078125, 0.14788818359375, 0.216644287109375, 0.285400390625, 0.354156494140625, 0.42291259765625, 0.491668701171875, 0.5604248046875, 0.629180908203125, 0.69793701171875, 0.766693115234375, 0.83544921875, 0.904205322265625, 0.97296142578125, 1.041717529296875, 1.1104736328125, 1.179229736328125, 1.24798583984375, 1.316741943359375, 1.385498046875, 1.454254150390625, 1.52301025390625, 1.591766357421875, 1.6605224609375, 1.729278564453125, 1.79803466796875, 1.866790771484375, 1.935546875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 2.0, 11.0, 34.0, 92.0, 206.0, 271.0, 209.0, 116.0, 45.0, 13.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-125.36949157714844, -123.02763366699219, -120.6857681274414, -118.34391021728516, -116.00204467773438, -113.66018676757812, -111.31832885742188, -108.9764633178711, -106.63460540771484, -104.2927474975586, -101.95088195800781, -99.60902404785156, -97.26715850830078, -94.92530059814453, -92.58343505859375, -90.2415771484375, -87.89971923828125, -85.557861328125, -83.21599578857422, -80.87413787841797, -78.53227233886719, -76.19041442871094, -73.84855651855469, -71.5066909790039, -69.16482543945312, -66.82296752929688, -64.4811019897461, -62.139244079589844, -59.79738235473633, -57.45552062988281, -55.1136589050293, -52.77179718017578, -50.429931640625, -48.088069915771484, -45.74620819091797, -43.40435028076172, -41.0624885559082, -38.72062683105469, -36.37876510620117, -34.036903381347656, -31.695045471191406, -29.35318374633789, -27.011323928833008, -24.669462203979492, -22.32760238647461, -19.985740661621094, -17.643878936767578, -15.302019119262695, -12.96015739440918, -10.61829662322998, -8.276435852050781, -5.934574127197266, -3.5927133560180664, -1.2508525848388672, 1.0910091400146484, 3.4328689575195312, 5.774730682373047, 8.116591453552246, 10.458452224731445, 12.800313949584961, 15.14217472076416, 17.48403549194336, 19.825897216796875, 22.167757034301758, 24.509618759155273]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 8.0, 13.0, 6.0, 8.0, 23.0, 31.0, 39.0, 34.0, 59.0, 58.0, 50.0, 71.0, 68.0, 57.0, 53.0, 46.0, 49.0, 59.0, 46.0, 55.0, 34.0, 29.0, 23.0, 15.0, 16.0, 17.0, 13.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.14080810546875, -37.02959060668945, -35.918373107910156, -34.80715560913086, -33.69593811035156, -32.584720611572266, -31.473501205444336, -30.36228370666504, -29.251066207885742, -28.139848709106445, -27.02863121032715, -25.91741371154785, -24.806194305419922, -23.694976806640625, -22.583759307861328, -21.47254180908203, -20.361324310302734, -19.250106811523438, -18.13888931274414, -17.027671813964844, -15.91645336151123, -14.805235862731934, -13.69401741027832, -12.582799911499023, -11.471582412719727, -10.36036491394043, -9.249147415161133, -8.13792896270752, -7.026711463928223, -5.915493965148926, -4.804275989532471, -3.6930580139160156, -2.581836700439453, -1.4706189632415771, -0.35940122604370117, 0.7518165111541748, 1.8630342483520508, 2.9742517471313477, 4.085469722747803, 5.196687698364258, 6.307905197143555, 7.419122695922852, 8.530340194702148, 9.641558647155762, 10.752776145935059, 11.863993644714355, 12.975212097167969, 14.086429595947266, 15.197647094726562, 16.30886459350586, 17.420082092285156, 18.531299591064453, 19.64251708984375, 20.753734588623047, 21.864953994750977, 22.976171493530273, 24.08738899230957, 25.198606491088867, 26.309823989868164, 27.42104148864746, 28.53226089477539, 29.643478393554688, 30.754695892333984, 31.86591339111328, 32.97713088989258]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 4.0, 3.0, 5.0, 11.0, 10.0, 21.0, 14.0, 30.0, 39.0, 47.0, 76.0, 101.0, 154.0, 240.0, 514.0, 1117.0, 3126.0, 12069.0, 70926.0, 614218.0, 2406646.0, 942211.0, 115511.0, 18275.0, 4610.0, 1978.0, 1114.0, 555.0, 228.0, 126.0, 78.0, 53.0, 48.0, 32.0, 22.0, 9.0, 15.0, 12.0, 7.0, 4.0, 0.0, 2.0, 2.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.6875, -21.0224609375, -20.357421875, -19.6923828125, -19.02734375, -18.3623046875, -17.697265625, -17.0322265625, -16.3671875, -15.7021484375, -15.037109375, -14.3720703125, -13.70703125, -13.0419921875, -12.376953125, -11.7119140625, -11.046875, -10.3818359375, -9.716796875, -9.0517578125, -8.38671875, -7.7216796875, -7.056640625, -6.3916015625, -5.7265625, -5.0615234375, -4.396484375, -3.7314453125, -3.06640625, -2.4013671875, -1.736328125, -1.0712890625, -0.40625, 0.2587890625, 0.923828125, 1.5888671875, 2.25390625, 2.9189453125, 3.583984375, 4.2490234375, 4.9140625, 5.5791015625, 6.244140625, 6.9091796875, 7.57421875, 8.2392578125, 8.904296875, 9.5693359375, 10.234375, 10.8994140625, 11.564453125, 12.2294921875, 12.89453125, 13.5595703125, 14.224609375, 14.8896484375, 15.5546875, 16.2197265625, 16.884765625, 17.5498046875, 18.21484375, 18.8798828125, 19.544921875, 20.2099609375, 20.875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 5.0, 13.0, 25.0, 35.0, 33.0, 69.0, 92.0, 106.0, 118.0, 113.0, 104.0, 81.0, 71.0, 47.0, 34.0, 25.0, 17.0, 8.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.84375, -34.99072265625, -34.1376953125, -33.28466796875, -32.431640625, -31.57861328125, -30.7255859375, -29.87255859375, -29.01953125, -28.16650390625, -27.3134765625, -26.46044921875, -25.607421875, -24.75439453125, -23.9013671875, -23.04833984375, -22.1953125, -21.34228515625, -20.4892578125, -19.63623046875, -18.783203125, -17.93017578125, -17.0771484375, -16.22412109375, -15.37109375, -14.51806640625, -13.6650390625, -12.81201171875, -11.958984375, -11.10595703125, -10.2529296875, -9.39990234375, -8.546875, -7.69384765625, -6.8408203125, -5.98779296875, -5.134765625, -4.28173828125, -3.4287109375, -2.57568359375, -1.72265625, -0.86962890625, -0.0166015625, 0.83642578125, 1.689453125, 2.54248046875, 3.3955078125, 4.24853515625, 5.1015625, 5.95458984375, 6.8076171875, 7.66064453125, 8.513671875, 9.36669921875, 10.2197265625, 11.07275390625, 11.92578125, 12.77880859375, 13.6318359375, 14.48486328125, 15.337890625, 16.19091796875, 17.0439453125, 17.89697265625, 18.75]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 8.0, 8.0, 20.0, 19.0, 29.0, 63.0, 105.0, 249.0, 928.0, 7382.0, 379438.0, 3754704.0, 47897.0, 2630.0, 476.0, 135.0, 61.0, 36.0, 29.0, 9.0, 16.0, 12.0, 1.0, 3.0, 5.0, 0.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.625, -39.18896484375, -37.7529296875, -36.31689453125, -34.880859375, -33.44482421875, -32.0087890625, -30.57275390625, -29.13671875, -27.70068359375, -26.2646484375, -24.82861328125, -23.392578125, -21.95654296875, -20.5205078125, -19.08447265625, -17.6484375, -16.21240234375, -14.7763671875, -13.34033203125, -11.904296875, -10.46826171875, -9.0322265625, -7.59619140625, -6.16015625, -4.72412109375, -3.2880859375, -1.85205078125, -0.416015625, 1.02001953125, 2.4560546875, 3.89208984375, 5.328125, 6.76416015625, 8.2001953125, 9.63623046875, 11.072265625, 12.50830078125, 13.9443359375, 15.38037109375, 16.81640625, 18.25244140625, 19.6884765625, 21.12451171875, 22.560546875, 23.99658203125, 25.4326171875, 26.86865234375, 28.3046875, 29.74072265625, 31.1767578125, 32.61279296875, 34.048828125, 35.48486328125, 36.9208984375, 38.35693359375, 39.79296875, 41.22900390625, 42.6650390625, 44.10107421875, 45.537109375, 46.97314453125, 48.4091796875, 49.84521484375, 51.28125]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 2.0, 6.0, 9.0, 8.0, 14.0, 25.0, 32.0, 46.0, 74.0, 106.0, 160.0, 293.0, 411.0, 575.0, 631.0, 568.0, 391.0, 242.0, 144.0, 98.0, 72.0, 43.0, 33.0, 23.0, 17.0, 12.0, 7.0, 7.0, 9.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8671875, -6.6334228515625, -6.399658203125, -6.1658935546875, -5.93212890625, -5.6983642578125, -5.464599609375, -5.2308349609375, -4.9970703125, -4.7633056640625, -4.529541015625, -4.2957763671875, -4.06201171875, -3.8282470703125, -3.594482421875, -3.3607177734375, -3.126953125, -2.8931884765625, -2.659423828125, -2.4256591796875, -2.19189453125, -1.9581298828125, -1.724365234375, -1.4906005859375, -1.2568359375, -1.0230712890625, -0.789306640625, -0.5555419921875, -0.32177734375, -0.0880126953125, 0.145751953125, 0.3795166015625, 0.61328125, 0.8470458984375, 1.080810546875, 1.3145751953125, 1.54833984375, 1.7821044921875, 2.015869140625, 2.2496337890625, 2.4833984375, 2.7171630859375, 2.950927734375, 3.1846923828125, 3.41845703125, 3.6522216796875, 3.885986328125, 4.1197509765625, 4.353515625, 4.5872802734375, 4.821044921875, 5.0548095703125, 5.28857421875, 5.5223388671875, 5.756103515625, 5.9898681640625, 6.2236328125, 6.4573974609375, 6.691162109375, 6.9249267578125, 7.15869140625, 7.3924560546875, 7.626220703125, 7.8599853515625, 8.09375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 9.0, 5.0, 9.0, 14.0, 16.0, 18.0, 29.0, 38.0, 34.0, 61.0, 66.0, 61.0, 76.0, 53.0, 75.0, 74.0, 64.0, 54.0, 44.0, 39.0, 30.0, 40.0, 17.0, 19.0, 14.0, 13.0, 6.0, 3.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0], "bins": [-23.817901611328125, -23.27366065979004, -22.72941780090332, -22.185176849365234, -21.64093589782715, -21.09669303894043, -20.552452087402344, -20.008211135864258, -19.46396827697754, -18.919727325439453, -18.375484466552734, -17.83124351501465, -17.287002563476562, -16.742759704589844, -16.198518753051758, -15.654276847839355, -15.11003589630127, -14.565793991088867, -14.021553039550781, -13.477311134338379, -12.933069229125977, -12.38882827758789, -11.844586372375488, -11.300344467163086, -10.756103515625, -10.211861610412598, -9.667620658874512, -9.12337875366211, -8.579136848449707, -8.034894943237305, -7.490653991699219, -6.946412086486816, -6.402169227600098, -5.8579277992248535, -5.313685894012451, -4.769444465637207, -4.225202560424805, -3.6809611320495605, -3.1367197036743164, -2.592478036880493, -2.04823637008667, -1.5039947032928467, -0.959753155708313, -0.4155116081237793, 0.12873005867004395, 0.6729717254638672, 1.2172131538391113, 1.7614548206329346, 2.305696487426758, 2.849938154220581, 3.3941798210144043, 3.9384212493896484, 4.482663154602051, 5.026904582977295, 5.571146011352539, 6.115387916564941, 6.6596293449401855, 7.20387077331543, 7.748112678527832, 8.292354583740234, 8.83659553527832, 9.380837440490723, 9.925079345703125, 10.469320297241211, 11.013562202453613]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 5.0, 3.0, 4.0, 7.0, 4.0, 10.0, 29.0, 36.0, 33.0, 38.0, 55.0, 51.0, 74.0, 61.0, 62.0, 63.0, 68.0, 60.0, 57.0, 60.0, 44.0, 41.0, 40.0, 39.0, 22.0, 15.0, 10.0, 7.0, 7.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.046112060546875, -27.37696075439453, -26.70781135559082, -26.038660049438477, -25.369510650634766, -24.700359344482422, -24.031208038330078, -23.362058639526367, -22.692907333374023, -22.02375602722168, -21.35460662841797, -20.685455322265625, -20.016305923461914, -19.34715461730957, -18.67800521850586, -18.008853912353516, -17.339702606201172, -16.670551300048828, -16.001401901245117, -15.332250595092773, -14.663100242614746, -13.993949890136719, -13.324799537658691, -12.655649185180664, -11.986499786376953, -11.317349433898926, -10.648199081420898, -9.979047775268555, -9.309897422790527, -8.6407470703125, -7.971596717834473, -7.302445888519287, -6.633296012878418, -5.964145660400391, -5.294994831085205, -4.625844478607178, -3.9566938877105713, -3.287543296813965, -2.6183929443359375, -1.949242115020752, -1.2800917625427246, -0.6109412312507629, 0.05820930004119873, 0.7273597717285156, 1.396510362625122, 2.0656609535217285, 2.734811305999756, 3.4039621353149414, 4.073112487792969, 4.742262840270996, 5.411413669586182, 6.080564022064209, 6.7497148513793945, 7.418865203857422, 8.08801555633545, 8.757165908813477, 9.42631721496582, 10.095467567443848, 10.764617919921875, 11.433769226074219, 12.102919578552246, 12.772069931030273, 13.4412202835083, 14.110370635986328, 14.779520988464355]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 10.0, 5.0, 6.0, 9.0, 22.0, 41.0, 77.0, 145.0, 294.0, 748.0, 2424.0, 16056.0, 328927.0, 657778.0, 36275.0, 3923.0, 986.0, 430.0, 185.0, 97.0, 47.0, 28.0, 15.0, 12.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.4453125, -9.23138427734375, -9.0174560546875, -8.80352783203125, -8.589599609375, -8.37567138671875, -8.1617431640625, -7.94781494140625, -7.73388671875, -7.51995849609375, -7.3060302734375, -7.09210205078125, -6.878173828125, -6.66424560546875, -6.4503173828125, -6.23638916015625, -6.0224609375, -5.80853271484375, -5.5946044921875, -5.38067626953125, -5.166748046875, -4.95281982421875, -4.7388916015625, -4.52496337890625, -4.31103515625, -4.09710693359375, -3.8831787109375, -3.66925048828125, -3.455322265625, -3.24139404296875, -3.0274658203125, -2.81353759765625, -2.599609375, -2.38568115234375, -2.1717529296875, -1.95782470703125, -1.743896484375, -1.52996826171875, -1.3160400390625, -1.10211181640625, -0.88818359375, -0.67425537109375, -0.4603271484375, -0.24639892578125, -0.032470703125, 0.18145751953125, 0.3953857421875, 0.60931396484375, 0.8232421875, 1.03717041015625, 1.2510986328125, 1.46502685546875, 1.678955078125, 1.89288330078125, 2.1068115234375, 2.32073974609375, 2.53466796875, 2.74859619140625, 2.9625244140625, 3.17645263671875, 3.390380859375, 3.60430908203125, 3.8182373046875, 4.03216552734375, 4.24609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 4.0, 3.0, 5.0, 13.0, 15.0, 44.0, 40.0, 60.0, 46.0, 86.0, 83.0, 92.0, 85.0, 74.0, 74.0, 64.0, 68.0, 49.0, 38.0, 25.0, 16.0, 7.0, 6.0, 10.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-23.8125, -23.28564453125, -22.7587890625, -22.23193359375, -21.705078125, -21.17822265625, -20.6513671875, -20.12451171875, -19.59765625, -19.07080078125, -18.5439453125, -18.01708984375, -17.490234375, -16.96337890625, -16.4365234375, -15.90966796875, -15.3828125, -14.85595703125, -14.3291015625, -13.80224609375, -13.275390625, -12.74853515625, -12.2216796875, -11.69482421875, -11.16796875, -10.64111328125, -10.1142578125, -9.58740234375, -9.060546875, -8.53369140625, -8.0068359375, -7.47998046875, -6.953125, -6.42626953125, -5.8994140625, -5.37255859375, -4.845703125, -4.31884765625, -3.7919921875, -3.26513671875, -2.73828125, -2.21142578125, -1.6845703125, -1.15771484375, -0.630859375, -0.10400390625, 0.4228515625, 0.94970703125, 1.4765625, 2.00341796875, 2.5302734375, 3.05712890625, 3.583984375, 4.11083984375, 4.6376953125, 5.16455078125, 5.69140625, 6.21826171875, 6.7451171875, 7.27197265625, 7.798828125, 8.32568359375, 8.8525390625, 9.37939453125, 9.90625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 7.0, 4.0, 11.0, 13.0, 22.0, 35.0, 52.0, 74.0, 113.0, 165.0, 277.0, 401.0, 640.0, 1170.0, 1801.0, 2820.0, 4670.0, 7981.0, 13520.0, 22604.0, 39203.0, 65802.0, 107442.0, 157304.0, 184023.0, 160398.0, 111488.0, 67718.0, 40381.0, 23533.0, 13849.0, 8015.0, 4892.0, 2970.0, 1815.0, 1174.0, 778.0, 476.0, 314.0, 208.0, 144.0, 91.0, 56.0, 38.0, 25.0, 16.0, 11.0, 5.0, 9.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7421875, -0.7161712646484375, -0.690155029296875, -0.6641387939453125, -0.63812255859375, -0.6121063232421875, -0.586090087890625, -0.5600738525390625, -0.5340576171875, -0.5080413818359375, -0.482025146484375, -0.4560089111328125, -0.42999267578125, -0.4039764404296875, -0.377960205078125, -0.3519439697265625, -0.325927734375, -0.2999114990234375, -0.273895263671875, -0.2478790283203125, -0.22186279296875, -0.1958465576171875, -0.169830322265625, -0.1438140869140625, -0.1177978515625, -0.0917816162109375, -0.065765380859375, -0.0397491455078125, -0.01373291015625, 0.0122833251953125, 0.038299560546875, 0.0643157958984375, 0.09033203125, 0.1163482666015625, 0.142364501953125, 0.1683807373046875, 0.19439697265625, 0.2204132080078125, 0.246429443359375, 0.2724456787109375, 0.2984619140625, 0.3244781494140625, 0.350494384765625, 0.3765106201171875, 0.40252685546875, 0.4285430908203125, 0.454559326171875, 0.4805755615234375, 0.506591796875, 0.5326080322265625, 0.558624267578125, 0.5846405029296875, 0.61065673828125, 0.6366729736328125, 0.662689208984375, 0.6887054443359375, 0.7147216796875, 0.7407379150390625, 0.766754150390625, 0.7927703857421875, 0.81878662109375, 0.8448028564453125, 0.870819091796875, 0.8968353271484375, 0.9228515625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 9.0, 4.0, 11.0, 13.0, 14.0, 19.0, 17.0, 14.0, 24.0, 31.0, 21.0, 38.0, 41.0, 49.0, 51.0, 38.0, 53.0, 55.0, 49.0, 54.0, 42.0, 45.0, 40.0, 46.0, 40.0, 33.0, 28.0, 18.0, 19.0, 15.0, 15.0, 12.0, 9.0, 4.0, 6.0, 10.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.875, -15.373046875, -14.87109375, -14.369140625, -13.8671875, -13.365234375, -12.86328125, -12.361328125, -11.859375, -11.357421875, -10.85546875, -10.353515625, -9.8515625, -9.349609375, -8.84765625, -8.345703125, -7.84375, -7.341796875, -6.83984375, -6.337890625, -5.8359375, -5.333984375, -4.83203125, -4.330078125, -3.828125, -3.326171875, -2.82421875, -2.322265625, -1.8203125, -1.318359375, -0.81640625, -0.314453125, 0.1875, 0.689453125, 1.19140625, 1.693359375, 2.1953125, 2.697265625, 3.19921875, 3.701171875, 4.203125, 4.705078125, 5.20703125, 5.708984375, 6.2109375, 6.712890625, 7.21484375, 7.716796875, 8.21875, 8.720703125, 9.22265625, 9.724609375, 10.2265625, 10.728515625, 11.23046875, 11.732421875, 12.234375, 12.736328125, 13.23828125, 13.740234375, 14.2421875, 14.744140625, 15.24609375, 15.748046875, 16.25]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 8.0, 9.0, 16.0, 11.0, 18.0, 31.0, 50.0, 80.0, 101.0, 189.0, 227.0, 432.0, 749.0, 1295.0, 2604.0, 5804.0, 14704.0, 41716.0, 124337.0, 317164.0, 331034.0, 134428.0, 45221.0, 15921.0, 6210.0, 2827.0, 1338.0, 755.0, 453.0, 256.0, 192.0, 117.0, 89.0, 59.0, 37.0, 33.0, 22.0, 6.0, 6.0, 8.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.131591796875, -0.12633514404296875, -0.1210784912109375, -0.11582183837890625, -0.110565185546875, -0.10530853271484375, -0.1000518798828125, -0.09479522705078125, -0.08953857421875, -0.08428192138671875, -0.0790252685546875, -0.07376861572265625, -0.068511962890625, -0.06325531005859375, -0.0579986572265625, -0.05274200439453125, -0.0474853515625, -0.04222869873046875, -0.0369720458984375, -0.03171539306640625, -0.026458740234375, -0.02120208740234375, -0.0159454345703125, -0.01068878173828125, -0.00543212890625, -0.00017547607421875, 0.0050811767578125, 0.01033782958984375, 0.015594482421875, 0.02085113525390625, 0.0261077880859375, 0.03136444091796875, 0.03662109375, 0.04187774658203125, 0.0471343994140625, 0.05239105224609375, 0.057647705078125, 0.06290435791015625, 0.0681610107421875, 0.07341766357421875, 0.07867431640625, 0.08393096923828125, 0.0891876220703125, 0.09444427490234375, 0.099700927734375, 0.10495758056640625, 0.1102142333984375, 0.11547088623046875, 0.1207275390625, 0.12598419189453125, 0.1312408447265625, 0.13649749755859375, 0.141754150390625, 0.14701080322265625, 0.1522674560546875, 0.15752410888671875, 0.16278076171875, 0.16803741455078125, 0.1732940673828125, 0.17855072021484375, 0.183807373046875, 0.18906402587890625, 0.1943206787109375, 0.19957733154296875, 0.204833984375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 9.0, 9.0, 5.0, 7.0, 18.0, 14.0, 17.0, 25.0, 35.0, 37.0, 41.0, 34.0, 44.0, 50.0, 68.0, 78.0, 68.0, 63.0, 56.0, 49.0, 51.0, 33.0, 31.0, 32.0, 21.0, 20.0, 18.0, 15.0, 4.0, 8.0, 9.0, 9.0, 3.0, 4.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00012373924255371094, -0.00012011826038360596, -0.00011649727821350098, -0.000112876296043396, -0.00010925531387329102, -0.00010563433170318604, -0.00010201334953308105, -9.839236736297607e-05, -9.47713851928711e-05, -9.115040302276611e-05, -8.752942085266113e-05, -8.390843868255615e-05, -8.028745651245117e-05, -7.666647434234619e-05, -7.304549217224121e-05, -6.942451000213623e-05, -6.580352783203125e-05, -6.218254566192627e-05, -5.856156349182129e-05, -5.494058132171631e-05, -5.131959915161133e-05, -4.769861698150635e-05, -4.407763481140137e-05, -4.045665264129639e-05, -3.6835670471191406e-05, -3.3214688301086426e-05, -2.9593706130981445e-05, -2.5972723960876465e-05, -2.2351741790771484e-05, -1.8730759620666504e-05, -1.5109777450561523e-05, -1.1488795280456543e-05, -7.867813110351562e-06, -4.246830940246582e-06, -6.258487701416016e-07, 2.995133399963379e-06, 6.616115570068359e-06, 1.023709774017334e-05, 1.385807991027832e-05, 1.74790620803833e-05, 2.110004425048828e-05, 2.4721026420593262e-05, 2.8342008590698242e-05, 3.196299076080322e-05, 3.55839729309082e-05, 3.9204955101013184e-05, 4.2825937271118164e-05, 4.6446919441223145e-05, 5.0067901611328125e-05, 5.3688883781433105e-05, 5.7309865951538086e-05, 6.0930848121643066e-05, 6.455183029174805e-05, 6.817281246185303e-05, 7.179379463195801e-05, 7.541477680206299e-05, 7.903575897216797e-05, 8.265674114227295e-05, 8.627772331237793e-05, 8.989870548248291e-05, 9.351968765258789e-05, 9.714066982269287e-05, 0.00010076165199279785, 0.00010438263416290283, 0.00010800361633300781]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 4.0, 4.0, 4.0, 5.0, 14.0, 10.0, 32.0, 46.0, 78.0, 140.0, 238.0, 444.0, 827.0, 1636.0, 3126.0, 6681.0, 15036.0, 37097.0, 97856.0, 248655.0, 345339.0, 178108.0, 66641.0, 25650.0, 10816.0, 5045.0, 2324.0, 1237.0, 660.0, 320.0, 196.0, 108.0, 58.0, 54.0, 27.0, 16.0, 11.0, 5.0, 5.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1412353515625, -0.1362457275390625, -0.131256103515625, -0.1262664794921875, -0.12127685546875, -0.1162872314453125, -0.111297607421875, -0.1063079833984375, -0.101318359375, -0.0963287353515625, -0.091339111328125, -0.0863494873046875, -0.08135986328125, -0.0763702392578125, -0.071380615234375, -0.0663909912109375, -0.0614013671875, -0.0564117431640625, -0.051422119140625, -0.0464324951171875, -0.04144287109375, -0.0364532470703125, -0.031463623046875, -0.0264739990234375, -0.021484375, -0.0164947509765625, -0.011505126953125, -0.0065155029296875, -0.00152587890625, 0.0034637451171875, 0.008453369140625, 0.0134429931640625, 0.0184326171875, 0.0234222412109375, 0.028411865234375, 0.0334014892578125, 0.03839111328125, 0.0433807373046875, 0.048370361328125, 0.0533599853515625, 0.058349609375, 0.0633392333984375, 0.068328857421875, 0.0733184814453125, 0.07830810546875, 0.0832977294921875, 0.088287353515625, 0.0932769775390625, 0.0982666015625, 0.1032562255859375, 0.108245849609375, 0.1132354736328125, 0.11822509765625, 0.1232147216796875, 0.128204345703125, 0.1331939697265625, 0.13818359375, 0.1431732177734375, 0.148162841796875, 0.1531524658203125, 0.15814208984375, 0.1631317138671875, 0.168121337890625, 0.1731109619140625, 0.1781005859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 1.0, 3.0, 9.0, 3.0, 5.0, 12.0, 5.0, 10.0, 21.0, 21.0, 32.0, 25.0, 28.0, 44.0, 50.0, 59.0, 75.0, 61.0, 78.0, 76.0, 59.0, 58.0, 54.0, 40.0, 32.0, 21.0, 19.0, 12.0, 17.0, 14.0, 13.0, 8.0, 6.0, 3.0, 4.0, 2.0, 4.0, 2.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.045806884765625, -0.04435396194458008, -0.042901039123535156, -0.041448116302490234, -0.03999519348144531, -0.03854227066040039, -0.03708934783935547, -0.03563642501831055, -0.034183502197265625, -0.0327305793762207, -0.03127765655517578, -0.02982473373413086, -0.028371810913085938, -0.026918888092041016, -0.025465965270996094, -0.024013042449951172, -0.02256011962890625, -0.021107196807861328, -0.019654273986816406, -0.018201351165771484, -0.016748428344726562, -0.01529550552368164, -0.013842582702636719, -0.012389659881591797, -0.010936737060546875, -0.009483814239501953, -0.008030891418457031, -0.006577968597412109, -0.0051250457763671875, -0.0036721229553222656, -0.0022192001342773438, -0.0007662773132324219, 0.0006866455078125, 0.002139568328857422, 0.0035924911499023438, 0.005045413970947266, 0.0064983367919921875, 0.00795125961303711, 0.009404182434082031, 0.010857105255126953, 0.012310028076171875, 0.013762950897216797, 0.015215873718261719, 0.01666879653930664, 0.018121719360351562, 0.019574642181396484, 0.021027565002441406, 0.022480487823486328, 0.02393341064453125, 0.025386333465576172, 0.026839256286621094, 0.028292179107666016, 0.029745101928710938, 0.03119802474975586, 0.03265094757080078, 0.0341038703918457, 0.035556793212890625, 0.03700971603393555, 0.03846263885498047, 0.03991556167602539, 0.04136848449707031, 0.042821407318115234, 0.044274330139160156, 0.04572725296020508, 0.04718017578125]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 14.0, 23.0, 31.0, 66.0, 96.0, 142.0, 150.0, 141.0, 115.0, 91.0, 48.0, 35.0, 25.0, 9.0, 3.0, 4.0, 5.0], "bins": [-34.64925765991211, -34.00336456298828, -33.35747146606445, -32.711578369140625, -32.0656852722168, -31.41979217529297, -30.77389907836914, -30.128005981445312, -29.482112884521484, -28.836219787597656, -28.190326690673828, -27.54443359375, -26.898540496826172, -26.252647399902344, -25.606754302978516, -24.960861206054688, -24.31496810913086, -23.66907501220703, -23.023181915283203, -22.377288818359375, -21.731395721435547, -21.08550262451172, -20.43960952758789, -19.793716430664062, -19.147823333740234, -18.501930236816406, -17.856037139892578, -17.21014404296875, -16.564250946044922, -15.918357849121094, -15.272464752197266, -14.626571655273438, -13.98067855834961, -13.334785461425781, -12.688892364501953, -12.042999267578125, -11.397106170654297, -10.751213073730469, -10.10531997680664, -9.459426879882812, -8.813533782958984, -8.167640686035156, -7.521747589111328, -6.8758544921875, -6.229961395263672, -5.584068298339844, -4.938175201416016, -4.2922821044921875, -3.646388530731201, -3.000495433807373, -2.354602336883545, -1.7087092399597168, -1.0628161430358887, -0.41692304611206055, 0.22897005081176758, 0.8748631477355957, 1.5207562446594238, 2.166649341583252, 2.81254243850708, 3.458435535430908, 4.104328632354736, 4.7502217292785645, 5.396114826202393, 6.042007923126221, 6.687901020050049]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 5.0, 7.0, 10.0, 26.0, 41.0, 46.0, 53.0, 64.0, 86.0, 74.0, 82.0, 71.0, 78.0, 73.0, 64.0, 57.0, 45.0, 46.0, 26.0, 20.0, 5.0, 6.0, 3.0, 7.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.093055725097656, -20.614152908325195, -20.135250091552734, -19.656347274780273, -19.177444458007812, -18.69853973388672, -18.219636917114258, -17.740734100341797, -17.261831283569336, -16.782928466796875, -16.304025650024414, -15.825121879577637, -15.346219062805176, -14.867316246032715, -14.388412475585938, -13.909509658813477, -13.430606842041016, -12.951704025268555, -12.472801208496094, -11.993897438049316, -11.514994621276855, -11.036091804504395, -10.557188034057617, -10.078285217285156, -9.599382400512695, -9.120479583740234, -8.641576766967773, -8.162672996520996, -7.683770179748535, -7.204867362976074, -6.725964069366455, -6.247060775756836, -5.768157005310059, -5.289254188537598, -4.8103508949279785, -4.331447601318359, -3.8525447845458984, -3.3736417293548584, -2.8947386741638184, -2.4158356189727783, -1.9369325637817383, -1.4580295085906982, -0.9791264533996582, -0.5002233982086182, -0.021320343017578125, 0.4575827121734619, 0.936485767364502, 1.415388822555542, 1.894291877746582, 2.373194932937622, 2.852097988128662, 3.331001043319702, 3.809904098510742, 4.288806915283203, 4.767710208892822, 5.246613502502441, 5.725516319274902, 6.204419136047363, 6.683322429656982, 7.162225723266602, 7.6411285400390625, 8.120031356811523, 8.598934173583984, 9.077837944030762, 9.556740760803223]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 7.0, 16.0, 26.0, 23.0, 57.0, 92.0, 178.0, 381.0, 896.0, 2089.0, 6137.0, 18747.0, 61458.0, 192114.0, 387598.0, 253625.0, 85611.0, 26242.0, 8195.0, 2887.0, 1165.0, 506.0, 224.0, 101.0, 65.0, 41.0, 26.0, 17.0, 13.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8046875, -11.41943359375, -11.0341796875, -10.64892578125, -10.263671875, -9.87841796875, -9.4931640625, -9.10791015625, -8.72265625, -8.33740234375, -7.9521484375, -7.56689453125, -7.181640625, -6.79638671875, -6.4111328125, -6.02587890625, -5.640625, -5.25537109375, -4.8701171875, -4.48486328125, -4.099609375, -3.71435546875, -3.3291015625, -2.94384765625, -2.55859375, -2.17333984375, -1.7880859375, -1.40283203125, -1.017578125, -0.63232421875, -0.2470703125, 0.13818359375, 0.5234375, 0.90869140625, 1.2939453125, 1.67919921875, 2.064453125, 2.44970703125, 2.8349609375, 3.22021484375, 3.60546875, 3.99072265625, 4.3759765625, 4.76123046875, 5.146484375, 5.53173828125, 5.9169921875, 6.30224609375, 6.6875, 7.07275390625, 7.4580078125, 7.84326171875, 8.228515625, 8.61376953125, 8.9990234375, 9.38427734375, 9.76953125, 10.15478515625, 10.5400390625, 10.92529296875, 11.310546875, 11.69580078125, 12.0810546875, 12.46630859375, 12.8515625]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 5.0, 14.0, 12.0, 23.0, 21.0, 53.0, 42.0, 44.0, 58.0, 64.0, 87.0, 65.0, 70.0, 74.0, 58.0, 53.0, 41.0, 40.0, 47.0, 36.0, 25.0, 19.0, 14.0, 11.0, 2.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.859375, -28.120361328125, -27.38134765625, -26.642333984375, -25.9033203125, -25.164306640625, -24.42529296875, -23.686279296875, -22.947265625, -22.208251953125, -21.46923828125, -20.730224609375, -19.9912109375, -19.252197265625, -18.51318359375, -17.774169921875, -17.03515625, -16.296142578125, -15.55712890625, -14.818115234375, -14.0791015625, -13.340087890625, -12.60107421875, -11.862060546875, -11.123046875, -10.384033203125, -9.64501953125, -8.906005859375, -8.1669921875, -7.427978515625, -6.68896484375, -5.949951171875, -5.2109375, -4.471923828125, -3.73291015625, -2.993896484375, -2.2548828125, -1.515869140625, -0.77685546875, -0.037841796875, 0.701171875, 1.440185546875, 2.17919921875, 2.918212890625, 3.6572265625, 4.396240234375, 5.13525390625, 5.874267578125, 6.61328125, 7.352294921875, 8.09130859375, 8.830322265625, 9.5693359375, 10.308349609375, 11.04736328125, 11.786376953125, 12.525390625, 13.264404296875, 14.00341796875, 14.742431640625, 15.4814453125, 16.220458984375, 16.95947265625, 17.698486328125, 18.4375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 9.0, 11.0, 8.0, 12.0, 12.0, 15.0, 26.0, 35.0, 37.0, 43.0, 79.0, 133.0, 181.0, 387.0, 2715.0, 250014.0, 784246.0, 9256.0, 598.0, 237.0, 144.0, 80.0, 63.0, 48.0, 32.0, 23.0, 18.0, 11.0, 17.0, 9.0, 10.0, 9.0, 4.0, 6.0, 5.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-57.84375, -56.244140625, -54.64453125, -53.044921875, -51.4453125, -49.845703125, -48.24609375, -46.646484375, -45.046875, -43.447265625, -41.84765625, -40.248046875, -38.6484375, -37.048828125, -35.44921875, -33.849609375, -32.25, -30.650390625, -29.05078125, -27.451171875, -25.8515625, -24.251953125, -22.65234375, -21.052734375, -19.453125, -17.853515625, -16.25390625, -14.654296875, -13.0546875, -11.455078125, -9.85546875, -8.255859375, -6.65625, -5.056640625, -3.45703125, -1.857421875, -0.2578125, 1.341796875, 2.94140625, 4.541015625, 6.140625, 7.740234375, 9.33984375, 10.939453125, 12.5390625, 14.138671875, 15.73828125, 17.337890625, 18.9375, 20.537109375, 22.13671875, 23.736328125, 25.3359375, 26.935546875, 28.53515625, 30.134765625, 31.734375, 33.333984375, 34.93359375, 36.533203125, 38.1328125, 39.732421875, 41.33203125, 42.931640625, 44.53125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 8.0, 1.0, 5.0, 5.0, 3.0, 9.0, 7.0, 16.0, 12.0, 9.0, 19.0, 23.0, 31.0, 28.0, 37.0, 40.0, 45.0, 36.0, 46.0, 49.0, 37.0, 57.0, 46.0, 37.0, 55.0, 42.0, 51.0, 30.0, 29.0, 33.0, 32.0, 24.0, 11.0, 16.0, 15.0, 7.0, 12.0, 8.0, 5.0, 8.0, 5.0, 7.0, 3.0, 4.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-18.515625, -17.9896240234375, -17.463623046875, -16.9376220703125, -16.41162109375, -15.8856201171875, -15.359619140625, -14.8336181640625, -14.3076171875, -13.7816162109375, -13.255615234375, -12.7296142578125, -12.20361328125, -11.6776123046875, -11.151611328125, -10.6256103515625, -10.099609375, -9.5736083984375, -9.047607421875, -8.5216064453125, -7.99560546875, -7.4696044921875, -6.943603515625, -6.4176025390625, -5.8916015625, -5.3656005859375, -4.839599609375, -4.3135986328125, -3.78759765625, -3.2615966796875, -2.735595703125, -2.2095947265625, -1.68359375, -1.1575927734375, -0.631591796875, -0.1055908203125, 0.42041015625, 0.9464111328125, 1.472412109375, 1.9984130859375, 2.5244140625, 3.0504150390625, 3.576416015625, 4.1024169921875, 4.62841796875, 5.1544189453125, 5.680419921875, 6.2064208984375, 6.732421875, 7.2584228515625, 7.784423828125, 8.3104248046875, 8.83642578125, 9.3624267578125, 9.888427734375, 10.4144287109375, 10.9404296875, 11.4664306640625, 11.992431640625, 12.5184326171875, 13.04443359375, 13.5704345703125, 14.096435546875, 14.6224365234375, 15.1484375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 3.0, 4.0, 7.0, 9.0, 13.0, 12.0, 18.0, 20.0, 27.0, 57.0, 64.0, 94.0, 151.0, 223.0, 415.0, 824.0, 1897.0, 6185.0, 36577.0, 623512.0, 350071.0, 20635.0, 4523.0, 1540.0, 632.0, 396.0, 200.0, 139.0, 103.0, 56.0, 41.0, 41.0, 15.0, 13.0, 13.0, 8.0, 8.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.640625, -10.343994140625, -10.04736328125, -9.750732421875, -9.4541015625, -9.157470703125, -8.86083984375, -8.564208984375, -8.267578125, -7.970947265625, -7.67431640625, -7.377685546875, -7.0810546875, -6.784423828125, -6.48779296875, -6.191162109375, -5.89453125, -5.597900390625, -5.30126953125, -5.004638671875, -4.7080078125, -4.411376953125, -4.11474609375, -3.818115234375, -3.521484375, -3.224853515625, -2.92822265625, -2.631591796875, -2.3349609375, -2.038330078125, -1.74169921875, -1.445068359375, -1.1484375, -0.851806640625, -0.55517578125, -0.258544921875, 0.0380859375, 0.334716796875, 0.63134765625, 0.927978515625, 1.224609375, 1.521240234375, 1.81787109375, 2.114501953125, 2.4111328125, 2.707763671875, 3.00439453125, 3.301025390625, 3.59765625, 3.894287109375, 4.19091796875, 4.487548828125, 4.7841796875, 5.080810546875, 5.37744140625, 5.674072265625, 5.970703125, 6.267333984375, 6.56396484375, 6.860595703125, 7.1572265625, 7.453857421875, 7.75048828125, 8.047119140625, 8.34375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 8.0, 5.0, 15.0, 29.0, 53.0, 110.0, 191.0, 231.0, 173.0, 97.0, 45.0, 28.0, 11.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010747909545898438, -0.0010131746530532837, -0.0009515583515167236, -0.0008899420499801636, -0.0008283257484436035, -0.0007667094469070435, -0.0007050931453704834, -0.0006434768438339233, -0.0005818605422973633, -0.0005202442407608032, -0.00045862793922424316, -0.0003970116376876831, -0.00033539533615112305, -0.000273779034614563, -0.00021216273307800293, -0.00015054643154144287, -8.893013000488281e-05, -2.7313828468322754e-05, 3.4302473068237305e-05, 9.591877460479736e-05, 0.00015753507614135742, 0.00021915137767791748, 0.00028076767921447754, 0.0003423839807510376, 0.00040400028228759766, 0.0004656165838241577, 0.0005272328853607178, 0.0005888491868972778, 0.0006504654884338379, 0.000712081789970398, 0.000773698091506958, 0.0008353143930435181, 0.0008969306945800781, 0.0009585469961166382, 0.0010201632976531982, 0.0010817795991897583, 0.0011433959007263184, 0.0012050122022628784, 0.0012666285037994385, 0.0013282448053359985, 0.0013898611068725586, 0.0014514774084091187, 0.0015130937099456787, 0.0015747100114822388, 0.0016363263130187988, 0.0016979426145553589, 0.001759558916091919, 0.001821175217628479, 0.001882791519165039, 0.0019444078207015991, 0.002006024122238159, 0.0020676404237747192, 0.0021292567253112793, 0.0021908730268478394, 0.0022524893283843994, 0.0023141056299209595, 0.0023757219314575195, 0.0024373382329940796, 0.0024989545345306396, 0.0025605708360671997, 0.0026221871376037598, 0.00268380343914032, 0.00274541974067688, 0.00280703604221344, 0.00286865234375]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 3.0, 7.0, 4.0, 5.0, 3.0, 11.0, 15.0, 23.0, 16.0, 52.0, 99.0, 268.0, 771.0, 2796.0, 15468.0, 274129.0, 696625.0, 50723.0, 5430.0, 1309.0, 418.0, 163.0, 77.0, 37.0, 27.0, 18.0, 10.0, 7.0, 6.0, 7.0, 9.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.171875, -8.878173828125, -8.58447265625, -8.290771484375, -7.9970703125, -7.703369140625, -7.40966796875, -7.115966796875, -6.822265625, -6.528564453125, -6.23486328125, -5.941162109375, -5.6474609375, -5.353759765625, -5.06005859375, -4.766357421875, -4.47265625, -4.178955078125, -3.88525390625, -3.591552734375, -3.2978515625, -3.004150390625, -2.71044921875, -2.416748046875, -2.123046875, -1.829345703125, -1.53564453125, -1.241943359375, -0.9482421875, -0.654541015625, -0.36083984375, -0.067138671875, 0.2265625, 0.520263671875, 0.81396484375, 1.107666015625, 1.4013671875, 1.695068359375, 1.98876953125, 2.282470703125, 2.576171875, 2.869873046875, 3.16357421875, 3.457275390625, 3.7509765625, 4.044677734375, 4.33837890625, 4.632080078125, 4.92578125, 5.219482421875, 5.51318359375, 5.806884765625, 6.1005859375, 6.394287109375, 6.68798828125, 6.981689453125, 7.275390625, 7.569091796875, 7.86279296875, 8.156494140625, 8.4501953125, 8.743896484375, 9.03759765625, 9.331298828125, 9.625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 0.0, 5.0, 3.0, 5.0, 3.0, 5.0, 7.0, 8.0, 12.0, 17.0, 28.0, 26.0, 32.0, 40.0, 54.0, 58.0, 59.0, 91.0, 85.0, 70.0, 73.0, 50.0, 51.0, 44.0, 48.0, 36.0, 13.0, 22.0, 14.0, 7.0, 8.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.1953125, -2.1299896240234375, -2.064666748046875, -1.9993438720703125, -1.93402099609375, -1.8686981201171875, -1.803375244140625, -1.7380523681640625, -1.6727294921875, -1.6074066162109375, -1.542083740234375, -1.4767608642578125, -1.41143798828125, -1.3461151123046875, -1.280792236328125, -1.2154693603515625, -1.150146484375, -1.0848236083984375, -1.019500732421875, -0.9541778564453125, -0.88885498046875, -0.8235321044921875, -0.758209228515625, -0.6928863525390625, -0.6275634765625, -0.5622406005859375, -0.496917724609375, -0.4315948486328125, -0.36627197265625, -0.3009490966796875, -0.235626220703125, -0.1703033447265625, -0.10498046875, -0.0396575927734375, 0.025665283203125, 0.0909881591796875, 0.15631103515625, 0.2216339111328125, 0.286956787109375, 0.3522796630859375, 0.4176025390625, 0.4829254150390625, 0.548248291015625, 0.6135711669921875, 0.67889404296875, 0.7442169189453125, 0.809539794921875, 0.8748626708984375, 0.940185546875, 1.0055084228515625, 1.070831298828125, 1.1361541748046875, 1.20147705078125, 1.2667999267578125, 1.332122802734375, 1.3974456787109375, 1.4627685546875, 1.5280914306640625, 1.593414306640625, 1.6587371826171875, 1.72406005859375, 1.7893829345703125, 1.854705810546875, 1.9200286865234375, 1.9853515625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 19.0, 58.0, 143.0, 328.0, 272.0, 132.0, 40.0, 12.0, 4.0, 1.0, 0.0, 1.0], "bins": [-166.32310485839844, -163.342041015625, -160.36099243164062, -157.3799285888672, -154.39886474609375, -151.4178009033203, -148.43675231933594, -145.4556884765625, -142.47462463378906, -139.49356079101562, -136.51251220703125, -133.5314483642578, -130.55038452148438, -127.56932830810547, -124.58827209472656, -121.60720825195312, -118.62615203857422, -115.64509582519531, -112.66403198242188, -109.68297576904297, -106.70191192626953, -103.72085571289062, -100.73979187011719, -97.75873565673828, -94.77767944335938, -91.79662322998047, -88.81555938720703, -85.83450317382812, -82.85343933105469, -79.87238311767578, -76.89132690429688, -73.91026306152344, -70.92919158935547, -67.94813537597656, -64.96707153320312, -61.98601531982422, -59.00495147705078, -56.023895263671875, -53.0428352355957, -50.06177520751953, -47.08071517944336, -44.09965515136719, -41.118595123291016, -38.137535095214844, -35.15647888183594, -32.1754150390625, -29.194358825683594, -26.213298797607422, -23.23223876953125, -20.251178741455078, -17.270118713378906, -14.289060592651367, -11.308000564575195, -8.326940536499023, -5.345882415771484, -2.3648223876953125, 0.6162376403808594, 3.597297191619873, 6.578356742858887, 9.559415817260742, 12.540475845336914, 15.521535873413086, 18.502593994140625, 21.483654022216797, 24.46471405029297]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 5.0, 3.0, 9.0, 8.0, 11.0, 13.0, 20.0, 22.0, 22.0, 48.0, 26.0, 33.0, 47.0, 41.0, 36.0, 45.0, 78.0, 43.0, 45.0, 54.0, 54.0, 49.0, 38.0, 34.0, 31.0, 28.0, 30.0, 24.0, 21.0, 21.0, 22.0, 12.0, 8.0, 6.0, 3.0, 8.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-37.081356048583984, -36.07012939453125, -35.05890655517578, -34.04767990112305, -33.03645706176758, -32.025230407714844, -31.014005661010742, -30.00278091430664, -28.991554260253906, -27.980329513549805, -26.969104766845703, -25.95787811279297, -24.946653366088867, -23.935428619384766, -22.924203872680664, -21.912979125976562, -20.90175437927246, -19.89052963256836, -18.879304885864258, -17.868080139160156, -16.856853485107422, -15.84562873840332, -14.834403991699219, -13.823179244995117, -12.8119535446167, -11.800728797912598, -10.78950309753418, -9.778278350830078, -8.767053604125977, -7.755827903747559, -6.744603157043457, -5.733377933502197, -4.722150802612305, -3.710925579071045, -2.6997005939483643, -1.6884756088256836, -0.6772503852844238, 0.33397483825683594, 1.3451995849609375, 2.3564248085021973, 3.367650032043457, 4.378875255584717, 5.390100479125977, 6.401325225830078, 7.412550449371338, 8.423775672912598, 9.4350004196167, 10.446226119995117, 11.457450866699219, 12.46867561340332, 13.479901313781738, 14.49112606048584, 15.502351760864258, 16.51357650756836, 17.52480125427246, 18.536026000976562, 19.547252655029297, 20.5584774017334, 21.5697021484375, 22.580928802490234, 23.592153549194336, 24.603378295898438, 25.61460304260254, 26.62582778930664, 27.637052536010742]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 8.0, 8.0, 21.0, 30.0, 30.0, 50.0, 71.0, 119.0, 196.0, 371.0, 834.0, 2908.0, 43752.0, 2543123.0, 1575516.0, 24317.0, 1668.0, 471.0, 275.0, 165.0, 107.0, 71.0, 38.0, 31.0, 29.0, 26.0, 15.0, 10.0, 3.0, 3.0, 1.0, 6.0, 1.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-50.03125, -48.63818359375, -47.2451171875, -45.85205078125, -44.458984375, -43.06591796875, -41.6728515625, -40.27978515625, -38.88671875, -37.49365234375, -36.1005859375, -34.70751953125, -33.314453125, -31.92138671875, -30.5283203125, -29.13525390625, -27.7421875, -26.34912109375, -24.9560546875, -23.56298828125, -22.169921875, -20.77685546875, -19.3837890625, -17.99072265625, -16.59765625, -15.20458984375, -13.8115234375, -12.41845703125, -11.025390625, -9.63232421875, -8.2392578125, -6.84619140625, -5.453125, -4.06005859375, -2.6669921875, -1.27392578125, 0.119140625, 1.51220703125, 2.9052734375, 4.29833984375, 5.69140625, 7.08447265625, 8.4775390625, 9.87060546875, 11.263671875, 12.65673828125, 14.0498046875, 15.44287109375, 16.8359375, 18.22900390625, 19.6220703125, 21.01513671875, 22.408203125, 23.80126953125, 25.1943359375, 26.58740234375, 27.98046875, 29.37353515625, 30.7666015625, 32.15966796875, 33.552734375, 34.94580078125, 36.3388671875, 37.73193359375, 39.125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 7.0, 5.0, 5.0, 11.0, 10.0, 29.0, 30.0, 45.0, 56.0, 56.0, 70.0, 74.0, 82.0, 65.0, 77.0, 67.0, 63.0, 46.0, 51.0, 45.0, 30.0, 17.0, 20.0, 20.0, 7.0, 6.0, 6.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.6875, -21.0771484375, -20.466796875, -19.8564453125, -19.24609375, -18.6357421875, -18.025390625, -17.4150390625, -16.8046875, -16.1943359375, -15.583984375, -14.9736328125, -14.36328125, -13.7529296875, -13.142578125, -12.5322265625, -11.921875, -11.3115234375, -10.701171875, -10.0908203125, -9.48046875, -8.8701171875, -8.259765625, -7.6494140625, -7.0390625, -6.4287109375, -5.818359375, -5.2080078125, -4.59765625, -3.9873046875, -3.376953125, -2.7666015625, -2.15625, -1.5458984375, -0.935546875, -0.3251953125, 0.28515625, 0.8955078125, 1.505859375, 2.1162109375, 2.7265625, 3.3369140625, 3.947265625, 4.5576171875, 5.16796875, 5.7783203125, 6.388671875, 6.9990234375, 7.609375, 8.2197265625, 8.830078125, 9.4404296875, 10.05078125, 10.6611328125, 11.271484375, 11.8818359375, 12.4921875, 13.1025390625, 13.712890625, 14.3232421875, 14.93359375, 15.5439453125, 16.154296875, 16.7646484375, 17.375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 2.0, 6.0, 7.0, 6.0, 11.0, 18.0, 17.0, 23.0, 32.0, 58.0, 97.0, 344.0, 4939.0, 4177311.0, 10703.0, 425.0, 107.0, 45.0, 43.0, 22.0, 7.0, 13.0, 11.0, 11.0, 10.0, 12.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.0, -81.5390625, -78.078125, -74.6171875, -71.15625, -67.6953125, -64.234375, -60.7734375, -57.3125, -53.8515625, -50.390625, -46.9296875, -43.46875, -40.0078125, -36.546875, -33.0859375, -29.625, -26.1640625, -22.703125, -19.2421875, -15.78125, -12.3203125, -8.859375, -5.3984375, -1.9375, 1.5234375, 4.984375, 8.4453125, 11.90625, 15.3671875, 18.828125, 22.2890625, 25.75, 29.2109375, 32.671875, 36.1328125, 39.59375, 43.0546875, 46.515625, 49.9765625, 53.4375, 56.8984375, 60.359375, 63.8203125, 67.28125, 70.7421875, 74.203125, 77.6640625, 81.125, 84.5859375, 88.046875, 91.5078125, 94.96875, 98.4296875, 101.890625, 105.3515625, 108.8125, 112.2734375, 115.734375, 119.1953125, 122.65625, 126.1171875, 129.578125, 133.0390625, 136.5]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 8.0, 11.0, 16.0, 40.0, 45.0, 86.0, 133.0, 222.0, 354.0, 525.0, 646.0, 663.0, 496.0, 334.0, 191.0, 111.0, 78.0, 45.0, 21.0, 21.0, 14.0, 6.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.890625, -10.64239501953125, -10.3941650390625, -10.14593505859375, -9.897705078125, -9.64947509765625, -9.4012451171875, -9.15301513671875, -8.90478515625, -8.65655517578125, -8.4083251953125, -8.16009521484375, -7.911865234375, -7.66363525390625, -7.4154052734375, -7.16717529296875, -6.9189453125, -6.67071533203125, -6.4224853515625, -6.17425537109375, -5.926025390625, -5.67779541015625, -5.4295654296875, -5.18133544921875, -4.93310546875, -4.68487548828125, -4.4366455078125, -4.18841552734375, -3.940185546875, -3.69195556640625, -3.4437255859375, -3.19549560546875, -2.947265625, -2.69903564453125, -2.4508056640625, -2.20257568359375, -1.954345703125, -1.70611572265625, -1.4578857421875, -1.20965576171875, -0.96142578125, -0.71319580078125, -0.4649658203125, -0.21673583984375, 0.031494140625, 0.27972412109375, 0.5279541015625, 0.77618408203125, 1.0244140625, 1.27264404296875, 1.5208740234375, 1.76910400390625, 2.017333984375, 2.26556396484375, 2.5137939453125, 2.76202392578125, 3.01025390625, 3.25848388671875, 3.5067138671875, 3.75494384765625, 4.003173828125, 4.25140380859375, 4.4996337890625, 4.74786376953125, 4.99609375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 8.0, 6.0, 15.0, 9.0, 22.0, 20.0, 48.0, 45.0, 65.0, 64.0, 65.0, 78.0, 75.0, 66.0, 67.0, 59.0, 66.0, 49.0, 44.0, 37.0, 24.0, 11.0, 17.0, 10.0, 11.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.704063415527344, -22.144882202148438, -21.58570098876953, -21.026519775390625, -20.467336654663086, -19.90815544128418, -19.348974227905273, -18.789793014526367, -18.23061180114746, -17.671430587768555, -17.11224937438965, -16.55306625366211, -15.99388599395752, -15.434703826904297, -14.87552261352539, -14.316341400146484, -13.757159233093262, -13.197978019714355, -12.638795852661133, -12.079614639282227, -11.52043342590332, -10.961252212524414, -10.402070045471191, -9.842888832092285, -9.283706665039062, -8.724525451660156, -8.165343284606934, -7.606162071228027, -7.046980857849121, -6.487799167633057, -5.928617477416992, -5.369436264038086, -4.810256004333496, -4.251074314117432, -3.6918931007385254, -3.132711410522461, -2.5735299587249756, -2.0143485069274902, -1.4551668167114258, -0.8959853649139404, -0.3368039131164551, 0.22237759828567505, 0.7815591096878052, 1.34074068069458, 1.8999221324920654, 2.459103584289551, 3.0182852745056152, 3.5774667263031006, 4.136648178100586, 4.69582986831665, 5.255011081695557, 5.814192771911621, 6.373373985290527, 6.932555675506592, 7.491737365722656, 8.050918579101562, 8.610099792480469, 9.169281005859375, 9.728463172912598, 10.287644386291504, 10.84682559967041, 11.406007766723633, 11.965188980102539, 12.524370193481445, 13.083552360534668]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 9.0, 10.0, 8.0, 13.0, 12.0, 18.0, 24.0, 27.0, 27.0, 31.0, 47.0, 36.0, 47.0, 44.0, 54.0, 50.0, 48.0, 48.0, 38.0, 45.0, 50.0, 36.0, 55.0, 44.0, 29.0, 21.0, 29.0, 21.0, 17.0, 22.0, 13.0, 6.0, 5.0, 3.0, 0.0, 1.0, 6.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-17.474252700805664, -16.992952346801758, -16.511653900146484, -16.030353546142578, -15.549053192138672, -15.067753791809082, -14.586454391479492, -14.105154037475586, -13.623854637145996, -13.142555236816406, -12.6612548828125, -12.17995548248291, -11.69865608215332, -11.217355728149414, -10.736056327819824, -10.254756927490234, -9.773456573486328, -9.292157173156738, -8.810856819152832, -8.329557418823242, -7.848257541656494, -7.366957664489746, -6.885658264160156, -6.404358386993408, -5.92305850982666, -5.441758632659912, -4.960458755493164, -4.479159355163574, -3.997859477996826, -3.516559600830078, -3.035259962081909, -2.5539603233337402, -2.072660446166992, -1.5913606882095337, -1.1100609302520752, -0.6287611722946167, -0.1474614143371582, 0.33383846282958984, 0.8151381015777588, 1.2964377403259277, 1.7777376174926758, 2.259037494659424, 2.7403371334075928, 3.2216367721557617, 3.7029366493225098, 4.184236526489258, 4.665535926818848, 5.146835803985596, 5.628135681152344, 6.109435558319092, 6.59073543548584, 7.07203483581543, 7.553334712982178, 8.034634590148926, 8.515933990478516, 8.997234344482422, 9.478533744812012, 9.959833145141602, 10.441133499145508, 10.922432899475098, 11.403732299804688, 11.885032653808594, 12.366332054138184, 12.847631454467773, 13.32893180847168]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 4.0, 4.0, 5.0, 14.0, 16.0, 20.0, 30.0, 40.0, 51.0, 73.0, 112.0, 169.0, 289.0, 382.0, 643.0, 1127.0, 2336.0, 4910.0, 11601.0, 30817.0, 87838.0, 235669.0, 358311.0, 198975.0, 71196.0, 25241.0, 9752.0, 4112.0, 1975.0, 1112.0, 603.0, 343.0, 269.0, 151.0, 120.0, 81.0, 51.0, 25.0, 21.0, 20.0, 15.0, 8.0, 4.0, 2.0, 8.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.10546875, -2.038421630859375, -1.97137451171875, -1.904327392578125, -1.8372802734375, -1.770233154296875, -1.70318603515625, -1.636138916015625, -1.569091796875, -1.502044677734375, -1.43499755859375, -1.367950439453125, -1.3009033203125, -1.233856201171875, -1.16680908203125, -1.099761962890625, -1.03271484375, -0.965667724609375, -0.89862060546875, -0.831573486328125, -0.7645263671875, -0.697479248046875, -0.63043212890625, -0.563385009765625, -0.496337890625, -0.429290771484375, -0.36224365234375, -0.295196533203125, -0.2281494140625, -0.161102294921875, -0.09405517578125, -0.027008056640625, 0.0400390625, 0.107086181640625, 0.17413330078125, 0.241180419921875, 0.3082275390625, 0.375274658203125, 0.44232177734375, 0.509368896484375, 0.576416015625, 0.643463134765625, 0.71051025390625, 0.777557373046875, 0.8446044921875, 0.911651611328125, 0.97869873046875, 1.045745849609375, 1.11279296875, 1.179840087890625, 1.24688720703125, 1.313934326171875, 1.3809814453125, 1.448028564453125, 1.51507568359375, 1.582122802734375, 1.649169921875, 1.716217041015625, 1.78326416015625, 1.850311279296875, 1.9173583984375, 1.984405517578125, 2.05145263671875, 2.118499755859375, 2.185546875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0, 3.0, 4.0, 6.0, 4.0, 2.0, 12.0, 8.0, 20.0, 17.0, 15.0, 23.0, 31.0, 35.0, 44.0, 39.0, 42.0, 59.0, 55.0, 44.0, 55.0, 51.0, 55.0, 53.0, 49.0, 53.0, 29.0, 43.0, 27.0, 29.0, 21.0, 20.0, 12.0, 14.0, 6.0, 8.0, 7.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-11.6875, -11.3585205078125, -11.029541015625, -10.7005615234375, -10.37158203125, -10.0426025390625, -9.713623046875, -9.3846435546875, -9.0556640625, -8.7266845703125, -8.397705078125, -8.0687255859375, -7.73974609375, -7.4107666015625, -7.081787109375, -6.7528076171875, -6.423828125, -6.0948486328125, -5.765869140625, -5.4368896484375, -5.10791015625, -4.7789306640625, -4.449951171875, -4.1209716796875, -3.7919921875, -3.4630126953125, -3.134033203125, -2.8050537109375, -2.47607421875, -2.1470947265625, -1.818115234375, -1.4891357421875, -1.16015625, -0.8311767578125, -0.502197265625, -0.1732177734375, 0.15576171875, 0.4847412109375, 0.813720703125, 1.1427001953125, 1.4716796875, 1.8006591796875, 2.129638671875, 2.4586181640625, 2.78759765625, 3.1165771484375, 3.445556640625, 3.7745361328125, 4.103515625, 4.4324951171875, 4.761474609375, 5.0904541015625, 5.41943359375, 5.7484130859375, 6.077392578125, 6.4063720703125, 6.7353515625, 7.0643310546875, 7.393310546875, 7.7222900390625, 8.05126953125, 8.3802490234375, 8.709228515625, 9.0382080078125, 9.3671875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 8.0, 12.0, 12.0, 20.0, 20.0, 32.0, 47.0, 87.0, 120.0, 167.0, 298.0, 433.0, 727.0, 1085.0, 1680.0, 2744.0, 4481.0, 7051.0, 11540.0, 18608.0, 30376.0, 49139.0, 77137.0, 114614.0, 150330.0, 161532.0, 139952.0, 101613.0, 66328.0, 41098.0, 25701.0, 15805.0, 9655.0, 5900.0, 3734.0, 2289.0, 1497.0, 898.0, 620.0, 386.0, 262.0, 162.0, 133.0, 68.0, 43.0, 33.0, 28.0, 12.0, 15.0, 6.0, 7.0, 7.0, 3.0, 6.0, 2.0, 2.0], "bins": [-0.84765625, -0.8222198486328125, -0.796783447265625, -0.7713470458984375, -0.74591064453125, -0.7204742431640625, -0.695037841796875, -0.6696014404296875, -0.6441650390625, -0.6187286376953125, -0.593292236328125, -0.5678558349609375, -0.54241943359375, -0.5169830322265625, -0.491546630859375, -0.4661102294921875, -0.440673828125, -0.4152374267578125, -0.389801025390625, -0.3643646240234375, -0.33892822265625, -0.3134918212890625, -0.288055419921875, -0.2626190185546875, -0.2371826171875, -0.2117462158203125, -0.186309814453125, -0.1608734130859375, -0.13543701171875, -0.1100006103515625, -0.084564208984375, -0.0591278076171875, -0.03369140625, -0.0082550048828125, 0.017181396484375, 0.0426177978515625, 0.06805419921875, 0.0934906005859375, 0.118927001953125, 0.1443634033203125, 0.1697998046875, 0.1952362060546875, 0.220672607421875, 0.2461090087890625, 0.27154541015625, 0.2969818115234375, 0.322418212890625, 0.3478546142578125, 0.373291015625, 0.3987274169921875, 0.424163818359375, 0.4496002197265625, 0.47503662109375, 0.5004730224609375, 0.525909423828125, 0.5513458251953125, 0.5767822265625, 0.6022186279296875, 0.627655029296875, 0.6530914306640625, 0.67852783203125, 0.7039642333984375, 0.729400634765625, 0.7548370361328125, 0.7802734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 4.0, 4.0, 8.0, 8.0, 6.0, 11.0, 17.0, 10.0, 17.0, 16.0, 20.0, 19.0, 35.0, 28.0, 32.0, 41.0, 32.0, 34.0, 38.0, 42.0, 40.0, 46.0, 37.0, 40.0, 41.0, 35.0, 44.0, 34.0, 30.0, 39.0, 25.0, 18.0, 22.0, 20.0, 12.0, 12.0, 12.0, 9.0, 11.0, 7.0, 6.0, 10.0, 4.0, 4.0, 4.0, 4.0, 6.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.921875, -12.4830322265625, -12.044189453125, -11.6053466796875, -11.16650390625, -10.7276611328125, -10.288818359375, -9.8499755859375, -9.4111328125, -8.9722900390625, -8.533447265625, -8.0946044921875, -7.65576171875, -7.2169189453125, -6.778076171875, -6.3392333984375, -5.900390625, -5.4615478515625, -5.022705078125, -4.5838623046875, -4.14501953125, -3.7061767578125, -3.267333984375, -2.8284912109375, -2.3896484375, -1.9508056640625, -1.511962890625, -1.0731201171875, -0.63427734375, -0.1954345703125, 0.243408203125, 0.6822509765625, 1.12109375, 1.5599365234375, 1.998779296875, 2.4376220703125, 2.87646484375, 3.3153076171875, 3.754150390625, 4.1929931640625, 4.6318359375, 5.0706787109375, 5.509521484375, 5.9483642578125, 6.38720703125, 6.8260498046875, 7.264892578125, 7.7037353515625, 8.142578125, 8.5814208984375, 9.020263671875, 9.4591064453125, 9.89794921875, 10.3367919921875, 10.775634765625, 11.2144775390625, 11.6533203125, 12.0921630859375, 12.531005859375, 12.9698486328125, 13.40869140625, 13.8475341796875, 14.286376953125, 14.7252197265625, 15.1640625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 20.0, 15.0, 16.0, 25.0, 36.0, 51.0, 70.0, 107.0, 190.0, 284.0, 424.0, 712.0, 1299.0, 2372.0, 4663.0, 9399.0, 21289.0, 56286.0, 170619.0, 388391.0, 252839.0, 83889.0, 29839.0, 12908.0, 5816.0, 3023.0, 1629.0, 939.0, 469.0, 305.0, 207.0, 147.0, 72.0, 57.0, 48.0, 30.0, 22.0, 13.0, 7.0, 10.0, 4.0, 2.0, 0.0, 0.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.215576171875, -0.20898056030273438, -0.20238494873046875, -0.19578933715820312, -0.1891937255859375, -0.18259811401367188, -0.17600250244140625, -0.16940689086914062, -0.162811279296875, -0.15621566772460938, -0.14962005615234375, -0.14302444458007812, -0.1364288330078125, -0.12983322143554688, -0.12323760986328125, -0.11664199829101562, -0.11004638671875, -0.10345077514648438, -0.09685516357421875, -0.09025955200195312, -0.0836639404296875, -0.07706832885742188, -0.07047271728515625, -0.06387710571289062, -0.057281494140625, -0.050685882568359375, -0.04409027099609375, -0.037494659423828125, -0.0308990478515625, -0.024303436279296875, -0.01770782470703125, -0.011112213134765625, -0.0045166015625, 0.002079010009765625, 0.00867462158203125, 0.015270233154296875, 0.0218658447265625, 0.028461456298828125, 0.03505706787109375, 0.041652679443359375, 0.048248291015625, 0.054843902587890625, 0.06143951416015625, 0.06803512573242188, 0.0746307373046875, 0.08122634887695312, 0.08782196044921875, 0.09441757202148438, 0.10101318359375, 0.10760879516601562, 0.11420440673828125, 0.12080001831054688, 0.1273956298828125, 0.13399124145507812, 0.14058685302734375, 0.14718246459960938, 0.153778076171875, 0.16037368774414062, 0.16696929931640625, 0.17356491088867188, 0.1801605224609375, 0.18675613403320312, 0.19335174560546875, 0.19994735717773438, 0.20654296875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 0.0, 4.0, 4.0, 4.0, 5.0, 11.0, 12.0, 20.0, 24.0, 40.0, 47.0, 71.0, 79.0, 88.0, 81.0, 91.0, 90.0, 86.0, 58.0, 44.0, 30.0, 28.0, 13.0, 17.0, 13.0, 6.0, 5.0, 7.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.0001628398895263672, -0.0001568533480167389, -0.0001508668065071106, -0.0001448802649974823, -0.000138893723487854, -0.0001329071819782257, -0.0001269206404685974, -0.00012093409895896912, -0.00011494755744934082, -0.00010896101593971252, -0.00010297447443008423, -9.698793292045593e-05, -9.100139141082764e-05, -8.501484990119934e-05, -7.902830839157104e-05, -7.304176688194275e-05, -6.705522537231445e-05, -6.106868386268616e-05, -5.508214235305786e-05, -4.9095600843429565e-05, -4.310905933380127e-05, -3.7122517824172974e-05, -3.113597631454468e-05, -2.5149434804916382e-05, -1.9162893295288086e-05, -1.317635178565979e-05, -7.189810276031494e-06, -1.2032687664031982e-06, 4.783272743225098e-06, 1.0769814252853394e-05, 1.675635576248169e-05, 2.2742897272109985e-05, 2.872943878173828e-05, 3.471598029136658e-05, 4.070252180099487e-05, 4.668906331062317e-05, 5.2675604820251465e-05, 5.866214632987976e-05, 6.464868783950806e-05, 7.063522934913635e-05, 7.662177085876465e-05, 8.260831236839294e-05, 8.859485387802124e-05, 9.458139538764954e-05, 0.00010056793689727783, 0.00010655447840690613, 0.00011254101991653442, 0.00011852756142616272, 0.00012451410293579102, 0.0001305006444454193, 0.0001364871859550476, 0.0001424737274646759, 0.0001484602689743042, 0.0001544468104839325, 0.0001604333519935608, 0.0001664198935031891, 0.00017240643501281738, 0.00017839297652244568, 0.00018437951803207397, 0.00019036605954170227, 0.00019635260105133057, 0.00020233914256095886, 0.00020832568407058716, 0.00021431222558021545, 0.00022029876708984375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 7.0, 7.0, 5.0, 15.0, 31.0, 50.0, 60.0, 92.0, 170.0, 326.0, 588.0, 1230.0, 2548.0, 5641.0, 15333.0, 48408.0, 176899.0, 445277.0, 250087.0, 68208.0, 20439.0, 7113.0, 3074.0, 1396.0, 714.0, 337.0, 191.0, 123.0, 77.0, 42.0, 15.0, 7.0, 19.0, 6.0, 8.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2587890625, -0.2515277862548828, -0.24426651000976562, -0.23700523376464844, -0.22974395751953125, -0.22248268127441406, -0.21522140502929688, -0.2079601287841797, -0.2006988525390625, -0.1934375762939453, -0.18617630004882812, -0.17891502380371094, -0.17165374755859375, -0.16439247131347656, -0.15713119506835938, -0.1498699188232422, -0.142608642578125, -0.1353473663330078, -0.12808609008789062, -0.12082481384277344, -0.11356353759765625, -0.10630226135253906, -0.09904098510742188, -0.09177970886230469, -0.0845184326171875, -0.07725715637207031, -0.06999588012695312, -0.06273460388183594, -0.05547332763671875, -0.04821205139160156, -0.040950775146484375, -0.03368949890136719, -0.02642822265625, -0.019166946411132812, -0.011905670166015625, -0.0046443939208984375, 0.00261688232421875, 0.009878158569335938, 0.017139434814453125, 0.024400711059570312, 0.0316619873046875, 0.03892326354980469, 0.046184539794921875, 0.05344581604003906, 0.06070709228515625, 0.06796836853027344, 0.07522964477539062, 0.08249092102050781, 0.089752197265625, 0.09701347351074219, 0.10427474975585938, 0.11153602600097656, 0.11879730224609375, 0.12605857849121094, 0.13331985473632812, 0.1405811309814453, 0.1478424072265625, 0.1551036834716797, 0.16236495971679688, 0.16962623596191406, 0.17688751220703125, 0.18414878845214844, 0.19141006469726562, 0.1986713409423828, 0.2059326171875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 7.0, 11.0, 7.0, 8.0, 17.0, 10.0, 22.0, 35.0, 33.0, 43.0, 43.0, 60.0, 79.0, 76.0, 77.0, 83.0, 74.0, 82.0, 55.0, 31.0, 29.0, 31.0, 17.0, 11.0, 15.0, 7.0, 7.0, 6.0, 4.0, 12.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0740966796875, -0.07202577590942383, -0.06995487213134766, -0.06788396835327148, -0.06581306457519531, -0.06374216079711914, -0.06167125701904297, -0.0596003532409668, -0.057529449462890625, -0.05545854568481445, -0.05338764190673828, -0.05131673812866211, -0.04924583435058594, -0.047174930572509766, -0.045104026794433594, -0.04303312301635742, -0.04096221923828125, -0.03889131546020508, -0.036820411682128906, -0.034749507904052734, -0.03267860412597656, -0.03060770034790039, -0.02853679656982422, -0.026465892791748047, -0.024394989013671875, -0.022324085235595703, -0.02025318145751953, -0.01818227767944336, -0.016111373901367188, -0.014040470123291016, -0.011969566345214844, -0.009898662567138672, -0.0078277587890625, -0.005756855010986328, -0.0036859512329101562, -0.0016150474548339844, 0.0004558563232421875, 0.0025267601013183594, 0.004597663879394531, 0.006668567657470703, 0.008739471435546875, 0.010810375213623047, 0.012881278991699219, 0.01495218276977539, 0.017023086547851562, 0.019093990325927734, 0.021164894104003906, 0.023235797882080078, 0.02530670166015625, 0.027377605438232422, 0.029448509216308594, 0.031519412994384766, 0.03359031677246094, 0.03566122055053711, 0.03773212432861328, 0.03980302810668945, 0.041873931884765625, 0.0439448356628418, 0.04601573944091797, 0.04808664321899414, 0.05015754699707031, 0.052228450775146484, 0.054299354553222656, 0.05637025833129883, 0.058441162109375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 13.0, 22.0, 63.0, 152.0, 231.0, 237.0, 151.0, 87.0, 30.0, 9.0, 4.0, 1.0, 2.0, 2.0], "bins": [-56.258121490478516, -55.23427200317383, -54.21042251586914, -53.18656921386719, -52.1627197265625, -51.13887023925781, -50.115020751953125, -49.09117126464844, -48.06732177734375, -47.04347229003906, -46.019622802734375, -44.99577331542969, -43.971920013427734, -42.94807052612305, -41.92422103881836, -40.90037155151367, -39.87651824951172, -38.85266876220703, -37.828819274902344, -36.804969787597656, -35.7811164855957, -34.757266998291016, -33.73341751098633, -32.70956802368164, -31.685718536376953, -30.661869049072266, -29.638017654418945, -28.614168167114258, -27.59031867980957, -26.56646728515625, -25.542617797851562, -24.518768310546875, -23.494918823242188, -22.4710693359375, -21.44721794128418, -20.423368453979492, -19.399518966674805, -18.375667572021484, -17.351818084716797, -16.32796859741211, -15.304118156433105, -14.280267715454102, -13.256418228149414, -12.23256778717041, -11.208717346191406, -10.184867858886719, -9.161017417907715, -8.137166976928711, -7.113317489624023, -6.089467525482178, -5.065617561340332, -4.041767120361328, -3.0179171562194824, -1.9940671920776367, -0.9702167510986328, 0.05363321304321289, 1.0774831771850586, 2.1013331413269043, 3.125183343887329, 4.149033546447754, 5.1728835105896, 6.196733474731445, 7.220583915710449, 8.244434356689453, 9.26828384399414]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 5.0, 4.0, 7.0, 10.0, 9.0, 13.0, 17.0, 18.0, 23.0, 36.0, 38.0, 39.0, 44.0, 44.0, 48.0, 70.0, 60.0, 51.0, 49.0, 48.0, 54.0, 43.0, 59.0, 45.0, 37.0, 22.0, 28.0, 21.0, 17.0, 11.0, 10.0, 8.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0], "bins": [-12.847481727600098, -12.512124061584473, -12.176765441894531, -11.841407775878906, -11.506050109863281, -11.17069149017334, -10.835333824157715, -10.499975204467773, -10.164617538452148, -9.829259872436523, -9.493901252746582, -9.158543586730957, -8.823185920715332, -8.48782730102539, -8.152469635009766, -7.817111492156982, -7.481753826141357, -7.146395683288574, -6.811038017272949, -6.475679874420166, -6.140321731567383, -5.804964065551758, -5.469605922698975, -5.134247779846191, -4.798890113830566, -4.463531970977783, -4.128174304962158, -3.792816162109375, -3.457458019256592, -3.1221001148223877, -2.7867422103881836, -2.4513840675354004, -2.116025924682617, -1.7806679010391235, -1.4453098773956299, -1.1099519729614258, -0.7745939493179321, -0.4392359256744385, -0.10387802124023438, 0.23148012161254883, 0.5668380260467529, 0.9021960496902466, 1.2375540733337402, 1.5729119777679443, 1.908270001411438, 2.2436280250549316, 2.5789859294891357, 2.914344072341919, 3.249701976776123, 3.585059881210327, 3.9204180240631104, 4.2557759284973145, 4.591134071350098, 4.926491737365723, 5.261849880218506, 5.597208023071289, 5.932565689086914, 6.267923831939697, 6.603281497955322, 6.9386396408081055, 7.273997783660889, 7.609355926513672, 7.944713592529297, 8.280071258544922, 8.615429878234863]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 8.0, 8.0, 7.0, 12.0, 20.0, 28.0, 21.0, 28.0, 47.0, 87.0, 234.0, 1222.0, 14402.0, 281944.0, 682223.0, 63696.0, 3710.0, 493.0, 131.0, 66.0, 45.0, 29.0, 24.0, 16.0, 19.0, 11.0, 7.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.03125, -29.97021484375, -28.9091796875, -27.84814453125, -26.787109375, -25.72607421875, -24.6650390625, -23.60400390625, -22.54296875, -21.48193359375, -20.4208984375, -19.35986328125, -18.298828125, -17.23779296875, -16.1767578125, -15.11572265625, -14.0546875, -12.99365234375, -11.9326171875, -10.87158203125, -9.810546875, -8.74951171875, -7.6884765625, -6.62744140625, -5.56640625, -4.50537109375, -3.4443359375, -2.38330078125, -1.322265625, -0.26123046875, 0.7998046875, 1.86083984375, 2.921875, 3.98291015625, 5.0439453125, 6.10498046875, 7.166015625, 8.22705078125, 9.2880859375, 10.34912109375, 11.41015625, 12.47119140625, 13.5322265625, 14.59326171875, 15.654296875, 16.71533203125, 17.7763671875, 18.83740234375, 19.8984375, 20.95947265625, 22.0205078125, 23.08154296875, 24.142578125, 25.20361328125, 26.2646484375, 27.32568359375, 28.38671875, 29.44775390625, 30.5087890625, 31.56982421875, 32.630859375, 33.69189453125, 34.7529296875, 35.81396484375, 36.875]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 9.0, 15.0, 16.0, 28.0, 43.0, 74.0, 76.0, 106.0, 131.0, 109.0, 121.0, 78.0, 66.0, 60.0, 35.0, 15.0, 17.0, 5.0, 3.0, 0.0, 2.0, 3.0], "bins": [-61.375, -60.1707763671875, -58.966552734375, -57.7623291015625, -56.55810546875, -55.3538818359375, -54.149658203125, -52.9454345703125, -51.7412109375, -50.5369873046875, -49.332763671875, -48.1285400390625, -46.92431640625, -45.7200927734375, -44.515869140625, -43.3116455078125, -42.107421875, -40.9031982421875, -39.698974609375, -38.4947509765625, -37.29052734375, -36.0863037109375, -34.882080078125, -33.6778564453125, -32.4736328125, -31.2694091796875, -30.065185546875, -28.8609619140625, -27.65673828125, -26.4525146484375, -25.248291015625, -24.0440673828125, -22.83984375, -21.6356201171875, -20.431396484375, -19.2271728515625, -18.02294921875, -16.8187255859375, -15.614501953125, -14.4102783203125, -13.2060546875, -12.0018310546875, -10.797607421875, -9.5933837890625, -8.38916015625, -7.1849365234375, -5.980712890625, -4.7764892578125, -3.572265625, -2.3680419921875, -1.163818359375, 0.0404052734375, 1.24462890625, 2.4488525390625, 3.653076171875, 4.8572998046875, 6.0615234375, 7.2657470703125, 8.469970703125, 9.6741943359375, 10.87841796875, 12.0826416015625, 13.286865234375, 14.4910888671875, 15.6953125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 4.0, 2.0, 1.0, 4.0, 5.0, 5.0, 10.0, 10.0, 16.0, 24.0, 32.0, 30.0, 41.0, 46.0, 62.0, 83.0, 96.0, 107.0, 138.0, 162.0, 250.0, 392.0, 994.0, 6174.0, 77038.0, 630621.0, 304968.0, 22892.0, 2381.0, 656.0, 300.0, 200.0, 167.0, 118.0, 107.0, 104.0, 71.0, 50.0, 47.0, 32.0, 23.0, 25.0, 16.0, 10.0, 12.0, 11.0, 4.0, 7.0, 6.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-26.828125, -26.03369140625, -25.2392578125, -24.44482421875, -23.650390625, -22.85595703125, -22.0615234375, -21.26708984375, -20.47265625, -19.67822265625, -18.8837890625, -18.08935546875, -17.294921875, -16.50048828125, -15.7060546875, -14.91162109375, -14.1171875, -13.32275390625, -12.5283203125, -11.73388671875, -10.939453125, -10.14501953125, -9.3505859375, -8.55615234375, -7.76171875, -6.96728515625, -6.1728515625, -5.37841796875, -4.583984375, -3.78955078125, -2.9951171875, -2.20068359375, -1.40625, -0.61181640625, 0.1826171875, 0.97705078125, 1.771484375, 2.56591796875, 3.3603515625, 4.15478515625, 4.94921875, 5.74365234375, 6.5380859375, 7.33251953125, 8.126953125, 8.92138671875, 9.7158203125, 10.51025390625, 11.3046875, 12.09912109375, 12.8935546875, 13.68798828125, 14.482421875, 15.27685546875, 16.0712890625, 16.86572265625, 17.66015625, 18.45458984375, 19.2490234375, 20.04345703125, 20.837890625, 21.63232421875, 22.4267578125, 23.22119140625, 24.015625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 9.0, 3.0, 7.0, 7.0, 6.0, 16.0, 18.0, 12.0, 20.0, 19.0, 23.0, 23.0, 31.0, 35.0, 45.0, 52.0, 44.0, 51.0, 37.0, 44.0, 50.0, 41.0, 44.0, 52.0, 39.0, 36.0, 26.0, 33.0, 24.0, 34.0, 19.0, 20.0, 19.0, 9.0, 11.0, 6.0, 12.0, 8.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.3125, -15.794921875, -15.27734375, -14.759765625, -14.2421875, -13.724609375, -13.20703125, -12.689453125, -12.171875, -11.654296875, -11.13671875, -10.619140625, -10.1015625, -9.583984375, -9.06640625, -8.548828125, -8.03125, -7.513671875, -6.99609375, -6.478515625, -5.9609375, -5.443359375, -4.92578125, -4.408203125, -3.890625, -3.373046875, -2.85546875, -2.337890625, -1.8203125, -1.302734375, -0.78515625, -0.267578125, 0.25, 0.767578125, 1.28515625, 1.802734375, 2.3203125, 2.837890625, 3.35546875, 3.873046875, 4.390625, 4.908203125, 5.42578125, 5.943359375, 6.4609375, 6.978515625, 7.49609375, 8.013671875, 8.53125, 9.048828125, 9.56640625, 10.083984375, 10.6015625, 11.119140625, 11.63671875, 12.154296875, 12.671875, 13.189453125, 13.70703125, 14.224609375, 14.7421875, 15.259765625, 15.77734375, 16.294921875, 16.8125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 6.0, 7.0, 8.0, 22.0, 26.0, 60.0, 131.0, 264.0, 803.0, 2652.0, 10211.0, 127254.0, 803515.0, 91163.0, 8823.0, 2326.0, 780.0, 256.0, 125.0, 45.0, 25.0, 15.0, 9.0, 4.0, 6.0, 3.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.484375, -8.1510009765625, -7.817626953125, -7.4842529296875, -7.15087890625, -6.8175048828125, -6.484130859375, -6.1507568359375, -5.8173828125, -5.4840087890625, -5.150634765625, -4.8172607421875, -4.48388671875, -4.1505126953125, -3.817138671875, -3.4837646484375, -3.150390625, -2.8170166015625, -2.483642578125, -2.1502685546875, -1.81689453125, -1.4835205078125, -1.150146484375, -0.8167724609375, -0.4833984375, -0.1500244140625, 0.183349609375, 0.5167236328125, 0.85009765625, 1.1834716796875, 1.516845703125, 1.8502197265625, 2.18359375, 2.5169677734375, 2.850341796875, 3.1837158203125, 3.51708984375, 3.8504638671875, 4.183837890625, 4.5172119140625, 4.8505859375, 5.1839599609375, 5.517333984375, 5.8507080078125, 6.18408203125, 6.5174560546875, 6.850830078125, 7.1842041015625, 7.517578125, 7.8509521484375, 8.184326171875, 8.5177001953125, 8.85107421875, 9.1844482421875, 9.517822265625, 9.8511962890625, 10.1845703125, 10.5179443359375, 10.851318359375, 11.1846923828125, 11.51806640625, 11.8514404296875, 12.184814453125, 12.5181884765625, 12.8515625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 4.0, 5.0, 7.0, 14.0, 16.0, 22.0, 48.0, 62.0, 85.0, 114.0, 125.0, 143.0, 105.0, 71.0, 62.0, 37.0, 28.0, 14.0, 10.0, 11.0, 7.0, 5.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013523101806640625, -0.0013145506381988525, -0.0012767910957336426, -0.0012390315532684326, -0.0012012720108032227, -0.0011635124683380127, -0.0011257529258728027, -0.0010879933834075928, -0.0010502338409423828, -0.0010124742984771729, -0.0009747147560119629, -0.0009369552135467529, -0.000899195671081543, -0.000861436128616333, -0.000823676586151123, -0.0007859170436859131, -0.0007481575012207031, -0.0007103979587554932, -0.0006726384162902832, -0.0006348788738250732, -0.0005971193313598633, -0.0005593597888946533, -0.0005216002464294434, -0.0004838407039642334, -0.00044608116149902344, -0.0004083216190338135, -0.0003705620765686035, -0.00033280253410339355, -0.0002950429916381836, -0.00025728344917297363, -0.00021952390670776367, -0.0001817643642425537, -0.00014400482177734375, -0.00010624527931213379, -6.848573684692383e-05, -3.072619438171387e-05, 7.033348083496094e-06, 4.4792890548706055e-05, 8.255243301391602e-05, 0.00012031197547912598, 0.00015807151794433594, 0.0001958310604095459, 0.00023359060287475586, 0.0002713501453399658, 0.0003091096878051758, 0.00034686923027038574, 0.0003846287727355957, 0.00042238831520080566, 0.0004601478576660156, 0.0004979074001312256, 0.0005356669425964355, 0.0005734264850616455, 0.0006111860275268555, 0.0006489455699920654, 0.0006867051124572754, 0.0007244646549224854, 0.0007622241973876953, 0.0007999837398529053, 0.0008377432823181152, 0.0008755028247833252, 0.0009132623672485352, 0.0009510219097137451, 0.000988781452178955, 0.001026540994644165, 0.001064300537109375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 7.0, 12.0, 16.0, 25.0, 26.0, 40.0, 59.0, 106.0, 224.0, 558.0, 2874.0, 33267.0, 691763.0, 305078.0, 12158.0, 1490.0, 374.0, 180.0, 102.0, 62.0, 41.0, 22.0, 15.0, 18.0, 14.0, 6.0, 6.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0390625, -8.6749267578125, -8.310791015625, -7.9466552734375, -7.58251953125, -7.2183837890625, -6.854248046875, -6.4901123046875, -6.1259765625, -5.7618408203125, -5.397705078125, -5.0335693359375, -4.66943359375, -4.3052978515625, -3.941162109375, -3.5770263671875, -3.212890625, -2.8487548828125, -2.484619140625, -2.1204833984375, -1.75634765625, -1.3922119140625, -1.028076171875, -0.6639404296875, -0.2998046875, 0.0643310546875, 0.428466796875, 0.7926025390625, 1.15673828125, 1.5208740234375, 1.885009765625, 2.2491455078125, 2.61328125, 2.9774169921875, 3.341552734375, 3.7056884765625, 4.06982421875, 4.4339599609375, 4.798095703125, 5.1622314453125, 5.5263671875, 5.8905029296875, 6.254638671875, 6.6187744140625, 6.98291015625, 7.3470458984375, 7.711181640625, 8.0753173828125, 8.439453125, 8.8035888671875, 9.167724609375, 9.5318603515625, 9.89599609375, 10.2601318359375, 10.624267578125, 10.9884033203125, 11.3525390625, 11.7166748046875, 12.080810546875, 12.4449462890625, 12.80908203125, 13.1732177734375, 13.537353515625, 13.9014892578125, 14.265625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0, 11.0, 6.0, 13.0, 29.0, 35.0, 53.0, 54.0, 72.0, 77.0, 92.0, 102.0, 90.0, 84.0, 63.0, 67.0, 35.0, 33.0, 24.0, 14.0, 6.0, 13.0, 4.0, 7.0, 7.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3515625, -2.26373291015625, -2.1759033203125, -2.08807373046875, -2.000244140625, -1.91241455078125, -1.8245849609375, -1.73675537109375, -1.64892578125, -1.56109619140625, -1.4732666015625, -1.38543701171875, -1.297607421875, -1.20977783203125, -1.1219482421875, -1.03411865234375, -0.9462890625, -0.85845947265625, -0.7706298828125, -0.68280029296875, -0.594970703125, -0.50714111328125, -0.4193115234375, -0.33148193359375, -0.24365234375, -0.15582275390625, -0.0679931640625, 0.01983642578125, 0.107666015625, 0.19549560546875, 0.2833251953125, 0.37115478515625, 0.458984375, 0.54681396484375, 0.6346435546875, 0.72247314453125, 0.810302734375, 0.89813232421875, 0.9859619140625, 1.07379150390625, 1.16162109375, 1.24945068359375, 1.3372802734375, 1.42510986328125, 1.512939453125, 1.60076904296875, 1.6885986328125, 1.77642822265625, 1.8642578125, 1.95208740234375, 2.0399169921875, 2.12774658203125, 2.215576171875, 2.30340576171875, 2.3912353515625, 2.47906494140625, 2.56689453125, 2.65472412109375, 2.7425537109375, 2.83038330078125, 2.918212890625, 3.00604248046875, 3.0938720703125, 3.18170166015625, 3.26953125]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 8.0, 44.0, 290.0, 489.0, 158.0, 19.0, 3.0], "bins": [-284.9657287597656, -280.2337341308594, -275.5017395019531, -270.7697448730469, -266.0377502441406, -261.30572509765625, -256.57373046875, -251.8417510986328, -247.1097412109375, -242.37774658203125, -237.645751953125, -232.9137420654297, -228.18174743652344, -223.4497528076172, -218.71775817871094, -213.9857635498047, -209.25376892089844, -204.5217742919922, -199.78977966308594, -195.05776977539062, -190.32577514648438, -185.59378051757812, -180.86178588867188, -176.12979125976562, -171.39779663085938, -166.66580200195312, -161.93380737304688, -157.20179748535156, -152.4698028564453, -147.73780822753906, -143.0058135986328, -138.27381896972656, -133.54180908203125, -128.809814453125, -124.07781219482422, -119.34581756591797, -114.61381530761719, -109.88182067871094, -105.14982604980469, -100.41783142089844, -95.68582916259766, -90.9538345336914, -86.22183227539062, -81.48983764648438, -76.75784301757812, -72.02584075927734, -67.2938461303711, -62.56184768676758, -57.82984924316406, -53.09785079956055, -48.36585235595703, -43.63385772705078, -38.901859283447266, -34.16986083984375, -29.437864303588867, -24.705867767333984, -19.9738712310791, -15.241873741149902, -10.509876251220703, -5.777878761291504, -1.0458812713623047, 3.686117172241211, 8.418113708496094, 13.150110244750977, 17.882108688354492]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 4.0, 5.0, 3.0, 15.0, 19.0, 13.0, 31.0, 24.0, 38.0, 44.0, 43.0, 73.0, 50.0, 47.0, 68.0, 51.0, 61.0, 48.0, 52.0, 55.0, 48.0, 49.0, 25.0, 34.0, 36.0, 18.0, 17.0, 12.0, 6.0, 9.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-53.541439056396484, -52.298763275146484, -51.05608367919922, -49.81340789794922, -48.57073211669922, -47.32805252075195, -46.08537673950195, -44.84269714355469, -43.60002136230469, -42.35734558105469, -41.11466598510742, -39.87199020385742, -38.629310607910156, -37.386634826660156, -36.143959045410156, -34.901283264160156, -33.65860366821289, -32.41592788696289, -31.173248291015625, -29.930572509765625, -28.687894821166992, -27.44521713256836, -26.20254135131836, -24.959863662719727, -23.717185974121094, -22.47450828552246, -21.231830596923828, -19.989154815673828, -18.746477127075195, -17.503799438476562, -16.261123657226562, -15.01844596862793, -13.77577018737793, -12.533092498779297, -11.29041576385498, -10.047739028930664, -8.805061340332031, -7.562384128570557, -6.319706916809082, -5.077030181884766, -3.834352493286133, -2.591675281524658, -1.3489980697631836, -0.10632085800170898, 1.1363563537597656, 2.3790335655212402, 3.621710777282715, 4.864387512207031, 6.107065200805664, 7.349742412567139, 8.592419624328613, 9.83509635925293, 11.077774047851562, 12.320451736450195, 13.563128471374512, 14.805805206298828, 16.04848289489746, 17.291160583496094, 18.533836364746094, 19.776514053344727, 21.01919174194336, 22.261869430541992, 23.504547119140625, 24.747222900390625, 25.989900588989258]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 6.0, 9.0, 8.0, 16.0, 29.0, 45.0, 71.0, 150.0, 227.0, 390.0, 689.0, 1653.0, 38404.0, 3921100.0, 229462.0, 1395.0, 237.0, 130.0, 75.0, 51.0, 33.0, 29.0, 26.0, 14.0, 10.0, 13.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.25, -37.34765625, -35.4453125, -33.54296875, -31.640625, -29.73828125, -27.8359375, -25.93359375, -24.03125, -22.12890625, -20.2265625, -18.32421875, -16.421875, -14.51953125, -12.6171875, -10.71484375, -8.8125, -6.91015625, -5.0078125, -3.10546875, -1.203125, 0.69921875, 2.6015625, 4.50390625, 6.40625, 8.30859375, 10.2109375, 12.11328125, 14.015625, 15.91796875, 17.8203125, 19.72265625, 21.625, 23.52734375, 25.4296875, 27.33203125, 29.234375, 31.13671875, 33.0390625, 34.94140625, 36.84375, 38.74609375, 40.6484375, 42.55078125, 44.453125, 46.35546875, 48.2578125, 50.16015625, 52.0625, 53.96484375, 55.8671875, 57.76953125, 59.671875, 61.57421875, 63.4765625, 65.37890625, 67.28125, 69.18359375, 71.0859375, 72.98828125, 74.890625, 76.79296875, 78.6953125, 80.59765625, 82.5]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 7.0, 9.0, 15.0, 12.0, 20.0, 35.0, 34.0, 43.0, 57.0, 72.0, 68.0, 55.0, 71.0, 82.0, 64.0, 66.0, 59.0, 59.0, 40.0, 38.0, 28.0, 22.0, 12.0, 10.0, 10.0, 1.0, 2.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.921875, -15.303466796875, -14.68505859375, -14.066650390625, -13.4482421875, -12.829833984375, -12.21142578125, -11.593017578125, -10.974609375, -10.356201171875, -9.73779296875, -9.119384765625, -8.5009765625, -7.882568359375, -7.26416015625, -6.645751953125, -6.02734375, -5.408935546875, -4.79052734375, -4.172119140625, -3.5537109375, -2.935302734375, -2.31689453125, -1.698486328125, -1.080078125, -0.461669921875, 0.15673828125, 0.775146484375, 1.3935546875, 2.011962890625, 2.63037109375, 3.248779296875, 3.8671875, 4.485595703125, 5.10400390625, 5.722412109375, 6.3408203125, 6.959228515625, 7.57763671875, 8.196044921875, 8.814453125, 9.432861328125, 10.05126953125, 10.669677734375, 11.2880859375, 11.906494140625, 12.52490234375, 13.143310546875, 13.76171875, 14.380126953125, 14.99853515625, 15.616943359375, 16.2353515625, 16.853759765625, 17.47216796875, 18.090576171875, 18.708984375, 19.327392578125, 19.94580078125, 20.564208984375, 21.1826171875, 21.801025390625, 22.41943359375, 23.037841796875, 23.65625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 10.0, 5.0, 9.0, 29.0, 51.0, 82.0, 172.0, 402.0, 1115.0, 4990.0, 194801.0, 3900487.0, 86417.0, 3921.0, 1028.0, 383.0, 168.0, 92.0, 49.0, 30.0, 9.0, 11.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.046875, -19.838623046875, -18.63037109375, -17.422119140625, -16.2138671875, -15.005615234375, -13.79736328125, -12.589111328125, -11.380859375, -10.172607421875, -8.96435546875, -7.756103515625, -6.5478515625, -5.339599609375, -4.13134765625, -2.923095703125, -1.71484375, -0.506591796875, 0.70166015625, 1.909912109375, 3.1181640625, 4.326416015625, 5.53466796875, 6.742919921875, 7.951171875, 9.159423828125, 10.36767578125, 11.575927734375, 12.7841796875, 13.992431640625, 15.20068359375, 16.408935546875, 17.6171875, 18.825439453125, 20.03369140625, 21.241943359375, 22.4501953125, 23.658447265625, 24.86669921875, 26.074951171875, 27.283203125, 28.491455078125, 29.69970703125, 30.907958984375, 32.1162109375, 33.324462890625, 34.53271484375, 35.740966796875, 36.94921875, 38.157470703125, 39.36572265625, 40.573974609375, 41.7822265625, 42.990478515625, 44.19873046875, 45.406982421875, 46.615234375, 47.823486328125, 49.03173828125, 50.239990234375, 51.4482421875, 52.656494140625, 53.86474609375, 55.072998046875, 56.28125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 7.0, 7.0, 14.0, 19.0, 43.0, 85.0, 139.0, 305.0, 504.0, 780.0, 831.0, 598.0, 353.0, 193.0, 100.0, 48.0, 28.0, 12.0, 2.0, 5.0, 4.0, 0.0, 4.0], "bins": [-14.5859375, -14.3006591796875, -14.015380859375, -13.7301025390625, -13.44482421875, -13.1595458984375, -12.874267578125, -12.5889892578125, -12.3037109375, -12.0184326171875, -11.733154296875, -11.4478759765625, -11.16259765625, -10.8773193359375, -10.592041015625, -10.3067626953125, -10.021484375, -9.7362060546875, -9.450927734375, -9.1656494140625, -8.88037109375, -8.5950927734375, -8.309814453125, -8.0245361328125, -7.7392578125, -7.4539794921875, -7.168701171875, -6.8834228515625, -6.59814453125, -6.3128662109375, -6.027587890625, -5.7423095703125, -5.45703125, -5.1717529296875, -4.886474609375, -4.6011962890625, -4.31591796875, -4.0306396484375, -3.745361328125, -3.4600830078125, -3.1748046875, -2.8895263671875, -2.604248046875, -2.3189697265625, -2.03369140625, -1.7484130859375, -1.463134765625, -1.1778564453125, -0.892578125, -0.6072998046875, -0.322021484375, -0.0367431640625, 0.24853515625, 0.5338134765625, 0.819091796875, 1.1043701171875, 1.3896484375, 1.6749267578125, 1.960205078125, 2.2454833984375, 2.53076171875, 2.8160400390625, 3.101318359375, 3.3865966796875, 3.671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 4.0, 3.0, 14.0, 23.0, 43.0, 62.0, 110.0, 131.0, 138.0, 143.0, 101.0, 87.0, 63.0, 40.0, 23.0, 10.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-52.69935607910156, -51.68183517456055, -50.6643180847168, -49.64679718017578, -48.62928009033203, -47.611759185791016, -46.594242095947266, -45.57672119140625, -44.5592041015625, -43.541683197021484, -42.524166107177734, -41.50664520263672, -40.48912811279297, -39.47160720825195, -38.4540901184082, -37.43656921386719, -36.41904830932617, -35.401527404785156, -34.384010314941406, -33.36648941040039, -32.34897232055664, -31.331451416015625, -30.313932418823242, -29.29641342163086, -28.278894424438477, -27.261375427246094, -26.24385643005371, -25.226337432861328, -24.208816528320312, -23.191299438476562, -22.173778533935547, -21.156259536743164, -20.138736724853516, -19.121217727661133, -18.10369873046875, -17.086179733276367, -16.068660736083984, -15.051140785217285, -14.033620834350586, -13.016101837158203, -11.99858283996582, -10.981063842773438, -9.963544845581055, -8.946024894714355, -7.928505897521973, -6.91098690032959, -5.893467426300049, -4.875947952270508, -3.858428955078125, -2.840909719467163, -1.8233904838562012, -0.8058712482452393, 0.21164798736572266, 1.2291669845581055, 2.2466864585876465, 3.2642059326171875, 4.28172492980957, 5.299243927001953, 6.316763401031494, 7.334282875061035, 8.351801872253418, 9.3693208694458, 10.3868408203125, 11.404359817504883, 12.421878814697266]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 5.0, 0.0, 6.0, 10.0, 6.0, 8.0, 12.0, 14.0, 14.0, 22.0, 17.0, 22.0, 27.0, 27.0, 28.0, 37.0, 44.0, 47.0, 36.0, 45.0, 52.0, 57.0, 52.0, 45.0, 38.0, 40.0, 24.0, 41.0, 41.0, 30.0, 28.0, 21.0, 21.0, 17.0, 20.0, 14.0, 7.0, 10.0, 4.0, 8.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.319596290588379, -11.884896278381348, -11.4501953125, -11.015495300292969, -10.580795288085938, -10.14609432220459, -9.711394309997559, -9.276693344116211, -8.84199333190918, -8.407293319702148, -7.972592353820801, -7.5378923416137695, -7.10319185256958, -6.668491363525391, -6.233791351318359, -5.79909086227417, -5.3643903732299805, -4.929689884185791, -4.494989395141602, -4.06028938293457, -3.625588893890381, -3.1908884048461914, -2.756188154220581, -2.3214879035949707, -1.8867874145507812, -1.4520870447158813, -1.0173866748809814, -0.5826863050460815, -0.14798593521118164, 0.2867145538330078, 0.7214148044586182, 1.1561150550842285, 1.590815544128418, 2.0255160331726074, 2.4602162837982178, 2.894916534423828, 3.3296170234680176, 3.764317512512207, 4.199017524719238, 4.633718013763428, 5.068418502807617, 5.503118991851807, 5.937819480895996, 6.372519493103027, 6.807219982147217, 7.241920471191406, 7.6766204833984375, 8.111320495605469, 8.546021461486816, 8.980721473693848, 9.415422439575195, 9.850122451782227, 10.284822463989258, 10.719523429870605, 11.154223442077637, 11.588924407958984, 12.023624420166016, 12.458324432373047, 12.893025398254395, 13.327725410461426, 13.762426376342773, 14.197126388549805, 14.631826400756836, 15.066526412963867, 15.501227378845215]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 5.0, 5.0, 4.0, 7.0, 9.0, 8.0, 13.0, 21.0, 22.0, 15.0, 27.0, 34.0, 34.0, 67.0, 88.0, 137.0, 260.0, 596.0, 1623.0, 4895.0, 15984.0, 58571.0, 216506.0, 438780.0, 224284.0, 62035.0, 16464.0, 4931.0, 1673.0, 681.0, 287.0, 136.0, 77.0, 52.0, 55.0, 42.0, 29.0, 17.0, 16.0, 20.0, 13.0, 8.0, 6.0, 7.0, 5.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5546875, -2.458343505859375, -2.36199951171875, -2.265655517578125, -2.1693115234375, -2.072967529296875, -1.97662353515625, -1.880279541015625, -1.783935546875, -1.687591552734375, -1.59124755859375, -1.494903564453125, -1.3985595703125, -1.302215576171875, -1.20587158203125, -1.109527587890625, -1.01318359375, -0.916839599609375, -0.82049560546875, -0.724151611328125, -0.6278076171875, -0.531463623046875, -0.43511962890625, -0.338775634765625, -0.242431640625, -0.146087646484375, -0.04974365234375, 0.046600341796875, 0.1429443359375, 0.239288330078125, 0.33563232421875, 0.431976318359375, 0.5283203125, 0.624664306640625, 0.72100830078125, 0.817352294921875, 0.9136962890625, 1.010040283203125, 1.10638427734375, 1.202728271484375, 1.299072265625, 1.395416259765625, 1.49176025390625, 1.588104248046875, 1.6844482421875, 1.780792236328125, 1.87713623046875, 1.973480224609375, 2.06982421875, 2.166168212890625, 2.26251220703125, 2.358856201171875, 2.4552001953125, 2.551544189453125, 2.64788818359375, 2.744232177734375, 2.840576171875, 2.936920166015625, 3.03326416015625, 3.129608154296875, 3.2259521484375, 3.322296142578125, 3.41864013671875, 3.514984130859375, 3.611328125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 5.0, 7.0, 12.0, 21.0, 18.0, 33.0, 35.0, 42.0, 58.0, 59.0, 67.0, 75.0, 79.0, 88.0, 68.0, 60.0, 60.0, 50.0, 32.0, 34.0, 26.0, 26.0, 10.0, 17.0, 10.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1171875, -11.6268310546875, -11.136474609375, -10.6461181640625, -10.15576171875, -9.6654052734375, -9.175048828125, -8.6846923828125, -8.1943359375, -7.7039794921875, -7.213623046875, -6.7232666015625, -6.23291015625, -5.7425537109375, -5.252197265625, -4.7618408203125, -4.271484375, -3.7811279296875, -3.290771484375, -2.8004150390625, -2.31005859375, -1.8197021484375, -1.329345703125, -0.8389892578125, -0.3486328125, 0.1417236328125, 0.632080078125, 1.1224365234375, 1.61279296875, 2.1031494140625, 2.593505859375, 3.0838623046875, 3.57421875, 4.0645751953125, 4.554931640625, 5.0452880859375, 5.53564453125, 6.0260009765625, 6.516357421875, 7.0067138671875, 7.4970703125, 7.9874267578125, 8.477783203125, 8.9681396484375, 9.45849609375, 9.9488525390625, 10.439208984375, 10.9295654296875, 11.419921875, 11.9102783203125, 12.400634765625, 12.8909912109375, 13.38134765625, 13.8717041015625, 14.362060546875, 14.8524169921875, 15.3427734375, 15.8331298828125, 16.323486328125, 16.8138427734375, 17.30419921875, 17.7945556640625, 18.284912109375, 18.7752685546875, 19.265625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 7.0, 10.0, 8.0, 23.0, 36.0, 38.0, 46.0, 102.0, 168.0, 215.0, 358.0, 531.0, 849.0, 1380.0, 2098.0, 3247.0, 5056.0, 8106.0, 12575.0, 20538.0, 33461.0, 53423.0, 83117.0, 121120.0, 154048.0, 158919.0, 132043.0, 93697.0, 61281.0, 38359.0, 23732.0, 14646.0, 9253.0, 5805.0, 3679.0, 2331.0, 1538.0, 982.0, 605.0, 411.0, 238.0, 166.0, 101.0, 72.0, 49.0, 30.0, 20.0, 14.0, 9.0, 6.0, 5.0, 5.0, 2.0, 1.0, 1.0], "bins": [-0.98974609375, -0.96075439453125, -0.9317626953125, -0.90277099609375, -0.873779296875, -0.84478759765625, -0.8157958984375, -0.78680419921875, -0.7578125, -0.72882080078125, -0.6998291015625, -0.67083740234375, -0.641845703125, -0.61285400390625, -0.5838623046875, -0.55487060546875, -0.52587890625, -0.49688720703125, -0.4678955078125, -0.43890380859375, -0.409912109375, -0.38092041015625, -0.3519287109375, -0.32293701171875, -0.2939453125, -0.26495361328125, -0.2359619140625, -0.20697021484375, -0.177978515625, -0.14898681640625, -0.1199951171875, -0.09100341796875, -0.06201171875, -0.03302001953125, -0.0040283203125, 0.02496337890625, 0.053955078125, 0.08294677734375, 0.1119384765625, 0.14093017578125, 0.169921875, 0.19891357421875, 0.2279052734375, 0.25689697265625, 0.285888671875, 0.31488037109375, 0.3438720703125, 0.37286376953125, 0.40185546875, 0.43084716796875, 0.4598388671875, 0.48883056640625, 0.517822265625, 0.54681396484375, 0.5758056640625, 0.60479736328125, 0.6337890625, 0.66278076171875, 0.6917724609375, 0.72076416015625, 0.749755859375, 0.77874755859375, 0.8077392578125, 0.83673095703125, 0.86572265625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 9.0, 4.0, 6.0, 6.0, 11.0, 11.0, 12.0, 13.0, 22.0, 19.0, 23.0, 33.0, 29.0, 37.0, 35.0, 39.0, 40.0, 27.0, 35.0, 48.0, 43.0, 49.0, 46.0, 43.0, 38.0, 34.0, 30.0, 43.0, 31.0, 23.0, 20.0, 16.0, 18.0, 13.0, 14.0, 22.0, 9.0, 8.0, 10.0, 5.0, 5.0, 3.0, 3.0, 9.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.0625, -16.517333984375, -15.97216796875, -15.427001953125, -14.8818359375, -14.336669921875, -13.79150390625, -13.246337890625, -12.701171875, -12.156005859375, -11.61083984375, -11.065673828125, -10.5205078125, -9.975341796875, -9.43017578125, -8.885009765625, -8.33984375, -7.794677734375, -7.24951171875, -6.704345703125, -6.1591796875, -5.614013671875, -5.06884765625, -4.523681640625, -3.978515625, -3.433349609375, -2.88818359375, -2.343017578125, -1.7978515625, -1.252685546875, -0.70751953125, -0.162353515625, 0.3828125, 0.927978515625, 1.47314453125, 2.018310546875, 2.5634765625, 3.108642578125, 3.65380859375, 4.198974609375, 4.744140625, 5.289306640625, 5.83447265625, 6.379638671875, 6.9248046875, 7.469970703125, 8.01513671875, 8.560302734375, 9.10546875, 9.650634765625, 10.19580078125, 10.740966796875, 11.2861328125, 11.831298828125, 12.37646484375, 12.921630859375, 13.466796875, 14.011962890625, 14.55712890625, 15.102294921875, 15.6474609375, 16.192626953125, 16.73779296875, 17.282958984375, 17.828125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 9.0, 12.0, 25.0, 30.0, 62.0, 107.0, 197.0, 340.0, 645.0, 1242.0, 2893.0, 8840.0, 33879.0, 171097.0, 567919.0, 205810.0, 39334.0, 10029.0, 3314.0, 1280.0, 657.0, 358.0, 193.0, 129.0, 61.0, 33.0, 19.0, 10.0, 9.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.429931640625, -0.4171180725097656, -0.40430450439453125, -0.3914909362792969, -0.3786773681640625, -0.3658638000488281, -0.35305023193359375, -0.3402366638183594, -0.327423095703125, -0.3146095275878906, -0.30179595947265625, -0.2889823913574219, -0.2761688232421875, -0.2633552551269531, -0.25054168701171875, -0.23772811889648438, -0.22491455078125, -0.21210098266601562, -0.19928741455078125, -0.18647384643554688, -0.1736602783203125, -0.16084671020507812, -0.14803314208984375, -0.13521957397460938, -0.122406005859375, -0.10959243774414062, -0.09677886962890625, -0.08396530151367188, -0.0711517333984375, -0.058338165283203125, -0.04552459716796875, -0.032711029052734375, -0.0198974609375, -0.007083892822265625, 0.00572967529296875, 0.018543243408203125, 0.0313568115234375, 0.044170379638671875, 0.05698394775390625, 0.06979751586914062, 0.082611083984375, 0.09542465209960938, 0.10823822021484375, 0.12105178833007812, 0.1338653564453125, 0.14667892456054688, 0.15949249267578125, 0.17230606079101562, 0.18511962890625, 0.19793319702148438, 0.21074676513671875, 0.22356033325195312, 0.2363739013671875, 0.24918746948242188, 0.26200103759765625, 0.2748146057128906, 0.287628173828125, 0.3004417419433594, 0.31325531005859375, 0.3260688781738281, 0.3388824462890625, 0.3516960144042969, 0.36450958251953125, 0.3773231506347656, 0.39013671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 5.0, 5.0, 3.0, 17.0, 17.0, 22.0, 43.0, 40.0, 58.0, 81.0, 96.0, 118.0, 141.0, 90.0, 87.0, 49.0, 44.0, 32.0, 16.0, 14.0, 6.0, 8.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00026988983154296875, -0.00026144087314605713, -0.0002529919147491455, -0.0002445429563522339, -0.00023609399795532227, -0.00022764503955841064, -0.00021919608116149902, -0.0002107471227645874, -0.00020229816436767578, -0.00019384920597076416, -0.00018540024757385254, -0.00017695128917694092, -0.0001685023307800293, -0.00016005337238311768, -0.00015160441398620605, -0.00014315545558929443, -0.0001347064971923828, -0.0001262575387954712, -0.00011780858039855957, -0.00010935962200164795, -0.00010091066360473633, -9.246170520782471e-05, -8.401274681091309e-05, -7.556378841400146e-05, -6.711483001708984e-05, -5.866587162017822e-05, -5.02169132232666e-05, -4.176795482635498e-05, -3.331899642944336e-05, -2.4870038032531738e-05, -1.6421079635620117e-05, -7.972121238708496e-06, 4.76837158203125e-07, 8.925795555114746e-06, 1.7374753952026367e-05, 2.5823712348937988e-05, 3.427267074584961e-05, 4.272162914276123e-05, 5.117058753967285e-05, 5.961954593658447e-05, 6.80685043334961e-05, 7.651746273040771e-05, 8.496642112731934e-05, 9.341537952423096e-05, 0.00010186433792114258, 0.0001103132963180542, 0.00011876225471496582, 0.00012721121311187744, 0.00013566017150878906, 0.00014410912990570068, 0.0001525580883026123, 0.00016100704669952393, 0.00016945600509643555, 0.00017790496349334717, 0.0001863539218902588, 0.0001948028802871704, 0.00020325183868408203, 0.00021170079708099365, 0.00022014975547790527, 0.0002285987138748169, 0.00023704767227172852, 0.00024549663066864014, 0.00025394558906555176, 0.0002623945474624634, 0.000270843505859375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 8.0, 18.0, 15.0, 16.0, 38.0, 47.0, 74.0, 139.0, 271.0, 516.0, 1112.0, 2675.0, 7678.0, 24544.0, 91800.0, 352531.0, 409087.0, 113432.0, 29893.0, 8895.0, 3229.0, 1300.0, 566.0, 280.0, 148.0, 82.0, 53.0, 33.0, 23.0, 9.0, 7.0, 9.0, 4.0, 5.0, 3.0, 3.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.286376953125, -0.27617645263671875, -0.2659759521484375, -0.25577545166015625, -0.245574951171875, -0.23537445068359375, -0.2251739501953125, -0.21497344970703125, -0.20477294921875, -0.19457244873046875, -0.1843719482421875, -0.17417144775390625, -0.163970947265625, -0.15377044677734375, -0.1435699462890625, -0.13336944580078125, -0.1231689453125, -0.11296844482421875, -0.1027679443359375, -0.09256744384765625, -0.082366943359375, -0.07216644287109375, -0.0619659423828125, -0.05176544189453125, -0.04156494140625, -0.03136444091796875, -0.0211639404296875, -0.01096343994140625, -0.000762939453125, 0.00943756103515625, 0.0196380615234375, 0.02983856201171875, 0.0400390625, 0.05023956298828125, 0.0604400634765625, 0.07064056396484375, 0.080841064453125, 0.09104156494140625, 0.1012420654296875, 0.11144256591796875, 0.12164306640625, 0.13184356689453125, 0.1420440673828125, 0.15224456787109375, 0.162445068359375, 0.17264556884765625, 0.1828460693359375, 0.19304656982421875, 0.2032470703125, 0.21344757080078125, 0.2236480712890625, 0.23384857177734375, 0.244049072265625, 0.25424957275390625, 0.2644500732421875, 0.27465057373046875, 0.28485107421875, 0.29505157470703125, 0.3052520751953125, 0.31545257568359375, 0.325653076171875, 0.33585357666015625, 0.3460540771484375, 0.35625457763671875, 0.366455078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 1.0, 3.0, 12.0, 8.0, 13.0, 20.0, 28.0, 30.0, 42.0, 44.0, 44.0, 65.0, 57.0, 70.0, 55.0, 78.0, 79.0, 64.0, 52.0, 41.0, 41.0, 33.0, 25.0, 30.0, 17.0, 10.0, 9.0, 4.0, 6.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09356689453125, -0.09040451049804688, -0.08724212646484375, -0.08407974243164062, -0.0809173583984375, -0.07775497436523438, -0.07459259033203125, -0.07143020629882812, -0.068267822265625, -0.06510543823242188, -0.06194305419921875, -0.058780670166015625, -0.0556182861328125, -0.052455902099609375, -0.04929351806640625, -0.046131134033203125, -0.04296875, -0.039806365966796875, -0.03664398193359375, -0.033481597900390625, -0.0303192138671875, -0.027156829833984375, -0.02399444580078125, -0.020832061767578125, -0.017669677734375, -0.014507293701171875, -0.01134490966796875, -0.008182525634765625, -0.0050201416015625, -0.001857757568359375, 0.00130462646484375, 0.004467010498046875, 0.00762939453125, 0.010791778564453125, 0.01395416259765625, 0.017116546630859375, 0.0202789306640625, 0.023441314697265625, 0.02660369873046875, 0.029766082763671875, 0.032928466796875, 0.036090850830078125, 0.03925323486328125, 0.042415618896484375, 0.0455780029296875, 0.048740386962890625, 0.05190277099609375, 0.055065155029296875, 0.0582275390625, 0.061389923095703125, 0.06455230712890625, 0.06771469116210938, 0.0708770751953125, 0.07403945922851562, 0.07720184326171875, 0.08036422729492188, 0.083526611328125, 0.08668899536132812, 0.08985137939453125, 0.09301376342773438, 0.0961761474609375, 0.09933853149414062, 0.10250091552734375, 0.10566329956054688, 0.10882568359375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 17.0, 151.0, 553.0, 258.0, 29.0, 1.0, 2.0], "bins": [-154.35585021972656, -151.76426696777344, -149.17269897460938, -146.58111572265625, -143.9895477294922, -141.39796447753906, -138.806396484375, -136.21481323242188, -133.6232452392578, -131.0316619873047, -128.44009399414062, -125.84851837158203, -123.25694274902344, -120.66535949707031, -118.07379150390625, -115.48220825195312, -112.890625, -110.2990493774414, -107.70747375488281, -105.11589813232422, -102.52432250976562, -99.9327392578125, -97.34117126464844, -94.74958801269531, -92.15802001953125, -89.56644439697266, -86.97486877441406, -84.38329315185547, -81.79171752929688, -79.20013427734375, -76.60856628417969, -74.01698303222656, -71.42540740966797, -68.83383178710938, -66.24225616455078, -63.65068054199219, -61.05910110473633, -58.467525482177734, -55.87594985961914, -53.28437042236328, -50.69279861450195, -48.10122299194336, -45.509647369384766, -42.918067932128906, -40.32649230957031, -37.73491668701172, -35.143341064453125, -32.55176544189453, -29.960189819335938, -27.368614196777344, -24.777036666870117, -22.185461044311523, -19.593883514404297, -17.002307891845703, -14.41073226928711, -11.819154739379883, -9.227578163146973, -6.6360015869140625, -4.0444254875183105, -1.4528493881225586, 1.1387271881103516, 3.7303037643432617, 6.3218793869018555, 8.913456916809082, 11.505032539367676]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 10.0, 8.0, 13.0, 17.0, 16.0, 19.0, 20.0, 33.0, 40.0, 29.0, 41.0, 63.0, 52.0, 51.0, 68.0, 59.0, 54.0, 48.0, 47.0, 42.0, 45.0, 41.0, 38.0, 25.0, 21.0, 23.0, 21.0, 10.0, 15.0, 9.0, 2.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.031588554382324, -9.67660140991211, -9.321614265441895, -8.96662712097168, -8.611639976501465, -8.25665283203125, -7.901665687561035, -7.54667854309082, -7.1916913986206055, -6.836704254150391, -6.481717109680176, -6.126729965209961, -5.771742820739746, -5.416755676269531, -5.061768531799316, -4.706781387329102, -4.351794242858887, -3.996807098388672, -3.641819953918457, -3.286832809448242, -2.9318456649780273, -2.5768585205078125, -2.2218713760375977, -1.8668842315673828, -1.511897087097168, -1.1569099426269531, -0.8019227981567383, -0.44693565368652344, -0.0919485092163086, 0.26303863525390625, 0.6180257797241211, 0.9730129241943359, 1.3279991149902344, 1.6829862594604492, 2.037973403930664, 2.392960548400879, 2.7479476928710938, 3.1029348373413086, 3.4579219818115234, 3.8129091262817383, 4.167896270751953, 4.522883415222168, 4.877870559692383, 5.232857704162598, 5.5878448486328125, 5.942831993103027, 6.297819137573242, 6.652806282043457, 7.007793426513672, 7.362780570983887, 7.717767715454102, 8.072754859924316, 8.427742004394531, 8.782729148864746, 9.137716293334961, 9.492703437805176, 9.84769058227539, 10.202677726745605, 10.55766487121582, 10.912652015686035, 11.26763916015625, 11.622626304626465, 11.97761344909668, 12.332600593566895, 12.68758773803711]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 6.0, 3.0, 5.0, 12.0, 7.0, 8.0, 9.0, 17.0, 15.0, 23.0, 17.0, 38.0, 38.0, 102.0, 177.0, 512.0, 1994.0, 12361.0, 108577.0, 594458.0, 291019.0, 33054.0, 4510.0, 937.0, 274.0, 121.0, 66.0, 37.0, 37.0, 32.0, 22.0, 14.0, 16.0, 6.0, 9.0, 4.0, 4.0, 6.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.546875, -18.910888671875, -18.27490234375, -17.638916015625, -17.0029296875, -16.366943359375, -15.73095703125, -15.094970703125, -14.458984375, -13.822998046875, -13.18701171875, -12.551025390625, -11.9150390625, -11.279052734375, -10.64306640625, -10.007080078125, -9.37109375, -8.735107421875, -8.09912109375, -7.463134765625, -6.8271484375, -6.191162109375, -5.55517578125, -4.919189453125, -4.283203125, -3.647216796875, -3.01123046875, -2.375244140625, -1.7392578125, -1.103271484375, -0.46728515625, 0.168701171875, 0.8046875, 1.440673828125, 2.07666015625, 2.712646484375, 3.3486328125, 3.984619140625, 4.62060546875, 5.256591796875, 5.892578125, 6.528564453125, 7.16455078125, 7.800537109375, 8.4365234375, 9.072509765625, 9.70849609375, 10.344482421875, 10.98046875, 11.616455078125, 12.25244140625, 12.888427734375, 13.5244140625, 14.160400390625, 14.79638671875, 15.432373046875, 16.068359375, 16.704345703125, 17.34033203125, 17.976318359375, 18.6123046875, 19.248291015625, 19.88427734375, 20.520263671875, 21.15625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 8.0, 16.0, 28.0, 31.0, 23.0, 42.0, 55.0, 64.0, 78.0, 90.0, 83.0, 76.0, 68.0, 75.0, 54.0, 57.0, 48.0, 26.0, 25.0, 19.0, 15.0, 3.0, 5.0, 3.0, 3.0, 1.0, 3.0], "bins": [-42.65625, -41.7608642578125, -40.865478515625, -39.9700927734375, -39.07470703125, -38.1793212890625, -37.283935546875, -36.3885498046875, -35.4931640625, -34.5977783203125, -33.702392578125, -32.8070068359375, -31.91162109375, -31.0162353515625, -30.120849609375, -29.2254638671875, -28.330078125, -27.4346923828125, -26.539306640625, -25.6439208984375, -24.74853515625, -23.8531494140625, -22.957763671875, -22.0623779296875, -21.1669921875, -20.2716064453125, -19.376220703125, -18.4808349609375, -17.58544921875, -16.6900634765625, -15.794677734375, -14.8992919921875, -14.00390625, -13.1085205078125, -12.213134765625, -11.3177490234375, -10.42236328125, -9.5269775390625, -8.631591796875, -7.7362060546875, -6.8408203125, -5.9454345703125, -5.050048828125, -4.1546630859375, -3.25927734375, -2.3638916015625, -1.468505859375, -0.5731201171875, 0.322265625, 1.2176513671875, 2.113037109375, 3.0084228515625, 3.90380859375, 4.7991943359375, 5.694580078125, 6.5899658203125, 7.4853515625, 8.3807373046875, 9.276123046875, 10.1715087890625, 11.06689453125, 11.9622802734375, 12.857666015625, 13.7530517578125, 14.6484375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 5.0, 6.0, 9.0, 13.0, 17.0, 27.0, 39.0, 46.0, 67.0, 105.0, 169.0, 255.0, 484.0, 2637.0, 149333.0, 871419.0, 21782.0, 1124.0, 373.0, 207.0, 146.0, 85.0, 56.0, 46.0, 20.0, 20.0, 15.0, 11.0, 16.0, 4.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.71875, -39.49560546875, -38.2724609375, -37.04931640625, -35.826171875, -34.60302734375, -33.3798828125, -32.15673828125, -30.93359375, -29.71044921875, -28.4873046875, -27.26416015625, -26.041015625, -24.81787109375, -23.5947265625, -22.37158203125, -21.1484375, -19.92529296875, -18.7021484375, -17.47900390625, -16.255859375, -15.03271484375, -13.8095703125, -12.58642578125, -11.36328125, -10.14013671875, -8.9169921875, -7.69384765625, -6.470703125, -5.24755859375, -4.0244140625, -2.80126953125, -1.578125, -0.35498046875, 0.8681640625, 2.09130859375, 3.314453125, 4.53759765625, 5.7607421875, 6.98388671875, 8.20703125, 9.43017578125, 10.6533203125, 11.87646484375, 13.099609375, 14.32275390625, 15.5458984375, 16.76904296875, 17.9921875, 19.21533203125, 20.4384765625, 21.66162109375, 22.884765625, 24.10791015625, 25.3310546875, 26.55419921875, 27.77734375, 29.00048828125, 30.2236328125, 31.44677734375, 32.669921875, 33.89306640625, 35.1162109375, 36.33935546875, 37.5625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 3.0, 6.0, 4.0, 8.0, 11.0, 11.0, 13.0, 17.0, 15.0, 26.0, 43.0, 32.0, 37.0, 43.0, 50.0, 43.0, 67.0, 51.0, 57.0, 49.0, 55.0, 57.0, 50.0, 44.0, 32.0, 31.0, 29.0, 24.0, 17.0, 18.0, 20.0, 15.0, 3.0, 7.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.078125, -19.286865234375, -18.49560546875, -17.704345703125, -16.9130859375, -16.121826171875, -15.33056640625, -14.539306640625, -13.748046875, -12.956787109375, -12.16552734375, -11.374267578125, -10.5830078125, -9.791748046875, -9.00048828125, -8.209228515625, -7.41796875, -6.626708984375, -5.83544921875, -5.044189453125, -4.2529296875, -3.461669921875, -2.67041015625, -1.879150390625, -1.087890625, -0.296630859375, 0.49462890625, 1.285888671875, 2.0771484375, 2.868408203125, 3.65966796875, 4.450927734375, 5.2421875, 6.033447265625, 6.82470703125, 7.615966796875, 8.4072265625, 9.198486328125, 9.98974609375, 10.781005859375, 11.572265625, 12.363525390625, 13.15478515625, 13.946044921875, 14.7373046875, 15.528564453125, 16.31982421875, 17.111083984375, 17.90234375, 18.693603515625, 19.48486328125, 20.276123046875, 21.0673828125, 21.858642578125, 22.64990234375, 23.441162109375, 24.232421875, 25.023681640625, 25.81494140625, 26.606201171875, 27.3974609375, 28.188720703125, 28.97998046875, 29.771240234375, 30.5625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 8.0, 7.0, 25.0, 49.0, 142.0, 549.0, 4812.0, 821913.0, 217427.0, 2934.0, 451.0, 142.0, 42.0, 18.0, 12.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.96875, -30.966796875, -29.96484375, -28.962890625, -27.9609375, -26.958984375, -25.95703125, -24.955078125, -23.953125, -22.951171875, -21.94921875, -20.947265625, -19.9453125, -18.943359375, -17.94140625, -16.939453125, -15.9375, -14.935546875, -13.93359375, -12.931640625, -11.9296875, -10.927734375, -9.92578125, -8.923828125, -7.921875, -6.919921875, -5.91796875, -4.916015625, -3.9140625, -2.912109375, -1.91015625, -0.908203125, 0.09375, 1.095703125, 2.09765625, 3.099609375, 4.1015625, 5.103515625, 6.10546875, 7.107421875, 8.109375, 9.111328125, 10.11328125, 11.115234375, 12.1171875, 13.119140625, 14.12109375, 15.123046875, 16.125, 17.126953125, 18.12890625, 19.130859375, 20.1328125, 21.134765625, 22.13671875, 23.138671875, 24.140625, 25.142578125, 26.14453125, 27.146484375, 28.1484375, 29.150390625, 30.15234375, 31.154296875, 32.15625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 6.0, 0.0, 3.0, 2.0, 5.0, 4.0, 9.0, 14.0, 32.0, 49.0, 87.0, 132.0, 208.0, 175.0, 122.0, 55.0, 35.0, 28.0, 16.0, 8.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017805099487304688, -0.0017206817865371704, -0.001660853624343872, -0.0016010254621505737, -0.0015411972999572754, -0.001481369137763977, -0.0014215409755706787, -0.0013617128133773804, -0.001301884651184082, -0.0012420564889907837, -0.0011822283267974854, -0.001122400164604187, -0.0010625720024108887, -0.0010027438402175903, -0.000942915678024292, -0.0008830875158309937, -0.0008232593536376953, -0.000763431191444397, -0.0007036030292510986, -0.0006437748670578003, -0.000583946704864502, -0.0005241185426712036, -0.0004642903804779053, -0.00040446221828460693, -0.0003446340560913086, -0.00028480589389801025, -0.00022497773170471191, -0.00016514956951141357, -0.00010532140731811523, -4.5493245124816895e-05, 1.4334917068481445e-05, 7.416307926177979e-05, 0.00013399124145507812, 0.00019381940364837646, 0.0002536475658416748, 0.00031347572803497314, 0.0003733038902282715, 0.0004331320524215698, 0.0004929602146148682, 0.0005527883768081665, 0.0006126165390014648, 0.0006724447011947632, 0.0007322728633880615, 0.0007921010255813599, 0.0008519291877746582, 0.0009117573499679565, 0.0009715855121612549, 0.0010314136743545532, 0.0010912418365478516, 0.00115106999874115, 0.0012108981609344482, 0.0012707263231277466, 0.001330554485321045, 0.0013903826475143433, 0.0014502108097076416, 0.00151003897190094, 0.0015698671340942383, 0.0016296952962875366, 0.001689523458480835, 0.0017493516206741333, 0.0018091797828674316, 0.00186900794506073, 0.0019288361072540283, 0.0019886642694473267, 0.002048492431640625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 1.0, 4.0, 3.0, 7.0, 14.0, 10.0, 22.0, 25.0, 52.0, 85.0, 146.0, 509.0, 3981.0, 389487.0, 647979.0, 5250.0, 591.0, 173.0, 87.0, 46.0, 20.0, 23.0, 4.0, 9.0, 8.0, 4.0, 0.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.96875, -18.240478515625, -17.51220703125, -16.783935546875, -16.0556640625, -15.327392578125, -14.59912109375, -13.870849609375, -13.142578125, -12.414306640625, -11.68603515625, -10.957763671875, -10.2294921875, -9.501220703125, -8.77294921875, -8.044677734375, -7.31640625, -6.588134765625, -5.85986328125, -5.131591796875, -4.4033203125, -3.675048828125, -2.94677734375, -2.218505859375, -1.490234375, -0.761962890625, -0.03369140625, 0.694580078125, 1.4228515625, 2.151123046875, 2.87939453125, 3.607666015625, 4.3359375, 5.064208984375, 5.79248046875, 6.520751953125, 7.2490234375, 7.977294921875, 8.70556640625, 9.433837890625, 10.162109375, 10.890380859375, 11.61865234375, 12.346923828125, 13.0751953125, 13.803466796875, 14.53173828125, 15.260009765625, 15.98828125, 16.716552734375, 17.44482421875, 18.173095703125, 18.9013671875, 19.629638671875, 20.35791015625, 21.086181640625, 21.814453125, 22.542724609375, 23.27099609375, 23.999267578125, 24.7275390625, 25.455810546875, 26.18408203125, 26.912353515625, 27.640625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 1.0, 9.0, 5.0, 8.0, 15.0, 23.0, 35.0, 43.0, 49.0, 71.0, 96.0, 123.0, 122.0, 95.0, 70.0, 53.0, 43.0, 38.0, 29.0, 16.0, 15.0, 12.0, 7.0, 7.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.27734375, -3.1715087890625, -3.065673828125, -2.9598388671875, -2.85400390625, -2.7481689453125, -2.642333984375, -2.5364990234375, -2.4306640625, -2.3248291015625, -2.218994140625, -2.1131591796875, -2.00732421875, -1.9014892578125, -1.795654296875, -1.6898193359375, -1.583984375, -1.4781494140625, -1.372314453125, -1.2664794921875, -1.16064453125, -1.0548095703125, -0.948974609375, -0.8431396484375, -0.7373046875, -0.6314697265625, -0.525634765625, -0.4197998046875, -0.31396484375, -0.2081298828125, -0.102294921875, 0.0035400390625, 0.109375, 0.2152099609375, 0.321044921875, 0.4268798828125, 0.53271484375, 0.6385498046875, 0.744384765625, 0.8502197265625, 0.9560546875, 1.0618896484375, 1.167724609375, 1.2735595703125, 1.37939453125, 1.4852294921875, 1.591064453125, 1.6968994140625, 1.802734375, 1.9085693359375, 2.014404296875, 2.1202392578125, 2.22607421875, 2.3319091796875, 2.437744140625, 2.5435791015625, 2.6494140625, 2.7552490234375, 2.861083984375, 2.9669189453125, 3.07275390625, 3.1785888671875, 3.284423828125, 3.3902587890625, 3.49609375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 9.0, 3.0, 22.0, 53.0, 107.0, 184.0, 208.0, 187.0, 121.0, 65.0, 22.0, 17.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-96.90064239501953, -94.97946166992188, -93.05828094482422, -91.13710021972656, -89.21592712402344, -87.29474639892578, -85.37356567382812, -83.45238494873047, -81.53120422363281, -79.61002349853516, -77.6888427734375, -75.76766204833984, -73.84648132324219, -71.92530822753906, -70.0041275024414, -68.08294677734375, -66.1617660522461, -64.24058532714844, -62.31940460205078, -60.39822769165039, -58.477046966552734, -56.55586624145508, -54.63468933105469, -52.71350860595703, -50.792327880859375, -48.87114715576172, -46.94996643066406, -45.02878952026367, -43.107608795166016, -41.18642807006836, -39.26525115966797, -37.34407043457031, -35.422889709472656, -33.501708984375, -31.580530166625977, -29.659351348876953, -27.738170623779297, -25.81698989868164, -23.895811080932617, -21.974632263183594, -20.053451538085938, -18.13227081298828, -16.211091995239258, -14.289912223815918, -12.368732452392578, -10.447552680969238, -8.526372909545898, -6.605193138122559, -4.684013366699219, -2.762833595275879, -0.8416538238525391, 1.0795259475708008, 3.0007057189941406, 4.9218854904174805, 6.84306526184082, 8.76424503326416, 10.6854248046875, 12.60660457611084, 14.52778434753418, 16.448963165283203, 18.37014389038086, 20.291324615478516, 22.21250343322754, 24.133682250976562, 26.05486297607422]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 1.0, 6.0, 8.0, 12.0, 12.0, 10.0, 20.0, 21.0, 21.0, 18.0, 22.0, 33.0, 29.0, 37.0, 41.0, 47.0, 30.0, 48.0, 56.0, 44.0, 52.0, 41.0, 44.0, 41.0, 34.0, 31.0, 31.0, 33.0, 26.0, 25.0, 26.0, 21.0, 16.0, 12.0, 11.0, 13.0, 8.0, 5.0, 5.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.08196258544922, -41.916744232177734, -40.75152587890625, -39.586307525634766, -38.42108917236328, -37.25586700439453, -36.09065246582031, -34.92543029785156, -33.76021194458008, -32.594993591308594, -31.42977523803711, -30.264556884765625, -29.099336624145508, -27.934118270874023, -26.76889991760254, -25.603679656982422, -24.43846321105957, -23.273244857788086, -22.1080265045166, -20.942806243896484, -19.777587890625, -18.612369537353516, -17.44715118408203, -16.281932830810547, -15.116713523864746, -13.951495170593262, -12.786275863647461, -11.621057510375977, -10.455839157104492, -9.290619850158691, -8.125401496887207, -6.960182189941406, -5.794963836669922, -4.629745006561279, -3.464526414871216, -2.2993078231811523, -1.1340889930725098, 0.031129837036132812, 1.1963481903076172, 2.361567497253418, 3.5267858505249023, 4.692004680633545, 5.8572235107421875, 7.022441864013672, 8.187660217285156, 9.352879524230957, 10.518097877502441, 11.683317184448242, 12.848535537719727, 14.013753890991211, 15.178973197937012, 16.344192504882812, 17.509410858154297, 18.67462921142578, 19.839847564697266, 21.00506591796875, 22.170284271240234, 23.33550262451172, 24.500720977783203, 25.665939331054688, 26.831159591674805, 27.99637794494629, 29.161596298217773, 30.32681655883789, 31.492034912109375]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 0.0, 8.0, 3.0, 13.0, 17.0, 32.0, 59.0, 118.0, 295.0, 780.0, 1733.0, 24897.0, 4142931.0, 22417.0, 502.0, 168.0, 93.0, 57.0, 42.0, 16.0, 21.0, 14.0, 15.0, 8.0, 11.0, 4.0, 3.0, 2.0, 5.0, 2.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.0, -62.345703125, -59.69140625, -57.037109375, -54.3828125, -51.728515625, -49.07421875, -46.419921875, -43.765625, -41.111328125, -38.45703125, -35.802734375, -33.1484375, -30.494140625, -27.83984375, -25.185546875, -22.53125, -19.876953125, -17.22265625, -14.568359375, -11.9140625, -9.259765625, -6.60546875, -3.951171875, -1.296875, 1.357421875, 4.01171875, 6.666015625, 9.3203125, 11.974609375, 14.62890625, 17.283203125, 19.9375, 22.591796875, 25.24609375, 27.900390625, 30.5546875, 33.208984375, 35.86328125, 38.517578125, 41.171875, 43.826171875, 46.48046875, 49.134765625, 51.7890625, 54.443359375, 57.09765625, 59.751953125, 62.40625, 65.060546875, 67.71484375, 70.369140625, 73.0234375, 75.677734375, 78.33203125, 80.986328125, 83.640625, 86.294921875, 88.94921875, 91.603515625, 94.2578125, 96.912109375, 99.56640625, 102.220703125, 104.875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 11.0, 17.0, 12.0, 43.0, 47.0, 82.0, 79.0, 104.0, 97.0, 124.0, 91.0, 72.0, 58.0, 67.0, 41.0, 27.0, 19.0, 7.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.953125, -14.075927734375, -13.19873046875, -12.321533203125, -11.4443359375, -10.567138671875, -9.68994140625, -8.812744140625, -7.935546875, -7.058349609375, -6.18115234375, -5.303955078125, -4.4267578125, -3.549560546875, -2.67236328125, -1.795166015625, -0.91796875, -0.040771484375, 0.83642578125, 1.713623046875, 2.5908203125, 3.468017578125, 4.34521484375, 5.222412109375, 6.099609375, 6.976806640625, 7.85400390625, 8.731201171875, 9.6083984375, 10.485595703125, 11.36279296875, 12.239990234375, 13.1171875, 13.994384765625, 14.87158203125, 15.748779296875, 16.6259765625, 17.503173828125, 18.38037109375, 19.257568359375, 20.134765625, 21.011962890625, 21.88916015625, 22.766357421875, 23.6435546875, 24.520751953125, 25.39794921875, 26.275146484375, 27.15234375, 28.029541015625, 28.90673828125, 29.783935546875, 30.6611328125, 31.538330078125, 32.41552734375, 33.292724609375, 34.169921875, 35.047119140625, 35.92431640625, 36.801513671875, 37.6787109375, 38.555908203125, 39.43310546875, 40.310302734375, 41.1875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 7.0, 10.0, 28.0, 29.0, 62.0, 100.0, 250.0, 560.0, 1454.0, 5874.0, 90552.0, 3719326.0, 361269.0, 11233.0, 2114.0, 700.0, 337.0, 156.0, 80.0, 49.0, 34.0, 25.0, 9.0, 4.0, 5.0, 8.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.453125, -29.459716796875, -28.46630859375, -27.472900390625, -26.4794921875, -25.486083984375, -24.49267578125, -23.499267578125, -22.505859375, -21.512451171875, -20.51904296875, -19.525634765625, -18.5322265625, -17.538818359375, -16.54541015625, -15.552001953125, -14.55859375, -13.565185546875, -12.57177734375, -11.578369140625, -10.5849609375, -9.591552734375, -8.59814453125, -7.604736328125, -6.611328125, -5.617919921875, -4.62451171875, -3.631103515625, -2.6376953125, -1.644287109375, -0.65087890625, 0.342529296875, 1.3359375, 2.329345703125, 3.32275390625, 4.316162109375, 5.3095703125, 6.302978515625, 7.29638671875, 8.289794921875, 9.283203125, 10.276611328125, 11.27001953125, 12.263427734375, 13.2568359375, 14.250244140625, 15.24365234375, 16.237060546875, 17.23046875, 18.223876953125, 19.21728515625, 20.210693359375, 21.2041015625, 22.197509765625, 23.19091796875, 24.184326171875, 25.177734375, 26.171142578125, 27.16455078125, 28.157958984375, 29.1513671875, 30.144775390625, 31.13818359375, 32.131591796875, 33.125]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 7.0, 6.0, 13.0, 22.0, 32.0, 73.0, 111.0, 226.0, 394.0, 659.0, 899.0, 783.0, 425.0, 206.0, 95.0, 69.0, 20.0, 14.0, 10.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.328125, -8.044921875, -7.76171875, -7.478515625, -7.1953125, -6.912109375, -6.62890625, -6.345703125, -6.0625, -5.779296875, -5.49609375, -5.212890625, -4.9296875, -4.646484375, -4.36328125, -4.080078125, -3.796875, -3.513671875, -3.23046875, -2.947265625, -2.6640625, -2.380859375, -2.09765625, -1.814453125, -1.53125, -1.248046875, -0.96484375, -0.681640625, -0.3984375, -0.115234375, 0.16796875, 0.451171875, 0.734375, 1.017578125, 1.30078125, 1.583984375, 1.8671875, 2.150390625, 2.43359375, 2.716796875, 3.0, 3.283203125, 3.56640625, 3.849609375, 4.1328125, 4.416015625, 4.69921875, 4.982421875, 5.265625, 5.548828125, 5.83203125, 6.115234375, 6.3984375, 6.681640625, 6.96484375, 7.248046875, 7.53125, 7.814453125, 8.09765625, 8.380859375, 8.6640625, 8.947265625, 9.23046875, 9.513671875, 9.796875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 9.0, 15.0, 39.0, 77.0, 119.0, 161.0, 188.0, 148.0, 108.0, 76.0, 28.0, 27.0, 7.0, 3.0, 1.0, 2.0], "bins": [-67.376953125, -66.13509368896484, -64.89322662353516, -63.6513671875, -62.40950393676758, -61.167640686035156, -59.925777435302734, -58.68391418457031, -57.442054748535156, -56.200191497802734, -54.95832824707031, -53.716468811035156, -52.474605560302734, -51.23274230957031, -49.99087905883789, -48.74901580810547, -47.50715637207031, -46.26529312133789, -45.02342987060547, -43.78157043457031, -42.53970718383789, -41.29784393310547, -40.05598068237305, -38.814117431640625, -37.5722541809082, -36.33039093017578, -35.08852767944336, -33.8466682434082, -32.60480499267578, -31.36294174194336, -30.121078491210938, -28.87921714782715, -27.637357711791992, -26.39549446105957, -25.15363311767578, -23.91176986694336, -22.66990852355957, -21.42804527282715, -20.18618392944336, -18.944320678710938, -17.702457427978516, -16.460594177246094, -15.218732833862305, -13.976869583129883, -12.735008239746094, -11.493144989013672, -10.251282691955566, -9.009420394897461, -7.767559051513672, -6.525696754455566, -5.283834457397461, -4.041971683502197, -2.800109386444092, -1.5582470893859863, -0.31638431549072266, 0.9254779815673828, 2.1673402786254883, 3.4092025756835938, 4.651064872741699, 5.892927646636963, 7.134789943695068, 8.376651763916016, 9.618515014648438, 10.860377311706543, 12.102239608764648]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 8.0, 10.0, 14.0, 11.0, 18.0, 25.0, 25.0, 25.0, 25.0, 38.0, 48.0, 50.0, 60.0, 57.0, 61.0, 51.0, 49.0, 52.0, 50.0, 56.0, 40.0, 49.0, 34.0, 27.0, 26.0, 21.0, 12.0, 16.0, 14.0, 7.0, 8.0, 3.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.828600883483887, -10.330092430114746, -9.831583976745605, -9.333075523376465, -8.834567070007324, -8.336058616638184, -7.837549686431885, -7.339041233062744, -6.8405327796936035, -6.342024326324463, -5.843515872955322, -5.345006942749023, -4.846498489379883, -4.347990036010742, -3.8494815826416016, -3.350973129272461, -2.8524646759033203, -2.3539562225341797, -1.8554476499557495, -1.3569390773773193, -0.8584306240081787, -0.3599221706390381, 0.13858652114868164, 0.6370949745178223, 1.135603427886963, 1.6341118812561035, 2.132620334625244, 2.631129026412964, 3.1296374797821045, 3.628145933151245, 4.126654624938965, 4.6251630783081055, 5.12367057800293, 5.62217903137207, 6.120687484741211, 6.619195938110352, 7.117704391479492, 7.616212844848633, 8.114721298217773, 8.613229751586914, 9.111738204956055, 9.610246658325195, 10.108755111694336, 10.607263565063477, 11.105772018432617, 11.604280471801758, 12.102788925170898, 12.601297378540039, 13.099806785583496, 13.598315238952637, 14.096823692321777, 14.595332145690918, 15.093840599060059, 15.5923490524292, 16.090858459472656, 16.589366912841797, 17.087875366210938, 17.586383819580078, 18.08489227294922, 18.58340072631836, 19.0819091796875, 19.58041763305664, 20.07892608642578, 20.577434539794922, 21.075942993164062]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 2.0, 7.0, 2.0, 14.0, 14.0, 15.0, 17.0, 13.0, 24.0, 41.0, 39.0, 58.0, 81.0, 131.0, 258.0, 543.0, 1899.0, 7742.0, 37048.0, 191456.0, 520538.0, 230439.0, 45260.0, 9283.0, 2286.0, 631.0, 243.0, 132.0, 79.0, 60.0, 39.0, 33.0, 24.0, 22.0, 19.0, 14.0, 13.0, 8.0, 10.0, 6.0, 6.0, 7.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0078125, -2.902496337890625, -2.79718017578125, -2.691864013671875, -2.5865478515625, -2.481231689453125, -2.37591552734375, -2.270599365234375, -2.165283203125, -2.059967041015625, -1.95465087890625, -1.849334716796875, -1.7440185546875, -1.638702392578125, -1.53338623046875, -1.428070068359375, -1.32275390625, -1.217437744140625, -1.11212158203125, -1.006805419921875, -0.9014892578125, -0.796173095703125, -0.69085693359375, -0.585540771484375, -0.480224609375, -0.374908447265625, -0.26959228515625, -0.164276123046875, -0.0589599609375, 0.046356201171875, 0.15167236328125, 0.256988525390625, 0.3623046875, 0.467620849609375, 0.57293701171875, 0.678253173828125, 0.7835693359375, 0.888885498046875, 0.99420166015625, 1.099517822265625, 1.204833984375, 1.310150146484375, 1.41546630859375, 1.520782470703125, 1.6260986328125, 1.731414794921875, 1.83673095703125, 1.942047119140625, 2.04736328125, 2.152679443359375, 2.25799560546875, 2.363311767578125, 2.4686279296875, 2.573944091796875, 2.67926025390625, 2.784576416015625, 2.889892578125, 2.995208740234375, 3.10052490234375, 3.205841064453125, 3.3111572265625, 3.416473388671875, 3.52178955078125, 3.627105712890625, 3.732421875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 6.0, 2.0, 13.0, 15.0, 31.0, 43.0, 47.0, 70.0, 99.0, 110.0, 121.0, 109.0, 98.0, 77.0, 63.0, 51.0, 22.0, 14.0, 13.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.78125, -15.11181640625, -14.4423828125, -13.77294921875, -13.103515625, -12.43408203125, -11.7646484375, -11.09521484375, -10.42578125, -9.75634765625, -9.0869140625, -8.41748046875, -7.748046875, -7.07861328125, -6.4091796875, -5.73974609375, -5.0703125, -4.40087890625, -3.7314453125, -3.06201171875, -2.392578125, -1.72314453125, -1.0537109375, -0.38427734375, 0.28515625, 0.95458984375, 1.6240234375, 2.29345703125, 2.962890625, 3.63232421875, 4.3017578125, 4.97119140625, 5.640625, 6.31005859375, 6.9794921875, 7.64892578125, 8.318359375, 8.98779296875, 9.6572265625, 10.32666015625, 10.99609375, 11.66552734375, 12.3349609375, 13.00439453125, 13.673828125, 14.34326171875, 15.0126953125, 15.68212890625, 16.3515625, 17.02099609375, 17.6904296875, 18.35986328125, 19.029296875, 19.69873046875, 20.3681640625, 21.03759765625, 21.70703125, 22.37646484375, 23.0458984375, 23.71533203125, 24.384765625, 25.05419921875, 25.7236328125, 26.39306640625, 27.0625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 6.0, 4.0, 13.0, 12.0, 18.0, 34.0, 45.0, 70.0, 99.0, 188.0, 275.0, 451.0, 683.0, 1138.0, 1922.0, 3022.0, 4981.0, 8665.0, 14866.0, 25841.0, 44349.0, 76782.0, 126790.0, 183574.0, 194212.0, 144909.0, 90127.0, 52441.0, 30113.0, 17315.0, 10042.0, 6049.0, 3557.0, 2233.0, 1360.0, 797.0, 544.0, 381.0, 228.0, 135.0, 109.0, 67.0, 32.0, 28.0, 15.0, 15.0, 8.0, 5.0, 6.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98193359375, -0.9482498168945312, -0.9145660400390625, -0.8808822631835938, -0.847198486328125, -0.8135147094726562, -0.7798309326171875, -0.7461471557617188, -0.71246337890625, -0.6787796020507812, -0.6450958251953125, -0.6114120483398438, -0.577728271484375, -0.5440444946289062, -0.5103607177734375, -0.47667694091796875, -0.4429931640625, -0.40930938720703125, -0.3756256103515625, -0.34194183349609375, -0.308258056640625, -0.27457427978515625, -0.2408905029296875, -0.20720672607421875, -0.17352294921875, -0.13983917236328125, -0.1061553955078125, -0.07247161865234375, -0.038787841796875, -0.00510406494140625, 0.0285797119140625, 0.06226348876953125, 0.095947265625, 0.12963104248046875, 0.1633148193359375, 0.19699859619140625, 0.230682373046875, 0.26436614990234375, 0.2980499267578125, 0.33173370361328125, 0.36541748046875, 0.39910125732421875, 0.4327850341796875, 0.46646881103515625, 0.500152587890625, 0.5338363647460938, 0.5675201416015625, 0.6012039184570312, 0.6348876953125, 0.6685714721679688, 0.7022552490234375, 0.7359390258789062, 0.769622802734375, 0.8033065795898438, 0.8369903564453125, 0.8706741333007812, 0.90435791015625, 0.9380416870117188, 0.9717254638671875, 1.0054092407226562, 1.039093017578125, 1.0727767944335938, 1.1064605712890625, 1.1401443481445312, 1.173828125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 6.0, 0.0, 2.0, 1.0, 7.0, 4.0, 7.0, 6.0, 7.0, 15.0, 18.0, 17.0, 33.0, 17.0, 32.0, 37.0, 36.0, 51.0, 46.0, 50.0, 59.0, 52.0, 56.0, 50.0, 61.0, 47.0, 35.0, 41.0, 31.0, 35.0, 26.0, 29.0, 17.0, 11.0, 14.0, 10.0, 10.0, 10.0, 13.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.1875, -17.497314453125, -16.80712890625, -16.116943359375, -15.4267578125, -14.736572265625, -14.04638671875, -13.356201171875, -12.666015625, -11.975830078125, -11.28564453125, -10.595458984375, -9.9052734375, -9.215087890625, -8.52490234375, -7.834716796875, -7.14453125, -6.454345703125, -5.76416015625, -5.073974609375, -4.3837890625, -3.693603515625, -3.00341796875, -2.313232421875, -1.623046875, -0.932861328125, -0.24267578125, 0.447509765625, 1.1376953125, 1.827880859375, 2.51806640625, 3.208251953125, 3.8984375, 4.588623046875, 5.27880859375, 5.968994140625, 6.6591796875, 7.349365234375, 8.03955078125, 8.729736328125, 9.419921875, 10.110107421875, 10.80029296875, 11.490478515625, 12.1806640625, 12.870849609375, 13.56103515625, 14.251220703125, 14.94140625, 15.631591796875, 16.32177734375, 17.011962890625, 17.7021484375, 18.392333984375, 19.08251953125, 19.772705078125, 20.462890625, 21.153076171875, 21.84326171875, 22.533447265625, 23.2236328125, 23.913818359375, 24.60400390625, 25.294189453125, 25.984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 5.0, 4.0, 4.0, 9.0, 16.0, 17.0, 20.0, 36.0, 59.0, 96.0, 101.0, 148.0, 221.0, 359.0, 518.0, 848.0, 1483.0, 2697.0, 5411.0, 12526.0, 30742.0, 82573.0, 233858.0, 392263.0, 177362.0, 62846.0, 23850.0, 9914.0, 4612.0, 2389.0, 1291.0, 756.0, 494.0, 325.0, 237.0, 132.0, 96.0, 69.0, 45.0, 31.0, 24.0, 19.0, 14.0, 6.0, 4.0, 8.0, 2.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.1878662109375, -0.18206214904785156, -0.17625808715820312, -0.1704540252685547, -0.16464996337890625, -0.1588459014892578, -0.15304183959960938, -0.14723777770996094, -0.1414337158203125, -0.13562965393066406, -0.12982559204101562, -0.12402153015136719, -0.11821746826171875, -0.11241340637207031, -0.10660934448242188, -0.10080528259277344, -0.095001220703125, -0.08919715881347656, -0.08339309692382812, -0.07758903503417969, -0.07178497314453125, -0.06598091125488281, -0.060176849365234375, -0.05437278747558594, -0.0485687255859375, -0.04276466369628906, -0.036960601806640625, -0.031156539916992188, -0.02535247802734375, -0.019548416137695312, -0.013744354248046875, -0.007940292358398438, -0.00213623046875, 0.0036678314208984375, 0.009471893310546875, 0.015275955200195312, 0.02108001708984375, 0.026884078979492188, 0.032688140869140625, 0.03849220275878906, 0.0442962646484375, 0.05010032653808594, 0.055904388427734375, 0.06170845031738281, 0.06751251220703125, 0.07331657409667969, 0.07912063598632812, 0.08492469787597656, 0.090728759765625, 0.09653282165527344, 0.10233688354492188, 0.10814094543457031, 0.11394500732421875, 0.11974906921386719, 0.12555313110351562, 0.13135719299316406, 0.1371612548828125, 0.14296531677246094, 0.14876937866210938, 0.1545734405517578, 0.16037750244140625, 0.1661815643310547, 0.17198562622070312, 0.17778968811035156, 0.18359375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 8.0, 9.0, 15.0, 24.0, 54.0, 85.0, 141.0, 197.0, 173.0, 121.0, 72.0, 40.0, 33.0, 14.0, 10.0, 9.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002117156982421875, -0.00020205974578857422, -0.00019240379333496094, -0.00018274784088134766, -0.00017309188842773438, -0.0001634359359741211, -0.0001537799835205078, -0.00014412403106689453, -0.00013446807861328125, -0.00012481212615966797, -0.00011515617370605469, -0.0001055002212524414, -9.584426879882812e-05, -8.618831634521484e-05, -7.653236389160156e-05, -6.687641143798828e-05, -5.7220458984375e-05, -4.756450653076172e-05, -3.790855407714844e-05, -2.8252601623535156e-05, -1.8596649169921875e-05, -8.940696716308594e-06, 7.152557373046875e-07, 1.0371208190917969e-05, 2.002716064453125e-05, 2.968311309814453e-05, 3.933906555175781e-05, 4.8995018005371094e-05, 5.8650970458984375e-05, 6.830692291259766e-05, 7.796287536621094e-05, 8.761882781982422e-05, 9.72747802734375e-05, 0.00010693073272705078, 0.00011658668518066406, 0.00012624263763427734, 0.00013589859008789062, 0.0001455545425415039, 0.0001552104949951172, 0.00016486644744873047, 0.00017452239990234375, 0.00018417835235595703, 0.0001938343048095703, 0.0002034902572631836, 0.00021314620971679688, 0.00022280216217041016, 0.00023245811462402344, 0.00024211406707763672, 0.00025177001953125, 0.0002614259719848633, 0.00027108192443847656, 0.00028073787689208984, 0.0002903938293457031, 0.0003000497817993164, 0.0003097057342529297, 0.00031936168670654297, 0.00032901763916015625, 0.00033867359161376953, 0.0003483295440673828, 0.0003579854965209961, 0.0003676414489746094, 0.00037729740142822266, 0.00038695335388183594, 0.0003966093063354492, 0.0004062652587890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 4.0, 5.0, 3.0, 8.0, 1.0, 12.0, 16.0, 21.0, 35.0, 40.0, 50.0, 104.0, 128.0, 203.0, 329.0, 577.0, 962.0, 1680.0, 3337.0, 7331.0, 17643.0, 49023.0, 148345.0, 377756.0, 287101.0, 97543.0, 32547.0, 12492.0, 5280.0, 2527.0, 1431.0, 717.0, 452.0, 308.0, 194.0, 101.0, 75.0, 43.0, 46.0, 18.0, 20.0, 13.0, 13.0, 6.0, 4.0, 3.0, 8.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.205078125, -0.19882774353027344, -0.19257736206054688, -0.1863269805908203, -0.18007659912109375, -0.1738262176513672, -0.16757583618164062, -0.16132545471191406, -0.1550750732421875, -0.14882469177246094, -0.14257431030273438, -0.1363239288330078, -0.13007354736328125, -0.12382316589355469, -0.11757278442382812, -0.11132240295410156, -0.105072021484375, -0.09882164001464844, -0.09257125854492188, -0.08632087707519531, -0.08007049560546875, -0.07382011413574219, -0.06756973266601562, -0.06131935119628906, -0.0550689697265625, -0.04881858825683594, -0.042568206787109375, -0.03631782531738281, -0.03006744384765625, -0.023817062377929688, -0.017566680908203125, -0.011316299438476562, -0.00506591796875, 0.0011844635009765625, 0.007434844970703125, 0.013685226440429688, 0.01993560791015625, 0.026185989379882812, 0.032436370849609375, 0.03868675231933594, 0.0449371337890625, 0.05118751525878906, 0.057437896728515625, 0.06368827819824219, 0.06993865966796875, 0.07618904113769531, 0.08243942260742188, 0.08868980407714844, 0.094940185546875, 0.10119056701660156, 0.10744094848632812, 0.11369132995605469, 0.11994171142578125, 0.1261920928955078, 0.13244247436523438, 0.13869285583496094, 0.1449432373046875, 0.15119361877441406, 0.15744400024414062, 0.1636943817138672, 0.16994476318359375, 0.1761951446533203, 0.18244552612304688, 0.18869590759277344, 0.1949462890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 7.0, 6.0, 4.0, 8.0, 3.0, 8.0, 20.0, 26.0, 26.0, 29.0, 31.0, 44.0, 42.0, 62.0, 58.0, 52.0, 50.0, 73.0, 60.0, 56.0, 36.0, 55.0, 40.0, 37.0, 25.0, 32.0, 28.0, 22.0, 19.0, 10.0, 5.0, 11.0, 8.0, 6.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.056671142578125, -0.054810523986816406, -0.05294990539550781, -0.05108928680419922, -0.049228668212890625, -0.04736804962158203, -0.04550743103027344, -0.043646812438964844, -0.04178619384765625, -0.039925575256347656, -0.03806495666503906, -0.03620433807373047, -0.034343719482421875, -0.03248310089111328, -0.030622482299804688, -0.028761863708496094, -0.0269012451171875, -0.025040626525878906, -0.023180007934570312, -0.02131938934326172, -0.019458770751953125, -0.01759815216064453, -0.015737533569335938, -0.013876914978027344, -0.01201629638671875, -0.010155677795410156, -0.008295059204101562, -0.006434440612792969, -0.004573822021484375, -0.0027132034301757812, -0.0008525848388671875, 0.0010080337524414062, 0.00286865234375, 0.004729270935058594, 0.0065898895263671875, 0.008450508117675781, 0.010311126708984375, 0.012171745300292969, 0.014032363891601562, 0.015892982482910156, 0.01775360107421875, 0.019614219665527344, 0.021474838256835938, 0.02333545684814453, 0.025196075439453125, 0.02705669403076172, 0.028917312622070312, 0.030777931213378906, 0.0326385498046875, 0.034499168395996094, 0.03635978698730469, 0.03822040557861328, 0.040081024169921875, 0.04194164276123047, 0.04380226135253906, 0.045662879943847656, 0.04752349853515625, 0.049384117126464844, 0.05124473571777344, 0.05310535430908203, 0.054965972900390625, 0.05682659149169922, 0.05868721008300781, 0.060547828674316406, 0.062408447265625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 7.0, 101.0, 609.0, 274.0, 22.0, 2.0], "bins": [-178.9852294921875, -176.03384399414062, -173.0824432373047, -170.1310577392578, -167.17967224121094, -164.228271484375, -161.27688598632812, -158.32550048828125, -155.3740997314453, -152.42271423339844, -149.4713134765625, -146.51992797851562, -143.56854248046875, -140.6171417236328, -137.66575622558594, -134.71437072753906, -131.76296997070312, -128.81158447265625, -125.86019134521484, -122.90879821777344, -119.95740509033203, -117.00601196289062, -114.05462646484375, -111.10323333740234, -108.15185546875, -105.2004623413086, -102.24907684326172, -99.29768371582031, -96.3462905883789, -93.3948974609375, -90.44351196289062, -87.49211883544922, -84.54073333740234, -81.58934020996094, -78.63795471191406, -75.68656158447266, -72.73516845703125, -69.78378295898438, -66.83238983154297, -63.88099670410156, -60.92960739135742, -57.97821807861328, -55.026824951171875, -52.075435638427734, -49.124046325683594, -46.17265319824219, -43.22126388549805, -40.269874572753906, -37.3184814453125, -34.36709213256836, -31.415699005126953, -28.464309692382812, -25.51291847229004, -22.561527252197266, -19.610137939453125, -16.65874671936035, -13.707354545593262, -10.755964279174805, -7.804573059082031, -4.853182792663574, -1.9017915725708008, 1.0495996475219727, 4.000988960266113, 6.952380180358887, 9.90377140045166]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 3.0, 7.0, 5.0, 13.0, 10.0, 16.0, 22.0, 43.0, 20.0, 40.0, 56.0, 59.0, 69.0, 80.0, 76.0, 64.0, 62.0, 62.0, 58.0, 61.0, 35.0, 42.0, 26.0, 18.0, 20.0, 14.0, 10.0, 5.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.303756713867188, -8.899028778076172, -8.494300842285156, -8.089571952819824, -7.684844017028809, -7.280116081237793, -6.875387668609619, -6.470659255981445, -6.06593132019043, -5.661203384399414, -5.25647497177124, -4.851746559143066, -4.447018623352051, -4.042290687561035, -3.6375622749328613, -3.2328341007232666, -2.828105926513672, -2.423377752304077, -2.0186495780944824, -1.6139214038848877, -1.209193229675293, -0.8044650554656982, -0.3997368812561035, 0.004991292953491211, 0.40971946716308594, 0.8144476413726807, 1.2191758155822754, 1.6239039897918701, 2.028632164001465, 2.4333603382110596, 2.8380885124206543, 3.242816686630249, 3.6475448608398438, 4.052272796630859, 4.457001209259033, 4.861729621887207, 5.266457557678223, 5.671185493469238, 6.075913906097412, 6.480642318725586, 6.885370254516602, 7.290098190307617, 7.694826602935791, 8.099555015563965, 8.50428295135498, 8.909010887145996, 9.313739776611328, 9.718467712402344, 10.12319564819336, 10.527923583984375, 10.93265151977539, 11.337380409240723, 11.742108345031738, 12.146836280822754, 12.551565170288086, 12.956293106079102, 13.361021041870117, 13.765748977661133, 14.170476913452148, 14.57520580291748, 14.979933738708496, 15.384661674499512, 15.789390563964844, 16.19411849975586, 16.598846435546875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 6.0, 4.0, 4.0, 9.0, 16.0, 19.0, 31.0, 46.0, 58.0, 115.0, 348.0, 1628.0, 17283.0, 281792.0, 683338.0, 58580.0, 4224.0, 638.0, 166.0, 60.0, 69.0, 34.0, 25.0, 8.0, 11.0, 12.0, 9.0, 5.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.46875, -19.79150390625, -19.1142578125, -18.43701171875, -17.759765625, -17.08251953125, -16.4052734375, -15.72802734375, -15.05078125, -14.37353515625, -13.6962890625, -13.01904296875, -12.341796875, -11.66455078125, -10.9873046875, -10.31005859375, -9.6328125, -8.95556640625, -8.2783203125, -7.60107421875, -6.923828125, -6.24658203125, -5.5693359375, -4.89208984375, -4.21484375, -3.53759765625, -2.8603515625, -2.18310546875, -1.505859375, -0.82861328125, -0.1513671875, 0.52587890625, 1.203125, 1.88037109375, 2.5576171875, 3.23486328125, 3.912109375, 4.58935546875, 5.2666015625, 5.94384765625, 6.62109375, 7.29833984375, 7.9755859375, 8.65283203125, 9.330078125, 10.00732421875, 10.6845703125, 11.36181640625, 12.0390625, 12.71630859375, 13.3935546875, 14.07080078125, 14.748046875, 15.42529296875, 16.1025390625, 16.77978515625, 17.45703125, 18.13427734375, 18.8115234375, 19.48876953125, 20.166015625, 20.84326171875, 21.5205078125, 22.19775390625, 22.875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 6.0, 9.0, 19.0, 16.0, 26.0, 28.0, 29.0, 35.0, 40.0, 55.0, 64.0, 44.0, 62.0, 61.0, 52.0, 68.0, 65.0, 42.0, 42.0, 37.0, 39.0, 40.0, 26.0, 26.0, 17.0, 17.0, 8.0, 5.0, 5.0, 4.0, 1.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.6875, -17.00439453125, -16.3212890625, -15.63818359375, -14.955078125, -14.27197265625, -13.5888671875, -12.90576171875, -12.22265625, -11.53955078125, -10.8564453125, -10.17333984375, -9.490234375, -8.80712890625, -8.1240234375, -7.44091796875, -6.7578125, -6.07470703125, -5.3916015625, -4.70849609375, -4.025390625, -3.34228515625, -2.6591796875, -1.97607421875, -1.29296875, -0.60986328125, 0.0732421875, 0.75634765625, 1.439453125, 2.12255859375, 2.8056640625, 3.48876953125, 4.171875, 4.85498046875, 5.5380859375, 6.22119140625, 6.904296875, 7.58740234375, 8.2705078125, 8.95361328125, 9.63671875, 10.31982421875, 11.0029296875, 11.68603515625, 12.369140625, 13.05224609375, 13.7353515625, 14.41845703125, 15.1015625, 15.78466796875, 16.4677734375, 17.15087890625, 17.833984375, 18.51708984375, 19.2001953125, 19.88330078125, 20.56640625, 21.24951171875, 21.9326171875, 22.61572265625, 23.298828125, 23.98193359375, 24.6650390625, 25.34814453125, 26.03125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 2.0, 0.0, 4.0, 5.0, 6.0, 10.0, 10.0, 14.0, 17.0, 6.0, 23.0, 28.0, 32.0, 42.0, 48.0, 77.0, 103.0, 151.0, 263.0, 585.0, 2328.0, 36397.0, 707364.0, 287262.0, 11355.0, 1208.0, 442.0, 227.0, 145.0, 112.0, 63.0, 40.0, 39.0, 30.0, 20.0, 20.0, 18.0, 11.0, 14.0, 11.0, 8.0, 4.0, 3.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.203125, -20.514892578125, -19.82666015625, -19.138427734375, -18.4501953125, -17.761962890625, -17.07373046875, -16.385498046875, -15.697265625, -15.009033203125, -14.32080078125, -13.632568359375, -12.9443359375, -12.256103515625, -11.56787109375, -10.879638671875, -10.19140625, -9.503173828125, -8.81494140625, -8.126708984375, -7.4384765625, -6.750244140625, -6.06201171875, -5.373779296875, -4.685546875, -3.997314453125, -3.30908203125, -2.620849609375, -1.9326171875, -1.244384765625, -0.55615234375, 0.132080078125, 0.8203125, 1.508544921875, 2.19677734375, 2.885009765625, 3.5732421875, 4.261474609375, 4.94970703125, 5.637939453125, 6.326171875, 7.014404296875, 7.70263671875, 8.390869140625, 9.0791015625, 9.767333984375, 10.45556640625, 11.143798828125, 11.83203125, 12.520263671875, 13.20849609375, 13.896728515625, 14.5849609375, 15.273193359375, 15.96142578125, 16.649658203125, 17.337890625, 18.026123046875, 18.71435546875, 19.402587890625, 20.0908203125, 20.779052734375, 21.46728515625, 22.155517578125, 22.84375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 7.0, 6.0, 11.0, 13.0, 12.0, 22.0, 17.0, 34.0, 28.0, 34.0, 38.0, 33.0, 41.0, 49.0, 41.0, 67.0, 55.0, 46.0, 33.0, 39.0, 43.0, 43.0, 30.0, 44.0, 25.0, 37.0, 22.0, 18.0, 18.0, 26.0, 13.0, 14.0, 10.0, 10.0, 1.0, 5.0, 4.0, 1.0, 1.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.0, -23.2978515625, -22.595703125, -21.8935546875, -21.19140625, -20.4892578125, -19.787109375, -19.0849609375, -18.3828125, -17.6806640625, -16.978515625, -16.2763671875, -15.57421875, -14.8720703125, -14.169921875, -13.4677734375, -12.765625, -12.0634765625, -11.361328125, -10.6591796875, -9.95703125, -9.2548828125, -8.552734375, -7.8505859375, -7.1484375, -6.4462890625, -5.744140625, -5.0419921875, -4.33984375, -3.6376953125, -2.935546875, -2.2333984375, -1.53125, -0.8291015625, -0.126953125, 0.5751953125, 1.27734375, 1.9794921875, 2.681640625, 3.3837890625, 4.0859375, 4.7880859375, 5.490234375, 6.1923828125, 6.89453125, 7.5966796875, 8.298828125, 9.0009765625, 9.703125, 10.4052734375, 11.107421875, 11.8095703125, 12.51171875, 13.2138671875, 13.916015625, 14.6181640625, 15.3203125, 16.0224609375, 16.724609375, 17.4267578125, 18.12890625, 18.8310546875, 19.533203125, 20.2353515625, 20.9375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 5.0, 18.0, 45.0, 164.0, 911.0, 13321.0, 1024838.0, 8332.0, 687.0, 136.0, 44.0, 15.0, 8.0, 7.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-35.375, -34.24951171875, -33.1240234375, -31.99853515625, -30.873046875, -29.74755859375, -28.6220703125, -27.49658203125, -26.37109375, -25.24560546875, -24.1201171875, -22.99462890625, -21.869140625, -20.74365234375, -19.6181640625, -18.49267578125, -17.3671875, -16.24169921875, -15.1162109375, -13.99072265625, -12.865234375, -11.73974609375, -10.6142578125, -9.48876953125, -8.36328125, -7.23779296875, -6.1123046875, -4.98681640625, -3.861328125, -2.73583984375, -1.6103515625, -0.48486328125, 0.640625, 1.76611328125, 2.8916015625, 4.01708984375, 5.142578125, 6.26806640625, 7.3935546875, 8.51904296875, 9.64453125, 10.77001953125, 11.8955078125, 13.02099609375, 14.146484375, 15.27197265625, 16.3974609375, 17.52294921875, 18.6484375, 19.77392578125, 20.8994140625, 22.02490234375, 23.150390625, 24.27587890625, 25.4013671875, 26.52685546875, 27.65234375, 28.77783203125, 29.9033203125, 31.02880859375, 32.154296875, 33.27978515625, 34.4052734375, 35.53076171875, 36.65625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 17.0, 14.0, 15.0, 37.0, 69.0, 99.0, 170.0, 176.0, 135.0, 94.0, 74.0, 45.0, 25.0, 7.0, 4.0, 8.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0017681121826171875, -0.0017233490943908691, -0.0016785860061645508, -0.0016338229179382324, -0.001589059829711914, -0.0015442967414855957, -0.0014995336532592773, -0.001454770565032959, -0.0014100074768066406, -0.0013652443885803223, -0.001320481300354004, -0.0012757182121276855, -0.0012309551239013672, -0.0011861920356750488, -0.0011414289474487305, -0.0010966658592224121, -0.0010519027709960938, -0.0010071396827697754, -0.000962376594543457, -0.0009176135063171387, -0.0008728504180908203, -0.000828087329864502, -0.0007833242416381836, -0.0007385611534118652, -0.0006937980651855469, -0.0006490349769592285, -0.0006042718887329102, -0.0005595088005065918, -0.0005147457122802734, -0.0004699826240539551, -0.0004252195358276367, -0.00038045644760131836, -0.000335693359375, -0.00029093027114868164, -0.0002461671829223633, -0.00020140409469604492, -0.00015664100646972656, -0.0001118779182434082, -6.711483001708984e-05, -2.2351741790771484e-05, 2.2411346435546875e-05, 6.717443466186523e-05, 0.0001119375228881836, 0.00015670061111450195, 0.0002014636993408203, 0.00024622678756713867, 0.00029098987579345703, 0.0003357529640197754, 0.00038051605224609375, 0.0004252791404724121, 0.00047004222869873047, 0.0005148053169250488, 0.0005595684051513672, 0.0006043314933776855, 0.0006490945816040039, 0.0006938576698303223, 0.0007386207580566406, 0.000783383846282959, 0.0008281469345092773, 0.0008729100227355957, 0.0009176731109619141, 0.0009624361991882324, 0.0010071992874145508, 0.0010519623756408691, 0.0010967254638671875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 14.0, 20.0, 50.0, 178.0, 773.0, 10128.0, 1027211.0, 9137.0, 758.0, 154.0, 65.0, 20.0, 6.0, 7.0, 5.0, 6.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.5625, -30.56005859375, -29.5576171875, -28.55517578125, -27.552734375, -26.55029296875, -25.5478515625, -24.54541015625, -23.54296875, -22.54052734375, -21.5380859375, -20.53564453125, -19.533203125, -18.53076171875, -17.5283203125, -16.52587890625, -15.5234375, -14.52099609375, -13.5185546875, -12.51611328125, -11.513671875, -10.51123046875, -9.5087890625, -8.50634765625, -7.50390625, -6.50146484375, -5.4990234375, -4.49658203125, -3.494140625, -2.49169921875, -1.4892578125, -0.48681640625, 0.515625, 1.51806640625, 2.5205078125, 3.52294921875, 4.525390625, 5.52783203125, 6.5302734375, 7.53271484375, 8.53515625, 9.53759765625, 10.5400390625, 11.54248046875, 12.544921875, 13.54736328125, 14.5498046875, 15.55224609375, 16.5546875, 17.55712890625, 18.5595703125, 19.56201171875, 20.564453125, 21.56689453125, 22.5693359375, 23.57177734375, 24.57421875, 25.57666015625, 26.5791015625, 27.58154296875, 28.583984375, 29.58642578125, 30.5888671875, 31.59130859375, 32.59375]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 14.0, 16.0, 38.0, 50.0, 77.0, 89.0, 140.0, 139.0, 119.0, 117.0, 77.0, 40.0, 29.0, 12.0, 10.0, 9.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.6171875, -3.49462890625, -3.3720703125, -3.24951171875, -3.126953125, -3.00439453125, -2.8818359375, -2.75927734375, -2.63671875, -2.51416015625, -2.3916015625, -2.26904296875, -2.146484375, -2.02392578125, -1.9013671875, -1.77880859375, -1.65625, -1.53369140625, -1.4111328125, -1.28857421875, -1.166015625, -1.04345703125, -0.9208984375, -0.79833984375, -0.67578125, -0.55322265625, -0.4306640625, -0.30810546875, -0.185546875, -0.06298828125, 0.0595703125, 0.18212890625, 0.3046875, 0.42724609375, 0.5498046875, 0.67236328125, 0.794921875, 0.91748046875, 1.0400390625, 1.16259765625, 1.28515625, 1.40771484375, 1.5302734375, 1.65283203125, 1.775390625, 1.89794921875, 2.0205078125, 2.14306640625, 2.265625, 2.38818359375, 2.5107421875, 2.63330078125, 2.755859375, 2.87841796875, 3.0009765625, 3.12353515625, 3.24609375, 3.36865234375, 3.4912109375, 3.61376953125, 3.736328125, 3.85888671875, 3.9814453125, 4.10400390625, 4.2265625]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 21.0, 85.0, 244.0, 363.0, 209.0, 63.0, 12.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.94796371459961, -43.881126403808594, -40.814292907714844, -37.74745559692383, -34.68061828613281, -31.613784790039062, -28.546947479248047, -25.480112075805664, -22.41327667236328, -19.3464412689209, -16.279605865478516, -13.2127685546875, -10.145933151245117, -7.079097747802734, -4.012260437011719, -0.9454250335693359, 2.121410369873047, 5.188246250152588, 8.255082130432129, 11.321918487548828, 14.388753890991211, 17.455589294433594, 20.52242660522461, 23.589262008666992, 26.656097412109375, 29.722932815551758, 32.78976821899414, 35.856605529785156, 38.923439025878906, 41.99027633666992, 45.05711364746094, 48.12394714355469, 51.19078063964844, 54.25761795043945, 57.3244514465332, 60.39128875732422, 63.45812225341797, 66.52496337890625, 69.591796875, 72.65863037109375, 75.7254638671875, 78.79229736328125, 81.85913848876953, 84.92597198486328, 87.99280548095703, 91.05964660644531, 94.12648010253906, 97.19331359863281, 100.2601547241211, 103.32698822021484, 106.39382934570312, 109.46066284179688, 112.52749633789062, 115.59432983398438, 118.66117095947266, 121.7280044555664, 124.79484558105469, 127.86167907714844, 130.9285125732422, 133.995361328125, 137.06219482421875, 140.1290283203125, 143.19586181640625, 146.2626953125, 149.32952880859375]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 5.0, 4.0, 1.0, 3.0, 5.0, 3.0, 8.0, 5.0, 18.0, 10.0, 15.0, 13.0, 23.0, 23.0, 26.0, 29.0, 28.0, 27.0, 29.0, 41.0, 48.0, 42.0, 44.0, 30.0, 49.0, 54.0, 37.0, 41.0, 34.0, 37.0, 33.0, 30.0, 29.0, 29.0, 32.0, 24.0, 18.0, 19.0, 11.0, 8.0, 8.0, 8.0, 11.0, 5.0, 3.0, 5.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.890871047973633, -28.847314834594727, -27.803756713867188, -26.76020050048828, -25.716644287109375, -24.673086166381836, -23.62952995300293, -22.58597183227539, -21.542415618896484, -20.498859405517578, -19.45530128479004, -18.411745071411133, -17.368186950683594, -16.324630737304688, -15.281074523925781, -14.237517356872559, -13.193960189819336, -12.150403022766113, -11.10684585571289, -10.063289642333984, -9.019732475280762, -7.976175308227539, -6.932618618011475, -5.88906192779541, -4.8455047607421875, -3.801947832107544, -2.7583909034729004, -1.7148339748382568, -0.6712770462036133, 0.3722801208496094, 1.4158368110656738, 2.4593935012817383, 3.5029525756835938, 4.546509742736816, 5.590066432952881, 6.633623123168945, 7.677180290222168, 8.72073745727539, 9.764293670654297, 10.80785083770752, 11.851408004760742, 12.894965171813965, 13.938522338867188, 14.982078552246094, 16.025634765625, 17.06919288635254, 18.112749099731445, 19.156307220458984, 20.19986343383789, 21.243419647216797, 22.286977767944336, 23.330533981323242, 24.37409210205078, 25.417648315429688, 26.461204528808594, 27.5047607421875, 28.54831886291504, 29.591875076293945, 30.635433197021484, 31.67898941040039, 32.7225456237793, 33.76610565185547, 34.809661865234375, 35.85321807861328, 36.89677429199219]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 7.0, 21.0, 44.0, 95.0, 197.0, 573.0, 2477.0, 1401119.0, 2786869.0, 2126.0, 341.0, 126.0, 91.0, 52.0, 26.0, 22.0, 16.0, 7.0, 9.0, 13.0, 13.0, 3.0, 9.0, 3.0, 2.0, 1.0, 4.0, 4.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.09375, -39.47119140625, -36.8486328125, -34.22607421875, -31.603515625, -28.98095703125, -26.3583984375, -23.73583984375, -21.11328125, -18.49072265625, -15.8681640625, -13.24560546875, -10.623046875, -8.00048828125, -5.3779296875, -2.75537109375, -0.1328125, 2.48974609375, 5.1123046875, 7.73486328125, 10.357421875, 12.97998046875, 15.6025390625, 18.22509765625, 20.84765625, 23.47021484375, 26.0927734375, 28.71533203125, 31.337890625, 33.96044921875, 36.5830078125, 39.20556640625, 41.828125, 44.45068359375, 47.0732421875, 49.69580078125, 52.318359375, 54.94091796875, 57.5634765625, 60.18603515625, 62.80859375, 65.43115234375, 68.0537109375, 70.67626953125, 73.298828125, 75.92138671875, 78.5439453125, 81.16650390625, 83.7890625, 86.41162109375, 89.0341796875, 91.65673828125, 94.279296875, 96.90185546875, 99.5244140625, 102.14697265625, 104.76953125, 107.39208984375, 110.0146484375, 112.63720703125, 115.259765625, 117.88232421875, 120.5048828125, 123.12744140625, 125.75]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 14.0, 8.0, 14.0, 25.0, 24.0, 32.0, 52.0, 63.0, 60.0, 101.0, 89.0, 99.0, 79.0, 68.0, 65.0, 56.0, 48.0, 29.0, 37.0, 17.0, 15.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1328125, -10.5494384765625, -9.966064453125, -9.3826904296875, -8.79931640625, -8.2159423828125, -7.632568359375, -7.0491943359375, -6.4658203125, -5.8824462890625, -5.299072265625, -4.7156982421875, -4.13232421875, -3.5489501953125, -2.965576171875, -2.3822021484375, -1.798828125, -1.2154541015625, -0.632080078125, -0.0487060546875, 0.53466796875, 1.1180419921875, 1.701416015625, 2.2847900390625, 2.8681640625, 3.4515380859375, 4.034912109375, 4.6182861328125, 5.20166015625, 5.7850341796875, 6.368408203125, 6.9517822265625, 7.53515625, 8.1185302734375, 8.701904296875, 9.2852783203125, 9.86865234375, 10.4520263671875, 11.035400390625, 11.6187744140625, 12.2021484375, 12.7855224609375, 13.368896484375, 13.9522705078125, 14.53564453125, 15.1190185546875, 15.702392578125, 16.2857666015625, 16.869140625, 17.4525146484375, 18.035888671875, 18.6192626953125, 19.20263671875, 19.7860107421875, 20.369384765625, 20.9527587890625, 21.5361328125, 22.1195068359375, 22.702880859375, 23.2862548828125, 23.86962890625, 24.4530029296875, 25.036376953125, 25.6197509765625, 26.203125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 3.0, 4.0, 6.0, 11.0, 18.0, 11.0, 17.0, 25.0, 31.0, 49.0, 61.0, 112.0, 167.0, 262.0, 451.0, 777.0, 1464.0, 3414.0, 11193.0, 68567.0, 965505.0, 2864921.0, 240839.0, 25793.0, 5738.0, 2209.0, 1073.0, 562.0, 328.0, 214.0, 140.0, 112.0, 64.0, 34.0, 19.0, 27.0, 11.0, 11.0, 14.0, 6.0, 4.0, 4.0, 7.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-18.734375, -18.1875, -17.640625, -17.09375, -16.546875, -16.0, -15.453125, -14.90625, -14.359375, -13.8125, -13.265625, -12.71875, -12.171875, -11.625, -11.078125, -10.53125, -9.984375, -9.4375, -8.890625, -8.34375, -7.796875, -7.25, -6.703125, -6.15625, -5.609375, -5.0625, -4.515625, -3.96875, -3.421875, -2.875, -2.328125, -1.78125, -1.234375, -0.6875, -0.140625, 0.40625, 0.953125, 1.5, 2.046875, 2.59375, 3.140625, 3.6875, 4.234375, 4.78125, 5.328125, 5.875, 6.421875, 6.96875, 7.515625, 8.0625, 8.609375, 9.15625, 9.703125, 10.25, 10.796875, 11.34375, 11.890625, 12.4375, 12.984375, 13.53125, 14.078125, 14.625, 15.171875, 15.71875, 16.265625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 7.0, 7.0, 3.0, 8.0, 16.0, 20.0, 15.0, 26.0, 44.0, 48.0, 82.0, 110.0, 121.0, 173.0, 266.0, 321.0, 359.0, 485.0, 464.0, 384.0, 316.0, 220.0, 144.0, 110.0, 100.0, 56.0, 40.0, 34.0, 24.0, 18.0, 17.0, 9.0, 5.0, 7.0, 4.0, 6.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.296875, -4.161376953125, -4.02587890625, -3.890380859375, -3.7548828125, -3.619384765625, -3.48388671875, -3.348388671875, -3.212890625, -3.077392578125, -2.94189453125, -2.806396484375, -2.6708984375, -2.535400390625, -2.39990234375, -2.264404296875, -2.12890625, -1.993408203125, -1.85791015625, -1.722412109375, -1.5869140625, -1.451416015625, -1.31591796875, -1.180419921875, -1.044921875, -0.909423828125, -0.77392578125, -0.638427734375, -0.5029296875, -0.367431640625, -0.23193359375, -0.096435546875, 0.0390625, 0.174560546875, 0.31005859375, 0.445556640625, 0.5810546875, 0.716552734375, 0.85205078125, 0.987548828125, 1.123046875, 1.258544921875, 1.39404296875, 1.529541015625, 1.6650390625, 1.800537109375, 1.93603515625, 2.071533203125, 2.20703125, 2.342529296875, 2.47802734375, 2.613525390625, 2.7490234375, 2.884521484375, 3.02001953125, 3.155517578125, 3.291015625, 3.426513671875, 3.56201171875, 3.697509765625, 3.8330078125, 3.968505859375, 4.10400390625, 4.239501953125, 4.375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 19.0, 40.0, 79.0, 133.0, 151.0, 159.0, 156.0, 105.0, 75.0, 43.0, 23.0, 6.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.22301483154297, -56.08574295043945, -54.94846725463867, -53.811195373535156, -52.673919677734375, -51.53664779663086, -50.39937210083008, -49.26210021972656, -48.12482452392578, -46.987552642822266, -45.850276947021484, -44.71300506591797, -43.57572937011719, -42.43845748901367, -41.30118179321289, -40.163909912109375, -39.02663803100586, -37.889366149902344, -36.75209045410156, -35.61481857299805, -34.477542877197266, -33.34027099609375, -32.20299530029297, -31.065723419189453, -29.928449630737305, -28.791175842285156, -27.653902053833008, -26.51662826538086, -25.379356384277344, -24.242080688476562, -23.104808807373047, -21.9675350189209, -20.830265045166016, -19.692991256713867, -18.55571746826172, -17.41844367980957, -16.281169891357422, -15.14389705657959, -14.006624221801758, -12.86935043334961, -11.732076644897461, -10.594802856445312, -9.457529067993164, -8.320256233215332, -7.182982444763184, -6.045708656311035, -4.908435344696045, -3.7711620330810547, -2.6338882446289062, -1.496614694595337, -0.3593411445617676, 0.7779324054718018, 1.915205955505371, 3.0524797439575195, 4.18975305557251, 5.3270263671875, 6.464300155639648, 7.601573944091797, 8.738847732543945, 9.876120567321777, 11.013394355773926, 12.150668144226074, 13.287940979003906, 14.425214767456055, 15.562488555908203]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 6.0, 3.0, 7.0, 20.0, 9.0, 7.0, 8.0, 21.0, 25.0, 33.0, 32.0, 26.0, 41.0, 41.0, 48.0, 51.0, 57.0, 45.0, 51.0, 53.0, 29.0, 52.0, 49.0, 36.0, 43.0, 38.0, 26.0, 27.0, 18.0, 18.0, 22.0, 16.0, 8.0, 8.0, 11.0, 4.0, 2.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.514082908630371, -10.119685173034668, -9.725286483764648, -9.330888748168945, -8.936490058898926, -8.542092323303223, -8.147693634033203, -7.7532958984375, -7.358898162841797, -6.9644999504089355, -6.570101737976074, -6.175704002380371, -5.78130578994751, -5.386907577514648, -4.992509365081787, -4.598111152648926, -4.2037129402160645, -3.809314727783203, -3.414916753768921, -3.0205185413360596, -2.6261205673217773, -2.231722354888916, -1.8373241424560547, -1.4429261684417725, -1.0485279560089111, -0.6541298627853394, -0.2597317099571228, 0.13466644287109375, 0.5290645360946655, 0.9234626293182373, 1.3178608417510986, 1.7122588157653809, 2.106657028198242, 2.5010552406311035, 2.8954532146453857, 3.289851427078247, 3.6842494010925293, 4.078647613525391, 4.473045825958252, 4.867444038391113, 5.261841773986816, 5.656239986419678, 6.050638198852539, 6.445035934448242, 6.8394341468811035, 7.233832359313965, 7.628230571746826, 8.022628784179688, 8.41702651977539, 8.811424255371094, 9.205822944641113, 9.600220680236816, 9.994619369506836, 10.389017105102539, 10.783414840698242, 11.177813529968262, 11.572212219238281, 11.966609954833984, 12.361008644104004, 12.755406379699707, 13.149805068969727, 13.54420280456543, 13.938600540161133, 14.332999229431152, 14.727396965026855]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 8.0, 11.0, 5.0, 12.0, 17.0, 22.0, 24.0, 18.0, 34.0, 63.0, 80.0, 112.0, 213.0, 484.0, 1645.0, 8881.0, 65693.0, 454355.0, 442436.0, 63202.0, 8526.0, 1645.0, 500.0, 212.0, 103.0, 92.0, 48.0, 35.0, 21.0, 20.0, 9.0, 16.0, 8.0, 2.0, 7.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.958984375, -3.822418212890625, -3.68585205078125, -3.549285888671875, -3.4127197265625, -3.276153564453125, -3.13958740234375, -3.003021240234375, -2.866455078125, -2.729888916015625, -2.59332275390625, -2.456756591796875, -2.3201904296875, -2.183624267578125, -2.04705810546875, -1.910491943359375, -1.77392578125, -1.637359619140625, -1.50079345703125, -1.364227294921875, -1.2276611328125, -1.091094970703125, -0.95452880859375, -0.817962646484375, -0.681396484375, -0.544830322265625, -0.40826416015625, -0.271697998046875, -0.1351318359375, 0.001434326171875, 0.13800048828125, 0.274566650390625, 0.4111328125, 0.547698974609375, 0.68426513671875, 0.820831298828125, 0.9573974609375, 1.093963623046875, 1.23052978515625, 1.367095947265625, 1.503662109375, 1.640228271484375, 1.77679443359375, 1.913360595703125, 2.0499267578125, 2.186492919921875, 2.32305908203125, 2.459625244140625, 2.59619140625, 2.732757568359375, 2.86932373046875, 3.005889892578125, 3.1424560546875, 3.279022216796875, 3.41558837890625, 3.552154541015625, 3.688720703125, 3.825286865234375, 3.96185302734375, 4.098419189453125, 4.2349853515625, 4.371551513671875, 4.50811767578125, 4.644683837890625, 4.78125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 1.0, 6.0, 7.0, 10.0, 9.0, 21.0, 21.0, 29.0, 32.0, 56.0, 46.0, 68.0, 70.0, 59.0, 81.0, 68.0, 76.0, 64.0, 53.0, 49.0, 52.0, 34.0, 19.0, 24.0, 12.0, 18.0, 7.0, 8.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.609375, -8.197021484375, -7.78466796875, -7.372314453125, -6.9599609375, -6.547607421875, -6.13525390625, -5.722900390625, -5.310546875, -4.898193359375, -4.48583984375, -4.073486328125, -3.6611328125, -3.248779296875, -2.83642578125, -2.424072265625, -2.01171875, -1.599365234375, -1.18701171875, -0.774658203125, -0.3623046875, 0.050048828125, 0.46240234375, 0.874755859375, 1.287109375, 1.699462890625, 2.11181640625, 2.524169921875, 2.9365234375, 3.348876953125, 3.76123046875, 4.173583984375, 4.5859375, 4.998291015625, 5.41064453125, 5.822998046875, 6.2353515625, 6.647705078125, 7.06005859375, 7.472412109375, 7.884765625, 8.297119140625, 8.70947265625, 9.121826171875, 9.5341796875, 9.946533203125, 10.35888671875, 10.771240234375, 11.18359375, 11.595947265625, 12.00830078125, 12.420654296875, 12.8330078125, 13.245361328125, 13.65771484375, 14.070068359375, 14.482421875, 14.894775390625, 15.30712890625, 15.719482421875, 16.1318359375, 16.544189453125, 16.95654296875, 17.368896484375, 17.78125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 4.0, 10.0, 12.0, 18.0, 31.0, 58.0, 90.0, 143.0, 241.0, 343.0, 510.0, 873.0, 1496.0, 2643.0, 4264.0, 7502.0, 13125.0, 22679.0, 38134.0, 63289.0, 100428.0, 143221.0, 170931.0, 159784.0, 121174.0, 78884.0, 48909.0, 29038.0, 16819.0, 9735.0, 5723.0, 3372.0, 1995.0, 1124.0, 769.0, 408.0, 269.0, 171.0, 118.0, 79.0, 45.0, 28.0, 25.0, 14.0, 9.0, 9.0, 2.0, 4.0, 5.0, 0.0, 2.0, 2.0], "bins": [-1.02734375, -0.9977645874023438, -0.9681854248046875, -0.9386062622070312, -0.909027099609375, -0.8794479370117188, -0.8498687744140625, -0.8202896118164062, -0.79071044921875, -0.7611312866210938, -0.7315521240234375, -0.7019729614257812, -0.672393798828125, -0.6428146362304688, -0.6132354736328125, -0.5836563110351562, -0.5540771484375, -0.5244979858398438, -0.4949188232421875, -0.46533966064453125, -0.435760498046875, -0.40618133544921875, -0.3766021728515625, -0.34702301025390625, -0.31744384765625, -0.28786468505859375, -0.2582855224609375, -0.22870635986328125, -0.199127197265625, -0.16954803466796875, -0.1399688720703125, -0.11038970947265625, -0.080810546875, -0.05123138427734375, -0.0216522216796875, 0.00792694091796875, 0.037506103515625, 0.06708526611328125, 0.0966644287109375, 0.12624359130859375, 0.15582275390625, 0.18540191650390625, 0.2149810791015625, 0.24456024169921875, 0.274139404296875, 0.30371856689453125, 0.3332977294921875, 0.36287689208984375, 0.3924560546875, 0.42203521728515625, 0.4516143798828125, 0.48119354248046875, 0.510772705078125, 0.5403518676757812, 0.5699310302734375, 0.5995101928710938, 0.62908935546875, 0.6586685180664062, 0.6882476806640625, 0.7178268432617188, 0.747406005859375, 0.7769851684570312, 0.8065643310546875, 0.8361434936523438, 0.86572265625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 6.0, 3.0, 4.0, 11.0, 14.0, 12.0, 16.0, 19.0, 29.0, 24.0, 38.0, 23.0, 28.0, 43.0, 33.0, 29.0, 29.0, 51.0, 50.0, 46.0, 41.0, 46.0, 44.0, 32.0, 41.0, 35.0, 34.0, 32.0, 27.0, 27.0, 23.0, 22.0, 19.0, 15.0, 10.0, 5.0, 7.0, 6.0, 7.0, 5.0, 2.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-17.28125, -16.7640380859375, -16.246826171875, -15.7296142578125, -15.21240234375, -14.6951904296875, -14.177978515625, -13.6607666015625, -13.1435546875, -12.6263427734375, -12.109130859375, -11.5919189453125, -11.07470703125, -10.5574951171875, -10.040283203125, -9.5230712890625, -9.005859375, -8.4886474609375, -7.971435546875, -7.4542236328125, -6.93701171875, -6.4197998046875, -5.902587890625, -5.3853759765625, -4.8681640625, -4.3509521484375, -3.833740234375, -3.3165283203125, -2.79931640625, -2.2821044921875, -1.764892578125, -1.2476806640625, -0.73046875, -0.2132568359375, 0.303955078125, 0.8211669921875, 1.33837890625, 1.8555908203125, 2.372802734375, 2.8900146484375, 3.4072265625, 3.9244384765625, 4.441650390625, 4.9588623046875, 5.47607421875, 5.9932861328125, 6.510498046875, 7.0277099609375, 7.544921875, 8.0621337890625, 8.579345703125, 9.0965576171875, 9.61376953125, 10.1309814453125, 10.648193359375, 11.1654052734375, 11.6826171875, 12.1998291015625, 12.717041015625, 13.2342529296875, 13.75146484375, 14.2686767578125, 14.785888671875, 15.3031005859375, 15.8203125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 7.0, 6.0, 13.0, 19.0, 22.0, 49.0, 68.0, 114.0, 189.0, 337.0, 643.0, 1303.0, 3045.0, 7853.0, 23983.0, 85075.0, 297656.0, 413083.0, 153065.0, 41041.0, 12632.0, 4572.0, 1858.0, 896.0, 422.0, 232.0, 140.0, 75.0, 59.0, 39.0, 20.0, 12.0, 11.0, 11.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25390625, -0.2462635040283203, -0.23862075805664062, -0.23097801208496094, -0.22333526611328125, -0.21569252014160156, -0.20804977416992188, -0.2004070281982422, -0.1927642822265625, -0.1851215362548828, -0.17747879028320312, -0.16983604431152344, -0.16219329833984375, -0.15455055236816406, -0.14690780639648438, -0.1392650604248047, -0.131622314453125, -0.12397956848144531, -0.11633682250976562, -0.10869407653808594, -0.10105133056640625, -0.09340858459472656, -0.08576583862304688, -0.07812309265136719, -0.0704803466796875, -0.06283760070800781, -0.055194854736328125, -0.04755210876464844, -0.03990936279296875, -0.03226661682128906, -0.024623870849609375, -0.016981124877929688, -0.00933837890625, -0.0016956329345703125, 0.005947113037109375, 0.013589859008789062, 0.02123260498046875, 0.028875350952148438, 0.036518096923828125, 0.04416084289550781, 0.0518035888671875, 0.05944633483886719, 0.06708908081054688, 0.07473182678222656, 0.08237457275390625, 0.09001731872558594, 0.09766006469726562, 0.10530281066894531, 0.112945556640625, 0.12058830261230469, 0.12823104858398438, 0.13587379455566406, 0.14351654052734375, 0.15115928649902344, 0.15880203247070312, 0.1664447784423828, 0.1740875244140625, 0.1817302703857422, 0.18937301635742188, 0.19701576232910156, 0.20465850830078125, 0.21230125427246094, 0.21994400024414062, 0.2275867462158203, 0.2352294921875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 8.0, 7.0, 8.0, 17.0, 23.0, 23.0, 40.0, 56.0, 80.0, 98.0, 136.0, 109.0, 101.0, 79.0, 67.0, 57.0, 29.0, 20.0, 15.0, 14.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001392364501953125, -0.00013232603669166565, -0.0001254156231880188, -0.00011850520968437195, -0.0001115947961807251, -0.00010468438267707825, -9.77739691734314e-05, -9.086355566978455e-05, -8.39531421661377e-05, -7.704272866249084e-05, -7.0132315158844e-05, -6.322190165519714e-05, -5.631148815155029e-05, -4.940107464790344e-05, -4.249066114425659e-05, -3.558024764060974e-05, -2.866983413696289e-05, -2.175942063331604e-05, -1.484900712966919e-05, -7.938593626022339e-06, -1.0281801223754883e-06, 5.882233381271362e-06, 1.2792646884918213e-05, 1.9703060388565063e-05, 2.6613473892211914e-05, 3.3523887395858765e-05, 4.0434300899505615e-05, 4.7344714403152466e-05, 5.4255127906799316e-05, 6.116554141044617e-05, 6.807595491409302e-05, 7.498636841773987e-05, 8.189678192138672e-05, 8.880719542503357e-05, 9.571760892868042e-05, 0.00010262802243232727, 0.00010953843593597412, 0.00011644884943962097, 0.00012335926294326782, 0.00013026967644691467, 0.00013718008995056152, 0.00014409050345420837, 0.00015100091695785522, 0.00015791133046150208, 0.00016482174396514893, 0.00017173215746879578, 0.00017864257097244263, 0.00018555298447608948, 0.00019246339797973633, 0.00019937381148338318, 0.00020628422498703003, 0.00021319463849067688, 0.00022010505199432373, 0.00022701546549797058, 0.00023392587900161743, 0.00024083629250526428, 0.00024774670600891113, 0.000254657119512558, 0.00026156753301620483, 0.0002684779465198517, 0.00027538836002349854, 0.0002822987735271454, 0.00028920918703079224, 0.0002961196005344391, 0.00030303001403808594]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 8.0, 11.0, 20.0, 26.0, 29.0, 50.0, 77.0, 110.0, 176.0, 279.0, 432.0, 672.0, 1314.0, 2556.0, 5911.0, 16653.0, 58254.0, 217803.0, 444607.0, 213925.0, 57408.0, 16767.0, 5914.0, 2444.0, 1237.0, 688.0, 430.0, 277.0, 170.0, 102.0, 68.0, 38.0, 28.0, 22.0, 16.0, 10.0, 13.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2337646484375, -0.22609901428222656, -0.21843338012695312, -0.2107677459716797, -0.20310211181640625, -0.1954364776611328, -0.18777084350585938, -0.18010520935058594, -0.1724395751953125, -0.16477394104003906, -0.15710830688476562, -0.1494426727294922, -0.14177703857421875, -0.1341114044189453, -0.12644577026367188, -0.11878013610839844, -0.111114501953125, -0.10344886779785156, -0.09578323364257812, -0.08811759948730469, -0.08045196533203125, -0.07278633117675781, -0.06512069702148438, -0.05745506286621094, -0.0497894287109375, -0.04212379455566406, -0.034458160400390625, -0.026792526245117188, -0.01912689208984375, -0.011461257934570312, -0.003795623779296875, 0.0038700103759765625, 0.01153564453125, 0.019201278686523438, 0.026866912841796875, 0.03453254699707031, 0.04219818115234375, 0.04986381530761719, 0.057529449462890625, 0.06519508361816406, 0.0728607177734375, 0.08052635192871094, 0.08819198608398438, 0.09585762023925781, 0.10352325439453125, 0.11118888854980469, 0.11885452270507812, 0.12652015686035156, 0.134185791015625, 0.14185142517089844, 0.14951705932617188, 0.1571826934814453, 0.16484832763671875, 0.1725139617919922, 0.18017959594726562, 0.18784523010253906, 0.1955108642578125, 0.20317649841308594, 0.21084213256835938, 0.2185077667236328, 0.22617340087890625, 0.2338390350341797, 0.24150466918945312, 0.24917030334472656, 0.2568359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 8.0, 8.0, 14.0, 7.0, 19.0, 18.0, 17.0, 19.0, 34.0, 47.0, 48.0, 49.0, 64.0, 60.0, 74.0, 65.0, 61.0, 63.0, 52.0, 39.0, 57.0, 37.0, 22.0, 31.0, 19.0, 21.0, 9.0, 7.0, 8.0, 10.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06048583984375, -0.058432579040527344, -0.05637931823730469, -0.05432605743408203, -0.052272796630859375, -0.05021953582763672, -0.04816627502441406, -0.046113014221191406, -0.04405975341796875, -0.042006492614746094, -0.03995323181152344, -0.03789997100830078, -0.035846710205078125, -0.03379344940185547, -0.03174018859863281, -0.029686927795410156, -0.0276336669921875, -0.025580406188964844, -0.023527145385742188, -0.02147388458251953, -0.019420623779296875, -0.01736736297607422, -0.015314102172851562, -0.013260841369628906, -0.01120758056640625, -0.009154319763183594, -0.0071010589599609375, -0.005047798156738281, -0.002994537353515625, -0.0009412765502929688, 0.0011119842529296875, 0.0031652450561523438, 0.005218505859375, 0.007271766662597656, 0.009325027465820312, 0.011378288269042969, 0.013431549072265625, 0.015484809875488281, 0.017538070678710938, 0.019591331481933594, 0.02164459228515625, 0.023697853088378906, 0.025751113891601562, 0.02780437469482422, 0.029857635498046875, 0.03191089630126953, 0.03396415710449219, 0.036017417907714844, 0.0380706787109375, 0.040123939514160156, 0.04217720031738281, 0.04423046112060547, 0.046283721923828125, 0.04833698272705078, 0.05039024353027344, 0.052443504333496094, 0.05449676513671875, 0.056550025939941406, 0.05860328674316406, 0.06065654754638672, 0.06270980834960938, 0.06476306915283203, 0.06681632995605469, 0.06886959075927734, 0.0709228515625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 6.0, 51.0, 393.0, 455.0, 100.0, 11.0, 2.0], "bins": [-149.7362823486328, -147.24359130859375, -144.75088500976562, -142.25819396972656, -139.76548767089844, -137.27279663085938, -134.7801055908203, -132.2873992919922, -129.79470825195312, -127.30200958251953, -124.80931091308594, -122.31661987304688, -119.82392120361328, -117.33122253417969, -114.8385238647461, -112.3458251953125, -109.85313415527344, -107.36043548583984, -104.86773681640625, -102.37504577636719, -99.8823471069336, -97.3896484375, -94.8969497680664, -92.40425109863281, -89.91155242919922, -87.41885375976562, -84.92615509033203, -82.43346405029297, -79.94076538085938, -77.44806671142578, -74.95536804199219, -72.46267700195312, -69.96997833251953, -67.47727966308594, -64.98458099365234, -62.491886138916016, -59.99919128417969, -57.506492614746094, -55.0137939453125, -52.52109909057617, -50.02840042114258, -47.535701751708984, -45.043006896972656, -42.55030822753906, -40.057613372802734, -37.56491470336914, -35.07221984863281, -32.57952117919922, -30.08682632446289, -27.59412956237793, -25.10143280029297, -22.608734130859375, -20.116039276123047, -17.623340606689453, -15.130643844604492, -12.637947082519531, -10.145249366760254, -7.652552604675293, -5.159855365753174, -2.6671581268310547, -0.17446136474609375, 2.318235397338867, 4.8109331130981445, 7.3036298751831055, 9.796326637268066]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 7.0, 6.0, 17.0, 14.0, 9.0, 15.0, 26.0, 37.0, 37.0, 47.0, 49.0, 51.0, 59.0, 70.0, 51.0, 68.0, 44.0, 53.0, 55.0, 52.0, 43.0, 38.0, 27.0, 25.0, 19.0, 21.0, 16.0, 15.0, 8.0, 8.0, 5.0, 3.0, 0.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.121282577514648, -7.797036170959473, -7.472789764404297, -7.148543357849121, -6.8242974281311035, -6.500051021575928, -6.175804615020752, -5.851558685302734, -5.527312278747559, -5.203065872192383, -4.878819465637207, -4.554573059082031, -4.230327129364014, -3.906080722808838, -3.581834316253662, -3.2575881481170654, -2.9333415031433105, -2.6090950965881348, -2.284848928451538, -1.9606025218963623, -1.636356234550476, -1.3121099472045898, -0.9878635406494141, -0.6636173725128174, -0.3393709659576416, -0.015124648809432983, 0.30912166833877563, 0.6333680152893066, 0.9576143026351929, 1.281860589981079, 1.6061069965362549, 1.9303531646728516, 2.2545995712280273, 2.578845977783203, 2.9030921459198, 3.2273385524749756, 3.5515847206115723, 3.875831127166748, 4.200077533721924, 4.524323463439941, 4.848569869995117, 5.172816276550293, 5.497062683105469, 5.8213090896606445, 6.145555019378662, 6.469801425933838, 6.794047832489014, 7.118293762207031, 7.442540645599365, 7.766787052154541, 8.091032981872559, 8.415279388427734, 8.73952579498291, 9.063772201538086, 9.388018608093262, 9.712265014648438, 10.036511421203613, 10.360757827758789, 10.685004234313965, 11.00925064086914, 11.333497047424316, 11.657743453979492, 11.981988906860352, 12.306235313415527, 12.630481719970703]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 11.0, 5.0, 22.0, 26.0, 39.0, 46.0, 88.0, 178.0, 444.0, 1215.0, 3564.0, 11706.0, 46527.0, 224428.0, 585006.0, 133473.0, 29855.0, 7904.0, 2461.0, 846.0, 313.0, 134.0, 72.0, 43.0, 43.0, 17.0, 7.0, 20.0, 15.0, 6.0, 8.0, 5.0, 2.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.671875, -10.3201904296875, -9.968505859375, -9.6168212890625, -9.26513671875, -8.9134521484375, -8.561767578125, -8.2100830078125, -7.8583984375, -7.5067138671875, -7.155029296875, -6.8033447265625, -6.45166015625, -6.0999755859375, -5.748291015625, -5.3966064453125, -5.044921875, -4.6932373046875, -4.341552734375, -3.9898681640625, -3.63818359375, -3.2864990234375, -2.934814453125, -2.5831298828125, -2.2314453125, -1.8797607421875, -1.528076171875, -1.1763916015625, -0.82470703125, -0.4730224609375, -0.121337890625, 0.2303466796875, 0.58203125, 0.9337158203125, 1.285400390625, 1.6370849609375, 1.98876953125, 2.3404541015625, 2.692138671875, 3.0438232421875, 3.3955078125, 3.7471923828125, 4.098876953125, 4.4505615234375, 4.80224609375, 5.1539306640625, 5.505615234375, 5.8572998046875, 6.208984375, 6.5606689453125, 6.912353515625, 7.2640380859375, 7.61572265625, 7.9674072265625, 8.319091796875, 8.6707763671875, 9.0224609375, 9.3741455078125, 9.725830078125, 10.0775146484375, 10.42919921875, 10.7808837890625, 11.132568359375, 11.4842529296875, 11.8359375]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 9.0, 11.0, 6.0, 15.0, 26.0, 27.0, 32.0, 38.0, 40.0, 50.0, 63.0, 62.0, 61.0, 63.0, 65.0, 60.0, 46.0, 56.0, 50.0, 43.0, 24.0, 31.0, 31.0, 16.0, 19.0, 16.0, 17.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.765625, -17.12939453125, -16.4931640625, -15.85693359375, -15.220703125, -14.58447265625, -13.9482421875, -13.31201171875, -12.67578125, -12.03955078125, -11.4033203125, -10.76708984375, -10.130859375, -9.49462890625, -8.8583984375, -8.22216796875, -7.5859375, -6.94970703125, -6.3134765625, -5.67724609375, -5.041015625, -4.40478515625, -3.7685546875, -3.13232421875, -2.49609375, -1.85986328125, -1.2236328125, -0.58740234375, 0.048828125, 0.68505859375, 1.3212890625, 1.95751953125, 2.59375, 3.22998046875, 3.8662109375, 4.50244140625, 5.138671875, 5.77490234375, 6.4111328125, 7.04736328125, 7.68359375, 8.31982421875, 8.9560546875, 9.59228515625, 10.228515625, 10.86474609375, 11.5009765625, 12.13720703125, 12.7734375, 13.40966796875, 14.0458984375, 14.68212890625, 15.318359375, 15.95458984375, 16.5908203125, 17.22705078125, 17.86328125, 18.49951171875, 19.1357421875, 19.77197265625, 20.408203125, 21.04443359375, 21.6806640625, 22.31689453125, 22.953125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 7.0, 11.0, 6.0, 14.0, 18.0, 20.0, 29.0, 30.0, 47.0, 76.0, 113.0, 182.0, 443.0, 2093.0, 48468.0, 937035.0, 56740.0, 2297.0, 416.0, 163.0, 100.0, 72.0, 48.0, 33.0, 24.0, 21.0, 13.0, 6.0, 10.0, 5.0, 4.0, 6.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.0, -30.127197265625, -29.25439453125, -28.381591796875, -27.5087890625, -26.635986328125, -25.76318359375, -24.890380859375, -24.017578125, -23.144775390625, -22.27197265625, -21.399169921875, -20.5263671875, -19.653564453125, -18.78076171875, -17.907958984375, -17.03515625, -16.162353515625, -15.28955078125, -14.416748046875, -13.5439453125, -12.671142578125, -11.79833984375, -10.925537109375, -10.052734375, -9.179931640625, -8.30712890625, -7.434326171875, -6.5615234375, -5.688720703125, -4.81591796875, -3.943115234375, -3.0703125, -2.197509765625, -1.32470703125, -0.451904296875, 0.4208984375, 1.293701171875, 2.16650390625, 3.039306640625, 3.912109375, 4.784912109375, 5.65771484375, 6.530517578125, 7.4033203125, 8.276123046875, 9.14892578125, 10.021728515625, 10.89453125, 11.767333984375, 12.64013671875, 13.512939453125, 14.3857421875, 15.258544921875, 16.13134765625, 17.004150390625, 17.876953125, 18.749755859375, 19.62255859375, 20.495361328125, 21.3681640625, 22.240966796875, 23.11376953125, 23.986572265625, 24.859375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 3.0, 10.0, 2.0, 10.0, 12.0, 10.0, 25.0, 20.0, 21.0, 17.0, 31.0, 32.0, 37.0, 36.0, 41.0, 28.0, 51.0, 41.0, 46.0, 65.0, 45.0, 49.0, 48.0, 47.0, 35.0, 25.0, 30.0, 24.0, 35.0, 26.0, 23.0, 12.0, 11.0, 8.0, 9.0, 14.0, 9.0, 6.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.3125, -19.693603515625, -19.07470703125, -18.455810546875, -17.8369140625, -17.218017578125, -16.59912109375, -15.980224609375, -15.361328125, -14.742431640625, -14.12353515625, -13.504638671875, -12.8857421875, -12.266845703125, -11.64794921875, -11.029052734375, -10.41015625, -9.791259765625, -9.17236328125, -8.553466796875, -7.9345703125, -7.315673828125, -6.69677734375, -6.077880859375, -5.458984375, -4.840087890625, -4.22119140625, -3.602294921875, -2.9833984375, -2.364501953125, -1.74560546875, -1.126708984375, -0.5078125, 0.111083984375, 0.72998046875, 1.348876953125, 1.9677734375, 2.586669921875, 3.20556640625, 3.824462890625, 4.443359375, 5.062255859375, 5.68115234375, 6.300048828125, 6.9189453125, 7.537841796875, 8.15673828125, 8.775634765625, 9.39453125, 10.013427734375, 10.63232421875, 11.251220703125, 11.8701171875, 12.489013671875, 13.10791015625, 13.726806640625, 14.345703125, 14.964599609375, 15.58349609375, 16.202392578125, 16.8212890625, 17.440185546875, 18.05908203125, 18.677978515625, 19.296875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 7.0, 1.0, 2.0, 9.0, 5.0, 12.0, 26.0, 27.0, 58.0, 189.0, 690.0, 4477.0, 750048.0, 288623.0, 3506.0, 563.0, 148.0, 58.0, 39.0, 18.0, 10.0, 9.0, 3.0, 0.0, 3.0, 0.0, 6.0, 0.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.40625, -22.69580078125, -21.9853515625, -21.27490234375, -20.564453125, -19.85400390625, -19.1435546875, -18.43310546875, -17.72265625, -17.01220703125, -16.3017578125, -15.59130859375, -14.880859375, -14.17041015625, -13.4599609375, -12.74951171875, -12.0390625, -11.32861328125, -10.6181640625, -9.90771484375, -9.197265625, -8.48681640625, -7.7763671875, -7.06591796875, -6.35546875, -5.64501953125, -4.9345703125, -4.22412109375, -3.513671875, -2.80322265625, -2.0927734375, -1.38232421875, -0.671875, 0.03857421875, 0.7490234375, 1.45947265625, 2.169921875, 2.88037109375, 3.5908203125, 4.30126953125, 5.01171875, 5.72216796875, 6.4326171875, 7.14306640625, 7.853515625, 8.56396484375, 9.2744140625, 9.98486328125, 10.6953125, 11.40576171875, 12.1162109375, 12.82666015625, 13.537109375, 14.24755859375, 14.9580078125, 15.66845703125, 16.37890625, 17.08935546875, 17.7998046875, 18.51025390625, 19.220703125, 19.93115234375, 20.6416015625, 21.35205078125, 22.0625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 7.0, 6.0, 18.0, 27.0, 35.0, 54.0, 83.0, 121.0, 191.0, 160.0, 86.0, 59.0, 47.0, 39.0, 17.0, 16.0, 7.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0012874603271484375, -0.0012524053454399109, -0.0012173503637313843, -0.0011822953820228577, -0.001147240400314331, -0.0011121854186058044, -0.0010771304368972778, -0.0010420754551887512, -0.0010070204734802246, -0.000971965491771698, -0.0009369105100631714, -0.0009018555283546448, -0.0008668005466461182, -0.0008317455649375916, -0.0007966905832290649, -0.0007616356015205383, -0.0007265806198120117, -0.0006915256381034851, -0.0006564706563949585, -0.0006214156746864319, -0.0005863606929779053, -0.0005513057112693787, -0.000516250729560852, -0.00048119574785232544, -0.00044614076614379883, -0.0004110857844352722, -0.0003760308027267456, -0.000340975821018219, -0.0003059208393096924, -0.00027086585760116577, -0.00023581087589263916, -0.00020075589418411255, -0.00016570091247558594, -0.00013064593076705933, -9.559094905853271e-05, -6.0535967350006104e-05, -2.5480985641479492e-05, 9.573996067047119e-06, 4.462897777557373e-05, 7.968395948410034e-05, 0.00011473894119262695, 0.00014979392290115356, 0.00018484890460968018, 0.0002199038863182068, 0.0002549588680267334, 0.00029001384973526, 0.0003250688314437866, 0.00036012381315231323, 0.00039517879486083984, 0.00043023377656936646, 0.00046528875827789307, 0.0005003437399864197, 0.0005353987216949463, 0.0005704537034034729, 0.0006055086851119995, 0.0006405636668205261, 0.0006756186485290527, 0.0007106736302375793, 0.000745728611946106, 0.0007807835936546326, 0.0008158385753631592, 0.0008508935570716858, 0.0008859485387802124, 0.000921003520488739, 0.0009560585021972656]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 8.0, 11.0, 19.0, 55.0, 109.0, 241.0, 730.0, 3612.0, 310149.0, 727741.0, 4511.0, 816.0, 284.0, 128.0, 61.0, 30.0, 10.0, 7.0, 2.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.265625, -18.578857421875, -17.89208984375, -17.205322265625, -16.5185546875, -15.831787109375, -15.14501953125, -14.458251953125, -13.771484375, -13.084716796875, -12.39794921875, -11.711181640625, -11.0244140625, -10.337646484375, -9.65087890625, -8.964111328125, -8.27734375, -7.590576171875, -6.90380859375, -6.217041015625, -5.5302734375, -4.843505859375, -4.15673828125, -3.469970703125, -2.783203125, -2.096435546875, -1.40966796875, -0.722900390625, -0.0361328125, 0.650634765625, 1.33740234375, 2.024169921875, 2.7109375, 3.397705078125, 4.08447265625, 4.771240234375, 5.4580078125, 6.144775390625, 6.83154296875, 7.518310546875, 8.205078125, 8.891845703125, 9.57861328125, 10.265380859375, 10.9521484375, 11.638916015625, 12.32568359375, 13.012451171875, 13.69921875, 14.385986328125, 15.07275390625, 15.759521484375, 16.4462890625, 17.133056640625, 17.81982421875, 18.506591796875, 19.193359375, 19.880126953125, 20.56689453125, 21.253662109375, 21.9404296875, 22.627197265625, 23.31396484375, 24.000732421875, 24.6875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 14.0, 18.0, 19.0, 22.0, 34.0, 66.0, 83.0, 151.0, 202.0, 136.0, 84.0, 61.0, 29.0, 19.0, 18.0, 17.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.228515625, -3.11907958984375, -3.0096435546875, -2.90020751953125, -2.790771484375, -2.68133544921875, -2.5718994140625, -2.46246337890625, -2.35302734375, -2.24359130859375, -2.1341552734375, -2.02471923828125, -1.915283203125, -1.80584716796875, -1.6964111328125, -1.58697509765625, -1.4775390625, -1.36810302734375, -1.2586669921875, -1.14923095703125, -1.039794921875, -0.93035888671875, -0.8209228515625, -0.71148681640625, -0.60205078125, -0.49261474609375, -0.3831787109375, -0.27374267578125, -0.164306640625, -0.05487060546875, 0.0545654296875, 0.16400146484375, 0.2734375, 0.38287353515625, 0.4923095703125, 0.60174560546875, 0.711181640625, 0.82061767578125, 0.9300537109375, 1.03948974609375, 1.14892578125, 1.25836181640625, 1.3677978515625, 1.47723388671875, 1.586669921875, 1.69610595703125, 1.8055419921875, 1.91497802734375, 2.0244140625, 2.13385009765625, 2.2432861328125, 2.35272216796875, 2.462158203125, 2.57159423828125, 2.6810302734375, 2.79046630859375, 2.89990234375, 3.00933837890625, 3.1187744140625, 3.22821044921875, 3.337646484375, 3.44708251953125, 3.5565185546875, 3.66595458984375, 3.775390625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 3.0, 4.0, 6.0, 9.0, 13.0, 39.0, 48.0, 92.0, 90.0, 121.0, 145.0, 128.0, 102.0, 73.0, 64.0, 26.0, 19.0, 10.0, 7.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-51.18519592285156, -50.1231575012207, -49.061119079589844, -47.999080657958984, -46.937042236328125, -45.875003814697266, -44.812965393066406, -43.75093078613281, -42.68888854980469, -41.62685012817383, -40.56481170654297, -39.50277328491211, -38.44073486328125, -37.37869644165039, -36.31665802001953, -35.25462341308594, -34.19258499145508, -33.13054656982422, -32.06850814819336, -31.0064697265625, -29.94443130493164, -28.88239288330078, -27.820356369018555, -26.758317947387695, -25.696279525756836, -24.634241104125977, -23.572202682495117, -22.510164260864258, -21.44812774658203, -20.386089324951172, -19.324050903320312, -18.262012481689453, -17.199974060058594, -16.137935638427734, -15.075897216796875, -14.013859748840332, -12.951821327209473, -11.889782905578613, -10.82774543762207, -9.765707015991211, -8.703668594360352, -7.641630172729492, -6.579592227935791, -5.51755428314209, -4.4555158615112305, -3.393477439880371, -2.33143949508667, -1.2694015502929688, -0.20736312866210938, 0.8546750545501709, 1.9167132377624512, 2.9787514209747314, 4.040789604187012, 5.102828025817871, 6.164865970611572, 7.226903915405273, 8.288942337036133, 9.350980758666992, 10.413019180297852, 11.475056648254395, 12.537095069885254, 13.599133491516113, 14.661170959472656, 15.723209381103516, 16.785247802734375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 11.0, 6.0, 3.0, 9.0, 9.0, 9.0, 12.0, 19.0, 12.0, 17.0, 26.0, 19.0, 26.0, 29.0, 30.0, 28.0, 37.0, 37.0, 36.0, 39.0, 45.0, 44.0, 43.0, 37.0, 40.0, 33.0, 39.0, 18.0, 36.0, 35.0, 20.0, 31.0, 27.0, 20.0, 17.0, 13.0, 24.0, 11.0, 9.0, 13.0, 9.0, 6.0, 6.0, 2.0, 7.0, 5.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.319732666015625, -25.47356414794922, -24.627397537231445, -23.78122901916504, -22.935060501098633, -22.08889389038086, -21.242725372314453, -20.396556854248047, -19.55038833618164, -18.704219818115234, -17.85805320739746, -17.011884689331055, -16.16571617126465, -15.319548606872559, -14.473381042480469, -13.627212524414062, -12.781044960021973, -11.934877395629883, -11.088708877563477, -10.242541313171387, -9.39637279510498, -8.55020523071289, -7.704037189483643, -6.8578691482543945, -6.0117011070251465, -5.165533065795898, -4.31936502456665, -3.4731972217559814, -2.6270291805267334, -1.7808613777160645, -0.9346933364868164, -0.08852529525756836, 0.7576427459716797, 1.6038107872009277, 2.449978828430176, 3.2961466312408447, 4.142314910888672, 4.988482475280762, 5.83465051651001, 6.680818557739258, 7.526986598968506, 8.373154640197754, 9.219322204589844, 10.06549072265625, 10.91165828704834, 11.75782585144043, 12.603994369506836, 13.450162887573242, 14.296330451965332, 15.142498016357422, 15.988666534423828, 16.834835052490234, 17.681001663208008, 18.527170181274414, 19.37333869934082, 20.219505310058594, 21.065673828125, 21.911842346191406, 22.75800895690918, 23.604177474975586, 24.450345993041992, 25.296512603759766, 26.142681121826172, 26.988849639892578, 27.835018157958984]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 8.0, 13.0, 19.0, 39.0, 91.0, 145.0, 387.0, 1100.0, 9039.0, 2944824.0, 1233129.0, 4336.0, 662.0, 249.0, 97.0, 55.0, 29.0, 17.0, 12.0, 12.0, 6.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.65625, -42.93310546875, -41.2099609375, -39.48681640625, -37.763671875, -36.04052734375, -34.3173828125, -32.59423828125, -30.87109375, -29.14794921875, -27.4248046875, -25.70166015625, -23.978515625, -22.25537109375, -20.5322265625, -18.80908203125, -17.0859375, -15.36279296875, -13.6396484375, -11.91650390625, -10.193359375, -8.47021484375, -6.7470703125, -5.02392578125, -3.30078125, -1.57763671875, 0.1455078125, 1.86865234375, 3.591796875, 5.31494140625, 7.0380859375, 8.76123046875, 10.484375, 12.20751953125, 13.9306640625, 15.65380859375, 17.376953125, 19.10009765625, 20.8232421875, 22.54638671875, 24.26953125, 25.99267578125, 27.7158203125, 29.43896484375, 31.162109375, 32.88525390625, 34.6083984375, 36.33154296875, 38.0546875, 39.77783203125, 41.5009765625, 43.22412109375, 44.947265625, 46.67041015625, 48.3935546875, 50.11669921875, 51.83984375, 53.56298828125, 55.2861328125, 57.00927734375, 58.732421875, 60.45556640625, 62.1787109375, 63.90185546875, 65.625]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 6.0, 0.0, 8.0, 10.0, 12.0, 20.0, 20.0, 27.0, 40.0, 37.0, 25.0, 51.0, 52.0, 57.0, 82.0, 71.0, 70.0, 56.0, 67.0, 46.0, 51.0, 37.0, 30.0, 32.0, 21.0, 15.0, 19.0, 14.0, 15.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.5625, -9.17529296875, -8.7880859375, -8.40087890625, -8.013671875, -7.62646484375, -7.2392578125, -6.85205078125, -6.46484375, -6.07763671875, -5.6904296875, -5.30322265625, -4.916015625, -4.52880859375, -4.1416015625, -3.75439453125, -3.3671875, -2.97998046875, -2.5927734375, -2.20556640625, -1.818359375, -1.43115234375, -1.0439453125, -0.65673828125, -0.26953125, 0.11767578125, 0.5048828125, 0.89208984375, 1.279296875, 1.66650390625, 2.0537109375, 2.44091796875, 2.828125, 3.21533203125, 3.6025390625, 3.98974609375, 4.376953125, 4.76416015625, 5.1513671875, 5.53857421875, 5.92578125, 6.31298828125, 6.7001953125, 7.08740234375, 7.474609375, 7.86181640625, 8.2490234375, 8.63623046875, 9.0234375, 9.41064453125, 9.7978515625, 10.18505859375, 10.572265625, 10.95947265625, 11.3466796875, 11.73388671875, 12.12109375, 12.50830078125, 12.8955078125, 13.28271484375, 13.669921875, 14.05712890625, 14.4443359375, 14.83154296875, 15.21875]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 5.0, 3.0, 3.0, 9.0, 14.0, 23.0, 44.0, 77.0, 143.0, 281.0, 745.0, 2085.0, 10144.0, 379028.0, 3728694.0, 65606.0, 4959.0, 1402.0, 547.0, 233.0, 92.0, 55.0, 30.0, 15.0, 17.0, 11.0, 3.0, 4.0, 0.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.8125, -30.827880859375, -29.84326171875, -28.858642578125, -27.8740234375, -26.889404296875, -25.90478515625, -24.920166015625, -23.935546875, -22.950927734375, -21.96630859375, -20.981689453125, -19.9970703125, -19.012451171875, -18.02783203125, -17.043212890625, -16.05859375, -15.073974609375, -14.08935546875, -13.104736328125, -12.1201171875, -11.135498046875, -10.15087890625, -9.166259765625, -8.181640625, -7.197021484375, -6.21240234375, -5.227783203125, -4.2431640625, -3.258544921875, -2.27392578125, -1.289306640625, -0.3046875, 0.679931640625, 1.66455078125, 2.649169921875, 3.6337890625, 4.618408203125, 5.60302734375, 6.587646484375, 7.572265625, 8.556884765625, 9.54150390625, 10.526123046875, 11.5107421875, 12.495361328125, 13.47998046875, 14.464599609375, 15.44921875, 16.433837890625, 17.41845703125, 18.403076171875, 19.3876953125, 20.372314453125, 21.35693359375, 22.341552734375, 23.326171875, 24.310791015625, 25.29541015625, 26.280029296875, 27.2646484375, 28.249267578125, 29.23388671875, 30.218505859375, 31.203125]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 10.0, 16.0, 26.0, 41.0, 87.0, 174.0, 267.0, 524.0, 872.0, 849.0, 582.0, 296.0, 139.0, 74.0, 55.0, 29.0, 12.0, 11.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.72265625, -7.46502685546875, -7.2073974609375, -6.94976806640625, -6.692138671875, -6.43450927734375, -6.1768798828125, -5.91925048828125, -5.66162109375, -5.40399169921875, -5.1463623046875, -4.88873291015625, -4.631103515625, -4.37347412109375, -4.1158447265625, -3.85821533203125, -3.6005859375, -3.34295654296875, -3.0853271484375, -2.82769775390625, -2.570068359375, -2.31243896484375, -2.0548095703125, -1.79718017578125, -1.53955078125, -1.28192138671875, -1.0242919921875, -0.76666259765625, -0.509033203125, -0.25140380859375, 0.0062255859375, 0.26385498046875, 0.521484375, 0.77911376953125, 1.0367431640625, 1.29437255859375, 1.552001953125, 1.80963134765625, 2.0672607421875, 2.32489013671875, 2.58251953125, 2.84014892578125, 3.0977783203125, 3.35540771484375, 3.613037109375, 3.87066650390625, 4.1282958984375, 4.38592529296875, 4.6435546875, 4.90118408203125, 5.1588134765625, 5.41644287109375, 5.674072265625, 5.93170166015625, 6.1893310546875, 6.44696044921875, 6.70458984375, 6.96221923828125, 7.2198486328125, 7.47747802734375, 7.735107421875, 7.99273681640625, 8.2503662109375, 8.50799560546875, 8.765625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 12.0, 12.0, 25.0, 53.0, 90.0, 135.0, 188.0, 176.0, 147.0, 90.0, 47.0, 24.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-61.17447280883789, -59.97032165527344, -58.766170501708984, -57.56201934814453, -56.35786819458008, -55.153717041015625, -53.94956588745117, -52.74541473388672, -51.541259765625, -50.33710861206055, -49.132957458496094, -47.92880630493164, -46.72465515136719, -45.520503997802734, -44.31635284423828, -43.11219787597656, -41.908050537109375, -40.70389938354492, -39.49974822998047, -38.295597076416016, -37.09144592285156, -35.88729476928711, -34.683143615722656, -33.47898864746094, -32.27484130859375, -31.070690155029297, -29.866539001464844, -28.66238784790039, -27.458236694335938, -26.254085540771484, -25.0499324798584, -23.845781326293945, -22.641624450683594, -21.43747329711914, -20.233322143554688, -19.029170989990234, -17.82501983642578, -16.620868682861328, -15.416715621948242, -14.212564468383789, -13.008414268493652, -11.8042631149292, -10.60011100769043, -9.395959854125977, -8.191808700561523, -6.98765754699707, -5.783505916595459, -4.579354286193848, -3.3752031326293945, -2.1710517406463623, -0.9669003486633301, 0.23725104331970215, 1.4414024353027344, 2.6455535888671875, 3.849705219268799, 5.05385684967041, 6.258008003234863, 7.462159156799316, 8.666311264038086, 9.870462417602539, 11.074613571166992, 12.278764724731445, 13.482915878295898, 14.687067985534668, 15.891219139099121]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 8.0, 3.0, 10.0, 12.0, 20.0, 17.0, 20.0, 15.0, 25.0, 18.0, 34.0, 41.0, 28.0, 37.0, 53.0, 44.0, 50.0, 46.0, 45.0, 44.0, 54.0, 37.0, 42.0, 42.0, 42.0, 31.0, 21.0, 29.0, 21.0, 17.0, 15.0, 16.0, 12.0, 18.0, 9.0, 6.0, 9.0, 8.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.263497352600098, -8.90318489074707, -8.542872428894043, -8.182559967041016, -7.822246551513672, -7.4619340896606445, -7.101621627807617, -6.74130916595459, -6.380996227264404, -6.020683765411377, -5.660370826721191, -5.300058364868164, -4.939745903015137, -4.579432964324951, -4.219120502471924, -3.8588078022003174, -3.498495101928711, -3.1381824016571045, -2.777869701385498, -2.4175572395324707, -2.0572445392608643, -1.6969318389892578, -1.3366193771362305, -0.976306676864624, -0.6159939765930176, -0.2556813359260559, 0.10463130474090576, 0.46494388580322266, 0.8252565860748291, 1.1855692863464355, 1.545881748199463, 1.9061944484710693, 2.266508102416992, 2.6268208026885986, 2.987133502960205, 3.3474459648132324, 3.707758665084839, 4.068071365356445, 4.428383827209473, 4.7886962890625, 5.1490092277526855, 5.509321689605713, 5.869634628295898, 6.229947090148926, 6.590259552001953, 6.950572490692139, 7.310884952545166, 7.671197891235352, 8.031510353088379, 8.391822814941406, 8.752135276794434, 9.112447738647461, 9.472761154174805, 9.833073616027832, 10.19338607788086, 10.553698539733887, 10.914011001586914, 11.274323463439941, 11.634635925292969, 11.994949340820312, 12.35526180267334, 12.715574264526367, 13.075886726379395, 13.436199188232422, 13.796512603759766]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 5.0, 4.0, 7.0, 2.0, 18.0, 11.0, 21.0, 33.0, 47.0, 45.0, 94.0, 136.0, 204.0, 370.0, 732.0, 1403.0, 3691.0, 10471.0, 35665.0, 134133.0, 382581.0, 332713.0, 103945.0, 27980.0, 8419.0, 3022.0, 1255.0, 599.0, 360.0, 177.0, 124.0, 77.0, 55.0, 57.0, 29.0, 15.0, 21.0, 9.0, 3.0, 7.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.087890625, -2.010284423828125, -1.93267822265625, -1.855072021484375, -1.7774658203125, -1.699859619140625, -1.62225341796875, -1.544647216796875, -1.467041015625, -1.389434814453125, -1.31182861328125, -1.234222412109375, -1.1566162109375, -1.079010009765625, -1.00140380859375, -0.923797607421875, -0.84619140625, -0.768585205078125, -0.69097900390625, -0.613372802734375, -0.5357666015625, -0.458160400390625, -0.38055419921875, -0.302947998046875, -0.225341796875, -0.147735595703125, -0.07012939453125, 0.007476806640625, 0.0850830078125, 0.162689208984375, 0.24029541015625, 0.317901611328125, 0.3955078125, 0.473114013671875, 0.55072021484375, 0.628326416015625, 0.7059326171875, 0.783538818359375, 0.86114501953125, 0.938751220703125, 1.016357421875, 1.093963623046875, 1.17156982421875, 1.249176025390625, 1.3267822265625, 1.404388427734375, 1.48199462890625, 1.559600830078125, 1.63720703125, 1.714813232421875, 1.79241943359375, 1.870025634765625, 1.9476318359375, 2.025238037109375, 2.10284423828125, 2.180450439453125, 2.258056640625, 2.335662841796875, 2.41326904296875, 2.490875244140625, 2.5684814453125, 2.646087646484375, 2.72369384765625, 2.801300048828125, 2.87890625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 15.0, 14.0, 16.0, 16.0, 20.0, 22.0, 25.0, 28.0, 39.0, 49.0, 52.0, 49.0, 57.0, 53.0, 75.0, 50.0, 57.0, 55.0, 52.0, 47.0, 35.0, 31.0, 28.0, 27.0, 18.0, 13.0, 11.0, 18.0, 14.0, 7.0, 5.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.6015625, -8.31005859375, -8.0185546875, -7.72705078125, -7.435546875, -7.14404296875, -6.8525390625, -6.56103515625, -6.26953125, -5.97802734375, -5.6865234375, -5.39501953125, -5.103515625, -4.81201171875, -4.5205078125, -4.22900390625, -3.9375, -3.64599609375, -3.3544921875, -3.06298828125, -2.771484375, -2.47998046875, -2.1884765625, -1.89697265625, -1.60546875, -1.31396484375, -1.0224609375, -0.73095703125, -0.439453125, -0.14794921875, 0.1435546875, 0.43505859375, 0.7265625, 1.01806640625, 1.3095703125, 1.60107421875, 1.892578125, 2.18408203125, 2.4755859375, 2.76708984375, 3.05859375, 3.35009765625, 3.6416015625, 3.93310546875, 4.224609375, 4.51611328125, 4.8076171875, 5.09912109375, 5.390625, 5.68212890625, 5.9736328125, 6.26513671875, 6.556640625, 6.84814453125, 7.1396484375, 7.43115234375, 7.72265625, 8.01416015625, 8.3056640625, 8.59716796875, 8.888671875, 9.18017578125, 9.4716796875, 9.76318359375, 10.0546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 12.0, 13.0, 14.0, 32.0, 32.0, 59.0, 88.0, 172.0, 278.0, 454.0, 809.0, 1340.0, 2348.0, 4153.0, 7150.0, 13117.0, 22870.0, 40714.0, 70497.0, 115575.0, 171380.0, 194510.0, 157653.0, 102345.0, 61292.0, 35377.0, 19924.0, 11197.0, 6346.0, 3705.0, 2096.0, 1222.0, 711.0, 417.0, 227.0, 158.0, 98.0, 70.0, 32.0, 22.0, 16.0, 13.0, 8.0, 7.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7646484375, -0.7376937866210938, -0.7107391357421875, -0.6837844848632812, -0.656829833984375, -0.6298751831054688, -0.6029205322265625, -0.5759658813476562, -0.54901123046875, -0.5220565795898438, -0.4951019287109375, -0.46814727783203125, -0.441192626953125, -0.41423797607421875, -0.3872833251953125, -0.36032867431640625, -0.3333740234375, -0.30641937255859375, -0.2794647216796875, -0.25251007080078125, -0.225555419921875, -0.19860076904296875, -0.1716461181640625, -0.14469146728515625, -0.11773681640625, -0.09078216552734375, -0.0638275146484375, -0.03687286376953125, -0.009918212890625, 0.01703643798828125, 0.0439910888671875, 0.07094573974609375, 0.097900390625, 0.12485504150390625, 0.1518096923828125, 0.17876434326171875, 0.205718994140625, 0.23267364501953125, 0.2596282958984375, 0.28658294677734375, 0.31353759765625, 0.34049224853515625, 0.3674468994140625, 0.39440155029296875, 0.421356201171875, 0.44831085205078125, 0.4752655029296875, 0.5022201538085938, 0.5291748046875, 0.5561294555664062, 0.5830841064453125, 0.6100387573242188, 0.636993408203125, 0.6639480590820312, 0.6909027099609375, 0.7178573608398438, 0.74481201171875, 0.7717666625976562, 0.7987213134765625, 0.8256759643554688, 0.852630615234375, 0.8795852661132812, 0.9065399169921875, 0.9334945678710938, 0.96044921875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 12.0, 6.0, 6.0, 10.0, 11.0, 15.0, 11.0, 23.0, 31.0, 30.0, 37.0, 41.0, 41.0, 44.0, 53.0, 47.0, 53.0, 56.0, 56.0, 55.0, 56.0, 51.0, 35.0, 37.0, 28.0, 27.0, 22.0, 14.0, 18.0, 19.0, 11.0, 12.0, 10.0, 7.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9453125, -12.4302978515625, -11.915283203125, -11.4002685546875, -10.88525390625, -10.3702392578125, -9.855224609375, -9.3402099609375, -8.8251953125, -8.3101806640625, -7.795166015625, -7.2801513671875, -6.76513671875, -6.2501220703125, -5.735107421875, -5.2200927734375, -4.705078125, -4.1900634765625, -3.675048828125, -3.1600341796875, -2.64501953125, -2.1300048828125, -1.614990234375, -1.0999755859375, -0.5849609375, -0.0699462890625, 0.445068359375, 0.9600830078125, 1.47509765625, 1.9901123046875, 2.505126953125, 3.0201416015625, 3.53515625, 4.0501708984375, 4.565185546875, 5.0802001953125, 5.59521484375, 6.1102294921875, 6.625244140625, 7.1402587890625, 7.6552734375, 8.1702880859375, 8.685302734375, 9.2003173828125, 9.71533203125, 10.2303466796875, 10.745361328125, 11.2603759765625, 11.775390625, 12.2904052734375, 12.805419921875, 13.3204345703125, 13.83544921875, 14.3504638671875, 14.865478515625, 15.3804931640625, 15.8955078125, 16.4105224609375, 16.925537109375, 17.4405517578125, 17.95556640625, 18.4705810546875, 18.985595703125, 19.5006103515625, 20.015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 6.0, 4.0, 11.0, 17.0, 22.0, 38.0, 79.0, 105.0, 205.0, 308.0, 614.0, 1159.0, 2633.0, 6821.0, 21378.0, 84802.0, 364133.0, 421430.0, 105540.0, 25460.0, 7910.0, 2964.0, 1330.0, 656.0, 385.0, 195.0, 124.0, 70.0, 45.0, 30.0, 26.0, 14.0, 4.0, 10.0, 6.0, 6.0, 6.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2705078125, -0.26279449462890625, -0.2550811767578125, -0.24736785888671875, -0.239654541015625, -0.23194122314453125, -0.2242279052734375, -0.21651458740234375, -0.20880126953125, -0.20108795166015625, -0.1933746337890625, -0.18566131591796875, -0.177947998046875, -0.17023468017578125, -0.1625213623046875, -0.15480804443359375, -0.1470947265625, -0.13938140869140625, -0.1316680908203125, -0.12395477294921875, -0.116241455078125, -0.10852813720703125, -0.1008148193359375, -0.09310150146484375, -0.08538818359375, -0.07767486572265625, -0.0699615478515625, -0.06224822998046875, -0.054534912109375, -0.04682159423828125, -0.0391082763671875, -0.03139495849609375, -0.023681640625, -0.01596832275390625, -0.0082550048828125, -0.00054168701171875, 0.007171630859375, 0.01488494873046875, 0.0225982666015625, 0.03031158447265625, 0.03802490234375, 0.04573822021484375, 0.0534515380859375, 0.06116485595703125, 0.068878173828125, 0.07659149169921875, 0.0843048095703125, 0.09201812744140625, 0.0997314453125, 0.10744476318359375, 0.1151580810546875, 0.12287139892578125, 0.130584716796875, 0.13829803466796875, 0.1460113525390625, 0.15372467041015625, 0.16143798828125, 0.16915130615234375, 0.1768646240234375, 0.18457794189453125, 0.192291259765625, 0.20000457763671875, 0.2077178955078125, 0.21543121337890625, 0.22314453125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 5.0, 13.0, 25.0, 36.0, 40.0, 67.0, 82.0, 110.0, 118.0, 147.0, 105.0, 86.0, 59.0, 35.0, 24.0, 24.0, 8.0, 4.0, 6.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001608133316040039, -0.0001543443650007248, -0.00014787539839744568, -0.00014140643179416656, -0.00013493746519088745, -0.00012846849858760834, -0.00012199953198432922, -0.00011553056538105011, -0.000109061598777771, -0.00010259263217449188, -9.612366557121277e-05, -8.965469896793365e-05, -8.318573236465454e-05, -7.671676576137543e-05, -7.024779915809631e-05, -6.37788325548172e-05, -5.7309865951538086e-05, -5.084089934825897e-05, -4.437193274497986e-05, -3.7902966141700745e-05, -3.143399953842163e-05, -2.4965032935142517e-05, -1.8496066331863403e-05, -1.202709972858429e-05, -5.558133125305176e-06, 9.10833477973938e-07, 7.379800081253052e-06, 1.3848766684532166e-05, 2.031773328781128e-05, 2.6786699891090393e-05, 3.325566649436951e-05, 3.972463309764862e-05, 4.6193599700927734e-05, 5.266256630420685e-05, 5.913153290748596e-05, 6.560049951076508e-05, 7.206946611404419e-05, 7.85384327173233e-05, 8.500739932060242e-05, 9.147636592388153e-05, 9.794533252716064e-05, 0.00010441429913043976, 0.00011088326573371887, 0.00011735223233699799, 0.0001238211989402771, 0.0001302901655435562, 0.00013675913214683533, 0.00014322809875011444, 0.00014969706535339355, 0.00015616603195667267, 0.00016263499855995178, 0.0001691039651632309, 0.00017557293176651, 0.00018204189836978912, 0.00018851086497306824, 0.00019497983157634735, 0.00020144879817962646, 0.00020791776478290558, 0.0002143867313861847, 0.0002208556979894638, 0.00022732466459274292, 0.00023379363119602203, 0.00024026259779930115, 0.00024673156440258026, 0.0002532005310058594]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 3.0, 3.0, 12.0, 6.0, 19.0, 17.0, 35.0, 42.0, 65.0, 85.0, 155.0, 187.0, 367.0, 531.0, 946.0, 1748.0, 3602.0, 8235.0, 21773.0, 65908.0, 217137.0, 423029.0, 205944.0, 61986.0, 20908.0, 8144.0, 3476.0, 1700.0, 902.0, 573.0, 327.0, 212.0, 154.0, 94.0, 62.0, 47.0, 28.0, 26.0, 25.0, 15.0, 8.0, 7.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.19482421875, -0.18863487243652344, -0.18244552612304688, -0.1762561798095703, -0.17006683349609375, -0.1638774871826172, -0.15768814086914062, -0.15149879455566406, -0.1453094482421875, -0.13912010192871094, -0.13293075561523438, -0.1267414093017578, -0.12055206298828125, -0.11436271667480469, -0.10817337036132812, -0.10198402404785156, -0.095794677734375, -0.08960533142089844, -0.08341598510742188, -0.07722663879394531, -0.07103729248046875, -0.06484794616699219, -0.058658599853515625, -0.05246925354003906, -0.0462799072265625, -0.04009056091308594, -0.033901214599609375, -0.027711868286132812, -0.02152252197265625, -0.015333175659179688, -0.009143829345703125, -0.0029544830322265625, 0.00323486328125, 0.009424209594726562, 0.015613555908203125, 0.021802902221679688, 0.02799224853515625, 0.03418159484863281, 0.040370941162109375, 0.04656028747558594, 0.0527496337890625, 0.05893898010253906, 0.06512832641601562, 0.07131767272949219, 0.07750701904296875, 0.08369636535644531, 0.08988571166992188, 0.09607505798339844, 0.102264404296875, 0.10845375061035156, 0.11464309692382812, 0.12083244323730469, 0.12702178955078125, 0.1332111358642578, 0.13940048217773438, 0.14558982849121094, 0.1517791748046875, 0.15796852111816406, 0.16415786743164062, 0.1703472137451172, 0.17653656005859375, 0.1827259063720703, 0.18891525268554688, 0.19510459899902344, 0.2012939453125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 6.0, 5.0, 3.0, 9.0, 20.0, 22.0, 18.0, 20.0, 38.0, 47.0, 49.0, 53.0, 71.0, 77.0, 78.0, 79.0, 70.0, 73.0, 56.0, 51.0, 22.0, 30.0, 26.0, 21.0, 13.0, 8.0, 9.0, 9.0, 3.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.069091796875, -0.06698322296142578, -0.06487464904785156, -0.06276607513427734, -0.060657501220703125, -0.058548927307128906, -0.05644035339355469, -0.05433177947998047, -0.05222320556640625, -0.05011463165283203, -0.04800605773925781, -0.045897483825683594, -0.043788909912109375, -0.041680335998535156, -0.03957176208496094, -0.03746318817138672, -0.0353546142578125, -0.03324604034423828, -0.031137466430664062, -0.029028892517089844, -0.026920318603515625, -0.024811744689941406, -0.022703170776367188, -0.02059459686279297, -0.01848602294921875, -0.01637744903564453, -0.014268875122070312, -0.012160301208496094, -0.010051727294921875, -0.007943153381347656, -0.0058345794677734375, -0.0037260055541992188, -0.001617431640625, 0.0004911422729492188, 0.0025997161865234375, 0.004708290100097656, 0.006816864013671875, 0.008925437927246094, 0.011034011840820312, 0.013142585754394531, 0.01525115966796875, 0.01735973358154297, 0.019468307495117188, 0.021576881408691406, 0.023685455322265625, 0.025794029235839844, 0.027902603149414062, 0.03001117706298828, 0.0321197509765625, 0.03422832489013672, 0.03633689880371094, 0.038445472717285156, 0.040554046630859375, 0.042662620544433594, 0.04477119445800781, 0.04687976837158203, 0.04898834228515625, 0.05109691619873047, 0.05320549011230469, 0.055314064025878906, 0.057422637939453125, 0.059531211853027344, 0.06163978576660156, 0.06374835968017578, 0.06585693359375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 23.0, 162.0, 515.0, 278.0, 31.0, 1.0, 1.0, 0.0, 2.0], "bins": [-119.61631774902344, -117.53804779052734, -115.45977783203125, -113.38150787353516, -111.30323791503906, -109.22496032714844, -107.14669799804688, -105.06842041015625, -102.99015045166016, -100.91188049316406, -98.83361053466797, -96.75534057617188, -94.67707061767578, -92.59880065917969, -90.52052307128906, -88.44225311279297, -86.36398315429688, -84.28571319580078, -82.20744323730469, -80.1291732788086, -78.0509033203125, -75.97262573242188, -73.89436340332031, -71.81608581542969, -69.73782348632812, -67.65955352783203, -65.58128356933594, -63.503013610839844, -61.424739837646484, -59.34646987915039, -57.2681999206543, -55.1899299621582, -53.11165237426758, -51.033382415771484, -48.95511245727539, -46.87683868408203, -44.79856872558594, -42.720298767089844, -40.64202880859375, -38.563758850097656, -36.48548889160156, -34.40721893310547, -32.328948974609375, -30.25067710876465, -28.172405242919922, -26.094135284423828, -24.015865325927734, -21.93759536743164, -19.85932159423828, -17.781051635742188, -15.702779769897461, -13.624509811401367, -11.546238899230957, -9.467967987060547, -7.389698028564453, -5.311427116394043, -3.233157157897949, -1.1548864841461182, 0.9233841896057129, 3.001654624938965, 5.079925537109375, 7.158196449279785, 9.236466407775879, 11.314737319946289, 13.3930082321167]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 9.0, 9.0, 6.0, 23.0, 23.0, 22.0, 22.0, 36.0, 35.0, 48.0, 47.0, 58.0, 68.0, 69.0, 62.0, 54.0, 71.0, 41.0, 63.0, 45.0, 29.0, 37.0, 23.0, 21.0, 21.0, 20.0, 21.0, 9.0, 8.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.083810806274414, -7.778956413269043, -7.474102020263672, -7.169248104095459, -6.864393711090088, -6.559539318084717, -6.254685401916504, -5.949831008911133, -5.644976615905762, -5.340122222900391, -5.0352678298950195, -4.730413913726807, -4.4255595207214355, -4.1207051277160645, -3.8158509731292725, -3.5109968185424805, -3.2061424255371094, -2.9012880325317383, -2.5964338779449463, -2.2915797233581543, -1.9867253303527832, -1.6818710565567017, -1.3770167827606201, -1.0721626281738281, -0.767308235168457, -0.4624539613723755, -0.15759968757629395, 0.1472545862197876, 0.45210886001586914, 0.7569631338119507, 1.0618174076080322, 1.3666715621948242, 1.6715259552001953, 1.9763802289962769, 2.2812345027923584, 2.5860886573791504, 2.8909430503845215, 3.1957974433898926, 3.5006515979766846, 3.8055057525634766, 4.110360145568848, 4.415214538574219, 4.72006893157959, 5.024922847747803, 5.329777240753174, 5.634631633758545, 5.939485549926758, 6.244339942932129, 6.5491943359375, 6.854048728942871, 7.158903121948242, 7.463757038116455, 7.768611431121826, 8.073465347290039, 8.37831974029541, 8.683174133300781, 8.988028526306152, 9.292882919311523, 9.597737312316895, 9.902591705322266, 10.20744514465332, 10.512299537658691, 10.817153930664062, 11.122008323669434, 11.426862716674805]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 7.0, 4.0, 5.0, 13.0, 16.0, 22.0, 25.0, 42.0, 94.0, 140.0, 253.0, 700.0, 2365.0, 14270.0, 109933.0, 781103.0, 120149.0, 15322.0, 2672.0, 755.0, 277.0, 144.0, 90.0, 54.0, 35.0, 15.0, 8.0, 10.0, 8.0, 8.0, 6.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-21.71875, -21.169189453125, -20.61962890625, -20.070068359375, -19.5205078125, -18.970947265625, -18.42138671875, -17.871826171875, -17.322265625, -16.772705078125, -16.22314453125, -15.673583984375, -15.1240234375, -14.574462890625, -14.02490234375, -13.475341796875, -12.92578125, -12.376220703125, -11.82666015625, -11.277099609375, -10.7275390625, -10.177978515625, -9.62841796875, -9.078857421875, -8.529296875, -7.979736328125, -7.43017578125, -6.880615234375, -6.3310546875, -5.781494140625, -5.23193359375, -4.682373046875, -4.1328125, -3.583251953125, -3.03369140625, -2.484130859375, -1.9345703125, -1.385009765625, -0.83544921875, -0.285888671875, 0.263671875, 0.813232421875, 1.36279296875, 1.912353515625, 2.4619140625, 3.011474609375, 3.56103515625, 4.110595703125, 4.66015625, 5.209716796875, 5.75927734375, 6.308837890625, 6.8583984375, 7.407958984375, 7.95751953125, 8.507080078125, 9.056640625, 9.606201171875, 10.15576171875, 10.705322265625, 11.2548828125, 11.804443359375, 12.35400390625, 12.903564453125, 13.453125]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 9.0, 10.0, 17.0, 28.0, 13.0, 22.0, 22.0, 33.0, 34.0, 46.0, 36.0, 72.0, 62.0, 62.0, 60.0, 69.0, 50.0, 55.0, 47.0, 41.0, 33.0, 42.0, 25.0, 24.0, 22.0, 14.0, 19.0, 10.0, 6.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.1875, -15.637939453125, -15.08837890625, -14.538818359375, -13.9892578125, -13.439697265625, -12.89013671875, -12.340576171875, -11.791015625, -11.241455078125, -10.69189453125, -10.142333984375, -9.5927734375, -9.043212890625, -8.49365234375, -7.944091796875, -7.39453125, -6.844970703125, -6.29541015625, -5.745849609375, -5.1962890625, -4.646728515625, -4.09716796875, -3.547607421875, -2.998046875, -2.448486328125, -1.89892578125, -1.349365234375, -0.7998046875, -0.250244140625, 0.29931640625, 0.848876953125, 1.3984375, 1.947998046875, 2.49755859375, 3.047119140625, 3.5966796875, 4.146240234375, 4.69580078125, 5.245361328125, 5.794921875, 6.344482421875, 6.89404296875, 7.443603515625, 7.9931640625, 8.542724609375, 9.09228515625, 9.641845703125, 10.19140625, 10.740966796875, 11.29052734375, 11.840087890625, 12.3896484375, 12.939208984375, 13.48876953125, 14.038330078125, 14.587890625, 15.137451171875, 15.68701171875, 16.236572265625, 16.7861328125, 17.335693359375, 17.88525390625, 18.434814453125, 18.984375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 7.0, 6.0, 16.0, 13.0, 18.0, 33.0, 32.0, 44.0, 88.0, 107.0, 151.0, 232.0, 347.0, 777.0, 3817.0, 69541.0, 905040.0, 62857.0, 3601.0, 775.0, 333.0, 210.0, 135.0, 106.0, 62.0, 58.0, 37.0, 30.0, 23.0, 13.0, 13.0, 7.0, 8.0, 7.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-29.71875, -28.946533203125, -28.17431640625, -27.402099609375, -26.6298828125, -25.857666015625, -25.08544921875, -24.313232421875, -23.541015625, -22.768798828125, -21.99658203125, -21.224365234375, -20.4521484375, -19.679931640625, -18.90771484375, -18.135498046875, -17.36328125, -16.591064453125, -15.81884765625, -15.046630859375, -14.2744140625, -13.502197265625, -12.72998046875, -11.957763671875, -11.185546875, -10.413330078125, -9.64111328125, -8.868896484375, -8.0966796875, -7.324462890625, -6.55224609375, -5.780029296875, -5.0078125, -4.235595703125, -3.46337890625, -2.691162109375, -1.9189453125, -1.146728515625, -0.37451171875, 0.397705078125, 1.169921875, 1.942138671875, 2.71435546875, 3.486572265625, 4.2587890625, 5.031005859375, 5.80322265625, 6.575439453125, 7.34765625, 8.119873046875, 8.89208984375, 9.664306640625, 10.4365234375, 11.208740234375, 11.98095703125, 12.753173828125, 13.525390625, 14.297607421875, 15.06982421875, 15.842041015625, 16.6142578125, 17.386474609375, 18.15869140625, 18.930908203125, 19.703125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 6.0, 3.0, 5.0, 6.0, 6.0, 11.0, 9.0, 10.0, 16.0, 22.0, 17.0, 26.0, 16.0, 20.0, 32.0, 35.0, 37.0, 47.0, 40.0, 50.0, 53.0, 38.0, 52.0, 40.0, 50.0, 47.0, 28.0, 39.0, 43.0, 27.0, 24.0, 25.0, 17.0, 18.0, 18.0, 15.0, 13.0, 13.0, 13.0, 8.0, 4.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.125, -16.6162109375, -16.107421875, -15.5986328125, -15.08984375, -14.5810546875, -14.072265625, -13.5634765625, -13.0546875, -12.5458984375, -12.037109375, -11.5283203125, -11.01953125, -10.5107421875, -10.001953125, -9.4931640625, -8.984375, -8.4755859375, -7.966796875, -7.4580078125, -6.94921875, -6.4404296875, -5.931640625, -5.4228515625, -4.9140625, -4.4052734375, -3.896484375, -3.3876953125, -2.87890625, -2.3701171875, -1.861328125, -1.3525390625, -0.84375, -0.3349609375, 0.173828125, 0.6826171875, 1.19140625, 1.7001953125, 2.208984375, 2.7177734375, 3.2265625, 3.7353515625, 4.244140625, 4.7529296875, 5.26171875, 5.7705078125, 6.279296875, 6.7880859375, 7.296875, 7.8056640625, 8.314453125, 8.8232421875, 9.33203125, 9.8408203125, 10.349609375, 10.8583984375, 11.3671875, 11.8759765625, 12.384765625, 12.8935546875, 13.40234375, 13.9111328125, 14.419921875, 14.9287109375, 15.4375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 6.0, 8.0, 32.0, 57.0, 68.0, 198.0, 339.0, 747.0, 2045.0, 18135.0, 977073.0, 45481.0, 2650.0, 889.0, 426.0, 201.0, 111.0, 36.0, 34.0, 11.0, 3.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8828125, -12.4476318359375, -12.012451171875, -11.5772705078125, -11.14208984375, -10.7069091796875, -10.271728515625, -9.8365478515625, -9.4013671875, -8.9661865234375, -8.531005859375, -8.0958251953125, -7.66064453125, -7.2254638671875, -6.790283203125, -6.3551025390625, -5.919921875, -5.4847412109375, -5.049560546875, -4.6143798828125, -4.17919921875, -3.7440185546875, -3.308837890625, -2.8736572265625, -2.4384765625, -2.0032958984375, -1.568115234375, -1.1329345703125, -0.69775390625, -0.2625732421875, 0.172607421875, 0.6077880859375, 1.04296875, 1.4781494140625, 1.913330078125, 2.3485107421875, 2.78369140625, 3.2188720703125, 3.654052734375, 4.0892333984375, 4.5244140625, 4.9595947265625, 5.394775390625, 5.8299560546875, 6.26513671875, 6.7003173828125, 7.135498046875, 7.5706787109375, 8.005859375, 8.4410400390625, 8.876220703125, 9.3114013671875, 9.74658203125, 10.1817626953125, 10.616943359375, 11.0521240234375, 11.4873046875, 11.9224853515625, 12.357666015625, 12.7928466796875, 13.22802734375, 13.6632080078125, 14.098388671875, 14.5335693359375, 14.96875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 8.0, 15.0, 41.0, 157.0, 540.0, 163.0, 55.0, 20.0, 10.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0033740997314453125, -0.0032792389392852783, -0.003184378147125244, -0.00308951735496521, -0.0029946565628051758, -0.0028997957706451416, -0.0028049349784851074, -0.0027100741863250732, -0.002615213394165039, -0.002520352602005005, -0.0024254918098449707, -0.0023306310176849365, -0.0022357702255249023, -0.002140909433364868, -0.002046048641204834, -0.0019511878490447998, -0.0018563270568847656, -0.0017614662647247314, -0.0016666054725646973, -0.001571744680404663, -0.001476883888244629, -0.0013820230960845947, -0.0012871623039245605, -0.0011923015117645264, -0.0010974407196044922, -0.001002579927444458, -0.0009077191352844238, -0.0008128583431243896, -0.0007179975509643555, -0.0006231367588043213, -0.0005282759666442871, -0.00043341517448425293, -0.00033855438232421875, -0.00024369359016418457, -0.0001488327980041504, -5.397200584411621e-05, 4.088878631591797e-05, 0.00013574957847595215, 0.00023061037063598633, 0.0003254711627960205, 0.0004203319549560547, 0.0005151927471160889, 0.000610053539276123, 0.0007049143314361572, 0.0007997751235961914, 0.0008946359157562256, 0.0009894967079162598, 0.001084357500076294, 0.0011792182922363281, 0.0012740790843963623, 0.0013689398765563965, 0.0014638006687164307, 0.0015586614608764648, 0.001653522253036499, 0.0017483830451965332, 0.0018432438373565674, 0.0019381046295166016, 0.0020329654216766357, 0.00212782621383667, 0.002222687005996704, 0.0023175477981567383, 0.0024124085903167725, 0.0025072693824768066, 0.002602130174636841, 0.002696990966796875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 4.0, 9.0, 10.0, 13.0, 12.0, 25.0, 21.0, 28.0, 46.0, 70.0, 72.0, 134.0, 155.0, 251.0, 344.0, 595.0, 1359.0, 5921.0, 78449.0, 889863.0, 63058.0, 5147.0, 1255.0, 527.0, 346.0, 213.0, 184.0, 132.0, 75.0, 63.0, 48.0, 35.0, 20.0, 16.0, 12.0, 8.0, 10.0, 7.0, 0.0, 5.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-10.0859375, -9.7845458984375, -9.483154296875, -9.1817626953125, -8.88037109375, -8.5789794921875, -8.277587890625, -7.9761962890625, -7.6748046875, -7.3734130859375, -7.072021484375, -6.7706298828125, -6.46923828125, -6.1678466796875, -5.866455078125, -5.5650634765625, -5.263671875, -4.9622802734375, -4.660888671875, -4.3594970703125, -4.05810546875, -3.7567138671875, -3.455322265625, -3.1539306640625, -2.8525390625, -2.5511474609375, -2.249755859375, -1.9483642578125, -1.64697265625, -1.3455810546875, -1.044189453125, -0.7427978515625, -0.44140625, -0.1400146484375, 0.161376953125, 0.4627685546875, 0.76416015625, 1.0655517578125, 1.366943359375, 1.6683349609375, 1.9697265625, 2.2711181640625, 2.572509765625, 2.8739013671875, 3.17529296875, 3.4766845703125, 3.778076171875, 4.0794677734375, 4.380859375, 4.6822509765625, 4.983642578125, 5.2850341796875, 5.58642578125, 5.8878173828125, 6.189208984375, 6.4906005859375, 6.7919921875, 7.0933837890625, 7.394775390625, 7.6961669921875, 7.99755859375, 8.2989501953125, 8.600341796875, 8.9017333984375, 9.203125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 8.0, 3.0, 11.0, 9.0, 26.0, 18.0, 13.0, 27.0, 35.0, 39.0, 38.0, 70.0, 175.0, 185.0, 73.0, 51.0, 35.0, 31.0, 27.0, 36.0, 15.0, 18.0, 15.0, 12.0, 8.0, 5.0, 4.0, 5.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.20703125, -1.15216064453125, -1.0972900390625, -1.04241943359375, -0.987548828125, -0.93267822265625, -0.8778076171875, -0.82293701171875, -0.76806640625, -0.71319580078125, -0.6583251953125, -0.60345458984375, -0.548583984375, -0.49371337890625, -0.4388427734375, -0.38397216796875, -0.3291015625, -0.27423095703125, -0.2193603515625, -0.16448974609375, -0.109619140625, -0.05474853515625, 0.0001220703125, 0.05499267578125, 0.10986328125, 0.16473388671875, 0.2196044921875, 0.27447509765625, 0.329345703125, 0.38421630859375, 0.4390869140625, 0.49395751953125, 0.548828125, 0.60369873046875, 0.6585693359375, 0.71343994140625, 0.768310546875, 0.82318115234375, 0.8780517578125, 0.93292236328125, 0.98779296875, 1.04266357421875, 1.0975341796875, 1.15240478515625, 1.207275390625, 1.26214599609375, 1.3170166015625, 1.37188720703125, 1.4267578125, 1.48162841796875, 1.5364990234375, 1.59136962890625, 1.646240234375, 1.70111083984375, 1.7559814453125, 1.81085205078125, 1.86572265625, 1.92059326171875, 1.9754638671875, 2.03033447265625, 2.085205078125, 2.14007568359375, 2.1949462890625, 2.24981689453125, 2.3046875]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 6.0, 8.0, 13.0, 23.0, 61.0, 109.0, 197.0, 190.0, 161.0, 120.0, 63.0, 34.0, 15.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.79286193847656, -59.28363800048828, -57.7744140625, -56.26519012451172, -54.75596618652344, -53.246742248535156, -51.737518310546875, -50.228294372558594, -48.71907043457031, -47.20984649658203, -45.70062255859375, -44.19139862060547, -42.68217468261719, -41.172950744628906, -39.663726806640625, -38.154502868652344, -36.64528274536133, -35.13605880737305, -33.626834869384766, -32.117610931396484, -30.608386993408203, -29.099163055419922, -27.589941024780273, -26.080717086791992, -24.57149314880371, -23.06226921081543, -21.55304527282715, -20.0438232421875, -18.53459930419922, -17.025375366210938, -15.516151428222656, -14.006927490234375, -12.49770736694336, -10.988483428955078, -9.479259490966797, -7.970036506652832, -6.460812568664551, -4.9515886306762695, -3.4423656463623047, -1.9331417083740234, -0.4239177703857422, 1.08530592918396, 2.594529628753662, 4.103753089904785, 5.612977027893066, 7.122200965881348, 8.631423950195312, 10.140647888183594, 11.649871826171875, 13.159095764160156, 14.668319702148438, 16.17754364013672, 17.686767578125, 19.19599151611328, 20.70521354675293, 22.21443748474121, 23.723661422729492, 25.232885360717773, 26.742109298706055, 28.251331329345703, 29.760555267333984, 31.269779205322266, 32.77900314331055, 34.28822708129883, 35.79745101928711]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 1.0, 8.0, 6.0, 7.0, 13.0, 8.0, 15.0, 15.0, 23.0, 19.0, 19.0, 30.0, 40.0, 34.0, 36.0, 40.0, 37.0, 42.0, 33.0, 58.0, 51.0, 36.0, 41.0, 35.0, 34.0, 42.0, 36.0, 33.0, 34.0, 30.0, 28.0, 24.0, 12.0, 20.0, 10.0, 16.0, 7.0, 6.0, 9.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.019515991210938, -25.24300193786621, -24.466487884521484, -23.689971923828125, -22.9134578704834, -22.136943817138672, -21.360429763793945, -20.58391571044922, -19.80739974975586, -19.030885696411133, -18.254371643066406, -17.477855682373047, -16.70134162902832, -15.924827575683594, -15.148313522338867, -14.37179946899414, -13.595285415649414, -12.818771362304688, -12.042256355285645, -11.265742301940918, -10.489227294921875, -9.712713241577148, -8.936199188232422, -8.159685134887695, -7.383170127868652, -6.606655597686768, -5.830141067504883, -5.053627014160156, -4.2771124839782715, -3.5005979537963867, -2.72408390045166, -1.9475693702697754, -1.1710529327392578, -0.3945385217666626, 0.3819758892059326, 1.1584901809692383, 1.935004711151123, 2.711519241333008, 3.4880332946777344, 4.264547824859619, 5.041062355041504, 5.817576885223389, 6.594091415405273, 7.37060546875, 8.147119522094727, 8.92363452911377, 9.700148582458496, 10.476663589477539, 11.253177642822266, 12.029691696166992, 12.806206703186035, 13.582720756530762, 14.359235763549805, 15.135749816894531, 15.912263870239258, 16.688777923583984, 17.465293884277344, 18.24180793762207, 19.018321990966797, 19.794837951660156, 20.571352005004883, 21.34786605834961, 22.124380111694336, 22.900894165039062, 23.67740821838379]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 9.0, 5.0, 7.0, 8.0, 18.0, 24.0, 18.0, 39.0, 44.0, 58.0, 71.0, 151.0, 255.0, 559.0, 1875.0, 20526.0, 2794100.0, 1364077.0, 10563.0, 995.0, 335.0, 146.0, 116.0, 61.0, 45.0, 38.0, 34.0, 28.0, 23.0, 13.0, 8.0, 13.0, 10.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.03125, -32.81201171875, -31.5927734375, -30.37353515625, -29.154296875, -27.93505859375, -26.7158203125, -25.49658203125, -24.27734375, -23.05810546875, -21.8388671875, -20.61962890625, -19.400390625, -18.18115234375, -16.9619140625, -15.74267578125, -14.5234375, -13.30419921875, -12.0849609375, -10.86572265625, -9.646484375, -8.42724609375, -7.2080078125, -5.98876953125, -4.76953125, -3.55029296875, -2.3310546875, -1.11181640625, 0.107421875, 1.32666015625, 2.5458984375, 3.76513671875, 4.984375, 6.20361328125, 7.4228515625, 8.64208984375, 9.861328125, 11.08056640625, 12.2998046875, 13.51904296875, 14.73828125, 15.95751953125, 17.1767578125, 18.39599609375, 19.615234375, 20.83447265625, 22.0537109375, 23.27294921875, 24.4921875, 25.71142578125, 26.9306640625, 28.14990234375, 29.369140625, 30.58837890625, 31.8076171875, 33.02685546875, 34.24609375, 35.46533203125, 36.6845703125, 37.90380859375, 39.123046875, 40.34228515625, 41.5615234375, 42.78076171875, 44.0]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 7.0, 8.0, 9.0, 12.0, 17.0, 20.0, 30.0, 34.0, 52.0, 80.0, 68.0, 88.0, 75.0, 77.0, 82.0, 69.0, 67.0, 63.0, 35.0, 32.0, 21.0, 23.0, 19.0, 13.0, 7.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5390625, -10.0836181640625, -9.628173828125, -9.1727294921875, -8.71728515625, -8.2618408203125, -7.806396484375, -7.3509521484375, -6.8955078125, -6.4400634765625, -5.984619140625, -5.5291748046875, -5.07373046875, -4.6182861328125, -4.162841796875, -3.7073974609375, -3.251953125, -2.7965087890625, -2.341064453125, -1.8856201171875, -1.43017578125, -0.9747314453125, -0.519287109375, -0.0638427734375, 0.3916015625, 0.8470458984375, 1.302490234375, 1.7579345703125, 2.21337890625, 2.6688232421875, 3.124267578125, 3.5797119140625, 4.03515625, 4.4906005859375, 4.946044921875, 5.4014892578125, 5.85693359375, 6.3123779296875, 6.767822265625, 7.2232666015625, 7.6787109375, 8.1341552734375, 8.589599609375, 9.0450439453125, 9.50048828125, 9.9559326171875, 10.411376953125, 10.8668212890625, 11.322265625, 11.7777099609375, 12.233154296875, 12.6885986328125, 13.14404296875, 13.5994873046875, 14.054931640625, 14.5103759765625, 14.9658203125, 15.4212646484375, 15.876708984375, 16.3321533203125, 16.78759765625, 17.2430419921875, 17.698486328125, 18.1539306640625, 18.609375]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 4.0, 3.0, 14.0, 18.0, 21.0, 43.0, 94.0, 214.0, 534.0, 1322.0, 6327.0, 286122.0, 3858027.0, 36827.0, 3152.0, 887.0, 341.0, 159.0, 84.0, 40.0, 19.0, 10.0, 8.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-36.1875, -35.03125, -33.875, -32.71875, -31.5625, -30.40625, -29.25, -28.09375, -26.9375, -25.78125, -24.625, -23.46875, -22.3125, -21.15625, -20.0, -18.84375, -17.6875, -16.53125, -15.375, -14.21875, -13.0625, -11.90625, -10.75, -9.59375, -8.4375, -7.28125, -6.125, -4.96875, -3.8125, -2.65625, -1.5, -0.34375, 0.8125, 1.96875, 3.125, 4.28125, 5.4375, 6.59375, 7.75, 8.90625, 10.0625, 11.21875, 12.375, 13.53125, 14.6875, 15.84375, 17.0, 18.15625, 19.3125, 20.46875, 21.625, 22.78125, 23.9375, 25.09375, 26.25, 27.40625, 28.5625, 29.71875, 30.875, 32.03125, 33.1875, 34.34375, 35.5, 36.65625, 37.8125]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 6.0, 7.0, 8.0, 10.0, 33.0, 39.0, 72.0, 172.0, 332.0, 571.0, 990.0, 845.0, 483.0, 241.0, 130.0, 63.0, 36.0, 20.0, 8.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0078125, -8.7557373046875, -8.503662109375, -8.2515869140625, -7.99951171875, -7.7474365234375, -7.495361328125, -7.2432861328125, -6.9912109375, -6.7391357421875, -6.487060546875, -6.2349853515625, -5.98291015625, -5.7308349609375, -5.478759765625, -5.2266845703125, -4.974609375, -4.7225341796875, -4.470458984375, -4.2183837890625, -3.96630859375, -3.7142333984375, -3.462158203125, -3.2100830078125, -2.9580078125, -2.7059326171875, -2.453857421875, -2.2017822265625, -1.94970703125, -1.6976318359375, -1.445556640625, -1.1934814453125, -0.94140625, -0.6893310546875, -0.437255859375, -0.1851806640625, 0.06689453125, 0.3189697265625, 0.571044921875, 0.8231201171875, 1.0751953125, 1.3272705078125, 1.579345703125, 1.8314208984375, 2.08349609375, 2.3355712890625, 2.587646484375, 2.8397216796875, 3.091796875, 3.3438720703125, 3.595947265625, 3.8480224609375, 4.10009765625, 4.3521728515625, 4.604248046875, 4.8563232421875, 5.1083984375, 5.3604736328125, 5.612548828125, 5.8646240234375, 6.11669921875, 6.3687744140625, 6.620849609375, 6.8729248046875, 7.125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 12.0, 28.0, 80.0, 155.0, 187.0, 227.0, 159.0, 93.0, 35.0, 22.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.059226989746094, -50.81850814819336, -49.577789306640625, -48.33707046508789, -47.096351623535156, -45.85563659667969, -44.61491775512695, -43.37419891357422, -42.133480072021484, -40.89276123046875, -39.652042388916016, -38.41132354736328, -37.17060852050781, -35.92988967895508, -34.689170837402344, -33.44845199584961, -32.207733154296875, -30.96701431274414, -29.726295471191406, -28.485578536987305, -27.24485969543457, -26.004140853881836, -24.763423919677734, -23.522705078125, -22.281986236572266, -21.04126739501953, -19.800548553466797, -18.559831619262695, -17.31911277770996, -16.078393936157227, -14.837676048278809, -13.59695816040039, -12.356237411499023, -11.115518569946289, -9.874800682067871, -8.634082794189453, -7.393363952636719, -6.152645587921143, -4.911927223205566, -3.6712093353271484, -2.430490493774414, -1.189772129058838, 0.05094623565673828, 1.2916646003723145, 2.5323829650878906, 3.773101329803467, 5.013819694519043, 6.254537582397461, 7.495256423950195, 8.73597526550293, 9.976693153381348, 11.217411041259766, 12.4581298828125, 13.698848724365234, 14.939566612243652, 16.18028450012207, 17.421003341674805, 18.66172218322754, 19.90243911743164, 21.143157958984375, 22.38387680053711, 23.624595642089844, 24.865314483642578, 26.10603141784668, 27.346750259399414]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 3.0, 5.0, 6.0, 11.0, 12.0, 12.0, 14.0, 11.0, 21.0, 20.0, 27.0, 25.0, 30.0, 35.0, 30.0, 30.0, 57.0, 31.0, 49.0, 50.0, 52.0, 44.0, 48.0, 37.0, 29.0, 43.0, 32.0, 43.0, 24.0, 32.0, 27.0, 18.0, 21.0, 13.0, 9.0, 11.0, 9.0, 7.0, 8.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-10.08928108215332, -9.773820877075195, -9.45836067199707, -9.142901420593262, -8.827441215515137, -8.511981010437012, -8.196520805358887, -7.881060600280762, -7.565600872039795, -7.25014066696167, -6.934680938720703, -6.619220733642578, -6.303760528564453, -5.988300800323486, -5.672840595245361, -5.3573808670043945, -5.0419206619262695, -4.7264604568481445, -4.411000728607178, -4.095540523529053, -3.780080556869507, -3.464620590209961, -3.149160385131836, -2.83370041847229, -2.518240451812744, -2.2027804851531982, -1.8873203992843628, -1.5718603134155273, -1.2564003467559814, -0.9409403800964355, -0.6254802942276001, -0.31002020835876465, 0.00543975830078125, 0.3208997845649719, 0.6363598108291626, 0.9518198370933533, 1.267279863357544, 1.5827398300170898, 1.8981999158859253, 2.2136600017547607, 2.5291199684143066, 2.8445799350738525, 3.1600399017333984, 3.4755001068115234, 3.7909600734710693, 4.106420040130615, 4.42188024520874, 4.737339973449707, 5.052800178527832, 5.368260383605957, 5.683720111846924, 5.999180316925049, 6.314640045166016, 6.630100250244141, 6.945560455322266, 7.261020660400391, 7.576480388641357, 7.891940593719482, 8.20740032196045, 8.522860527038574, 8.8383207321167, 9.153779983520508, 9.469240188598633, 9.784700393676758, 10.100160598754883]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 11.0, 10.0, 13.0, 31.0, 67.0, 96.0, 118.0, 176.0, 360.0, 788.0, 1720.0, 5286.0, 24979.0, 167860.0, 576252.0, 226647.0, 33683.0, 6609.0, 2026.0, 833.0, 371.0, 254.0, 137.0, 76.0, 50.0, 38.0, 21.0, 16.0, 11.0, 5.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.703125, -3.57794189453125, -3.4527587890625, -3.32757568359375, -3.202392578125, -3.07720947265625, -2.9520263671875, -2.82684326171875, -2.70166015625, -2.57647705078125, -2.4512939453125, -2.32611083984375, -2.200927734375, -2.07574462890625, -1.9505615234375, -1.82537841796875, -1.7001953125, -1.57501220703125, -1.4498291015625, -1.32464599609375, -1.199462890625, -1.07427978515625, -0.9490966796875, -0.82391357421875, -0.69873046875, -0.57354736328125, -0.4483642578125, -0.32318115234375, -0.197998046875, -0.07281494140625, 0.0523681640625, 0.17755126953125, 0.302734375, 0.42791748046875, 0.5531005859375, 0.67828369140625, 0.803466796875, 0.92864990234375, 1.0538330078125, 1.17901611328125, 1.30419921875, 1.42938232421875, 1.5545654296875, 1.67974853515625, 1.804931640625, 1.93011474609375, 2.0552978515625, 2.18048095703125, 2.3056640625, 2.43084716796875, 2.5560302734375, 2.68121337890625, 2.806396484375, 2.93157958984375, 3.0567626953125, 3.18194580078125, 3.30712890625, 3.43231201171875, 3.5574951171875, 3.68267822265625, 3.807861328125, 3.93304443359375, 4.0582275390625, 4.18341064453125, 4.30859375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 10.0, 6.0, 8.0, 8.0, 11.0, 13.0, 15.0, 20.0, 32.0, 41.0, 48.0, 53.0, 57.0, 50.0, 50.0, 57.0, 77.0, 76.0, 54.0, 55.0, 48.0, 49.0, 52.0, 20.0, 24.0, 19.0, 22.0, 14.0, 9.0, 6.0, 2.0, 6.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.84375, -13.521728515625, -13.19970703125, -12.877685546875, -12.5556640625, -12.233642578125, -11.91162109375, -11.589599609375, -11.267578125, -10.945556640625, -10.62353515625, -10.301513671875, -9.9794921875, -9.657470703125, -9.33544921875, -9.013427734375, -8.69140625, -8.369384765625, -8.04736328125, -7.725341796875, -7.4033203125, -7.081298828125, -6.75927734375, -6.437255859375, -6.115234375, -5.793212890625, -5.47119140625, -5.149169921875, -4.8271484375, -4.505126953125, -4.18310546875, -3.861083984375, -3.5390625, -3.217041015625, -2.89501953125, -2.572998046875, -2.2509765625, -1.928955078125, -1.60693359375, -1.284912109375, -0.962890625, -0.640869140625, -0.31884765625, 0.003173828125, 0.3251953125, 0.647216796875, 0.96923828125, 1.291259765625, 1.61328125, 1.935302734375, 2.25732421875, 2.579345703125, 2.9013671875, 3.223388671875, 3.54541015625, 3.867431640625, 4.189453125, 4.511474609375, 4.83349609375, 5.155517578125, 5.4775390625, 5.799560546875, 6.12158203125, 6.443603515625, 6.765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 7.0, 9.0, 14.0, 15.0, 27.0, 41.0, 69.0, 94.0, 155.0, 219.0, 328.0, 492.0, 714.0, 1281.0, 1863.0, 3039.0, 4729.0, 7409.0, 12112.0, 18968.0, 29905.0, 47164.0, 72808.0, 106887.0, 143119.0, 160041.0, 139968.0, 103104.0, 69505.0, 45409.0, 29006.0, 18425.0, 11599.0, 7389.0, 4632.0, 2857.0, 1879.0, 1166.0, 731.0, 440.0, 293.0, 221.0, 140.0, 97.0, 56.0, 43.0, 29.0, 19.0, 10.0, 10.0, 11.0, 4.0, 1.0, 4.0], "bins": [-0.86572265625, -0.84130859375, -0.81689453125, -0.79248046875, -0.76806640625, -0.74365234375, -0.71923828125, -0.69482421875, -0.67041015625, -0.64599609375, -0.62158203125, -0.59716796875, -0.57275390625, -0.54833984375, -0.52392578125, -0.49951171875, -0.47509765625, -0.45068359375, -0.42626953125, -0.40185546875, -0.37744140625, -0.35302734375, -0.32861328125, -0.30419921875, -0.27978515625, -0.25537109375, -0.23095703125, -0.20654296875, -0.18212890625, -0.15771484375, -0.13330078125, -0.10888671875, -0.08447265625, -0.06005859375, -0.03564453125, -0.01123046875, 0.01318359375, 0.03759765625, 0.06201171875, 0.08642578125, 0.11083984375, 0.13525390625, 0.15966796875, 0.18408203125, 0.20849609375, 0.23291015625, 0.25732421875, 0.28173828125, 0.30615234375, 0.33056640625, 0.35498046875, 0.37939453125, 0.40380859375, 0.42822265625, 0.45263671875, 0.47705078125, 0.50146484375, 0.52587890625, 0.55029296875, 0.57470703125, 0.59912109375, 0.62353515625, 0.64794921875, 0.67236328125, 0.69677734375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 3.0, 13.0, 8.0, 11.0, 12.0, 23.0, 11.0, 19.0, 21.0, 16.0, 22.0, 32.0, 31.0, 32.0, 36.0, 48.0, 39.0, 43.0, 51.0, 49.0, 51.0, 51.0, 49.0, 48.0, 35.0, 29.0, 18.0, 32.0, 19.0, 31.0, 17.0, 14.0, 17.0, 11.0, 7.0, 14.0, 10.0, 6.0, 3.0, 3.0, 4.0, 5.0, 2.0, 5.0, 0.0, 3.0, 1.0], "bins": [-16.96875, -16.5023193359375, -16.035888671875, -15.5694580078125, -15.10302734375, -14.6365966796875, -14.170166015625, -13.7037353515625, -13.2373046875, -12.7708740234375, -12.304443359375, -11.8380126953125, -11.37158203125, -10.9051513671875, -10.438720703125, -9.9722900390625, -9.505859375, -9.0394287109375, -8.572998046875, -8.1065673828125, -7.64013671875, -7.1737060546875, -6.707275390625, -6.2408447265625, -5.7744140625, -5.3079833984375, -4.841552734375, -4.3751220703125, -3.90869140625, -3.4422607421875, -2.975830078125, -2.5093994140625, -2.04296875, -1.5765380859375, -1.110107421875, -0.6436767578125, -0.17724609375, 0.2891845703125, 0.755615234375, 1.2220458984375, 1.6884765625, 2.1549072265625, 2.621337890625, 3.0877685546875, 3.55419921875, 4.0206298828125, 4.487060546875, 4.9534912109375, 5.419921875, 5.8863525390625, 6.352783203125, 6.8192138671875, 7.28564453125, 7.7520751953125, 8.218505859375, 8.6849365234375, 9.1513671875, 9.6177978515625, 10.084228515625, 10.5506591796875, 11.01708984375, 11.4835205078125, 11.949951171875, 12.4163818359375, 12.8828125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 2.0, 12.0, 10.0, 22.0, 54.0, 59.0, 99.0, 179.0, 326.0, 572.0, 1274.0, 2789.0, 8468.0, 33722.0, 175700.0, 548097.0, 219619.0, 41372.0, 10089.0, 3276.0, 1347.0, 640.0, 354.0, 199.0, 112.0, 57.0, 36.0, 29.0, 14.0, 7.0, 4.0, 2.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.252685546875, -0.24351882934570312, -0.23435211181640625, -0.22518539428710938, -0.2160186767578125, -0.20685195922851562, -0.19768524169921875, -0.18851852416992188, -0.179351806640625, -0.17018508911132812, -0.16101837158203125, -0.15185165405273438, -0.1426849365234375, -0.13351821899414062, -0.12435150146484375, -0.11518478393554688, -0.10601806640625, -0.09685134887695312, -0.08768463134765625, -0.07851791381835938, -0.0693511962890625, -0.060184478759765625, -0.05101776123046875, -0.041851043701171875, -0.032684326171875, -0.023517608642578125, -0.01435089111328125, -0.005184173583984375, 0.0039825439453125, 0.013149261474609375, 0.02231597900390625, 0.031482696533203125, 0.0406494140625, 0.049816131591796875, 0.05898284912109375, 0.06814956665039062, 0.0773162841796875, 0.08648300170898438, 0.09564971923828125, 0.10481643676757812, 0.113983154296875, 0.12314987182617188, 0.13231658935546875, 0.14148330688476562, 0.1506500244140625, 0.15981674194335938, 0.16898345947265625, 0.17815017700195312, 0.18731689453125, 0.19648361206054688, 0.20565032958984375, 0.21481704711914062, 0.2239837646484375, 0.23315048217773438, 0.24231719970703125, 0.2514839172363281, 0.260650634765625, 0.2698173522949219, 0.27898406982421875, 0.2881507873535156, 0.2973175048828125, 0.3064842224121094, 0.31565093994140625, 0.3248176574707031, 0.333984375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 5.0, 2.0, 7.0, 10.0, 19.0, 12.0, 33.0, 37.0, 58.0, 85.0, 67.0, 108.0, 88.0, 91.0, 95.0, 72.0, 63.0, 36.0, 34.0, 27.0, 12.0, 14.0, 6.0, 9.0, 5.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016033649444580078, -0.00015495717525482178, -0.00014957785606384277, -0.00014419853687286377, -0.00013881921768188477, -0.00013343989849090576, -0.00012806057929992676, -0.00012268126010894775, -0.00011730194091796875, -0.00011192262172698975, -0.00010654330253601074, -0.00010116398334503174, -9.578466415405273e-05, -9.040534496307373e-05, -8.502602577209473e-05, -7.964670658111572e-05, -7.426738739013672e-05, -6.888806819915771e-05, -6.350874900817871e-05, -5.812942981719971e-05, -5.27501106262207e-05, -4.73707914352417e-05, -4.1991472244262695e-05, -3.661215305328369e-05, -3.123283386230469e-05, -2.5853514671325684e-05, -2.047419548034668e-05, -1.5094876289367676e-05, -9.715557098388672e-06, -4.336237907409668e-06, 1.043081283569336e-06, 6.42240047454834e-06, 1.1801719665527344e-05, 1.7181038856506348e-05, 2.256035804748535e-05, 2.7939677238464355e-05, 3.331899642944336e-05, 3.869831562042236e-05, 4.407763481140137e-05, 4.945695400238037e-05, 5.4836273193359375e-05, 6.021559238433838e-05, 6.559491157531738e-05, 7.097423076629639e-05, 7.635354995727539e-05, 8.17328691482544e-05, 8.71121883392334e-05, 9.24915075302124e-05, 9.78708267211914e-05, 0.00010325014591217041, 0.00010862946510314941, 0.00011400878429412842, 0.00011938810348510742, 0.00012476742267608643, 0.00013014674186706543, 0.00013552606105804443, 0.00014090538024902344, 0.00014628469944000244, 0.00015166401863098145, 0.00015704333782196045, 0.00016242265701293945, 0.00016780197620391846, 0.00017318129539489746, 0.00017856061458587646, 0.00018393993377685547]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 0.0, 2.0, 1.0, 4.0, 4.0, 7.0, 9.0, 17.0, 15.0, 22.0, 21.0, 50.0, 57.0, 107.0, 157.0, 304.0, 496.0, 892.0, 1838.0, 3844.0, 8647.0, 23090.0, 77435.0, 298330.0, 438150.0, 134750.0, 37194.0, 12718.0, 5117.0, 2462.0, 1205.0, 656.0, 348.0, 235.0, 116.0, 61.0, 55.0, 30.0, 23.0, 15.0, 14.0, 15.0, 11.0, 5.0, 11.0, 6.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.261962890625, -0.2540740966796875, -0.246185302734375, -0.2382965087890625, -0.23040771484375, -0.2225189208984375, -0.214630126953125, -0.2067413330078125, -0.1988525390625, -0.1909637451171875, -0.183074951171875, -0.1751861572265625, -0.16729736328125, -0.1594085693359375, -0.151519775390625, -0.1436309814453125, -0.1357421875, -0.1278533935546875, -0.119964599609375, -0.1120758056640625, -0.10418701171875, -0.0962982177734375, -0.088409423828125, -0.0805206298828125, -0.0726318359375, -0.0647430419921875, -0.056854248046875, -0.0489654541015625, -0.04107666015625, -0.0331878662109375, -0.025299072265625, -0.0174102783203125, -0.009521484375, -0.0016326904296875, 0.006256103515625, 0.0141448974609375, 0.02203369140625, 0.0299224853515625, 0.037811279296875, 0.0457000732421875, 0.0535888671875, 0.0614776611328125, 0.069366455078125, 0.0772552490234375, 0.08514404296875, 0.0930328369140625, 0.100921630859375, 0.1088104248046875, 0.11669921875, 0.1245880126953125, 0.132476806640625, 0.1403656005859375, 0.14825439453125, 0.1561431884765625, 0.164031982421875, 0.1719207763671875, 0.1798095703125, 0.1876983642578125, 0.195587158203125, 0.2034759521484375, 0.21136474609375, 0.2192535400390625, 0.227142333984375, 0.2350311279296875, 0.242919921875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 5.0, 4.0, 7.0, 12.0, 9.0, 13.0, 27.0, 22.0, 19.0, 36.0, 52.0, 66.0, 59.0, 82.0, 89.0, 89.0, 77.0, 57.0, 52.0, 53.0, 44.0, 22.0, 25.0, 15.0, 16.0, 11.0, 6.0, 9.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.08331298828125, -0.08098888397216797, -0.07866477966308594, -0.0763406753540039, -0.07401657104492188, -0.07169246673583984, -0.06936836242675781, -0.06704425811767578, -0.06472015380859375, -0.06239604949951172, -0.06007194519042969, -0.057747840881347656, -0.055423736572265625, -0.053099632263183594, -0.05077552795410156, -0.04845142364501953, -0.0461273193359375, -0.04380321502685547, -0.04147911071777344, -0.039155006408691406, -0.036830902099609375, -0.034506797790527344, -0.03218269348144531, -0.02985858917236328, -0.02753448486328125, -0.02521038055419922, -0.022886276245117188, -0.020562171936035156, -0.018238067626953125, -0.015913963317871094, -0.013589859008789062, -0.011265754699707031, -0.008941650390625, -0.006617546081542969, -0.0042934417724609375, -0.0019693374633789062, 0.000354766845703125, 0.0026788711547851562, 0.0050029754638671875, 0.007327079772949219, 0.00965118408203125, 0.011975288391113281, 0.014299392700195312, 0.016623497009277344, 0.018947601318359375, 0.021271705627441406, 0.023595809936523438, 0.02591991424560547, 0.0282440185546875, 0.03056812286376953, 0.03289222717285156, 0.035216331481933594, 0.037540435791015625, 0.039864540100097656, 0.04218864440917969, 0.04451274871826172, 0.04683685302734375, 0.04916095733642578, 0.05148506164550781, 0.053809165954589844, 0.056133270263671875, 0.058457374572753906, 0.06078147888183594, 0.06310558319091797, 0.0654296875]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 7.0, 27.0, 198.0, 417.0, 306.0, 54.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.3003158569336, -88.51630401611328, -86.7322998046875, -84.94828796386719, -83.16427612304688, -81.3802719116211, -79.59626007080078, -77.812255859375, -76.02824401855469, -74.24423217773438, -72.4602279663086, -70.67621612548828, -68.89220428466797, -67.10820007324219, -65.32418823242188, -63.54018020629883, -61.75617218017578, -59.972164154052734, -58.18815231323242, -56.404144287109375, -54.62013626098633, -52.83612823486328, -51.05211639404297, -49.26810836791992, -47.48409652709961, -45.70008850097656, -43.91607666015625, -42.1320686340332, -40.348060607910156, -38.564048767089844, -36.7800407409668, -34.99603271484375, -33.2120246887207, -31.428014755249023, -29.644006729125977, -27.859996795654297, -26.07598876953125, -24.29197883605957, -22.50796890258789, -20.723960876464844, -18.939952850341797, -17.155942916870117, -15.37193489074707, -13.58792495727539, -11.803916931152344, -10.019906997680664, -8.2358980178833, -6.4518890380859375, -4.667879104614258, -2.8838701248168945, -1.0998609066009521, 0.6841483116149902, 2.4681572914123535, 4.252166748046875, 6.036175727844238, 7.820184707641602, 9.604193687438965, 11.388202667236328, 13.172211647033691, 14.956220626831055, 16.740230560302734, 18.52423858642578, 20.30824851989746, 22.09225845336914, 23.876266479492188]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 6.0, 9.0, 9.0, 20.0, 27.0, 14.0, 39.0, 29.0, 46.0, 47.0, 50.0, 66.0, 64.0, 87.0, 56.0, 70.0, 46.0, 66.0, 48.0, 49.0, 39.0, 23.0, 30.0, 18.0, 12.0, 11.0, 6.0, 8.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.433939933776855, -12.113565444946289, -11.793191909790039, -11.472817420959473, -11.152442932128906, -10.83206844329834, -10.511693954467773, -10.191320419311523, -9.870945930480957, -9.55057144165039, -9.23019790649414, -8.909823417663574, -8.589448928833008, -8.269074440002441, -7.948700428009033, -7.628326416015625, -7.307951927185059, -6.987577438354492, -6.667203426361084, -6.346829414367676, -6.026454925537109, -5.706080436706543, -5.385706424713135, -5.065332412719727, -4.74495792388916, -4.424583435058594, -4.1042094230651855, -3.7838351726531982, -3.463460922241211, -3.1430866718292236, -2.8227124214172363, -2.502338171005249, -2.1819639205932617, -1.8615896701812744, -1.541215419769287, -1.2208411693572998, -0.9004669189453125, -0.5800926685333252, -0.2597184181213379, 0.060655832290649414, 0.3810300827026367, 0.701404333114624, 1.0217785835266113, 1.3421528339385986, 1.662527084350586, 1.9829013347625732, 2.3032755851745605, 2.623649835586548, 2.944024085998535, 3.2643983364105225, 3.5847725868225098, 3.905146837234497, 4.225521087646484, 4.545895576477051, 4.866269588470459, 5.186643600463867, 5.507018089294434, 5.827392578125, 6.147766590118408, 6.468140602111816, 6.788515090942383, 7.108889579772949, 7.429263591766357, 7.749637603759766, 8.070012092590332]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 2.0, 6.0, 5.0, 5.0, 8.0, 12.0, 20.0, 25.0, 32.0, 76.0, 123.0, 216.0, 465.0, 1142.0, 4305.0, 18892.0, 111682.0, 677610.0, 195790.0, 29140.0, 6285.0, 1613.0, 535.0, 243.0, 138.0, 70.0, 47.0, 25.0, 16.0, 11.0, 7.0, 3.0, 8.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.1640625, -14.6846923828125, -14.205322265625, -13.7259521484375, -13.24658203125, -12.7672119140625, -12.287841796875, -11.8084716796875, -11.3291015625, -10.8497314453125, -10.370361328125, -9.8909912109375, -9.41162109375, -8.9322509765625, -8.452880859375, -7.9735107421875, -7.494140625, -7.0147705078125, -6.535400390625, -6.0560302734375, -5.57666015625, -5.0972900390625, -4.617919921875, -4.1385498046875, -3.6591796875, -3.1798095703125, -2.700439453125, -2.2210693359375, -1.74169921875, -1.2623291015625, -0.782958984375, -0.3035888671875, 0.17578125, 0.6551513671875, 1.134521484375, 1.6138916015625, 2.09326171875, 2.5726318359375, 3.052001953125, 3.5313720703125, 4.0107421875, 4.4901123046875, 4.969482421875, 5.4488525390625, 5.92822265625, 6.4075927734375, 6.886962890625, 7.3663330078125, 7.845703125, 8.3250732421875, 8.804443359375, 9.2838134765625, 9.76318359375, 10.2425537109375, 10.721923828125, 11.2012939453125, 11.6806640625, 12.1600341796875, 12.639404296875, 13.1187744140625, 13.59814453125, 14.0775146484375, 14.556884765625, 15.0362548828125, 15.515625]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 9.0, 10.0, 9.0, 14.0, 14.0, 26.0, 28.0, 24.0, 37.0, 32.0, 43.0, 47.0, 50.0, 71.0, 63.0, 49.0, 59.0, 58.0, 53.0, 54.0, 51.0, 36.0, 38.0, 24.0, 23.0, 22.0, 15.0, 4.0, 10.0, 7.0, 7.0, 2.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.078125, -15.5791015625, -15.080078125, -14.5810546875, -14.08203125, -13.5830078125, -13.083984375, -12.5849609375, -12.0859375, -11.5869140625, -11.087890625, -10.5888671875, -10.08984375, -9.5908203125, -9.091796875, -8.5927734375, -8.09375, -7.5947265625, -7.095703125, -6.5966796875, -6.09765625, -5.5986328125, -5.099609375, -4.6005859375, -4.1015625, -3.6025390625, -3.103515625, -2.6044921875, -2.10546875, -1.6064453125, -1.107421875, -0.6083984375, -0.109375, 0.3896484375, 0.888671875, 1.3876953125, 1.88671875, 2.3857421875, 2.884765625, 3.3837890625, 3.8828125, 4.3818359375, 4.880859375, 5.3798828125, 5.87890625, 6.3779296875, 6.876953125, 7.3759765625, 7.875, 8.3740234375, 8.873046875, 9.3720703125, 9.87109375, 10.3701171875, 10.869140625, 11.3681640625, 11.8671875, 12.3662109375, 12.865234375, 13.3642578125, 13.86328125, 14.3623046875, 14.861328125, 15.3603515625, 15.859375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 8.0, 8.0, 8.0, 6.0, 10.0, 12.0, 17.0, 30.0, 44.0, 66.0, 79.0, 167.0, 240.0, 587.0, 3256.0, 85110.0, 920571.0, 35225.0, 1972.0, 503.0, 225.0, 138.0, 80.0, 59.0, 35.0, 18.0, 19.0, 12.0, 9.0, 12.0, 11.0, 6.0, 4.0, 4.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.875, -31.85986328125, -30.8447265625, -29.82958984375, -28.814453125, -27.79931640625, -26.7841796875, -25.76904296875, -24.75390625, -23.73876953125, -22.7236328125, -21.70849609375, -20.693359375, -19.67822265625, -18.6630859375, -17.64794921875, -16.6328125, -15.61767578125, -14.6025390625, -13.58740234375, -12.572265625, -11.55712890625, -10.5419921875, -9.52685546875, -8.51171875, -7.49658203125, -6.4814453125, -5.46630859375, -4.451171875, -3.43603515625, -2.4208984375, -1.40576171875, -0.390625, 0.62451171875, 1.6396484375, 2.65478515625, 3.669921875, 4.68505859375, 5.7001953125, 6.71533203125, 7.73046875, 8.74560546875, 9.7607421875, 10.77587890625, 11.791015625, 12.80615234375, 13.8212890625, 14.83642578125, 15.8515625, 16.86669921875, 17.8818359375, 18.89697265625, 19.912109375, 20.92724609375, 21.9423828125, 22.95751953125, 23.97265625, 24.98779296875, 26.0029296875, 27.01806640625, 28.033203125, 29.04833984375, 30.0634765625, 31.07861328125, 32.09375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 5.0, 2.0, 10.0, 9.0, 13.0, 8.0, 20.0, 19.0, 30.0, 35.0, 48.0, 49.0, 61.0, 53.0, 43.0, 64.0, 79.0, 72.0, 63.0, 58.0, 43.0, 39.0, 43.0, 25.0, 20.0, 23.0, 16.0, 14.0, 5.0, 11.0, 9.0, 4.0, 3.0, 5.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.171875, -20.48828125, -19.8046875, -19.12109375, -18.4375, -17.75390625, -17.0703125, -16.38671875, -15.703125, -15.01953125, -14.3359375, -13.65234375, -12.96875, -12.28515625, -11.6015625, -10.91796875, -10.234375, -9.55078125, -8.8671875, -8.18359375, -7.5, -6.81640625, -6.1328125, -5.44921875, -4.765625, -4.08203125, -3.3984375, -2.71484375, -2.03125, -1.34765625, -0.6640625, 0.01953125, 0.703125, 1.38671875, 2.0703125, 2.75390625, 3.4375, 4.12109375, 4.8046875, 5.48828125, 6.171875, 6.85546875, 7.5390625, 8.22265625, 8.90625, 9.58984375, 10.2734375, 10.95703125, 11.640625, 12.32421875, 13.0078125, 13.69140625, 14.375, 15.05859375, 15.7421875, 16.42578125, 17.109375, 17.79296875, 18.4765625, 19.16015625, 19.84375, 20.52734375, 21.2109375, 21.89453125, 22.578125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 5.0, 2.0, 9.0, 8.0, 12.0, 17.0, 57.0, 215.0, 1418.0, 37963.0, 1003525.0, 4566.0, 551.0, 108.0, 31.0, 21.0, 9.0, 13.0, 9.0, 3.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.234375, -21.5234375, -20.8125, -20.1015625, -19.390625, -18.6796875, -17.96875, -17.2578125, -16.546875, -15.8359375, -15.125, -14.4140625, -13.703125, -12.9921875, -12.28125, -11.5703125, -10.859375, -10.1484375, -9.4375, -8.7265625, -8.015625, -7.3046875, -6.59375, -5.8828125, -5.171875, -4.4609375, -3.75, -3.0390625, -2.328125, -1.6171875, -0.90625, -0.1953125, 0.515625, 1.2265625, 1.9375, 2.6484375, 3.359375, 4.0703125, 4.78125, 5.4921875, 6.203125, 6.9140625, 7.625, 8.3359375, 9.046875, 9.7578125, 10.46875, 11.1796875, 11.890625, 12.6015625, 13.3125, 14.0234375, 14.734375, 15.4453125, 16.15625, 16.8671875, 17.578125, 18.2890625, 19.0, 19.7109375, 20.421875, 21.1328125, 21.84375, 22.5546875, 23.265625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 9.0, 4.0, 5.0, 5.0, 15.0, 20.0, 24.0, 29.0, 40.0, 72.0, 106.0, 161.0, 175.0, 108.0, 81.0, 51.0, 30.0, 16.0, 17.0, 12.0, 6.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007991790771484375, -0.0007707476615905762, -0.0007423162460327148, -0.0007138848304748535, -0.0006854534149169922, -0.0006570219993591309, -0.0006285905838012695, -0.0006001591682434082, -0.0005717277526855469, -0.0005432963371276855, -0.0005148649215698242, -0.0004864335060119629, -0.00045800209045410156, -0.00042957067489624023, -0.0004011392593383789, -0.0003727078437805176, -0.00034427642822265625, -0.0003158450126647949, -0.0002874135971069336, -0.00025898218154907227, -0.00023055076599121094, -0.0002021193504333496, -0.00017368793487548828, -0.00014525651931762695, -0.00011682510375976562, -8.83936882019043e-05, -5.996227264404297e-05, -3.153085708618164e-05, -3.0994415283203125e-06, 2.5331974029541016e-05, 5.3763389587402344e-05, 8.219480514526367e-05, 0.000110626220703125, 0.00013905763626098633, 0.00016748905181884766, 0.00019592046737670898, 0.0002243518829345703, 0.00025278329849243164, 0.00028121471405029297, 0.0003096461296081543, 0.0003380775451660156, 0.00036650896072387695, 0.0003949403762817383, 0.0004233717918395996, 0.00045180320739746094, 0.00048023462295532227, 0.0005086660385131836, 0.0005370974540710449, 0.0005655288696289062, 0.0005939602851867676, 0.0006223917007446289, 0.0006508231163024902, 0.0006792545318603516, 0.0007076859474182129, 0.0007361173629760742, 0.0007645487785339355, 0.0007929801940917969, 0.0008214116096496582, 0.0008498430252075195, 0.0008782744407653809, 0.0009067058563232422, 0.0009351372718811035, 0.0009635686874389648, 0.0009920001029968262, 0.0010204315185546875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 8.0, 5.0, 9.0, 11.0, 9.0, 32.0, 52.0, 80.0, 144.0, 349.0, 743.0, 2132.0, 12198.0, 367641.0, 644158.0, 16774.0, 2559.0, 881.0, 368.0, 164.0, 88.0, 53.0, 34.0, 18.0, 13.0, 10.0, 6.0, 2.0, 0.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-12.8984375, -12.5682373046875, -12.238037109375, -11.9078369140625, -11.57763671875, -11.2474365234375, -10.917236328125, -10.5870361328125, -10.2568359375, -9.9266357421875, -9.596435546875, -9.2662353515625, -8.93603515625, -8.6058349609375, -8.275634765625, -7.9454345703125, -7.615234375, -7.2850341796875, -6.954833984375, -6.6246337890625, -6.29443359375, -5.9642333984375, -5.634033203125, -5.3038330078125, -4.9736328125, -4.6434326171875, -4.313232421875, -3.9830322265625, -3.65283203125, -3.3226318359375, -2.992431640625, -2.6622314453125, -2.33203125, -2.0018310546875, -1.671630859375, -1.3414306640625, -1.01123046875, -0.6810302734375, -0.350830078125, -0.0206298828125, 0.3095703125, 0.6397705078125, 0.969970703125, 1.3001708984375, 1.63037109375, 1.9605712890625, 2.290771484375, 2.6209716796875, 2.951171875, 3.2813720703125, 3.611572265625, 3.9417724609375, 4.27197265625, 4.6021728515625, 4.932373046875, 5.2625732421875, 5.5927734375, 5.9229736328125, 6.253173828125, 6.5833740234375, 6.91357421875, 7.2437744140625, 7.573974609375, 7.9041748046875, 8.234375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 6.0, 9.0, 12.0, 32.0, 30.0, 50.0, 53.0, 105.0, 148.0, 189.0, 133.0, 67.0, 45.0, 33.0, 19.0, 14.0, 11.0, 12.0, 5.0, 6.0, 3.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4296875, -2.3253173828125, -2.220947265625, -2.1165771484375, -2.01220703125, -1.9078369140625, -1.803466796875, -1.6990966796875, -1.5947265625, -1.4903564453125, -1.385986328125, -1.2816162109375, -1.17724609375, -1.0728759765625, -0.968505859375, -0.8641357421875, -0.759765625, -0.6553955078125, -0.551025390625, -0.4466552734375, -0.34228515625, -0.2379150390625, -0.133544921875, -0.0291748046875, 0.0751953125, 0.1795654296875, 0.283935546875, 0.3883056640625, 0.49267578125, 0.5970458984375, 0.701416015625, 0.8057861328125, 0.91015625, 1.0145263671875, 1.118896484375, 1.2232666015625, 1.32763671875, 1.4320068359375, 1.536376953125, 1.6407470703125, 1.7451171875, 1.8494873046875, 1.953857421875, 2.0582275390625, 2.16259765625, 2.2669677734375, 2.371337890625, 2.4757080078125, 2.580078125, 2.6844482421875, 2.788818359375, 2.8931884765625, 2.99755859375, 3.1019287109375, 3.206298828125, 3.3106689453125, 3.4150390625, 3.5194091796875, 3.623779296875, 3.7281494140625, 3.83251953125, 3.9368896484375, 4.041259765625, 4.1456298828125, 4.25]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 27.0, 47.0, 111.0, 172.0, 208.0, 180.0, 147.0, 58.0, 27.0, 19.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.11149597167969, -42.56704330444336, -41.02259063720703, -39.4781379699707, -37.933685302734375, -36.38923263549805, -34.84477996826172, -33.300323486328125, -31.75587272644043, -30.2114200592041, -28.666967391967773, -27.122512817382812, -25.578060150146484, -24.033607482910156, -22.489154815673828, -20.9447021484375, -19.400249481201172, -17.855796813964844, -16.311344146728516, -14.766890525817871, -13.222437858581543, -11.677985191345215, -10.13353157043457, -8.589078903198242, -7.044626235961914, -5.500173568725586, -3.9557204246520996, -2.4112672805786133, -0.8668146133422852, 0.677638053894043, 2.2220916748046875, 3.7665443420410156, 5.311000823974609, 6.8554534912109375, 8.399906158447266, 9.94435977935791, 11.488812446594238, 13.033265113830566, 14.577718734741211, 16.12217140197754, 17.666624069213867, 19.211076736450195, 20.755529403686523, 22.299983978271484, 23.844436645507812, 25.38888931274414, 26.93334197998047, 28.477794647216797, 30.022247314453125, 31.566699981689453, 33.11115264892578, 34.65560531616211, 36.20005798339844, 37.744510650634766, 39.288963317871094, 40.83341979980469, 42.37786865234375, 43.92232131958008, 45.466773986816406, 47.011226654052734, 48.55567932128906, 50.10013198852539, 51.64458465576172, 53.18904113769531, 54.73349380493164]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 6.0, 7.0, 9.0, 9.0, 12.0, 15.0, 14.0, 23.0, 26.0, 25.0, 37.0, 40.0, 43.0, 48.0, 44.0, 50.0, 45.0, 47.0, 56.0, 50.0, 49.0, 48.0, 39.0, 38.0, 49.0, 36.0, 20.0, 25.0, 18.0, 16.0, 14.0, 11.0, 9.0, 6.0, 7.0, 7.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.621726989746094, -29.739402770996094, -28.85707664489746, -27.97475242614746, -27.092426300048828, -26.210102081298828, -25.327777862548828, -24.445453643798828, -23.563127517700195, -22.680803298950195, -21.798477172851562, -20.916152954101562, -20.033828735351562, -19.15150260925293, -18.26917839050293, -17.386852264404297, -16.504528045654297, -15.62220287322998, -14.739877700805664, -13.857553482055664, -12.975228309631348, -12.092903137207031, -11.210578918457031, -10.328253746032715, -9.445928573608398, -8.563603401184082, -7.681278705596924, -6.798954010009766, -5.916628837585449, -5.034303665161133, -4.151978969573975, -3.2696542739868164, -2.387327194213867, -1.5050022602081299, -0.6226773262023926, 0.2596476078033447, 1.141972541809082, 2.0242977142333984, 2.9066224098205566, 3.788947105407715, 4.671272277832031, 5.553597450256348, 6.435922145843506, 7.318246841430664, 8.20057201385498, 9.082897186279297, 9.965221405029297, 10.847546577453613, 11.72987174987793, 12.612196922302246, 13.494522094726562, 14.376846313476562, 15.259171485900879, 16.141496658325195, 17.023820877075195, 17.906147003173828, 18.788471221923828, 19.670795440673828, 20.55312156677246, 21.43544578552246, 22.317771911621094, 23.200096130371094, 24.082420349121094, 24.964744567871094, 25.847070693969727]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 4.0, 7.0, 11.0, 10.0, 21.0, 32.0, 59.0, 98.0, 217.0, 437.0, 1256.0, 7076.0, 137452.0, 3338752.0, 685865.0, 19926.0, 2043.0, 532.0, 201.0, 125.0, 71.0, 31.0, 15.0, 12.0, 4.0, 4.0, 1.0, 11.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.25, -29.42578125, -28.6015625, -27.77734375, -26.953125, -26.12890625, -25.3046875, -24.48046875, -23.65625, -22.83203125, -22.0078125, -21.18359375, -20.359375, -19.53515625, -18.7109375, -17.88671875, -17.0625, -16.23828125, -15.4140625, -14.58984375, -13.765625, -12.94140625, -12.1171875, -11.29296875, -10.46875, -9.64453125, -8.8203125, -7.99609375, -7.171875, -6.34765625, -5.5234375, -4.69921875, -3.875, -3.05078125, -2.2265625, -1.40234375, -0.578125, 0.24609375, 1.0703125, 1.89453125, 2.71875, 3.54296875, 4.3671875, 5.19140625, 6.015625, 6.83984375, 7.6640625, 8.48828125, 9.3125, 10.13671875, 10.9609375, 11.78515625, 12.609375, 13.43359375, 14.2578125, 15.08203125, 15.90625, 16.73046875, 17.5546875, 18.37890625, 19.203125, 20.02734375, 20.8515625, 21.67578125, 22.5]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 7.0, 13.0, 12.0, 19.0, 16.0, 25.0, 26.0, 38.0, 35.0, 47.0, 45.0, 38.0, 49.0, 67.0, 51.0, 62.0, 53.0, 46.0, 61.0, 46.0, 31.0, 31.0, 29.0, 28.0, 32.0, 23.0, 11.0, 13.0, 16.0, 4.0, 8.0, 5.0, 6.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.28125, -8.9915771484375, -8.701904296875, -8.4122314453125, -8.12255859375, -7.8328857421875, -7.543212890625, -7.2535400390625, -6.9638671875, -6.6741943359375, -6.384521484375, -6.0948486328125, -5.80517578125, -5.5155029296875, -5.225830078125, -4.9361572265625, -4.646484375, -4.3568115234375, -4.067138671875, -3.7774658203125, -3.48779296875, -3.1981201171875, -2.908447265625, -2.6187744140625, -2.3291015625, -2.0394287109375, -1.749755859375, -1.4600830078125, -1.17041015625, -0.8807373046875, -0.591064453125, -0.3013916015625, -0.01171875, 0.2779541015625, 0.567626953125, 0.8572998046875, 1.14697265625, 1.4366455078125, 1.726318359375, 2.0159912109375, 2.3056640625, 2.5953369140625, 2.885009765625, 3.1746826171875, 3.46435546875, 3.7540283203125, 4.043701171875, 4.3333740234375, 4.623046875, 4.9127197265625, 5.202392578125, 5.4920654296875, 5.78173828125, 6.0714111328125, 6.361083984375, 6.6507568359375, 6.9404296875, 7.2301025390625, 7.519775390625, 7.8094482421875, 8.09912109375, 8.3887939453125, 8.678466796875, 8.9681396484375, 9.2578125]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 10.0, 9.0, 24.0, 36.0, 78.0, 222.0, 627.0, 2879.0, 103536.0, 4061725.0, 22581.0, 1754.0, 508.0, 153.0, 63.0, 27.0, 20.0, 10.0, 8.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-64.4375, -62.91650390625, -61.3955078125, -59.87451171875, -58.353515625, -56.83251953125, -55.3115234375, -53.79052734375, -52.26953125, -50.74853515625, -49.2275390625, -47.70654296875, -46.185546875, -44.66455078125, -43.1435546875, -41.62255859375, -40.1015625, -38.58056640625, -37.0595703125, -35.53857421875, -34.017578125, -32.49658203125, -30.9755859375, -29.45458984375, -27.93359375, -26.41259765625, -24.8916015625, -23.37060546875, -21.849609375, -20.32861328125, -18.8076171875, -17.28662109375, -15.765625, -14.24462890625, -12.7236328125, -11.20263671875, -9.681640625, -8.16064453125, -6.6396484375, -5.11865234375, -3.59765625, -2.07666015625, -0.5556640625, 0.96533203125, 2.486328125, 4.00732421875, 5.5283203125, 7.04931640625, 8.5703125, 10.09130859375, 11.6123046875, 13.13330078125, 14.654296875, 16.17529296875, 17.6962890625, 19.21728515625, 20.73828125, 22.25927734375, 23.7802734375, 25.30126953125, 26.822265625, 28.34326171875, 29.8642578125, 31.38525390625, 32.90625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 8.0, 23.0, 20.0, 36.0, 50.0, 108.0, 208.0, 405.0, 690.0, 843.0, 689.0, 470.0, 250.0, 112.0, 70.0, 37.0, 18.0, 13.0, 9.0, 7.0, 4.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.68359375, -4.45574951171875, -4.2279052734375, -4.00006103515625, -3.772216796875, -3.54437255859375, -3.3165283203125, -3.08868408203125, -2.86083984375, -2.63299560546875, -2.4051513671875, -2.17730712890625, -1.949462890625, -1.72161865234375, -1.4937744140625, -1.26593017578125, -1.0380859375, -0.81024169921875, -0.5823974609375, -0.35455322265625, -0.126708984375, 0.10113525390625, 0.3289794921875, 0.55682373046875, 0.78466796875, 1.01251220703125, 1.2403564453125, 1.46820068359375, 1.696044921875, 1.92388916015625, 2.1517333984375, 2.37957763671875, 2.607421875, 2.83526611328125, 3.0631103515625, 3.29095458984375, 3.518798828125, 3.74664306640625, 3.9744873046875, 4.20233154296875, 4.43017578125, 4.65802001953125, 4.8858642578125, 5.11370849609375, 5.341552734375, 5.56939697265625, 5.7972412109375, 6.02508544921875, 6.2529296875, 6.48077392578125, 6.7086181640625, 6.93646240234375, 7.164306640625, 7.39215087890625, 7.6199951171875, 7.84783935546875, 8.07568359375, 8.30352783203125, 8.5313720703125, 8.75921630859375, 8.987060546875, 9.21490478515625, 9.4427490234375, 9.67059326171875, 9.8984375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 11.0, 36.0, 46.0, 80.0, 86.0, 110.0, 123.0, 137.0, 103.0, 96.0, 67.0, 49.0, 25.0, 17.0, 14.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.719768524169922, -23.99237823486328, -23.264989852905273, -22.537599563598633, -21.810209274291992, -21.082820892333984, -20.355430603027344, -19.628040313720703, -18.900650024414062, -18.173259735107422, -17.445871353149414, -16.718481063842773, -15.991090774536133, -15.263701438903809, -14.536312103271484, -13.808921813964844, -13.081533432006836, -12.354144096374512, -11.626753807067871, -10.899364471435547, -10.171974182128906, -9.444584846496582, -8.717195510864258, -7.989805698394775, -7.262415885925293, -6.5350260734558105, -5.807636260986328, -5.080246925354004, -4.3528571128845215, -3.625467300415039, -2.898077964782715, -2.1706881523132324, -1.44329833984375, -0.7159086465835571, 0.011481046676635742, 0.7388706207275391, 1.4662604331970215, 2.193650245666504, 2.921039581298828, 3.6484293937683105, 4.375819206237793, 5.103209018707275, 5.830598831176758, 6.557988166809082, 7.2853779792785645, 8.012767791748047, 8.740157127380371, 9.467546463012695, 10.194936752319336, 10.92232608795166, 11.6497163772583, 12.377105712890625, 13.104496002197266, 13.83188533782959, 14.559274673461914, 15.286664962768555, 16.014053344726562, 16.741443634033203, 17.46883201599121, 18.19622230529785, 18.923612594604492, 19.6510009765625, 20.37839126586914, 21.10578155517578, 21.833171844482422]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 5.0, 4.0, 7.0, 9.0, 7.0, 10.0, 14.0, 18.0, 27.0, 16.0, 23.0, 27.0, 28.0, 24.0, 35.0, 41.0, 34.0, 40.0, 41.0, 48.0, 42.0, 47.0, 47.0, 38.0, 36.0, 28.0, 33.0, 40.0, 23.0, 18.0, 23.0, 19.0, 24.0, 20.0, 18.0, 13.0, 15.0, 15.0, 12.0, 4.0, 4.0, 6.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.284128189086914, -8.009078025817871, -7.73402738571167, -7.458976745605469, -7.183926582336426, -6.908875942230225, -6.633825302124023, -6.3587751388549805, -6.0837249755859375, -5.808674335479736, -5.533624172210693, -5.258573532104492, -4.983523368835449, -4.708472728729248, -4.433422088623047, -4.158371925354004, -3.8833212852478027, -3.6082708835601807, -3.3332204818725586, -3.0581698417663574, -2.7831196784973145, -2.5080690383911133, -2.233018636703491, -1.9579682350158691, -1.682917833328247, -1.407867431640625, -1.132817029953003, -0.8577665090560913, -0.5827161073684692, -0.30766570568084717, -0.03261518478393555, 0.24243521690368652, 0.5174856185913086, 0.7925360202789307, 1.0675864219665527, 1.3426369428634644, 1.6176873445510864, 1.8927377462387085, 2.16778826713562, 2.442838668823242, 2.7178890705108643, 2.9929394721984863, 3.2679898738861084, 3.5430402755737305, 3.8180909156799316, 4.093141078948975, 4.368191719055176, 4.643241882324219, 4.91829252243042, 5.193343162536621, 5.468393325805664, 5.743443965911865, 6.018494129180908, 6.293544769287109, 6.568594932556152, 6.8436455726623535, 7.118696212768555, 7.393746852874756, 7.668797016143799, 7.94384765625, 8.218897819519043, 8.493947982788086, 8.768999099731445, 9.044049263000488, 9.319099426269531]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 10.0, 18.0, 23.0, 42.0, 74.0, 109.0, 197.0, 388.0, 1195.0, 4750.0, 28069.0, 275288.0, 632753.0, 90523.0, 11351.0, 2383.0, 715.0, 272.0, 149.0, 83.0, 59.0, 44.0, 28.0, 15.0, 6.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.171875, -5.043426513671875, -4.91497802734375, -4.786529541015625, -4.6580810546875, -4.529632568359375, -4.40118408203125, -4.272735595703125, -4.144287109375, -4.015838623046875, -3.88739013671875, -3.758941650390625, -3.6304931640625, -3.502044677734375, -3.37359619140625, -3.245147705078125, -3.11669921875, -2.988250732421875, -2.85980224609375, -2.731353759765625, -2.6029052734375, -2.474456787109375, -2.34600830078125, -2.217559814453125, -2.089111328125, -1.960662841796875, -1.83221435546875, -1.703765869140625, -1.5753173828125, -1.446868896484375, -1.31842041015625, -1.189971923828125, -1.0615234375, -0.933074951171875, -0.80462646484375, -0.676177978515625, -0.5477294921875, -0.419281005859375, -0.29083251953125, -0.162384033203125, -0.033935546875, 0.094512939453125, 0.22296142578125, 0.351409912109375, 0.4798583984375, 0.608306884765625, 0.73675537109375, 0.865203857421875, 0.99365234375, 1.122100830078125, 1.25054931640625, 1.378997802734375, 1.5074462890625, 1.635894775390625, 1.76434326171875, 1.892791748046875, 2.021240234375, 2.149688720703125, 2.27813720703125, 2.406585693359375, 2.5350341796875, 2.663482666015625, 2.79193115234375, 2.920379638671875, 3.048828125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 6.0, 2.0, 9.0, 9.0, 16.0, 22.0, 22.0, 38.0, 48.0, 53.0, 61.0, 68.0, 87.0, 74.0, 79.0, 68.0, 64.0, 66.0, 43.0, 36.0, 25.0, 33.0, 22.0, 18.0, 16.0, 10.0, 10.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.6796875, -13.37640380859375, -13.0731201171875, -12.76983642578125, -12.466552734375, -12.16326904296875, -11.8599853515625, -11.55670166015625, -11.25341796875, -10.95013427734375, -10.6468505859375, -10.34356689453125, -10.040283203125, -9.73699951171875, -9.4337158203125, -9.13043212890625, -8.8271484375, -8.52386474609375, -8.2205810546875, -7.91729736328125, -7.614013671875, -7.31072998046875, -7.0074462890625, -6.70416259765625, -6.40087890625, -6.09759521484375, -5.7943115234375, -5.49102783203125, -5.187744140625, -4.88446044921875, -4.5811767578125, -4.27789306640625, -3.974609375, -3.67132568359375, -3.3680419921875, -3.06475830078125, -2.761474609375, -2.45819091796875, -2.1549072265625, -1.85162353515625, -1.54833984375, -1.24505615234375, -0.9417724609375, -0.63848876953125, -0.335205078125, -0.03192138671875, 0.2713623046875, 0.57464599609375, 0.8779296875, 1.18121337890625, 1.4844970703125, 1.78778076171875, 2.091064453125, 2.39434814453125, 2.6976318359375, 3.00091552734375, 3.30419921875, 3.60748291015625, 3.9107666015625, 4.21405029296875, 4.517333984375, 4.82061767578125, 5.1239013671875, 5.42718505859375, 5.73046875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 7.0, 11.0, 12.0, 27.0, 36.0, 48.0, 76.0, 128.0, 201.0, 283.0, 390.0, 619.0, 996.0, 1466.0, 2320.0, 3707.0, 6034.0, 9945.0, 16175.0, 26299.0, 43111.0, 70448.0, 110060.0, 155496.0, 175495.0, 149940.0, 104048.0, 66022.0, 40562.0, 24484.0, 15094.0, 9172.0, 5639.0, 3603.0, 2339.0, 1507.0, 942.0, 592.0, 410.0, 234.0, 190.0, 98.0, 101.0, 55.0, 32.0, 30.0, 18.0, 18.0, 12.0, 6.0, 7.0, 5.0, 0.0, 3.0, 2.0, 3.0, 2.0], "bins": [-0.6416015625, -0.6211929321289062, -0.6007843017578125, -0.5803756713867188, -0.559967041015625, -0.5395584106445312, -0.5191497802734375, -0.49874114990234375, -0.47833251953125, -0.45792388916015625, -0.4375152587890625, -0.41710662841796875, -0.396697998046875, -0.37628936767578125, -0.3558807373046875, -0.33547210693359375, -0.3150634765625, -0.29465484619140625, -0.2742462158203125, -0.25383758544921875, -0.233428955078125, -0.21302032470703125, -0.1926116943359375, -0.17220306396484375, -0.15179443359375, -0.13138580322265625, -0.1109771728515625, -0.09056854248046875, -0.070159912109375, -0.04975128173828125, -0.0293426513671875, -0.00893402099609375, 0.011474609375, 0.03188323974609375, 0.0522918701171875, 0.07270050048828125, 0.093109130859375, 0.11351776123046875, 0.1339263916015625, 0.15433502197265625, 0.17474365234375, 0.19515228271484375, 0.2155609130859375, 0.23596954345703125, 0.256378173828125, 0.27678680419921875, 0.2971954345703125, 0.31760406494140625, 0.3380126953125, 0.35842132568359375, 0.3788299560546875, 0.39923858642578125, 0.419647216796875, 0.44005584716796875, 0.4604644775390625, 0.48087310791015625, 0.50128173828125, 0.5216903686523438, 0.5420989990234375, 0.5625076293945312, 0.582916259765625, 0.6033248901367188, 0.6237335205078125, 0.6441421508789062, 0.66455078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 9.0, 16.0, 7.0, 14.0, 18.0, 12.0, 23.0, 30.0, 26.0, 39.0, 40.0, 47.0, 52.0, 67.0, 46.0, 63.0, 63.0, 64.0, 55.0, 39.0, 42.0, 50.0, 28.0, 28.0, 20.0, 18.0, 12.0, 15.0, 10.0, 16.0, 3.0, 1.0, 4.0, 6.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.546875, -13.120849609375, -12.69482421875, -12.268798828125, -11.8427734375, -11.416748046875, -10.99072265625, -10.564697265625, -10.138671875, -9.712646484375, -9.28662109375, -8.860595703125, -8.4345703125, -8.008544921875, -7.58251953125, -7.156494140625, -6.73046875, -6.304443359375, -5.87841796875, -5.452392578125, -5.0263671875, -4.600341796875, -4.17431640625, -3.748291015625, -3.322265625, -2.896240234375, -2.47021484375, -2.044189453125, -1.6181640625, -1.192138671875, -0.76611328125, -0.340087890625, 0.0859375, 0.511962890625, 0.93798828125, 1.364013671875, 1.7900390625, 2.216064453125, 2.64208984375, 3.068115234375, 3.494140625, 3.920166015625, 4.34619140625, 4.772216796875, 5.1982421875, 5.624267578125, 6.05029296875, 6.476318359375, 6.90234375, 7.328369140625, 7.75439453125, 8.180419921875, 8.6064453125, 9.032470703125, 9.45849609375, 9.884521484375, 10.310546875, 10.736572265625, 11.16259765625, 11.588623046875, 12.0146484375, 12.440673828125, 12.86669921875, 13.292724609375, 13.71875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 5.0, 2.0, 12.0, 10.0, 25.0, 34.0, 64.0, 92.0, 160.0, 280.0, 507.0, 1109.0, 2635.0, 8049.0, 30750.0, 139014.0, 507159.0, 277753.0, 59089.0, 14265.0, 4269.0, 1650.0, 701.0, 352.0, 192.0, 126.0, 82.0, 57.0, 45.0, 12.0, 17.0, 10.0, 5.0, 8.0, 9.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2236328125, -0.21584701538085938, -0.20806121826171875, -0.20027542114257812, -0.1924896240234375, -0.18470382690429688, -0.17691802978515625, -0.16913223266601562, -0.161346435546875, -0.15356063842773438, -0.14577484130859375, -0.13798904418945312, -0.1302032470703125, -0.12241744995117188, -0.11463165283203125, -0.10684585571289062, -0.09906005859375, -0.09127426147460938, -0.08348846435546875, -0.07570266723632812, -0.0679168701171875, -0.060131072998046875, -0.05234527587890625, -0.044559478759765625, -0.036773681640625, -0.028987884521484375, -0.02120208740234375, -0.013416290283203125, -0.0056304931640625, 0.002155303955078125, 0.00994110107421875, 0.017726898193359375, 0.0255126953125, 0.033298492431640625, 0.04108428955078125, 0.048870086669921875, 0.0566558837890625, 0.06444168090820312, 0.07222747802734375, 0.08001327514648438, 0.087799072265625, 0.09558486938476562, 0.10337066650390625, 0.11115646362304688, 0.1189422607421875, 0.12672805786132812, 0.13451385498046875, 0.14229965209960938, 0.15008544921875, 0.15787124633789062, 0.16565704345703125, 0.17344284057617188, 0.1812286376953125, 0.18901443481445312, 0.19680023193359375, 0.20458602905273438, 0.212371826171875, 0.22015762329101562, 0.22794342041015625, 0.23572921752929688, 0.2435150146484375, 0.2513008117675781, 0.25908660888671875, 0.2668724060058594, 0.274658203125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 6.0, 4.0, 14.0, 13.0, 23.0, 36.0, 64.0, 55.0, 99.0, 103.0, 124.0, 135.0, 96.0, 62.0, 64.0, 27.0, 32.0, 13.0, 11.0, 10.0, 6.0, 3.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023674964904785156, -0.00023105181753635406, -0.00022535398602485657, -0.00021965615451335907, -0.00021395832300186157, -0.00020826049149036407, -0.00020256265997886658, -0.00019686482846736908, -0.00019116699695587158, -0.00018546916544437408, -0.0001797713339328766, -0.0001740735024213791, -0.0001683756709098816, -0.0001626778393983841, -0.0001569800078868866, -0.0001512821763753891, -0.0001455843448638916, -0.0001398865133523941, -0.0001341886818408966, -0.0001284908503293991, -0.0001227930188179016, -0.00011709518730640411, -0.00011139735579490662, -0.00010569952428340912, -0.00010000169277191162, -9.430386126041412e-05, -8.860602974891663e-05, -8.290819823741913e-05, -7.721036672592163e-05, -7.151253521442413e-05, -6.581470370292664e-05, -6.011687219142914e-05, -5.441904067993164e-05, -4.872120916843414e-05, -4.3023377656936646e-05, -3.732554614543915e-05, -3.162771463394165e-05, -2.5929883122444153e-05, -2.0232051610946655e-05, -1.4534220099449158e-05, -8.83638858795166e-06, -3.1385570764541626e-06, 2.559274435043335e-06, 8.257105946540833e-06, 1.395493745803833e-05, 1.9652768969535828e-05, 2.5350600481033325e-05, 3.104843199253082e-05, 3.674626350402832e-05, 4.244409501552582e-05, 4.8141926527023315e-05, 5.383975803852081e-05, 5.953758955001831e-05, 6.523542106151581e-05, 7.09332525730133e-05, 7.66310840845108e-05, 8.23289155960083e-05, 8.80267471075058e-05, 9.37245786190033e-05, 9.94224101305008e-05, 0.00010512024164199829, 0.00011081807315349579, 0.00011651590466499329, 0.00012221373617649078, 0.00012791156768798828]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 6.0, 3.0, 6.0, 12.0, 17.0, 25.0, 36.0, 72.0, 100.0, 198.0, 342.0, 570.0, 1132.0, 2264.0, 4586.0, 9902.0, 24229.0, 66955.0, 220534.0, 444039.0, 179868.0, 55929.0, 20487.0, 8707.0, 4123.0, 2062.0, 986.0, 601.0, 285.0, 177.0, 97.0, 62.0, 44.0, 30.0, 13.0, 16.0, 13.0, 4.0, 3.0, 5.0, 3.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2276611328125, -0.22063827514648438, -0.21361541748046875, -0.20659255981445312, -0.1995697021484375, -0.19254684448242188, -0.18552398681640625, -0.17850112915039062, -0.171478271484375, -0.16445541381835938, -0.15743255615234375, -0.15040969848632812, -0.1433868408203125, -0.13636398315429688, -0.12934112548828125, -0.12231826782226562, -0.11529541015625, -0.10827255249023438, -0.10124969482421875, -0.09422683715820312, -0.0872039794921875, -0.08018112182617188, -0.07315826416015625, -0.06613540649414062, -0.059112548828125, -0.052089691162109375, -0.04506683349609375, -0.038043975830078125, -0.0310211181640625, -0.023998260498046875, -0.01697540283203125, -0.009952545166015625, -0.0029296875, 0.004093170166015625, 0.01111602783203125, 0.018138885498046875, 0.0251617431640625, 0.032184600830078125, 0.03920745849609375, 0.046230316162109375, 0.053253173828125, 0.060276031494140625, 0.06729888916015625, 0.07432174682617188, 0.0813446044921875, 0.08836746215820312, 0.09539031982421875, 0.10241317749023438, 0.10943603515625, 0.11645889282226562, 0.12348175048828125, 0.13050460815429688, 0.1375274658203125, 0.14455032348632812, 0.15157318115234375, 0.15859603881835938, 0.165618896484375, 0.17264175415039062, 0.17966461181640625, 0.18668746948242188, 0.1937103271484375, 0.20073318481445312, 0.20775604248046875, 0.21477890014648438, 0.2218017578125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 6.0, 3.0, 6.0, 10.0, 2.0, 7.0, 7.0, 12.0, 23.0, 33.0, 22.0, 39.0, 51.0, 68.0, 73.0, 86.0, 99.0, 90.0, 76.0, 67.0, 39.0, 44.0, 38.0, 26.0, 14.0, 18.0, 6.0, 2.0, 10.0, 7.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.053070068359375, -0.0513763427734375, -0.0496826171875, -0.0479888916015625, -0.046295166015625, -0.0446014404296875, -0.04290771484375, -0.0412139892578125, -0.039520263671875, -0.0378265380859375, -0.0361328125, -0.0344390869140625, -0.032745361328125, -0.0310516357421875, -0.02935791015625, -0.0276641845703125, -0.025970458984375, -0.0242767333984375, -0.0225830078125, -0.0208892822265625, -0.019195556640625, -0.0175018310546875, -0.01580810546875, -0.0141143798828125, -0.012420654296875, -0.0107269287109375, -0.009033203125, -0.0073394775390625, -0.005645751953125, -0.0039520263671875, -0.00225830078125, -0.0005645751953125, 0.001129150390625, 0.0028228759765625, 0.0045166015625, 0.0062103271484375, 0.007904052734375, 0.0095977783203125, 0.01129150390625, 0.0129852294921875, 0.014678955078125, 0.0163726806640625, 0.01806640625, 0.0197601318359375, 0.021453857421875, 0.0231475830078125, 0.02484130859375, 0.0265350341796875, 0.028228759765625, 0.0299224853515625, 0.0316162109375, 0.0333099365234375, 0.035003662109375, 0.0366973876953125, 0.03839111328125, 0.0400848388671875, 0.041778564453125, 0.0434722900390625, 0.045166015625, 0.0468597412109375, 0.048553466796875, 0.0502471923828125, 0.05194091796875, 0.0536346435546875, 0.055328369140625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 9.0, 16.0, 59.0, 104.0, 156.0, 198.0, 157.0, 170.0, 84.0, 37.0, 19.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.7308464050293, -33.079444885253906, -32.42803955078125, -31.77663803100586, -31.12523651123047, -30.473833084106445, -29.822429656982422, -29.17102813720703, -28.519624710083008, -27.868221282958984, -27.216819763183594, -26.56541633605957, -25.91401481628418, -25.262611389160156, -24.611209869384766, -23.959806442260742, -23.30840301513672, -22.656999588012695, -22.005598068237305, -21.35419464111328, -20.70279312133789, -20.051389694213867, -19.399986267089844, -18.748584747314453, -18.097183227539062, -17.44577980041504, -16.79437828063965, -16.142974853515625, -15.491572380065918, -14.840169906616211, -14.188767433166504, -13.537364959716797, -12.88595962524414, -12.234557151794434, -11.583154678344727, -10.931751251220703, -10.280348777770996, -9.628946304321289, -8.977543830871582, -8.326141357421875, -7.674738883972168, -7.023336410522461, -6.371933460235596, -5.720530986785889, -5.069128036499023, -4.417725563049316, -3.7663230895996094, -3.114920139312744, -2.463517665863037, -1.812114953994751, -1.1607123613357544, -0.5093097686767578, 0.14209294319152832, 0.7934956550598145, 1.4448981285095215, 2.0963010787963867, 2.7477035522460938, 3.39910626411438, 4.050508975982666, 4.701911449432373, 5.353314399719238, 6.004716873168945, 6.656119346618652, 7.307522296905518, 7.958924770355225]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 7.0, 3.0, 8.0, 7.0, 9.0, 17.0, 19.0, 28.0, 25.0, 36.0, 40.0, 38.0, 58.0, 47.0, 61.0, 54.0, 69.0, 62.0, 52.0, 51.0, 40.0, 48.0, 28.0, 32.0, 30.0, 23.0, 27.0, 13.0, 22.0, 9.0, 12.0, 5.0, 11.0, 6.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.660941123962402, -8.443230628967285, -8.225520133972168, -8.00780963897705, -7.790098667144775, -7.572388172149658, -7.354677200317383, -7.136966705322266, -6.919256210327148, -6.701545715332031, -6.483835220336914, -6.266124248504639, -6.0484137535095215, -5.830703258514404, -5.612992286682129, -5.395281791687012, -5.1775712966918945, -4.959860801696777, -4.74215030670166, -4.524439334869385, -4.306728839874268, -4.08901834487915, -3.871307611465454, -3.653596878051758, -3.4358863830566406, -3.2181758880615234, -3.000465154647827, -2.782754421234131, -2.5650439262390137, -2.3473334312438965, -2.1296226978302, -1.9119120836257935, -1.6942014694213867, -1.47649085521698, -1.2587802410125732, -1.0410696268081665, -0.8233590126037598, -0.605648398399353, -0.3879377841949463, -0.17022716999053955, 0.04748344421386719, 0.2651940584182739, 0.48290467262268066, 0.7006152868270874, 0.9183259010314941, 1.1360365152359009, 1.3537471294403076, 1.5714577436447144, 1.789168357849121, 2.0068788528442383, 2.2245895862579346, 2.442300319671631, 2.660010814666748, 2.8777213096618652, 3.0954320430755615, 3.313142776489258, 3.530853271484375, 3.748563766479492, 3.9662744998931885, 4.183985233306885, 4.401695728302002, 4.619406223297119, 4.8371171951293945, 5.054827690124512, 5.272538185119629]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 6.0, 8.0, 7.0, 17.0, 17.0, 29.0, 48.0, 74.0, 144.0, 290.0, 667.0, 1981.0, 6854.0, 26670.0, 110518.0, 423568.0, 359090.0, 88544.0, 21639.0, 5559.0, 1635.0, 586.0, 260.0, 132.0, 75.0, 40.0, 33.0, 18.0, 9.0, 5.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4609375, -10.0723876953125, -9.683837890625, -9.2952880859375, -8.90673828125, -8.5181884765625, -8.129638671875, -7.7410888671875, -7.3525390625, -6.9639892578125, -6.575439453125, -6.1868896484375, -5.79833984375, -5.4097900390625, -5.021240234375, -4.6326904296875, -4.244140625, -3.8555908203125, -3.467041015625, -3.0784912109375, -2.68994140625, -2.3013916015625, -1.912841796875, -1.5242919921875, -1.1357421875, -0.7471923828125, -0.358642578125, 0.0299072265625, 0.41845703125, 0.8070068359375, 1.195556640625, 1.5841064453125, 1.97265625, 2.3612060546875, 2.749755859375, 3.1383056640625, 3.52685546875, 3.9154052734375, 4.303955078125, 4.6925048828125, 5.0810546875, 5.4696044921875, 5.858154296875, 6.2467041015625, 6.63525390625, 7.0238037109375, 7.412353515625, 7.8009033203125, 8.189453125, 8.5780029296875, 8.966552734375, 9.3551025390625, 9.74365234375, 10.1322021484375, 10.520751953125, 10.9093017578125, 11.2978515625, 11.6864013671875, 12.074951171875, 12.4635009765625, 12.85205078125, 13.2406005859375, 13.629150390625, 14.0177001953125, 14.40625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 6.0, 4.0, 9.0, 11.0, 13.0, 13.0, 22.0, 19.0, 43.0, 38.0, 46.0, 39.0, 54.0, 53.0, 52.0, 49.0, 65.0, 75.0, 56.0, 44.0, 55.0, 30.0, 32.0, 28.0, 21.0, 34.0, 18.0, 10.0, 19.0, 12.0, 12.0, 2.0, 7.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.453125, -16.024169921875, -15.59521484375, -15.166259765625, -14.7373046875, -14.308349609375, -13.87939453125, -13.450439453125, -13.021484375, -12.592529296875, -12.16357421875, -11.734619140625, -11.3056640625, -10.876708984375, -10.44775390625, -10.018798828125, -9.58984375, -9.160888671875, -8.73193359375, -8.302978515625, -7.8740234375, -7.445068359375, -7.01611328125, -6.587158203125, -6.158203125, -5.729248046875, -5.30029296875, -4.871337890625, -4.4423828125, -4.013427734375, -3.58447265625, -3.155517578125, -2.7265625, -2.297607421875, -1.86865234375, -1.439697265625, -1.0107421875, -0.581787109375, -0.15283203125, 0.276123046875, 0.705078125, 1.134033203125, 1.56298828125, 1.991943359375, 2.4208984375, 2.849853515625, 3.27880859375, 3.707763671875, 4.13671875, 4.565673828125, 4.99462890625, 5.423583984375, 5.8525390625, 6.281494140625, 6.71044921875, 7.139404296875, 7.568359375, 7.997314453125, 8.42626953125, 8.855224609375, 9.2841796875, 9.713134765625, 10.14208984375, 10.571044921875, 11.0]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 9.0, 10.0, 10.0, 14.0, 22.0, 32.0, 36.0, 49.0, 76.0, 133.0, 189.0, 306.0, 724.0, 2664.0, 16731.0, 128260.0, 620055.0, 241016.0, 31567.0, 4555.0, 1053.0, 412.0, 212.0, 142.0, 78.0, 59.0, 39.0, 23.0, 24.0, 16.0, 10.0, 14.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.25, -11.753173828125, -11.25634765625, -10.759521484375, -10.2626953125, -9.765869140625, -9.26904296875, -8.772216796875, -8.275390625, -7.778564453125, -7.28173828125, -6.784912109375, -6.2880859375, -5.791259765625, -5.29443359375, -4.797607421875, -4.30078125, -3.803955078125, -3.30712890625, -2.810302734375, -2.3134765625, -1.816650390625, -1.31982421875, -0.822998046875, -0.326171875, 0.170654296875, 0.66748046875, 1.164306640625, 1.6611328125, 2.157958984375, 2.65478515625, 3.151611328125, 3.6484375, 4.145263671875, 4.64208984375, 5.138916015625, 5.6357421875, 6.132568359375, 6.62939453125, 7.126220703125, 7.623046875, 8.119873046875, 8.61669921875, 9.113525390625, 9.6103515625, 10.107177734375, 10.60400390625, 11.100830078125, 11.59765625, 12.094482421875, 12.59130859375, 13.088134765625, 13.5849609375, 14.081787109375, 14.57861328125, 15.075439453125, 15.572265625, 16.069091796875, 16.56591796875, 17.062744140625, 17.5595703125, 18.056396484375, 18.55322265625, 19.050048828125, 19.546875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 5.0, 0.0, 0.0, 3.0, 6.0, 7.0, 5.0, 2.0, 6.0, 11.0, 10.0, 8.0, 12.0, 16.0, 24.0, 20.0, 22.0, 31.0, 37.0, 50.0, 47.0, 58.0, 57.0, 64.0, 67.0, 54.0, 45.0, 43.0, 54.0, 40.0, 33.0, 31.0, 27.0, 17.0, 23.0, 16.0, 12.0, 11.0, 13.0, 4.0, 6.0, 5.0, 2.0, 3.0, 4.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.171875, -10.72998046875, -10.2880859375, -9.84619140625, -9.404296875, -8.96240234375, -8.5205078125, -8.07861328125, -7.63671875, -7.19482421875, -6.7529296875, -6.31103515625, -5.869140625, -5.42724609375, -4.9853515625, -4.54345703125, -4.1015625, -3.65966796875, -3.2177734375, -2.77587890625, -2.333984375, -1.89208984375, -1.4501953125, -1.00830078125, -0.56640625, -0.12451171875, 0.3173828125, 0.75927734375, 1.201171875, 1.64306640625, 2.0849609375, 2.52685546875, 2.96875, 3.41064453125, 3.8525390625, 4.29443359375, 4.736328125, 5.17822265625, 5.6201171875, 6.06201171875, 6.50390625, 6.94580078125, 7.3876953125, 7.82958984375, 8.271484375, 8.71337890625, 9.1552734375, 9.59716796875, 10.0390625, 10.48095703125, 10.9228515625, 11.36474609375, 11.806640625, 12.24853515625, 12.6904296875, 13.13232421875, 13.57421875, 14.01611328125, 14.4580078125, 14.89990234375, 15.341796875, 15.78369140625, 16.2255859375, 16.66748046875, 17.109375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 14.0, 21.0, 25.0, 94.0, 391.0, 2262.0, 93653.0, 937124.0, 13551.0, 1076.0, 224.0, 61.0, 26.0, 9.0, 12.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7421875, -13.30322265625, -12.8642578125, -12.42529296875, -11.986328125, -11.54736328125, -11.1083984375, -10.66943359375, -10.23046875, -9.79150390625, -9.3525390625, -8.91357421875, -8.474609375, -8.03564453125, -7.5966796875, -7.15771484375, -6.71875, -6.27978515625, -5.8408203125, -5.40185546875, -4.962890625, -4.52392578125, -4.0849609375, -3.64599609375, -3.20703125, -2.76806640625, -2.3291015625, -1.89013671875, -1.451171875, -1.01220703125, -0.5732421875, -0.13427734375, 0.3046875, 0.74365234375, 1.1826171875, 1.62158203125, 2.060546875, 2.49951171875, 2.9384765625, 3.37744140625, 3.81640625, 4.25537109375, 4.6943359375, 5.13330078125, 5.572265625, 6.01123046875, 6.4501953125, 6.88916015625, 7.328125, 7.76708984375, 8.2060546875, 8.64501953125, 9.083984375, 9.52294921875, 9.9619140625, 10.40087890625, 10.83984375, 11.27880859375, 11.7177734375, 12.15673828125, 12.595703125, 13.03466796875, 13.4736328125, 13.91259765625, 14.3515625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 14.0, 18.0, 18.0, 32.0, 67.0, 78.0, 122.0, 161.0, 163.0, 110.0, 79.0, 46.0, 33.0, 26.0, 10.0, 4.0, 7.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010042190551757812, -0.0009680688381195068, -0.0009319186210632324, -0.000895768404006958, -0.0008596181869506836, -0.0008234679698944092, -0.0007873177528381348, -0.0007511675357818604, -0.0007150173187255859, -0.0006788671016693115, -0.0006427168846130371, -0.0006065666675567627, -0.0005704164505004883, -0.0005342662334442139, -0.0004981160163879395, -0.00046196579933166504, -0.0004258155822753906, -0.0003896653652191162, -0.0003535151481628418, -0.0003173649311065674, -0.00028121471405029297, -0.00024506449699401855, -0.00020891427993774414, -0.00017276406288146973, -0.0001366138458251953, -0.0001004636287689209, -6.431341171264648e-05, -2.816319465637207e-05, 7.987022399902344e-06, 4.413723945617676e-05, 8.028745651245117e-05, 0.00011643767356872559, 0.000152587890625, 0.00018873810768127441, 0.00022488832473754883, 0.00026103854179382324, 0.00029718875885009766, 0.00033333897590637207, 0.0003694891929626465, 0.0004056394100189209, 0.0004417896270751953, 0.0004779398441314697, 0.0005140900611877441, 0.0005502402782440186, 0.000586390495300293, 0.0006225407123565674, 0.0006586909294128418, 0.0006948411464691162, 0.0007309913635253906, 0.000767141580581665, 0.0008032917976379395, 0.0008394420146942139, 0.0008755922317504883, 0.0009117424488067627, 0.0009478926658630371, 0.0009840428829193115, 0.001020193099975586, 0.0010563433170318604, 0.0010924935340881348, 0.0011286437511444092, 0.0011647939682006836, 0.001200944185256958, 0.0012370944023132324, 0.0012732446193695068, 0.0013093948364257812]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 6.0, 12.0, 25.0, 38.0, 81.0, 137.0, 312.0, 703.0, 1935.0, 7267.0, 63087.0, 678251.0, 271532.0, 19345.0, 3712.0, 1193.0, 479.0, 204.0, 103.0, 55.0, 22.0, 12.0, 10.0, 8.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.2578125, -9.01898193359375, -8.7801513671875, -8.54132080078125, -8.302490234375, -8.06365966796875, -7.8248291015625, -7.58599853515625, -7.34716796875, -7.10833740234375, -6.8695068359375, -6.63067626953125, -6.391845703125, -6.15301513671875, -5.9141845703125, -5.67535400390625, -5.4365234375, -5.19769287109375, -4.9588623046875, -4.72003173828125, -4.481201171875, -4.24237060546875, -4.0035400390625, -3.76470947265625, -3.52587890625, -3.28704833984375, -3.0482177734375, -2.80938720703125, -2.570556640625, -2.33172607421875, -2.0928955078125, -1.85406494140625, -1.615234375, -1.37640380859375, -1.1375732421875, -0.89874267578125, -0.659912109375, -0.42108154296875, -0.1822509765625, 0.05657958984375, 0.29541015625, 0.53424072265625, 0.7730712890625, 1.01190185546875, 1.250732421875, 1.48956298828125, 1.7283935546875, 1.96722412109375, 2.2060546875, 2.44488525390625, 2.6837158203125, 2.92254638671875, 3.161376953125, 3.40020751953125, 3.6390380859375, 3.87786865234375, 4.11669921875, 4.35552978515625, 4.5943603515625, 4.83319091796875, 5.072021484375, 5.31085205078125, 5.5496826171875, 5.78851318359375, 6.02734375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 12.0, 12.0, 22.0, 29.0, 33.0, 51.0, 77.0, 114.0, 118.0, 135.0, 124.0, 82.0, 53.0, 39.0, 30.0, 16.0, 19.0, 12.0, 6.0, 7.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.255859375, -2.169403076171875, -2.08294677734375, -1.996490478515625, -1.9100341796875, -1.823577880859375, -1.73712158203125, -1.650665283203125, -1.564208984375, -1.477752685546875, -1.39129638671875, -1.304840087890625, -1.2183837890625, -1.131927490234375, -1.04547119140625, -0.959014892578125, -0.87255859375, -0.786102294921875, -0.69964599609375, -0.613189697265625, -0.5267333984375, -0.440277099609375, -0.35382080078125, -0.267364501953125, -0.180908203125, -0.094451904296875, -0.00799560546875, 0.078460693359375, 0.1649169921875, 0.251373291015625, 0.33782958984375, 0.424285888671875, 0.5107421875, 0.597198486328125, 0.68365478515625, 0.770111083984375, 0.8565673828125, 0.943023681640625, 1.02947998046875, 1.115936279296875, 1.202392578125, 1.288848876953125, 1.37530517578125, 1.461761474609375, 1.5482177734375, 1.634674072265625, 1.72113037109375, 1.807586669921875, 1.89404296875, 1.980499267578125, 2.06695556640625, 2.153411865234375, 2.2398681640625, 2.326324462890625, 2.41278076171875, 2.499237060546875, 2.585693359375, 2.672149658203125, 2.75860595703125, 2.845062255859375, 2.9315185546875, 3.017974853515625, 3.10443115234375, 3.190887451171875, 3.27734375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 7.0, 12.0, 19.0, 23.0, 44.0, 58.0, 87.0, 107.0, 115.0, 113.0, 113.0, 78.0, 67.0, 55.0, 38.0, 29.0, 20.0, 8.0, 8.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.609386444091797, -17.8399715423584, -17.070558547973633, -16.301143646240234, -15.531728744506836, -14.762314796447754, -13.992900848388672, -13.223485946655273, -12.454071998596191, -11.68465805053711, -10.915243148803711, -10.145829200744629, -9.376415252685547, -8.607000350952148, -7.837586402893066, -7.068171977996826, -6.298757553100586, -5.529343128204346, -4.7599287033081055, -3.9905147552490234, -3.221100330352783, -2.451685905456543, -1.682271957397461, -0.9128575325012207, -0.14344310760498047, 0.6259711980819702, 1.395385503768921, 2.164799690246582, 2.9342141151428223, 3.7036285400390625, 4.4730424880981445, 5.242456912994385, 6.011869430541992, 6.781283855438232, 7.550698280334473, 8.320112228393555, 9.089527130126953, 9.858941078186035, 10.628355026245117, 11.397769927978516, 12.167183876037598, 12.93659782409668, 13.706012725830078, 14.47542667388916, 15.244840621948242, 16.01425552368164, 16.783668518066406, 17.553083419799805, 18.322498321533203, 19.0919132232666, 19.861326217651367, 20.630741119384766, 21.400156021118164, 22.169570922851562, 22.938983917236328, 23.708398818969727, 24.477813720703125, 25.247228622436523, 26.01664161682129, 26.786056518554688, 27.555471420288086, 28.324886322021484, 29.09429931640625, 29.86371421813965, 30.633127212524414]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 9.0, 4.0, 3.0, 5.0, 9.0, 9.0, 10.0, 18.0, 16.0, 20.0, 27.0, 30.0, 31.0, 30.0, 35.0, 32.0, 25.0, 37.0, 44.0, 36.0, 42.0, 39.0, 59.0, 56.0, 40.0, 33.0, 40.0, 30.0, 34.0, 24.0, 31.0, 29.0, 18.0, 21.0, 21.0, 5.0, 16.0, 7.0, 10.0, 8.0, 2.0, 5.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.277517318725586, -19.671737670898438, -19.06595802307129, -18.460180282592773, -17.854400634765625, -17.248620986938477, -16.642841339111328, -16.03706169128418, -15.431282997131348, -14.8255033493042, -14.219724655151367, -13.613945007324219, -13.00816535949707, -12.402386665344238, -11.79660701751709, -11.190828323364258, -10.58504867553711, -9.979269027709961, -9.373490333557129, -8.76771068572998, -8.161931991577148, -7.55615234375, -6.950372695922852, -6.344593524932861, -5.738814353942871, -5.133035182952881, -4.527256011962891, -3.921476364135742, -3.315697193145752, -2.7099180221557617, -2.1041386127471924, -1.498359203338623, -0.892578125, -0.2867988348007202, 0.31898045539855957, 0.9247597455978394, 1.5305390357971191, 2.1363182067871094, 2.7420976161956787, 3.347877025604248, 3.9536561965942383, 4.5594353675842285, 5.165214538574219, 5.770994186401367, 6.376773357391357, 6.982552528381348, 7.588332176208496, 8.194110870361328, 8.799890518188477, 9.405670166015625, 10.011448860168457, 10.617228507995605, 11.223007202148438, 11.828786849975586, 12.434566497802734, 13.040346145629883, 13.646124839782715, 14.251904487609863, 14.857683181762695, 15.463462829589844, 16.069242477416992, 16.67502212524414, 17.280799865722656, 17.886579513549805, 18.492359161376953]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 9.0, 3.0, 3.0, 3.0, 9.0, 12.0, 14.0, 17.0, 13.0, 28.0, 48.0, 51.0, 68.0, 98.0, 151.0, 315.0, 611.0, 1593.0, 4875.0, 23089.0, 179009.0, 1730891.0, 1991786.0, 225458.0, 27557.0, 5413.0, 1625.0, 635.0, 318.0, 171.0, 119.0, 71.0, 52.0, 43.0, 35.0, 24.0, 16.0, 6.0, 11.0, 6.0, 8.0, 6.0, 3.0, 9.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.609375, -12.17529296875, -11.7412109375, -11.30712890625, -10.873046875, -10.43896484375, -10.0048828125, -9.57080078125, -9.13671875, -8.70263671875, -8.2685546875, -7.83447265625, -7.400390625, -6.96630859375, -6.5322265625, -6.09814453125, -5.6640625, -5.22998046875, -4.7958984375, -4.36181640625, -3.927734375, -3.49365234375, -3.0595703125, -2.62548828125, -2.19140625, -1.75732421875, -1.3232421875, -0.88916015625, -0.455078125, -0.02099609375, 0.4130859375, 0.84716796875, 1.28125, 1.71533203125, 2.1494140625, 2.58349609375, 3.017578125, 3.45166015625, 3.8857421875, 4.31982421875, 4.75390625, 5.18798828125, 5.6220703125, 6.05615234375, 6.490234375, 6.92431640625, 7.3583984375, 7.79248046875, 8.2265625, 8.66064453125, 9.0947265625, 9.52880859375, 9.962890625, 10.39697265625, 10.8310546875, 11.26513671875, 11.69921875, 12.13330078125, 12.5673828125, 13.00146484375, 13.435546875, 13.86962890625, 14.3037109375, 14.73779296875, 15.171875]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 10.0, 16.0, 15.0, 21.0, 24.0, 31.0, 49.0, 49.0, 41.0, 74.0, 62.0, 81.0, 60.0, 76.0, 64.0, 61.0, 54.0, 32.0, 43.0, 35.0, 35.0, 27.0, 12.0, 9.0, 6.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.95703125, -6.65875244140625, -6.3604736328125, -6.06219482421875, -5.763916015625, -5.46563720703125, -5.1673583984375, -4.86907958984375, -4.57080078125, -4.27252197265625, -3.9742431640625, -3.67596435546875, -3.377685546875, -3.07940673828125, -2.7811279296875, -2.48284912109375, -2.1845703125, -1.88629150390625, -1.5880126953125, -1.28973388671875, -0.991455078125, -0.69317626953125, -0.3948974609375, -0.09661865234375, 0.20166015625, 0.49993896484375, 0.7982177734375, 1.09649658203125, 1.394775390625, 1.69305419921875, 1.9913330078125, 2.28961181640625, 2.587890625, 2.88616943359375, 3.1844482421875, 3.48272705078125, 3.781005859375, 4.07928466796875, 4.3775634765625, 4.67584228515625, 4.97412109375, 5.27239990234375, 5.5706787109375, 5.86895751953125, 6.167236328125, 6.46551513671875, 6.7637939453125, 7.06207275390625, 7.3603515625, 7.65863037109375, 7.9569091796875, 8.25518798828125, 8.553466796875, 8.85174560546875, 9.1500244140625, 9.44830322265625, 9.74658203125, 10.04486083984375, 10.3431396484375, 10.64141845703125, 10.939697265625, 11.23797607421875, 11.5362548828125, 11.83453369140625, 12.1328125]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 13.0, 20.0, 72.0, 249.0, 1332.0, 19479.0, 4158278.0, 13270.0, 1216.0, 231.0, 67.0, 21.0, 14.0, 6.0, 3.0, 2.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.125, -50.1552734375, -48.185546875, -46.2158203125, -44.24609375, -42.2763671875, -40.306640625, -38.3369140625, -36.3671875, -34.3974609375, -32.427734375, -30.4580078125, -28.48828125, -26.5185546875, -24.548828125, -22.5791015625, -20.609375, -18.6396484375, -16.669921875, -14.7001953125, -12.73046875, -10.7607421875, -8.791015625, -6.8212890625, -4.8515625, -2.8818359375, -0.912109375, 1.0576171875, 3.02734375, 4.9970703125, 6.966796875, 8.9365234375, 10.90625, 12.8759765625, 14.845703125, 16.8154296875, 18.78515625, 20.7548828125, 22.724609375, 24.6943359375, 26.6640625, 28.6337890625, 30.603515625, 32.5732421875, 34.54296875, 36.5126953125, 38.482421875, 40.4521484375, 42.421875, 44.3916015625, 46.361328125, 48.3310546875, 50.30078125, 52.2705078125, 54.240234375, 56.2099609375, 58.1796875, 60.1494140625, 62.119140625, 64.0888671875, 66.05859375, 68.0283203125, 69.998046875, 71.9677734375, 73.9375]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 13.0, 20.0, 39.0, 89.0, 218.0, 385.0, 694.0, 962.0, 770.0, 425.0, 227.0, 119.0, 50.0, 27.0, 12.0, 8.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0859375, -8.844482421875, -8.60302734375, -8.361572265625, -8.1201171875, -7.878662109375, -7.63720703125, -7.395751953125, -7.154296875, -6.912841796875, -6.67138671875, -6.429931640625, -6.1884765625, -5.947021484375, -5.70556640625, -5.464111328125, -5.22265625, -4.981201171875, -4.73974609375, -4.498291015625, -4.2568359375, -4.015380859375, -3.77392578125, -3.532470703125, -3.291015625, -3.049560546875, -2.80810546875, -2.566650390625, -2.3251953125, -2.083740234375, -1.84228515625, -1.600830078125, -1.359375, -1.117919921875, -0.87646484375, -0.635009765625, -0.3935546875, -0.152099609375, 0.08935546875, 0.330810546875, 0.572265625, 0.813720703125, 1.05517578125, 1.296630859375, 1.5380859375, 1.779541015625, 2.02099609375, 2.262451171875, 2.50390625, 2.745361328125, 2.98681640625, 3.228271484375, 3.4697265625, 3.711181640625, 3.95263671875, 4.194091796875, 4.435546875, 4.677001953125, 4.91845703125, 5.159912109375, 5.4013671875, 5.642822265625, 5.88427734375, 6.125732421875, 6.3671875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 7.0, 9.0, 11.0, 8.0, 6.0, 18.0, 12.0, 12.0, 22.0, 30.0, 33.0, 32.0, 43.0, 53.0, 47.0, 47.0, 53.0, 47.0, 53.0, 58.0, 50.0, 45.0, 39.0, 47.0, 37.0, 36.0, 30.0, 23.0, 16.0, 25.0, 18.0, 10.0, 12.0, 6.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.90057373046875, -8.617405891418457, -8.334238052368164, -8.051070213317871, -7.767902374267578, -7.484734535217285, -7.201566219329834, -6.918398380279541, -6.635230541229248, -6.352062702178955, -6.068894863128662, -5.785727024078369, -5.502558708190918, -5.219390869140625, -4.936223030090332, -4.653055191040039, -4.369887351989746, -4.086719512939453, -3.80355167388916, -3.520383596420288, -3.237215757369995, -2.954047918319702, -2.67087984085083, -2.387712001800537, -2.104544162750244, -1.8213763236999512, -1.5382083654403687, -1.2550404071807861, -0.9718725681304932, -0.6887047290802002, -0.4055367708206177, -0.12236881256103516, 0.1607990264892578, 0.44396692514419556, 0.7271348237991333, 1.0103027820587158, 1.2934706211090088, 1.5766384601593018, 1.8598064184188843, 2.142974376678467, 2.4261422157287598, 2.7093100547790527, 2.9924778938293457, 3.2756459712982178, 3.5588138103485107, 3.8419816493988037, 4.125149726867676, 4.408317565917969, 4.691485404968262, 4.974653244018555, 5.257821083068848, 5.540988922119141, 5.824156761169434, 6.107324600219727, 6.390492916107178, 6.673660755157471, 6.956828594207764, 7.239996433258057, 7.52316427230835, 7.806332111358643, 8.089500427246094, 8.372668266296387, 8.65583610534668, 8.939003944396973, 9.222171783447266]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 9.0, 6.0, 11.0, 10.0, 13.0, 13.0, 17.0, 15.0, 12.0, 12.0, 28.0, 30.0, 30.0, 39.0, 26.0, 34.0, 41.0, 36.0, 40.0, 35.0, 48.0, 21.0, 33.0, 43.0, 37.0, 34.0, 35.0, 36.0, 27.0, 27.0, 22.0, 25.0, 21.0, 19.0, 12.0, 19.0, 22.0, 14.0, 7.0, 9.0, 8.0, 5.0, 5.0, 4.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0], "bins": [-8.134027481079102, -7.905045032501221, -7.67606258392334, -7.447079658508301, -7.21809720993042, -6.989114761352539, -6.760132312774658, -6.531149864196777, -6.302166938781738, -6.073184490203857, -5.844202041625977, -5.6152191162109375, -5.386236667633057, -5.157254219055176, -4.928271770477295, -4.699289321899414, -4.470306873321533, -4.241324424743652, -4.0123419761657715, -3.7833592891693115, -3.5543766021728516, -3.3253941535949707, -3.09641170501709, -2.867429256439209, -2.638446569442749, -2.409464120864868, -2.180481433868408, -1.9514989852905273, -1.722516417503357, -1.4935338497161865, -1.2645514011383057, -1.0355688333511353, -0.8065857887268066, -0.5776032209396362, -0.3486207127571106, -0.11963820457458496, 0.10934436321258545, 0.33832693099975586, 0.5673093795776367, 0.7962919473648071, 1.0252745151519775, 1.254257082939148, 1.4832396507263184, 1.7122220993041992, 1.9412046670913696, 2.17018723487854, 2.399169683456421, 2.628152370452881, 2.8571348190307617, 3.0861172676086426, 3.3150999546051025, 3.5440824031829834, 3.7730650901794434, 4.002047538757324, 4.231029987335205, 4.460012435913086, 4.688995361328125, 4.917977809906006, 5.146960258483887, 5.375943183898926, 5.604925632476807, 5.8339080810546875, 6.062890529632568, 6.291872978210449, 6.52085542678833]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 1.0, 3.0, 5.0, 6.0, 14.0, 15.0, 15.0, 26.0, 26.0, 37.0, 45.0, 57.0, 88.0, 123.0, 157.0, 204.0, 312.0, 393.0, 854.0, 2528.0, 11812.0, 70237.0, 355649.0, 465203.0, 115225.0, 19082.0, 3719.0, 1037.0, 498.0, 304.0, 225.0, 155.0, 127.0, 94.0, 63.0, 46.0, 42.0, 38.0, 18.0, 11.0, 18.0, 11.0, 13.0, 6.0, 2.0, 7.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-2.95703125, -2.865020751953125, -2.77301025390625, -2.680999755859375, -2.5889892578125, -2.496978759765625, -2.40496826171875, -2.312957763671875, -2.220947265625, -2.128936767578125, -2.03692626953125, -1.944915771484375, -1.8529052734375, -1.760894775390625, -1.66888427734375, -1.576873779296875, -1.48486328125, -1.392852783203125, -1.30084228515625, -1.208831787109375, -1.1168212890625, -1.024810791015625, -0.93280029296875, -0.840789794921875, -0.748779296875, -0.656768798828125, -0.56475830078125, -0.472747802734375, -0.3807373046875, -0.288726806640625, -0.19671630859375, -0.104705810546875, -0.0126953125, 0.079315185546875, 0.17132568359375, 0.263336181640625, 0.3553466796875, 0.447357177734375, 0.53936767578125, 0.631378173828125, 0.723388671875, 0.815399169921875, 0.90740966796875, 0.999420166015625, 1.0914306640625, 1.183441162109375, 1.27545166015625, 1.367462158203125, 1.45947265625, 1.551483154296875, 1.64349365234375, 1.735504150390625, 1.8275146484375, 1.919525146484375, 2.01153564453125, 2.103546142578125, 2.195556640625, 2.287567138671875, 2.37957763671875, 2.471588134765625, 2.5635986328125, 2.655609130859375, 2.74761962890625, 2.839630126953125, 2.931640625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 9.0, 4.0, 12.0, 10.0, 13.0, 15.0, 12.0, 18.0, 18.0, 23.0, 26.0, 20.0, 42.0, 28.0, 37.0, 49.0, 30.0, 44.0, 44.0, 34.0, 41.0, 55.0, 43.0, 36.0, 35.0, 26.0, 35.0, 34.0, 31.0, 24.0, 27.0, 15.0, 15.0, 22.0, 12.0, 12.0, 7.0, 11.0, 7.0, 6.0, 4.0, 2.0, 0.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1015625, -4.941162109375, -4.78076171875, -4.620361328125, -4.4599609375, -4.299560546875, -4.13916015625, -3.978759765625, -3.818359375, -3.657958984375, -3.49755859375, -3.337158203125, -3.1767578125, -3.016357421875, -2.85595703125, -2.695556640625, -2.53515625, -2.374755859375, -2.21435546875, -2.053955078125, -1.8935546875, -1.733154296875, -1.57275390625, -1.412353515625, -1.251953125, -1.091552734375, -0.93115234375, -0.770751953125, -0.6103515625, -0.449951171875, -0.28955078125, -0.129150390625, 0.03125, 0.191650390625, 0.35205078125, 0.512451171875, 0.6728515625, 0.833251953125, 0.99365234375, 1.154052734375, 1.314453125, 1.474853515625, 1.63525390625, 1.795654296875, 1.9560546875, 2.116455078125, 2.27685546875, 2.437255859375, 2.59765625, 2.758056640625, 2.91845703125, 3.078857421875, 3.2392578125, 3.399658203125, 3.56005859375, 3.720458984375, 3.880859375, 4.041259765625, 4.20166015625, 4.362060546875, 4.5224609375, 4.682861328125, 4.84326171875, 5.003662109375, 5.1640625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 4.0, 7.0, 13.0, 27.0, 27.0, 66.0, 77.0, 117.0, 217.0, 317.0, 515.0, 799.0, 1400.0, 2270.0, 3757.0, 6414.0, 10554.0, 17633.0, 29643.0, 47784.0, 74131.0, 108368.0, 142226.0, 158076.0, 142075.0, 108386.0, 73503.0, 47142.0, 29004.0, 17642.0, 10383.0, 6315.0, 3810.0, 2296.0, 1308.0, 834.0, 520.0, 346.0, 188.0, 136.0, 66.0, 49.0, 37.0, 28.0, 22.0, 6.0, 8.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.681640625, -0.6592864990234375, -0.636932373046875, -0.6145782470703125, -0.59222412109375, -0.5698699951171875, -0.547515869140625, -0.5251617431640625, -0.5028076171875, -0.4804534912109375, -0.458099365234375, -0.4357452392578125, -0.41339111328125, -0.3910369873046875, -0.368682861328125, -0.3463287353515625, -0.323974609375, -0.3016204833984375, -0.279266357421875, -0.2569122314453125, -0.23455810546875, -0.2122039794921875, -0.189849853515625, -0.1674957275390625, -0.1451416015625, -0.1227874755859375, -0.100433349609375, -0.0780792236328125, -0.05572509765625, -0.0333709716796875, -0.011016845703125, 0.0113372802734375, 0.03369140625, 0.0560455322265625, 0.078399658203125, 0.1007537841796875, 0.12310791015625, 0.1454620361328125, 0.167816162109375, 0.1901702880859375, 0.2125244140625, 0.2348785400390625, 0.257232666015625, 0.2795867919921875, 0.30194091796875, 0.3242950439453125, 0.346649169921875, 0.3690032958984375, 0.391357421875, 0.4137115478515625, 0.436065673828125, 0.4584197998046875, 0.48077392578125, 0.5031280517578125, 0.525482177734375, 0.5478363037109375, 0.5701904296875, 0.5925445556640625, 0.614898681640625, 0.6372528076171875, 0.65960693359375, 0.6819610595703125, 0.704315185546875, 0.7266693115234375, 0.7490234375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 1.0, 7.0, 6.0, 6.0, 11.0, 11.0, 15.0, 13.0, 17.0, 19.0, 22.0, 31.0, 30.0, 53.0, 46.0, 41.0, 34.0, 43.0, 48.0, 32.0, 55.0, 38.0, 41.0, 56.0, 37.0, 34.0, 46.0, 26.0, 19.0, 35.0, 20.0, 23.0, 15.0, 17.0, 9.0, 10.0, 7.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.6875, -12.2816162109375, -11.875732421875, -11.4698486328125, -11.06396484375, -10.6580810546875, -10.252197265625, -9.8463134765625, -9.4404296875, -9.0345458984375, -8.628662109375, -8.2227783203125, -7.81689453125, -7.4110107421875, -7.005126953125, -6.5992431640625, -6.193359375, -5.7874755859375, -5.381591796875, -4.9757080078125, -4.56982421875, -4.1639404296875, -3.758056640625, -3.3521728515625, -2.9462890625, -2.5404052734375, -2.134521484375, -1.7286376953125, -1.32275390625, -0.9168701171875, -0.510986328125, -0.1051025390625, 0.30078125, 0.7066650390625, 1.112548828125, 1.5184326171875, 1.92431640625, 2.3302001953125, 2.736083984375, 3.1419677734375, 3.5478515625, 3.9537353515625, 4.359619140625, 4.7655029296875, 5.17138671875, 5.5772705078125, 5.983154296875, 6.3890380859375, 6.794921875, 7.2008056640625, 7.606689453125, 8.0125732421875, 8.41845703125, 8.8243408203125, 9.230224609375, 9.6361083984375, 10.0419921875, 10.4478759765625, 10.853759765625, 11.2596435546875, 11.66552734375, 12.0714111328125, 12.477294921875, 12.8831787109375, 13.2890625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 11.0, 14.0, 36.0, 53.0, 105.0, 185.0, 362.0, 891.0, 3050.0, 16161.0, 216155.0, 731269.0, 69521.0, 7589.0, 1852.0, 661.0, 274.0, 139.0, 100.0, 35.0, 37.0, 24.0, 13.0, 7.0, 1.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54541015625, -0.5254364013671875, -0.505462646484375, -0.4854888916015625, -0.46551513671875, -0.4455413818359375, -0.425567626953125, -0.4055938720703125, -0.3856201171875, -0.3656463623046875, -0.345672607421875, -0.3256988525390625, -0.30572509765625, -0.2857513427734375, -0.265777587890625, -0.2458038330078125, -0.225830078125, -0.2058563232421875, -0.185882568359375, -0.1659088134765625, -0.14593505859375, -0.1259613037109375, -0.105987548828125, -0.0860137939453125, -0.0660400390625, -0.0460662841796875, -0.026092529296875, -0.0061187744140625, 0.01385498046875, 0.0338287353515625, 0.053802490234375, 0.0737762451171875, 0.09375, 0.1137237548828125, 0.133697509765625, 0.1536712646484375, 0.17364501953125, 0.1936187744140625, 0.213592529296875, 0.2335662841796875, 0.2535400390625, 0.2735137939453125, 0.293487548828125, 0.3134613037109375, 0.33343505859375, 0.3534088134765625, 0.373382568359375, 0.3933563232421875, 0.413330078125, 0.4333038330078125, 0.453277587890625, 0.4732513427734375, 0.49322509765625, 0.5131988525390625, 0.533172607421875, 0.5531463623046875, 0.5731201171875, 0.5930938720703125, 0.613067626953125, 0.6330413818359375, 0.65301513671875, 0.6729888916015625, 0.692962646484375, 0.7129364013671875, 0.73291015625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 1.0, 2.0, 6.0, 9.0, 18.0, 26.0, 34.0, 69.0, 81.0, 96.0, 107.0, 113.0, 98.0, 87.0, 68.0, 60.0, 42.0, 36.0, 17.0, 14.0, 8.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014150142669677734, -0.0001345369964838028, -0.00012757256627082825, -0.0001206081360578537, -0.00011364370584487915, -0.0001066792756319046, -9.971484541893005e-05, -9.27504152059555e-05, -8.578598499298096e-05, -7.882155478000641e-05, -7.185712456703186e-05, -6.489269435405731e-05, -5.7928264141082764e-05, -5.0963833928108215e-05, -4.399940371513367e-05, -3.703497350215912e-05, -3.007054328918457e-05, -2.3106113076210022e-05, -1.6141682863235474e-05, -9.177252650260925e-06, -2.212822437286377e-06, 4.751607775688171e-06, 1.171603798866272e-05, 1.8680468201637268e-05, 2.5644898414611816e-05, 3.2609328627586365e-05, 3.957375884056091e-05, 4.653818905353546e-05, 5.350261926651001e-05, 6.046704947948456e-05, 6.74314796924591e-05, 7.439590990543365e-05, 8.13603401184082e-05, 8.832477033138275e-05, 9.52892005443573e-05, 0.00010225363075733185, 0.0001092180609703064, 0.00011618249118328094, 0.0001231469213962555, 0.00013011135160923004, 0.0001370757818222046, 0.00014404021203517914, 0.0001510046422481537, 0.00015796907246112823, 0.00016493350267410278, 0.00017189793288707733, 0.00017886236310005188, 0.00018582679331302643, 0.00019279122352600098, 0.00019975565373897552, 0.00020672008395195007, 0.00021368451416492462, 0.00022064894437789917, 0.00022761337459087372, 0.00023457780480384827, 0.00024154223501682281, 0.00024850666522979736, 0.0002554710954427719, 0.00026243552565574646, 0.000269399955868721, 0.00027636438608169556, 0.0002833288162946701, 0.00029029324650764465, 0.0002972576767206192, 0.00030422210693359375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 0.0, 2.0, 7.0, 11.0, 16.0, 19.0, 30.0, 24.0, 42.0, 63.0, 85.0, 143.0, 251.0, 453.0, 892.0, 1753.0, 4001.0, 9248.0, 25488.0, 85157.0, 341789.0, 416606.0, 109179.0, 31916.0, 11673.0, 4823.0, 2244.0, 1144.0, 647.0, 340.0, 187.0, 117.0, 65.0, 34.0, 28.0, 18.0, 18.0, 8.0, 9.0, 7.0, 5.0, 7.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36669921875, -0.354095458984375, -0.34149169921875, -0.328887939453125, -0.3162841796875, -0.303680419921875, -0.29107666015625, -0.278472900390625, -0.265869140625, -0.253265380859375, -0.24066162109375, -0.228057861328125, -0.2154541015625, -0.202850341796875, -0.19024658203125, -0.177642822265625, -0.1650390625, -0.152435302734375, -0.13983154296875, -0.127227783203125, -0.1146240234375, -0.102020263671875, -0.08941650390625, -0.076812744140625, -0.064208984375, -0.051605224609375, -0.03900146484375, -0.026397705078125, -0.0137939453125, -0.001190185546875, 0.01141357421875, 0.024017333984375, 0.03662109375, 0.049224853515625, 0.06182861328125, 0.074432373046875, 0.0870361328125, 0.099639892578125, 0.11224365234375, 0.124847412109375, 0.137451171875, 0.150054931640625, 0.16265869140625, 0.175262451171875, 0.1878662109375, 0.200469970703125, 0.21307373046875, 0.225677490234375, 0.23828125, 0.250885009765625, 0.26348876953125, 0.276092529296875, 0.2886962890625, 0.301300048828125, 0.31390380859375, 0.326507568359375, 0.339111328125, 0.351715087890625, 0.36431884765625, 0.376922607421875, 0.3895263671875, 0.402130126953125, 0.41473388671875, 0.427337646484375, 0.43994140625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 9.0, 7.0, 13.0, 23.0, 35.0, 54.0, 128.0, 178.0, 174.0, 134.0, 90.0, 47.0, 34.0, 20.0, 13.0, 6.0, 6.0, 5.0, 6.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.16748046875, -0.1624622344970703, -0.15744400024414062, -0.15242576599121094, -0.14740753173828125, -0.14238929748535156, -0.13737106323242188, -0.1323528289794922, -0.1273345947265625, -0.12231636047363281, -0.11729812622070312, -0.11227989196777344, -0.10726165771484375, -0.10224342346191406, -0.09722518920898438, -0.09220695495605469, -0.087188720703125, -0.08217048645019531, -0.07715225219726562, -0.07213401794433594, -0.06711578369140625, -0.06209754943847656, -0.057079315185546875, -0.05206108093261719, -0.0470428466796875, -0.04202461242675781, -0.037006378173828125, -0.03198814392089844, -0.02696990966796875, -0.021951675415039062, -0.016933441162109375, -0.011915206909179688, -0.00689697265625, -0.0018787384033203125, 0.003139495849609375, 0.008157730102539062, 0.01317596435546875, 0.018194198608398438, 0.023212432861328125, 0.028230667114257812, 0.0332489013671875, 0.03826713562011719, 0.043285369873046875, 0.04830360412597656, 0.05332183837890625, 0.05834007263183594, 0.06335830688476562, 0.06837654113769531, 0.073394775390625, 0.07841300964355469, 0.08343124389648438, 0.08844947814941406, 0.09346771240234375, 0.09848594665527344, 0.10350418090820312, 0.10852241516113281, 0.1135406494140625, 0.11855888366699219, 0.12357711791992188, 0.12859535217285156, 0.13361358642578125, 0.13863182067871094, 0.14365005493164062, 0.1486682891845703, 0.1536865234375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 3.0, 9.0, 17.0, 20.0, 18.0, 17.0, 25.0, 30.0, 40.0, 44.0, 49.0, 52.0, 60.0, 65.0, 52.0, 64.0, 62.0, 54.0, 57.0, 50.0, 39.0, 33.0, 30.0, 26.0, 19.0, 23.0, 12.0, 6.0, 9.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.976248264312744, -5.78230094909668, -5.588353633880615, -5.394406795501709, -5.2004594802856445, -5.00651216506958, -4.812564849853516, -4.618618011474609, -4.424670696258545, -4.2307233810424805, -4.036776065826416, -3.8428289890289307, -3.6488819122314453, -3.454934597015381, -3.2609872817993164, -3.067040205001831, -2.8730928897857666, -2.679145574569702, -2.485198497772217, -2.2912511825561523, -2.097304105758667, -1.9033567905426025, -1.7094095945358276, -1.5154623985290527, -1.3215152025222778, -1.127568006515503, -0.933620810508728, -0.7396735548973083, -0.5457263588905334, -0.35177916288375854, -0.15783190727233887, 0.036115288734436035, 0.23006248474121094, 0.42400968074798584, 0.6179568767547607, 0.8119041323661804, 1.0058512687683105, 1.199798583984375, 1.39374577999115, 1.5876929759979248, 1.7816401720046997, 1.9755873680114746, 2.169534683227539, 2.3634817600250244, 2.557429075241089, 2.751376152038574, 2.9453234672546387, 3.139270782470703, 3.3332178592681885, 3.527165174484253, 3.7211122512817383, 3.9150595664978027, 4.109006881713867, 4.302953720092773, 4.496901035308838, 4.690848350524902, 4.884795665740967, 5.078742980957031, 5.272690296173096, 5.466637134552002, 5.660584449768066, 5.854531764984131, 6.048479080200195, 6.242425918579102, 6.436373233795166]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 11.0, 11.0, 11.0, 14.0, 16.0, 16.0, 11.0, 19.0, 34.0, 18.0, 40.0, 35.0, 31.0, 39.0, 45.0, 36.0, 38.0, 45.0, 32.0, 28.0, 40.0, 45.0, 32.0, 44.0, 39.0, 19.0, 32.0, 25.0, 34.0, 16.0, 16.0, 22.0, 15.0, 20.0, 9.0, 11.0, 10.0, 7.0, 4.0, 3.0, 3.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.036832809448242, -4.886883735656738, -4.736935138702393, -4.586986064910889, -4.437037467956543, -4.287088394165039, -4.137139320373535, -3.9871904850006104, -3.8372416496276855, -3.6872928142547607, -3.537343978881836, -3.387394905090332, -3.2374460697174072, -3.0874972343444824, -2.9375481605529785, -2.7875993251800537, -2.637650489807129, -2.487701654434204, -2.3377528190612793, -2.1878037452697754, -2.0378549098968506, -1.8879060745239258, -1.7379571199417114, -1.588008165359497, -1.4380593299865723, -1.2881104946136475, -1.138161540031433, -0.9882126450538635, -0.838263750076294, -0.6883148550987244, -0.5383659601211548, -0.38841700553894043, -0.23846817016601562, -0.08851927518844604, 0.061429619789123535, 0.21137851476669312, 0.3613274097442627, 0.5112763047218323, 0.6612251996994019, 0.8111741542816162, 0.961122989654541, 1.1110718250274658, 1.2610207796096802, 1.4109697341918945, 1.5609185695648193, 1.7108674049377441, 1.8608163595199585, 2.010765314102173, 2.1607141494750977, 2.3106629848480225, 2.4606118202209473, 2.610560894012451, 2.760509729385376, 2.910458564758301, 3.0604076385498047, 3.2103564739227295, 3.3603053092956543, 3.510254144668579, 3.660202980041504, 3.810152053833008, 3.9601008892059326, 4.110049724578857, 4.259998798370361, 4.409947395324707, 4.559896469116211]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 15.0, 15.0, 28.0, 39.0, 66.0, 89.0, 103.0, 237.0, 390.0, 710.0, 1489.0, 3402.0, 8678.0, 23506.0, 64422.0, 158140.0, 283353.0, 269748.0, 142952.0, 56595.0, 20763.0, 7706.0, 3129.0, 1398.0, 644.0, 353.0, 211.0, 122.0, 76.0, 44.0, 40.0, 29.0, 23.0, 11.0, 12.0, 8.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0859375, -7.8065185546875, -7.527099609375, -7.2476806640625, -6.96826171875, -6.6888427734375, -6.409423828125, -6.1300048828125, -5.8505859375, -5.5711669921875, -5.291748046875, -5.0123291015625, -4.73291015625, -4.4534912109375, -4.174072265625, -3.8946533203125, -3.615234375, -3.3358154296875, -3.056396484375, -2.7769775390625, -2.49755859375, -2.2181396484375, -1.938720703125, -1.6593017578125, -1.3798828125, -1.1004638671875, -0.821044921875, -0.5416259765625, -0.26220703125, 0.0172119140625, 0.296630859375, 0.5760498046875, 0.85546875, 1.1348876953125, 1.414306640625, 1.6937255859375, 1.97314453125, 2.2525634765625, 2.531982421875, 2.8114013671875, 3.0908203125, 3.3702392578125, 3.649658203125, 3.9290771484375, 4.20849609375, 4.4879150390625, 4.767333984375, 5.0467529296875, 5.326171875, 5.6055908203125, 5.885009765625, 6.1644287109375, 6.44384765625, 6.7232666015625, 7.002685546875, 7.2821044921875, 7.5615234375, 7.8409423828125, 8.120361328125, 8.3997802734375, 8.67919921875, 8.9586181640625, 9.238037109375, 9.5174560546875, 9.796875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 7.0, 9.0, 17.0, 12.0, 21.0, 30.0, 26.0, 26.0, 28.0, 44.0, 39.0, 46.0, 53.0, 68.0, 41.0, 47.0, 56.0, 64.0, 48.0, 49.0, 52.0, 24.0, 28.0, 34.0, 19.0, 24.0, 14.0, 17.0, 16.0, 12.0, 11.0, 3.0, 4.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6328125, -9.292724609375, -8.95263671875, -8.612548828125, -8.2724609375, -7.932373046875, -7.59228515625, -7.252197265625, -6.912109375, -6.572021484375, -6.23193359375, -5.891845703125, -5.5517578125, -5.211669921875, -4.87158203125, -4.531494140625, -4.19140625, -3.851318359375, -3.51123046875, -3.171142578125, -2.8310546875, -2.490966796875, -2.15087890625, -1.810791015625, -1.470703125, -1.130615234375, -0.79052734375, -0.450439453125, -0.1103515625, 0.229736328125, 0.56982421875, 0.909912109375, 1.25, 1.590087890625, 1.93017578125, 2.270263671875, 2.6103515625, 2.950439453125, 3.29052734375, 3.630615234375, 3.970703125, 4.310791015625, 4.65087890625, 4.990966796875, 5.3310546875, 5.671142578125, 6.01123046875, 6.351318359375, 6.69140625, 7.031494140625, 7.37158203125, 7.711669921875, 8.0517578125, 8.391845703125, 8.73193359375, 9.072021484375, 9.412109375, 9.752197265625, 10.09228515625, 10.432373046875, 10.7724609375, 11.112548828125, 11.45263671875, 11.792724609375, 12.1328125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 6.0, 6.0, 12.0, 10.0, 10.0, 12.0, 19.0, 37.0, 55.0, 51.0, 74.0, 118.0, 165.0, 267.0, 451.0, 773.0, 1591.0, 3880.0, 10974.0, 33823.0, 110102.0, 294960.0, 355578.0, 159620.0, 50362.0, 15594.0, 5481.0, 2066.0, 982.0, 535.0, 289.0, 198.0, 132.0, 74.0, 73.0, 35.0, 38.0, 26.0, 12.0, 24.0, 12.0, 7.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.734375, -10.353271484375, -9.97216796875, -9.591064453125, -9.2099609375, -8.828857421875, -8.44775390625, -8.066650390625, -7.685546875, -7.304443359375, -6.92333984375, -6.542236328125, -6.1611328125, -5.780029296875, -5.39892578125, -5.017822265625, -4.63671875, -4.255615234375, -3.87451171875, -3.493408203125, -3.1123046875, -2.731201171875, -2.35009765625, -1.968994140625, -1.587890625, -1.206787109375, -0.82568359375, -0.444580078125, -0.0634765625, 0.317626953125, 0.69873046875, 1.079833984375, 1.4609375, 1.842041015625, 2.22314453125, 2.604248046875, 2.9853515625, 3.366455078125, 3.74755859375, 4.128662109375, 4.509765625, 4.890869140625, 5.27197265625, 5.653076171875, 6.0341796875, 6.415283203125, 6.79638671875, 7.177490234375, 7.55859375, 7.939697265625, 8.32080078125, 8.701904296875, 9.0830078125, 9.464111328125, 9.84521484375, 10.226318359375, 10.607421875, 10.988525390625, 11.36962890625, 11.750732421875, 12.1318359375, 12.512939453125, 12.89404296875, 13.275146484375, 13.65625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 11.0, 10.0, 9.0, 12.0, 12.0, 18.0, 21.0, 15.0, 46.0, 40.0, 43.0, 46.0, 52.0, 50.0, 60.0, 61.0, 52.0, 51.0, 62.0, 54.0, 38.0, 38.0, 31.0, 38.0, 26.0, 22.0, 18.0, 14.0, 10.0, 9.0, 6.0, 4.0, 6.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5625, -13.1708984375, -12.779296875, -12.3876953125, -11.99609375, -11.6044921875, -11.212890625, -10.8212890625, -10.4296875, -10.0380859375, -9.646484375, -9.2548828125, -8.86328125, -8.4716796875, -8.080078125, -7.6884765625, -7.296875, -6.9052734375, -6.513671875, -6.1220703125, -5.73046875, -5.3388671875, -4.947265625, -4.5556640625, -4.1640625, -3.7724609375, -3.380859375, -2.9892578125, -2.59765625, -2.2060546875, -1.814453125, -1.4228515625, -1.03125, -0.6396484375, -0.248046875, 0.1435546875, 0.53515625, 0.9267578125, 1.318359375, 1.7099609375, 2.1015625, 2.4931640625, 2.884765625, 3.2763671875, 3.66796875, 4.0595703125, 4.451171875, 4.8427734375, 5.234375, 5.6259765625, 6.017578125, 6.4091796875, 6.80078125, 7.1923828125, 7.583984375, 7.9755859375, 8.3671875, 8.7587890625, 9.150390625, 9.5419921875, 9.93359375, 10.3251953125, 10.716796875, 11.1083984375, 11.5]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 10.0, 11.0, 25.0, 24.0, 51.0, 88.0, 110.0, 222.0, 331.0, 550.0, 1003.0, 1949.0, 4142.0, 9461.0, 22572.0, 55225.0, 126667.0, 237277.0, 321876.0, 150471.0, 67134.0, 27870.0, 11311.0, 4979.0, 2375.0, 1209.0, 682.0, 336.0, 209.0, 130.0, 82.0, 45.0, 42.0, 23.0, 16.0, 12.0, 9.0, 6.0, 9.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.212890625, -2.149871826171875, -2.08685302734375, -2.023834228515625, -1.9608154296875, -1.897796630859375, -1.83477783203125, -1.771759033203125, -1.708740234375, -1.645721435546875, -1.58270263671875, -1.519683837890625, -1.4566650390625, -1.393646240234375, -1.33062744140625, -1.267608642578125, -1.20458984375, -1.141571044921875, -1.07855224609375, -1.015533447265625, -0.9525146484375, -0.889495849609375, -0.82647705078125, -0.763458251953125, -0.700439453125, -0.637420654296875, -0.57440185546875, -0.511383056640625, -0.4483642578125, -0.385345458984375, -0.32232666015625, -0.259307861328125, -0.1962890625, -0.133270263671875, -0.07025146484375, -0.007232666015625, 0.0557861328125, 0.118804931640625, 0.18182373046875, 0.244842529296875, 0.307861328125, 0.370880126953125, 0.43389892578125, 0.496917724609375, 0.5599365234375, 0.622955322265625, 0.68597412109375, 0.748992919921875, 0.81201171875, 0.875030517578125, 0.93804931640625, 1.001068115234375, 1.0640869140625, 1.127105712890625, 1.19012451171875, 1.253143310546875, 1.316162109375, 1.379180908203125, 1.44219970703125, 1.505218505859375, 1.5682373046875, 1.631256103515625, 1.69427490234375, 1.757293701171875, 1.8203125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 7.0, 4.0, 13.0, 10.0, 15.0, 25.0, 30.0, 38.0, 29.0, 41.0, 56.0, 48.0, 68.0, 73.0, 120.0, 78.0, 66.0, 57.0, 48.0, 38.0, 28.0, 19.0, 26.0, 18.0, 11.0, 15.0, 5.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00041675567626953125, -0.00040189921855926514, -0.000387042760848999, -0.0003721863031387329, -0.0003573298454284668, -0.0003424733877182007, -0.00032761693000793457, -0.00031276047229766846, -0.00029790401458740234, -0.00028304755687713623, -0.0002681910991668701, -0.000253334641456604, -0.0002384781837463379, -0.00022362172603607178, -0.00020876526832580566, -0.00019390881061553955, -0.00017905235290527344, -0.00016419589519500732, -0.0001493394374847412, -0.0001344829797744751, -0.00011962652206420898, -0.00010477006435394287, -8.991360664367676e-05, -7.505714893341064e-05, -6.020069122314453e-05, -4.534423351287842e-05, -3.0487775802612305e-05, -1.563131809234619e-05, -7.748603820800781e-07, 1.4081597328186035e-05, 2.893805503845215e-05, 4.379451274871826e-05, 5.8650970458984375e-05, 7.350742816925049e-05, 8.83638858795166e-05, 0.00010322034358978271, 0.00011807680130004883, 0.00013293325901031494, 0.00014778971672058105, 0.00016264617443084717, 0.00017750263214111328, 0.0001923590898513794, 0.0002072155475616455, 0.00022207200527191162, 0.00023692846298217773, 0.00025178492069244385, 0.00026664137840270996, 0.0002814978361129761, 0.0002963542938232422, 0.0003112107515335083, 0.0003260672092437744, 0.00034092366695404053, 0.00035578012466430664, 0.00037063658237457275, 0.00038549304008483887, 0.000400349497795105, 0.0004152059555053711, 0.0004300624132156372, 0.0004449188709259033, 0.00045977532863616943, 0.00047463178634643555, 0.0004894882440567017, 0.0005043447017669678, 0.0005192011594772339, 0.0005340576171875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 1.0, 4.0, 7.0, 18.0, 18.0, 24.0, 60.0, 62.0, 106.0, 162.0, 245.0, 400.0, 618.0, 985.0, 1658.0, 2887.0, 6044.0, 13799.0, 35773.0, 101299.0, 244493.0, 374755.0, 164308.0, 60538.0, 21836.0, 8736.0, 4175.0, 2191.0, 1227.0, 760.0, 456.0, 321.0, 192.0, 157.0, 94.0, 52.0, 31.0, 29.0, 18.0, 8.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.55078125, -2.466461181640625, -2.38214111328125, -2.297821044921875, -2.2135009765625, -2.129180908203125, -2.04486083984375, -1.960540771484375, -1.876220703125, -1.791900634765625, -1.70758056640625, -1.623260498046875, -1.5389404296875, -1.454620361328125, -1.37030029296875, -1.285980224609375, -1.20166015625, -1.117340087890625, -1.03302001953125, -0.948699951171875, -0.8643798828125, -0.780059814453125, -0.69573974609375, -0.611419677734375, -0.527099609375, -0.442779541015625, -0.35845947265625, -0.274139404296875, -0.1898193359375, -0.105499267578125, -0.02117919921875, 0.063140869140625, 0.1474609375, 0.231781005859375, 0.31610107421875, 0.400421142578125, 0.4847412109375, 0.569061279296875, 0.65338134765625, 0.737701416015625, 0.822021484375, 0.906341552734375, 0.99066162109375, 1.074981689453125, 1.1593017578125, 1.243621826171875, 1.32794189453125, 1.412261962890625, 1.49658203125, 1.580902099609375, 1.66522216796875, 1.749542236328125, 1.8338623046875, 1.918182373046875, 2.00250244140625, 2.086822509765625, 2.171142578125, 2.255462646484375, 2.33978271484375, 2.424102783203125, 2.5084228515625, 2.592742919921875, 2.67706298828125, 2.761383056640625, 2.845703125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 2.0, 5.0, 3.0, 10.0, 16.0, 25.0, 26.0, 32.0, 40.0, 56.0, 60.0, 76.0, 112.0, 119.0, 95.0, 72.0, 59.0, 49.0, 26.0, 25.0, 24.0, 13.0, 17.0, 12.0, 7.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.216796875, -2.153564453125, -2.09033203125, -2.027099609375, -1.9638671875, -1.900634765625, -1.83740234375, -1.774169921875, -1.7109375, -1.647705078125, -1.58447265625, -1.521240234375, -1.4580078125, -1.394775390625, -1.33154296875, -1.268310546875, -1.205078125, -1.141845703125, -1.07861328125, -1.015380859375, -0.9521484375, -0.888916015625, -0.82568359375, -0.762451171875, -0.69921875, -0.635986328125, -0.57275390625, -0.509521484375, -0.4462890625, -0.383056640625, -0.31982421875, -0.256591796875, -0.193359375, -0.130126953125, -0.06689453125, -0.003662109375, 0.0595703125, 0.122802734375, 0.18603515625, 0.249267578125, 0.3125, 0.375732421875, 0.43896484375, 0.502197265625, 0.5654296875, 0.628662109375, 0.69189453125, 0.755126953125, 0.818359375, 0.881591796875, 0.94482421875, 1.008056640625, 1.0712890625, 1.134521484375, 1.19775390625, 1.260986328125, 1.32421875, 1.387451171875, 1.45068359375, 1.513916015625, 1.5771484375, 1.640380859375, 1.70361328125, 1.766845703125, 1.830078125]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 8.0, 6.0, 9.0, 11.0, 17.0, 37.0, 36.0, 50.0, 45.0, 59.0, 80.0, 88.0, 96.0, 86.0, 65.0, 72.0, 45.0, 53.0, 44.0, 24.0, 16.0, 23.0, 9.0, 7.0, 9.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.547061920166016, -18.023813247680664, -17.500564575195312, -16.97731590270996, -16.45406723022461, -15.930818557739258, -15.407569885253906, -14.884321212768555, -14.361072540283203, -13.837823867797852, -13.3145751953125, -12.791326522827148, -12.268077850341797, -11.744829177856445, -11.221580505371094, -10.698331832885742, -10.175084114074707, -9.651835441589355, -9.128586769104004, -8.605338096618652, -8.0820894241333, -7.558840751647949, -7.035592555999756, -6.512343883514404, -5.989095211029053, -5.465846538543701, -4.94259786605835, -4.419349670410156, -3.8961007595062256, -3.372852087020874, -2.8496036529541016, -2.32635498046875, -1.8031072616577148, -1.2798585891723633, -0.7566100358963013, -0.23336148262023926, 0.2898871898651123, 0.8131358623504639, 1.3363842964172363, 1.859632968902588, 2.3828816413879395, 2.906130313873291, 3.4293789863586426, 3.952627420425415, 4.4758758544921875, 4.999124526977539, 5.522373199462891, 6.045621871948242, 6.568870544433594, 7.092119216918945, 7.615367889404297, 8.138616561889648, 8.661865234375, 9.185113906860352, 9.708362579345703, 10.231611251831055, 10.754859924316406, 11.278108596801758, 11.80135726928711, 12.324605941772461, 12.847854614257812, 13.371103286743164, 13.894351959228516, 14.417600631713867, 14.940848350524902]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 3.0, 8.0, 3.0, 4.0, 8.0, 10.0, 14.0, 21.0, 15.0, 13.0, 25.0, 19.0, 20.0, 20.0, 23.0, 30.0, 33.0, 47.0, 31.0, 34.0, 38.0, 22.0, 26.0, 44.0, 41.0, 35.0, 31.0, 35.0, 31.0, 26.0, 43.0, 29.0, 30.0, 24.0, 19.0, 21.0, 18.0, 19.0, 25.0, 12.0, 11.0, 12.0, 6.0, 6.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0], "bins": [-15.537579536437988, -15.07518482208252, -14.612789154052734, -14.150394439697266, -13.687999725341797, -13.225604057312012, -12.763209342956543, -12.300813674926758, -11.838418960571289, -11.37602424621582, -10.913628578186035, -10.451233863830566, -9.988839149475098, -9.526443481445312, -9.064048767089844, -8.601654052734375, -8.139259338378906, -7.676864147186279, -7.2144694328308105, -6.752074241638184, -6.289679050445557, -5.82728385925293, -5.364889144897461, -4.902493953704834, -4.440098762512207, -3.977703809738159, -3.5153086185455322, -3.0529136657714844, -2.5905184745788574, -2.1281235218048096, -1.6657285690307617, -1.2033333778381348, -0.7409381866455078, -0.2785431444644928, 0.18385189771652222, 0.6462469100952148, 1.1086419820785522, 1.5710370540618896, 2.0334320068359375, 2.4958271980285645, 2.9582221508026123, 3.42061710357666, 3.883012294769287, 4.345407485961914, 4.807802200317383, 5.27019739151001, 5.732592582702637, 6.1949872970581055, 6.657382488250732, 7.119777679443359, 7.582172393798828, 8.044567108154297, 8.506962776184082, 8.96935749053955, 9.431753158569336, 9.894147872924805, 10.356542587280273, 10.818937301635742, 11.281332969665527, 11.743727684020996, 12.206122398376465, 12.66851806640625, 13.130912780761719, 13.593307495117188, 14.055703163146973]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 5.0, 3.0, 5.0, 10.0, 11.0, 18.0, 34.0, 29.0, 33.0, 58.0, 74.0, 109.0, 153.0, 176.0, 241.0, 343.0, 497.0, 668.0, 875.0, 1193.0, 1634.0, 2103.0, 2648.0, 3271.0, 4019.0, 5013.0, 1002522.0, 5189.0, 4311.0, 3587.0, 2847.0, 2304.0, 1723.0, 1282.0, 927.0, 716.0, 531.0, 391.0, 270.0, 201.0, 153.0, 122.0, 82.0, 61.0, 47.0, 34.0, 15.0, 28.0, 20.0, 7.0, 8.0, 1.0, 8.0, 3.0, 0.0, 2.0, 2.0], "bins": [-11.096685409545898, -10.766871452331543, -10.437057495117188, -10.107244491577148, -9.777430534362793, -9.447616577148438, -9.117803573608398, -8.787989616394043, -8.458175659179688, -8.128361701965332, -7.798548221588135, -7.4687347412109375, -7.138920783996582, -6.809106826782227, -6.479293346405029, -6.149479866027832, -5.819665908813477, -5.489851951599121, -5.160038471221924, -4.830224990844727, -4.500411033630371, -4.170597076416016, -3.8407835960388184, -3.510969877243042, -3.1811561584472656, -2.8513424396514893, -2.521528720855713, -2.1917150020599365, -1.8619012832641602, -1.5320875644683838, -1.2022738456726074, -0.872460126876831, -0.5426464080810547, -0.21283268928527832, 0.11698102951049805, 0.4467947483062744, 0.7766084671020508, 1.1064221858978271, 1.4362359046936035, 1.7660496234893799, 2.0958633422851562, 2.4256770610809326, 2.755490779876709, 3.0853044986724854, 3.4151182174682617, 3.744931936264038, 4.0747456550598145, 4.404559135437012, 4.734373092651367, 5.064187049865723, 5.39400053024292, 5.723814010620117, 6.053627967834473, 6.383441925048828, 6.713255405426025, 7.043068885803223, 7.372882843017578, 7.702696800231934, 8.032510757446289, 8.362323760986328, 8.692137718200684, 9.021951675415039, 9.351764678955078, 9.681578636169434, 10.011392593383789]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 7.0, 9.0, 16.0, 33.0, 89.0, 255.0, 1164.0, 9170.0, 51303952.0, 146614.0, 7657.0, 982.0, 224.0, 104.0, 50.0, 22.0, 10.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.45854949951172, -88.89169311523438, -85.32483673095703, -81.75798034667969, -78.19112396240234, -74.624267578125, -71.05740356445312, -67.49055480957031, -63.9236946105957, -60.35683822631836, -56.789981842041016, -53.223121643066406, -49.65626525878906, -46.08940887451172, -42.522552490234375, -38.95569610595703, -35.38883972167969, -31.821983337402344, -28.255126953125, -24.688268661499023, -21.12141227722168, -17.554555892944336, -13.98769760131836, -10.420841217041016, -6.853984832763672, -3.28712797164917, 0.27972888946533203, 3.846586227416992, 7.413442611694336, 10.98029899597168, 14.547157287597656, 18.114013671875, 21.680877685546875, 25.24773406982422, 28.814590454101562, 32.381446838378906, 35.94830322265625, 39.515159606933594, 43.0820198059082, 46.64887619018555, 50.21573257446289, 53.782588958740234, 57.34944534301758, 60.91630554199219, 64.48316192626953, 68.05001831054688, 71.61687469482422, 75.18373107910156, 78.7505874633789, 82.31744384765625, 85.8843002319336, 89.45115661621094, 93.01801300048828, 96.58486938476562, 100.1517333984375, 103.71858215332031, 107.28544616699219, 110.85230255126953, 114.41915893554688, 117.98601531982422, 121.55287170410156, 125.1197280883789, 128.68658447265625, 132.25344848632812, 135.82029724121094]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 10.0, 16.0, 30.0, 22.0, 54.0, 90.0, 139.0, 179.0, 291.0, 497.0, 695.0, 1118.0, 1626.0, 2453.0, 3861.0, 5919.0, 8511.0, 12899.0, 19458.0, 28723.0, 42699.0, 62787.0, 92466.0, 133554.0, 185902.0, 246539.0, 306661.0, 528397.0, 3318210.0, 325833.0, 269777.0, 208488.0, 151507.0, 106717.0, 73231.0, 50195.0, 33586.0, 22509.0, 15148.0, 10190.0, 7066.0, 4660.0, 3002.0, 2060.0, 1334.0, 836.0, 543.0, 344.0, 230.0, 118.0, 101.0, 56.0, 35.0, 27.0, 18.0, 19.0, 6.0, 1.0, 3.0], "bins": [-3.310546875, -3.2108154296875, -3.111083984375, -3.0113525390625, -2.91162109375, -2.8118896484375, -2.712158203125, -2.6124267578125, -2.5126953125, -2.4129638671875, -2.313232421875, -2.2135009765625, -2.11376953125, -2.0140380859375, -1.914306640625, -1.8145751953125, -1.71484375, -1.6151123046875, -1.515380859375, -1.4156494140625, -1.31591796875, -1.2161865234375, -1.116455078125, -1.0167236328125, -0.9169921875, -0.8172607421875, -0.717529296875, -0.6177978515625, -0.51806640625, -0.4183349609375, -0.318603515625, -0.2188720703125, -0.119140625, -0.0194091796875, 0.080322265625, 0.1800537109375, 0.27978515625, 0.3795166015625, 0.479248046875, 0.5789794921875, 0.6787109375, 0.7784423828125, 0.878173828125, 0.9779052734375, 1.07763671875, 1.1773681640625, 1.277099609375, 1.3768310546875, 1.4765625, 1.5762939453125, 1.676025390625, 1.7757568359375, 1.87548828125, 1.9752197265625, 2.074951171875, 2.1746826171875, 2.2744140625, 2.3741455078125, 2.473876953125, 2.5736083984375, 2.67333984375, 2.7730712890625, 2.872802734375, 2.9725341796875, 3.072265625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 10.0, 12.0, 9.0, 12.0, 6.0, 17.0, 21.0, 18.0, 10.0, 24.0, 39.0, 27.0, 40.0, 37.0, 31.0, 46.0, 48.0, 221.0, 900.0, 44.0, 34.0, 48.0, 37.0, 38.0, 45.0, 40.0, 29.0, 26.0, 20.0, 23.0, 18.0, 13.0, 18.0, 16.0, 9.0, 10.0, 8.0, 4.0, 10.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.0625, -80.5556640625, -78.048828125, -75.5419921875, -73.03515625, -70.5283203125, -68.021484375, -65.5146484375, -63.0078125, -60.5009765625, -57.994140625, -55.4873046875, -52.98046875, -50.4736328125, -47.966796875, -45.4599609375, -42.953125, -40.4462890625, -37.939453125, -35.4326171875, -32.92578125, -30.4189453125, -27.912109375, -25.4052734375, -22.8984375, -20.3916015625, -17.884765625, -15.3779296875, -12.87109375, -10.3642578125, -7.857421875, -5.3505859375, -2.84375, -0.3369140625, 2.169921875, 4.6767578125, 7.18359375, 9.6904296875, 12.197265625, 14.7041015625, 17.2109375, 19.7177734375, 22.224609375, 24.7314453125, 27.23828125, 29.7451171875, 32.251953125, 34.7587890625, 37.265625, 39.7724609375, 42.279296875, 44.7861328125, 47.29296875, 49.7998046875, 52.306640625, 54.8134765625, 57.3203125, 59.8271484375, 62.333984375, 64.8408203125, 67.34765625, 69.8544921875, 72.361328125, 74.8681640625, 77.375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 8.0, 11.0, 19.0, 36.0, 65.0, 93.0, 142.0, 207.0, 336.0, 480.0, 672.0, 973.0, 1450.0, 2313.0, 3408.0, 5008.0, 7345.0, 11129.0, 17082.0, 25814.0, 38491.0, 57903.0, 86179.0, 124107.0, 171102.0, 225734.0, 281775.0, 334722.0, 3445304.0, 353464.0, 286459.0, 233876.0, 178104.0, 127460.0, 89102.0, 61001.0, 40204.0, 26767.0, 17635.0, 11891.0, 7744.0, 5215.0, 3539.0, 2254.0, 1525.0, 1075.0, 726.0, 511.0, 355.0, 204.0, 132.0, 106.0, 71.0, 43.0, 28.0, 17.0, 13.0, 7.0, 4.0, 4.0, 4.0], "bins": [-2.671875, -2.587188720703125, -2.50250244140625, -2.417816162109375, -2.3331298828125, -2.248443603515625, -2.16375732421875, -2.079071044921875, -1.994384765625, -1.909698486328125, -1.82501220703125, -1.740325927734375, -1.6556396484375, -1.570953369140625, -1.48626708984375, -1.401580810546875, -1.31689453125, -1.232208251953125, -1.14752197265625, -1.062835693359375, -0.9781494140625, -0.893463134765625, -0.80877685546875, -0.724090576171875, -0.639404296875, -0.554718017578125, -0.47003173828125, -0.385345458984375, -0.3006591796875, -0.215972900390625, -0.13128662109375, -0.046600341796875, 0.0380859375, 0.122772216796875, 0.20745849609375, 0.292144775390625, 0.3768310546875, 0.461517333984375, 0.54620361328125, 0.630889892578125, 0.715576171875, 0.800262451171875, 0.88494873046875, 0.969635009765625, 1.0543212890625, 1.139007568359375, 1.22369384765625, 1.308380126953125, 1.39306640625, 1.477752685546875, 1.56243896484375, 1.647125244140625, 1.7318115234375, 1.816497802734375, 1.90118408203125, 1.985870361328125, 2.070556640625, 2.155242919921875, 2.23992919921875, 2.324615478515625, 2.4093017578125, 2.493988037109375, 2.57867431640625, 2.663360595703125, 2.748046875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 4.0, 3.0, 6.0, 4.0, 7.0, 5.0, 5.0, 4.0, 13.0, 12.0, 14.0, 23.0, 28.0, 20.0, 26.0, 23.0, 28.0, 32.0, 27.0, 29.0, 29.0, 53.0, 46.0, 48.0, 1052.0, 45.0, 40.0, 29.0, 41.0, 36.0, 32.0, 29.0, 25.0, 23.0, 27.0, 26.0, 22.0, 20.0, 15.0, 10.0, 6.0, 19.0, 10.0, 5.0, 8.0, 6.0, 5.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.21875, -50.50439453125, -48.7900390625, -47.07568359375, -45.361328125, -43.64697265625, -41.9326171875, -40.21826171875, -38.50390625, -36.78955078125, -35.0751953125, -33.36083984375, -31.646484375, -29.93212890625, -28.2177734375, -26.50341796875, -24.7890625, -23.07470703125, -21.3603515625, -19.64599609375, -17.931640625, -16.21728515625, -14.5029296875, -12.78857421875, -11.07421875, -9.35986328125, -7.6455078125, -5.93115234375, -4.216796875, -2.50244140625, -0.7880859375, 0.92626953125, 2.640625, 4.35498046875, 6.0693359375, 7.78369140625, 9.498046875, 11.21240234375, 12.9267578125, 14.64111328125, 16.35546875, 18.06982421875, 19.7841796875, 21.49853515625, 23.212890625, 24.92724609375, 26.6416015625, 28.35595703125, 30.0703125, 31.78466796875, 33.4990234375, 35.21337890625, 36.927734375, 38.64208984375, 40.3564453125, 42.07080078125, 43.78515625, 45.49951171875, 47.2138671875, 48.92822265625, 50.642578125, 52.35693359375, 54.0712890625, 55.78564453125, 57.5]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 5.0, 8.0, 9.0, 15.0, 23.0, 42.0, 53.0, 78.0, 95.0, 148.0, 185.0, 306.0, 398.0, 589.0, 871.0, 1282.0, 1958.0, 2808.0, 4161.0, 6044.0, 8848.0, 13008.0, 19010.0, 27541.0, 40428.0, 57929.0, 86354.0, 320948.0, 5395651.0, 98415.0, 64601.0, 43833.0, 29964.0, 20505.0, 14317.0, 9865.0, 6614.0, 4614.0, 3173.0, 2115.0, 1326.0, 964.0, 716.0, 478.0, 346.0, 230.0, 160.0, 129.0, 94.0, 61.0, 42.0, 30.0, 17.0, 15.0, 6.0, 6.0, 8.0, 6.0, 0.0, 3.0], "bins": [-6.1640625, -5.97222900390625, -5.7803955078125, -5.58856201171875, -5.396728515625, -5.20489501953125, -5.0130615234375, -4.82122802734375, -4.62939453125, -4.43756103515625, -4.2457275390625, -4.05389404296875, -3.862060546875, -3.67022705078125, -3.4783935546875, -3.28656005859375, -3.0947265625, -2.90289306640625, -2.7110595703125, -2.51922607421875, -2.327392578125, -2.13555908203125, -1.9437255859375, -1.75189208984375, -1.56005859375, -1.36822509765625, -1.1763916015625, -0.98455810546875, -0.792724609375, -0.60089111328125, -0.4090576171875, -0.21722412109375, -0.025390625, 0.16644287109375, 0.3582763671875, 0.55010986328125, 0.741943359375, 0.93377685546875, 1.1256103515625, 1.31744384765625, 1.50927734375, 1.70111083984375, 1.8929443359375, 2.08477783203125, 2.276611328125, 2.46844482421875, 2.6602783203125, 2.85211181640625, 3.0439453125, 3.23577880859375, 3.4276123046875, 3.61944580078125, 3.811279296875, 4.00311279296875, 4.1949462890625, 4.38677978515625, 4.57861328125, 4.77044677734375, 4.9622802734375, 5.15411376953125, 5.345947265625, 5.53778076171875, 5.7296142578125, 5.92144775390625, 6.11328125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 3.0, 8.0, 7.0, 11.0, 18.0, 9.0, 12.0, 27.0, 21.0, 25.0, 18.0, 28.0, 33.0, 37.0, 36.0, 44.0, 36.0, 34.0, 42.0, 985.0, 131.0, 50.0, 52.0, 48.0, 26.0, 34.0, 39.0, 30.0, 29.0, 22.0, 26.0, 17.0, 18.0, 8.0, 6.0, 12.0, 11.0, 10.0, 5.0, 6.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-58.5625, -56.87744140625, -55.1923828125, -53.50732421875, -51.822265625, -50.13720703125, -48.4521484375, -46.76708984375, -45.08203125, -43.39697265625, -41.7119140625, -40.02685546875, -38.341796875, -36.65673828125, -34.9716796875, -33.28662109375, -31.6015625, -29.91650390625, -28.2314453125, -26.54638671875, -24.861328125, -23.17626953125, -21.4912109375, -19.80615234375, -18.12109375, -16.43603515625, -14.7509765625, -13.06591796875, -11.380859375, -9.69580078125, -8.0107421875, -6.32568359375, -4.640625, -2.95556640625, -1.2705078125, 0.41455078125, 2.099609375, 3.78466796875, 5.4697265625, 7.15478515625, 8.83984375, 10.52490234375, 12.2099609375, 13.89501953125, 15.580078125, 17.26513671875, 18.9501953125, 20.63525390625, 22.3203125, 24.00537109375, 25.6904296875, 27.37548828125, 29.060546875, 30.74560546875, 32.4306640625, 34.11572265625, 35.80078125, 37.48583984375, 39.1708984375, 40.85595703125, 42.541015625, 44.22607421875, 45.9111328125, 47.59619140625, 49.28125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 8.0, 7.0, 11.0, 22.0, 29.0, 51.0, 119.0, 349.0, 210.0, 91.0, 51.0, 30.0, 14.0, 10.0, 2.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-269.0674133300781, -254.68031311035156, -240.293212890625, -225.90611267089844, -211.51901245117188, -197.1319122314453, -182.74481201171875, -168.3577117919922, -153.97061157226562, -139.58351135253906, -125.1964111328125, -110.80931091308594, -96.42221069335938, -82.03511047363281, -67.64801025390625, -53.26091003417969, -38.873809814453125, -24.486709594726562, -10.099609375, 4.2874908447265625, 18.674591064453125, 33.06169128417969, 47.44879150390625, 61.83589172363281, 76.22299194335938, 90.61009216308594, 104.9971923828125, 119.38429260253906, 133.77139282226562, 148.1584930419922, 162.54559326171875, 176.9326934814453, 191.31976318359375, 205.7068634033203, 220.09396362304688, 234.48106384277344, 248.8681640625, 263.2552490234375, 277.6423645019531, 292.02947998046875, 306.41656494140625, 320.80364990234375, 335.1907653808594, 349.577880859375, 363.9649658203125, 378.35205078125, 392.7391662597656, 407.12628173828125, 421.51336669921875, 435.90045166015625, 450.2875671386719, 464.6746826171875, 479.061767578125, 493.4488525390625, 507.8359680175781, 522.2230834960938, 536.6101684570312, 550.9972534179688, 565.3843994140625, 579.771484375, 594.1585693359375, 608.545654296875, 622.9327392578125, 637.3198852539062, 651.7069702148438]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 3.0, 1.0, 5.0, 7.0, 10.0, 6.0, 7.0, 9.0, 7.0, 17.0, 28.0, 30.0, 37.0, 47.0, 60.0, 131.0, 163.0, 126.0, 82.0, 59.0, 39.0, 36.0, 25.0, 15.0, 9.0, 13.0, 6.0, 6.0, 9.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1054.973388671875, -1024.541015625, -994.108642578125, -963.67626953125, -933.243896484375, -902.8115234375, -872.3790893554688, -841.9467163085938, -811.5143432617188, -781.0819702148438, -750.6495971679688, -720.2172241210938, -689.7847900390625, -659.3524169921875, -628.9200439453125, -598.4876708984375, -568.0552978515625, -537.6229248046875, -507.1905517578125, -476.7581481933594, -446.3257751464844, -415.8934020996094, -385.46099853515625, -355.02862548828125, -324.59625244140625, -294.16387939453125, -263.73150634765625, -233.29910278320312, -202.86672973632812, -172.43435668945312, -142.00196838378906, -111.569580078125, -81.13720703125, -50.70482635498047, -20.272445678710938, 10.159934997558594, 40.592315673828125, 71.02468872070312, 101.45707702636719, 131.88946533203125, 162.32183837890625, 192.75421142578125, 223.1865997314453, 253.61898803710938, 284.0513610839844, 314.4837341308594, 344.9161376953125, 375.3485107421875, 405.7808837890625, 436.2132568359375, 466.6456298828125, 497.0780334472656, 527.5103759765625, 557.9427490234375, 588.3751831054688, 618.8075561523438, 649.2399291992188, 679.6723022460938, 710.1046752929688, 740.5370483398438, 770.969482421875, 801.40185546875, 831.834228515625, 862.2666015625, 892.698974609375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 7.0, 5.0, 10.0, 8.0, 7.0, 19.0, 33.0, 31.0, 67.0, 73.0, 139.0, 195.0, 309.0, 583.0, 1057.0, 2195.0, 4945.0, 14502.0, 94978.0, 4008935.0, 46982.0, 10758.0, 4031.0, 1947.0, 1036.0, 530.0, 306.0, 234.0, 118.0, 95.0, 44.0, 40.0, 24.0, 12.0, 11.0, 12.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.869140625, -0.845245361328125, -0.82135009765625, -0.797454833984375, -0.7735595703125, -0.749664306640625, -0.72576904296875, -0.701873779296875, -0.677978515625, -0.654083251953125, -0.63018798828125, -0.606292724609375, -0.5823974609375, -0.558502197265625, -0.53460693359375, -0.510711669921875, -0.48681640625, -0.462921142578125, -0.43902587890625, -0.415130615234375, -0.3912353515625, -0.367340087890625, -0.34344482421875, -0.319549560546875, -0.295654296875, -0.271759033203125, -0.24786376953125, -0.223968505859375, -0.2000732421875, -0.176177978515625, -0.15228271484375, -0.128387451171875, -0.1044921875, -0.080596923828125, -0.05670166015625, -0.032806396484375, -0.0089111328125, 0.014984130859375, 0.03887939453125, 0.062774658203125, 0.086669921875, 0.110565185546875, 0.13446044921875, 0.158355712890625, 0.1822509765625, 0.206146240234375, 0.23004150390625, 0.253936767578125, 0.27783203125, 0.301727294921875, 0.32562255859375, 0.349517822265625, 0.3734130859375, 0.397308349609375, 0.42120361328125, 0.445098876953125, 0.468994140625, 0.492889404296875, 0.51678466796875, 0.540679931640625, 0.5645751953125, 0.588470458984375, 0.61236572265625, 0.636260986328125, 0.66015625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 13.0, 8.0, 10.0, 12.0, 8.0, 16.0, 16.0, 32.0, 92.0, 597.0, 62.0, 24.0, 18.0, 11.0, 8.0, 11.0, 5.0, 4.0, 3.0, 7.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-0.55224609375, -0.5370216369628906, -0.5217971801757812, -0.5065727233886719, -0.4913482666015625, -0.4761238098144531, -0.46089935302734375, -0.4456748962402344, -0.430450439453125, -0.4152259826660156, -0.40000152587890625, -0.3847770690917969, -0.3695526123046875, -0.3543281555175781, -0.33910369873046875, -0.3238792419433594, -0.30865478515625, -0.2934303283691406, -0.27820587158203125, -0.2629814147949219, -0.2477569580078125, -0.23253250122070312, -0.21730804443359375, -0.20208358764648438, -0.186859130859375, -0.17163467407226562, -0.15641021728515625, -0.14118576049804688, -0.1259613037109375, -0.11073684692382812, -0.09551239013671875, -0.08028793334960938, -0.0650634765625, -0.049839019775390625, -0.03461456298828125, -0.019390106201171875, -0.0041656494140625, 0.011058807373046875, 0.02628326416015625, 0.041507720947265625, 0.056732177734375, 0.07195663452148438, 0.08718109130859375, 0.10240554809570312, 0.1176300048828125, 0.13285446166992188, 0.14807891845703125, 0.16330337524414062, 0.17852783203125, 0.19375228881835938, 0.20897674560546875, 0.22420120239257812, 0.2394256591796875, 0.2546501159667969, 0.26987457275390625, 0.2850990295410156, 0.300323486328125, 0.3155479431152344, 0.33077239990234375, 0.3459968566894531, 0.3612213134765625, 0.3764457702636719, 0.39167022705078125, 0.4068946838378906, 0.422119140625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 6.0, 2.0, 4.0, 5.0, 8.0, 9.0, 13.0, 20.0, 29.0, 29.0, 45.0, 58.0, 69.0, 105.0, 188.0, 311.0, 469.0, 824.0, 1563.0, 3190.0, 7902.0, 26500.0, 166981.0, 3524130.0, 399988.0, 43204.0, 10876.0, 3846.0, 1780.0, 884.0, 447.0, 284.0, 171.0, 97.0, 71.0, 40.0, 35.0, 24.0, 15.0, 16.0, 11.0, 8.0, 6.0, 7.0, 5.0, 4.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.475341796875, -0.4593086242675781, -0.44327545166015625, -0.4272422790527344, -0.4112091064453125, -0.3951759338378906, -0.37914276123046875, -0.3631095886230469, -0.347076416015625, -0.3310432434082031, -0.31501007080078125, -0.2989768981933594, -0.2829437255859375, -0.2669105529785156, -0.25087738037109375, -0.23484420776367188, -0.21881103515625, -0.20277786254882812, -0.18674468994140625, -0.17071151733398438, -0.1546783447265625, -0.13864517211914062, -0.12261199951171875, -0.10657882690429688, -0.090545654296875, -0.07451248168945312, -0.05847930908203125, -0.042446136474609375, -0.0264129638671875, -0.010379791259765625, 0.00565338134765625, 0.021686553955078125, 0.0377197265625, 0.053752899169921875, 0.06978607177734375, 0.08581924438476562, 0.1018524169921875, 0.11788558959960938, 0.13391876220703125, 0.14995193481445312, 0.165985107421875, 0.18201828002929688, 0.19805145263671875, 0.21408462524414062, 0.2301177978515625, 0.24615097045898438, 0.26218414306640625, 0.2782173156738281, 0.29425048828125, 0.3102836608886719, 0.32631683349609375, 0.3423500061035156, 0.3583831787109375, 0.3744163513183594, 0.39044952392578125, 0.4064826965332031, 0.422515869140625, 0.4385490417480469, 0.45458221435546875, 0.4706153869628906, 0.4866485595703125, 0.5026817321777344, 0.5187149047851562, 0.5347480773925781, 0.55078125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 3.0, 3.0, 2.0, 6.0, 4.0, 12.0, 14.0, 13.0, 27.0, 32.0, 43.0, 74.0, 141.0, 270.0, 635.0, 1627.0, 558.0, 211.0, 123.0, 74.0, 60.0, 37.0, 21.0, 17.0, 23.0, 10.0, 3.0, 10.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.364013671875, -0.35373687744140625, -0.3434600830078125, -0.33318328857421875, -0.322906494140625, -0.31262969970703125, -0.3023529052734375, -0.29207611083984375, -0.28179931640625, -0.27152252197265625, -0.2612457275390625, -0.25096893310546875, -0.240692138671875, -0.23041534423828125, -0.2201385498046875, -0.20986175537109375, -0.1995849609375, -0.18930816650390625, -0.1790313720703125, -0.16875457763671875, -0.158477783203125, -0.14820098876953125, -0.1379241943359375, -0.12764739990234375, -0.11737060546875, -0.10709381103515625, -0.0968170166015625, -0.08654022216796875, -0.076263427734375, -0.06598663330078125, -0.0557098388671875, -0.04543304443359375, -0.03515625, -0.02487945556640625, -0.0146026611328125, -0.00432586669921875, 0.005950927734375, 0.01622772216796875, 0.0265045166015625, 0.03678131103515625, 0.04705810546875, 0.05733489990234375, 0.0676116943359375, 0.07788848876953125, 0.088165283203125, 0.09844207763671875, 0.1087188720703125, 0.11899566650390625, 0.1292724609375, 0.13954925537109375, 0.1498260498046875, 0.16010284423828125, 0.170379638671875, 0.18065643310546875, 0.1909332275390625, 0.20121002197265625, 0.21148681640625, 0.22176361083984375, 0.2320404052734375, 0.24231719970703125, 0.252593994140625, 0.26287078857421875, 0.2731475830078125, 0.28342437744140625, 0.293701171875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 12.0, 311.0, 656.0, 27.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.3276233673095703, -2.1351613998413086, -1.9426991939544678, -1.750237226486206, -1.5577750205993652, -1.3653130531311035, -1.1728509664535522, -0.980388879776001, -0.7879267930984497, -0.5954647064208984, -0.40300264954566956, -0.21054059267044067, -0.018078505992889404, 0.17438358068466187, 0.36684560775756836, 0.5593076944351196, 0.7517697811126709, 0.9442318677902222, 1.1366939544677734, 1.3291559219360352, 1.521618127822876, 1.7140800952911377, 1.906542181968689, 2.0990042686462402, 2.291466236114502, 2.4839282035827637, 2.6763904094696045, 2.868852376937866, 3.061314582824707, 3.2537765502929688, 3.4462385177612305, 3.6387007236480713, 3.831162929534912, 4.023624897003174, 4.2160868644714355, 4.4085493087768555, 4.601011276245117, 4.793473243713379, 4.985935211181641, 5.178397178649902, 5.370859622955322, 5.563321590423584, 5.755783557891846, 5.948246002197266, 6.140707969665527, 6.333169937133789, 6.525631904602051, 6.7180938720703125, 6.910555839538574, 7.103017807006836, 7.295479774475098, 7.487942218780518, 7.680404186248779, 7.872866153717041, 8.065328598022461, 8.257790565490723, 8.450252532958984, 8.642714500427246, 8.835176467895508, 9.02763843536377, 9.220100402832031, 9.41256332397461, 9.605025291442871, 9.797487258911133, 9.989949226379395]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 11.0, 13.0, 19.0, 15.0, 28.0, 36.0, 39.0, 50.0, 74.0, 77.0, 101.0, 99.0, 78.0, 69.0, 73.0, 58.0, 40.0, 32.0, 25.0, 21.0, 11.0, 8.0, 6.0, 6.0, 10.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3035147190093994, -1.2544056177139282, -1.205296516418457, -1.1561874151229858, -1.1070783138275146, -1.0579692125320435, -1.0088601112365723, -0.9597510099411011, -0.9106419086456299, -0.8615328073501587, -0.8124237060546875, -0.7633146047592163, -0.7142055034637451, -0.6650964021682739, -0.6159873008728027, -0.5668781995773315, -0.5177690386772156, -0.4686599373817444, -0.4195508360862732, -0.370441734790802, -0.3213326334953308, -0.2722235321998596, -0.22311440110206604, -0.17400529980659485, -0.12489619851112366, -0.07578709721565247, -0.026677988469600677, 0.02243112027645111, 0.0715402215719223, 0.1206493228673935, 0.16975843906402588, 0.21886754035949707, 0.26797664165496826, 0.31708574295043945, 0.36619484424591064, 0.41530394554138184, 0.464413046836853, 0.5135221481323242, 0.5626312494277954, 0.6117403507232666, 0.6608494520187378, 0.709958553314209, 0.7590676546096802, 0.8081767559051514, 0.8572858572006226, 0.9063949584960938, 0.9555040597915649, 1.0046131610870361, 1.0537223815917969, 1.102831482887268, 1.1519405841827393, 1.2010496854782104, 1.2501587867736816, 1.2992678880691528, 1.348376989364624, 1.3974860906600952, 1.4465951919555664, 1.4957042932510376, 1.5448133945465088, 1.59392249584198, 1.6430315971374512, 1.6921406984329224, 1.7412497997283936, 1.7903589010238647, 1.839468002319336]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 7.0, 8.0, 12.0, 12.0, 19.0, 25.0, 36.0, 29.0, 47.0, 70.0, 65.0, 114.0, 164.0, 213.0, 330.0, 430.0, 522.0, 805.0, 1071.0, 1579.0, 2465.0, 3724.0, 6014.0, 10489.0, 20248.0, 51714.0, 815422.0, 76084.0, 24708.0, 12040.0, 6895.0, 4252.0, 2747.0, 1790.0, 1302.0, 871.0, 594.0, 449.0, 329.0, 225.0, 158.0, 128.0, 111.0, 49.0, 49.0, 50.0, 30.0, 19.0, 9.0, 10.0, 10.0, 11.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-1.3603515625, -1.312835693359375, -1.26531982421875, -1.217803955078125, -1.1702880859375, -1.122772216796875, -1.07525634765625, -1.027740478515625, -0.980224609375, -0.932708740234375, -0.88519287109375, -0.837677001953125, -0.7901611328125, -0.742645263671875, -0.69512939453125, -0.647613525390625, -0.60009765625, -0.552581787109375, -0.50506591796875, -0.457550048828125, -0.4100341796875, -0.362518310546875, -0.31500244140625, -0.267486572265625, -0.219970703125, -0.172454833984375, -0.12493896484375, -0.077423095703125, -0.0299072265625, 0.017608642578125, 0.06512451171875, 0.112640380859375, 0.16015625, 0.207672119140625, 0.25518798828125, 0.302703857421875, 0.3502197265625, 0.397735595703125, 0.44525146484375, 0.492767333984375, 0.540283203125, 0.587799072265625, 0.63531494140625, 0.682830810546875, 0.7303466796875, 0.777862548828125, 0.82537841796875, 0.872894287109375, 0.92041015625, 0.967926025390625, 1.01544189453125, 1.062957763671875, 1.1104736328125, 1.157989501953125, 1.20550537109375, 1.253021240234375, 1.300537109375, 1.348052978515625, 1.39556884765625, 1.443084716796875, 1.4906005859375, 1.538116455078125, 1.58563232421875, 1.633148193359375, 1.6806640625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 10.0, 8.0, 7.0, 10.0, 10.0, 10.0, 12.0, 15.0, 20.0, 51.0, 425.0, 259.0, 46.0, 18.0, 21.0, 10.0, 7.0, 10.0, 6.0, 3.0, 6.0, 4.0, 6.0, 5.0, 0.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.529296875, -0.5145645141601562, -0.4998321533203125, -0.48509979248046875, -0.470367431640625, -0.45563507080078125, -0.4409027099609375, -0.42617034912109375, -0.41143798828125, -0.39670562744140625, -0.3819732666015625, -0.36724090576171875, -0.352508544921875, -0.33777618408203125, -0.3230438232421875, -0.30831146240234375, -0.2935791015625, -0.27884674072265625, -0.2641143798828125, -0.24938201904296875, -0.234649658203125, -0.21991729736328125, -0.2051849365234375, -0.19045257568359375, -0.17572021484375, -0.16098785400390625, -0.1462554931640625, -0.13152313232421875, -0.116790771484375, -0.10205841064453125, -0.0873260498046875, -0.07259368896484375, -0.057861328125, -0.04312896728515625, -0.0283966064453125, -0.01366424560546875, 0.001068115234375, 0.01580047607421875, 0.0305328369140625, 0.04526519775390625, 0.05999755859375, 0.07472991943359375, 0.0894622802734375, 0.10419464111328125, 0.118927001953125, 0.13365936279296875, 0.1483917236328125, 0.16312408447265625, 0.1778564453125, 0.19258880615234375, 0.2073211669921875, 0.22205352783203125, 0.236785888671875, 0.25151824951171875, 0.2662506103515625, 0.28098297119140625, 0.29571533203125, 0.31044769287109375, 0.3251800537109375, 0.33991241455078125, 0.354644775390625, 0.36937713623046875, 0.3841094970703125, 0.39884185791015625, 0.41357421875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 9.0, 7.0, 12.0, 14.0, 18.0, 16.0, 22.0, 29.0, 22.0, 48.0, 56.0, 76.0, 77.0, 121.0, 159.0, 225.0, 313.0, 502.0, 907.0, 1659.0, 3452.0, 8608.0, 24737.0, 95368.0, 458792.0, 349066.0, 70820.0, 19577.0, 6970.0, 2911.0, 1474.0, 797.0, 453.0, 318.0, 223.0, 173.0, 124.0, 93.0, 52.0, 45.0, 40.0, 35.0, 28.0, 20.0, 22.0, 17.0, 12.0, 12.0, 6.0, 5.0, 4.0, 8.0, 3.0, 3.0], "bins": [-1.28125, -1.244537353515625, -1.20782470703125, -1.171112060546875, -1.1343994140625, -1.097686767578125, -1.06097412109375, -1.024261474609375, -0.987548828125, -0.950836181640625, -0.91412353515625, -0.877410888671875, -0.8406982421875, -0.803985595703125, -0.76727294921875, -0.730560302734375, -0.69384765625, -0.657135009765625, -0.62042236328125, -0.583709716796875, -0.5469970703125, -0.510284423828125, -0.47357177734375, -0.436859130859375, -0.400146484375, -0.363433837890625, -0.32672119140625, -0.290008544921875, -0.2532958984375, -0.216583251953125, -0.17987060546875, -0.143157958984375, -0.1064453125, -0.069732666015625, -0.03302001953125, 0.003692626953125, 0.0404052734375, 0.077117919921875, 0.11383056640625, 0.150543212890625, 0.187255859375, 0.223968505859375, 0.26068115234375, 0.297393798828125, 0.3341064453125, 0.370819091796875, 0.40753173828125, 0.444244384765625, 0.48095703125, 0.517669677734375, 0.55438232421875, 0.591094970703125, 0.6278076171875, 0.664520263671875, 0.70123291015625, 0.737945556640625, 0.774658203125, 0.811370849609375, 0.84808349609375, 0.884796142578125, 0.9215087890625, 0.958221435546875, 0.99493408203125, 1.031646728515625, 1.068359375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 5.0, 11.0, 2.0, 1.0, 8.0, 4.0, 6.0, 5.0, 10.0, 14.0, 14.0, 19.0, 17.0, 23.0, 27.0, 28.0, 30.0, 56.0, 44.0, 35.0, 46.0, 47.0, 34.0, 34.0, 43.0, 36.0, 36.0, 47.0, 28.0, 28.0, 36.0, 31.0, 18.0, 31.0, 16.0, 22.0, 20.0, 7.0, 18.0, 8.0, 11.0, 11.0, 11.0, 6.0, 6.0, 4.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-1.541015625, -1.4909210205078125, -1.440826416015625, -1.3907318115234375, -1.34063720703125, -1.2905426025390625, -1.240447998046875, -1.1903533935546875, -1.1402587890625, -1.0901641845703125, -1.040069580078125, -0.9899749755859375, -0.93988037109375, -0.8897857666015625, -0.839691162109375, -0.7895965576171875, -0.739501953125, -0.6894073486328125, -0.639312744140625, -0.5892181396484375, -0.53912353515625, -0.4890289306640625, -0.438934326171875, -0.3888397216796875, -0.3387451171875, -0.2886505126953125, -0.238555908203125, -0.1884613037109375, -0.13836669921875, -0.0882720947265625, -0.038177490234375, 0.0119171142578125, 0.06201171875, 0.1121063232421875, 0.162200927734375, 0.2122955322265625, 0.26239013671875, 0.3124847412109375, 0.362579345703125, 0.4126739501953125, 0.4627685546875, 0.5128631591796875, 0.562957763671875, 0.6130523681640625, 0.66314697265625, 0.7132415771484375, 0.763336181640625, 0.8134307861328125, 0.863525390625, 0.9136199951171875, 0.963714599609375, 1.0138092041015625, 1.06390380859375, 1.1139984130859375, 1.164093017578125, 1.2141876220703125, 1.2642822265625, 1.3143768310546875, 1.364471435546875, 1.4145660400390625, 1.46466064453125, 1.5147552490234375, 1.564849853515625, 1.6149444580078125, 1.6650390625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 6.0, 4.0, 14.0, 21.0, 35.0, 59.0, 160.0, 495.0, 2650.0, 173821.0, 866974.0, 3351.0, 607.0, 199.0, 65.0, 33.0, 22.0, 20.0, 5.0, 7.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.83203125, -6.669586181640625, -6.50714111328125, -6.344696044921875, -6.1822509765625, -6.019805908203125, -5.85736083984375, -5.694915771484375, -5.532470703125, -5.370025634765625, -5.20758056640625, -5.045135498046875, -4.8826904296875, -4.720245361328125, -4.55780029296875, -4.395355224609375, -4.23291015625, -4.070465087890625, -3.90802001953125, -3.745574951171875, -3.5831298828125, -3.420684814453125, -3.25823974609375, -3.095794677734375, -2.933349609375, -2.770904541015625, -2.60845947265625, -2.446014404296875, -2.2835693359375, -2.121124267578125, -1.95867919921875, -1.796234130859375, -1.6337890625, -1.471343994140625, -1.30889892578125, -1.146453857421875, -0.9840087890625, -0.821563720703125, -0.65911865234375, -0.496673583984375, -0.334228515625, -0.171783447265625, -0.00933837890625, 0.153106689453125, 0.3155517578125, 0.477996826171875, 0.64044189453125, 0.802886962890625, 0.96533203125, 1.127777099609375, 1.29022216796875, 1.452667236328125, 1.6151123046875, 1.777557373046875, 1.94000244140625, 2.102447509765625, 2.264892578125, 2.427337646484375, 2.58978271484375, 2.752227783203125, 2.9146728515625, 3.077117919921875, 3.23956298828125, 3.402008056640625, 3.564453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 9.0, 17.0, 27.0, 62.0, 102.0, 234.0, 232.0, 169.0, 71.0, 45.0, 17.0, 7.0, 3.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001468658447265625, -0.00014302413910627365, -0.0001391824334859848, -0.00013534072786569595, -0.0001314990222454071, -0.00012765731662511826, -0.0001238156110048294, -0.00011997390538454056, -0.00011613219976425171, -0.00011229049414396286, -0.00010844878852367401, -0.00010460708290338516, -0.00010076537728309631, -9.692367166280746e-05, -9.308196604251862e-05, -8.924026042222977e-05, -8.539855480194092e-05, -8.155684918165207e-05, -7.771514356136322e-05, -7.387343794107437e-05, -7.003173232078552e-05, -6.619002670049667e-05, -6.234832108020782e-05, -5.8506615459918976e-05, -5.466490983963013e-05, -5.082320421934128e-05, -4.698149859905243e-05, -4.313979297876358e-05, -3.929808735847473e-05, -3.545638173818588e-05, -3.1614676117897034e-05, -2.7772970497608185e-05, -2.3931264877319336e-05, -2.0089559257030487e-05, -1.6247853636741638e-05, -1.240614801645279e-05, -8.56444239616394e-06, -4.7227367758750916e-06, -8.810311555862427e-07, 2.960674464702606e-06, 6.802380084991455e-06, 1.0644085705280304e-05, 1.4485791325569153e-05, 1.8327496945858002e-05, 2.216920256614685e-05, 2.60109081864357e-05, 2.985261380672455e-05, 3.36943194270134e-05, 3.7536025047302246e-05, 4.1377730667591095e-05, 4.5219436287879944e-05, 4.906114190816879e-05, 5.290284752845764e-05, 5.674455314874649e-05, 6.058625876903534e-05, 6.442796438932419e-05, 6.826967000961304e-05, 7.211137562990189e-05, 7.595308125019073e-05, 7.979478687047958e-05, 8.363649249076843e-05, 8.747819811105728e-05, 9.131990373134613e-05, 9.516160935163498e-05, 9.900331497192383e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 8.0, 9.0, 7.0, 12.0, 21.0, 32.0, 56.0, 70.0, 151.0, 324.0, 728.0, 2220.0, 9455.0, 114002.0, 882858.0, 31448.0, 4801.0, 1311.0, 519.0, 231.0, 101.0, 77.0, 30.0, 25.0, 16.0, 17.0, 6.0, 7.0, 4.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.376953125, -1.3314971923828125, -1.286041259765625, -1.2405853271484375, -1.19512939453125, -1.1496734619140625, -1.104217529296875, -1.0587615966796875, -1.0133056640625, -0.9678497314453125, -0.922393798828125, -0.8769378662109375, -0.83148193359375, -0.7860260009765625, -0.740570068359375, -0.6951141357421875, -0.649658203125, -0.6042022705078125, -0.558746337890625, -0.5132904052734375, -0.46783447265625, -0.4223785400390625, -0.376922607421875, -0.3314666748046875, -0.2860107421875, -0.2405548095703125, -0.195098876953125, -0.1496429443359375, -0.10418701171875, -0.0587310791015625, -0.013275146484375, 0.0321807861328125, 0.07763671875, 0.1230926513671875, 0.168548583984375, 0.2140045166015625, 0.25946044921875, 0.3049163818359375, 0.350372314453125, 0.3958282470703125, 0.4412841796875, 0.4867401123046875, 0.532196044921875, 0.5776519775390625, 0.62310791015625, 0.6685638427734375, 0.714019775390625, 0.7594757080078125, 0.804931640625, 0.8503875732421875, 0.895843505859375, 0.9412994384765625, 0.98675537109375, 1.0322113037109375, 1.077667236328125, 1.1231231689453125, 1.1685791015625, 1.2140350341796875, 1.259490966796875, 1.3049468994140625, 1.35040283203125, 1.3958587646484375, 1.441314697265625, 1.4867706298828125, 1.5322265625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 2.0, 0.0, 1.0, 3.0, 8.0, 8.0, 5.0, 13.0, 25.0, 23.0, 45.0, 66.0, 112.0, 148.0, 147.0, 132.0, 91.0, 55.0, 42.0, 20.0, 14.0, 11.0, 9.0, 5.0, 7.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2587890625, -1.2050323486328125, -1.151275634765625, -1.0975189208984375, -1.04376220703125, -0.9900054931640625, -0.936248779296875, -0.8824920654296875, -0.8287353515625, -0.7749786376953125, -0.721221923828125, -0.6674652099609375, -0.61370849609375, -0.5599517822265625, -0.506195068359375, -0.4524383544921875, -0.398681640625, -0.3449249267578125, -0.291168212890625, -0.2374114990234375, -0.18365478515625, -0.1298980712890625, -0.076141357421875, -0.0223846435546875, 0.0313720703125, 0.0851287841796875, 0.138885498046875, 0.1926422119140625, 0.24639892578125, 0.3001556396484375, 0.353912353515625, 0.4076690673828125, 0.46142578125, 0.5151824951171875, 0.568939208984375, 0.6226959228515625, 0.67645263671875, 0.7302093505859375, 0.783966064453125, 0.8377227783203125, 0.8914794921875, 0.9452362060546875, 0.998992919921875, 1.0527496337890625, 1.10650634765625, 1.1602630615234375, 1.214019775390625, 1.2677764892578125, 1.321533203125, 1.3752899169921875, 1.429046630859375, 1.4828033447265625, 1.53656005859375, 1.5903167724609375, 1.644073486328125, 1.6978302001953125, 1.7515869140625, 1.8053436279296875, 1.859100341796875, 1.9128570556640625, 1.96661376953125, 2.0203704833984375, 2.074127197265625, 2.1278839111328125, 2.181640625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 3.0, 6.0, 13.0, 32.0, 68.0, 259.0, 427.0, 125.0, 28.0, 14.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.47325897216797, -32.75071334838867, -32.02816390991211, -31.30561637878418, -30.58306884765625, -29.860523223876953, -29.13797378540039, -28.415428161621094, -27.692880630493164, -26.970333099365234, -26.247785568237305, -25.525238037109375, -24.802690505981445, -24.080142974853516, -23.35759735107422, -22.63504981994629, -21.91250228881836, -21.18995475769043, -20.4674072265625, -19.74485969543457, -19.02231216430664, -18.299766540527344, -17.57721710205078, -16.854671478271484, -16.132122039794922, -15.409574508666992, -14.687026977539062, -13.964479446411133, -13.24193286895752, -12.51938533782959, -11.79683780670166, -11.074291229248047, -10.3517427444458, -9.629195213317871, -8.906647682189941, -8.184101104736328, -7.461553573608398, -6.739006042480469, -6.016458511352539, -5.293911457061768, -4.571363925933838, -3.8488166332244873, -3.1262693405151367, -2.403721809387207, -1.6811745166778564, -0.9586272239685059, -0.23607969284057617, 0.4864673614501953, 1.209014892578125, 1.9315621852874756, 2.654109477996826, 3.376657009124756, 4.099204063415527, 4.821751594543457, 5.544299125671387, 6.266846179962158, 6.989393711090088, 7.711941242218018, 8.434488296508789, 9.157035827636719, 9.879583358764648, 10.602130889892578, 11.324678421020508, 12.047224998474121, 12.76977252960205]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 3.0, 8.0, 4.0, 12.0, 13.0, 6.0, 23.0, 36.0, 70.0, 104.0, 131.0, 164.0, 159.0, 98.0, 51.0, 24.0, 23.0, 17.0, 3.0, 6.0, 3.0, 3.0, 8.0, 2.0, 5.0, 1.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.6807861328125, -32.570159912109375, -31.459531784057617, -30.34890365600586, -29.2382755279541, -28.127647399902344, -27.01702117919922, -25.90639305114746, -24.795764923095703, -23.685136795043945, -22.57451057434082, -21.463882446289062, -20.353254318237305, -19.242626190185547, -18.131999969482422, -17.021371841430664, -15.910745620727539, -14.800118446350098, -13.68949031829834, -12.578863143920898, -11.46823501586914, -10.3576078414917, -9.246980667114258, -8.1363525390625, -7.025725364685059, -5.915097713470459, -4.804470062255859, -3.693842887878418, -2.5832152366638184, -1.4725875854492188, -0.36196041107177734, 0.7486672401428223, 1.8592948913574219, 2.9699225425720215, 4.080550193786621, 5.1911773681640625, 6.301805019378662, 7.412432670593262, 8.523059844970703, 9.633687973022461, 10.744315147399902, 11.854942321777344, 12.965570449829102, 14.076197624206543, 15.186824798583984, 16.297452926635742, 17.4080810546875, 18.518707275390625, 19.629335403442383, 20.73996353149414, 21.850589752197266, 22.961217880249023, 24.07184600830078, 25.182472229003906, 26.293100357055664, 27.403728485107422, 28.514354705810547, 29.624982833862305, 30.73560905456543, 31.846237182617188, 32.95686340332031, 34.0674934387207, 35.17811965942383, 36.28874588012695, 37.399375915527344]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 2.0, 6.0, 9.0, 14.0, 35.0, 35.0, 69.0, 117.0, 220.0, 395.0, 725.0, 1521.0, 3466.0, 8959.0, 29232.0, 251752.0, 3811380.0, 60752.0, 14725.0, 5586.0, 2502.0, 1251.0, 656.0, 353.0, 210.0, 110.0, 69.0, 49.0, 26.0, 14.0, 10.0, 8.0, 7.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.365234375, -3.246063232421875, -3.12689208984375, -3.007720947265625, -2.8885498046875, -2.769378662109375, -2.65020751953125, -2.531036376953125, -2.411865234375, -2.292694091796875, -2.17352294921875, -2.054351806640625, -1.9351806640625, -1.816009521484375, -1.69683837890625, -1.577667236328125, -1.45849609375, -1.339324951171875, -1.22015380859375, -1.100982666015625, -0.9818115234375, -0.862640380859375, -0.74346923828125, -0.624298095703125, -0.505126953125, -0.385955810546875, -0.26678466796875, -0.147613525390625, -0.0284423828125, 0.090728759765625, 0.20989990234375, 0.329071044921875, 0.4482421875, 0.567413330078125, 0.68658447265625, 0.805755615234375, 0.9249267578125, 1.044097900390625, 1.16326904296875, 1.282440185546875, 1.401611328125, 1.520782470703125, 1.63995361328125, 1.759124755859375, 1.8782958984375, 1.997467041015625, 2.11663818359375, 2.235809326171875, 2.35498046875, 2.474151611328125, 2.59332275390625, 2.712493896484375, 2.8316650390625, 2.950836181640625, 3.07000732421875, 3.189178466796875, 3.308349609375, 3.427520751953125, 3.54669189453125, 3.665863037109375, 3.7850341796875, 3.904205322265625, 4.02337646484375, 4.142547607421875, 4.26171875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 5.0, 4.0, 5.0, 10.0, 11.0, 7.0, 10.0, 5.0, 12.0, 12.0, 24.0, 40.0, 73.0, 205.0, 278.0, 124.0, 48.0, 25.0, 16.0, 11.0, 10.0, 10.0, 3.0, 5.0, 6.0, 7.0, 4.0, 5.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.320556640625, -0.3095664978027344, -0.29857635498046875, -0.2875862121582031, -0.2765960693359375, -0.2656059265136719, -0.25461578369140625, -0.24362564086914062, -0.232635498046875, -0.22164535522460938, -0.21065521240234375, -0.19966506958007812, -0.1886749267578125, -0.17768478393554688, -0.16669464111328125, -0.15570449829101562, -0.14471435546875, -0.13372421264648438, -0.12273406982421875, -0.11174392700195312, -0.1007537841796875, -0.08976364135742188, -0.07877349853515625, -0.06778335571289062, -0.056793212890625, -0.045803070068359375, -0.03481292724609375, -0.023822784423828125, -0.0128326416015625, -0.001842498779296875, 0.00914764404296875, 0.020137786865234375, 0.0311279296875, 0.042118072509765625, 0.05310821533203125, 0.06409835815429688, 0.0750885009765625, 0.08607864379882812, 0.09706878662109375, 0.10805892944335938, 0.119049072265625, 0.13003921508789062, 0.14102935791015625, 0.15201950073242188, 0.1630096435546875, 0.17399978637695312, 0.18498992919921875, 0.19598007202148438, 0.20697021484375, 0.21796035766601562, 0.22895050048828125, 0.23994064331054688, 0.2509307861328125, 0.2619209289550781, 0.27291107177734375, 0.2839012145996094, 0.294891357421875, 0.3058815002441406, 0.31687164306640625, 0.3278617858886719, 0.3388519287109375, 0.3498420715332031, 0.36083221435546875, 0.3718223571777344, 0.3828125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 8.0, 3.0, 9.0, 13.0, 20.0, 25.0, 23.0, 41.0, 59.0, 82.0, 103.0, 191.0, 287.0, 491.0, 812.0, 1569.0, 3249.0, 7800.0, 23590.0, 117289.0, 2873522.0, 1058817.0, 76548.0, 17744.0, 6173.0, 2598.0, 1307.0, 745.0, 429.0, 244.0, 154.0, 108.0, 64.0, 43.0, 36.0, 23.0, 15.0, 17.0, 7.0, 11.0, 1.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5458984375, -1.4988861083984375, -1.451873779296875, -1.4048614501953125, -1.35784912109375, -1.3108367919921875, -1.263824462890625, -1.2168121337890625, -1.1697998046875, -1.1227874755859375, -1.075775146484375, -1.0287628173828125, -0.98175048828125, -0.9347381591796875, -0.887725830078125, -0.8407135009765625, -0.793701171875, -0.7466888427734375, -0.699676513671875, -0.6526641845703125, -0.60565185546875, -0.5586395263671875, -0.511627197265625, -0.4646148681640625, -0.4176025390625, -0.3705902099609375, -0.323577880859375, -0.2765655517578125, -0.22955322265625, -0.1825408935546875, -0.135528564453125, -0.0885162353515625, -0.04150390625, 0.0055084228515625, 0.052520751953125, 0.0995330810546875, 0.14654541015625, 0.1935577392578125, 0.240570068359375, 0.2875823974609375, 0.3345947265625, 0.3816070556640625, 0.428619384765625, 0.4756317138671875, 0.52264404296875, 0.5696563720703125, 0.616668701171875, 0.6636810302734375, 0.710693359375, 0.7577056884765625, 0.804718017578125, 0.8517303466796875, 0.89874267578125, 0.9457550048828125, 0.992767333984375, 1.0397796630859375, 1.0867919921875, 1.1338043212890625, 1.180816650390625, 1.2278289794921875, 1.27484130859375, 1.3218536376953125, 1.368865966796875, 1.4158782958984375, 1.462890625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 3.0, 11.0, 7.0, 13.0, 24.0, 11.0, 26.0, 50.0, 87.0, 116.0, 246.0, 536.0, 1497.0, 699.0, 314.0, 144.0, 99.0, 50.0, 35.0, 27.0, 29.0, 17.0, 10.0, 4.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45849609375, -0.4439964294433594, -0.42949676513671875, -0.4149971008300781, -0.4004974365234375, -0.3859977722167969, -0.37149810791015625, -0.3569984436035156, -0.342498779296875, -0.3279991149902344, -0.31349945068359375, -0.2989997863769531, -0.2845001220703125, -0.2700004577636719, -0.25550079345703125, -0.24100112915039062, -0.22650146484375, -0.21200180053710938, -0.19750213623046875, -0.18300247192382812, -0.1685028076171875, -0.15400314331054688, -0.13950347900390625, -0.12500381469726562, -0.110504150390625, -0.09600448608398438, -0.08150482177734375, -0.06700515747070312, -0.0525054931640625, -0.038005828857421875, -0.02350616455078125, -0.009006500244140625, 0.0054931640625, 0.019992828369140625, 0.03449249267578125, 0.048992156982421875, 0.0634918212890625, 0.07799148559570312, 0.09249114990234375, 0.10699081420898438, 0.121490478515625, 0.13599014282226562, 0.15048980712890625, 0.16498947143554688, 0.1794891357421875, 0.19398880004882812, 0.20848846435546875, 0.22298812866210938, 0.23748779296875, 0.2519874572753906, 0.26648712158203125, 0.2809867858886719, 0.2954864501953125, 0.3099861145019531, 0.32448577880859375, 0.3389854431152344, 0.353485107421875, 0.3679847717285156, 0.38248443603515625, 0.3969841003417969, 0.4114837646484375, 0.4259834289550781, 0.44048309326171875, 0.4549827575683594, 0.469482421875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 7.0, 27.0, 467.0, 458.0, 35.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.45427417755127, -13.205036163330078, -12.955798149108887, -12.706560134887695, -12.457322120666504, -12.208084106445312, -11.958846092224121, -11.70960807800293, -11.460370063781738, -11.211132049560547, -10.961894035339355, -10.712656021118164, -10.463418006896973, -10.214179992675781, -9.96494197845459, -9.715703964233398, -9.46646499633789, -9.2172269821167, -8.967988967895508, -8.718750953674316, -8.469512939453125, -8.220274925231934, -7.971036911010742, -7.721798419952393, -7.472560882568359, -7.223322868347168, -6.974084854125977, -6.724846839904785, -6.475608825683594, -6.226370811462402, -5.977132797241211, -5.727894306182861, -5.47865629196167, -5.2294182777404785, -4.980180263519287, -4.730942249298096, -4.481704235076904, -4.232465744018555, -3.9832279682159424, -3.733989715576172, -3.4847517013549805, -3.235513687133789, -2.9862756729125977, -2.7370376586914062, -2.4877994060516357, -2.2385613918304443, -1.989323377609253, -1.740085244178772, -1.4908473491668701, -1.2416093349456787, -0.9923712015151978, -0.7431331872940063, -0.49389511346817017, -0.24465703964233398, 0.004580974578857422, 0.2538191080093384, 0.5030571222305298, 0.752295196056366, 1.0015332698822021, 1.2507712841033936, 1.500009298324585, 1.749247431755066, 1.9984854459762573, 2.2477235794067383, 2.4969615936279297]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 5.0, 7.0, 5.0, 10.0, 7.0, 15.0, 30.0, 42.0, 55.0, 80.0, 89.0, 97.0, 92.0, 71.0, 78.0, 90.0, 51.0, 48.0, 35.0, 25.0, 20.0, 11.0, 11.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.4434051513671875, -2.369737148284912, -2.2960689067840576, -2.2224009037017822, -2.1487326622009277, -2.0750646591186523, -2.001396656036377, -1.9277284145355225, -1.854060411453247, -1.7803922891616821, -1.7067241668701172, -1.6330561637878418, -1.5593880414962769, -1.485719919204712, -1.412051796913147, -1.338383674621582, -1.264715552330017, -1.1910474300384521, -1.1173793077468872, -1.0437111854553223, -0.9700431823730469, -0.8963750600814819, -0.822706937789917, -0.7490388751029968, -0.6753707528114319, -0.6017026305198669, -0.5280345678329468, -0.45436644554138184, -0.3806983530521393, -0.30703026056289673, -0.2333621382713318, -0.15969407558441162, -0.08602595329284668, -0.012357853353023529, 0.06131024658679962, 0.13497835397720337, 0.20864644646644592, 0.2823145389556885, 0.3559826612472534, 0.4296507239341736, 0.5033188462257385, 0.5769869685173035, 0.6506550312042236, 0.7243231534957886, 0.7979912757873535, 0.8716593384742737, 0.9453274607658386, 1.0189955234527588, 1.0926636457443237, 1.1663317680358887, 1.2399998903274536, 1.3136680126190186, 1.387336015701294, 1.4610041379928589, 1.5346722602844238, 1.6083402633666992, 1.6820085048675537, 1.7556766271591187, 1.8293447494506836, 1.903012752532959, 1.976680874824524, 2.050348997116089, 2.1240172386169434, 2.1976852416992188, 2.271353244781494]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 9.0, 4.0, 2.0, 7.0, 12.0, 26.0, 29.0, 54.0, 49.0, 97.0, 156.0, 249.0, 410.0, 731.0, 1519.0, 3197.0, 7984.0, 25687.0, 260569.0, 696506.0, 33792.0, 9981.0, 3792.0, 1677.0, 851.0, 464.0, 234.0, 173.0, 116.0, 51.0, 30.0, 30.0, 16.0, 19.0, 10.0, 4.0, 8.0, 5.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.677734375, -3.546844482421875, -3.41595458984375, -3.285064697265625, -3.1541748046875, -3.023284912109375, -2.89239501953125, -2.761505126953125, -2.630615234375, -2.499725341796875, -2.36883544921875, -2.237945556640625, -2.1070556640625, -1.976165771484375, -1.84527587890625, -1.714385986328125, -1.58349609375, -1.452606201171875, -1.32171630859375, -1.190826416015625, -1.0599365234375, -0.929046630859375, -0.79815673828125, -0.667266845703125, -0.536376953125, -0.405487060546875, -0.27459716796875, -0.143707275390625, -0.0128173828125, 0.118072509765625, 0.24896240234375, 0.379852294921875, 0.5107421875, 0.641632080078125, 0.77252197265625, 0.903411865234375, 1.0343017578125, 1.165191650390625, 1.29608154296875, 1.426971435546875, 1.557861328125, 1.688751220703125, 1.81964111328125, 1.950531005859375, 2.0814208984375, 2.212310791015625, 2.34320068359375, 2.474090576171875, 2.60498046875, 2.735870361328125, 2.86676025390625, 2.997650146484375, 3.1285400390625, 3.259429931640625, 3.39031982421875, 3.521209716796875, 3.652099609375, 3.782989501953125, 3.91387939453125, 4.044769287109375, 4.1756591796875, 4.306549072265625, 4.43743896484375, 4.568328857421875, 4.69921875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 0.0, 2.0, 6.0, 3.0, 5.0, 9.0, 6.0, 8.0, 7.0, 9.0, 13.0, 16.0, 18.0, 39.0, 67.0, 184.0, 266.0, 167.0, 67.0, 26.0, 10.0, 12.0, 14.0, 8.0, 11.0, 7.0, 5.0, 3.0, 4.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.337646484375, -0.3257598876953125, -0.313873291015625, -0.3019866943359375, -0.29010009765625, -0.2782135009765625, -0.266326904296875, -0.2544403076171875, -0.2425537109375, -0.2306671142578125, -0.218780517578125, -0.2068939208984375, -0.19500732421875, -0.1831207275390625, -0.171234130859375, -0.1593475341796875, -0.1474609375, -0.1355743408203125, -0.123687744140625, -0.1118011474609375, -0.09991455078125, -0.0880279541015625, -0.076141357421875, -0.0642547607421875, -0.0523681640625, -0.0404815673828125, -0.028594970703125, -0.0167083740234375, -0.00482177734375, 0.0070648193359375, 0.018951416015625, 0.0308380126953125, 0.042724609375, 0.0546112060546875, 0.066497802734375, 0.0783843994140625, 0.09027099609375, 0.1021575927734375, 0.114044189453125, 0.1259307861328125, 0.1378173828125, 0.1497039794921875, 0.161590576171875, 0.1734771728515625, 0.18536376953125, 0.1972503662109375, 0.209136962890625, 0.2210235595703125, 0.23291015625, 0.2447967529296875, 0.256683349609375, 0.2685699462890625, 0.28045654296875, 0.2923431396484375, 0.304229736328125, 0.3161163330078125, 0.3280029296875, 0.3398895263671875, 0.351776123046875, 0.3636627197265625, 0.37554931640625, 0.3874359130859375, 0.399322509765625, 0.4112091064453125, 0.423095703125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 7.0, 5.0, 7.0, 7.0, 3.0, 6.0, 6.0, 22.0, 52.0, 243.0, 1269.0, 16686.0, 985041.0, 42496.0, 2082.0, 397.0, 106.0, 40.0, 11.0, 11.0, 4.0, 5.0, 9.0, 6.0, 4.0, 5.0, 4.0, 4.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.125, -4.9248046875, -4.724609375, -4.5244140625, -4.32421875, -4.1240234375, -3.923828125, -3.7236328125, -3.5234375, -3.3232421875, -3.123046875, -2.9228515625, -2.72265625, -2.5224609375, -2.322265625, -2.1220703125, -1.921875, -1.7216796875, -1.521484375, -1.3212890625, -1.12109375, -0.9208984375, -0.720703125, -0.5205078125, -0.3203125, -0.1201171875, 0.080078125, 0.2802734375, 0.48046875, 0.6806640625, 0.880859375, 1.0810546875, 1.28125, 1.4814453125, 1.681640625, 1.8818359375, 2.08203125, 2.2822265625, 2.482421875, 2.6826171875, 2.8828125, 3.0830078125, 3.283203125, 3.4833984375, 3.68359375, 3.8837890625, 4.083984375, 4.2841796875, 4.484375, 4.6845703125, 4.884765625, 5.0849609375, 5.28515625, 5.4853515625, 5.685546875, 5.8857421875, 6.0859375, 6.2861328125, 6.486328125, 6.6865234375, 6.88671875, 7.0869140625, 7.287109375, 7.4873046875, 7.6875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 5.0, 1.0, 1.0, 5.0, 7.0, 12.0, 5.0, 16.0, 17.0, 18.0, 23.0, 29.0, 20.0, 33.0, 29.0, 38.0, 33.0, 48.0, 42.0, 58.0, 52.0, 56.0, 49.0, 40.0, 37.0, 42.0, 32.0, 35.0, 23.0, 32.0, 21.0, 24.0, 23.0, 19.0, 13.0, 21.0, 7.0, 7.0, 12.0, 4.0, 6.0, 3.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.1591796875, -1.125274658203125, -1.09136962890625, -1.057464599609375, -1.0235595703125, -0.989654541015625, -0.95574951171875, -0.921844482421875, -0.887939453125, -0.854034423828125, -0.82012939453125, -0.786224365234375, -0.7523193359375, -0.718414306640625, -0.68450927734375, -0.650604248046875, -0.61669921875, -0.582794189453125, -0.54888916015625, -0.514984130859375, -0.4810791015625, -0.447174072265625, -0.41326904296875, -0.379364013671875, -0.345458984375, -0.311553955078125, -0.27764892578125, -0.243743896484375, -0.2098388671875, -0.175933837890625, -0.14202880859375, -0.108123779296875, -0.07421875, -0.040313720703125, -0.00640869140625, 0.027496337890625, 0.0614013671875, 0.095306396484375, 0.12921142578125, 0.163116455078125, 0.197021484375, 0.230926513671875, 0.26483154296875, 0.298736572265625, 0.3326416015625, 0.366546630859375, 0.40045166015625, 0.434356689453125, 0.46826171875, 0.502166748046875, 0.53607177734375, 0.569976806640625, 0.6038818359375, 0.637786865234375, 0.67169189453125, 0.705596923828125, 0.739501953125, 0.773406982421875, 0.80731201171875, 0.841217041015625, 0.8751220703125, 0.909027099609375, 0.94293212890625, 0.976837158203125, 1.0107421875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 4.0, 5.0, 1.0, 8.0, 6.0, 10.0, 14.0, 19.0, 23.0, 43.0, 54.0, 106.0, 164.0, 303.0, 601.0, 1569.0, 5735.0, 76430.0, 939157.0, 19004.0, 3162.0, 1051.0, 442.0, 244.0, 130.0, 82.0, 69.0, 33.0, 24.0, 17.0, 8.0, 5.0, 7.0, 5.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7265625, -4.57550048828125, -4.4244384765625, -4.27337646484375, -4.122314453125, -3.97125244140625, -3.8201904296875, -3.66912841796875, -3.51806640625, -3.36700439453125, -3.2159423828125, -3.06488037109375, -2.913818359375, -2.76275634765625, -2.6116943359375, -2.46063232421875, -2.3095703125, -2.15850830078125, -2.0074462890625, -1.85638427734375, -1.705322265625, -1.55426025390625, -1.4031982421875, -1.25213623046875, -1.10107421875, -0.95001220703125, -0.7989501953125, -0.64788818359375, -0.496826171875, -0.34576416015625, -0.1947021484375, -0.04364013671875, 0.107421875, 0.25848388671875, 0.4095458984375, 0.56060791015625, 0.711669921875, 0.86273193359375, 1.0137939453125, 1.16485595703125, 1.31591796875, 1.46697998046875, 1.6180419921875, 1.76910400390625, 1.920166015625, 2.07122802734375, 2.2222900390625, 2.37335205078125, 2.5244140625, 2.67547607421875, 2.8265380859375, 2.97760009765625, 3.128662109375, 3.27972412109375, 3.4307861328125, 3.58184814453125, 3.73291015625, 3.88397216796875, 4.0350341796875, 4.18609619140625, 4.337158203125, 4.48822021484375, 4.6392822265625, 4.79034423828125, 4.94140625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 9.0, 3.0, 4.0, 3.0, 2.0, 13.0, 9.0, 11.0, 13.0, 16.0, 18.0, 33.0, 39.0, 68.0, 93.0, 120.0, 122.0, 120.0, 95.0, 52.0, 45.0, 34.0, 17.0, 12.0, 9.0, 9.0, 7.0, 9.0, 7.0, 5.0, 2.0, 3.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00014472007751464844, -0.00014011934399604797, -0.0001355186104774475, -0.00013091787695884705, -0.00012631714344024658, -0.00012171640992164612, -0.00011711567640304565, -0.00011251494288444519, -0.00010791420936584473, -0.00010331347584724426, -9.87127423286438e-05, -9.411200881004333e-05, -8.951127529144287e-05, -8.491054177284241e-05, -8.030980825424194e-05, -7.570907473564148e-05, -7.110834121704102e-05, -6.650760769844055e-05, -6.190687417984009e-05, -5.7306140661239624e-05, -5.270540714263916e-05, -4.8104673624038696e-05, -4.350394010543823e-05, -3.890320658683777e-05, -3.4302473068237305e-05, -2.970173954963684e-05, -2.5101006031036377e-05, -2.0500272512435913e-05, -1.589953899383545e-05, -1.1298805475234985e-05, -6.6980719566345215e-06, -2.0973384380340576e-06, 2.5033950805664062e-06, 7.10412859916687e-06, 1.1704862117767334e-05, 1.6305595636367798e-05, 2.0906329154968262e-05, 2.5507062673568726e-05, 3.010779619216919e-05, 3.470852971076965e-05, 3.930926322937012e-05, 4.390999674797058e-05, 4.8510730266571045e-05, 5.311146378517151e-05, 5.771219730377197e-05, 6.231293082237244e-05, 6.69136643409729e-05, 7.151439785957336e-05, 7.611513137817383e-05, 8.071586489677429e-05, 8.531659841537476e-05, 8.991733193397522e-05, 9.451806545257568e-05, 9.911879897117615e-05, 0.00010371953248977661, 0.00010832026600837708, 0.00011292099952697754, 0.000117521733045578, 0.00012212246656417847, 0.00012672320008277893, 0.0001313239336013794, 0.00013592466711997986, 0.00014052540063858032, 0.00014512613415718079, 0.00014972686767578125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 4.0, 10.0, 12.0, 23.0, 35.0, 28.0, 58.0, 90.0, 146.0, 229.0, 415.0, 641.0, 1283.0, 2865.0, 8528.0, 33343.0, 327757.0, 608587.0, 46883.0, 10692.0, 3681.0, 1485.0, 671.0, 392.0, 229.0, 146.0, 103.0, 53.0, 43.0, 36.0, 14.0, 15.0, 8.0, 7.0, 11.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.84375, -1.788055419921875, -1.73236083984375, -1.676666259765625, -1.6209716796875, -1.565277099609375, -1.50958251953125, -1.453887939453125, -1.398193359375, -1.342498779296875, -1.28680419921875, -1.231109619140625, -1.1754150390625, -1.119720458984375, -1.06402587890625, -1.008331298828125, -0.95263671875, -0.896942138671875, -0.84124755859375, -0.785552978515625, -0.7298583984375, -0.674163818359375, -0.61846923828125, -0.562774658203125, -0.507080078125, -0.451385498046875, -0.39569091796875, -0.339996337890625, -0.2843017578125, -0.228607177734375, -0.17291259765625, -0.117218017578125, -0.0615234375, -0.005828857421875, 0.04986572265625, 0.105560302734375, 0.1612548828125, 0.216949462890625, 0.27264404296875, 0.328338623046875, 0.384033203125, 0.439727783203125, 0.49542236328125, 0.551116943359375, 0.6068115234375, 0.662506103515625, 0.71820068359375, 0.773895263671875, 0.82958984375, 0.885284423828125, 0.94097900390625, 0.996673583984375, 1.0523681640625, 1.108062744140625, 1.16375732421875, 1.219451904296875, 1.275146484375, 1.330841064453125, 1.38653564453125, 1.442230224609375, 1.4979248046875, 1.553619384765625, 1.60931396484375, 1.665008544921875, 1.720703125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 1.0, 4.0, 15.0, 14.0, 20.0, 22.0, 23.0, 46.0, 70.0, 96.0, 142.0, 175.0, 128.0, 88.0, 40.0, 31.0, 20.0, 15.0, 13.0, 8.0, 7.0, 3.0, 4.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.166015625, -2.10614013671875, -2.0462646484375, -1.98638916015625, -1.926513671875, -1.86663818359375, -1.8067626953125, -1.74688720703125, -1.68701171875, -1.62713623046875, -1.5672607421875, -1.50738525390625, -1.447509765625, -1.38763427734375, -1.3277587890625, -1.26788330078125, -1.2080078125, -1.14813232421875, -1.0882568359375, -1.02838134765625, -0.968505859375, -0.90863037109375, -0.8487548828125, -0.78887939453125, -0.72900390625, -0.66912841796875, -0.6092529296875, -0.54937744140625, -0.489501953125, -0.42962646484375, -0.3697509765625, -0.30987548828125, -0.25, -0.19012451171875, -0.1302490234375, -0.07037353515625, -0.010498046875, 0.04937744140625, 0.1092529296875, 0.16912841796875, 0.22900390625, 0.28887939453125, 0.3487548828125, 0.40863037109375, 0.468505859375, 0.52838134765625, 0.5882568359375, 0.64813232421875, 0.7080078125, 0.76788330078125, 0.8277587890625, 0.88763427734375, 0.947509765625, 1.00738525390625, 1.0672607421875, 1.12713623046875, 1.18701171875, 1.24688720703125, 1.3067626953125, 1.36663818359375, 1.426513671875, 1.48638916015625, 1.5462646484375, 1.60614013671875, 1.666015625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 4.0, 10.0, 20.0, 87.0, 330.0, 406.0, 104.0, 29.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.24677848815918, -18.44936752319336, -17.651954650878906, -16.854543685913086, -16.057132720947266, -15.259720802307129, -14.462308883666992, -13.664897918701172, -12.867486000061035, -12.070074081420898, -11.272663116455078, -10.475251197814941, -9.677839279174805, -8.880428314208984, -8.083016395568848, -7.285604953765869, -6.488193511962891, -5.690782070159912, -4.893370628356934, -4.095958709716797, -3.2985472679138184, -2.50113582611084, -1.7037239074707031, -0.9063124656677246, -0.1089010238647461, 0.688510537147522, 1.48592209815979, 2.2833337783813477, 3.080745220184326, 3.8781566619873047, 4.675568580627441, 5.47298002243042, 6.270389556884766, 7.067800998687744, 7.865212440490723, 8.66262435913086, 9.46003532409668, 10.257447242736816, 11.054859161376953, 11.852270126342773, 12.64968204498291, 13.447093963623047, 14.244504928588867, 15.041916847229004, 15.83932876586914, 16.63673973083496, 17.43415069580078, 18.231563568115234, 19.028974533081055, 19.826385498046875, 20.623798370361328, 21.42120933532715, 22.21862030029297, 23.016033172607422, 23.813444137573242, 24.610855102539062, 25.408267974853516, 26.205678939819336, 27.00309181213379, 27.80050277709961, 28.59791374206543, 29.39532470703125, 30.192737579345703, 30.990148544311523, 31.787559509277344]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 3.0, 5.0, 10.0, 8.0, 15.0, 12.0, 16.0, 28.0, 41.0, 40.0, 64.0, 81.0, 89.0, 118.0, 97.0, 98.0, 64.0, 50.0, 45.0, 32.0, 18.0, 14.0, 11.0, 3.0, 4.0, 3.0, 4.0, 4.0, 2.0, 5.0, 2.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.791168212890625, -16.354806900024414, -15.918447494506836, -15.482086181640625, -15.04572582244873, -14.609365463256836, -14.173005104064941, -13.736644744873047, -13.300284385681152, -12.863924026489258, -12.427563667297363, -11.991203308105469, -11.554841995239258, -11.118481636047363, -10.682121276855469, -10.245760917663574, -9.80940055847168, -9.373040199279785, -8.93667984008789, -8.50031852722168, -8.063958168029785, -7.627597808837891, -7.191237449645996, -6.754877090454102, -6.318515777587891, -5.882155418395996, -5.445794582366943, -5.009434223175049, -4.573073863983154, -4.136713027954102, -3.700352668762207, -3.2639923095703125, -2.827631950378418, -2.3912713527679443, -1.9549109935760498, -1.5185503959655762, -1.082189917564392, -0.645829439163208, -0.20946884155273438, 0.22689151763916016, 0.6632521152496338, 1.0996125936508179, 1.535973072052002, 1.9723336696624756, 2.408694267272949, 2.8450546264648438, 3.2814152240753174, 3.717775583267212, 4.1541361808776855, 4.59049654006958, 5.026857376098633, 5.463217735290527, 5.899578094482422, 6.335938453674316, 6.772299289703369, 7.208659648895264, 7.645020484924316, 8.081380844116211, 8.517741203308105, 8.9541015625, 9.390462875366211, 9.826823234558105, 10.26318359375, 10.699543952941895, 11.135904312133789]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 6.0, 4.0, 6.0, 9.0, 13.0, 23.0, 25.0, 24.0, 50.0, 70.0, 95.0, 119.0, 151.0, 227.0, 302.0, 394.0, 620.0, 943.0, 1608.0, 3074.0, 7407.0, 34959.0, 3979128.0, 141888.0, 13211.0, 4517.0, 2114.0, 1112.0, 679.0, 435.0, 296.0, 233.0, 131.0, 96.0, 79.0, 51.0, 29.0, 35.0, 33.0, 23.0, 11.0, 14.0, 9.0, 10.0, 8.0, 6.0, 4.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.02734375, -4.8392333984375, -4.651123046875, -4.4630126953125, -4.27490234375, -4.0867919921875, -3.898681640625, -3.7105712890625, -3.5224609375, -3.3343505859375, -3.146240234375, -2.9581298828125, -2.77001953125, -2.5819091796875, -2.393798828125, -2.2056884765625, -2.017578125, -1.8294677734375, -1.641357421875, -1.4532470703125, -1.26513671875, -1.0770263671875, -0.888916015625, -0.7008056640625, -0.5126953125, -0.3245849609375, -0.136474609375, 0.0516357421875, 0.23974609375, 0.4278564453125, 0.615966796875, 0.8040771484375, 0.9921875, 1.1802978515625, 1.368408203125, 1.5565185546875, 1.74462890625, 1.9327392578125, 2.120849609375, 2.3089599609375, 2.4970703125, 2.6851806640625, 2.873291015625, 3.0614013671875, 3.24951171875, 3.4376220703125, 3.625732421875, 3.8138427734375, 4.001953125, 4.1900634765625, 4.378173828125, 4.5662841796875, 4.75439453125, 4.9425048828125, 5.130615234375, 5.3187255859375, 5.5068359375, 5.6949462890625, 5.883056640625, 6.0711669921875, 6.25927734375, 6.4473876953125, 6.635498046875, 6.8236083984375, 7.01171875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 1.0, 6.0, 3.0, 5.0, 8.0, 6.0, 12.0, 20.0, 22.0, 29.0, 60.0, 107.0, 183.0, 207.0, 143.0, 62.0, 31.0, 23.0, 19.0, 17.0, 11.0, 5.0, 4.0, 2.0, 2.0, 6.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32470703125, -0.31270599365234375, -0.3007049560546875, -0.28870391845703125, -0.276702880859375, -0.26470184326171875, -0.2527008056640625, -0.24069976806640625, -0.22869873046875, -0.21669769287109375, -0.2046966552734375, -0.19269561767578125, -0.180694580078125, -0.16869354248046875, -0.1566925048828125, -0.14469146728515625, -0.1326904296875, -0.12068939208984375, -0.1086883544921875, -0.09668731689453125, -0.084686279296875, -0.07268524169921875, -0.0606842041015625, -0.04868316650390625, -0.03668212890625, -0.02468109130859375, -0.0126800537109375, -0.00067901611328125, 0.011322021484375, 0.02332305908203125, 0.0353240966796875, 0.04732513427734375, 0.059326171875, 0.07132720947265625, 0.0833282470703125, 0.09532928466796875, 0.107330322265625, 0.11933135986328125, 0.1313323974609375, 0.14333343505859375, 0.15533447265625, 0.16733551025390625, 0.1793365478515625, 0.19133758544921875, 0.203338623046875, 0.21533966064453125, 0.2273406982421875, 0.23934173583984375, 0.2513427734375, 0.26334381103515625, 0.2753448486328125, 0.28734588623046875, 0.299346923828125, 0.31134796142578125, 0.3233489990234375, 0.33535003662109375, 0.34735107421875, 0.35935211181640625, 0.3713531494140625, 0.38335418701171875, 0.395355224609375, 0.40735626220703125, 0.4193572998046875, 0.43135833740234375, 0.443359375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 0.0, 3.0, 4.0, 6.0, 8.0, 22.0, 18.0, 29.0, 57.0, 121.0, 493.0, 3976.0, 1079146.0, 3104837.0, 4709.0, 542.0, 160.0, 57.0, 37.0, 14.0, 8.0, 6.0, 10.0, 4.0, 3.0, 3.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.1796875, -8.9017333984375, -8.623779296875, -8.3458251953125, -8.06787109375, -7.7899169921875, -7.511962890625, -7.2340087890625, -6.9560546875, -6.6781005859375, -6.400146484375, -6.1221923828125, -5.84423828125, -5.5662841796875, -5.288330078125, -5.0103759765625, -4.732421875, -4.4544677734375, -4.176513671875, -3.8985595703125, -3.62060546875, -3.3426513671875, -3.064697265625, -2.7867431640625, -2.5087890625, -2.2308349609375, -1.952880859375, -1.6749267578125, -1.39697265625, -1.1190185546875, -0.841064453125, -0.5631103515625, -0.28515625, -0.0072021484375, 0.270751953125, 0.5487060546875, 0.82666015625, 1.1046142578125, 1.382568359375, 1.6605224609375, 1.9384765625, 2.2164306640625, 2.494384765625, 2.7723388671875, 3.05029296875, 3.3282470703125, 3.606201171875, 3.8841552734375, 4.162109375, 4.4400634765625, 4.718017578125, 4.9959716796875, 5.27392578125, 5.5518798828125, 5.829833984375, 6.1077880859375, 6.3857421875, 6.6636962890625, 6.941650390625, 7.2196044921875, 7.49755859375, 7.7755126953125, 8.053466796875, 8.3314208984375, 8.609375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 3.0, 0.0, 6.0, 4.0, 9.0, 12.0, 9.0, 30.0, 42.0, 76.0, 118.0, 374.0, 1438.0, 1225.0, 355.0, 145.0, 87.0, 48.0, 22.0, 12.0, 16.0, 11.0, 7.0, 2.0, 8.0, 4.0, 7.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5810546875, -0.5623016357421875, -0.543548583984375, -0.5247955322265625, -0.50604248046875, -0.4872894287109375, -0.468536376953125, -0.4497833251953125, -0.4310302734375, -0.4122772216796875, -0.393524169921875, -0.3747711181640625, -0.35601806640625, -0.3372650146484375, -0.318511962890625, -0.2997589111328125, -0.281005859375, -0.2622528076171875, -0.243499755859375, -0.2247467041015625, -0.20599365234375, -0.1872406005859375, -0.168487548828125, -0.1497344970703125, -0.1309814453125, -0.1122283935546875, -0.093475341796875, -0.0747222900390625, -0.05596923828125, -0.0372161865234375, -0.018463134765625, 0.0002899169921875, 0.01904296875, 0.0377960205078125, 0.056549072265625, 0.0753021240234375, 0.09405517578125, 0.1128082275390625, 0.131561279296875, 0.1503143310546875, 0.1690673828125, 0.1878204345703125, 0.206573486328125, 0.2253265380859375, 0.24407958984375, 0.2628326416015625, 0.281585693359375, 0.3003387451171875, 0.319091796875, 0.3378448486328125, 0.356597900390625, 0.3753509521484375, 0.39410400390625, 0.4128570556640625, 0.431610107421875, 0.4503631591796875, 0.4691162109375, 0.4878692626953125, 0.506622314453125, 0.5253753662109375, 0.54412841796875, 0.5628814697265625, 0.581634521484375, 0.6003875732421875, 0.619140625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 24.0, 130.0, 441.0, 300.0, 71.0, 22.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.944924354553223, -5.769207954406738, -5.593491554260254, -5.417774677276611, -5.242058277130127, -5.066341876983643, -4.890625, -4.714908599853516, -4.539192199707031, -4.363475799560547, -4.1877593994140625, -4.01204252243042, -3.8363261222839355, -3.660609722137451, -3.4848930835723877, -3.309176445007324, -3.13346004486084, -2.9577436447143555, -2.782027006149292, -2.6063103675842285, -2.430593967437744, -2.2548775672912598, -2.0791609287261963, -1.9034444093704224, -1.7277278900146484, -1.5520113706588745, -1.3762948513031006, -1.2005783319473267, -1.0248618125915527, -0.8491452932357788, -0.6734287738800049, -0.49771225452423096, -0.32199573516845703, -0.1462792158126831, 0.02943730354309082, 0.20515382289886475, 0.38087034225463867, 0.5565868616104126, 0.7323033809661865, 0.9080199003219604, 1.0837364196777344, 1.2594529390335083, 1.4351694583892822, 1.6108859777450562, 1.78660249710083, 1.962319016456604, 2.138035535812378, 2.3137521743774414, 2.489468574523926, 2.66518497467041, 2.8409016132354736, 3.016618251800537, 3.1923346519470215, 3.368051052093506, 3.5437676906585693, 3.719484329223633, 3.895200729370117, 4.070917129516602, 4.246633529663086, 4.4223504066467285, 4.598066806793213, 4.773783206939697, 4.94950008392334, 5.125216484069824, 5.300932884216309]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 1.0, 8.0, 10.0, 15.0, 11.0, 17.0, 38.0, 30.0, 46.0, 55.0, 59.0, 61.0, 68.0, 79.0, 98.0, 62.0, 59.0, 72.0, 40.0, 31.0, 27.0, 28.0, 23.0, 20.0, 6.0, 4.0, 11.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9736270904541016, -1.904973030090332, -1.8363189697265625, -1.7676650285720825, -1.699010968208313, -1.6303569078445435, -1.5617029666900635, -1.493048906326294, -1.4243948459625244, -1.3557407855987549, -1.2870867252349854, -1.2184327840805054, -1.1497787237167358, -1.0811246633529663, -1.0124707221984863, -0.9438166618347168, -0.8751626014709473, -0.8065085411071777, -0.737854540348053, -0.6692005395889282, -0.6005464792251587, -0.5318924188613892, -0.4632384181022644, -0.39458438754081726, -0.3259303569793701, -0.257276326417923, -0.18862229585647583, -0.11996826529502869, -0.05131423473358154, 0.0173397958278656, 0.08599382638931274, 0.1546478569507599, 0.22330188751220703, 0.2919559180736542, 0.3606099486351013, 0.42926397919654846, 0.4979180097579956, 0.5665720701217651, 0.6352260708808899, 0.7038800716400146, 0.7725341320037842, 0.8411881923675537, 0.9098421931266785, 0.9784961938858032, 1.0471502542495728, 1.1158043146133423, 1.1844582557678223, 1.2531123161315918, 1.3217663764953613, 1.3904204368591309, 1.4590744972229004, 1.5277284383773804, 1.59638249874115, 1.6650365591049194, 1.7336905002593994, 1.802344560623169, 1.8709986209869385, 1.939652681350708, 2.0083067417144775, 2.076960802078247, 2.1456146240234375, 2.214268684387207, 2.2829227447509766, 2.351576805114746, 2.4202308654785156]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 11.0, 8.0, 13.0, 17.0, 34.0, 45.0, 63.0, 103.0, 152.0, 292.0, 457.0, 916.0, 1742.0, 4730.0, 18603.0, 220407.0, 744407.0, 43235.0, 7973.0, 2643.0, 1162.0, 610.0, 362.0, 195.0, 121.0, 80.0, 48.0, 39.0, 29.0, 16.0, 6.0, 9.0, 5.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.064453125, -2.974884033203125, -2.88531494140625, -2.795745849609375, -2.7061767578125, -2.616607666015625, -2.52703857421875, -2.437469482421875, -2.347900390625, -2.258331298828125, -2.16876220703125, -2.079193115234375, -1.9896240234375, -1.900054931640625, -1.81048583984375, -1.720916748046875, -1.63134765625, -1.541778564453125, -1.45220947265625, -1.362640380859375, -1.2730712890625, -1.183502197265625, -1.09393310546875, -1.004364013671875, -0.914794921875, -0.825225830078125, -0.73565673828125, -0.646087646484375, -0.5565185546875, -0.466949462890625, -0.37738037109375, -0.287811279296875, -0.1982421875, -0.108673095703125, -0.01910400390625, 0.070465087890625, 0.1600341796875, 0.249603271484375, 0.33917236328125, 0.428741455078125, 0.518310546875, 0.607879638671875, 0.69744873046875, 0.787017822265625, 0.8765869140625, 0.966156005859375, 1.05572509765625, 1.145294189453125, 1.23486328125, 1.324432373046875, 1.41400146484375, 1.503570556640625, 1.5931396484375, 1.682708740234375, 1.77227783203125, 1.861846923828125, 1.951416015625, 2.040985107421875, 2.13055419921875, 2.220123291015625, 2.3096923828125, 2.399261474609375, 2.48883056640625, 2.578399658203125, 2.66796875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 3.0, 5.0, 12.0, 16.0, 19.0, 53.0, 67.0, 115.0, 178.0, 186.0, 130.0, 90.0, 42.0, 27.0, 22.0, 11.0, 6.0, 2.0, 1.0, 0.0, 7.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33251953125, -0.32068634033203125, -0.3088531494140625, -0.29701995849609375, -0.285186767578125, -0.27335357666015625, -0.2615203857421875, -0.24968719482421875, -0.23785400390625, -0.22602081298828125, -0.2141876220703125, -0.20235443115234375, -0.190521240234375, -0.17868804931640625, -0.1668548583984375, -0.15502166748046875, -0.1431884765625, -0.13135528564453125, -0.1195220947265625, -0.10768890380859375, -0.095855712890625, -0.08402252197265625, -0.0721893310546875, -0.06035614013671875, -0.04852294921875, -0.03668975830078125, -0.0248565673828125, -0.01302337646484375, -0.001190185546875, 0.01064300537109375, 0.0224761962890625, 0.03430938720703125, 0.046142578125, 0.05797576904296875, 0.0698089599609375, 0.08164215087890625, 0.093475341796875, 0.10530853271484375, 0.1171417236328125, 0.12897491455078125, 0.14080810546875, 0.15264129638671875, 0.1644744873046875, 0.17630767822265625, 0.188140869140625, 0.19997406005859375, 0.2118072509765625, 0.22364044189453125, 0.2354736328125, 0.24730682373046875, 0.2591400146484375, 0.27097320556640625, 0.282806396484375, 0.29463958740234375, 0.3064727783203125, 0.31830596923828125, 0.33013916015625, 0.34197235107421875, 0.3538055419921875, 0.36563873291015625, 0.377471923828125, 0.38930511474609375, 0.4011383056640625, 0.41297149658203125, 0.4248046875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 10.0, 6.0, 13.0, 15.0, 21.0, 39.0, 52.0, 69.0, 79.0, 128.0, 192.0, 291.0, 532.0, 1130.0, 3406.0, 13645.0, 84088.0, 595118.0, 302667.0, 35823.0, 7220.0, 2143.0, 805.0, 391.0, 210.0, 138.0, 78.0, 74.0, 44.0, 35.0, 26.0, 19.0, 14.0, 13.0, 5.0, 6.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5673828125, -1.5041656494140625, -1.440948486328125, -1.3777313232421875, -1.31451416015625, -1.2512969970703125, -1.188079833984375, -1.1248626708984375, -1.0616455078125, -0.9984283447265625, -0.935211181640625, -0.8719940185546875, -0.80877685546875, -0.7455596923828125, -0.682342529296875, -0.6191253662109375, -0.555908203125, -0.4926910400390625, -0.429473876953125, -0.3662567138671875, -0.30303955078125, -0.2398223876953125, -0.176605224609375, -0.1133880615234375, -0.0501708984375, 0.0130462646484375, 0.076263427734375, 0.1394805908203125, 0.20269775390625, 0.2659149169921875, 0.329132080078125, 0.3923492431640625, 0.45556640625, 0.5187835693359375, 0.582000732421875, 0.6452178955078125, 0.70843505859375, 0.7716522216796875, 0.834869384765625, 0.8980865478515625, 0.9613037109375, 1.0245208740234375, 1.087738037109375, 1.1509552001953125, 1.21417236328125, 1.2773895263671875, 1.340606689453125, 1.4038238525390625, 1.467041015625, 1.5302581787109375, 1.593475341796875, 1.6566925048828125, 1.71990966796875, 1.7831268310546875, 1.846343994140625, 1.9095611572265625, 1.9727783203125, 2.0359954833984375, 2.099212646484375, 2.1624298095703125, 2.22564697265625, 2.2888641357421875, 2.352081298828125, 2.4152984619140625, 2.478515625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 5.0, 6.0, 4.0, 2.0, 7.0, 9.0, 12.0, 15.0, 20.0, 18.0, 30.0, 30.0, 20.0, 42.0, 45.0, 42.0, 41.0, 52.0, 35.0, 49.0, 47.0, 65.0, 63.0, 56.0, 53.0, 38.0, 28.0, 32.0, 31.0, 24.0, 12.0, 12.0, 10.0, 11.0, 11.0, 9.0, 6.0, 5.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89111328125, -0.8545913696289062, -0.8180694580078125, -0.7815475463867188, -0.745025634765625, -0.7085037231445312, -0.6719818115234375, -0.6354598999023438, -0.59893798828125, -0.5624160766601562, -0.5258941650390625, -0.48937225341796875, -0.452850341796875, -0.41632843017578125, -0.3798065185546875, -0.34328460693359375, -0.3067626953125, -0.27024078369140625, -0.2337188720703125, -0.19719696044921875, -0.160675048828125, -0.12415313720703125, -0.0876312255859375, -0.05110931396484375, -0.01458740234375, 0.02193450927734375, 0.0584564208984375, 0.09497833251953125, 0.131500244140625, 0.16802215576171875, 0.2045440673828125, 0.24106597900390625, 0.277587890625, 0.31410980224609375, 0.3506317138671875, 0.38715362548828125, 0.423675537109375, 0.46019744873046875, 0.4967193603515625, 0.5332412719726562, 0.56976318359375, 0.6062850952148438, 0.6428070068359375, 0.6793289184570312, 0.715850830078125, 0.7523727416992188, 0.7888946533203125, 0.8254165649414062, 0.8619384765625, 0.8984603881835938, 0.9349822998046875, 0.9715042114257812, 1.008026123046875, 1.0445480346679688, 1.0810699462890625, 1.1175918579101562, 1.15411376953125, 1.1906356811523438, 1.2271575927734375, 1.2636795043945312, 1.300201416015625, 1.3367233276367188, 1.3732452392578125, 1.4097671508789062, 1.4462890625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 10.0, 13.0, 20.0, 20.0, 36.0, 50.0, 99.0, 176.0, 387.0, 1063.0, 3590.0, 18588.0, 211912.0, 747394.0, 54272.0, 7761.0, 1898.0, 640.0, 271.0, 136.0, 72.0, 48.0, 30.0, 9.0, 12.0, 11.0, 8.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.767578125, -1.720123291015625, -1.67266845703125, -1.625213623046875, -1.5777587890625, -1.530303955078125, -1.48284912109375, -1.435394287109375, -1.387939453125, -1.340484619140625, -1.29302978515625, -1.245574951171875, -1.1981201171875, -1.150665283203125, -1.10321044921875, -1.055755615234375, -1.00830078125, -0.960845947265625, -0.91339111328125, -0.865936279296875, -0.8184814453125, -0.771026611328125, -0.72357177734375, -0.676116943359375, -0.628662109375, -0.581207275390625, -0.53375244140625, -0.486297607421875, -0.4388427734375, -0.391387939453125, -0.34393310546875, -0.296478271484375, -0.2490234375, -0.201568603515625, -0.15411376953125, -0.106658935546875, -0.0592041015625, -0.011749267578125, 0.03570556640625, 0.083160400390625, 0.130615234375, 0.178070068359375, 0.22552490234375, 0.272979736328125, 0.3204345703125, 0.367889404296875, 0.41534423828125, 0.462799072265625, 0.51025390625, 0.557708740234375, 0.60516357421875, 0.652618408203125, 0.7000732421875, 0.747528076171875, 0.79498291015625, 0.842437744140625, 0.889892578125, 0.937347412109375, 0.98480224609375, 1.032257080078125, 1.0797119140625, 1.127166748046875, 1.17462158203125, 1.222076416015625, 1.26953125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 9.0, 8.0, 4.0, 7.0, 14.0, 5.0, 9.0, 18.0, 16.0, 24.0, 22.0, 39.0, 38.0, 44.0, 79.0, 71.0, 95.0, 88.0, 86.0, 68.0, 47.0, 40.0, 32.0, 26.0, 21.0, 14.0, 12.0, 11.0, 7.0, 15.0, 7.0, 7.0, 0.0, 10.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011038780212402344, -0.00010697171092033386, -0.00010355561971664429, -0.00010013952851295471, -9.672343730926514e-05, -9.330734610557556e-05, -8.989125490188599e-05, -8.647516369819641e-05, -8.305907249450684e-05, -7.964298129081726e-05, -7.622689008712769e-05, -7.281079888343811e-05, -6.939470767974854e-05, -6.597861647605896e-05, -6.256252527236938e-05, -5.914643406867981e-05, -5.5730342864990234e-05, -5.231425166130066e-05, -4.8898160457611084e-05, -4.548206925392151e-05, -4.2065978050231934e-05, -3.864988684654236e-05, -3.523379564285278e-05, -3.181770443916321e-05, -2.8401613235473633e-05, -2.4985522031784058e-05, -2.1569430828094482e-05, -1.8153339624404907e-05, -1.4737248420715332e-05, -1.1321157217025757e-05, -7.905066013336182e-06, -4.4889748096466064e-06, -1.0728836059570312e-06, 2.343207597732544e-06, 5.759298801422119e-06, 9.175390005111694e-06, 1.259148120880127e-05, 1.6007572412490845e-05, 1.942366361618042e-05, 2.2839754819869995e-05, 2.625584602355957e-05, 2.9671937227249146e-05, 3.308802843093872e-05, 3.6504119634628296e-05, 3.992021083831787e-05, 4.3336302042007446e-05, 4.675239324569702e-05, 5.01684844493866e-05, 5.358457565307617e-05, 5.700066685676575e-05, 6.041675806045532e-05, 6.38328492641449e-05, 6.724894046783447e-05, 7.066503167152405e-05, 7.408112287521362e-05, 7.74972140789032e-05, 8.091330528259277e-05, 8.432939648628235e-05, 8.774548768997192e-05, 9.11615788936615e-05, 9.457767009735107e-05, 9.799376130104065e-05, 0.00010140985250473022, 0.0001048259437084198, 0.00010824203491210938]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 9.0, 10.0, 12.0, 16.0, 27.0, 31.0, 43.0, 56.0, 69.0, 112.0, 158.0, 224.0, 379.0, 704.0, 1551.0, 4612.0, 17252.0, 81700.0, 619113.0, 267024.0, 40735.0, 9413.0, 2833.0, 1104.0, 508.0, 245.0, 183.0, 122.0, 83.0, 76.0, 40.0, 30.0, 20.0, 17.0, 9.0, 8.0, 9.0, 4.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.03125, -0.9977569580078125, -0.964263916015625, -0.9307708740234375, -0.89727783203125, -0.8637847900390625, -0.830291748046875, -0.7967987060546875, -0.7633056640625, -0.7298126220703125, -0.696319580078125, -0.6628265380859375, -0.62933349609375, -0.5958404541015625, -0.562347412109375, -0.5288543701171875, -0.495361328125, -0.4618682861328125, -0.428375244140625, -0.3948822021484375, -0.36138916015625, -0.3278961181640625, -0.294403076171875, -0.2609100341796875, -0.2274169921875, -0.1939239501953125, -0.160430908203125, -0.1269378662109375, -0.09344482421875, -0.0599517822265625, -0.026458740234375, 0.0070343017578125, 0.04052734375, 0.0740203857421875, 0.107513427734375, 0.1410064697265625, 0.17449951171875, 0.2079925537109375, 0.241485595703125, 0.2749786376953125, 0.3084716796875, 0.3419647216796875, 0.375457763671875, 0.4089508056640625, 0.44244384765625, 0.4759368896484375, 0.509429931640625, 0.5429229736328125, 0.576416015625, 0.6099090576171875, 0.643402099609375, 0.6768951416015625, 0.71038818359375, 0.7438812255859375, 0.777374267578125, 0.8108673095703125, 0.8443603515625, 0.8778533935546875, 0.911346435546875, 0.9448394775390625, 0.97833251953125, 1.0118255615234375, 1.045318603515625, 1.0788116455078125, 1.1123046875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 7.0, 8.0, 8.0, 12.0, 9.0, 16.0, 15.0, 21.0, 25.0, 34.0, 34.0, 61.0, 60.0, 74.0, 95.0, 99.0, 92.0, 70.0, 52.0, 49.0, 40.0, 18.0, 18.0, 15.0, 11.0, 8.0, 3.0, 15.0, 7.0, 5.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54150390625, -0.5234298706054688, -0.5053558349609375, -0.48728179931640625, -0.469207763671875, -0.45113372802734375, -0.4330596923828125, -0.41498565673828125, -0.39691162109375, -0.37883758544921875, -0.3607635498046875, -0.34268951416015625, -0.324615478515625, -0.30654144287109375, -0.2884674072265625, -0.27039337158203125, -0.2523193359375, -0.23424530029296875, -0.2161712646484375, -0.19809722900390625, -0.180023193359375, -0.16194915771484375, -0.1438751220703125, -0.12580108642578125, -0.10772705078125, -0.08965301513671875, -0.0715789794921875, -0.05350494384765625, -0.035430908203125, -0.01735687255859375, 0.0007171630859375, 0.01879119873046875, 0.036865234375, 0.05493927001953125, 0.0730133056640625, 0.09108734130859375, 0.109161376953125, 0.12723541259765625, 0.1453094482421875, 0.16338348388671875, 0.18145751953125, 0.19953155517578125, 0.2176055908203125, 0.23567962646484375, 0.253753662109375, 0.27182769775390625, 0.2899017333984375, 0.30797576904296875, 0.3260498046875, 0.34412384033203125, 0.3621978759765625, 0.38027191162109375, 0.398345947265625, 0.41641998291015625, 0.4344940185546875, 0.45256805419921875, 0.47064208984375, 0.48871612548828125, 0.5067901611328125, 0.5248641967773438, 0.542938232421875, 0.5610122680664062, 0.5790863037109375, 0.5971603393554688, 0.615234375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 27.0, 114.0, 486.0, 284.0, 59.0, 14.0, 10.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.217018127441406, -32.31507873535156, -31.41314125061035, -30.511201858520508, -29.609264373779297, -28.707324981689453, -27.80538558959961, -26.903446197509766, -26.001508712768555, -25.09956932067871, -24.1976318359375, -23.295692443847656, -22.393753051757812, -21.4918155670166, -20.589876174926758, -19.687938690185547, -18.785999298095703, -17.88405990600586, -16.98212242126465, -16.080183029174805, -15.178244590759277, -14.27630615234375, -13.374366760253906, -12.472428321838379, -11.570489883422852, -10.668551445007324, -9.766613006591797, -8.864673614501953, -7.962735176086426, -7.060796737670898, -6.158857822418213, -5.256918907165527, -4.35498046875, -3.4530417919158936, -2.551103115081787, -1.6491644382476807, -0.7472257614135742, 0.15471267700195312, 1.0566515922546387, 1.9585905075073242, 2.8605289459228516, 3.762467622756958, 4.6644062995910645, 5.56634521484375, 6.468283653259277, 7.370222091674805, 8.272161483764648, 9.174099922180176, 10.076038360595703, 10.97797679901123, 11.879915237426758, 12.781854629516602, 13.683793067932129, 14.585731506347656, 15.4876708984375, 16.389610290527344, 17.291547775268555, 18.1934871673584, 19.09542465209961, 19.997364044189453, 20.899303436279297, 21.801240921020508, 22.70318031311035, 23.605117797851562, 24.507057189941406]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 0.0, 7.0, 4.0, 11.0, 6.0, 10.0, 14.0, 13.0, 16.0, 26.0, 29.0, 42.0, 43.0, 35.0, 40.0, 50.0, 61.0, 58.0, 55.0, 50.0, 49.0, 46.0, 53.0, 60.0, 34.0, 32.0, 29.0, 28.0, 20.0, 16.0, 13.0, 11.0, 8.0, 14.0, 10.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-10.991156578063965, -10.698351860046387, -10.405548095703125, -10.112743377685547, -9.819939613342285, -9.527134895324707, -9.234331130981445, -8.941526412963867, -8.648721694946289, -8.355916976928711, -8.06311321258545, -7.770308971405029, -7.477504730224609, -7.184700012207031, -6.891895771026611, -6.599091529846191, -6.30628776550293, -6.01348352432251, -5.72067928314209, -5.42787504196167, -5.13507080078125, -4.842266082763672, -4.549461841583252, -4.256657600402832, -3.963853359222412, -3.671049118041992, -3.3782448768615723, -3.0854403972625732, -2.7926361560821533, -2.4998319149017334, -2.2070274353027344, -1.9142231941223145, -1.6214179992675781, -1.3286137580871582, -1.0358093976974487, -0.743005096912384, -0.45020079612731934, -0.15739655494689941, 0.13540780544281006, 0.42821216583251953, 0.7210164070129395, 1.0138206481933594, 1.3066250085830688, 1.5994293689727783, 1.8922336101531982, 2.185037851333618, 2.477842330932617, 2.770646572113037, 3.063450813293457, 3.356255054473877, 3.649059295654297, 3.941863775253296, 4.234667778015137, 4.527472496032715, 4.820276737213135, 5.113080978393555, 5.405885219573975, 5.6986894607543945, 5.9914937019348145, 6.284297943115234, 6.5771026611328125, 6.869906425476074, 7.162711143493652, 7.455515384674072, 7.748319625854492]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 9.0, 5.0, 4.0, 35.0, 34.0, 61.0, 99.0, 194.0, 741.0, 4300.0, 3976193.0, 208463.0, 3053.0, 627.0, 244.0, 86.0, 58.0, 33.0, 12.0, 15.0, 5.0, 7.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.140625, -11.70556640625, -11.2705078125, -10.83544921875, -10.400390625, -9.96533203125, -9.5302734375, -9.09521484375, -8.66015625, -8.22509765625, -7.7900390625, -7.35498046875, -6.919921875, -6.48486328125, -6.0498046875, -5.61474609375, -5.1796875, -4.74462890625, -4.3095703125, -3.87451171875, -3.439453125, -3.00439453125, -2.5693359375, -2.13427734375, -1.69921875, -1.26416015625, -0.8291015625, -0.39404296875, 0.041015625, 0.47607421875, 0.9111328125, 1.34619140625, 1.78125, 2.21630859375, 2.6513671875, 3.08642578125, 3.521484375, 3.95654296875, 4.3916015625, 4.82666015625, 5.26171875, 5.69677734375, 6.1318359375, 6.56689453125, 7.001953125, 7.43701171875, 7.8720703125, 8.30712890625, 8.7421875, 9.17724609375, 9.6123046875, 10.04736328125, 10.482421875, 10.91748046875, 11.3525390625, 11.78759765625, 12.22265625, 12.65771484375, 13.0927734375, 13.52783203125, 13.962890625, 14.39794921875, 14.8330078125, 15.26806640625, 15.703125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 3.0, 5.0, 12.0, 20.0, 22.0, 38.0, 72.0, 85.0, 151.0, 135.0, 121.0, 95.0, 85.0, 61.0, 36.0, 22.0, 12.0, 5.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39453125, -0.38031005859375, -0.3660888671875, -0.35186767578125, -0.337646484375, -0.32342529296875, -0.3092041015625, -0.29498291015625, -0.28076171875, -0.26654052734375, -0.2523193359375, -0.23809814453125, -0.223876953125, -0.20965576171875, -0.1954345703125, -0.18121337890625, -0.1669921875, -0.15277099609375, -0.1385498046875, -0.12432861328125, -0.110107421875, -0.09588623046875, -0.0816650390625, -0.06744384765625, -0.05322265625, -0.03900146484375, -0.0247802734375, -0.01055908203125, 0.003662109375, 0.01788330078125, 0.0321044921875, 0.04632568359375, 0.060546875, 0.07476806640625, 0.0889892578125, 0.10321044921875, 0.117431640625, 0.13165283203125, 0.1458740234375, 0.16009521484375, 0.17431640625, 0.18853759765625, 0.2027587890625, 0.21697998046875, 0.231201171875, 0.24542236328125, 0.2596435546875, 0.27386474609375, 0.2880859375, 0.30230712890625, 0.3165283203125, 0.33074951171875, 0.344970703125, 0.35919189453125, 0.3734130859375, 0.38763427734375, 0.40185546875, 0.41607666015625, 0.4302978515625, 0.44451904296875, 0.458740234375, 0.47296142578125, 0.4871826171875, 0.50140380859375, 0.515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 9.0, 17.0, 17.0, 41.0, 66.0, 137.0, 247.0, 612.0, 1543.0, 4946.0, 23966.0, 305052.0, 3721249.0, 115912.0, 14590.0, 3663.0, 1234.0, 493.0, 229.0, 117.0, 66.0, 37.0, 16.0, 9.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.537109375, -2.461029052734375, -2.38494873046875, -2.308868408203125, -2.2327880859375, -2.156707763671875, -2.08062744140625, -2.004547119140625, -1.928466796875, -1.852386474609375, -1.77630615234375, -1.700225830078125, -1.6241455078125, -1.548065185546875, -1.47198486328125, -1.395904541015625, -1.31982421875, -1.243743896484375, -1.16766357421875, -1.091583251953125, -1.0155029296875, -0.939422607421875, -0.86334228515625, -0.787261962890625, -0.711181640625, -0.635101318359375, -0.55902099609375, -0.482940673828125, -0.4068603515625, -0.330780029296875, -0.25469970703125, -0.178619384765625, -0.1025390625, -0.026458740234375, 0.04962158203125, 0.125701904296875, 0.2017822265625, 0.277862548828125, 0.35394287109375, 0.430023193359375, 0.506103515625, 0.582183837890625, 0.65826416015625, 0.734344482421875, 0.8104248046875, 0.886505126953125, 0.96258544921875, 1.038665771484375, 1.11474609375, 1.190826416015625, 1.26690673828125, 1.342987060546875, 1.4190673828125, 1.495147705078125, 1.57122802734375, 1.647308349609375, 1.723388671875, 1.799468994140625, 1.87554931640625, 1.951629638671875, 2.0277099609375, 2.103790283203125, 2.17987060546875, 2.255950927734375, 2.33203125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 2.0, 1.0, 3.0, 3.0, 15.0, 18.0, 17.0, 24.0, 28.0, 59.0, 82.0, 134.0, 240.0, 552.0, 1434.0, 685.0, 292.0, 167.0, 99.0, 65.0, 42.0, 18.0, 25.0, 22.0, 11.0, 8.0, 7.0, 2.0, 5.0, 0.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.50244140625, -0.4879264831542969, -0.47341156005859375, -0.4588966369628906, -0.4443817138671875, -0.4298667907714844, -0.41535186767578125, -0.4008369445800781, -0.386322021484375, -0.3718070983886719, -0.35729217529296875, -0.3427772521972656, -0.3282623291015625, -0.3137474060058594, -0.29923248291015625, -0.2847175598144531, -0.27020263671875, -0.2556877136230469, -0.24117279052734375, -0.22665786743164062, -0.2121429443359375, -0.19762802124023438, -0.18311309814453125, -0.16859817504882812, -0.154083251953125, -0.13956832885742188, -0.12505340576171875, -0.11053848266601562, -0.0960235595703125, -0.08150863647460938, -0.06699371337890625, -0.052478790283203125, -0.0379638671875, -0.023448944091796875, -0.00893402099609375, 0.005580902099609375, 0.0200958251953125, 0.034610748291015625, 0.04912567138671875, 0.06364059448242188, 0.078155517578125, 0.09267044067382812, 0.10718536376953125, 0.12170028686523438, 0.1362152099609375, 0.15073013305664062, 0.16524505615234375, 0.17975997924804688, 0.19427490234375, 0.20878982543945312, 0.22330474853515625, 0.23781967163085938, 0.2523345947265625, 0.2668495178222656, 0.28136444091796875, 0.2958793640136719, 0.310394287109375, 0.3249092102050781, 0.33942413330078125, 0.3539390563964844, 0.3684539794921875, 0.3829689025878906, 0.39748382568359375, 0.4119987487792969, 0.426513671875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 21.0, 85.0, 282.0, 412.0, 155.0, 29.0, 11.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6905460357666016, -1.505519151687622, -1.320492148399353, -1.135465145111084, -0.9504382610321045, -0.7654113173484802, -0.580384373664856, -0.3953573703765869, -0.21033048629760742, -0.025303542613983154, 0.1597234010696411, 0.3447503447532654, 0.5297772884368896, 0.7148042321205139, 0.8998311758041382, 1.0848581790924072, 1.2698850631713867, 1.4549119472503662, 1.6399389505386353, 1.8249659538269043, 2.009992837905884, 2.1950197219848633, 2.380046844482422, 2.5650737285614014, 2.750100612640381, 2.9351274967193604, 3.12015438079834, 3.3051815032958984, 3.490208387374878, 3.6752352714538574, 3.860262393951416, 4.045289039611816, 4.230316162109375, 4.415343284606934, 4.600369930267334, 4.785397052764893, 4.970423698425293, 5.155450820922852, 5.34047794342041, 5.525505065917969, 5.710531711578369, 5.895558834075928, 6.080585479736328, 6.265612602233887, 6.450639724731445, 6.635666370391846, 6.820693492889404, 7.005720138549805, 7.190747261047363, 7.375774383544922, 7.560801029205322, 7.745828151702881, 7.930854797363281, 8.11588191986084, 8.300909042358398, 8.485936164855957, 8.670963287353516, 8.855990409851074, 9.041017532348633, 9.226043701171875, 9.411070823669434, 9.596097946166992, 9.78112506866455, 9.96615219116211, 10.151178359985352]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 7.0, 3.0, 4.0, 2.0, 9.0, 14.0, 14.0, 17.0, 23.0, 21.0, 9.0, 41.0, 30.0, 38.0, 38.0, 42.0, 43.0, 51.0, 40.0, 43.0, 48.0, 43.0, 55.0, 42.0, 43.0, 46.0, 27.0, 24.0, 34.0, 34.0, 24.0, 11.0, 15.0, 14.0, 6.0, 11.0, 7.0, 4.0, 7.0, 8.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.682251214981079, -1.6342061758041382, -1.5861611366271973, -1.5381160974502563, -1.4900710582733154, -1.442026138305664, -1.3939810991287231, -1.3459360599517822, -1.2978910207748413, -1.2498459815979004, -1.2018009424209595, -1.1537559032440186, -1.1057109832763672, -1.0576659440994263, -1.0096209049224854, -0.9615758657455444, -0.9135308265686035, -0.8654857873916626, -0.8174407482147217, -0.7693957686424255, -0.7213507294654846, -0.6733056902885437, -0.6252607107162476, -0.5772156715393066, -0.5291706323623657, -0.4811255931854248, -0.4330805838108063, -0.38503557443618774, -0.3369905352592468, -0.2889454960823059, -0.24090048670768738, -0.19285547733306885, -0.14481055736541748, -0.09676553308963776, -0.04872050881385803, -0.0006754845380783081, 0.047369539737701416, 0.09541456401348114, 0.14345958828926086, 0.1915045976638794, 0.2395496368408203, 0.28759467601776123, 0.33563968539237976, 0.3836846947669983, 0.4317297339439392, 0.4797747731208801, 0.5278197526931763, 0.5758647918701172, 0.6239098310470581, 0.671954870223999, 0.7199999094009399, 0.7680448889732361, 0.816089928150177, 0.8641349673271179, 0.9121799468994141, 0.960224986076355, 1.008270025253296, 1.0563150644302368, 1.1043601036071777, 1.1524051427841187, 1.2004501819610596, 1.248495101928711, 1.2965401411056519, 1.3445851802825928, 1.3926302194595337]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 6.0, 8.0, 8.0, 6.0, 7.0, 12.0, 20.0, 44.0, 66.0, 104.0, 170.0, 313.0, 556.0, 1092.0, 2443.0, 7144.0, 37328.0, 506639.0, 448184.0, 33243.0, 6396.0, 2396.0, 1043.0, 568.0, 322.0, 164.0, 88.0, 58.0, 44.0, 20.0, 20.0, 9.0, 11.0, 4.0, 3.0, 1.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.32421875, -2.246673583984375, -2.16912841796875, -2.091583251953125, -2.0140380859375, -1.936492919921875, -1.85894775390625, -1.781402587890625, -1.703857421875, -1.626312255859375, -1.54876708984375, -1.471221923828125, -1.3936767578125, -1.316131591796875, -1.23858642578125, -1.161041259765625, -1.08349609375, -1.005950927734375, -0.92840576171875, -0.850860595703125, -0.7733154296875, -0.695770263671875, -0.61822509765625, -0.540679931640625, -0.463134765625, -0.385589599609375, -0.30804443359375, -0.230499267578125, -0.1529541015625, -0.075408935546875, 0.00213623046875, 0.079681396484375, 0.1572265625, 0.234771728515625, 0.31231689453125, 0.389862060546875, 0.4674072265625, 0.544952392578125, 0.62249755859375, 0.700042724609375, 0.777587890625, 0.855133056640625, 0.93267822265625, 1.010223388671875, 1.0877685546875, 1.165313720703125, 1.24285888671875, 1.320404052734375, 1.39794921875, 1.475494384765625, 1.55303955078125, 1.630584716796875, 1.7081298828125, 1.785675048828125, 1.86322021484375, 1.940765380859375, 2.018310546875, 2.095855712890625, 2.17340087890625, 2.250946044921875, 2.3284912109375, 2.406036376953125, 2.48358154296875, 2.561126708984375, 2.638671875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 10.0, 12.0, 17.0, 39.0, 63.0, 66.0, 124.0, 128.0, 147.0, 117.0, 96.0, 60.0, 39.0, 31.0, 18.0, 12.0, 3.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.395263671875, -0.381744384765625, -0.36822509765625, -0.354705810546875, -0.3411865234375, -0.327667236328125, -0.31414794921875, -0.300628662109375, -0.287109375, -0.273590087890625, -0.26007080078125, -0.246551513671875, -0.2330322265625, -0.219512939453125, -0.20599365234375, -0.192474365234375, -0.178955078125, -0.165435791015625, -0.15191650390625, -0.138397216796875, -0.1248779296875, -0.111358642578125, -0.09783935546875, -0.084320068359375, -0.07080078125, -0.057281494140625, -0.04376220703125, -0.030242919921875, -0.0167236328125, -0.003204345703125, 0.01031494140625, 0.023834228515625, 0.037353515625, 0.050872802734375, 0.06439208984375, 0.077911376953125, 0.0914306640625, 0.104949951171875, 0.11846923828125, 0.131988525390625, 0.1455078125, 0.159027099609375, 0.17254638671875, 0.186065673828125, 0.1995849609375, 0.213104248046875, 0.22662353515625, 0.240142822265625, 0.253662109375, 0.267181396484375, 0.28070068359375, 0.294219970703125, 0.3077392578125, 0.321258544921875, 0.33477783203125, 0.348297119140625, 0.36181640625, 0.375335693359375, 0.38885498046875, 0.402374267578125, 0.4158935546875, 0.429412841796875, 0.44293212890625, 0.456451416015625, 0.469970703125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 6.0, 17.0, 14.0, 19.0, 35.0, 38.0, 44.0, 46.0, 76.0, 97.0, 148.0, 207.0, 355.0, 651.0, 1418.0, 3429.0, 9744.0, 34323.0, 157036.0, 532012.0, 237437.0, 49267.0, 13522.0, 4587.0, 1826.0, 835.0, 424.0, 254.0, 173.0, 122.0, 88.0, 73.0, 54.0, 38.0, 36.0, 26.0, 20.0, 14.0, 13.0, 8.0, 10.0, 8.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.5380859375, -1.490936279296875, -1.44378662109375, -1.396636962890625, -1.3494873046875, -1.302337646484375, -1.25518798828125, -1.208038330078125, -1.160888671875, -1.113739013671875, -1.06658935546875, -1.019439697265625, -0.9722900390625, -0.925140380859375, -0.87799072265625, -0.830841064453125, -0.78369140625, -0.736541748046875, -0.68939208984375, -0.642242431640625, -0.5950927734375, -0.547943115234375, -0.50079345703125, -0.453643798828125, -0.406494140625, -0.359344482421875, -0.31219482421875, -0.265045166015625, -0.2178955078125, -0.170745849609375, -0.12359619140625, -0.076446533203125, -0.029296875, 0.017852783203125, 0.06500244140625, 0.112152099609375, 0.1593017578125, 0.206451416015625, 0.25360107421875, 0.300750732421875, 0.347900390625, 0.395050048828125, 0.44219970703125, 0.489349365234375, 0.5364990234375, 0.583648681640625, 0.63079833984375, 0.677947998046875, 0.72509765625, 0.772247314453125, 0.81939697265625, 0.866546630859375, 0.9136962890625, 0.960845947265625, 1.00799560546875, 1.055145263671875, 1.102294921875, 1.149444580078125, 1.19659423828125, 1.243743896484375, 1.2908935546875, 1.338043212890625, 1.38519287109375, 1.432342529296875, 1.4794921875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 8.0, 4.0, 12.0, 9.0, 17.0, 9.0, 13.0, 12.0, 26.0, 26.0, 25.0, 30.0, 35.0, 43.0, 43.0, 44.0, 50.0, 39.0, 46.0, 51.0, 43.0, 44.0, 48.0, 46.0, 45.0, 32.0, 30.0, 31.0, 18.0, 25.0, 20.0, 17.0, 11.0, 10.0, 13.0, 9.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.208984375, -1.1706695556640625, -1.132354736328125, -1.0940399169921875, -1.05572509765625, -1.0174102783203125, -0.979095458984375, -0.9407806396484375, -0.9024658203125, -0.8641510009765625, -0.825836181640625, -0.7875213623046875, -0.74920654296875, -0.7108917236328125, -0.672576904296875, -0.6342620849609375, -0.595947265625, -0.5576324462890625, -0.519317626953125, -0.4810028076171875, -0.44268798828125, -0.4043731689453125, -0.366058349609375, -0.3277435302734375, -0.2894287109375, -0.2511138916015625, -0.212799072265625, -0.1744842529296875, -0.13616943359375, -0.0978546142578125, -0.059539794921875, -0.0212249755859375, 0.01708984375, 0.0554046630859375, 0.093719482421875, 0.1320343017578125, 0.17034912109375, 0.2086639404296875, 0.246978759765625, 0.2852935791015625, 0.3236083984375, 0.3619232177734375, 0.400238037109375, 0.4385528564453125, 0.47686767578125, 0.5151824951171875, 0.553497314453125, 0.5918121337890625, 0.630126953125, 0.6684417724609375, 0.706756591796875, 0.7450714111328125, 0.78338623046875, 0.8217010498046875, 0.860015869140625, 0.8983306884765625, 0.9366455078125, 0.9749603271484375, 1.013275146484375, 1.0515899658203125, 1.08990478515625, 1.1282196044921875, 1.166534423828125, 1.2048492431640625, 1.2431640625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 7.0, 2.0, 5.0, 8.0, 7.0, 20.0, 46.0, 83.0, 159.0, 361.0, 994.0, 3343.0, 16368.0, 139754.0, 746581.0, 121339.0, 14849.0, 3066.0, 925.0, 346.0, 138.0, 72.0, 30.0, 24.0, 11.0, 5.0, 5.0, 10.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94091796875, -0.9053726196289062, -0.8698272705078125, -0.8342819213867188, -0.798736572265625, -0.7631912231445312, -0.7276458740234375, -0.6921005249023438, -0.65655517578125, -0.6210098266601562, -0.5854644775390625, -0.5499191284179688, -0.514373779296875, -0.47882843017578125, -0.4432830810546875, -0.40773773193359375, -0.3721923828125, -0.33664703369140625, -0.3011016845703125, -0.26555633544921875, -0.230010986328125, -0.19446563720703125, -0.1589202880859375, -0.12337493896484375, -0.08782958984375, -0.05228424072265625, -0.0167388916015625, 0.01880645751953125, 0.054351806640625, 0.08989715576171875, 0.1254425048828125, 0.16098785400390625, 0.196533203125, 0.23207855224609375, 0.2676239013671875, 0.30316925048828125, 0.338714599609375, 0.37425994873046875, 0.4098052978515625, 0.44535064697265625, 0.48089599609375, 0.5164413452148438, 0.5519866943359375, 0.5875320434570312, 0.623077392578125, 0.6586227416992188, 0.6941680908203125, 0.7297134399414062, 0.7652587890625, 0.8008041381835938, 0.8363494873046875, 0.8718948364257812, 0.907440185546875, 0.9429855346679688, 0.9785308837890625, 1.0140762329101562, 1.04962158203125, 1.0851669311523438, 1.1207122802734375, 1.1562576293945312, 1.191802978515625, 1.2273483276367188, 1.2628936767578125, 1.2984390258789062, 1.333984375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 6.0, 10.0, 4.0, 9.0, 13.0, 21.0, 28.0, 34.0, 31.0, 49.0, 65.0, 107.0, 123.0, 129.0, 83.0, 57.0, 50.0, 40.0, 26.0, 30.0, 21.0, 13.0, 9.0, 12.0, 9.0, 8.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001538991928100586, -0.00015006586909294128, -0.00014623254537582397, -0.00014239922165870667, -0.00013856589794158936, -0.00013473257422447205, -0.00013089925050735474, -0.00012706592679023743, -0.00012323260307312012, -0.00011939927935600281, -0.0001155659556388855, -0.00011173263192176819, -0.00010789930820465088, -0.00010406598448753357, -0.00010023266077041626, -9.639933705329895e-05, -9.256601333618164e-05, -8.873268961906433e-05, -8.489936590194702e-05, -8.106604218482971e-05, -7.72327184677124e-05, -7.339939475059509e-05, -6.956607103347778e-05, -6.573274731636047e-05, -6.189942359924316e-05, -5.8066099882125854e-05, -5.4232776165008545e-05, -5.0399452447891235e-05, -4.6566128730773926e-05, -4.2732805013656616e-05, -3.889948129653931e-05, -3.5066157579422e-05, -3.123283386230469e-05, -2.7399510145187378e-05, -2.356618642807007e-05, -1.973286271095276e-05, -1.589953899383545e-05, -1.206621527671814e-05, -8.23289155960083e-06, -4.3995678424835205e-06, -5.662441253662109e-07, 3.2670795917510986e-06, 7.100403308868408e-06, 1.0933727025985718e-05, 1.4767050743103027e-05, 1.8600374460220337e-05, 2.2433698177337646e-05, 2.6267021894454956e-05, 3.0100345611572266e-05, 3.3933669328689575e-05, 3.7766993045806885e-05, 4.1600316762924194e-05, 4.5433640480041504e-05, 4.9266964197158813e-05, 5.310028791427612e-05, 5.693361163139343e-05, 6.076693534851074e-05, 6.460025906562805e-05, 6.843358278274536e-05, 7.226690649986267e-05, 7.610023021697998e-05, 7.993355393409729e-05, 8.37668776512146e-05, 8.760020136833191e-05, 9.143352508544922e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 1.0, 2.0, 4.0, 7.0, 7.0, 10.0, 13.0, 18.0, 23.0, 32.0, 61.0, 80.0, 113.0, 219.0, 416.0, 897.0, 2098.0, 7064.0, 33996.0, 274548.0, 640973.0, 70701.0, 11594.0, 3133.0, 1265.0, 576.0, 289.0, 143.0, 90.0, 49.0, 45.0, 16.0, 20.0, 14.0, 9.0, 10.0, 6.0, 0.0, 1.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.14453125, -1.1078338623046875, -1.071136474609375, -1.0344390869140625, -0.99774169921875, -0.9610443115234375, -0.924346923828125, -0.8876495361328125, -0.8509521484375, -0.8142547607421875, -0.777557373046875, -0.7408599853515625, -0.70416259765625, -0.6674652099609375, -0.630767822265625, -0.5940704345703125, -0.557373046875, -0.5206756591796875, -0.483978271484375, -0.4472808837890625, -0.41058349609375, -0.3738861083984375, -0.337188720703125, -0.3004913330078125, -0.2637939453125, -0.2270965576171875, -0.190399169921875, -0.1537017822265625, -0.11700439453125, -0.0803070068359375, -0.043609619140625, -0.0069122314453125, 0.02978515625, 0.0664825439453125, 0.103179931640625, 0.1398773193359375, 0.17657470703125, 0.2132720947265625, 0.249969482421875, 0.2866668701171875, 0.3233642578125, 0.3600616455078125, 0.396759033203125, 0.4334564208984375, 0.47015380859375, 0.5068511962890625, 0.543548583984375, 0.5802459716796875, 0.616943359375, 0.6536407470703125, 0.690338134765625, 0.7270355224609375, 0.76373291015625, 0.8004302978515625, 0.837127685546875, 0.8738250732421875, 0.9105224609375, 0.9472198486328125, 0.983917236328125, 1.0206146240234375, 1.05731201171875, 1.0940093994140625, 1.130706787109375, 1.1674041748046875, 1.2041015625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 4.0, 9.0, 7.0, 12.0, 13.0, 27.0, 26.0, 29.0, 41.0, 41.0, 60.0, 87.0, 112.0, 127.0, 89.0, 77.0, 57.0, 38.0, 27.0, 32.0, 26.0, 8.0, 8.0, 12.0, 5.0, 8.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.59130859375, -0.5694503784179688, -0.5475921630859375, -0.5257339477539062, -0.503875732421875, -0.48201751708984375, -0.4601593017578125, -0.43830108642578125, -0.41644287109375, -0.39458465576171875, -0.3727264404296875, -0.35086822509765625, -0.329010009765625, -0.30715179443359375, -0.2852935791015625, -0.26343536376953125, -0.2415771484375, -0.21971893310546875, -0.1978607177734375, -0.17600250244140625, -0.154144287109375, -0.13228607177734375, -0.1104278564453125, -0.08856964111328125, -0.06671142578125, -0.04485321044921875, -0.0229949951171875, -0.00113677978515625, 0.020721435546875, 0.04257965087890625, 0.0644378662109375, 0.08629608154296875, 0.108154296875, 0.13001251220703125, 0.1518707275390625, 0.17372894287109375, 0.195587158203125, 0.21744537353515625, 0.2393035888671875, 0.26116180419921875, 0.28302001953125, 0.30487823486328125, 0.3267364501953125, 0.34859466552734375, 0.370452880859375, 0.39231109619140625, 0.4141693115234375, 0.43602752685546875, 0.4578857421875, 0.47974395751953125, 0.5016021728515625, 0.5234603881835938, 0.545318603515625, 0.5671768188476562, 0.5890350341796875, 0.6108932495117188, 0.63275146484375, 0.6546096801757812, 0.6764678955078125, 0.6983261108398438, 0.720184326171875, 0.7420425415039062, 0.7639007568359375, 0.7857589721679688, 0.8076171875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 11.0, 29.0, 47.0, 130.0, 272.0, 248.0, 138.0, 66.0, 35.0, 10.0, 6.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.89056968688965, -17.44415855407715, -16.99774742126465, -16.55133628845215, -16.10492515563965, -15.658514022827148, -15.212103843688965, -14.765692710876465, -14.319281578063965, -13.872870445251465, -13.426459312438965, -12.980048179626465, -12.533638000488281, -12.087226867675781, -11.640815734863281, -11.194404602050781, -10.747993469238281, -10.301582336425781, -9.855171203613281, -9.408760070800781, -8.962348937988281, -8.515937805175781, -8.069527626037598, -7.623116493225098, -7.176705360412598, -6.730294227600098, -6.283883094787598, -5.837472438812256, -5.391061305999756, -4.944650173187256, -4.498239517211914, -4.051828384399414, -3.6054182052612305, -3.1590070724487305, -2.7125961780548096, -2.2661852836608887, -1.8197741508483887, -1.3733630180358887, -0.9269521236419678, -0.4805412292480469, -0.034130096435546875, 0.4122809171676636, 0.858691930770874, 1.3051029443740845, 1.751513957977295, 2.197925090789795, 2.644335985183716, 3.0907468795776367, 3.5371580123901367, 3.9835691452026367, 4.429980278015137, 4.8763909339904785, 5.3228020668029785, 5.7692131996154785, 6.21562385559082, 6.66203498840332, 7.10844612121582, 7.55485725402832, 8.00126838684082, 8.44767951965332, 8.89409065246582, 9.34050178527832, 9.786911964416504, 10.233323097229004, 10.679734230041504]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 4.0, 1.0, 10.0, 10.0, 6.0, 5.0, 13.0, 14.0, 21.0, 19.0, 26.0, 26.0, 39.0, 32.0, 31.0, 41.0, 48.0, 44.0, 58.0, 55.0, 56.0, 47.0, 43.0, 46.0, 39.0, 48.0, 28.0, 33.0, 28.0, 18.0, 25.0, 18.0, 10.0, 15.0, 14.0, 6.0, 9.0, 1.0, 3.0, 3.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.042398452758789, -7.792926788330078, -7.543455123901367, -7.293983459472656, -7.044511795043945, -6.795040130615234, -6.545568466186523, -6.2960968017578125, -6.046625137329102, -5.797153472900391, -5.54768180847168, -5.298210144042969, -5.048738479614258, -4.799266815185547, -4.549795150756836, -4.300323486328125, -4.050852298736572, -3.8013806343078613, -3.5519089698791504, -3.3024373054504395, -3.0529656410217285, -2.8034939765930176, -2.5540225505828857, -2.304550886154175, -2.055079221725464, -1.805607557296753, -1.556135892868042, -1.3066643476486206, -1.0571926832199097, -0.8077210187911987, -0.5582494735717773, -0.3087778091430664, -0.059305667877197266, 0.19016596674919128, 0.43963760137557983, 0.689109206199646, 0.9385808706283569, 1.1880525350570679, 1.4375240802764893, 1.6869957447052002, 1.9364674091339111, 2.185939073562622, 2.435410737991333, 2.684882164001465, 2.934353828430176, 3.1838254928588867, 3.4332971572875977, 3.6827688217163086, 3.9322404861450195, 4.1817121505737305, 4.431183815002441, 4.680655479431152, 4.930127143859863, 5.179598808288574, 5.429070472717285, 5.678542137145996, 5.928013801574707, 6.177485466003418, 6.426957130432129, 6.67642879486084, 6.925900459289551, 7.175372123718262, 7.424843788146973, 7.674315452575684, 7.923786640167236]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 5.0, 6.0, 10.0, 8.0, 16.0, 21.0, 25.0, 48.0, 67.0, 101.0, 205.0, 301.0, 554.0, 1089.0, 2651.0, 9022.0, 57037.0, 3793104.0, 302674.0, 19236.0, 4448.0, 1707.0, 791.0, 461.0, 239.0, 148.0, 80.0, 60.0, 36.0, 30.0, 27.0, 16.0, 9.0, 6.0, 7.0, 6.0, 5.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-2.517578125, -2.435699462890625, -2.35382080078125, -2.271942138671875, -2.1900634765625, -2.108184814453125, -2.02630615234375, -1.944427490234375, -1.862548828125, -1.780670166015625, -1.69879150390625, -1.616912841796875, -1.5350341796875, -1.453155517578125, -1.37127685546875, -1.289398193359375, -1.20751953125, -1.125640869140625, -1.04376220703125, -0.961883544921875, -0.8800048828125, -0.798126220703125, -0.71624755859375, -0.634368896484375, -0.552490234375, -0.470611572265625, -0.38873291015625, -0.306854248046875, -0.2249755859375, -0.143096923828125, -0.06121826171875, 0.020660400390625, 0.1025390625, 0.184417724609375, 0.26629638671875, 0.348175048828125, 0.4300537109375, 0.511932373046875, 0.59381103515625, 0.675689697265625, 0.757568359375, 0.839447021484375, 0.92132568359375, 1.003204345703125, 1.0850830078125, 1.166961669921875, 1.24884033203125, 1.330718994140625, 1.41259765625, 1.494476318359375, 1.57635498046875, 1.658233642578125, 1.7401123046875, 1.821990966796875, 1.90386962890625, 1.985748291015625, 2.067626953125, 2.149505615234375, 2.23138427734375, 2.313262939453125, 2.3951416015625, 2.477020263671875, 2.55889892578125, 2.640777587890625, 2.72265625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 8.0, 11.0, 22.0, 32.0, 32.0, 46.0, 83.0, 93.0, 109.0, 109.0, 109.0, 92.0, 81.0, 55.0, 37.0, 31.0, 20.0, 8.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.430419921875, -0.41628265380859375, -0.4021453857421875, -0.38800811767578125, -0.373870849609375, -0.35973358154296875, -0.3455963134765625, -0.33145904541015625, -0.31732177734375, -0.30318450927734375, -0.2890472412109375, -0.27490997314453125, -0.260772705078125, -0.24663543701171875, -0.2324981689453125, -0.21836090087890625, -0.2042236328125, -0.19008636474609375, -0.1759490966796875, -0.16181182861328125, -0.147674560546875, -0.13353729248046875, -0.1194000244140625, -0.10526275634765625, -0.09112548828125, -0.07698822021484375, -0.0628509521484375, -0.04871368408203125, -0.034576416015625, -0.02043914794921875, -0.0063018798828125, 0.00783538818359375, 0.02197265625, 0.03610992431640625, 0.0502471923828125, 0.06438446044921875, 0.078521728515625, 0.09265899658203125, 0.1067962646484375, 0.12093353271484375, 0.13507080078125, 0.14920806884765625, 0.1633453369140625, 0.17748260498046875, 0.191619873046875, 0.20575714111328125, 0.2198944091796875, 0.23403167724609375, 0.2481689453125, 0.26230621337890625, 0.2764434814453125, 0.29058074951171875, 0.304718017578125, 0.31885528564453125, 0.3329925537109375, 0.34712982177734375, 0.36126708984375, 0.37540435791015625, 0.3895416259765625, 0.40367889404296875, 0.417816162109375, 0.43195343017578125, 0.4460906982421875, 0.46022796630859375, 0.474365234375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 6.0, 8.0, 15.0, 32.0, 66.0, 181.0, 684.0, 3865.0, 93815.0, 4060871.0, 31361.0, 2493.0, 524.0, 181.0, 77.0, 51.0, 32.0, 12.0, 6.0, 6.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.19921875, -1.0836181640625, -0.968017578125, -0.8524169921875, -0.73681640625, -0.6212158203125, -0.505615234375, -0.3900146484375, -0.2744140625, -0.1588134765625, -0.043212890625, 0.0723876953125, 0.18798828125, 0.3035888671875, 0.419189453125, 0.5347900390625, 0.650390625, 0.7659912109375, 0.881591796875, 0.9971923828125, 1.11279296875, 1.2283935546875, 1.343994140625, 1.4595947265625, 1.5751953125, 1.6907958984375, 1.806396484375, 1.9219970703125, 2.03759765625, 2.1531982421875, 2.268798828125, 2.3843994140625, 2.5, 2.6156005859375, 2.731201171875, 2.8468017578125, 2.96240234375, 3.0780029296875, 3.193603515625, 3.3092041015625, 3.4248046875, 3.5404052734375, 3.656005859375, 3.7716064453125, 3.88720703125, 4.0028076171875, 4.118408203125, 4.2340087890625, 4.349609375, 4.4652099609375, 4.580810546875, 4.6964111328125, 4.81201171875, 4.9276123046875, 5.043212890625, 5.1588134765625, 5.2744140625, 5.3900146484375, 5.505615234375, 5.6212158203125, 5.73681640625, 5.8524169921875, 5.968017578125, 6.0836181640625, 6.19921875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 11.0, 8.0, 15.0, 17.0, 33.0, 47.0, 98.0, 188.0, 638.0, 1861.0, 680.0, 235.0, 99.0, 63.0, 26.0, 16.0, 10.0, 7.0, 13.0, 4.0, 0.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.440673828125, -0.4219398498535156, -0.40320587158203125, -0.3844718933105469, -0.3657379150390625, -0.3470039367675781, -0.32826995849609375, -0.3095359802246094, -0.290802001953125, -0.2720680236816406, -0.25333404541015625, -0.23460006713867188, -0.2158660888671875, -0.19713211059570312, -0.17839813232421875, -0.15966415405273438, -0.14093017578125, -0.12219619750976562, -0.10346221923828125, -0.08472824096679688, -0.0659942626953125, -0.047260284423828125, -0.02852630615234375, -0.009792327880859375, 0.008941650390625, 0.027675628662109375, 0.04640960693359375, 0.06514358520507812, 0.0838775634765625, 0.10261154174804688, 0.12134552001953125, 0.14007949829101562, 0.1588134765625, 0.17754745483398438, 0.19628143310546875, 0.21501541137695312, 0.2337493896484375, 0.2524833679199219, 0.27121734619140625, 0.2899513244628906, 0.308685302734375, 0.3274192810058594, 0.34615325927734375, 0.3648872375488281, 0.3836212158203125, 0.4023551940917969, 0.42108917236328125, 0.4398231506347656, 0.45855712890625, 0.4772911071777344, 0.49602508544921875, 0.5147590637207031, 0.5334930419921875, 0.5522270202636719, 0.5709609985351562, 0.5896949768066406, 0.608428955078125, 0.6271629333496094, 0.6458969116210938, 0.6646308898925781, 0.6833648681640625, 0.7020988464355469, 0.7208328247070312, 0.7395668029785156, 0.75830078125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 5.0, 14.0, 49.0, 129.0, 235.0, 283.0, 171.0, 56.0, 32.0, 11.0, 9.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.410473108291626, -1.2918307781219482, -1.17318856716156, -1.0545463562011719, -0.9359040260314941, -0.8172617554664612, -0.6986194849014282, -0.5799772143363953, -0.4613349437713623, -0.34269267320632935, -0.2240504026412964, -0.10540813207626343, 0.013234138488769531, 0.1318764090538025, 0.25051867961883545, 0.3691609501838684, 0.48780322074890137, 0.6064454913139343, 0.7250877618789673, 0.8437300324440002, 0.9623723030090332, 1.081014633178711, 1.1996568441390991, 1.3182990550994873, 1.436941385269165, 1.5555837154388428, 1.674225926399231, 1.7928681373596191, 1.9115104675292969, 2.0301527976989746, 2.1487951278686523, 2.267437219619751, 2.3860793113708496, 2.5047216415405273, 2.623363971710205, 2.7420060634613037, 2.8606483936309814, 2.979290723800659, 3.097932815551758, 3.2165751457214355, 3.3352174758911133, 3.453859806060791, 3.5725021362304688, 3.6911442279815674, 3.809786558151245, 3.928428888320923, 4.0470709800720215, 4.165713310241699, 4.284355640411377, 4.402997970581055, 4.521640300750732, 4.64028263092041, 4.75892448425293, 4.877566814422607, 4.996209144592285, 5.114851474761963, 5.233493804931641, 5.352136135101318, 5.470778465270996, 5.589420795440674, 5.708063125610352, 5.826704978942871, 5.945347309112549, 6.063989639282227, 6.182631969451904]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 4.0, 9.0, 15.0, 18.0, 19.0, 28.0, 35.0, 51.0, 68.0, 55.0, 60.0, 63.0, 73.0, 67.0, 63.0, 69.0, 64.0, 46.0, 38.0, 34.0, 34.0, 28.0, 19.0, 17.0, 8.0, 1.0, 6.0, 9.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.557455062866211, -2.4830498695373535, -2.408644676208496, -2.3342394828796387, -2.2598342895507812, -2.185429096221924, -2.1110239028930664, -2.036618709564209, -1.9622135162353516, -1.8878083229064941, -1.8134031295776367, -1.7389979362487793, -1.6645927429199219, -1.5901875495910645, -1.515782356262207, -1.4413771629333496, -1.3669719696044922, -1.2925667762756348, -1.2181615829467773, -1.14375638961792, -1.0693511962890625, -0.9949460029602051, -0.9205408096313477, -0.8461356163024902, -0.7717304229736328, -0.6973252296447754, -0.622920036315918, -0.5485148429870605, -0.4741096496582031, -0.3997044563293457, -0.3252992630004883, -0.25089406967163086, -0.17648911476135254, -0.10208392143249512, -0.027678728103637695, 0.04672646522521973, 0.12113165855407715, 0.19553685188293457, 0.269942045211792, 0.3443472385406494, 0.41875243186950684, 0.49315762519836426, 0.5675628185272217, 0.6419680118560791, 0.7163732051849365, 0.790778398513794, 0.8651835918426514, 0.9395887851715088, 1.0139939785003662, 1.0883991718292236, 1.162804365158081, 1.2372095584869385, 1.311614751815796, 1.3860199451446533, 1.4604251384735107, 1.5348303318023682, 1.6092355251312256, 1.683640718460083, 1.7580459117889404, 1.8324511051177979, 1.9068562984466553, 1.9812614917755127, 2.05566668510437, 2.1300718784332275, 2.204477071762085]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 10.0, 9.0, 18.0, 18.0, 36.0, 36.0, 68.0, 98.0, 143.0, 209.0, 294.0, 530.0, 846.0, 1409.0, 2686.0, 6027.0, 16370.0, 55773.0, 234292.0, 485609.0, 177003.0, 42771.0, 13493.0, 5050.0, 2396.0, 1271.0, 735.0, 457.0, 301.0, 179.0, 126.0, 98.0, 60.0, 39.0, 26.0, 13.0, 18.0, 15.0, 11.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.12890625, -1.09295654296875, -1.0570068359375, -1.02105712890625, -0.985107421875, -0.94915771484375, -0.9132080078125, -0.87725830078125, -0.84130859375, -0.80535888671875, -0.7694091796875, -0.73345947265625, -0.697509765625, -0.66156005859375, -0.6256103515625, -0.58966064453125, -0.5537109375, -0.51776123046875, -0.4818115234375, -0.44586181640625, -0.409912109375, -0.37396240234375, -0.3380126953125, -0.30206298828125, -0.26611328125, -0.23016357421875, -0.1942138671875, -0.15826416015625, -0.122314453125, -0.08636474609375, -0.0504150390625, -0.01446533203125, 0.021484375, 0.05743408203125, 0.0933837890625, 0.12933349609375, 0.165283203125, 0.20123291015625, 0.2371826171875, 0.27313232421875, 0.30908203125, 0.34503173828125, 0.3809814453125, 0.41693115234375, 0.452880859375, 0.48883056640625, 0.5247802734375, 0.56072998046875, 0.5966796875, 0.63262939453125, 0.6685791015625, 0.70452880859375, 0.740478515625, 0.77642822265625, 0.8123779296875, 0.84832763671875, 0.88427734375, 0.92022705078125, 0.9561767578125, 0.99212646484375, 1.028076171875, 1.06402587890625, 1.0999755859375, 1.13592529296875, 1.171875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 10.0, 16.0, 21.0, 46.0, 37.0, 73.0, 83.0, 105.0, 104.0, 107.0, 108.0, 92.0, 55.0, 57.0, 30.0, 17.0, 16.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43505859375, -0.4209556579589844, -0.40685272216796875, -0.3927497863769531, -0.3786468505859375, -0.3645439147949219, -0.35044097900390625, -0.3363380432128906, -0.322235107421875, -0.3081321716308594, -0.29402923583984375, -0.2799263000488281, -0.2658233642578125, -0.2517204284667969, -0.23761749267578125, -0.22351455688476562, -0.20941162109375, -0.19530868530273438, -0.18120574951171875, -0.16710281372070312, -0.1529998779296875, -0.13889694213867188, -0.12479400634765625, -0.11069107055664062, -0.096588134765625, -0.08248519897460938, -0.06838226318359375, -0.054279327392578125, -0.0401763916015625, -0.026073455810546875, -0.01197052001953125, 0.002132415771484375, 0.0162353515625, 0.030338287353515625, 0.04444122314453125, 0.058544158935546875, 0.0726470947265625, 0.08675003051757812, 0.10085296630859375, 0.11495590209960938, 0.129058837890625, 0.14316177368164062, 0.15726470947265625, 0.17136764526367188, 0.1854705810546875, 0.19957351684570312, 0.21367645263671875, 0.22777938842773438, 0.24188232421875, 0.2559852600097656, 0.27008819580078125, 0.2841911315917969, 0.2982940673828125, 0.3123970031738281, 0.32649993896484375, 0.3406028747558594, 0.354705810546875, 0.3688087463378906, 0.38291168212890625, 0.3970146179199219, 0.4111175537109375, 0.4252204895019531, 0.43932342529296875, 0.4534263610839844, 0.467529296875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 9.0, 9.0, 8.0, 9.0, 9.0, 20.0, 27.0, 23.0, 52.0, 63.0, 92.0, 135.0, 228.0, 385.0, 673.0, 1580.0, 4152.0, 13276.0, 54912.0, 287273.0, 509057.0, 135799.0, 27907.0, 7846.0, 2613.0, 1046.0, 484.0, 278.0, 177.0, 111.0, 83.0, 59.0, 52.0, 31.0, 16.0, 23.0, 10.0, 11.0, 5.0, 3.0, 2.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0986328125, -1.058349609375, -1.01806640625, -0.977783203125, -0.9375, -0.897216796875, -0.85693359375, -0.816650390625, -0.7763671875, -0.736083984375, -0.69580078125, -0.655517578125, -0.615234375, -0.574951171875, -0.53466796875, -0.494384765625, -0.4541015625, -0.413818359375, -0.37353515625, -0.333251953125, -0.29296875, -0.252685546875, -0.21240234375, -0.172119140625, -0.1318359375, -0.091552734375, -0.05126953125, -0.010986328125, 0.029296875, 0.069580078125, 0.10986328125, 0.150146484375, 0.1904296875, 0.230712890625, 0.27099609375, 0.311279296875, 0.3515625, 0.391845703125, 0.43212890625, 0.472412109375, 0.5126953125, 0.552978515625, 0.59326171875, 0.633544921875, 0.673828125, 0.714111328125, 0.75439453125, 0.794677734375, 0.8349609375, 0.875244140625, 0.91552734375, 0.955810546875, 0.99609375, 1.036376953125, 1.07666015625, 1.116943359375, 1.1572265625, 1.197509765625, 1.23779296875, 1.278076171875, 1.318359375, 1.358642578125, 1.39892578125, 1.439208984375, 1.4794921875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 2.0, 9.0, 17.0, 6.0, 11.0, 15.0, 19.0, 23.0, 34.0, 36.0, 47.0, 49.0, 46.0, 49.0, 47.0, 39.0, 54.0, 46.0, 49.0, 43.0, 58.0, 44.0, 40.0, 24.0, 30.0, 34.0, 32.0, 14.0, 10.0, 17.0, 13.0, 10.0, 9.0, 4.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.04296875, -1.0038909912109375, -0.964813232421875, -0.9257354736328125, -0.88665771484375, -0.8475799560546875, -0.808502197265625, -0.7694244384765625, -0.7303466796875, -0.6912689208984375, -0.652191162109375, -0.6131134033203125, -0.57403564453125, -0.5349578857421875, -0.495880126953125, -0.4568023681640625, -0.417724609375, -0.3786468505859375, -0.339569091796875, -0.3004913330078125, -0.26141357421875, -0.2223358154296875, -0.183258056640625, -0.1441802978515625, -0.1051025390625, -0.0660247802734375, -0.026947021484375, 0.0121307373046875, 0.05120849609375, 0.0902862548828125, 0.129364013671875, 0.1684417724609375, 0.20751953125, 0.2465972900390625, 0.285675048828125, 0.3247528076171875, 0.36383056640625, 0.4029083251953125, 0.441986083984375, 0.4810638427734375, 0.5201416015625, 0.5592193603515625, 0.598297119140625, 0.6373748779296875, 0.67645263671875, 0.7155303955078125, 0.754608154296875, 0.7936859130859375, 0.832763671875, 0.8718414306640625, 0.910919189453125, 0.9499969482421875, 0.98907470703125, 1.0281524658203125, 1.067230224609375, 1.1063079833984375, 1.1453857421875, 1.1844635009765625, 1.223541259765625, 1.2626190185546875, 1.30169677734375, 1.3407745361328125, 1.379852294921875, 1.4189300537109375, 1.4580078125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 9.0, 7.0, 8.0, 14.0, 18.0, 17.0, 40.0, 73.0, 114.0, 163.0, 299.0, 642.0, 1274.0, 2968.0, 8011.0, 25693.0, 103606.0, 406266.0, 372320.0, 90920.0, 23366.0, 7381.0, 2766.0, 1205.0, 605.0, 325.0, 156.0, 95.0, 66.0, 42.0, 22.0, 21.0, 17.0, 10.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3642578125, -0.3535308837890625, -0.342803955078125, -0.3320770263671875, -0.32135009765625, -0.3106231689453125, -0.299896240234375, -0.2891693115234375, -0.2784423828125, -0.2677154541015625, -0.256988525390625, -0.2462615966796875, -0.23553466796875, -0.2248077392578125, -0.214080810546875, -0.2033538818359375, -0.192626953125, -0.1819000244140625, -0.171173095703125, -0.1604461669921875, -0.14971923828125, -0.1389923095703125, -0.128265380859375, -0.1175384521484375, -0.1068115234375, -0.0960845947265625, -0.085357666015625, -0.0746307373046875, -0.06390380859375, -0.0531768798828125, -0.042449951171875, -0.0317230224609375, -0.02099609375, -0.0102691650390625, 0.000457763671875, 0.0111846923828125, 0.02191162109375, 0.0326385498046875, 0.043365478515625, 0.0540924072265625, 0.0648193359375, 0.0755462646484375, 0.086273193359375, 0.0970001220703125, 0.10772705078125, 0.1184539794921875, 0.129180908203125, 0.1399078369140625, 0.150634765625, 0.1613616943359375, 0.172088623046875, 0.1828155517578125, 0.19354248046875, 0.2042694091796875, 0.214996337890625, 0.2257232666015625, 0.2364501953125, 0.2471771240234375, 0.257904052734375, 0.2686309814453125, 0.27935791015625, 0.2900848388671875, 0.300811767578125, 0.3115386962890625, 0.322265625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 6.0, 4.0, 2.0, 14.0, 12.0, 18.0, 17.0, 19.0, 25.0, 41.0, 53.0, 57.0, 70.0, 94.0, 93.0, 92.0, 74.0, 70.0, 41.0, 50.0, 31.0, 24.0, 26.0, 15.0, 13.0, 6.0, 3.0, 6.0, 9.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.802248001098633e-05, -7.499847561120987e-05, -7.197447121143341e-05, -6.895046681165695e-05, -6.592646241188049e-05, -6.290245801210403e-05, -5.9878453612327576e-05, -5.685444921255112e-05, -5.383044481277466e-05, -5.08064404129982e-05, -4.778243601322174e-05, -4.475843161344528e-05, -4.173442721366882e-05, -3.8710422813892365e-05, -3.5686418414115906e-05, -3.266241401433945e-05, -2.9638409614562988e-05, -2.661440521478653e-05, -2.359040081501007e-05, -2.0566396415233612e-05, -1.7542392015457153e-05, -1.4518387615680695e-05, -1.1494383215904236e-05, -8.470378816127777e-06, -5.446374416351318e-06, -2.4223700165748596e-06, 6.016343832015991e-07, 3.625638782978058e-06, 6.649643182754517e-06, 9.673647582530975e-06, 1.2697651982307434e-05, 1.5721656382083893e-05, 1.874566078186035e-05, 2.176966518163681e-05, 2.479366958141327e-05, 2.7817673981189728e-05, 3.0841678380966187e-05, 3.3865682780742645e-05, 3.6889687180519104e-05, 3.991369158029556e-05, 4.293769598007202e-05, 4.596170037984848e-05, 4.898570477962494e-05, 5.20097091794014e-05, 5.5033713579177856e-05, 5.8057717978954315e-05, 6.108172237873077e-05, 6.410572677850723e-05, 6.712973117828369e-05, 7.015373557806015e-05, 7.317773997783661e-05, 7.620174437761307e-05, 7.922574877738953e-05, 8.224975317716599e-05, 8.527375757694244e-05, 8.82977619767189e-05, 9.132176637649536e-05, 9.434577077627182e-05, 9.736977517604828e-05, 0.00010039377957582474, 0.0001034177839756012, 0.00010644178837537766, 0.00010946579277515411, 0.00011248979717493057, 0.00011551380157470703]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 12.0, 9.0, 17.0, 17.0, 23.0, 40.0, 67.0, 77.0, 106.0, 168.0, 281.0, 438.0, 860.0, 1588.0, 3563.0, 8418.0, 25222.0, 84554.0, 334477.0, 423749.0, 113941.0, 31938.0, 10626.0, 4135.0, 1893.0, 900.0, 520.0, 312.0, 174.0, 111.0, 84.0, 57.0, 38.0, 31.0, 26.0, 28.0, 18.0, 11.0, 7.0, 5.0, 1.0, 2.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.295654296875, -0.2847480773925781, -0.27384185791015625, -0.2629356384277344, -0.2520294189453125, -0.24112319946289062, -0.23021697998046875, -0.21931076049804688, -0.208404541015625, -0.19749832153320312, -0.18659210205078125, -0.17568588256835938, -0.1647796630859375, -0.15387344360351562, -0.14296722412109375, -0.13206100463867188, -0.12115478515625, -0.11024856567382812, -0.09934234619140625, -0.08843612670898438, -0.0775299072265625, -0.06662368774414062, -0.05571746826171875, -0.044811248779296875, -0.033905029296875, -0.022998809814453125, -0.01209259033203125, -0.001186370849609375, 0.0097198486328125, 0.020626068115234375, 0.03153228759765625, 0.042438507080078125, 0.0533447265625, 0.06425094604492188, 0.07515716552734375, 0.08606338500976562, 0.0969696044921875, 0.10787582397460938, 0.11878204345703125, 0.12968826293945312, 0.140594482421875, 0.15150070190429688, 0.16240692138671875, 0.17331314086914062, 0.1842193603515625, 0.19512557983398438, 0.20603179931640625, 0.21693801879882812, 0.22784423828125, 0.23875045776367188, 0.24965667724609375, 0.2605628967285156, 0.2714691162109375, 0.2823753356933594, 0.29328155517578125, 0.3041877746582031, 0.315093994140625, 0.3260002136230469, 0.33690643310546875, 0.3478126525878906, 0.3587188720703125, 0.3696250915527344, 0.38053131103515625, 0.3914375305175781, 0.40234375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 9.0, 5.0, 10.0, 12.0, 7.0, 10.0, 11.0, 19.0, 29.0, 35.0, 36.0, 51.0, 70.0, 66.0, 69.0, 77.0, 64.0, 67.0, 66.0, 51.0, 43.0, 41.0, 28.0, 37.0, 14.0, 12.0, 14.0, 7.0, 11.0, 7.0, 4.0, 4.0, 7.0, 1.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.264892578125, -0.25504302978515625, -0.2451934814453125, -0.23534393310546875, -0.225494384765625, -0.21564483642578125, -0.2057952880859375, -0.19594573974609375, -0.18609619140625, -0.17624664306640625, -0.1663970947265625, -0.15654754638671875, -0.146697998046875, -0.13684844970703125, -0.1269989013671875, -0.11714935302734375, -0.1072998046875, -0.09745025634765625, -0.0876007080078125, -0.07775115966796875, -0.067901611328125, -0.05805206298828125, -0.0482025146484375, -0.03835296630859375, -0.02850341796875, -0.01865386962890625, -0.0088043212890625, 0.00104522705078125, 0.010894775390625, 0.02074432373046875, 0.0305938720703125, 0.04044342041015625, 0.05029296875, 0.06014251708984375, 0.0699920654296875, 0.07984161376953125, 0.089691162109375, 0.09954071044921875, 0.1093902587890625, 0.11923980712890625, 0.12908935546875, 0.13893890380859375, 0.1487884521484375, 0.15863800048828125, 0.168487548828125, 0.17833709716796875, 0.1881866455078125, 0.19803619384765625, 0.2078857421875, 0.21773529052734375, 0.2275848388671875, 0.23743438720703125, 0.247283935546875, 0.25713348388671875, 0.2669830322265625, 0.27683258056640625, 0.28668212890625, 0.29653167724609375, 0.3063812255859375, 0.31623077392578125, 0.326080322265625, 0.33592987060546875, 0.3457794189453125, 0.35562896728515625, 0.365478515625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 8.0, 13.0, 28.0, 57.0, 112.0, 250.0, 258.0, 146.0, 76.0, 25.0, 15.0, 12.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.310193061828613, -3.9585907459259033, -3.6069884300231934, -3.2553858757019043, -2.9037835597991943, -2.5521812438964844, -2.2005786895751953, -1.8489763736724854, -1.4973740577697754, -1.1457717418670654, -0.7941693067550659, -0.4425668716430664, -0.09096455574035645, 0.2606377601623535, 0.6122403144836426, 0.9638426303863525, 1.3154449462890625, 1.6670472621917725, 2.0186495780944824, 2.3702521324157715, 2.7218544483184814, 3.0734567642211914, 3.4250593185424805, 3.7766616344451904, 4.1282639503479, 4.4798665046691895, 4.83146858215332, 5.183071136474609, 5.534673690795898, 5.886275768280029, 6.237878322601318, 6.589480400085449, 6.941083908081055, 7.292686462402344, 7.644288539886475, 7.995891094207764, 8.347493171691895, 8.699095726013184, 9.050698280334473, 9.402300834655762, 9.753902435302734, 10.105504989624023, 10.457107543945312, 10.808710098266602, 11.160311698913574, 11.511914253234863, 11.863516807556152, 12.215119361877441, 12.56672191619873, 12.91832447052002, 13.269927024841309, 13.621528625488281, 13.97313117980957, 14.32473373413086, 14.676336288452148, 15.027938842773438, 15.379541397094727, 15.731143951416016, 16.082746505737305, 16.434349060058594, 16.785951614379883, 17.137554168701172, 17.489154815673828, 17.840757369995117, 18.192359924316406]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 6.0, 2.0, 4.0, 5.0, 8.0, 11.0, 9.0, 16.0, 12.0, 20.0, 27.0, 21.0, 29.0, 23.0, 26.0, 32.0, 36.0, 32.0, 25.0, 28.0, 42.0, 42.0, 44.0, 37.0, 45.0, 40.0, 30.0, 19.0, 35.0, 35.0, 31.0, 34.0, 22.0, 23.0, 22.0, 15.0, 10.0, 21.0, 14.0, 16.0, 6.0, 14.0, 6.0, 5.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.604959964752197, -5.434990882873535, -5.265021800994873, -5.095052719116211, -4.925084114074707, -4.755115032196045, -4.585145950317383, -4.415176868438721, -4.245207786560059, -4.0752387046813965, -3.9052698612213135, -3.7353007793426514, -3.5653319358825684, -3.3953628540039062, -3.225393772125244, -3.055424690246582, -2.885456085205078, -2.715487003326416, -2.545518159866333, -2.375549077987671, -2.205580234527588, -2.035611152648926, -1.8656420707702637, -1.6956731081008911, -1.5257041454315186, -1.355735182762146, -1.1857662200927734, -1.0157971382141113, -0.8458281755447388, -0.6758592128753662, -0.5058901309967041, -0.33592116832733154, -0.1659526824951172, 0.004016309976577759, 0.1739853024482727, 0.34395432472229004, 0.5139232873916626, 0.6838922500610352, 0.8538613319396973, 1.0238302946090698, 1.1937992572784424, 1.363768219947815, 1.5337371826171875, 1.7037062644958496, 1.8736752271652222, 2.0436441898345947, 2.213613271713257, 2.38358211517334, 2.553551197052002, 2.723520278930664, 2.893489122390747, 3.063458204269409, 3.233427047729492, 3.4033961296081543, 3.5733652114868164, 3.7433342933654785, 3.9133031368255615, 4.0832719802856445, 4.253241062164307, 4.423210144042969, 4.593179225921631, 4.763148307800293, 4.933116912841797, 5.103085994720459, 5.273055076599121]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 6.0, 10.0, 17.0, 25.0, 28.0, 40.0, 72.0, 133.0, 191.0, 395.0, 764.0, 1814.0, 4934.0, 20093.0, 239054.0, 3835057.0, 73947.0, 11386.0, 3454.0, 1352.0, 606.0, 367.0, 191.0, 102.0, 77.0, 52.0, 28.0, 32.0, 9.0, 14.0, 12.0, 5.0, 3.0, 2.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7705078125, -1.7139739990234375, -1.657440185546875, -1.6009063720703125, -1.54437255859375, -1.4878387451171875, -1.431304931640625, -1.3747711181640625, -1.3182373046875, -1.2617034912109375, -1.205169677734375, -1.1486358642578125, -1.09210205078125, -1.0355682373046875, -0.979034423828125, -0.9225006103515625, -0.865966796875, -0.8094329833984375, -0.752899169921875, -0.6963653564453125, -0.63983154296875, -0.5832977294921875, -0.526763916015625, -0.4702301025390625, -0.4136962890625, -0.3571624755859375, -0.300628662109375, -0.2440948486328125, -0.18756103515625, -0.1310272216796875, -0.074493408203125, -0.0179595947265625, 0.03857421875, 0.0951080322265625, 0.151641845703125, 0.2081756591796875, 0.26470947265625, 0.3212432861328125, 0.377777099609375, 0.4343109130859375, 0.4908447265625, 0.5473785400390625, 0.603912353515625, 0.6604461669921875, 0.71697998046875, 0.7735137939453125, 0.830047607421875, 0.8865814208984375, 0.943115234375, 0.9996490478515625, 1.056182861328125, 1.1127166748046875, 1.16925048828125, 1.2257843017578125, 1.282318115234375, 1.3388519287109375, 1.3953857421875, 1.4519195556640625, 1.508453369140625, 1.5649871826171875, 1.62152099609375, 1.6780548095703125, 1.734588623046875, 1.7911224365234375, 1.84765625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 6.0, 4.0, 19.0, 20.0, 33.0, 42.0, 68.0, 88.0, 105.0, 118.0, 88.0, 105.0, 99.0, 76.0, 35.0, 34.0, 25.0, 10.0, 9.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47314453125, -0.4579010009765625, -0.442657470703125, -0.4274139404296875, -0.41217041015625, -0.3969268798828125, -0.381683349609375, -0.3664398193359375, -0.3511962890625, -0.3359527587890625, -0.320709228515625, -0.3054656982421875, -0.29022216796875, -0.2749786376953125, -0.259735107421875, -0.2444915771484375, -0.229248046875, -0.2140045166015625, -0.198760986328125, -0.1835174560546875, -0.16827392578125, -0.1530303955078125, -0.137786865234375, -0.1225433349609375, -0.1072998046875, -0.0920562744140625, -0.076812744140625, -0.0615692138671875, -0.04632568359375, -0.0310821533203125, -0.015838623046875, -0.0005950927734375, 0.0146484375, 0.0298919677734375, 0.045135498046875, 0.0603790283203125, 0.07562255859375, 0.0908660888671875, 0.106109619140625, 0.1213531494140625, 0.1365966796875, 0.1518402099609375, 0.167083740234375, 0.1823272705078125, 0.19757080078125, 0.2128143310546875, 0.228057861328125, 0.2433013916015625, 0.258544921875, 0.2737884521484375, 0.289031982421875, 0.3042755126953125, 0.31951904296875, 0.3347625732421875, 0.350006103515625, 0.3652496337890625, 0.3804931640625, 0.3957366943359375, 0.410980224609375, 0.4262237548828125, 0.44146728515625, 0.4567108154296875, 0.471954345703125, 0.4871978759765625, 0.50244140625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 7.0, 6.0, 8.0, 27.0, 66.0, 137.0, 293.0, 649.0, 1672.0, 6314.0, 52186.0, 3474649.0, 631192.0, 21689.0, 3518.0, 1085.0, 406.0, 207.0, 92.0, 44.0, 25.0, 8.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3779296875, -1.3284149169921875, -1.278900146484375, -1.2293853759765625, -1.17987060546875, -1.1303558349609375, -1.080841064453125, -1.0313262939453125, -0.9818115234375, -0.9322967529296875, -0.882781982421875, -0.8332672119140625, -0.78375244140625, -0.7342376708984375, -0.684722900390625, -0.6352081298828125, -0.585693359375, -0.5361785888671875, -0.486663818359375, -0.4371490478515625, -0.38763427734375, -0.3381195068359375, -0.288604736328125, -0.2390899658203125, -0.1895751953125, -0.1400604248046875, -0.090545654296875, -0.0410308837890625, 0.00848388671875, 0.0579986572265625, 0.107513427734375, 0.1570281982421875, 0.20654296875, 0.2560577392578125, 0.305572509765625, 0.3550872802734375, 0.40460205078125, 0.4541168212890625, 0.503631591796875, 0.5531463623046875, 0.6026611328125, 0.6521759033203125, 0.701690673828125, 0.7512054443359375, 0.80072021484375, 0.8502349853515625, 0.899749755859375, 0.9492645263671875, 0.998779296875, 1.0482940673828125, 1.097808837890625, 1.1473236083984375, 1.19683837890625, 1.2463531494140625, 1.295867919921875, 1.3453826904296875, 1.3948974609375, 1.4444122314453125, 1.493927001953125, 1.5434417724609375, 1.59295654296875, 1.6424713134765625, 1.691986083984375, 1.7415008544921875, 1.791015625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 7.0, 13.0, 9.0, 20.0, 25.0, 54.0, 88.0, 153.0, 290.0, 672.0, 1576.0, 584.0, 250.0, 125.0, 71.0, 40.0, 28.0, 16.0, 16.0, 10.0, 8.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.359619140625, -0.3485374450683594, -0.33745574951171875, -0.3263740539550781, -0.3152923583984375, -0.3042106628417969, -0.29312896728515625, -0.2820472717285156, -0.270965576171875, -0.2598838806152344, -0.24880218505859375, -0.23772048950195312, -0.2266387939453125, -0.21555709838867188, -0.20447540283203125, -0.19339370727539062, -0.18231201171875, -0.17123031616210938, -0.16014862060546875, -0.14906692504882812, -0.1379852294921875, -0.12690353393554688, -0.11582183837890625, -0.10474014282226562, -0.093658447265625, -0.08257675170898438, -0.07149505615234375, -0.060413360595703125, -0.0493316650390625, -0.038249969482421875, -0.02716827392578125, -0.016086578369140625, -0.0050048828125, 0.006076812744140625, 0.01715850830078125, 0.028240203857421875, 0.0393218994140625, 0.050403594970703125, 0.06148529052734375, 0.07256698608398438, 0.083648681640625, 0.09473037719726562, 0.10581207275390625, 0.11689376831054688, 0.1279754638671875, 0.13905715942382812, 0.15013885498046875, 0.16122055053710938, 0.17230224609375, 0.18338394165039062, 0.19446563720703125, 0.20554733276367188, 0.2166290283203125, 0.22771072387695312, 0.23879241943359375, 0.24987411499023438, 0.260955810546875, 0.2720375061035156, 0.28311920166015625, 0.2942008972167969, 0.3052825927734375, 0.3163642883300781, 0.32744598388671875, 0.3385276794433594, 0.349609375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 16.0, 61.0, 246.0, 417.0, 192.0, 54.0, 14.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.766304969787598, -6.632399082183838, -6.498493671417236, -6.364587783813477, -6.230681896209717, -6.096776008605957, -5.9628705978393555, -5.828964710235596, -5.695058822631836, -5.561152935028076, -5.427247524261475, -5.293341636657715, -5.159435749053955, -5.025529861450195, -4.891624450683594, -4.757718563079834, -4.623812675476074, -4.4899067878723145, -4.356001377105713, -4.222095489501953, -4.088189601898193, -3.9542839527130127, -3.820378303527832, -3.6864724159240723, -3.5525670051574707, -3.41866135597229, -3.2847554683685303, -3.1508498191833496, -3.01694393157959, -2.883038282394409, -2.7491326332092285, -2.6152267456054688, -2.481321334838867, -2.3474156856536865, -2.2135097980499268, -2.079604148864746, -1.9456982612609863, -1.8117926120758057, -1.6778868436813354, -1.5439810752868652, -1.4100751876831055, -1.2761694192886353, -1.142263650894165, -1.0083580017089844, -0.8744521737098694, -0.7405464053153992, -0.6066406965255737, -0.4727349281311035, -0.3388291597366333, -0.20492340624332428, -0.07101765275001526, 0.06288808584213257, 0.19679385423660278, 0.330699622631073, 0.46460533142089844, 0.5985110998153687, 0.7324168682098389, 0.8663226366043091, 1.0002284049987793, 1.13413405418396, 1.2680399417877197, 1.4019455909729004, 1.5358513593673706, 1.6697571277618408, 1.803662896156311]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 10.0, 6.0, 10.0, 7.0, 13.0, 14.0, 24.0, 23.0, 15.0, 26.0, 26.0, 41.0, 32.0, 47.0, 48.0, 46.0, 33.0, 52.0, 45.0, 48.0, 40.0, 40.0, 47.0, 38.0, 54.0, 27.0, 30.0, 26.0, 19.0, 21.0, 18.0, 18.0, 14.0, 11.0, 7.0, 12.0, 3.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9037561416625977, -0.8721358776092529, -0.8405156135559082, -0.8088953495025635, -0.7772750854492188, -0.745654821395874, -0.7140344977378845, -0.6824142336845398, -0.6507939696311951, -0.6191737055778503, -0.5875534415245056, -0.5559331774711609, -0.5243128538131714, -0.49269261956214905, -0.46107232570648193, -0.4294520616531372, -0.3978317975997925, -0.36621153354644775, -0.334591269493103, -0.3029709756374359, -0.2713507115840912, -0.23973044753074646, -0.20811016857624054, -0.17648988962173462, -0.1448696255683899, -0.11324935406446457, -0.08162908256053925, -0.05000881105661392, -0.0183885395526886, 0.013231724500656128, 0.04485200345516205, 0.07647228240966797, 0.10809242725372314, 0.13971269130706787, 0.1713329702615738, 0.2029532492160797, 0.23457351326942444, 0.26619377732276917, 0.2978140711784363, 0.329434335231781, 0.36105459928512573, 0.39267486333847046, 0.4242951273918152, 0.4559154212474823, 0.487535685300827, 0.5191559791564941, 0.5507762432098389, 0.5823965072631836, 0.6140167713165283, 0.645637035369873, 0.6772572994232178, 0.7088775634765625, 0.7404978275299072, 0.772118091583252, 0.8037384152412415, 0.8353586792945862, 0.8669789433479309, 0.8985992074012756, 0.9302194714546204, 0.9618397355079651, 0.9934600591659546, 1.0250803232192993, 1.056700587272644, 1.0883208513259888, 1.1199411153793335]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 14.0, 9.0, 11.0, 12.0, 35.0, 35.0, 44.0, 61.0, 82.0, 138.0, 192.0, 311.0, 450.0, 700.0, 1211.0, 2411.0, 5054.0, 11610.0, 33309.0, 122804.0, 414390.0, 328165.0, 84495.0, 24866.0, 9109.0, 4017.0, 1980.0, 1120.0, 650.0, 439.0, 253.0, 159.0, 117.0, 83.0, 57.0, 39.0, 32.0, 30.0, 13.0, 9.0, 10.0, 11.0, 7.0, 4.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.96484375, -0.9325408935546875, -0.900238037109375, -0.8679351806640625, -0.83563232421875, -0.8033294677734375, -0.771026611328125, -0.7387237548828125, -0.7064208984375, -0.6741180419921875, -0.641815185546875, -0.6095123291015625, -0.57720947265625, -0.5449066162109375, -0.512603759765625, -0.4803009033203125, -0.447998046875, -0.4156951904296875, -0.383392333984375, -0.3510894775390625, -0.31878662109375, -0.2864837646484375, -0.254180908203125, -0.2218780517578125, -0.1895751953125, -0.1572723388671875, -0.124969482421875, -0.0926666259765625, -0.06036376953125, -0.0280609130859375, 0.004241943359375, 0.0365447998046875, 0.06884765625, 0.1011505126953125, 0.133453369140625, 0.1657562255859375, 0.19805908203125, 0.2303619384765625, 0.262664794921875, 0.2949676513671875, 0.3272705078125, 0.3595733642578125, 0.391876220703125, 0.4241790771484375, 0.45648193359375, 0.4887847900390625, 0.521087646484375, 0.5533905029296875, 0.585693359375, 0.6179962158203125, 0.650299072265625, 0.6826019287109375, 0.71490478515625, 0.7472076416015625, 0.779510498046875, 0.8118133544921875, 0.8441162109375, 0.8764190673828125, 0.908721923828125, 0.9410247802734375, 0.97332763671875, 1.0056304931640625, 1.037933349609375, 1.0702362060546875, 1.1025390625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 7.0, 18.0, 19.0, 24.0, 39.0, 65.0, 97.0, 102.0, 98.0, 115.0, 111.0, 96.0, 67.0, 50.0, 32.0, 20.0, 11.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47314453125, -0.457916259765625, -0.44268798828125, -0.427459716796875, -0.4122314453125, -0.397003173828125, -0.38177490234375, -0.366546630859375, -0.351318359375, -0.336090087890625, -0.32086181640625, -0.305633544921875, -0.2904052734375, -0.275177001953125, -0.25994873046875, -0.244720458984375, -0.2294921875, -0.214263916015625, -0.19903564453125, -0.183807373046875, -0.1685791015625, -0.153350830078125, -0.13812255859375, -0.122894287109375, -0.107666015625, -0.092437744140625, -0.07720947265625, -0.061981201171875, -0.0467529296875, -0.031524658203125, -0.01629638671875, -0.001068115234375, 0.01416015625, 0.029388427734375, 0.04461669921875, 0.059844970703125, 0.0750732421875, 0.090301513671875, 0.10552978515625, 0.120758056640625, 0.135986328125, 0.151214599609375, 0.16644287109375, 0.181671142578125, 0.1968994140625, 0.212127685546875, 0.22735595703125, 0.242584228515625, 0.2578125, 0.273040771484375, 0.28826904296875, 0.303497314453125, 0.3187255859375, 0.333953857421875, 0.34918212890625, 0.364410400390625, 0.379638671875, 0.394866943359375, 0.41009521484375, 0.425323486328125, 0.4405517578125, 0.455780029296875, 0.47100830078125, 0.486236572265625, 0.50146484375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 5.0, 4.0, 9.0, 11.0, 9.0, 16.0, 19.0, 23.0, 32.0, 46.0, 57.0, 79.0, 91.0, 162.0, 196.0, 303.0, 593.0, 1186.0, 2905.0, 8474.0, 28000.0, 112059.0, 408291.0, 359076.0, 91076.0, 23550.0, 7090.0, 2560.0, 1096.0, 509.0, 293.0, 184.0, 119.0, 102.0, 83.0, 47.0, 47.0, 28.0, 24.0, 17.0, 21.0, 20.0, 14.0, 11.0, 10.0, 6.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.015625, -0.9827880859375, -0.949951171875, -0.9171142578125, -0.88427734375, -0.8514404296875, -0.818603515625, -0.7857666015625, -0.7529296875, -0.7200927734375, -0.687255859375, -0.6544189453125, -0.62158203125, -0.5887451171875, -0.555908203125, -0.5230712890625, -0.490234375, -0.4573974609375, -0.424560546875, -0.3917236328125, -0.35888671875, -0.3260498046875, -0.293212890625, -0.2603759765625, -0.2275390625, -0.1947021484375, -0.161865234375, -0.1290283203125, -0.09619140625, -0.0633544921875, -0.030517578125, 0.0023193359375, 0.03515625, 0.0679931640625, 0.100830078125, 0.1336669921875, 0.16650390625, 0.1993408203125, 0.232177734375, 0.2650146484375, 0.2978515625, 0.3306884765625, 0.363525390625, 0.3963623046875, 0.42919921875, 0.4620361328125, 0.494873046875, 0.5277099609375, 0.560546875, 0.5933837890625, 0.626220703125, 0.6590576171875, 0.69189453125, 0.7247314453125, 0.757568359375, 0.7904052734375, 0.8232421875, 0.8560791015625, 0.888916015625, 0.9217529296875, 0.95458984375, 0.9874267578125, 1.020263671875, 1.0531005859375, 1.0859375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 2.0, 3.0, 9.0, 8.0, 8.0, 6.0, 7.0, 18.0, 20.0, 16.0, 29.0, 20.0, 31.0, 27.0, 29.0, 33.0, 25.0, 40.0, 40.0, 40.0, 41.0, 56.0, 43.0, 45.0, 33.0, 29.0, 34.0, 35.0, 31.0, 26.0, 27.0, 32.0, 30.0, 24.0, 13.0, 13.0, 15.0, 7.0, 10.0, 7.0, 11.0, 7.0, 5.0, 3.0, 10.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.98095703125, -0.9502029418945312, -0.9194488525390625, -0.8886947631835938, -0.857940673828125, -0.8271865844726562, -0.7964324951171875, -0.7656784057617188, -0.73492431640625, -0.7041702270507812, -0.6734161376953125, -0.6426620483398438, -0.611907958984375, -0.5811538696289062, -0.5503997802734375, -0.5196456909179688, -0.4888916015625, -0.45813751220703125, -0.4273834228515625, -0.39662933349609375, -0.365875244140625, -0.33512115478515625, -0.3043670654296875, -0.27361297607421875, -0.24285888671875, -0.21210479736328125, -0.1813507080078125, -0.15059661865234375, -0.119842529296875, -0.08908843994140625, -0.0583343505859375, -0.02758026123046875, 0.003173828125, 0.03392791748046875, 0.0646820068359375, 0.09543609619140625, 0.126190185546875, 0.15694427490234375, 0.1876983642578125, 0.21845245361328125, 0.24920654296875, 0.27996063232421875, 0.3107147216796875, 0.34146881103515625, 0.372222900390625, 0.40297698974609375, 0.4337310791015625, 0.46448516845703125, 0.4952392578125, 0.5259933471679688, 0.5567474365234375, 0.5875015258789062, 0.618255615234375, 0.6490097045898438, 0.6797637939453125, 0.7105178833007812, 0.74127197265625, 0.7720260620117188, 0.8027801513671875, 0.8335342407226562, 0.864288330078125, 0.8950424194335938, 0.9257965087890625, 0.9565505981445312, 0.9873046875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 0.0, 1.0, 3.0, 4.0, 8.0, 4.0, 10.0, 14.0, 15.0, 20.0, 46.0, 48.0, 57.0, 104.0, 204.0, 341.0, 643.0, 1183.0, 2745.0, 6653.0, 18245.0, 55401.0, 194858.0, 448695.0, 221947.0, 63357.0, 20247.0, 7584.0, 3178.0, 1399.0, 657.0, 347.0, 211.0, 98.0, 70.0, 52.0, 34.0, 24.0, 10.0, 16.0, 9.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.2425537109375, -0.23532485961914062, -0.22809600830078125, -0.22086715698242188, -0.2136383056640625, -0.20640945434570312, -0.19918060302734375, -0.19195175170898438, -0.184722900390625, -0.17749404907226562, -0.17026519775390625, -0.16303634643554688, -0.1558074951171875, -0.14857864379882812, -0.14134979248046875, -0.13412094116210938, -0.12689208984375, -0.11966323852539062, -0.11243438720703125, -0.10520553588867188, -0.0979766845703125, -0.09074783325195312, -0.08351898193359375, -0.07629013061523438, -0.069061279296875, -0.061832427978515625, -0.05460357666015625, -0.047374725341796875, -0.0401458740234375, -0.032917022705078125, -0.02568817138671875, -0.018459320068359375, -0.01123046875, -0.004001617431640625, 0.00322723388671875, 0.010456085205078125, 0.0176849365234375, 0.024913787841796875, 0.03214263916015625, 0.039371490478515625, 0.046600341796875, 0.053829193115234375, 0.06105804443359375, 0.06828689575195312, 0.0755157470703125, 0.08274459838867188, 0.08997344970703125, 0.09720230102539062, 0.10443115234375, 0.11166000366210938, 0.11888885498046875, 0.12611770629882812, 0.1333465576171875, 0.14057540893554688, 0.14780426025390625, 0.15503311157226562, 0.162261962890625, 0.16949081420898438, 0.17671966552734375, 0.18394851684570312, 0.1911773681640625, 0.19840621948242188, 0.20563507080078125, 0.21286392211914062, 0.2200927734375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 2.0, 3.0, 5.0, 4.0, 14.0, 13.0, 9.0, 13.0, 14.0, 13.0, 16.0, 14.0, 37.0, 38.0, 45.0, 76.0, 86.0, 89.0, 100.0, 66.0, 66.0, 56.0, 38.0, 36.0, 22.0, 23.0, 12.0, 19.0, 16.0, 9.0, 9.0, 6.0, 6.0, 5.0, 4.0, 5.0, 3.0, 0.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.270408630371094e-05, -6.054248660802841e-05, -5.8380886912345886e-05, -5.621928721666336e-05, -5.4057687520980835e-05, -5.189608782529831e-05, -4.9734488129615784e-05, -4.757288843393326e-05, -4.541128873825073e-05, -4.324968904256821e-05, -4.108808934688568e-05, -3.8926489651203156e-05, -3.676488995552063e-05, -3.4603290259838104e-05, -3.244169056415558e-05, -3.0280090868473053e-05, -2.8118491172790527e-05, -2.5956891477108002e-05, -2.3795291781425476e-05, -2.163369208574295e-05, -1.9472092390060425e-05, -1.73104926943779e-05, -1.5148892998695374e-05, -1.2987293303012848e-05, -1.0825693607330322e-05, -8.664093911647797e-06, -6.502494215965271e-06, -4.340894520282745e-06, -2.1792948246002197e-06, -1.7695128917694092e-08, 2.1439045667648315e-06, 4.305504262447357e-06, 6.467103958129883e-06, 8.628703653812408e-06, 1.0790303349494934e-05, 1.295190304517746e-05, 1.5113502740859985e-05, 1.727510243654251e-05, 1.9436702132225037e-05, 2.1598301827907562e-05, 2.3759901523590088e-05, 2.5921501219272614e-05, 2.808310091495514e-05, 3.0244700610637665e-05, 3.240630030632019e-05, 3.4567900002002716e-05, 3.672949969768524e-05, 3.889109939336777e-05, 4.105269908905029e-05, 4.321429878473282e-05, 4.5375898480415344e-05, 4.753749817609787e-05, 4.9699097871780396e-05, 5.186069756746292e-05, 5.402229726314545e-05, 5.618389695882797e-05, 5.83454966545105e-05, 6.0507096350193024e-05, 6.266869604587555e-05, 6.483029574155807e-05, 6.69918954372406e-05, 6.915349513292313e-05, 7.131509482860565e-05, 7.347669452428818e-05, 7.56382942199707e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 2.0, 9.0, 6.0, 7.0, 18.0, 35.0, 37.0, 46.0, 89.0, 117.0, 212.0, 359.0, 706.0, 1491.0, 3594.0, 11067.0, 38491.0, 170156.0, 550038.0, 207140.0, 44565.0, 12788.0, 4191.0, 1642.0, 750.0, 371.0, 210.0, 140.0, 98.0, 49.0, 33.0, 35.0, 21.0, 10.0, 11.0, 8.0, 7.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.356689453125, -0.3474388122558594, -0.33818817138671875, -0.3289375305175781, -0.3196868896484375, -0.3104362487792969, -0.30118560791015625, -0.2919349670410156, -0.282684326171875, -0.2734336853027344, -0.26418304443359375, -0.2549324035644531, -0.2456817626953125, -0.23643112182617188, -0.22718048095703125, -0.21792984008789062, -0.20867919921875, -0.19942855834960938, -0.19017791748046875, -0.18092727661132812, -0.1716766357421875, -0.16242599487304688, -0.15317535400390625, -0.14392471313476562, -0.134674072265625, -0.12542343139648438, -0.11617279052734375, -0.10692214965820312, -0.0976715087890625, -0.08842086791992188, -0.07917022705078125, -0.06991958618164062, -0.0606689453125, -0.051418304443359375, -0.04216766357421875, -0.032917022705078125, -0.0236663818359375, -0.014415740966796875, -0.00516510009765625, 0.004085540771484375, 0.013336181640625, 0.022586822509765625, 0.03183746337890625, 0.041088104248046875, 0.0503387451171875, 0.059589385986328125, 0.06884002685546875, 0.07809066772460938, 0.08734130859375, 0.09659194946289062, 0.10584259033203125, 0.11509323120117188, 0.1243438720703125, 0.13359451293945312, 0.14284515380859375, 0.15209579467773438, 0.161346435546875, 0.17059707641601562, 0.17984771728515625, 0.18909835815429688, 0.1983489990234375, 0.20759963989257812, 0.21685028076171875, 0.22610092163085938, 0.2353515625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 1.0, 5.0, 8.0, 3.0, 6.0, 12.0, 13.0, 18.0, 27.0, 32.0, 37.0, 49.0, 60.0, 82.0, 86.0, 80.0, 78.0, 69.0, 83.0, 60.0, 48.0, 28.0, 35.0, 24.0, 10.0, 6.0, 12.0, 11.0, 6.0, 4.0, 2.0, 1.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.362060546875, -0.3533649444580078, -0.3446693420410156, -0.33597373962402344, -0.32727813720703125, -0.31858253479003906, -0.3098869323730469, -0.3011913299560547, -0.2924957275390625, -0.2838001251220703, -0.2751045227050781, -0.26640892028808594, -0.25771331787109375, -0.24901771545410156, -0.24032211303710938, -0.2316265106201172, -0.222930908203125, -0.2142353057861328, -0.20553970336914062, -0.19684410095214844, -0.18814849853515625, -0.17945289611816406, -0.17075729370117188, -0.1620616912841797, -0.1533660888671875, -0.1446704864501953, -0.13597488403320312, -0.12727928161621094, -0.11858367919921875, -0.10988807678222656, -0.10119247436523438, -0.09249687194824219, -0.08380126953125, -0.07510566711425781, -0.06641006469726562, -0.05771446228027344, -0.04901885986328125, -0.04032325744628906, -0.031627655029296875, -0.022932052612304688, -0.0142364501953125, -0.0055408477783203125, 0.003154754638671875, 0.011850357055664062, 0.02054595947265625, 0.029241561889648438, 0.037937164306640625, 0.04663276672363281, 0.055328369140625, 0.06402397155761719, 0.07271957397460938, 0.08141517639160156, 0.09011077880859375, 0.09880638122558594, 0.10750198364257812, 0.11619758605957031, 0.1248931884765625, 0.1335887908935547, 0.14228439331054688, 0.15097999572753906, 0.15967559814453125, 0.16837120056152344, 0.17706680297851562, 0.1857624053955078, 0.1944580078125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 9.0, 10.0, 30.0, 77.0, 123.0, 245.0, 242.0, 143.0, 53.0, 39.0, 14.0, 9.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.874499797821045, -6.531778335571289, -6.189056873321533, -5.846335411071777, -5.50361442565918, -5.160892963409424, -4.818171501159668, -4.47545051574707, -4.132728576660156, -3.7900071144104004, -3.4472858905792236, -3.1045644283294678, -2.761843204498291, -2.419121742248535, -2.0764002799987793, -1.7336790561676025, -1.3909578323364258, -1.0482364892959595, -0.7055150866508484, -0.3627936840057373, -0.020072340965270996, 0.3226490020751953, 0.6653704643249512, 1.008091688156128, 1.3508131504058838, 1.69353449344635, 2.0362558364868164, 2.3789772987365723, 2.721698760986328, 3.064419984817505, 3.4071414470672607, 3.7498626708984375, 4.092583656311035, 4.435305118560791, 4.778026580810547, 5.1207475662231445, 5.4634690284729, 5.806190490722656, 6.148911952972412, 6.491633415222168, 6.834354400634766, 7.1770758628845215, 7.519797325134277, 7.862518310546875, 8.205240249633789, 8.547961235046387, 8.890682220458984, 9.233404159545898, 9.576126098632812, 9.91884708404541, 10.261569023132324, 10.604290008544922, 10.947011947631836, 11.289732933044434, 11.632453918457031, 11.975175857543945, 12.317896842956543, 12.66061782836914, 13.003339767456055, 13.346060752868652, 13.688782691955566, 14.031503677368164, 14.374225616455078, 14.716946601867676, 15.059667587280273]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 6.0, 4.0, 1.0, 5.0, 12.0, 7.0, 7.0, 12.0, 23.0, 26.0, 21.0, 28.0, 47.0, 28.0, 52.0, 53.0, 64.0, 55.0, 49.0, 52.0, 60.0, 55.0, 48.0, 42.0, 33.0, 30.0, 33.0, 31.0, 31.0, 20.0, 19.0, 12.0, 8.0, 7.0, 9.0, 6.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.214570999145508, -7.98219108581543, -7.749811172485352, -7.517431259155273, -7.285051345825195, -7.052671432495117, -6.820291519165039, -6.587911605834961, -6.355531692504883, -6.123151779174805, -5.890771865844727, -5.658391952514648, -5.42601203918457, -5.193632125854492, -4.961252212524414, -4.728872299194336, -4.496492385864258, -4.26411247253418, -4.031732559204102, -3.7993526458740234, -3.5669727325439453, -3.334592819213867, -3.102212905883789, -2.869832992553711, -2.6374526023864746, -2.4050726890563965, -2.1726927757263184, -1.9403128623962402, -1.707932949066162, -1.4755529165267944, -1.2431730031967163, -1.0107930898666382, -0.7784132957458496, -0.5460333824157715, -0.31365343928337097, -0.08127349615097046, 0.15110641717910767, 0.38348639011383057, 0.6158663034439087, 0.8482462167739868, 1.080626130104065, 1.313006043434143, 1.5453859567642212, 1.7777659893035889, 2.010145902633667, 2.242525815963745, 2.4749057292938232, 2.7072856426239014, 2.9396655559539795, 3.1720454692840576, 3.4044253826141357, 3.636805295944214, 3.869185209274292, 4.101565361022949, 4.333945274353027, 4.5663251876831055, 4.798705101013184, 5.031085014343262, 5.26346492767334, 5.495844841003418, 5.728224754333496, 5.960604667663574, 6.192984580993652, 6.4253644943237305, 6.657744407653809]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 7.0, 15.0, 18.0, 31.0, 44.0, 58.0, 136.0, 239.0, 441.0, 951.0, 2653.0, 10329.0, 88809.0, 3902671.0, 167174.0, 14486.0, 3522.0, 1328.0, 583.0, 331.0, 163.0, 102.0, 56.0, 33.0, 29.0, 16.0, 11.0, 12.0, 5.0, 2.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8515625, -1.78900146484375, -1.7264404296875, -1.66387939453125, -1.601318359375, -1.53875732421875, -1.4761962890625, -1.41363525390625, -1.35107421875, -1.28851318359375, -1.2259521484375, -1.16339111328125, -1.100830078125, -1.03826904296875, -0.9757080078125, -0.91314697265625, -0.8505859375, -0.78802490234375, -0.7254638671875, -0.66290283203125, -0.600341796875, -0.53778076171875, -0.4752197265625, -0.41265869140625, -0.35009765625, -0.28753662109375, -0.2249755859375, -0.16241455078125, -0.099853515625, -0.03729248046875, 0.0252685546875, 0.08782958984375, 0.150390625, 0.21295166015625, 0.2755126953125, 0.33807373046875, 0.400634765625, 0.46319580078125, 0.5257568359375, 0.58831787109375, 0.65087890625, 0.71343994140625, 0.7760009765625, 0.83856201171875, 0.901123046875, 0.96368408203125, 1.0262451171875, 1.08880615234375, 1.1513671875, 1.21392822265625, 1.2764892578125, 1.33905029296875, 1.401611328125, 1.46417236328125, 1.5267333984375, 1.58929443359375, 1.65185546875, 1.71441650390625, 1.7769775390625, 1.83953857421875, 1.902099609375, 1.96466064453125, 2.0272216796875, 2.08978271484375, 2.15234375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 18.0, 11.0, 24.0, 24.0, 49.0, 76.0, 95.0, 105.0, 103.0, 101.0, 94.0, 92.0, 72.0, 49.0, 31.0, 24.0, 10.0, 7.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.474365234375, -0.4585151672363281, -0.44266510009765625, -0.4268150329589844, -0.4109649658203125, -0.3951148986816406, -0.37926483154296875, -0.3634147644042969, -0.347564697265625, -0.3317146301269531, -0.31586456298828125, -0.3000144958496094, -0.2841644287109375, -0.2683143615722656, -0.25246429443359375, -0.23661422729492188, -0.22076416015625, -0.20491409301757812, -0.18906402587890625, -0.17321395874023438, -0.1573638916015625, -0.14151382446289062, -0.12566375732421875, -0.10981369018554688, -0.093963623046875, -0.07811355590820312, -0.06226348876953125, -0.046413421630859375, -0.0305633544921875, -0.014713287353515625, 0.00113677978515625, 0.016986846923828125, 0.0328369140625, 0.048686981201171875, 0.06453704833984375, 0.08038711547851562, 0.0962371826171875, 0.11208724975585938, 0.12793731689453125, 0.14378738403320312, 0.159637451171875, 0.17548751831054688, 0.19133758544921875, 0.20718765258789062, 0.2230377197265625, 0.23888778686523438, 0.25473785400390625, 0.2705879211425781, 0.28643798828125, 0.3022880554199219, 0.31813812255859375, 0.3339881896972656, 0.3498382568359375, 0.3656883239746094, 0.38153839111328125, 0.3973884582519531, 0.413238525390625, 0.4290885925292969, 0.44493865966796875, 0.4607887268066406, 0.4766387939453125, 0.4924888610839844, 0.5083389282226562, 0.5241889953613281, 0.5400390625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 7.0, 12.0, 26.0, 54.0, 154.0, 468.0, 2445.0, 67916.0, 4102875.0, 17812.0, 1751.0, 462.0, 157.0, 68.0, 36.0, 15.0, 14.0, 8.0, 5.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.380859375, -1.269073486328125, -1.15728759765625, -1.045501708984375, -0.9337158203125, -0.821929931640625, -0.71014404296875, -0.598358154296875, -0.486572265625, -0.374786376953125, -0.26300048828125, -0.151214599609375, -0.0394287109375, 0.072357177734375, 0.18414306640625, 0.295928955078125, 0.40771484375, 0.519500732421875, 0.63128662109375, 0.743072509765625, 0.8548583984375, 0.966644287109375, 1.07843017578125, 1.190216064453125, 1.302001953125, 1.413787841796875, 1.52557373046875, 1.637359619140625, 1.7491455078125, 1.860931396484375, 1.97271728515625, 2.084503173828125, 2.1962890625, 2.308074951171875, 2.41986083984375, 2.531646728515625, 2.6434326171875, 2.755218505859375, 2.86700439453125, 2.978790283203125, 3.090576171875, 3.202362060546875, 3.31414794921875, 3.425933837890625, 3.5377197265625, 3.649505615234375, 3.76129150390625, 3.873077392578125, 3.98486328125, 4.096649169921875, 4.20843505859375, 4.320220947265625, 4.4320068359375, 4.543792724609375, 4.65557861328125, 4.767364501953125, 4.879150390625, 4.990936279296875, 5.10272216796875, 5.214508056640625, 5.3262939453125, 5.438079833984375, 5.54986572265625, 5.661651611328125, 5.7734375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 3.0, 5.0, 8.0, 15.0, 27.0, 41.0, 82.0, 196.0, 566.0, 1941.0, 737.0, 236.0, 98.0, 45.0, 27.0, 12.0, 12.0, 4.0, 6.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50927734375, -0.48462677001953125, -0.4599761962890625, -0.43532562255859375, -0.410675048828125, -0.38602447509765625, -0.3613739013671875, -0.33672332763671875, -0.31207275390625, -0.28742218017578125, -0.2627716064453125, -0.23812103271484375, -0.213470458984375, -0.18881988525390625, -0.1641693115234375, -0.13951873779296875, -0.1148681640625, -0.09021759033203125, -0.0655670166015625, -0.04091644287109375, -0.016265869140625, 0.00838470458984375, 0.0330352783203125, 0.05768585205078125, 0.08233642578125, 0.10698699951171875, 0.1316375732421875, 0.15628814697265625, 0.180938720703125, 0.20558929443359375, 0.2302398681640625, 0.25489044189453125, 0.279541015625, 0.30419158935546875, 0.3288421630859375, 0.35349273681640625, 0.378143310546875, 0.40279388427734375, 0.4274444580078125, 0.45209503173828125, 0.47674560546875, 0.5013961791992188, 0.5260467529296875, 0.5506973266601562, 0.575347900390625, 0.5999984741210938, 0.6246490478515625, 0.6492996215820312, 0.6739501953125, 0.6986007690429688, 0.7232513427734375, 0.7479019165039062, 0.772552490234375, 0.7972030639648438, 0.8218536376953125, 0.8465042114257812, 0.87115478515625, 0.8958053588867188, 0.9204559326171875, 0.9451065063476562, 0.969757080078125, 0.9944076538085938, 1.0190582275390625, 1.0437088012695312, 1.068359375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 30.0, 92.0, 323.0, 337.0, 149.0, 50.0, 10.0, 4.0, 4.0, 3.0, 4.0, 0.0, 2.0], "bins": [-11.190675735473633, -10.984847068786621, -10.779019355773926, -10.573190689086914, -10.367362976074219, -10.161534309387207, -9.955706596374512, -9.7498779296875, -9.544050216674805, -9.338221549987793, -9.132393836975098, -8.926565170288086, -8.72073745727539, -8.514908790588379, -8.309081077575684, -8.103252410888672, -7.897424221038818, -7.691596031188965, -7.485767841339111, -7.279939651489258, -7.074111461639404, -6.868283271789551, -6.662454605102539, -6.456626892089844, -6.250798225402832, -6.0449700355529785, -5.839141845703125, -5.6333136558532715, -5.427485466003418, -5.2216572761535645, -5.015829086303711, -4.810000419616699, -4.604172229766846, -4.398344039916992, -4.192515850067139, -3.986687660217285, -3.7808594703674316, -3.575031280517578, -3.3692028522491455, -3.163374662399292, -2.9575467109680176, -2.751718521118164, -2.5458903312683105, -2.340062141418457, -2.1342339515686035, -1.9284056425094604, -1.7225773334503174, -1.5167491436004639, -1.3109208345413208, -1.1050926446914673, -0.899264395236969, -0.6934361457824707, -0.4876079559326172, -0.28177976608276367, -0.0759514570236206, 0.1298767328262329, 0.3357049226760864, 0.5415331125259399, 0.7473613619804382, 0.9531896114349365, 1.15901780128479, 1.3648459911346436, 1.5706743001937866, 1.7765024900436401, 1.9823306798934937]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 7.0, 2.0, 11.0, 13.0, 12.0, 23.0, 26.0, 24.0, 39.0, 65.0, 52.0, 66.0, 58.0, 77.0, 80.0, 73.0, 58.0, 72.0, 60.0, 46.0, 32.0, 38.0, 18.0, 20.0, 7.0, 14.0, 3.0, 7.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.013636589050293, -1.9260454177856445, -1.838454246520996, -1.7508630752563477, -1.6632720232009888, -1.5756808519363403, -1.488089680671692, -1.400498628616333, -1.3129074573516846, -1.2253162860870361, -1.1377251148223877, -1.0501339435577393, -0.9625428915023804, -0.8749517202377319, -0.7873605489730835, -0.6997694373130798, -0.6121782064437866, -0.5245870351791382, -0.4369959235191345, -0.3494047522544861, -0.26181361079216003, -0.17422246932983398, -0.08663129806518555, 0.0009598135948181152, 0.08855098485946655, 0.1761421263217926, 0.26373326778411865, 0.3513244390487671, 0.43891558051109314, 0.5265067219734192, 0.6140978932380676, 0.7016890048980713, 0.7892801761627197, 0.8768713474273682, 0.9644624590873718, 1.052053689956665, 1.139644742012024, 1.2272359132766724, 1.3148270845413208, 1.4024181365966797, 1.4900093078613281, 1.5776004791259766, 1.665191650390625, 1.7527828216552734, 1.8403738737106323, 1.9279650449752808, 2.0155563354492188, 2.103147268295288, 2.1907386779785156, 2.278329849243164, 2.3659210205078125, 2.453512191772461, 2.5411033630371094, 2.628694534301758, 2.7162857055664062, 2.8038766384124756, 2.891467809677124, 2.9790589809417725, 3.066650152206421, 3.1542413234710693, 3.2418324947357178, 3.329423427581787, 3.4170145988464355, 3.504605770111084, 3.5921969413757324]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 1.0, 7.0, 5.0, 15.0, 18.0, 26.0, 43.0, 57.0, 111.0, 188.0, 333.0, 620.0, 1468.0, 3487.0, 12125.0, 73036.0, 612521.0, 300395.0, 32598.0, 6920.0, 2425.0, 991.0, 500.0, 264.0, 150.0, 98.0, 58.0, 26.0, 19.0, 16.0, 14.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.90234375, -1.840576171875, -1.77880859375, -1.717041015625, -1.6552734375, -1.593505859375, -1.53173828125, -1.469970703125, -1.408203125, -1.346435546875, -1.28466796875, -1.222900390625, -1.1611328125, -1.099365234375, -1.03759765625, -0.975830078125, -0.9140625, -0.852294921875, -0.79052734375, -0.728759765625, -0.6669921875, -0.605224609375, -0.54345703125, -0.481689453125, -0.419921875, -0.358154296875, -0.29638671875, -0.234619140625, -0.1728515625, -0.111083984375, -0.04931640625, 0.012451171875, 0.07421875, 0.135986328125, 0.19775390625, 0.259521484375, 0.3212890625, 0.383056640625, 0.44482421875, 0.506591796875, 0.568359375, 0.630126953125, 0.69189453125, 0.753662109375, 0.8154296875, 0.877197265625, 0.93896484375, 1.000732421875, 1.0625, 1.124267578125, 1.18603515625, 1.247802734375, 1.3095703125, 1.371337890625, 1.43310546875, 1.494873046875, 1.556640625, 1.618408203125, 1.68017578125, 1.741943359375, 1.8037109375, 1.865478515625, 1.92724609375, 1.989013671875, 2.05078125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 6.0, 18.0, 12.0, 29.0, 43.0, 71.0, 99.0, 116.0, 93.0, 114.0, 94.0, 96.0, 80.0, 54.0, 29.0, 12.0, 16.0, 4.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5107421875, -0.49480438232421875, -0.4788665771484375, -0.46292877197265625, -0.446990966796875, -0.43105316162109375, -0.4151153564453125, -0.39917755126953125, -0.38323974609375, -0.36730194091796875, -0.3513641357421875, -0.33542633056640625, -0.319488525390625, -0.30355072021484375, -0.2876129150390625, -0.27167510986328125, -0.2557373046875, -0.23979949951171875, -0.2238616943359375, -0.20792388916015625, -0.191986083984375, -0.17604827880859375, -0.1601104736328125, -0.14417266845703125, -0.12823486328125, -0.11229705810546875, -0.0963592529296875, -0.08042144775390625, -0.064483642578125, -0.04854583740234375, -0.0326080322265625, -0.01667022705078125, -0.000732421875, 0.01520538330078125, 0.0311431884765625, 0.04708099365234375, 0.063018798828125, 0.07895660400390625, 0.0948944091796875, 0.11083221435546875, 0.12677001953125, 0.14270782470703125, 0.1586456298828125, 0.17458343505859375, 0.190521240234375, 0.20645904541015625, 0.2223968505859375, 0.23833465576171875, 0.2542724609375, 0.27021026611328125, 0.2861480712890625, 0.30208587646484375, 0.318023681640625, 0.33396148681640625, 0.3498992919921875, 0.36583709716796875, 0.38177490234375, 0.39771270751953125, 0.4136505126953125, 0.42958831787109375, 0.445526123046875, 0.46146392822265625, 0.4774017333984375, 0.49333953857421875, 0.50927734375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 2.0, 3.0, 11.0, 8.0, 21.0, 22.0, 28.0, 29.0, 50.0, 78.0, 150.0, 238.0, 369.0, 683.0, 1490.0, 4058.0, 13338.0, 55720.0, 265542.0, 512204.0, 148862.0, 31982.0, 8402.0, 2792.0, 1130.0, 532.0, 276.0, 185.0, 112.0, 82.0, 56.0, 31.0, 21.0, 16.0, 11.0, 5.0, 5.0, 6.0, 1.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96484375, -0.9281768798828125, -0.891510009765625, -0.8548431396484375, -0.81817626953125, -0.7815093994140625, -0.744842529296875, -0.7081756591796875, -0.6715087890625, -0.6348419189453125, -0.598175048828125, -0.5615081787109375, -0.52484130859375, -0.4881744384765625, -0.451507568359375, -0.4148406982421875, -0.378173828125, -0.3415069580078125, -0.304840087890625, -0.2681732177734375, -0.23150634765625, -0.1948394775390625, -0.158172607421875, -0.1215057373046875, -0.0848388671875, -0.0481719970703125, -0.011505126953125, 0.0251617431640625, 0.06182861328125, 0.0984954833984375, 0.135162353515625, 0.1718292236328125, 0.20849609375, 0.2451629638671875, 0.281829833984375, 0.3184967041015625, 0.35516357421875, 0.3918304443359375, 0.428497314453125, 0.4651641845703125, 0.5018310546875, 0.5384979248046875, 0.575164794921875, 0.6118316650390625, 0.64849853515625, 0.6851654052734375, 0.721832275390625, 0.7584991455078125, 0.795166015625, 0.8318328857421875, 0.868499755859375, 0.9051666259765625, 0.94183349609375, 0.9785003662109375, 1.015167236328125, 1.0518341064453125, 1.0885009765625, 1.1251678466796875, 1.161834716796875, 1.1985015869140625, 1.23516845703125, 1.2718353271484375, 1.308502197265625, 1.3451690673828125, 1.3818359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 6.0, 9.0, 14.0, 12.0, 16.0, 14.0, 22.0, 30.0, 35.0, 34.0, 38.0, 50.0, 43.0, 44.0, 54.0, 45.0, 55.0, 46.0, 42.0, 53.0, 41.0, 36.0, 36.0, 30.0, 42.0, 33.0, 21.0, 16.0, 14.0, 16.0, 9.0, 11.0, 12.0, 4.0, 3.0, 2.0, 5.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98876953125, -0.9518051147460938, -0.9148406982421875, -0.8778762817382812, -0.840911865234375, -0.8039474487304688, -0.7669830322265625, -0.7300186157226562, -0.69305419921875, -0.6560897827148438, -0.6191253662109375, -0.5821609497070312, -0.545196533203125, -0.5082321166992188, -0.4712677001953125, -0.43430328369140625, -0.3973388671875, -0.36037445068359375, -0.3234100341796875, -0.28644561767578125, -0.249481201171875, -0.21251678466796875, -0.1755523681640625, -0.13858795166015625, -0.10162353515625, -0.06465911865234375, -0.0276947021484375, 0.00926971435546875, 0.046234130859375, 0.08319854736328125, 0.1201629638671875, 0.15712738037109375, 0.194091796875, 0.23105621337890625, 0.2680206298828125, 0.30498504638671875, 0.341949462890625, 0.37891387939453125, 0.4158782958984375, 0.45284271240234375, 0.48980712890625, 0.5267715454101562, 0.5637359619140625, 0.6007003784179688, 0.637664794921875, 0.6746292114257812, 0.7115936279296875, 0.7485580444335938, 0.7855224609375, 0.8224868774414062, 0.8594512939453125, 0.8964157104492188, 0.933380126953125, 0.9703445434570312, 1.0073089599609375, 1.0442733764648438, 1.08123779296875, 1.1182022094726562, 1.1551666259765625, 1.1921310424804688, 1.229095458984375, 1.2660598754882812, 1.3030242919921875, 1.3399887084960938, 1.376953125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 4.0, 3.0, 7.0, 10.0, 14.0, 24.0, 54.0, 67.0, 127.0, 264.0, 481.0, 1177.0, 3429.0, 12801.0, 67051.0, 448941.0, 431768.0, 64321.0, 12378.0, 3357.0, 1162.0, 522.0, 271.0, 115.0, 67.0, 58.0, 29.0, 16.0, 14.0, 6.0, 7.0, 6.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.467041015625, -0.45441436767578125, -0.4417877197265625, -0.42916107177734375, -0.416534423828125, -0.40390777587890625, -0.3912811279296875, -0.37865447998046875, -0.36602783203125, -0.35340118408203125, -0.3407745361328125, -0.32814788818359375, -0.315521240234375, -0.30289459228515625, -0.2902679443359375, -0.27764129638671875, -0.2650146484375, -0.25238800048828125, -0.2397613525390625, -0.22713470458984375, -0.214508056640625, -0.20188140869140625, -0.1892547607421875, -0.17662811279296875, -0.16400146484375, -0.15137481689453125, -0.1387481689453125, -0.12612152099609375, -0.113494873046875, -0.10086822509765625, -0.0882415771484375, -0.07561492919921875, -0.06298828125, -0.05036163330078125, -0.0377349853515625, -0.02510833740234375, -0.012481689453125, 0.00014495849609375, 0.0127716064453125, 0.02539825439453125, 0.03802490234375, 0.05065155029296875, 0.0632781982421875, 0.07590484619140625, 0.088531494140625, 0.10115814208984375, 0.1137847900390625, 0.12641143798828125, 0.1390380859375, 0.15166473388671875, 0.1642913818359375, 0.17691802978515625, 0.189544677734375, 0.20217132568359375, 0.2147979736328125, 0.22742462158203125, 0.24005126953125, 0.25267791748046875, 0.2653045654296875, 0.27793121337890625, 0.290557861328125, 0.30318450927734375, 0.3158111572265625, 0.32843780517578125, 0.341064453125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 5.0, 3.0, 9.0, 8.0, 13.0, 13.0, 14.0, 21.0, 23.0, 33.0, 31.0, 70.0, 73.0, 75.0, 116.0, 108.0, 81.0, 71.0, 41.0, 37.0, 28.0, 23.0, 12.0, 16.0, 12.0, 8.0, 6.0, 5.0, 7.0, 9.0, 2.0, 2.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.362531661987305e-05, -8.106045424938202e-05, -7.849559187889099e-05, -7.593072950839996e-05, -7.336586713790894e-05, -7.080100476741791e-05, -6.823614239692688e-05, -6.567128002643585e-05, -6.310641765594482e-05, -6.0541555285453796e-05, -5.797669291496277e-05, -5.541183054447174e-05, -5.284696817398071e-05, -5.0282105803489685e-05, -4.771724343299866e-05, -4.515238106250763e-05, -4.25875186920166e-05, -4.0022656321525574e-05, -3.7457793951034546e-05, -3.489293158054352e-05, -3.232806921005249e-05, -2.9763206839561462e-05, -2.7198344469070435e-05, -2.4633482098579407e-05, -2.206861972808838e-05, -1.950375735759735e-05, -1.6938894987106323e-05, -1.4374032616615295e-05, -1.1809170246124268e-05, -9.24430787563324e-06, -6.679445505142212e-06, -4.114583134651184e-06, -1.5497207641601562e-06, 1.0151416063308716e-06, 3.5800039768218994e-06, 6.144866347312927e-06, 8.709728717803955e-06, 1.1274591088294983e-05, 1.383945345878601e-05, 1.640431582927704e-05, 1.8969178199768066e-05, 2.1534040570259094e-05, 2.4098902940750122e-05, 2.666376531124115e-05, 2.9228627681732178e-05, 3.1793490052223206e-05, 3.4358352422714233e-05, 3.692321479320526e-05, 3.948807716369629e-05, 4.205293953418732e-05, 4.4617801904678345e-05, 4.718266427516937e-05, 4.97475266456604e-05, 5.231238901615143e-05, 5.4877251386642456e-05, 5.7442113757133484e-05, 6.000697612762451e-05, 6.257183849811554e-05, 6.513670086860657e-05, 6.77015632390976e-05, 7.026642560958862e-05, 7.283128798007965e-05, 7.539615035057068e-05, 7.79610127210617e-05, 8.052587509155273e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 8.0, 18.0, 23.0, 62.0, 81.0, 188.0, 335.0, 736.0, 2081.0, 7369.0, 37176.0, 280947.0, 618603.0, 81345.0, 14093.0, 3482.0, 1125.0, 429.0, 193.0, 97.0, 70.0, 39.0, 14.0, 12.0, 6.0, 9.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.54052734375, -0.5256004333496094, -0.5106735229492188, -0.4957466125488281, -0.4808197021484375, -0.4658927917480469, -0.45096588134765625, -0.4360389709472656, -0.421112060546875, -0.4061851501464844, -0.39125823974609375, -0.3763313293457031, -0.3614044189453125, -0.3464775085449219, -0.33155059814453125, -0.3166236877441406, -0.30169677734375, -0.2867698669433594, -0.27184295654296875, -0.2569160461425781, -0.2419891357421875, -0.22706222534179688, -0.21213531494140625, -0.19720840454101562, -0.182281494140625, -0.16735458374023438, -0.15242767333984375, -0.13750076293945312, -0.1225738525390625, -0.10764694213867188, -0.09272003173828125, -0.07779312133789062, -0.0628662109375, -0.047939300537109375, -0.03301239013671875, -0.018085479736328125, -0.0031585693359375, 0.011768341064453125, 0.02669525146484375, 0.041622161865234375, 0.056549072265625, 0.07147598266601562, 0.08640289306640625, 0.10132980346679688, 0.1162567138671875, 0.13118362426757812, 0.14611053466796875, 0.16103744506835938, 0.17596435546875, 0.19089126586914062, 0.20581817626953125, 0.22074508666992188, 0.2356719970703125, 0.2505989074707031, 0.26552581787109375, 0.2804527282714844, 0.295379638671875, 0.3103065490722656, 0.32523345947265625, 0.3401603698730469, 0.3550872802734375, 0.3700141906738281, 0.38494110107421875, 0.3998680114746094, 0.414794921875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 3.0, 5.0, 9.0, 6.0, 11.0, 11.0, 18.0, 26.0, 28.0, 38.0, 65.0, 63.0, 82.0, 99.0, 95.0, 80.0, 73.0, 58.0, 65.0, 35.0, 30.0, 25.0, 25.0, 8.0, 12.0, 5.0, 10.0, 4.0, 1.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.259765625, -0.24959945678710938, -0.23943328857421875, -0.22926712036132812, -0.2191009521484375, -0.20893478393554688, -0.19876861572265625, -0.18860244750976562, -0.178436279296875, -0.16827011108398438, -0.15810394287109375, -0.14793777465820312, -0.1377716064453125, -0.12760543823242188, -0.11743927001953125, -0.10727310180664062, -0.09710693359375, -0.08694076538085938, -0.07677459716796875, -0.06660842895507812, -0.0564422607421875, -0.046276092529296875, -0.03610992431640625, -0.025943756103515625, -0.015777587890625, -0.005611419677734375, 0.00455474853515625, 0.014720916748046875, 0.0248870849609375, 0.035053253173828125, 0.04521942138671875, 0.055385589599609375, 0.0655517578125, 0.07571792602539062, 0.08588409423828125, 0.09605026245117188, 0.1062164306640625, 0.11638259887695312, 0.12654876708984375, 0.13671493530273438, 0.146881103515625, 0.15704727172851562, 0.16721343994140625, 0.17737960815429688, 0.1875457763671875, 0.19771194458007812, 0.20787811279296875, 0.21804428100585938, 0.22821044921875, 0.23837661743164062, 0.24854278564453125, 0.2587089538574219, 0.2688751220703125, 0.2790412902832031, 0.28920745849609375, 0.2993736267089844, 0.309539794921875, 0.3197059631347656, 0.32987213134765625, 0.3400382995605469, 0.3502044677734375, 0.3603706359863281, 0.37053680419921875, 0.3807029724121094, 0.390869140625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 5.0, 7.0, 9.0, 12.0, 17.0, 17.0, 31.0, 48.0, 59.0, 86.0, 106.0, 123.0, 131.0, 100.0, 73.0, 56.0, 34.0, 24.0, 12.0, 10.0, 11.0, 5.0, 3.0, 8.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.325015068054199, -4.169290065765381, -4.0135650634765625, -3.8578402996063232, -3.702115297317505, -3.5463902950286865, -3.3906655311584473, -3.234940528869629, -3.0792155265808105, -2.923490524291992, -2.767765522003174, -2.6120407581329346, -2.456315755844116, -2.300590753555298, -2.1448659896850586, -1.9891409873962402, -1.8334159851074219, -1.6776909828186035, -1.5219660997390747, -1.366241216659546, -1.2105162143707275, -1.0547912120819092, -0.8990663290023804, -0.7433414459228516, -0.5876164436340332, -0.4318915009498596, -0.27616655826568604, -0.12044161558151245, 0.03528332710266113, 0.19100826978683472, 0.3467332124710083, 0.5024580955505371, 0.6581830978393555, 0.813908040523529, 0.9696329832077026, 1.1253578662872314, 1.2810828685760498, 1.4368078708648682, 1.592532753944397, 1.7482576370239258, 1.9039826393127441, 2.0597076416015625, 2.215432643890381, 2.37115740776062, 2.5268824100494385, 2.682607412338257, 2.838332176208496, 2.9940571784973145, 3.149782180786133, 3.305507183074951, 3.4612321853637695, 3.616956949234009, 3.772681951522827, 3.9284069538116455, 4.084131717681885, 4.239856719970703, 4.3955817222595215, 4.55130672454834, 4.707031726837158, 4.862756729125977, 5.018481254577637, 5.174206256866455, 5.329931259155273, 5.485656261444092, 5.64138126373291]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 8.0, 8.0, 5.0, 5.0, 16.0, 11.0, 13.0, 14.0, 19.0, 26.0, 41.0, 40.0, 25.0, 43.0, 55.0, 52.0, 72.0, 65.0, 45.0, 46.0, 50.0, 49.0, 47.0, 40.0, 41.0, 30.0, 25.0, 18.0, 20.0, 12.0, 14.0, 14.0, 13.0, 9.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.08458948135376, -6.858901500701904, -6.633213520050049, -6.407525062561035, -6.18183708190918, -5.956149101257324, -5.730461120605469, -5.504773139953613, -5.279085159301758, -5.053397178649902, -4.827709197998047, -4.602021217346191, -4.376332759857178, -4.150644779205322, -3.924956798553467, -3.6992688179016113, -3.4735805988311768, -3.2478926181793213, -3.0222043991088867, -2.7965164184570312, -2.570828437805176, -2.3451404571533203, -2.1194522380828857, -1.8937642574310303, -1.6680761575698853, -1.4423880577087402, -1.2167000770568848, -0.9910119771957397, -0.7653239369392395, -0.5396358966827393, -0.31394779682159424, -0.08825981616973877, 0.13742828369140625, 0.3631163239479065, 0.5888043642044067, 0.8144924640655518, 1.0401804447174072, 1.2658685445785522, 1.4915566444396973, 1.7172446250915527, 1.9429327249526978, 2.1686208248138428, 2.3943088054656982, 2.619997024536133, 2.8456850051879883, 3.0713729858398438, 3.297060966491699, 3.5227489471435547, 3.7484371662139893, 3.9741251468658447, 4.199813365936279, 4.425501346588135, 4.65118932723999, 4.876877307891846, 5.102565765380859, 5.328253746032715, 5.55394172668457, 5.779629707336426, 6.005317687988281, 6.231005668640137, 6.45669412612915, 6.682382106781006, 6.908070087432861, 7.133758068084717, 7.359446048736572]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 7.0, 12.0, 9.0, 16.0, 38.0, 73.0, 128.0, 252.0, 692.0, 2771.0, 23319.0, 4064374.0, 94943.0, 5649.0, 1166.0, 424.0, 194.0, 92.0, 47.0, 37.0, 13.0, 4.0, 8.0, 6.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.224609375, -2.147064208984375, -2.06951904296875, -1.991973876953125, -1.9144287109375, -1.836883544921875, -1.75933837890625, -1.681793212890625, -1.604248046875, -1.526702880859375, -1.44915771484375, -1.371612548828125, -1.2940673828125, -1.216522216796875, -1.13897705078125, -1.061431884765625, -0.98388671875, -0.906341552734375, -0.82879638671875, -0.751251220703125, -0.6737060546875, -0.596160888671875, -0.51861572265625, -0.441070556640625, -0.363525390625, -0.285980224609375, -0.20843505859375, -0.130889892578125, -0.0533447265625, 0.024200439453125, 0.10174560546875, 0.179290771484375, 0.2568359375, 0.334381103515625, 0.41192626953125, 0.489471435546875, 0.5670166015625, 0.644561767578125, 0.72210693359375, 0.799652099609375, 0.877197265625, 0.954742431640625, 1.03228759765625, 1.109832763671875, 1.1873779296875, 1.264923095703125, 1.34246826171875, 1.420013427734375, 1.49755859375, 1.575103759765625, 1.65264892578125, 1.730194091796875, 1.8077392578125, 1.885284423828125, 1.96282958984375, 2.040374755859375, 2.117919921875, 2.195465087890625, 2.27301025390625, 2.350555419921875, 2.4281005859375, 2.505645751953125, 2.58319091796875, 2.660736083984375, 2.73828125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 7.0, 6.0, 14.0, 16.0, 32.0, 35.0, 63.0, 77.0, 103.0, 100.0, 94.0, 98.0, 88.0, 91.0, 68.0, 39.0, 26.0, 16.0, 8.0, 8.0, 4.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.497314453125, -0.4809913635253906, -0.46466827392578125, -0.4483451843261719, -0.4320220947265625, -0.4156990051269531, -0.39937591552734375, -0.3830528259277344, -0.366729736328125, -0.3504066467285156, -0.33408355712890625, -0.3177604675292969, -0.3014373779296875, -0.2851142883300781, -0.26879119873046875, -0.2524681091308594, -0.23614501953125, -0.21982192993164062, -0.20349884033203125, -0.18717575073242188, -0.1708526611328125, -0.15452957153320312, -0.13820648193359375, -0.12188339233398438, -0.105560302734375, -0.08923721313476562, -0.07291412353515625, -0.056591033935546875, -0.0402679443359375, -0.023944854736328125, -0.00762176513671875, 0.008701324462890625, 0.0250244140625, 0.041347503662109375, 0.05767059326171875, 0.07399368286132812, 0.0903167724609375, 0.10663986206054688, 0.12296295166015625, 0.13928604125976562, 0.155609130859375, 0.17193222045898438, 0.18825531005859375, 0.20457839965820312, 0.2209014892578125, 0.23722457885742188, 0.25354766845703125, 0.2698707580566406, 0.28619384765625, 0.3025169372558594, 0.31884002685546875, 0.3351631164550781, 0.3514862060546875, 0.3678092956542969, 0.38413238525390625, 0.4004554748535156, 0.416778564453125, 0.4331016540527344, 0.44942474365234375, 0.4657478332519531, 0.4820709228515625, 0.4983940124511719, 0.5147171020507812, 0.5310401916503906, 0.54736328125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 12.0, 6.0, 6.0, 15.0, 21.0, 41.0, 56.0, 82.0, 159.0, 286.0, 556.0, 1336.0, 4248.0, 20694.0, 285724.0, 3757736.0, 106003.0, 12380.0, 2915.0, 1032.0, 442.0, 216.0, 136.0, 80.0, 34.0, 14.0, 21.0, 12.0, 7.0, 3.0, 7.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.169921875, -1.1358642578125, -1.101806640625, -1.0677490234375, -1.03369140625, -0.9996337890625, -0.965576171875, -0.9315185546875, -0.8974609375, -0.8634033203125, -0.829345703125, -0.7952880859375, -0.76123046875, -0.7271728515625, -0.693115234375, -0.6590576171875, -0.625, -0.5909423828125, -0.556884765625, -0.5228271484375, -0.48876953125, -0.4547119140625, -0.420654296875, -0.3865966796875, -0.3525390625, -0.3184814453125, -0.284423828125, -0.2503662109375, -0.21630859375, -0.1822509765625, -0.148193359375, -0.1141357421875, -0.080078125, -0.0460205078125, -0.011962890625, 0.0220947265625, 0.05615234375, 0.0902099609375, 0.124267578125, 0.1583251953125, 0.1923828125, 0.2264404296875, 0.260498046875, 0.2945556640625, 0.32861328125, 0.3626708984375, 0.396728515625, 0.4307861328125, 0.46484375, 0.4989013671875, 0.532958984375, 0.5670166015625, 0.60107421875, 0.6351318359375, 0.669189453125, 0.7032470703125, 0.7373046875, 0.7713623046875, 0.805419921875, 0.8394775390625, 0.87353515625, 0.9075927734375, 0.941650390625, 0.9757080078125, 1.009765625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 7.0, 10.0, 5.0, 16.0, 30.0, 54.0, 93.0, 252.0, 994.0, 1908.0, 400.0, 127.0, 78.0, 40.0, 20.0, 14.0, 10.0, 6.0, 2.0, 9.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.591796875, -0.5767021179199219, -0.5616073608398438, -0.5465126037597656, -0.5314178466796875, -0.5163230895996094, -0.5012283325195312, -0.4861335754394531, -0.471038818359375, -0.4559440612792969, -0.44084930419921875, -0.4257545471191406, -0.4106597900390625, -0.3955650329589844, -0.38047027587890625, -0.3653755187988281, -0.35028076171875, -0.3351860046386719, -0.32009124755859375, -0.3049964904785156, -0.2899017333984375, -0.2748069763183594, -0.25971221923828125, -0.24461746215820312, -0.229522705078125, -0.21442794799804688, -0.19933319091796875, -0.18423843383789062, -0.1691436767578125, -0.15404891967773438, -0.13895416259765625, -0.12385940551757812, -0.1087646484375, -0.09366989135742188, -0.07857513427734375, -0.06348037719726562, -0.0483856201171875, -0.033290863037109375, -0.01819610595703125, -0.003101348876953125, 0.011993408203125, 0.027088165283203125, 0.04218292236328125, 0.057277679443359375, 0.0723724365234375, 0.08746719360351562, 0.10256195068359375, 0.11765670776367188, 0.13275146484375, 0.14784622192382812, 0.16294097900390625, 0.17803573608398438, 0.1931304931640625, 0.20822525024414062, 0.22332000732421875, 0.23841476440429688, 0.253509521484375, 0.2686042785644531, 0.28369903564453125, 0.2987937927246094, 0.3138885498046875, 0.3289833068847656, 0.34407806396484375, 0.3591728210449219, 0.374267578125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 8.0, 21.0, 80.0, 201.0, 338.0, 227.0, 89.0, 29.0, 7.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.827905654907227, -4.7148051261901855, -4.6017045974731445, -4.4886040687561035, -4.3755035400390625, -4.26240348815918, -4.149302959442139, -4.036202430725098, -3.9231019020080566, -3.8100013732910156, -3.6969008445739746, -3.5838005542755127, -3.4707000255584717, -3.3575994968414307, -3.2444992065429688, -3.1313986778259277, -3.0182981491088867, -2.9051976203918457, -2.7920970916748047, -2.6789968013763428, -2.5658962726593018, -2.4527957439422607, -2.339695453643799, -2.226594924926758, -2.113494396209717, -2.000393867492676, -1.8872934579849243, -1.7741930484771729, -1.6610925197601318, -1.5479919910430908, -1.4348915815353394, -1.321791172027588, -1.208690881729126, -1.095590353012085, -0.9824899435043335, -0.8693894743919373, -0.756289005279541, -0.6431885361671448, -0.5300880670547485, -0.4169875979423523, -0.30388712882995605, -0.19078665971755981, -0.07768619060516357, 0.035414278507232666, 0.1485147476196289, 0.26161521673202515, 0.3747156858444214, 0.4878161549568176, 0.6009166240692139, 0.7140170931816101, 0.8271175622940063, 0.9402180314064026, 1.0533185005187988, 1.1664190292358398, 1.2795194387435913, 1.3926198482513428, 1.5057203769683838, 1.6188209056854248, 1.7319213151931763, 1.8450217247009277, 1.9581222534179688, 2.0712227821350098, 2.184323310852051, 2.2974236011505127, 2.4105241298675537]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 0.0, 9.0, 7.0, 19.0, 19.0, 25.0, 19.0, 24.0, 25.0, 35.0, 36.0, 63.0, 52.0, 49.0, 59.0, 63.0, 61.0, 60.0, 50.0, 57.0, 43.0, 44.0, 39.0, 32.0, 22.0, 20.0, 14.0, 17.0, 6.0, 8.0, 12.0, 5.0, 3.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.5629534721374512, -1.5217095613479614, -1.4804657697677612, -1.4392218589782715, -1.3979780673980713, -1.3567341566085815, -1.3154903650283813, -1.2742464542388916, -1.2330026626586914, -1.1917587518692017, -1.1505149602890015, -1.1092710494995117, -1.0680272579193115, -1.0267833471298218, -0.9855394959449768, -0.9442956447601318, -0.9030517339706421, -0.8618078827857971, -0.8205640316009521, -0.7793201804161072, -0.7380763292312622, -0.6968324184417725, -0.6555885672569275, -0.6143447160720825, -0.5731008648872375, -0.5318570137023926, -0.4906131625175476, -0.44936928153038025, -0.4081254303455353, -0.3668815791606903, -0.32563769817352295, -0.284393846988678, -0.24314987659454346, -0.2019060254096985, -0.16066215932369232, -0.11941830068826675, -0.07817444205284119, -0.036930590867996216, 0.004313275218009949, 0.04555714130401611, 0.08680099248886108, 0.12804484367370605, 0.16928870975971222, 0.21053257584571838, 0.25177642703056335, 0.2930202782154083, 0.3342641592025757, 0.37550801038742065, 0.4167518615722656, 0.4579957127571106, 0.49923956394195557, 0.5404834151268005, 0.5817272663116455, 0.6229711771011353, 0.6642150282859802, 0.7054588794708252, 0.7467027306556702, 0.7879465818405151, 0.8291904330253601, 0.8704342842102051, 0.9116781949996948, 0.952921986579895, 0.9941658973693848, 1.035409688949585, 1.0766535997390747]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 8.0, 11.0, 26.0, 15.0, 32.0, 59.0, 100.0, 137.0, 200.0, 322.0, 565.0, 1057.0, 1901.0, 4315.0, 11777.0, 41378.0, 195516.0, 531057.0, 197672.0, 41604.0, 11884.0, 4345.0, 2069.0, 1027.0, 552.0, 332.0, 214.0, 119.0, 74.0, 61.0, 36.0, 29.0, 17.0, 12.0, 8.0, 5.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.26953125, -1.2292327880859375, -1.188934326171875, -1.1486358642578125, -1.10833740234375, -1.0680389404296875, -1.027740478515625, -0.9874420166015625, -0.9471435546875, -0.9068450927734375, -0.866546630859375, -0.8262481689453125, -0.78594970703125, -0.7456512451171875, -0.705352783203125, -0.6650543212890625, -0.624755859375, -0.5844573974609375, -0.544158935546875, -0.5038604736328125, -0.46356201171875, -0.4232635498046875, -0.382965087890625, -0.3426666259765625, -0.3023681640625, -0.2620697021484375, -0.221771240234375, -0.1814727783203125, -0.14117431640625, -0.1008758544921875, -0.060577392578125, -0.0202789306640625, 0.02001953125, 0.0603179931640625, 0.100616455078125, 0.1409149169921875, 0.18121337890625, 0.2215118408203125, 0.261810302734375, 0.3021087646484375, 0.3424072265625, 0.3827056884765625, 0.423004150390625, 0.4633026123046875, 0.50360107421875, 0.5438995361328125, 0.584197998046875, 0.6244964599609375, 0.664794921875, 0.7050933837890625, 0.745391845703125, 0.7856903076171875, 0.82598876953125, 0.8662872314453125, 0.906585693359375, 0.9468841552734375, 0.9871826171875, 1.0274810791015625, 1.067779541015625, 1.1080780029296875, 1.14837646484375, 1.1886749267578125, 1.228973388671875, 1.2692718505859375, 1.3095703125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 6.0, 12.0, 17.0, 35.0, 41.0, 50.0, 90.0, 99.0, 104.0, 91.0, 94.0, 92.0, 96.0, 50.0, 46.0, 25.0, 18.0, 8.0, 9.0, 3.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4833984375, -0.46753692626953125, -0.4516754150390625, -0.43581390380859375, -0.419952392578125, -0.40409088134765625, -0.3882293701171875, -0.37236785888671875, -0.35650634765625, -0.34064483642578125, -0.3247833251953125, -0.30892181396484375, -0.293060302734375, -0.27719879150390625, -0.2613372802734375, -0.24547576904296875, -0.2296142578125, -0.21375274658203125, -0.1978912353515625, -0.18202972412109375, -0.166168212890625, -0.15030670166015625, -0.1344451904296875, -0.11858367919921875, -0.10272216796875, -0.08686065673828125, -0.0709991455078125, -0.05513763427734375, -0.039276123046875, -0.02341461181640625, -0.0075531005859375, 0.00830841064453125, 0.024169921875, 0.04003143310546875, 0.0558929443359375, 0.07175445556640625, 0.087615966796875, 0.10347747802734375, 0.1193389892578125, 0.13520050048828125, 0.15106201171875, 0.16692352294921875, 0.1827850341796875, 0.19864654541015625, 0.214508056640625, 0.23036956787109375, 0.2462310791015625, 0.26209259033203125, 0.2779541015625, 0.29381561279296875, 0.3096771240234375, 0.32553863525390625, 0.341400146484375, 0.35726165771484375, 0.3731231689453125, 0.38898468017578125, 0.40484619140625, 0.42070770263671875, 0.4365692138671875, 0.45243072509765625, 0.468292236328125, 0.48415374755859375, 0.5000152587890625, 0.5158767700195312, 0.53173828125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 8.0, 8.0, 9.0, 7.0, 7.0, 13.0, 17.0, 15.0, 24.0, 32.0, 41.0, 61.0, 108.0, 128.0, 154.0, 268.0, 427.0, 658.0, 1195.0, 2192.0, 4243.0, 9144.0, 20972.0, 51501.0, 135686.0, 297678.0, 297325.0, 135332.0, 51710.0, 20680.0, 9098.0, 4341.0, 2251.0, 1194.0, 680.0, 414.0, 265.0, 207.0, 138.0, 81.0, 57.0, 48.0, 40.0, 41.0, 17.0, 15.0, 11.0, 8.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.67236328125, -0.652587890625, -0.6328125, -0.613037109375, -0.59326171875, -0.573486328125, -0.5537109375, -0.533935546875, -0.51416015625, -0.494384765625, -0.474609375, -0.454833984375, -0.43505859375, -0.415283203125, -0.3955078125, -0.375732421875, -0.35595703125, -0.336181640625, -0.31640625, -0.296630859375, -0.27685546875, -0.257080078125, -0.2373046875, -0.217529296875, -0.19775390625, -0.177978515625, -0.158203125, -0.138427734375, -0.11865234375, -0.098876953125, -0.0791015625, -0.059326171875, -0.03955078125, -0.019775390625, 0.0, 0.019775390625, 0.03955078125, 0.059326171875, 0.0791015625, 0.098876953125, 0.11865234375, 0.138427734375, 0.158203125, 0.177978515625, 0.19775390625, 0.217529296875, 0.2373046875, 0.257080078125, 0.27685546875, 0.296630859375, 0.31640625, 0.336181640625, 0.35595703125, 0.375732421875, 0.3955078125, 0.415283203125, 0.43505859375, 0.454833984375, 0.474609375, 0.494384765625, 0.51416015625, 0.533935546875, 0.5537109375, 0.573486328125, 0.59326171875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 7.0, 4.0, 6.0, 3.0, 6.0, 7.0, 13.0, 10.0, 10.0, 20.0, 20.0, 24.0, 35.0, 26.0, 30.0, 25.0, 30.0, 34.0, 37.0, 44.0, 42.0, 39.0, 45.0, 38.0, 36.0, 30.0, 32.0, 38.0, 33.0, 35.0, 32.0, 23.0, 28.0, 27.0, 20.0, 13.0, 12.0, 7.0, 16.0, 12.0, 9.0, 18.0, 8.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.97900390625, -0.9501571655273438, -0.9213104248046875, -0.8924636840820312, -0.863616943359375, -0.8347702026367188, -0.8059234619140625, -0.7770767211914062, -0.74822998046875, -0.7193832397460938, -0.6905364990234375, -0.6616897583007812, -0.632843017578125, -0.6039962768554688, -0.5751495361328125, -0.5463027954101562, -0.5174560546875, -0.48860931396484375, -0.4597625732421875, -0.43091583251953125, -0.402069091796875, -0.37322235107421875, -0.3443756103515625, -0.31552886962890625, -0.28668212890625, -0.25783538818359375, -0.2289886474609375, -0.20014190673828125, -0.171295166015625, -0.14244842529296875, -0.1136016845703125, -0.08475494384765625, -0.055908203125, -0.02706146240234375, 0.0017852783203125, 0.03063201904296875, 0.059478759765625, 0.08832550048828125, 0.1171722412109375, 0.14601898193359375, 0.17486572265625, 0.20371246337890625, 0.2325592041015625, 0.26140594482421875, 0.290252685546875, 0.31909942626953125, 0.3479461669921875, 0.37679290771484375, 0.4056396484375, 0.43448638916015625, 0.4633331298828125, 0.49217987060546875, 0.521026611328125, 0.5498733520507812, 0.5787200927734375, 0.6075668334960938, 0.63641357421875, 0.6652603149414062, 0.6941070556640625, 0.7229537963867188, 0.751800537109375, 0.7806472778320312, 0.8094940185546875, 0.8383407592773438, 0.8671875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 13.0, 19.0, 41.0, 67.0, 139.0, 294.0, 748.0, 1854.0, 5434.0, 20462.0, 107894.0, 539475.0, 305520.0, 49912.0, 11242.0, 3302.0, 1202.0, 485.0, 230.0, 97.0, 51.0, 32.0, 16.0, 13.0, 6.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.37744140625, -0.3655662536621094, -0.35369110107421875, -0.3418159484863281, -0.3299407958984375, -0.3180656433105469, -0.30619049072265625, -0.2943153381347656, -0.282440185546875, -0.2705650329589844, -0.25868988037109375, -0.24681472778320312, -0.2349395751953125, -0.22306442260742188, -0.21118927001953125, -0.19931411743164062, -0.18743896484375, -0.17556381225585938, -0.16368865966796875, -0.15181350708007812, -0.1399383544921875, -0.12806320190429688, -0.11618804931640625, -0.10431289672851562, -0.092437744140625, -0.08056259155273438, -0.06868743896484375, -0.056812286376953125, -0.0449371337890625, -0.033061981201171875, -0.02118682861328125, -0.009311676025390625, 0.0025634765625, 0.014438629150390625, 0.02631378173828125, 0.038188934326171875, 0.0500640869140625, 0.061939239501953125, 0.07381439208984375, 0.08568954467773438, 0.097564697265625, 0.10943984985351562, 0.12131500244140625, 0.13319015502929688, 0.1450653076171875, 0.15694046020507812, 0.16881561279296875, 0.18069076538085938, 0.19256591796875, 0.20444107055664062, 0.21631622314453125, 0.22819137573242188, 0.2400665283203125, 0.2519416809082031, 0.26381683349609375, 0.2756919860839844, 0.287567138671875, 0.2994422912597656, 0.31131744384765625, 0.3231925964355469, 0.3350677490234375, 0.3469429016113281, 0.35881805419921875, 0.3706932067871094, 0.382568359375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 5.0, 2.0, 8.0, 13.0, 11.0, 19.0, 18.0, 30.0, 25.0, 33.0, 59.0, 64.0, 70.0, 82.0, 83.0, 82.0, 87.0, 66.0, 52.0, 47.0, 36.0, 23.0, 15.0, 17.0, 10.0, 11.0, 9.0, 5.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.778406143188477e-05, -7.53914937376976e-05, -7.299892604351044e-05, -7.060635834932327e-05, -6.821379065513611e-05, -6.582122296094894e-05, -6.342865526676178e-05, -6.103608757257462e-05, -5.864351987838745e-05, -5.625095218420029e-05, -5.385838449001312e-05, -5.146581679582596e-05, -4.9073249101638794e-05, -4.668068140745163e-05, -4.4288113713264465e-05, -4.18955460190773e-05, -3.950297832489014e-05, -3.711041063070297e-05, -3.471784293651581e-05, -3.2325275242328644e-05, -2.993270754814148e-05, -2.7540139853954315e-05, -2.514757215976715e-05, -2.2755004465579987e-05, -2.0362436771392822e-05, -1.7969869077205658e-05, -1.5577301383018494e-05, -1.318473368883133e-05, -1.0792165994644165e-05, -8.399598300457e-06, -6.0070306062698364e-06, -3.614462912082672e-06, -1.2218952178955078e-06, 1.1706724762916565e-06, 3.563240170478821e-06, 5.955807864665985e-06, 8.34837555885315e-06, 1.0740943253040314e-05, 1.3133510947227478e-05, 1.5526078641414642e-05, 1.7918646335601807e-05, 2.031121402978897e-05, 2.2703781723976135e-05, 2.50963494181633e-05, 2.7488917112350464e-05, 2.9881484806537628e-05, 3.227405250072479e-05, 3.466662019491196e-05, 3.705918788909912e-05, 3.9451755583286285e-05, 4.184432327747345e-05, 4.4236890971660614e-05, 4.662945866584778e-05, 4.902202636003494e-05, 5.141459405422211e-05, 5.380716174840927e-05, 5.6199729442596436e-05, 5.85922971367836e-05, 6.0984864830970764e-05, 6.337743252515793e-05, 6.577000021934509e-05, 6.816256791353226e-05, 7.055513560771942e-05, 7.294770330190659e-05, 7.534027099609375e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 10.0, 6.0, 15.0, 27.0, 32.0, 47.0, 57.0, 92.0, 132.0, 176.0, 271.0, 482.0, 906.0, 1615.0, 3335.0, 6961.0, 15839.0, 39834.0, 114312.0, 368852.0, 330997.0, 101142.0, 35850.0, 14502.0, 6344.0, 3030.0, 1564.0, 816.0, 470.0, 293.0, 171.0, 115.0, 83.0, 53.0, 30.0, 26.0, 21.0, 10.0, 10.0, 12.0, 2.0, 5.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.248046875, -0.2402820587158203, -0.23251724243164062, -0.22475242614746094, -0.21698760986328125, -0.20922279357910156, -0.20145797729492188, -0.1936931610107422, -0.1859283447265625, -0.1781635284423828, -0.17039871215820312, -0.16263389587402344, -0.15486907958984375, -0.14710426330566406, -0.13933944702148438, -0.1315746307373047, -0.123809814453125, -0.11604499816894531, -0.10828018188476562, -0.10051536560058594, -0.09275054931640625, -0.08498573303222656, -0.07722091674804688, -0.06945610046386719, -0.0616912841796875, -0.05392646789550781, -0.046161651611328125, -0.03839683532714844, -0.03063201904296875, -0.022867202758789062, -0.015102386474609375, -0.0073375701904296875, 0.00042724609375, 0.008192062377929688, 0.015956878662109375, 0.023721694946289062, 0.03148651123046875, 0.03925132751464844, 0.047016143798828125, 0.05478096008300781, 0.0625457763671875, 0.07031059265136719, 0.07807540893554688, 0.08584022521972656, 0.09360504150390625, 0.10136985778808594, 0.10913467407226562, 0.11689949035644531, 0.124664306640625, 0.1324291229248047, 0.14019393920898438, 0.14795875549316406, 0.15572357177734375, 0.16348838806152344, 0.17125320434570312, 0.1790180206298828, 0.1867828369140625, 0.1945476531982422, 0.20231246948242188, 0.21007728576660156, 0.21784210205078125, 0.22560691833496094, 0.23337173461914062, 0.2411365509033203, 0.2489013671875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 7.0, 2.0, 2.0, 7.0, 11.0, 9.0, 13.0, 18.0, 15.0, 30.0, 32.0, 35.0, 54.0, 61.0, 77.0, 83.0, 73.0, 79.0, 88.0, 58.0, 46.0, 39.0, 34.0, 20.0, 20.0, 16.0, 9.0, 3.0, 9.0, 12.0, 9.0, 4.0, 5.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2474365234375, -0.2386608123779297, -0.22988510131835938, -0.22110939025878906, -0.21233367919921875, -0.20355796813964844, -0.19478225708007812, -0.1860065460205078, -0.1772308349609375, -0.1684551239013672, -0.15967941284179688, -0.15090370178222656, -0.14212799072265625, -0.13335227966308594, -0.12457656860351562, -0.11580085754394531, -0.107025146484375, -0.09824943542480469, -0.08947372436523438, -0.08069801330566406, -0.07192230224609375, -0.06314659118652344, -0.054370880126953125, -0.04559516906738281, -0.0368194580078125, -0.028043746948242188, -0.019268035888671875, -0.010492324829101562, -0.00171661376953125, 0.0070590972900390625, 0.015834808349609375, 0.024610519409179688, 0.03338623046875, 0.04216194152832031, 0.050937652587890625, 0.05971336364746094, 0.06848907470703125, 0.07726478576660156, 0.08604049682617188, 0.09481620788574219, 0.1035919189453125, 0.11236763000488281, 0.12114334106445312, 0.12991905212402344, 0.13869476318359375, 0.14747047424316406, 0.15624618530273438, 0.1650218963623047, 0.173797607421875, 0.1825733184814453, 0.19134902954101562, 0.20012474060058594, 0.20890045166015625, 0.21767616271972656, 0.22645187377929688, 0.2352275848388672, 0.2440032958984375, 0.2527790069580078, 0.2615547180175781, 0.27033042907714844, 0.27910614013671875, 0.28788185119628906, 0.2966575622558594, 0.3054332733154297, 0.314208984375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 17.0, 13.0, 28.0, 22.0, 43.0, 67.0, 119.0, 131.0, 145.0, 138.0, 111.0, 63.0, 40.0, 15.0, 20.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.768758773803711, -7.572025775909424, -7.375293254852295, -7.178560256958008, -6.981827259063721, -6.785094261169434, -6.588361740112305, -6.391628742218018, -6.1948957443237305, -5.998162746429443, -5.8014302253723145, -5.604697227478027, -5.40796422958374, -5.211231231689453, -5.014498710632324, -4.817765712738037, -4.62103271484375, -4.424299716949463, -4.227567195892334, -4.030834197998047, -3.8341012001037598, -3.6373684406280518, -3.4406356811523438, -3.2439026832580566, -3.0471701622009277, -2.8504374027252197, -2.6537044048309326, -2.4569716453552246, -2.2602386474609375, -2.0635058879852295, -1.866773009300232, -1.6700401306152344, -1.4733071327209473, -1.2765742540359497, -1.0798413753509521, -0.8831085562705994, -0.6863756775856018, -0.48964279890060425, -0.29290997982025146, -0.0961771011352539, 0.10055577754974365, 0.2972886562347412, 0.4940215051174164, 0.6907543540000916, 0.8874872326850891, 1.0842201709747314, 1.2809529304504395, 1.477685809135437, 1.6744186878204346, 1.8711515665054321, 2.0678844451904297, 2.2646172046661377, 2.461350202560425, 2.658082962036133, 2.85481595993042, 3.051548719406128, 3.248281478881836, 3.445014238357544, 3.641747236251831, 3.838479995727539, 4.035212993621826, 4.231945991516113, 4.428678512573242, 4.625411510467529, 4.822144508361816]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 6.0, 5.0, 2.0, 8.0, 5.0, 9.0, 5.0, 10.0, 14.0, 14.0, 13.0, 10.0, 23.0, 38.0, 31.0, 39.0, 43.0, 37.0, 50.0, 57.0, 49.0, 34.0, 45.0, 42.0, 47.0, 25.0, 39.0, 33.0, 35.0, 24.0, 30.0, 22.0, 26.0, 22.0, 24.0, 19.0, 13.0, 11.0, 10.0, 9.0, 5.0, 8.0, 5.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.620201110839844, -5.441276550292969, -5.2623515129089355, -5.083426475524902, -4.904501914978027, -4.725577354431152, -4.546652317047119, -4.367727279663086, -4.188802719116211, -4.009878158569336, -3.8309531211853027, -3.6520283222198486, -3.4731035232543945, -3.2941787242889404, -3.1152539253234863, -2.9363291263580322, -2.757404327392578, -2.578479528427124, -2.39955472946167, -2.220629930496216, -2.0417051315307617, -1.8627803325653076, -1.6838555335998535, -1.5049307346343994, -1.3260059356689453, -1.1470811367034912, -0.9681563377380371, -0.789231538772583, -0.6103067398071289, -0.4313819408416748, -0.2524571418762207, -0.0735323429107666, 0.1053929328918457, 0.2843177318572998, 0.4632425308227539, 0.642167329788208, 0.8210921287536621, 1.0000169277191162, 1.1789417266845703, 1.3578665256500244, 1.5367913246154785, 1.7157161235809326, 1.8946409225463867, 2.073565721511841, 2.252490520477295, 2.431415319442749, 2.610340118408203, 2.7892649173736572, 2.9681897163391113, 3.1471145153045654, 3.3260393142700195, 3.5049641132354736, 3.6838889122009277, 3.862813711166382, 4.041738510131836, 4.220663070678711, 4.399588108062744, 4.578513145446777, 4.757437705993652, 4.936362266540527, 5.1152873039245605, 5.294212341308594, 5.473136901855469, 5.652061462402344, 5.830986499786377]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 2.0, 13.0, 12.0, 15.0, 17.0, 24.0, 32.0, 54.0, 95.0, 157.0, 298.0, 544.0, 1137.0, 2696.0, 9044.0, 60493.0, 3884773.0, 210690.0, 16464.0, 4276.0, 1650.0, 741.0, 389.0, 281.0, 126.0, 78.0, 54.0, 37.0, 22.0, 14.0, 11.0, 7.0, 6.0, 8.0, 4.0, 2.0, 5.0, 2.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2490234375, -1.20391845703125, -1.1588134765625, -1.11370849609375, -1.068603515625, -1.02349853515625, -0.9783935546875, -0.93328857421875, -0.88818359375, -0.84307861328125, -0.7979736328125, -0.75286865234375, -0.707763671875, -0.66265869140625, -0.6175537109375, -0.57244873046875, -0.52734375, -0.48223876953125, -0.4371337890625, -0.39202880859375, -0.346923828125, -0.30181884765625, -0.2567138671875, -0.21160888671875, -0.16650390625, -0.12139892578125, -0.0762939453125, -0.03118896484375, 0.013916015625, 0.05902099609375, 0.1041259765625, 0.14923095703125, 0.1943359375, 0.23944091796875, 0.2845458984375, 0.32965087890625, 0.374755859375, 0.41986083984375, 0.4649658203125, 0.51007080078125, 0.55517578125, 0.60028076171875, 0.6453857421875, 0.69049072265625, 0.735595703125, 0.78070068359375, 0.8258056640625, 0.87091064453125, 0.916015625, 0.96112060546875, 1.0062255859375, 1.05133056640625, 1.096435546875, 1.14154052734375, 1.1866455078125, 1.23175048828125, 1.27685546875, 1.32196044921875, 1.3670654296875, 1.41217041015625, 1.457275390625, 1.50238037109375, 1.5474853515625, 1.59259033203125, 1.6376953125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 9.0, 18.0, 20.0, 34.0, 58.0, 56.0, 80.0, 85.0, 111.0, 91.0, 85.0, 93.0, 68.0, 64.0, 51.0, 22.0, 17.0, 15.0, 5.0, 6.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.499267578125, -0.4828453063964844, -0.46642303466796875, -0.4500007629394531, -0.4335784912109375, -0.4171562194824219, -0.40073394775390625, -0.3843116760253906, -0.367889404296875, -0.3514671325683594, -0.33504486083984375, -0.3186225891113281, -0.3022003173828125, -0.2857780456542969, -0.26935577392578125, -0.2529335021972656, -0.23651123046875, -0.22008895874023438, -0.20366668701171875, -0.18724441528320312, -0.1708221435546875, -0.15439987182617188, -0.13797760009765625, -0.12155532836914062, -0.105133056640625, -0.08871078491210938, -0.07228851318359375, -0.055866241455078125, -0.0394439697265625, -0.023021697998046875, -0.00659942626953125, 0.009822845458984375, 0.0262451171875, 0.042667388916015625, 0.05908966064453125, 0.07551193237304688, 0.0919342041015625, 0.10835647583007812, 0.12477874755859375, 0.14120101928710938, 0.157623291015625, 0.17404556274414062, 0.19046783447265625, 0.20689010620117188, 0.2233123779296875, 0.23973464965820312, 0.25615692138671875, 0.2725791931152344, 0.28900146484375, 0.3054237365722656, 0.32184600830078125, 0.3382682800292969, 0.3546905517578125, 0.3711128234863281, 0.38753509521484375, 0.4039573669433594, 0.420379638671875, 0.4368019104003906, 0.45322418212890625, 0.4696464538574219, 0.4860687255859375, 0.5024909973144531, 0.5189132690429688, 0.5353355407714844, 0.5517578125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 13.0, 23.0, 27.0, 32.0, 48.0, 87.0, 118.0, 199.0, 309.0, 525.0, 848.0, 1563.0, 2918.0, 6324.0, 15766.0, 55889.0, 430395.0, 3308825.0, 297274.0, 46346.0, 14282.0, 5778.0, 2804.0, 1512.0, 878.0, 526.0, 348.0, 206.0, 131.0, 80.0, 56.0, 44.0, 32.0, 16.0, 14.0, 8.0, 12.0, 4.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.6220703125, -0.6034622192382812, -0.5848541259765625, -0.5662460327148438, -0.547637939453125, -0.5290298461914062, -0.5104217529296875, -0.49181365966796875, -0.47320556640625, -0.45459747314453125, -0.4359893798828125, -0.41738128662109375, -0.398773193359375, -0.38016510009765625, -0.3615570068359375, -0.34294891357421875, -0.3243408203125, -0.30573272705078125, -0.2871246337890625, -0.26851654052734375, -0.249908447265625, -0.23130035400390625, -0.2126922607421875, -0.19408416748046875, -0.17547607421875, -0.15686798095703125, -0.1382598876953125, -0.11965179443359375, -0.101043701171875, -0.08243560791015625, -0.0638275146484375, -0.04521942138671875, -0.026611328125, -0.00800323486328125, 0.0106048583984375, 0.02921295166015625, 0.047821044921875, 0.06642913818359375, 0.0850372314453125, 0.10364532470703125, 0.12225341796875, 0.14086151123046875, 0.1594696044921875, 0.17807769775390625, 0.196685791015625, 0.21529388427734375, 0.2339019775390625, 0.25251007080078125, 0.2711181640625, 0.28972625732421875, 0.3083343505859375, 0.32694244384765625, 0.345550537109375, 0.36415863037109375, 0.3827667236328125, 0.40137481689453125, 0.41998291015625, 0.43859100341796875, 0.4571990966796875, 0.47580718994140625, 0.494415283203125, 0.5130233764648438, 0.5316314697265625, 0.5502395629882812, 0.56884765625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 5.0, 7.0, 8.0, 8.0, 14.0, 23.0, 34.0, 54.0, 116.0, 310.0, 1007.0, 1591.0, 463.0, 178.0, 101.0, 39.0, 28.0, 24.0, 14.0, 13.0, 4.0, 6.0, 4.0, 2.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.40625, -0.3923377990722656, -0.37842559814453125, -0.3645133972167969, -0.3506011962890625, -0.3366889953613281, -0.32277679443359375, -0.3088645935058594, -0.294952392578125, -0.2810401916503906, -0.26712799072265625, -0.2532157897949219, -0.2393035888671875, -0.22539138793945312, -0.21147918701171875, -0.19756698608398438, -0.18365478515625, -0.16974258422851562, -0.15583038330078125, -0.14191818237304688, -0.1280059814453125, -0.11409378051757812, -0.10018157958984375, -0.08626937866210938, -0.072357177734375, -0.058444976806640625, -0.04453277587890625, -0.030620574951171875, -0.0167083740234375, -0.002796173095703125, 0.01111602783203125, 0.025028228759765625, 0.0389404296875, 0.052852630615234375, 0.06676483154296875, 0.08067703247070312, 0.0945892333984375, 0.10850143432617188, 0.12241363525390625, 0.13632583618164062, 0.150238037109375, 0.16415023803710938, 0.17806243896484375, 0.19197463989257812, 0.2058868408203125, 0.21979904174804688, 0.23371124267578125, 0.24762344360351562, 0.26153564453125, 0.2754478454589844, 0.28936004638671875, 0.3032722473144531, 0.3171844482421875, 0.3310966491699219, 0.34500885009765625, 0.3589210510253906, 0.372833251953125, 0.3867454528808594, 0.40065765380859375, 0.4145698547363281, 0.4284820556640625, 0.4423942565917969, 0.45630645751953125, 0.4702186584472656, 0.484130859375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 17.0, 43.0, 114.0, 211.0, 258.0, 182.0, 102.0, 35.0, 21.0, 12.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4974539279937744, -2.3937904834747314, -2.2901270389556885, -2.1864633560180664, -2.0827999114990234, -1.9791364669799805, -1.8754730224609375, -1.7718095779418945, -1.668146014213562, -1.564482569694519, -1.4608190059661865, -1.3571555614471436, -1.2534921169281006, -1.149828553199768, -1.046165108680725, -0.9425016045570374, -0.8388381004333496, -0.7351745963096619, -0.6315110921859741, -0.5278476476669312, -0.4241841435432434, -0.32052063941955566, -0.2168571949005127, -0.11319369077682495, -0.009530186653137207, 0.09413330256938934, 0.1977967917919159, 0.30146026611328125, 0.405123770236969, 0.5087872743606567, 0.6124507188796997, 0.7161142230033875, 0.8197779655456543, 0.923441469669342, 1.0271049737930298, 1.1307684183120728, 1.2344319820404053, 1.3380954265594482, 1.4417588710784912, 1.5454223155975342, 1.6490858793258667, 1.7527493238449097, 1.8564128875732422, 1.9600763320922852, 2.063739776611328, 2.167403221130371, 2.271066665649414, 2.374730348587036, 2.478393793106079, 2.582057237625122, 2.685720682144165, 2.789384365081787, 2.89304780960083, 2.996711254119873, 3.100374698638916, 3.204038143157959, 3.307701587677002, 3.411365032196045, 3.515028476715088, 3.618691921234131, 3.722355604171753, 3.826019048690796, 3.929682493209839, 4.033346176147461, 4.137009620666504]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 9.0, 13.0, 12.0, 16.0, 14.0, 27.0, 29.0, 26.0, 41.0, 46.0, 55.0, 63.0, 55.0, 69.0, 73.0, 66.0, 61.0, 48.0, 62.0, 47.0, 45.0, 31.0, 29.0, 18.0, 12.0, 12.0, 10.0, 10.0, 4.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1707916259765625, -2.112978219985962, -2.0551648139953613, -1.9973512887954712, -1.939537763595581, -1.8817243576049805, -1.8239109516143799, -1.7660974264144897, -1.7082839012145996, -1.650470495223999, -1.5926569700241089, -1.5348435640335083, -1.4770300388336182, -1.4192166328430176, -1.361403226852417, -1.3035897016525269, -1.2457762956619263, -1.1879628896713257, -1.1301493644714355, -1.072335958480835, -1.0145224332809448, -0.9567090272903442, -0.8988955616950989, -0.8410820960998535, -0.7832686305046082, -0.7254551649093628, -0.6676416993141174, -0.6098282337188721, -0.5520148277282715, -0.49420133233070374, -0.43638789653778076, -0.3785744309425354, -0.3207608461380005, -0.2629473805427551, -0.20513392984867096, -0.1473204791545868, -0.08950701355934143, -0.03169354796409607, 0.026119887828826904, 0.08393335342407227, 0.14174681901931763, 0.199560284614563, 0.25737375020980835, 0.3151871860027313, 0.3730006515979767, 0.43081411719322205, 0.488627552986145, 0.5464410185813904, 0.6042544841766357, 0.6620679497718811, 0.7198814153671265, 0.777694821357727, 0.8355083465576172, 0.8933217525482178, 0.9511352181434631, 1.0089486837387085, 1.0667622089385986, 1.1245756149291992, 1.1823891401290894, 1.24020254611969, 1.29801607131958, 1.3558294773101807, 1.4136428833007812, 1.4714564085006714, 1.529269814491272]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 8.0, 17.0, 28.0, 24.0, 51.0, 71.0, 150.0, 243.0, 432.0, 721.0, 1536.0, 3357.0, 10034.0, 41546.0, 271481.0, 587747.0, 101346.0, 19377.0, 5763.0, 2197.0, 1072.0, 573.0, 310.0, 175.0, 81.0, 72.0, 36.0, 28.0, 26.0, 13.0, 13.0, 4.0, 6.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2421875, -1.1997222900390625, -1.157257080078125, -1.1147918701171875, -1.07232666015625, -1.0298614501953125, -0.987396240234375, -0.9449310302734375, -0.9024658203125, -0.8600006103515625, -0.817535400390625, -0.7750701904296875, -0.73260498046875, -0.6901397705078125, -0.647674560546875, -0.6052093505859375, -0.562744140625, -0.5202789306640625, -0.477813720703125, -0.4353485107421875, -0.39288330078125, -0.3504180908203125, -0.307952880859375, -0.2654876708984375, -0.2230224609375, -0.1805572509765625, -0.138092041015625, -0.0956268310546875, -0.05316162109375, -0.0106964111328125, 0.031768798828125, 0.0742340087890625, 0.11669921875, 0.1591644287109375, 0.201629638671875, 0.2440948486328125, 0.28656005859375, 0.3290252685546875, 0.371490478515625, 0.4139556884765625, 0.4564208984375, 0.4988861083984375, 0.541351318359375, 0.5838165283203125, 0.62628173828125, 0.6687469482421875, 0.711212158203125, 0.7536773681640625, 0.796142578125, 0.8386077880859375, 0.881072998046875, 0.9235382080078125, 0.96600341796875, 1.0084686279296875, 1.050933837890625, 1.0933990478515625, 1.1358642578125, 1.1783294677734375, 1.220794677734375, 1.2632598876953125, 1.30572509765625, 1.3481903076171875, 1.390655517578125, 1.4331207275390625, 1.4755859375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 4.0, 4.0, 2.0, 12.0, 23.0, 30.0, 42.0, 44.0, 64.0, 96.0, 95.0, 93.0, 98.0, 72.0, 83.0, 67.0, 60.0, 42.0, 24.0, 12.0, 11.0, 6.0, 9.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.491455078125, -0.4761009216308594, -0.46074676513671875, -0.4453926086425781, -0.4300384521484375, -0.4146842956542969, -0.39933013916015625, -0.3839759826660156, -0.368621826171875, -0.3532676696777344, -0.33791351318359375, -0.3225593566894531, -0.3072052001953125, -0.2918510437011719, -0.27649688720703125, -0.2611427307128906, -0.24578857421875, -0.23043441772460938, -0.21508026123046875, -0.19972610473632812, -0.1843719482421875, -0.16901779174804688, -0.15366363525390625, -0.13830947875976562, -0.122955322265625, -0.10760116577148438, -0.09224700927734375, -0.07689285278320312, -0.0615386962890625, -0.046184539794921875, -0.03083038330078125, -0.015476226806640625, -0.0001220703125, 0.015232086181640625, 0.03058624267578125, 0.045940399169921875, 0.0612945556640625, 0.07664871215820312, 0.09200286865234375, 0.10735702514648438, 0.122711181640625, 0.13806533813476562, 0.15341949462890625, 0.16877365112304688, 0.1841278076171875, 0.19948196411132812, 0.21483612060546875, 0.23019027709960938, 0.24554443359375, 0.2608985900878906, 0.27625274658203125, 0.2916069030761719, 0.3069610595703125, 0.3223152160644531, 0.33766937255859375, 0.3530235290527344, 0.368377685546875, 0.3837318420410156, 0.39908599853515625, 0.4144401550292969, 0.4297943115234375, 0.4451484680175781, 0.46050262451171875, 0.4758567810058594, 0.4912109375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 7.0, 12.0, 12.0, 23.0, 17.0, 44.0, 44.0, 68.0, 118.0, 170.0, 309.0, 550.0, 1101.0, 2404.0, 6756.0, 24675.0, 122458.0, 559619.0, 263984.0, 47824.0, 11436.0, 3664.0, 1511.0, 724.0, 366.0, 230.0, 119.0, 101.0, 64.0, 37.0, 25.0, 29.0, 14.0, 7.0, 7.0, 5.0, 5.0, 6.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1083984375, -1.0755233764648438, -1.0426483154296875, -1.0097732543945312, -0.976898193359375, -0.9440231323242188, -0.9111480712890625, -0.8782730102539062, -0.84539794921875, -0.8125228881835938, -0.7796478271484375, -0.7467727661132812, -0.713897705078125, -0.6810226440429688, -0.6481475830078125, -0.6152725219726562, -0.5823974609375, -0.5495223999023438, -0.5166473388671875, -0.48377227783203125, -0.450897216796875, -0.41802215576171875, -0.3851470947265625, -0.35227203369140625, -0.31939697265625, -0.28652191162109375, -0.2536468505859375, -0.22077178955078125, -0.187896728515625, -0.15502166748046875, -0.1221466064453125, -0.08927154541015625, -0.056396484375, -0.02352142333984375, 0.0093536376953125, 0.04222869873046875, 0.075103759765625, 0.10797882080078125, 0.1408538818359375, 0.17372894287109375, 0.20660400390625, 0.23947906494140625, 0.2723541259765625, 0.30522918701171875, 0.338104248046875, 0.37097930908203125, 0.4038543701171875, 0.43672943115234375, 0.4696044921875, 0.5024795532226562, 0.5353546142578125, 0.5682296752929688, 0.601104736328125, 0.6339797973632812, 0.6668548583984375, 0.6997299194335938, 0.73260498046875, 0.7654800415039062, 0.7983551025390625, 0.8312301635742188, 0.864105224609375, 0.8969802856445312, 0.9298553466796875, 0.9627304077148438, 0.99560546875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 8.0, 10.0, 12.0, 11.0, 14.0, 17.0, 30.0, 23.0, 35.0, 37.0, 52.0, 41.0, 59.0, 46.0, 64.0, 46.0, 58.0, 61.0, 54.0, 47.0, 33.0, 48.0, 36.0, 19.0, 33.0, 22.0, 25.0, 11.0, 8.0, 10.0, 8.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1865234375, -1.1474761962890625, -1.108428955078125, -1.0693817138671875, -1.03033447265625, -0.9912872314453125, -0.952239990234375, -0.9131927490234375, -0.8741455078125, -0.8350982666015625, -0.796051025390625, -0.7570037841796875, -0.71795654296875, -0.6789093017578125, -0.639862060546875, -0.6008148193359375, -0.561767578125, -0.5227203369140625, -0.483673095703125, -0.4446258544921875, -0.40557861328125, -0.3665313720703125, -0.327484130859375, -0.2884368896484375, -0.2493896484375, -0.2103424072265625, -0.171295166015625, -0.1322479248046875, -0.09320068359375, -0.0541534423828125, -0.015106201171875, 0.0239410400390625, 0.06298828125, 0.1020355224609375, 0.141082763671875, 0.1801300048828125, 0.21917724609375, 0.2582244873046875, 0.297271728515625, 0.3363189697265625, 0.3753662109375, 0.4144134521484375, 0.453460693359375, 0.4925079345703125, 0.53155517578125, 0.5706024169921875, 0.609649658203125, 0.6486968994140625, 0.687744140625, 0.7267913818359375, 0.765838623046875, 0.8048858642578125, 0.84393310546875, 0.8829803466796875, 0.922027587890625, 0.9610748291015625, 1.0001220703125, 1.0391693115234375, 1.078216552734375, 1.1172637939453125, 1.15631103515625, 1.1953582763671875, 1.234405517578125, 1.2734527587890625, 1.3125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 0.0, 5.0, 8.0, 4.0, 8.0, 14.0, 18.0, 24.0, 40.0, 62.0, 124.0, 221.0, 419.0, 1022.0, 3095.0, 12642.0, 67939.0, 629107.0, 286988.0, 35933.0, 7343.0, 2105.0, 692.0, 324.0, 164.0, 86.0, 67.0, 31.0, 27.0, 9.0, 11.0, 7.0, 5.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.394775390625, -0.3834381103515625, -0.372100830078125, -0.3607635498046875, -0.34942626953125, -0.3380889892578125, -0.326751708984375, -0.3154144287109375, -0.3040771484375, -0.2927398681640625, -0.281402587890625, -0.2700653076171875, -0.25872802734375, -0.2473907470703125, -0.236053466796875, -0.2247161865234375, -0.21337890625, -0.2020416259765625, -0.190704345703125, -0.1793670654296875, -0.16802978515625, -0.1566925048828125, -0.145355224609375, -0.1340179443359375, -0.1226806640625, -0.1113433837890625, -0.100006103515625, -0.0886688232421875, -0.07733154296875, -0.0659942626953125, -0.054656982421875, -0.0433197021484375, -0.031982421875, -0.0206451416015625, -0.009307861328125, 0.0020294189453125, 0.01336669921875, 0.0247039794921875, 0.036041259765625, 0.0473785400390625, 0.0587158203125, 0.0700531005859375, 0.081390380859375, 0.0927276611328125, 0.10406494140625, 0.1154022216796875, 0.126739501953125, 0.1380767822265625, 0.1494140625, 0.1607513427734375, 0.172088623046875, 0.1834259033203125, 0.19476318359375, 0.2061004638671875, 0.217437744140625, 0.2287750244140625, 0.2401123046875, 0.2514495849609375, 0.262786865234375, 0.2741241455078125, 0.28546142578125, 0.2967987060546875, 0.308135986328125, 0.3194732666015625, 0.330810546875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 2.0, 7.0, 9.0, 7.0, 3.0, 10.0, 20.0, 16.0, 27.0, 53.0, 95.0, 109.0, 145.0, 142.0, 120.0, 81.0, 51.0, 20.0, 24.0, 18.0, 15.0, 7.0, 3.0, 9.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001348257064819336, -0.00013136956840753555, -0.0001279134303331375, -0.00012445729225873947, -0.00012100115418434143, -0.00011754501610994339, -0.00011408887803554535, -0.00011063273996114731, -0.00010717660188674927, -0.00010372046381235123, -0.00010026432573795319, -9.680818766355515e-05, -9.33520495891571e-05, -8.989591151475906e-05, -8.643977344036102e-05, -8.298363536596298e-05, -7.952749729156494e-05, -7.60713592171669e-05, -7.261522114276886e-05, -6.915908306837082e-05, -6.570294499397278e-05, -6.224680691957474e-05, -5.87906688451767e-05, -5.5334530770778656e-05, -5.1878392696380615e-05, -4.8422254621982574e-05, -4.4966116547584534e-05, -4.150997847318649e-05, -3.805384039878845e-05, -3.459770232439041e-05, -3.114156424999237e-05, -2.768542617559433e-05, -2.422928810119629e-05, -2.0773150026798248e-05, -1.7317011952400208e-05, -1.3860873878002167e-05, -1.0404735803604126e-05, -6.948597729206085e-06, -3.4924596548080444e-06, -3.632158041000366e-08, 3.419816493988037e-06, 6.875954568386078e-06, 1.0332092642784119e-05, 1.378823071718216e-05, 1.72443687915802e-05, 2.070050686597824e-05, 2.4156644940376282e-05, 2.7612783014774323e-05, 3.106892108917236e-05, 3.4525059163570404e-05, 3.7981197237968445e-05, 4.1437335312366486e-05, 4.4893473386764526e-05, 4.834961146116257e-05, 5.180574953556061e-05, 5.526188760995865e-05, 5.871802568435669e-05, 6.217416375875473e-05, 6.563030183315277e-05, 6.908643990755081e-05, 7.254257798194885e-05, 7.59987160563469e-05, 7.945485413074493e-05, 8.291099220514297e-05, 8.636713027954102e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 4.0, 3.0, 4.0, 2.0, 6.0, 12.0, 11.0, 24.0, 32.0, 35.0, 66.0, 90.0, 139.0, 245.0, 401.0, 863.0, 2036.0, 5794.0, 20848.0, 90542.0, 639298.0, 230534.0, 41587.0, 10125.0, 3133.0, 1285.0, 619.0, 299.0, 178.0, 124.0, 75.0, 53.0, 26.0, 13.0, 14.0, 18.0, 10.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.381103515625, -0.3707313537597656, -0.36035919189453125, -0.3499870300292969, -0.3396148681640625, -0.3292427062988281, -0.31887054443359375, -0.3084983825683594, -0.298126220703125, -0.2877540588378906, -0.27738189697265625, -0.2670097351074219, -0.2566375732421875, -0.24626541137695312, -0.23589324951171875, -0.22552108764648438, -0.21514892578125, -0.20477676391601562, -0.19440460205078125, -0.18403244018554688, -0.1736602783203125, -0.16328811645507812, -0.15291595458984375, -0.14254379272460938, -0.132171630859375, -0.12179946899414062, -0.11142730712890625, -0.10105514526367188, -0.0906829833984375, -0.08031082153320312, -0.06993865966796875, -0.059566497802734375, -0.0491943359375, -0.038822174072265625, -0.02845001220703125, -0.018077850341796875, -0.0077056884765625, 0.002666473388671875, 0.01303863525390625, 0.023410797119140625, 0.033782958984375, 0.044155120849609375, 0.05452728271484375, 0.06489944458007812, 0.0752716064453125, 0.08564376831054688, 0.09601593017578125, 0.10638809204101562, 0.11676025390625, 0.12713241577148438, 0.13750457763671875, 0.14787673950195312, 0.1582489013671875, 0.16862106323242188, 0.17899322509765625, 0.18936538696289062, 0.199737548828125, 0.21010971069335938, 0.22048187255859375, 0.23085403442382812, 0.2412261962890625, 0.2515983581542969, 0.26197052001953125, 0.2723426818847656, 0.28271484375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 2.0, 10.0, 5.0, 9.0, 21.0, 18.0, 22.0, 35.0, 44.0, 81.0, 94.0, 102.0, 120.0, 116.0, 105.0, 40.0, 42.0, 33.0, 23.0, 21.0, 9.0, 14.0, 5.0, 7.0, 5.0, 3.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32958984375, -0.3194770812988281, -0.30936431884765625, -0.2992515563964844, -0.2891387939453125, -0.2790260314941406, -0.26891326904296875, -0.2588005065917969, -0.248687744140625, -0.23857498168945312, -0.22846221923828125, -0.21834945678710938, -0.2082366943359375, -0.19812393188476562, -0.18801116943359375, -0.17789840698242188, -0.16778564453125, -0.15767288208007812, -0.14756011962890625, -0.13744735717773438, -0.1273345947265625, -0.11722183227539062, -0.10710906982421875, -0.09699630737304688, -0.086883544921875, -0.07677078247070312, -0.06665802001953125, -0.056545257568359375, -0.0464324951171875, -0.036319732666015625, -0.02620697021484375, -0.016094207763671875, -0.0059814453125, 0.004131317138671875, 0.01424407958984375, 0.024356842041015625, 0.0344696044921875, 0.044582366943359375, 0.05469512939453125, 0.06480789184570312, 0.074920654296875, 0.08503341674804688, 0.09514617919921875, 0.10525894165039062, 0.1153717041015625, 0.12548446655273438, 0.13559722900390625, 0.14570999145507812, 0.15582275390625, 0.16593551635742188, 0.17604827880859375, 0.18616104125976562, 0.1962738037109375, 0.20638656616210938, 0.21649932861328125, 0.22661209106445312, 0.236724853515625, 0.24683761596679688, 0.25695037841796875, 0.2670631408691406, 0.2771759033203125, 0.2872886657714844, 0.29740142822265625, 0.3075141906738281, 0.317626953125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 8.0, 30.0, 81.0, 270.0, 409.0, 163.0, 30.0, 14.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-27.737422943115234, -27.2174015045166, -26.69738006591797, -26.177358627319336, -25.657337188720703, -25.13731575012207, -24.617294311523438, -24.097274780273438, -23.577251434326172, -23.05722999572754, -22.537208557128906, -22.017187118530273, -21.49716567993164, -20.977144241333008, -20.457122802734375, -19.937103271484375, -19.417081832885742, -18.89706039428711, -18.377038955688477, -17.857017517089844, -17.33699607849121, -16.816974639892578, -16.296953201293945, -15.776932716369629, -15.256911277770996, -14.736889839172363, -14.21686840057373, -13.696846961975098, -13.176826477050781, -12.656805038452148, -12.136783599853516, -11.616762161254883, -11.096741676330566, -10.576720237731934, -10.0566987991333, -9.536677360534668, -9.016656875610352, -8.496635437011719, -7.976613998413086, -7.456592559814453, -6.93657112121582, -6.4165496826171875, -5.896528244018555, -5.37650728225708, -4.856485843658447, -4.3364644050598145, -3.8164432048797607, -3.296422004699707, -2.776400566101074, -2.2563791275024414, -1.7363579273223877, -1.2163366079330444, -0.6963152885437012, -0.17629384994506836, 0.34372735023498535, 0.8637485504150391, 1.3837699890136719, 1.9037913084030151, 2.4238126277923584, 2.943833827972412, 3.463855266571045, 3.9838767051696777, 4.503897666931152, 5.023919105529785, 5.543940544128418]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 7.0, 8.0, 5.0, 9.0, 6.0, 15.0, 13.0, 19.0, 20.0, 19.0, 27.0, 34.0, 25.0, 28.0, 36.0, 37.0, 50.0, 41.0, 51.0, 53.0, 49.0, 33.0, 41.0, 31.0, 43.0, 35.0, 23.0, 43.0, 34.0, 27.0, 24.0, 14.0, 17.0, 18.0, 11.0, 15.0, 14.0, 5.0, 5.0, 3.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.519078254699707, -5.355840682983398, -5.192602634429932, -5.029365062713623, -4.866127014160156, -4.702889442443848, -4.539651870727539, -4.3764142990112305, -4.213176250457764, -4.049938678741455, -3.8867006301879883, -3.7234630584716797, -3.560225248336792, -3.3969874382019043, -3.2337498664855957, -3.070512056350708, -2.9072742462158203, -2.7440364360809326, -2.580798625946045, -2.4175610542297363, -2.2543232440948486, -2.091085433959961, -1.9278477430343628, -1.7646100521087646, -1.601372241973877, -1.4381344318389893, -1.2748967409133911, -1.111659049987793, -0.9484212398529053, -0.7851834893226624, -0.6219457387924194, -0.4587080478668213, -0.2954697608947754, -0.13223201036453247, 0.03100574016571045, 0.19424349069595337, 0.3574812412261963, 0.5207189917564392, 0.6839567422866821, 0.8471944332122803, 1.010432243347168, 1.1736700534820557, 1.3369077444076538, 1.500145435333252, 1.6633832454681396, 1.8266210556030273, 1.9898587465286255, 2.1530964374542236, 2.3163342475891113, 2.479572057723999, 2.6428098678588867, 2.8060474395751953, 2.969285249710083, 3.1325230598449707, 3.2957606315612793, 3.458998441696167, 3.6222362518310547, 3.7854740619659424, 3.94871187210083, 4.111949443817139, 4.2751874923706055, 4.438425064086914, 4.601662635803223, 4.764900207519531, 4.928138256072998]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 11.0, 13.0, 25.0, 49.0, 64.0, 123.0, 189.0, 401.0, 932.0, 2781.0, 10056.0, 71460.0, 3955443.0, 132917.0, 13743.0, 3645.0, 1200.0, 535.0, 296.0, 158.0, 80.0, 58.0, 41.0, 25.0, 7.0, 11.0, 6.0, 6.0, 5.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3486328125, -1.303070068359375, -1.25750732421875, -1.211944580078125, -1.1663818359375, -1.120819091796875, -1.07525634765625, -1.029693603515625, -0.984130859375, -0.938568115234375, -0.89300537109375, -0.847442626953125, -0.8018798828125, -0.756317138671875, -0.71075439453125, -0.665191650390625, -0.61962890625, -0.574066162109375, -0.52850341796875, -0.482940673828125, -0.4373779296875, -0.391815185546875, -0.34625244140625, -0.300689697265625, -0.255126953125, -0.209564208984375, -0.16400146484375, -0.118438720703125, -0.0728759765625, -0.027313232421875, 0.01824951171875, 0.063812255859375, 0.109375, 0.154937744140625, 0.20050048828125, 0.246063232421875, 0.2916259765625, 0.337188720703125, 0.38275146484375, 0.428314208984375, 0.473876953125, 0.519439697265625, 0.56500244140625, 0.610565185546875, 0.6561279296875, 0.701690673828125, 0.74725341796875, 0.792816162109375, 0.83837890625, 0.883941650390625, 0.92950439453125, 0.975067138671875, 1.0206298828125, 1.066192626953125, 1.11175537109375, 1.157318115234375, 1.202880859375, 1.248443603515625, 1.29400634765625, 1.339569091796875, 1.3851318359375, 1.430694580078125, 1.47625732421875, 1.521820068359375, 1.5673828125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 9.0, 15.0, 31.0, 37.0, 47.0, 64.0, 76.0, 108.0, 81.0, 98.0, 87.0, 92.0, 63.0, 65.0, 37.0, 28.0, 17.0, 15.0, 10.0, 8.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52490234375, -0.508636474609375, -0.49237060546875, -0.476104736328125, -0.4598388671875, -0.443572998046875, -0.42730712890625, -0.411041259765625, -0.394775390625, -0.378509521484375, -0.36224365234375, -0.345977783203125, -0.3297119140625, -0.313446044921875, -0.29718017578125, -0.280914306640625, -0.2646484375, -0.248382568359375, -0.23211669921875, -0.215850830078125, -0.1995849609375, -0.183319091796875, -0.16705322265625, -0.150787353515625, -0.134521484375, -0.118255615234375, -0.10198974609375, -0.085723876953125, -0.0694580078125, -0.053192138671875, -0.03692626953125, -0.020660400390625, -0.00439453125, 0.011871337890625, 0.02813720703125, 0.044403076171875, 0.0606689453125, 0.076934814453125, 0.09320068359375, 0.109466552734375, 0.125732421875, 0.141998291015625, 0.15826416015625, 0.174530029296875, 0.1907958984375, 0.207061767578125, 0.22332763671875, 0.239593505859375, 0.255859375, 0.272125244140625, 0.28839111328125, 0.304656982421875, 0.3209228515625, 0.337188720703125, 0.35345458984375, 0.369720458984375, 0.385986328125, 0.402252197265625, 0.41851806640625, 0.434783935546875, 0.4510498046875, 0.467315673828125, 0.48358154296875, 0.499847412109375, 0.51611328125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 2.0, 5.0, 3.0, 9.0, 21.0, 24.0, 79.0, 96.0, 206.0, 471.0, 1043.0, 2417.0, 6988.0, 26977.0, 244761.0, 3698094.0, 179507.0, 23127.0, 6281.0, 2345.0, 1017.0, 424.0, 193.0, 94.0, 39.0, 28.0, 11.0, 6.0, 5.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67431640625, -0.6488189697265625, -0.623321533203125, -0.5978240966796875, -0.57232666015625, -0.5468292236328125, -0.521331787109375, -0.4958343505859375, -0.4703369140625, -0.4448394775390625, -0.419342041015625, -0.3938446044921875, -0.36834716796875, -0.3428497314453125, -0.317352294921875, -0.2918548583984375, -0.266357421875, -0.2408599853515625, -0.215362548828125, -0.1898651123046875, -0.16436767578125, -0.1388702392578125, -0.113372802734375, -0.0878753662109375, -0.0623779296875, -0.0368804931640625, -0.011383056640625, 0.0141143798828125, 0.03961181640625, 0.0651092529296875, 0.090606689453125, 0.1161041259765625, 0.1416015625, 0.1670989990234375, 0.192596435546875, 0.2180938720703125, 0.24359130859375, 0.2690887451171875, 0.294586181640625, 0.3200836181640625, 0.3455810546875, 0.3710784912109375, 0.396575927734375, 0.4220733642578125, 0.44757080078125, 0.4730682373046875, 0.498565673828125, 0.5240631103515625, 0.549560546875, 0.5750579833984375, 0.600555419921875, 0.6260528564453125, 0.65155029296875, 0.6770477294921875, 0.702545166015625, 0.7280426025390625, 0.7535400390625, 0.7790374755859375, 0.804534912109375, 0.8300323486328125, 0.85552978515625, 0.8810272216796875, 0.906524658203125, 0.9320220947265625, 0.95751953125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 4.0, 3.0, 4.0, 7.0, 17.0, 19.0, 25.0, 25.0, 72.0, 132.0, 316.0, 1082.0, 1528.0, 412.0, 154.0, 92.0, 46.0, 36.0, 32.0, 16.0, 12.0, 7.0, 2.0, 4.0, 7.0, 1.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.38916015625, -0.3792152404785156, -0.36927032470703125, -0.3593254089355469, -0.3493804931640625, -0.3394355773925781, -0.32949066162109375, -0.3195457458496094, -0.309600830078125, -0.2996559143066406, -0.28971099853515625, -0.2797660827636719, -0.2698211669921875, -0.2598762512207031, -0.24993133544921875, -0.23998641967773438, -0.23004150390625, -0.22009658813476562, -0.21015167236328125, -0.20020675659179688, -0.1902618408203125, -0.18031692504882812, -0.17037200927734375, -0.16042709350585938, -0.150482177734375, -0.14053726196289062, -0.13059234619140625, -0.12064743041992188, -0.1107025146484375, -0.10075759887695312, -0.09081268310546875, -0.08086776733398438, -0.0709228515625, -0.060977935791015625, -0.05103302001953125, -0.041088104248046875, -0.0311431884765625, -0.021198272705078125, -0.01125335693359375, -0.001308441162109375, 0.008636474609375, 0.018581390380859375, 0.02852630615234375, 0.038471221923828125, 0.0484161376953125, 0.058361053466796875, 0.06830596923828125, 0.07825088500976562, 0.08819580078125, 0.09814071655273438, 0.10808563232421875, 0.11803054809570312, 0.1279754638671875, 0.13792037963867188, 0.14786529541015625, 0.15781021118164062, 0.167755126953125, 0.17770004272460938, 0.18764495849609375, 0.19758987426757812, 0.2075347900390625, 0.21747970581054688, 0.22742462158203125, 0.23736953735351562, 0.247314453125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 20.0, 34.0, 54.0, 74.0, 114.0, 121.0, 123.0, 139.0, 108.0, 65.0, 53.0, 29.0, 20.0, 11.0, 7.0, 7.0, 2.0, 4.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0534998178482056, -1.0099730491638184, -0.9664463996887207, -0.9229196906089783, -0.8793929815292358, -0.8358662724494934, -0.792339563369751, -0.7488128542900085, -0.7052861452102661, -0.6617594361305237, -0.6182327270507812, -0.5747060179710388, -0.5311793088912964, -0.48765259981155396, -0.4441258907318115, -0.4005991816520691, -0.35707247257232666, -0.31354576349258423, -0.2700190544128418, -0.22649234533309937, -0.18296563625335693, -0.1394389271736145, -0.09591221809387207, -0.05238550901412964, -0.008858799934387207, 0.034667909145355225, 0.07819461822509766, 0.12172132730484009, 0.16524803638458252, 0.20877474546432495, 0.2523014545440674, 0.2958281636238098, 0.3393549919128418, 0.38288170099258423, 0.42640841007232666, 0.4699351191520691, 0.5134618282318115, 0.556988537311554, 0.6005152463912964, 0.6440419554710388, 0.6875686645507812, 0.7310953736305237, 0.7746220827102661, 0.8181487917900085, 0.861675500869751, 0.9052022099494934, 0.9487289190292358, 0.9922556281089783, 1.0357823371887207, 1.0793089866638184, 1.1228357553482056, 1.1663625240325928, 1.2098891735076904, 1.253415822982788, 1.2969425916671753, 1.3404693603515625, 1.3839960098266602, 1.4275226593017578, 1.471049427986145, 1.5145761966705322, 1.5581028461456299, 1.6016294956207275, 1.6451562643051147, 1.688683032989502, 1.7322096824645996]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 10.0, 5.0, 5.0, 12.0, 16.0, 22.0, 15.0, 28.0, 29.0, 33.0, 23.0, 37.0, 41.0, 32.0, 51.0, 35.0, 49.0, 50.0, 40.0, 41.0, 55.0, 42.0, 48.0, 38.0, 39.0, 37.0, 39.0, 31.0, 16.0, 15.0, 15.0, 12.0, 2.0, 11.0, 7.0, 5.0, 6.0, 3.0, 0.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.148053765296936, -1.1169829368591309, -1.0859121084213257, -1.0548412799835205, -1.0237704515457153, -0.9926996231079102, -0.9616287350654602, -0.930557906627655, -0.8994870781898499, -0.8684162497520447, -0.8373454213142395, -0.8062745928764343, -0.7752037048339844, -0.7441328763961792, -0.713062047958374, -0.6819912195205688, -0.6509203910827637, -0.6198495626449585, -0.5887787342071533, -0.5577079057693481, -0.526637077331543, -0.4955662190914154, -0.46449536085128784, -0.43342453241348267, -0.4023537039756775, -0.3712828755378723, -0.34021204710006714, -0.3091411888599396, -0.2780703604221344, -0.24699953198432922, -0.21592868864536285, -0.18485784530639648, -0.15378707647323608, -0.12271624058485031, -0.09164540469646454, -0.060574568808078766, -0.029503732919692993, 0.0015670955181121826, 0.03263793885707855, 0.06370878219604492, 0.0947796106338501, 0.12585043907165527, 0.15692128241062164, 0.187992125749588, 0.2190629541873932, 0.25013378262519836, 0.2812046408653259, 0.3122754693031311, 0.3433462977409363, 0.37441712617874146, 0.40548795461654663, 0.4365588128566742, 0.46762964129447937, 0.49870046973228455, 0.5297713279724121, 0.5608421564102173, 0.5919129848480225, 0.6229838132858276, 0.6540546417236328, 0.685125470161438, 0.7161962985992432, 0.7472671270370483, 0.7783380150794983, 0.8094088435173035, 0.8404796719551086]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 5.0, 5.0, 4.0, 12.0, 24.0, 41.0, 87.0, 186.0, 299.0, 634.0, 1461.0, 4974.0, 27370.0, 307664.0, 633112.0, 60357.0, 8423.0, 2225.0, 846.0, 376.0, 216.0, 102.0, 49.0, 35.0, 12.0, 9.0, 9.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9609375, -1.903564453125, -1.84619140625, -1.788818359375, -1.7314453125, -1.674072265625, -1.61669921875, -1.559326171875, -1.501953125, -1.444580078125, -1.38720703125, -1.329833984375, -1.2724609375, -1.215087890625, -1.15771484375, -1.100341796875, -1.04296875, -0.985595703125, -0.92822265625, -0.870849609375, -0.8134765625, -0.756103515625, -0.69873046875, -0.641357421875, -0.583984375, -0.526611328125, -0.46923828125, -0.411865234375, -0.3544921875, -0.297119140625, -0.23974609375, -0.182373046875, -0.125, -0.067626953125, -0.01025390625, 0.047119140625, 0.1044921875, 0.161865234375, 0.21923828125, 0.276611328125, 0.333984375, 0.391357421875, 0.44873046875, 0.506103515625, 0.5634765625, 0.620849609375, 0.67822265625, 0.735595703125, 0.79296875, 0.850341796875, 0.90771484375, 0.965087890625, 1.0224609375, 1.079833984375, 1.13720703125, 1.194580078125, 1.251953125, 1.309326171875, 1.36669921875, 1.424072265625, 1.4814453125, 1.538818359375, 1.59619140625, 1.653564453125, 1.7109375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 9.0, 23.0, 28.0, 37.0, 53.0, 62.0, 87.0, 92.0, 107.0, 91.0, 83.0, 82.0, 71.0, 50.0, 44.0, 26.0, 15.0, 13.0, 9.0, 4.0, 7.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5263671875, -0.5104560852050781, -0.49454498291015625, -0.4786338806152344, -0.4627227783203125, -0.4468116760253906, -0.43090057373046875, -0.4149894714355469, -0.399078369140625, -0.3831672668457031, -0.36725616455078125, -0.3513450622558594, -0.3354339599609375, -0.3195228576660156, -0.30361175537109375, -0.2877006530761719, -0.27178955078125, -0.2558784484863281, -0.23996734619140625, -0.22405624389648438, -0.2081451416015625, -0.19223403930664062, -0.17632293701171875, -0.16041183471679688, -0.144500732421875, -0.12858963012695312, -0.11267852783203125, -0.09676742553710938, -0.0808563232421875, -0.06494522094726562, -0.04903411865234375, -0.033123016357421875, -0.0172119140625, -0.001300811767578125, 0.01461029052734375, 0.030521392822265625, 0.0464324951171875, 0.062343597412109375, 0.07825469970703125, 0.09416580200195312, 0.110076904296875, 0.12598800659179688, 0.14189910888671875, 0.15781021118164062, 0.1737213134765625, 0.18963241577148438, 0.20554351806640625, 0.22145462036132812, 0.23736572265625, 0.2532768249511719, 0.26918792724609375, 0.2850990295410156, 0.3010101318359375, 0.3169212341308594, 0.33283233642578125, 0.3487434387207031, 0.364654541015625, 0.3805656433105469, 0.39647674560546875, 0.4123878479003906, 0.4282989501953125, 0.4442100524902344, 0.46012115478515625, 0.4760322570800781, 0.491943359375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 13.0, 11.0, 12.0, 9.0, 22.0, 29.0, 33.0, 51.0, 77.0, 120.0, 188.0, 314.0, 751.0, 1718.0, 4685.0, 14997.0, 56545.0, 261978.0, 525748.0, 134952.0, 31817.0, 8995.0, 3006.0, 1190.0, 484.0, 292.0, 157.0, 117.0, 65.0, 36.0, 51.0, 26.0, 14.0, 16.0, 13.0, 6.0, 4.0, 6.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.083984375, -1.0532684326171875, -1.022552490234375, -0.9918365478515625, -0.96112060546875, -0.9304046630859375, -0.899688720703125, -0.8689727783203125, -0.8382568359375, -0.8075408935546875, -0.776824951171875, -0.7461090087890625, -0.71539306640625, -0.6846771240234375, -0.653961181640625, -0.6232452392578125, -0.592529296875, -0.5618133544921875, -0.531097412109375, -0.5003814697265625, -0.46966552734375, -0.4389495849609375, -0.408233642578125, -0.3775177001953125, -0.3468017578125, -0.3160858154296875, -0.285369873046875, -0.2546539306640625, -0.22393798828125, -0.1932220458984375, -0.162506103515625, -0.1317901611328125, -0.10107421875, -0.0703582763671875, -0.039642333984375, -0.0089263916015625, 0.02178955078125, 0.0525054931640625, 0.083221435546875, 0.1139373779296875, 0.1446533203125, 0.1753692626953125, 0.206085205078125, 0.2368011474609375, 0.26751708984375, 0.2982330322265625, 0.328948974609375, 0.3596649169921875, 0.390380859375, 0.4210968017578125, 0.451812744140625, 0.4825286865234375, 0.51324462890625, 0.5439605712890625, 0.574676513671875, 0.6053924560546875, 0.6361083984375, 0.6668243408203125, 0.697540283203125, 0.7282562255859375, 0.75897216796875, 0.7896881103515625, 0.820404052734375, 0.8511199951171875, 0.8818359375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 6.0, 5.0, 2.0, 6.0, 6.0, 9.0, 12.0, 17.0, 15.0, 29.0, 17.0, 32.0, 27.0, 43.0, 34.0, 45.0, 31.0, 38.0, 49.0, 56.0, 46.0, 55.0, 49.0, 38.0, 36.0, 45.0, 39.0, 29.0, 15.0, 26.0, 27.0, 23.0, 16.0, 18.0, 9.0, 9.0, 11.0, 11.0, 5.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.09765625, -1.0645294189453125, -1.031402587890625, -0.9982757568359375, -0.96514892578125, -0.9320220947265625, -0.898895263671875, -0.8657684326171875, -0.8326416015625, -0.7995147705078125, -0.766387939453125, -0.7332611083984375, -0.70013427734375, -0.6670074462890625, -0.633880615234375, -0.6007537841796875, -0.567626953125, -0.5345001220703125, -0.501373291015625, -0.4682464599609375, -0.43511962890625, -0.4019927978515625, -0.368865966796875, -0.3357391357421875, -0.3026123046875, -0.2694854736328125, -0.236358642578125, -0.2032318115234375, -0.17010498046875, -0.1369781494140625, -0.103851318359375, -0.0707244873046875, -0.03759765625, -0.0044708251953125, 0.028656005859375, 0.0617828369140625, 0.09490966796875, 0.1280364990234375, 0.161163330078125, 0.1942901611328125, 0.2274169921875, 0.2605438232421875, 0.293670654296875, 0.3267974853515625, 0.35992431640625, 0.3930511474609375, 0.426177978515625, 0.4593048095703125, 0.492431640625, 0.5255584716796875, 0.558685302734375, 0.5918121337890625, 0.62493896484375, 0.6580657958984375, 0.691192626953125, 0.7243194580078125, 0.7574462890625, 0.7905731201171875, 0.823699951171875, 0.8568267822265625, 0.88995361328125, 0.9230804443359375, 0.956207275390625, 0.9893341064453125, 1.0224609375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 8.0, 13.0, 9.0, 21.0, 32.0, 58.0, 122.0, 300.0, 727.0, 2169.0, 10465.0, 70303.0, 702300.0, 231352.0, 24350.0, 4326.0, 1184.0, 452.0, 162.0, 90.0, 46.0, 27.0, 14.0, 8.0, 10.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.385009765625, -0.3732490539550781, -0.36148834228515625, -0.3497276306152344, -0.3379669189453125, -0.3262062072753906, -0.31444549560546875, -0.3026847839355469, -0.290924072265625, -0.2791633605957031, -0.26740264892578125, -0.2556419372558594, -0.2438812255859375, -0.23212051391601562, -0.22035980224609375, -0.20859909057617188, -0.19683837890625, -0.18507766723632812, -0.17331695556640625, -0.16155624389648438, -0.1497955322265625, -0.13803482055664062, -0.12627410888671875, -0.11451339721679688, -0.102752685546875, -0.09099197387695312, -0.07923126220703125, -0.06747055053710938, -0.0557098388671875, -0.043949127197265625, -0.03218841552734375, -0.020427703857421875, -0.0086669921875, 0.003093719482421875, 0.01485443115234375, 0.026615142822265625, 0.0383758544921875, 0.050136566162109375, 0.06189727783203125, 0.07365798950195312, 0.085418701171875, 0.09717941284179688, 0.10894012451171875, 0.12070083618164062, 0.1324615478515625, 0.14422225952148438, 0.15598297119140625, 0.16774368286132812, 0.17950439453125, 0.19126510620117188, 0.20302581787109375, 0.21478652954101562, 0.2265472412109375, 0.23830795288085938, 0.25006866455078125, 0.2618293762207031, 0.273590087890625, 0.2853507995605469, 0.29711151123046875, 0.3088722229003906, 0.3206329345703125, 0.3323936462402344, 0.34415435791015625, 0.3559150695800781, 0.36767578125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 3.0, 2.0, 10.0, 7.0, 7.0, 13.0, 15.0, 15.0, 15.0, 18.0, 32.0, 48.0, 65.0, 83.0, 129.0, 119.0, 88.0, 92.0, 56.0, 43.0, 29.0, 21.0, 15.0, 6.0, 9.0, 8.0, 10.0, 8.0, 9.0, 7.0, 2.0, 4.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-9.614229202270508e-05, -9.349267929792404e-05, -9.0843066573143e-05, -8.819345384836197e-05, -8.554384112358093e-05, -8.28942283987999e-05, -8.024461567401886e-05, -7.759500294923782e-05, -7.494539022445679e-05, -7.229577749967575e-05, -6.964616477489471e-05, -6.699655205011368e-05, -6.434693932533264e-05, -6.16973266005516e-05, -5.904771387577057e-05, -5.639810115098953e-05, -5.3748488426208496e-05, -5.109887570142746e-05, -4.844926297664642e-05, -4.579965025186539e-05, -4.315003752708435e-05, -4.0500424802303314e-05, -3.785081207752228e-05, -3.520119935274124e-05, -3.2551586627960205e-05, -2.990197390317917e-05, -2.7252361178398132e-05, -2.4602748453617096e-05, -2.195313572883606e-05, -1.9303523004055023e-05, -1.6653910279273987e-05, -1.400429755449295e-05, -1.1354684829711914e-05, -8.705072104930878e-06, -6.055459380149841e-06, -3.405846655368805e-06, -7.562339305877686e-07, 1.8933787941932678e-06, 4.542991518974304e-06, 7.1926042437553406e-06, 9.842216968536377e-06, 1.2491829693317413e-05, 1.514144241809845e-05, 1.7791055142879486e-05, 2.0440667867660522e-05, 2.309028059244156e-05, 2.5739893317222595e-05, 2.838950604200363e-05, 3.103911876678467e-05, 3.3688731491565704e-05, 3.633834421634674e-05, 3.898795694112778e-05, 4.1637569665908813e-05, 4.428718239068985e-05, 4.6936795115470886e-05, 4.958640784025192e-05, 5.223602056503296e-05, 5.4885633289813995e-05, 5.753524601459503e-05, 6.018485873937607e-05, 6.28344714641571e-05, 6.548408418893814e-05, 6.813369691371918e-05, 7.078330963850021e-05, 7.343292236328125e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 6.0, 6.0, 6.0, 11.0, 16.0, 26.0, 40.0, 62.0, 127.0, 226.0, 445.0, 869.0, 2042.0, 5632.0, 17517.0, 67195.0, 495688.0, 380791.0, 54799.0, 14812.0, 4739.0, 1848.0, 763.0, 365.0, 185.0, 124.0, 65.0, 44.0, 38.0, 28.0, 6.0, 8.0, 8.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2880859375, -0.2790641784667969, -0.27004241943359375, -0.2610206604003906, -0.2519989013671875, -0.24297714233398438, -0.23395538330078125, -0.22493362426757812, -0.215911865234375, -0.20689010620117188, -0.19786834716796875, -0.18884658813476562, -0.1798248291015625, -0.17080307006835938, -0.16178131103515625, -0.15275955200195312, -0.14373779296875, -0.13471603393554688, -0.12569427490234375, -0.11667251586914062, -0.1076507568359375, -0.09862899780273438, -0.08960723876953125, -0.08058547973632812, -0.071563720703125, -0.06254196166992188, -0.05352020263671875, -0.044498443603515625, -0.0354766845703125, -0.026454925537109375, -0.01743316650390625, -0.008411407470703125, 0.0006103515625, 0.009632110595703125, 0.01865386962890625, 0.027675628662109375, 0.0366973876953125, 0.045719146728515625, 0.05474090576171875, 0.06376266479492188, 0.072784423828125, 0.08180618286132812, 0.09082794189453125, 0.09984970092773438, 0.1088714599609375, 0.11789321899414062, 0.12691497802734375, 0.13593673706054688, 0.14495849609375, 0.15398025512695312, 0.16300201416015625, 0.17202377319335938, 0.1810455322265625, 0.19006729125976562, 0.19908905029296875, 0.20811080932617188, 0.217132568359375, 0.22615432739257812, 0.23517608642578125, 0.24419784545898438, 0.2532196044921875, 0.2622413635253906, 0.27126312255859375, 0.2802848815917969, 0.289306640625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 14.0, 7.0, 6.0, 26.0, 25.0, 26.0, 35.0, 67.0, 98.0, 122.0, 114.0, 106.0, 93.0, 63.0, 48.0, 33.0, 27.0, 28.0, 14.0, 9.0, 10.0, 9.0, 6.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38720703125, -0.37738800048828125, -0.3675689697265625, -0.35774993896484375, -0.347930908203125, -0.33811187744140625, -0.3282928466796875, -0.31847381591796875, -0.30865478515625, -0.29883575439453125, -0.2890167236328125, -0.27919769287109375, -0.269378662109375, -0.25955963134765625, -0.2497406005859375, -0.23992156982421875, -0.2301025390625, -0.22028350830078125, -0.2104644775390625, -0.20064544677734375, -0.190826416015625, -0.18100738525390625, -0.1711883544921875, -0.16136932373046875, -0.15155029296875, -0.14173126220703125, -0.1319122314453125, -0.12209320068359375, -0.112274169921875, -0.10245513916015625, -0.0926361083984375, -0.08281707763671875, -0.072998046875, -0.06317901611328125, -0.0533599853515625, -0.04354095458984375, -0.033721923828125, -0.02390289306640625, -0.0140838623046875, -0.00426483154296875, 0.00555419921875, 0.01537322998046875, 0.0251922607421875, 0.03501129150390625, 0.044830322265625, 0.05464935302734375, 0.0644683837890625, 0.07428741455078125, 0.0841064453125, 0.09392547607421875, 0.1037445068359375, 0.11356353759765625, 0.123382568359375, 0.13320159912109375, 0.1430206298828125, 0.15283966064453125, 0.16265869140625, 0.17247772216796875, 0.1822967529296875, 0.19211578369140625, 0.201934814453125, 0.21175384521484375, 0.2215728759765625, 0.23139190673828125, 0.2412109375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 31.0, 153.0, 374.0, 331.0, 89.0, 20.0, 9.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.770190238952637, -15.276162147521973, -14.782134056091309, -14.288105964660645, -13.79407787322998, -13.300049781799316, -12.806021690368652, -12.311993598937988, -11.817965507507324, -11.32393741607666, -10.829909324645996, -10.335881233215332, -9.841853141784668, -9.347825050354004, -8.85379695892334, -8.359768867492676, -7.86574125289917, -7.371713161468506, -6.877685070037842, -6.383656978607178, -5.889628887176514, -5.395601272583008, -4.901573181152344, -4.40754508972168, -3.9135167598724365, -3.4194886684417725, -2.9254605770111084, -2.4314327239990234, -1.9374045133590698, -1.4433765411376953, -0.9493484497070312, -0.4553203582763672, 0.038707733154296875, 0.5327358245849609, 1.026763916015625, 1.5207918882369995, 2.014820098876953, 2.508847951889038, 3.002876043319702, 3.496904134750366, 3.9909322261810303, 4.484960079193115, 4.978988170623779, 5.473016262054443, 5.967044353485107, 6.4610724449157715, 6.9551005363464355, 7.4491286277771, 7.943156719207764, 8.43718433380127, 8.931212425231934, 9.425240516662598, 9.919268608093262, 10.413296699523926, 10.90732479095459, 11.401352882385254, 11.895380973815918, 12.389409065246582, 12.883437156677246, 13.37746524810791, 13.871493339538574, 14.365521430969238, 14.859549522399902, 15.353577613830566, 15.84760570526123]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 8.0, 8.0, 6.0, 14.0, 12.0, 9.0, 18.0, 21.0, 8.0, 15.0, 25.0, 25.0, 29.0, 30.0, 35.0, 28.0, 32.0, 46.0, 48.0, 35.0, 36.0, 32.0, 52.0, 43.0, 37.0, 31.0, 40.0, 36.0, 41.0, 26.0, 29.0, 24.0, 23.0, 16.0, 16.0, 10.0, 11.0, 19.0, 7.0, 6.0, 2.0, 2.0, 2.0, 7.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-4.561349391937256, -4.426307201385498, -4.291265487670898, -4.156223297119141, -4.021181106567383, -3.886138916015625, -3.7510969638824463, -3.6160550117492676, -3.4810128211975098, -3.345970630645752, -3.2109286785125732, -3.0758867263793945, -2.9408445358276367, -2.805802345275879, -2.6707603931427, -2.5357184410095215, -2.4006762504577637, -2.265634059906006, -2.130592107772827, -1.9955500364303589, -1.8605079650878906, -1.7254658937454224, -1.590423822402954, -1.4553817510604858, -1.3203396797180176, -1.1852976083755493, -1.050255537033081, -0.9152134656906128, -0.7801713943481445, -0.6451293230056763, -0.510087251663208, -0.37504518032073975, -0.2400035858154297, -0.10496151447296143, 0.030080556869506836, 0.1651226282119751, 0.30016469955444336, 0.4352067708969116, 0.5702488422393799, 0.7052909135818481, 0.8403329849243164, 0.9753750562667847, 1.110417127609253, 1.2454591989517212, 1.3805012702941895, 1.5155433416366577, 1.650585412979126, 1.7856274843215942, 1.9206695556640625, 2.0557117462158203, 2.190753698348999, 2.3257956504821777, 2.4608378410339355, 2.5958800315856934, 2.730921983718872, 2.865963935852051, 3.0010061264038086, 3.1360483169555664, 3.271090269088745, 3.406132221221924, 3.5411744117736816, 3.6762166023254395, 3.811258554458618, 3.946300506591797, 4.081342697143555]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 3.0, 10.0, 14.0, 19.0, 20.0, 45.0, 49.0, 76.0, 148.0, 223.0, 410.0, 701.0, 1645.0, 4290.0, 15186.0, 128529.0, 3941601.0, 81916.0, 12416.0, 3876.0, 1456.0, 684.0, 377.0, 221.0, 132.0, 70.0, 51.0, 36.0, 26.0, 14.0, 11.0, 11.0, 4.0, 1.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4794921875, -1.4235076904296875, -1.367523193359375, -1.3115386962890625, -1.25555419921875, -1.1995697021484375, -1.143585205078125, -1.0876007080078125, -1.0316162109375, -0.9756317138671875, -0.919647216796875, -0.8636627197265625, -0.80767822265625, -0.7516937255859375, -0.695709228515625, -0.6397247314453125, -0.583740234375, -0.5277557373046875, -0.471771240234375, -0.4157867431640625, -0.35980224609375, -0.3038177490234375, -0.247833251953125, -0.1918487548828125, -0.1358642578125, -0.0798797607421875, -0.023895263671875, 0.0320892333984375, 0.08807373046875, 0.1440582275390625, 0.200042724609375, 0.2560272216796875, 0.31201171875, 0.3679962158203125, 0.423980712890625, 0.4799652099609375, 0.53594970703125, 0.5919342041015625, 0.647918701171875, 0.7039031982421875, 0.7598876953125, 0.8158721923828125, 0.871856689453125, 0.9278411865234375, 0.98382568359375, 1.0398101806640625, 1.095794677734375, 1.1517791748046875, 1.207763671875, 1.2637481689453125, 1.319732666015625, 1.3757171630859375, 1.43170166015625, 1.4876861572265625, 1.543670654296875, 1.5996551513671875, 1.6556396484375, 1.7116241455078125, 1.767608642578125, 1.8235931396484375, 1.87957763671875, 1.9355621337890625, 1.991546630859375, 2.0475311279296875, 2.103515625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 11.0, 20.0, 24.0, 54.0, 58.0, 73.0, 73.0, 105.0, 100.0, 87.0, 92.0, 68.0, 65.0, 51.0, 35.0, 28.0, 15.0, 16.0, 11.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52587890625, -0.5093841552734375, -0.492889404296875, -0.4763946533203125, -0.45989990234375, -0.4434051513671875, -0.426910400390625, -0.4104156494140625, -0.3939208984375, -0.3774261474609375, -0.360931396484375, -0.3444366455078125, -0.32794189453125, -0.3114471435546875, -0.294952392578125, -0.2784576416015625, -0.261962890625, -0.2454681396484375, -0.228973388671875, -0.2124786376953125, -0.19598388671875, -0.1794891357421875, -0.162994384765625, -0.1464996337890625, -0.1300048828125, -0.1135101318359375, -0.097015380859375, -0.0805206298828125, -0.06402587890625, -0.0475311279296875, -0.031036376953125, -0.0145416259765625, 0.001953125, 0.0184478759765625, 0.034942626953125, 0.0514373779296875, 0.06793212890625, 0.0844268798828125, 0.100921630859375, 0.1174163818359375, 0.1339111328125, 0.1504058837890625, 0.166900634765625, 0.1833953857421875, 0.19989013671875, 0.2163848876953125, 0.232879638671875, 0.2493743896484375, 0.265869140625, 0.2823638916015625, 0.298858642578125, 0.3153533935546875, 0.33184814453125, 0.3483428955078125, 0.364837646484375, 0.3813323974609375, 0.3978271484375, 0.4143218994140625, 0.430816650390625, 0.4473114013671875, 0.46380615234375, 0.4803009033203125, 0.496795654296875, 0.5132904052734375, 0.52978515625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 6.0, 10.0, 10.0, 19.0, 22.0, 26.0, 33.0, 41.0, 82.0, 98.0, 155.0, 214.0, 283.0, 419.0, 647.0, 1034.0, 1859.0, 3635.0, 8373.0, 24322.0, 105597.0, 3206654.0, 747488.0, 62793.0, 17015.0, 6449.0, 2907.0, 1502.0, 837.0, 539.0, 348.0, 255.0, 177.0, 118.0, 88.0, 76.0, 44.0, 31.0, 21.0, 21.0, 15.0, 6.0, 9.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8251953125, -0.7984466552734375, -0.771697998046875, -0.7449493408203125, -0.71820068359375, -0.6914520263671875, -0.664703369140625, -0.6379547119140625, -0.6112060546875, -0.5844573974609375, -0.557708740234375, -0.5309600830078125, -0.50421142578125, -0.4774627685546875, -0.450714111328125, -0.4239654541015625, -0.397216796875, -0.3704681396484375, -0.343719482421875, -0.3169708251953125, -0.29022216796875, -0.2634735107421875, -0.236724853515625, -0.2099761962890625, -0.1832275390625, -0.1564788818359375, -0.129730224609375, -0.1029815673828125, -0.07623291015625, -0.0494842529296875, -0.022735595703125, 0.0040130615234375, 0.03076171875, 0.0575103759765625, 0.084259033203125, 0.1110076904296875, 0.13775634765625, 0.1645050048828125, 0.191253662109375, 0.2180023193359375, 0.2447509765625, 0.2714996337890625, 0.298248291015625, 0.3249969482421875, 0.35174560546875, 0.3784942626953125, 0.405242919921875, 0.4319915771484375, 0.458740234375, 0.4854888916015625, 0.512237548828125, 0.5389862060546875, 0.56573486328125, 0.5924835205078125, 0.619232177734375, 0.6459808349609375, 0.6727294921875, 0.6994781494140625, 0.726226806640625, 0.7529754638671875, 0.77972412109375, 0.8064727783203125, 0.833221435546875, 0.8599700927734375, 0.88671875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 9.0, 5.0, 12.0, 18.0, 26.0, 41.0, 55.0, 111.0, 500.0, 2538.0, 457.0, 128.0, 59.0, 45.0, 19.0, 14.0, 9.0, 6.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59765625, -0.5798110961914062, -0.5619659423828125, -0.5441207885742188, -0.526275634765625, -0.5084304809570312, -0.4905853271484375, -0.47274017333984375, -0.45489501953125, -0.43704986572265625, -0.4192047119140625, -0.40135955810546875, -0.383514404296875, -0.36566925048828125, -0.3478240966796875, -0.32997894287109375, -0.3121337890625, -0.29428863525390625, -0.2764434814453125, -0.25859832763671875, -0.240753173828125, -0.22290802001953125, -0.2050628662109375, -0.18721771240234375, -0.16937255859375, -0.15152740478515625, -0.1336822509765625, -0.11583709716796875, -0.097991943359375, -0.08014678955078125, -0.0623016357421875, -0.04445648193359375, -0.026611328125, -0.00876617431640625, 0.0090789794921875, 0.02692413330078125, 0.044769287109375, 0.06261444091796875, 0.0804595947265625, 0.09830474853515625, 0.11614990234375, 0.13399505615234375, 0.1518402099609375, 0.16968536376953125, 0.187530517578125, 0.20537567138671875, 0.2232208251953125, 0.24106597900390625, 0.2589111328125, 0.27675628662109375, 0.2946014404296875, 0.31244659423828125, 0.330291748046875, 0.34813690185546875, 0.3659820556640625, 0.38382720947265625, 0.40167236328125, 0.41951751708984375, 0.4373626708984375, 0.45520782470703125, 0.473052978515625, 0.49089813232421875, 0.5087432861328125, 0.5265884399414062, 0.54443359375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 8.0, 13.0, 25.0, 51.0, 106.0, 200.0, 229.0, 170.0, 107.0, 42.0, 26.0, 12.0, 11.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.156145095825195, -4.062246322631836, -3.9683480262756348, -3.8744492530822754, -3.780550718307495, -3.686652183532715, -3.5927536487579346, -3.4988551139831543, -3.404956340789795, -3.3110578060150146, -3.2171592712402344, -3.123260498046875, -3.0293619632720947, -2.9354634284973145, -2.841564893722534, -2.747666358947754, -2.6537678241729736, -2.5598692893981934, -2.465970754623413, -2.372072219848633, -2.2781734466552734, -2.184274911880493, -2.090376377105713, -1.9964778423309326, -1.9025791883468628, -1.8086806535720825, -1.7147819995880127, -1.6208834648132324, -1.5269849300384521, -1.4330862760543823, -1.339187741279602, -1.2452890872955322, -1.151390790939331, -1.0574922561645508, -0.963593602180481, -0.8696950674057007, -0.7757964730262756, -0.6818978786468506, -0.5879993438720703, -0.49410074949264526, -0.4002021551132202, -0.30630356073379517, -0.2124049961566925, -0.11850643157958984, -0.024607837200164795, 0.06929075717926025, 0.16318929195404053, 0.2570878863334656, 0.3509864807128906, 0.4448850750923157, 0.5387836694717407, 0.632682204246521, 0.726580798625946, 0.8204793930053711, 0.9143779277801514, 1.0082764625549316, 1.1021751165390015, 1.1960736513137817, 1.2899723052978516, 1.3838708400726318, 1.477769374847412, 1.571668028831482, 1.6655665636062622, 1.759465217590332, 1.8533637523651123]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 4.0, 9.0, 11.0, 15.0, 19.0, 26.0, 24.0, 28.0, 32.0, 40.0, 43.0, 49.0, 63.0, 69.0, 74.0, 70.0, 64.0, 58.0, 46.0, 47.0, 38.0, 37.0, 24.0, 35.0, 24.0, 26.0, 11.0, 10.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.0081117153167725, -1.955435872077942, -1.9027599096298218, -1.8500840663909912, -1.797408103942871, -1.7447322607040405, -1.69205641746521, -1.6393804550170898, -1.5867044925689697, -1.5340286493301392, -1.481352686882019, -1.4286768436431885, -1.3760008811950684, -1.3233250379562378, -1.2706491947174072, -1.217973232269287, -1.1652973890304565, -1.112621545791626, -1.0599455833435059, -1.0072697401046753, -0.9545937776565552, -0.9019179344177246, -0.8492420315742493, -0.7965661287307739, -0.7438902258872986, -0.6912143230438232, -0.6385384202003479, -0.5858625173568726, -0.533186674118042, -0.48051074147224426, -0.4278348684310913, -0.37515896558761597, -0.3224831819534302, -0.26980727910995483, -0.21713139116764069, -0.16445550322532654, -0.1117796003818512, -0.059103697538375854, -0.0064278244972229, 0.04624807834625244, 0.09892398118972778, 0.15159988403320312, 0.20427577197551727, 0.2569516599178314, 0.30962756276130676, 0.3623034656047821, 0.41497933864593506, 0.4676552414894104, 0.5203311443328857, 0.5730070471763611, 0.6256829500198364, 0.678358793258667, 0.7310347557067871, 0.7837105989456177, 0.836386501789093, 0.8890624046325684, 0.9417383074760437, 0.994414210319519, 1.0470900535583496, 1.0997660160064697, 1.1524418592453003, 1.2051178216934204, 1.257793664932251, 1.310469627380371, 1.3631454706192017]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 5.0, 4.0, 11.0, 11.0, 16.0, 25.0, 31.0, 72.0, 106.0, 171.0, 308.0, 595.0, 1357.0, 3566.0, 11823.0, 64083.0, 506831.0, 395580.0, 48737.0, 9708.0, 3028.0, 1206.0, 575.0, 286.0, 169.0, 109.0, 50.0, 33.0, 19.0, 16.0, 8.0, 6.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.791015625, -1.731170654296875, -1.67132568359375, -1.611480712890625, -1.5516357421875, -1.491790771484375, -1.43194580078125, -1.372100830078125, -1.312255859375, -1.252410888671875, -1.19256591796875, -1.132720947265625, -1.0728759765625, -1.013031005859375, -0.95318603515625, -0.893341064453125, -0.83349609375, -0.773651123046875, -0.71380615234375, -0.653961181640625, -0.5941162109375, -0.534271240234375, -0.47442626953125, -0.414581298828125, -0.354736328125, -0.294891357421875, -0.23504638671875, -0.175201416015625, -0.1153564453125, -0.055511474609375, 0.00433349609375, 0.064178466796875, 0.1240234375, 0.183868408203125, 0.24371337890625, 0.303558349609375, 0.3634033203125, 0.423248291015625, 0.48309326171875, 0.542938232421875, 0.602783203125, 0.662628173828125, 0.72247314453125, 0.782318115234375, 0.8421630859375, 0.902008056640625, 0.96185302734375, 1.021697998046875, 1.08154296875, 1.141387939453125, 1.20123291015625, 1.261077880859375, 1.3209228515625, 1.380767822265625, 1.44061279296875, 1.500457763671875, 1.560302734375, 1.620147705078125, 1.67999267578125, 1.739837646484375, 1.7996826171875, 1.859527587890625, 1.91937255859375, 1.979217529296875, 2.0390625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 6.0, 29.0, 23.0, 54.0, 63.0, 66.0, 77.0, 104.0, 120.0, 91.0, 68.0, 71.0, 66.0, 45.0, 43.0, 22.0, 12.0, 13.0, 8.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53662109375, -0.5202102661132812, -0.5037994384765625, -0.48738861083984375, -0.470977783203125, -0.45456695556640625, -0.4381561279296875, -0.42174530029296875, -0.40533447265625, -0.38892364501953125, -0.3725128173828125, -0.35610198974609375, -0.339691162109375, -0.32328033447265625, -0.3068695068359375, -0.29045867919921875, -0.2740478515625, -0.25763702392578125, -0.2412261962890625, -0.22481536865234375, -0.208404541015625, -0.19199371337890625, -0.1755828857421875, -0.15917205810546875, -0.14276123046875, -0.12635040283203125, -0.1099395751953125, -0.09352874755859375, -0.077117919921875, -0.06070709228515625, -0.0442962646484375, -0.02788543701171875, -0.011474609375, 0.00493621826171875, 0.0213470458984375, 0.03775787353515625, 0.054168701171875, 0.07057952880859375, 0.0869903564453125, 0.10340118408203125, 0.11981201171875, 0.13622283935546875, 0.1526336669921875, 0.16904449462890625, 0.185455322265625, 0.20186614990234375, 0.2182769775390625, 0.23468780517578125, 0.2510986328125, 0.26750946044921875, 0.2839202880859375, 0.30033111572265625, 0.316741943359375, 0.33315277099609375, 0.3495635986328125, 0.36597442626953125, 0.38238525390625, 0.39879608154296875, 0.4152069091796875, 0.43161773681640625, 0.448028564453125, 0.46443939208984375, 0.4808502197265625, 0.49726104736328125, 0.513671875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 6.0, 5.0, 8.0, 7.0, 10.0, 20.0, 16.0, 31.0, 39.0, 46.0, 68.0, 127.0, 190.0, 337.0, 633.0, 1308.0, 2819.0, 7262.0, 21075.0, 78016.0, 328055.0, 443432.0, 118395.0, 29983.0, 9543.0, 3651.0, 1606.0, 792.0, 401.0, 228.0, 144.0, 87.0, 58.0, 30.0, 37.0, 19.0, 18.0, 6.0, 7.0, 11.0, 8.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.046875, -1.015289306640625, -0.98370361328125, -0.952117919921875, -0.9205322265625, -0.888946533203125, -0.85736083984375, -0.825775146484375, -0.794189453125, -0.762603759765625, -0.73101806640625, -0.699432373046875, -0.6678466796875, -0.636260986328125, -0.60467529296875, -0.573089599609375, -0.54150390625, -0.509918212890625, -0.47833251953125, -0.446746826171875, -0.4151611328125, -0.383575439453125, -0.35198974609375, -0.320404052734375, -0.288818359375, -0.257232666015625, -0.22564697265625, -0.194061279296875, -0.1624755859375, -0.130889892578125, -0.09930419921875, -0.067718505859375, -0.0361328125, -0.004547119140625, 0.02703857421875, 0.058624267578125, 0.0902099609375, 0.121795654296875, 0.15338134765625, 0.184967041015625, 0.216552734375, 0.248138427734375, 0.27972412109375, 0.311309814453125, 0.3428955078125, 0.374481201171875, 0.40606689453125, 0.437652587890625, 0.46923828125, 0.500823974609375, 0.53240966796875, 0.563995361328125, 0.5955810546875, 0.627166748046875, 0.65875244140625, 0.690338134765625, 0.721923828125, 0.753509521484375, 0.78509521484375, 0.816680908203125, 0.8482666015625, 0.879852294921875, 0.91143798828125, 0.943023681640625, 0.974609375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 3.0, 7.0, 7.0, 10.0, 13.0, 10.0, 14.0, 15.0, 24.0, 29.0, 29.0, 30.0, 48.0, 35.0, 22.0, 37.0, 54.0, 39.0, 52.0, 61.0, 49.0, 49.0, 51.0, 42.0, 49.0, 29.0, 32.0, 32.0, 26.0, 14.0, 10.0, 8.0, 20.0, 7.0, 4.0, 8.0, 8.0, 5.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.2451171875, -1.2060394287109375, -1.166961669921875, -1.1278839111328125, -1.08880615234375, -1.0497283935546875, -1.010650634765625, -0.9715728759765625, -0.9324951171875, -0.8934173583984375, -0.854339599609375, -0.8152618408203125, -0.77618408203125, -0.7371063232421875, -0.698028564453125, -0.6589508056640625, -0.619873046875, -0.5807952880859375, -0.541717529296875, -0.5026397705078125, -0.46356201171875, -0.4244842529296875, -0.385406494140625, -0.3463287353515625, -0.3072509765625, -0.2681732177734375, -0.229095458984375, -0.1900177001953125, -0.15093994140625, -0.1118621826171875, -0.072784423828125, -0.0337066650390625, 0.00537109375, 0.0444488525390625, 0.083526611328125, 0.1226043701171875, 0.16168212890625, 0.2007598876953125, 0.239837646484375, 0.2789154052734375, 0.3179931640625, 0.3570709228515625, 0.396148681640625, 0.4352264404296875, 0.47430419921875, 0.5133819580078125, 0.552459716796875, 0.5915374755859375, 0.630615234375, 0.6696929931640625, 0.708770751953125, 0.7478485107421875, 0.78692626953125, 0.8260040283203125, 0.865081787109375, 0.9041595458984375, 0.9432373046875, 0.9823150634765625, 1.021392822265625, 1.0604705810546875, 1.09954833984375, 1.1386260986328125, 1.177703857421875, 1.2167816162109375, 1.255859375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 4.0, 2.0, 5.0, 5.0, 5.0, 8.0, 11.0, 21.0, 19.0, 22.0, 27.0, 37.0, 65.0, 78.0, 144.0, 204.0, 335.0, 708.0, 1721.0, 7226.0, 136031.0, 869238.0, 26782.0, 3434.0, 1100.0, 517.0, 277.0, 151.0, 91.0, 66.0, 58.0, 36.0, 31.0, 27.0, 14.0, 22.0, 7.0, 6.0, 4.0, 8.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.26953125, -1.230194091796875, -1.19085693359375, -1.151519775390625, -1.1121826171875, -1.072845458984375, -1.03350830078125, -0.994171142578125, -0.954833984375, -0.915496826171875, -0.87615966796875, -0.836822509765625, -0.7974853515625, -0.758148193359375, -0.71881103515625, -0.679473876953125, -0.64013671875, -0.600799560546875, -0.56146240234375, -0.522125244140625, -0.4827880859375, -0.443450927734375, -0.40411376953125, -0.364776611328125, -0.325439453125, -0.286102294921875, -0.24676513671875, -0.207427978515625, -0.1680908203125, -0.128753662109375, -0.08941650390625, -0.050079345703125, -0.0107421875, 0.028594970703125, 0.06793212890625, 0.107269287109375, 0.1466064453125, 0.185943603515625, 0.22528076171875, 0.264617919921875, 0.303955078125, 0.343292236328125, 0.38262939453125, 0.421966552734375, 0.4613037109375, 0.500640869140625, 0.53997802734375, 0.579315185546875, 0.61865234375, 0.657989501953125, 0.69732666015625, 0.736663818359375, 0.7760009765625, 0.815338134765625, 0.85467529296875, 0.894012451171875, 0.933349609375, 0.972686767578125, 1.01202392578125, 1.051361083984375, 1.0906982421875, 1.130035400390625, 1.16937255859375, 1.208709716796875, 1.248046875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 6.0, 4.0, 6.0, 16.0, 15.0, 26.0, 18.0, 46.0, 37.0, 74.0, 93.0, 169.0, 151.0, 101.0, 67.0, 57.0, 29.0, 27.0, 16.0, 15.0, 11.0, 6.0, 7.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012373924255371094, -0.00011881440877914429, -0.00011388957500457764, -0.00010896474123001099, -0.00010403990745544434, -9.911507368087769e-05, -9.419023990631104e-05, -8.926540613174438e-05, -8.434057235717773e-05, -7.941573858261108e-05, -7.449090480804443e-05, -6.956607103347778e-05, -6.464123725891113e-05, -5.971640348434448e-05, -5.479156970977783e-05, -4.986673593521118e-05, -4.494190216064453e-05, -4.001706838607788e-05, -3.509223461151123e-05, -3.016740083694458e-05, -2.524256706237793e-05, -2.031773328781128e-05, -1.539289951324463e-05, -1.0468065738677979e-05, -5.543231964111328e-06, -6.183981895446777e-07, 4.306435585021973e-06, 9.231269359588623e-06, 1.4156103134155273e-05, 1.9080936908721924e-05, 2.4005770683288574e-05, 2.8930604457855225e-05, 3.3855438232421875e-05, 3.8780272006988525e-05, 4.3705105781555176e-05, 4.8629939556121826e-05, 5.3554773330688477e-05, 5.847960710525513e-05, 6.340444087982178e-05, 6.832927465438843e-05, 7.325410842895508e-05, 7.817894220352173e-05, 8.310377597808838e-05, 8.802860975265503e-05, 9.295344352722168e-05, 9.787827730178833e-05, 0.00010280311107635498, 0.00010772794485092163, 0.00011265277862548828, 0.00011757761240005493, 0.00012250244617462158, 0.00012742727994918823, 0.00013235211372375488, 0.00013727694749832153, 0.00014220178127288818, 0.00014712661504745483, 0.00015205144882202148, 0.00015697628259658813, 0.00016190111637115479, 0.00016682595014572144, 0.00017175078392028809, 0.00017667561769485474, 0.0001816004514694214, 0.00018652528524398804, 0.0001914501190185547]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 10.0, 10.0, 10.0, 5.0, 20.0, 38.0, 46.0, 76.0, 99.0, 215.0, 334.0, 791.0, 2008.0, 9883.0, 140306.0, 837899.0, 48612.0, 5360.0, 1462.0, 603.0, 261.0, 173.0, 111.0, 77.0, 49.0, 30.0, 24.0, 14.0, 10.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1611328125, -1.1262969970703125, -1.091461181640625, -1.0566253662109375, -1.02178955078125, -0.9869537353515625, -0.952117919921875, -0.9172821044921875, -0.8824462890625, -0.8476104736328125, -0.812774658203125, -0.7779388427734375, -0.74310302734375, -0.7082672119140625, -0.673431396484375, -0.6385955810546875, -0.603759765625, -0.5689239501953125, -0.534088134765625, -0.4992523193359375, -0.46441650390625, -0.4295806884765625, -0.394744873046875, -0.3599090576171875, -0.3250732421875, -0.2902374267578125, -0.255401611328125, -0.2205657958984375, -0.18572998046875, -0.1508941650390625, -0.116058349609375, -0.0812225341796875, -0.04638671875, -0.0115509033203125, 0.023284912109375, 0.0581207275390625, 0.09295654296875, 0.1277923583984375, 0.162628173828125, 0.1974639892578125, 0.2322998046875, 0.2671356201171875, 0.301971435546875, 0.3368072509765625, 0.37164306640625, 0.4064788818359375, 0.441314697265625, 0.4761505126953125, 0.510986328125, 0.5458221435546875, 0.580657958984375, 0.6154937744140625, 0.65032958984375, 0.6851654052734375, 0.720001220703125, 0.7548370361328125, 0.7896728515625, 0.8245086669921875, 0.859344482421875, 0.8941802978515625, 0.92901611328125, 0.9638519287109375, 0.998687744140625, 1.0335235595703125, 1.068359375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 8.0, 22.0, 21.0, 49.0, 64.0, 148.0, 297.0, 166.0, 88.0, 49.0, 34.0, 17.0, 8.0, 7.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8271484375, -0.787109375, -0.7470703125, -0.70703125, -0.6669921875, -0.626953125, -0.5869140625, -0.546875, -0.5068359375, -0.466796875, -0.4267578125, -0.38671875, -0.3466796875, -0.306640625, -0.2666015625, -0.2265625, -0.1865234375, -0.146484375, -0.1064453125, -0.06640625, -0.0263671875, 0.013671875, 0.0537109375, 0.09375, 0.1337890625, 0.173828125, 0.2138671875, 0.25390625, 0.2939453125, 0.333984375, 0.3740234375, 0.4140625, 0.4541015625, 0.494140625, 0.5341796875, 0.57421875, 0.6142578125, 0.654296875, 0.6943359375, 0.734375, 0.7744140625, 0.814453125, 0.8544921875, 0.89453125, 0.9345703125, 0.974609375, 1.0146484375, 1.0546875, 1.0947265625, 1.134765625, 1.1748046875, 1.21484375, 1.2548828125, 1.294921875, 1.3349609375, 1.375, 1.4150390625, 1.455078125, 1.4951171875, 1.53515625, 1.5751953125, 1.615234375, 1.6552734375, 1.6953125, 1.7353515625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 6.0, 12.0, 25.0, 41.0, 71.0, 109.0, 177.0, 175.0, 148.0, 94.0, 71.0, 31.0, 20.0, 11.0, 9.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.787625312805176, -10.432682037353516, -10.077739715576172, -9.722796440124512, -9.367854118347168, -9.012910842895508, -8.657968521118164, -8.303025245666504, -7.948082447052002, -7.5931396484375, -7.238196849822998, -6.883254051208496, -6.528310775756836, -6.173368453979492, -5.818425178527832, -5.46348237991333, -5.108539581298828, -4.753596782684326, -4.398653984069824, -4.043710708618164, -3.688768148422241, -3.3338253498077393, -2.978882312774658, -2.6239395141601562, -2.2689967155456543, -1.9140539169311523, -1.5591109991073608, -1.2041680812835693, -0.8492252826690674, -0.49428248405456543, -0.13933944702148438, 0.21560335159301758, 0.5705471038818359, 0.9254899621009827, 1.2804328203201294, 1.635375738143921, 1.9903185367584229, 2.345261335372925, 2.700204372406006, 3.055147171020508, 3.4100899696350098, 3.7650327682495117, 4.119975566864014, 4.474918365478516, 4.829861640930176, 5.1848039627075195, 5.53974723815918, 5.894690036773682, 6.249632835388184, 6.6045756340026855, 6.9595184326171875, 7.314461708068848, 7.669404029846191, 8.024347305297852, 8.379289627075195, 8.734232902526855, 9.089176177978516, 9.444119453430176, 9.79906177520752, 10.15400505065918, 10.508947372436523, 10.863890647888184, 11.218833923339844, 11.573776245117188, 11.928718566894531]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 8.0, 3.0, 3.0, 4.0, 11.0, 14.0, 13.0, 24.0, 26.0, 26.0, 46.0, 40.0, 42.0, 51.0, 44.0, 43.0, 54.0, 46.0, 46.0, 55.0, 51.0, 43.0, 37.0, 42.0, 38.0, 35.0, 37.0, 27.0, 15.0, 18.0, 11.0, 13.0, 8.0, 8.0, 4.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.879934310913086, -8.626358985900879, -8.372784614562988, -8.119209289550781, -7.865634918212891, -7.612059593200684, -7.358484745025635, -7.104909896850586, -6.851335048675537, -6.597760200500488, -6.3441853523254395, -6.090610504150391, -5.837035179138184, -5.583460807800293, -5.329885482788086, -5.076310634613037, -4.822735786437988, -4.5691609382629395, -4.315586090087891, -4.062011241912842, -3.808436155319214, -3.554861307144165, -3.301286220550537, -3.0477113723754883, -2.7941365242004395, -2.5405616760253906, -2.286986827850342, -2.033411741256714, -1.779836893081665, -1.5262620449066162, -1.2726870775222778, -1.0191121101379395, -0.765538215637207, -0.5119633078575134, -0.2583884000778198, -0.004813492298126221, 0.24876141548156738, 0.5023362636566162, 0.7559112310409546, 1.009486198425293, 1.2630610466003418, 1.5166358947753906, 1.770210862159729, 2.0237858295440674, 2.277360677719116, 2.530935525894165, 2.784510612487793, 3.038085460662842, 3.2916603088378906, 3.5452351570129395, 3.7988100051879883, 4.052384853363037, 4.305959701538086, 4.559535026550293, 4.813109874725342, 5.066684722900391, 5.3202595710754395, 5.573834419250488, 5.827409267425537, 6.080984115600586, 6.334559440612793, 6.588133811950684, 6.841709136962891, 7.0952839851379395, 7.348858833312988]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 11.0, 6.0, 15.0, 36.0, 59.0, 99.0, 180.0, 370.0, 1084.0, 4502.0, 43159.0, 4034976.0, 100237.0, 7023.0, 1491.0, 510.0, 217.0, 120.0, 69.0, 34.0, 28.0, 17.0, 10.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.357421875, -3.26043701171875, -3.1634521484375, -3.06646728515625, -2.969482421875, -2.87249755859375, -2.7755126953125, -2.67852783203125, -2.58154296875, -2.48455810546875, -2.3875732421875, -2.29058837890625, -2.193603515625, -2.09661865234375, -1.9996337890625, -1.90264892578125, -1.8056640625, -1.70867919921875, -1.6116943359375, -1.51470947265625, -1.417724609375, -1.32073974609375, -1.2237548828125, -1.12677001953125, -1.02978515625, -0.93280029296875, -0.8358154296875, -0.73883056640625, -0.641845703125, -0.54486083984375, -0.4478759765625, -0.35089111328125, -0.25390625, -0.15692138671875, -0.0599365234375, 0.03704833984375, 0.134033203125, 0.23101806640625, 0.3280029296875, 0.42498779296875, 0.52197265625, 0.61895751953125, 0.7159423828125, 0.81292724609375, 0.909912109375, 1.00689697265625, 1.1038818359375, 1.20086669921875, 1.2978515625, 1.39483642578125, 1.4918212890625, 1.58880615234375, 1.685791015625, 1.78277587890625, 1.8797607421875, 1.97674560546875, 2.07373046875, 2.17071533203125, 2.2677001953125, 2.36468505859375, 2.461669921875, 2.55865478515625, 2.6556396484375, 2.75262451171875, 2.849609375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 6.0, 2.0, 4.0, 7.0, 11.0, 26.0, 30.0, 48.0, 53.0, 70.0, 91.0, 85.0, 83.0, 84.0, 81.0, 68.0, 66.0, 49.0, 37.0, 39.0, 25.0, 11.0, 11.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57763671875, -0.5605926513671875, -0.543548583984375, -0.5265045166015625, -0.50946044921875, -0.4924163818359375, -0.475372314453125, -0.4583282470703125, -0.4412841796875, -0.4242401123046875, -0.407196044921875, -0.3901519775390625, -0.37310791015625, -0.3560638427734375, -0.339019775390625, -0.3219757080078125, -0.304931640625, -0.2878875732421875, -0.270843505859375, -0.2537994384765625, -0.23675537109375, -0.2197113037109375, -0.202667236328125, -0.1856231689453125, -0.1685791015625, -0.1515350341796875, -0.134490966796875, -0.1174468994140625, -0.10040283203125, -0.0833587646484375, -0.066314697265625, -0.0492706298828125, -0.0322265625, -0.0151824951171875, 0.001861572265625, 0.0189056396484375, 0.03594970703125, 0.0529937744140625, 0.070037841796875, 0.0870819091796875, 0.1041259765625, 0.1211700439453125, 0.138214111328125, 0.1552581787109375, 0.17230224609375, 0.1893463134765625, 0.206390380859375, 0.2234344482421875, 0.240478515625, 0.2575225830078125, 0.274566650390625, 0.2916107177734375, 0.30865478515625, 0.3256988525390625, 0.342742919921875, 0.3597869873046875, 0.3768310546875, 0.3938751220703125, 0.410919189453125, 0.4279632568359375, 0.44500732421875, 0.4620513916015625, 0.479095458984375, 0.4961395263671875, 0.51318359375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 3.0, 12.0, 13.0, 18.0, 15.0, 29.0, 33.0, 33.0, 72.0, 83.0, 158.0, 320.0, 824.0, 3180.0, 20133.0, 963431.0, 3171732.0, 28346.0, 3997.0, 999.0, 361.0, 145.0, 92.0, 65.0, 45.0, 25.0, 19.0, 26.0, 21.0, 13.0, 10.0, 4.0, 8.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8671875, -1.7982177734375, -1.729248046875, -1.6602783203125, -1.59130859375, -1.5223388671875, -1.453369140625, -1.3843994140625, -1.3154296875, -1.2464599609375, -1.177490234375, -1.1085205078125, -1.03955078125, -0.9705810546875, -0.901611328125, -0.8326416015625, -0.763671875, -0.6947021484375, -0.625732421875, -0.5567626953125, -0.48779296875, -0.4188232421875, -0.349853515625, -0.2808837890625, -0.2119140625, -0.1429443359375, -0.073974609375, -0.0050048828125, 0.06396484375, 0.1329345703125, 0.201904296875, 0.2708740234375, 0.33984375, 0.4088134765625, 0.477783203125, 0.5467529296875, 0.61572265625, 0.6846923828125, 0.753662109375, 0.8226318359375, 0.8916015625, 0.9605712890625, 1.029541015625, 1.0985107421875, 1.16748046875, 1.2364501953125, 1.305419921875, 1.3743896484375, 1.443359375, 1.5123291015625, 1.581298828125, 1.6502685546875, 1.71923828125, 1.7882080078125, 1.857177734375, 1.9261474609375, 1.9951171875, 2.0640869140625, 2.133056640625, 2.2020263671875, 2.27099609375, 2.3399658203125, 2.408935546875, 2.4779052734375, 2.546875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 9.0, 2.0, 9.0, 14.0, 38.0, 85.0, 218.0, 1660.0, 1670.0, 222.0, 68.0, 35.0, 20.0, 21.0, 4.0, 2.0, 4.0, 4.0], "bins": [-2.130859375, -2.091400146484375, -2.05194091796875, -2.012481689453125, -1.9730224609375, -1.933563232421875, -1.89410400390625, -1.854644775390625, -1.815185546875, -1.775726318359375, -1.73626708984375, -1.696807861328125, -1.6573486328125, -1.617889404296875, -1.57843017578125, -1.538970947265625, -1.49951171875, -1.460052490234375, -1.42059326171875, -1.381134033203125, -1.3416748046875, -1.302215576171875, -1.26275634765625, -1.223297119140625, -1.183837890625, -1.144378662109375, -1.10491943359375, -1.065460205078125, -1.0260009765625, -0.986541748046875, -0.94708251953125, -0.907623291015625, -0.8681640625, -0.828704833984375, -0.78924560546875, -0.749786376953125, -0.7103271484375, -0.670867919921875, -0.63140869140625, -0.591949462890625, -0.552490234375, -0.513031005859375, -0.47357177734375, -0.434112548828125, -0.3946533203125, -0.355194091796875, -0.31573486328125, -0.276275634765625, -0.23681640625, -0.197357177734375, -0.15789794921875, -0.118438720703125, -0.0789794921875, -0.039520263671875, -6.103515625e-05, 0.039398193359375, 0.078857421875, 0.118316650390625, 0.15777587890625, 0.197235107421875, 0.2366943359375, 0.276153564453125, 0.31561279296875, 0.355072021484375, 0.39453125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 9.0, 42.0, 126.0, 375.0, 318.0, 94.0, 34.0, 9.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.23236083984375, -12.950109481811523, -12.667858123779297, -12.385607719421387, -12.10335636138916, -11.821105003356934, -11.538854598999023, -11.256603240966797, -10.97435188293457, -10.692100524902344, -10.409849166870117, -10.127598762512207, -9.84534740447998, -9.563096046447754, -9.280845642089844, -8.998594284057617, -8.71634292602539, -8.434091567993164, -8.151840209960938, -7.869589805603027, -7.587338447570801, -7.305087089538574, -7.022836208343506, -6.7405853271484375, -6.458333969116211, -6.176082611083984, -5.893831729888916, -5.611580848693848, -5.329329490661621, -5.0470781326293945, -4.764827251434326, -4.482576370239258, -4.200324058532715, -3.9180729389190674, -3.63582181930542, -3.3535706996917725, -3.071319580078125, -2.7890684604644775, -2.50681734085083, -2.2245662212371826, -1.9423151016235352, -1.6600639820098877, -1.3778128623962402, -1.0955617427825928, -0.8133106231689453, -0.5310595035552979, -0.2488083839416504, 0.03344273567199707, 0.31569385528564453, 0.597944974899292, 0.8801960945129395, 1.162447214126587, 1.4446983337402344, 1.7269494533538818, 2.0092005729675293, 2.2914516925811768, 2.573702812194824, 2.8559539318084717, 3.138205051422119, 3.4204561710357666, 3.702707290649414, 3.9849584102630615, 4.267209529876709, 4.549460411071777, 4.831711769104004]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 4.0, 6.0, 6.0, 8.0, 7.0, 11.0, 11.0, 6.0, 18.0, 27.0, 17.0, 16.0, 26.0, 28.0, 34.0, 28.0, 39.0, 33.0, 41.0, 40.0, 45.0, 47.0, 32.0, 29.0, 34.0, 32.0, 44.0, 42.0, 39.0, 27.0, 31.0, 18.0, 31.0, 22.0, 17.0, 15.0, 21.0, 5.0, 10.0, 16.0, 8.0, 4.0, 8.0, 5.0, 5.0, 4.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.8610910177230835, -1.8044270277023315, -1.7477630376815796, -1.6910990476608276, -1.6344350576400757, -1.5777710676193237, -1.5211070775985718, -1.4644430875778198, -1.4077790975570679, -1.351115107536316, -1.294451117515564, -1.237787127494812, -1.18112313747406, -1.124459147453308, -1.0677951574325562, -1.0111311674118042, -0.9544671773910522, -0.8978031873703003, -0.8411391973495483, -0.7844752073287964, -0.7278112173080444, -0.6711472272872925, -0.6144832372665405, -0.5578192472457886, -0.5011552572250366, -0.44449126720428467, -0.3878272771835327, -0.33116328716278076, -0.2744992971420288, -0.21783530712127686, -0.1611713171005249, -0.10450732707977295, -0.04784345626831055, 0.008820533752441406, 0.06548452377319336, 0.12214851379394531, 0.17881250381469727, 0.23547649383544922, 0.29214048385620117, 0.3488044738769531, 0.4054684638977051, 0.46213245391845703, 0.518796443939209, 0.5754604339599609, 0.6321244239807129, 0.6887884140014648, 0.7454524040222168, 0.8021163940429688, 0.8587803840637207, 0.9154443740844727, 0.9721083641052246, 1.0287723541259766, 1.0854363441467285, 1.1421003341674805, 1.1987643241882324, 1.2554283142089844, 1.3120923042297363, 1.3687562942504883, 1.4254202842712402, 1.4820842742919922, 1.5387482643127441, 1.595412254333496, 1.652076244354248, 1.708740234375, 1.765404224395752]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 5.0, 2.0, 9.0, 5.0, 17.0, 21.0, 31.0, 45.0, 74.0, 123.0, 223.0, 357.0, 651.0, 1271.0, 2592.0, 6461.0, 19518.0, 75292.0, 333347.0, 449083.0, 115817.0, 28388.0, 8597.0, 3275.0, 1568.0, 739.0, 388.0, 247.0, 163.0, 83.0, 40.0, 40.0, 26.0, 19.0, 9.0, 8.0, 4.0, 5.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4736328125, -1.4263153076171875, -1.378997802734375, -1.3316802978515625, -1.28436279296875, -1.2370452880859375, -1.189727783203125, -1.1424102783203125, -1.0950927734375, -1.0477752685546875, -1.000457763671875, -0.9531402587890625, -0.90582275390625, -0.8585052490234375, -0.811187744140625, -0.7638702392578125, -0.716552734375, -0.6692352294921875, -0.621917724609375, -0.5746002197265625, -0.52728271484375, -0.4799652099609375, -0.432647705078125, -0.3853302001953125, -0.3380126953125, -0.2906951904296875, -0.243377685546875, -0.1960601806640625, -0.14874267578125, -0.1014251708984375, -0.054107666015625, -0.0067901611328125, 0.04052734375, 0.0878448486328125, 0.135162353515625, 0.1824798583984375, 0.22979736328125, 0.2771148681640625, 0.324432373046875, 0.3717498779296875, 0.4190673828125, 0.4663848876953125, 0.513702392578125, 0.5610198974609375, 0.60833740234375, 0.6556549072265625, 0.702972412109375, 0.7502899169921875, 0.797607421875, 0.8449249267578125, 0.892242431640625, 0.9395599365234375, 0.98687744140625, 1.0341949462890625, 1.081512451171875, 1.1288299560546875, 1.1761474609375, 1.2234649658203125, 1.270782470703125, 1.3180999755859375, 1.36541748046875, 1.4127349853515625, 1.460052490234375, 1.5073699951171875, 1.5546875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 3.0, 2.0, 5.0, 6.0, 6.0, 17.0, 18.0, 32.0, 45.0, 47.0, 68.0, 73.0, 83.0, 82.0, 74.0, 93.0, 64.0, 69.0, 57.0, 33.0, 40.0, 28.0, 24.0, 16.0, 4.0, 6.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.580078125, -0.5631027221679688, -0.5461273193359375, -0.5291519165039062, -0.512176513671875, -0.49520111083984375, -0.4782257080078125, -0.46125030517578125, -0.44427490234375, -0.42729949951171875, -0.4103240966796875, -0.39334869384765625, -0.376373291015625, -0.35939788818359375, -0.3424224853515625, -0.32544708251953125, -0.3084716796875, -0.29149627685546875, -0.2745208740234375, -0.25754547119140625, -0.240570068359375, -0.22359466552734375, -0.2066192626953125, -0.18964385986328125, -0.17266845703125, -0.15569305419921875, -0.1387176513671875, -0.12174224853515625, -0.104766845703125, -0.08779144287109375, -0.0708160400390625, -0.05384063720703125, -0.036865234375, -0.01988983154296875, -0.0029144287109375, 0.01406097412109375, 0.031036376953125, 0.04801177978515625, 0.0649871826171875, 0.08196258544921875, 0.09893798828125, 0.11591339111328125, 0.1328887939453125, 0.14986419677734375, 0.166839599609375, 0.18381500244140625, 0.2007904052734375, 0.21776580810546875, 0.2347412109375, 0.25171661376953125, 0.2686920166015625, 0.28566741943359375, 0.302642822265625, 0.31961822509765625, 0.3365936279296875, 0.35356903076171875, 0.37054443359375, 0.38751983642578125, 0.4044952392578125, 0.42147064208984375, 0.438446044921875, 0.45542144775390625, 0.4723968505859375, 0.48937225341796875, 0.50634765625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 7.0, 8.0, 5.0, 7.0, 16.0, 22.0, 31.0, 45.0, 98.0, 175.0, 307.0, 642.0, 1449.0, 3954.0, 15521.0, 96012.0, 655270.0, 234540.0, 30184.0, 6482.0, 2156.0, 774.0, 373.0, 181.0, 119.0, 64.0, 44.0, 25.0, 14.0, 8.0, 9.0, 8.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.201171875, -2.1358489990234375, -2.070526123046875, -2.0052032470703125, -1.93988037109375, -1.8745574951171875, -1.809234619140625, -1.7439117431640625, -1.6785888671875, -1.6132659912109375, -1.547943115234375, -1.4826202392578125, -1.41729736328125, -1.3519744873046875, -1.286651611328125, -1.2213287353515625, -1.156005859375, -1.0906829833984375, -1.025360107421875, -0.9600372314453125, -0.89471435546875, -0.8293914794921875, -0.764068603515625, -0.6987457275390625, -0.6334228515625, -0.5680999755859375, -0.502777099609375, -0.4374542236328125, -0.37213134765625, -0.3068084716796875, -0.241485595703125, -0.1761627197265625, -0.11083984375, -0.0455169677734375, 0.019805908203125, 0.0851287841796875, 0.15045166015625, 0.2157745361328125, 0.281097412109375, 0.3464202880859375, 0.4117431640625, 0.4770660400390625, 0.542388916015625, 0.6077117919921875, 0.67303466796875, 0.7383575439453125, 0.803680419921875, 0.8690032958984375, 0.934326171875, 0.9996490478515625, 1.064971923828125, 1.1302947998046875, 1.19561767578125, 1.2609405517578125, 1.326263427734375, 1.3915863037109375, 1.4569091796875, 1.5222320556640625, 1.587554931640625, 1.6528778076171875, 1.71820068359375, 1.7835235595703125, 1.848846435546875, 1.9141693115234375, 1.9794921875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 6.0, 6.0, 3.0, 2.0, 12.0, 6.0, 7.0, 14.0, 18.0, 23.0, 22.0, 20.0, 22.0, 29.0, 36.0, 32.0, 35.0, 35.0, 35.0, 49.0, 53.0, 47.0, 41.0, 47.0, 42.0, 49.0, 36.0, 42.0, 37.0, 29.0, 25.0, 28.0, 19.0, 19.0, 14.0, 6.0, 6.0, 7.0, 12.0, 6.0, 9.0, 3.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7705078125, -1.71588134765625, -1.6612548828125, -1.60662841796875, -1.552001953125, -1.49737548828125, -1.4427490234375, -1.38812255859375, -1.33349609375, -1.27886962890625, -1.2242431640625, -1.16961669921875, -1.114990234375, -1.06036376953125, -1.0057373046875, -0.95111083984375, -0.896484375, -0.84185791015625, -0.7872314453125, -0.73260498046875, -0.677978515625, -0.62335205078125, -0.5687255859375, -0.51409912109375, -0.45947265625, -0.40484619140625, -0.3502197265625, -0.29559326171875, -0.240966796875, -0.18634033203125, -0.1317138671875, -0.07708740234375, -0.0224609375, 0.03216552734375, 0.0867919921875, 0.14141845703125, 0.196044921875, 0.25067138671875, 0.3052978515625, 0.35992431640625, 0.41455078125, 0.46917724609375, 0.5238037109375, 0.57843017578125, 0.633056640625, 0.68768310546875, 0.7423095703125, 0.79693603515625, 0.8515625, 0.90618896484375, 0.9608154296875, 1.01544189453125, 1.070068359375, 1.12469482421875, 1.1793212890625, 1.23394775390625, 1.28857421875, 1.34320068359375, 1.3978271484375, 1.45245361328125, 1.507080078125, 1.56170654296875, 1.6163330078125, 1.67095947265625, 1.7255859375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 10.0, 6.0, 15.0, 12.0, 18.0, 20.0, 43.0, 61.0, 136.0, 225.0, 446.0, 1063.0, 3086.0, 14497.0, 155058.0, 751695.0, 106612.0, 11161.0, 2563.0, 916.0, 415.0, 194.0, 111.0, 62.0, 35.0, 29.0, 27.0, 15.0, 11.0, 7.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.98876953125, -0.960052490234375, -0.93133544921875, -0.902618408203125, -0.8739013671875, -0.845184326171875, -0.81646728515625, -0.787750244140625, -0.759033203125, -0.730316162109375, -0.70159912109375, -0.672882080078125, -0.6441650390625, -0.615447998046875, -0.58673095703125, -0.558013916015625, -0.529296875, -0.500579833984375, -0.47186279296875, -0.443145751953125, -0.4144287109375, -0.385711669921875, -0.35699462890625, -0.328277587890625, -0.299560546875, -0.270843505859375, -0.24212646484375, -0.213409423828125, -0.1846923828125, -0.155975341796875, -0.12725830078125, -0.098541259765625, -0.06982421875, -0.041107177734375, -0.01239013671875, 0.016326904296875, 0.0450439453125, 0.073760986328125, 0.10247802734375, 0.131195068359375, 0.159912109375, 0.188629150390625, 0.21734619140625, 0.246063232421875, 0.2747802734375, 0.303497314453125, 0.33221435546875, 0.360931396484375, 0.3896484375, 0.418365478515625, 0.44708251953125, 0.475799560546875, 0.5045166015625, 0.533233642578125, 0.56195068359375, 0.590667724609375, 0.619384765625, 0.648101806640625, 0.67681884765625, 0.705535888671875, 0.7342529296875, 0.762969970703125, 0.79168701171875, 0.820404052734375, 0.84912109375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 5.0, 3.0, 5.0, 5.0, 11.0, 16.0, 19.0, 31.0, 43.0, 54.0, 71.0, 118.0, 99.0, 122.0, 80.0, 106.0, 61.0, 59.0, 31.0, 14.0, 16.0, 9.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00018537044525146484, -0.00018038414418697357, -0.0001753978431224823, -0.00017041154205799103, -0.00016542524099349976, -0.00016043893992900848, -0.0001554526388645172, -0.00015046633780002594, -0.00014548003673553467, -0.0001404937356710434, -0.00013550743460655212, -0.00013052113354206085, -0.00012553483247756958, -0.00012054853141307831, -0.00011556223034858704, -0.00011057592928409576, -0.00010558962821960449, -0.00010060332715511322, -9.561702609062195e-05, -9.063072502613068e-05, -8.56444239616394e-05, -8.065812289714813e-05, -7.567182183265686e-05, -7.068552076816559e-05, -6.569921970367432e-05, -6.0712918639183044e-05, -5.572661757469177e-05, -5.07403165102005e-05, -4.575401544570923e-05, -4.0767714381217957e-05, -3.5781413316726685e-05, -3.079511225223541e-05, -2.580881118774414e-05, -2.082251012325287e-05, -1.5836209058761597e-05, -1.0849907994270325e-05, -5.863606929779053e-06, -8.773058652877808e-07, 4.108995199203491e-06, 9.095296263694763e-06, 1.4081597328186035e-05, 1.9067898392677307e-05, 2.405419945716858e-05, 2.904050052165985e-05, 3.402680158615112e-05, 3.9013102650642395e-05, 4.399940371513367e-05, 4.898570477962494e-05, 5.397200584411621e-05, 5.895830690860748e-05, 6.394460797309875e-05, 6.893090903759003e-05, 7.39172101020813e-05, 7.890351116657257e-05, 8.388981223106384e-05, 8.887611329555511e-05, 9.386241436004639e-05, 9.884871542453766e-05, 0.00010383501648902893, 0.0001088213175535202, 0.00011380761861801147, 0.00011879391968250275, 0.00012378022074699402, 0.0001287665218114853, 0.00013375282287597656]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 10.0, 4.0, 10.0, 13.0, 18.0, 28.0, 30.0, 52.0, 94.0, 187.0, 287.0, 676.0, 1573.0, 4420.0, 16087.0, 78242.0, 419325.0, 423530.0, 80104.0, 16306.0, 4507.0, 1556.0, 689.0, 324.0, 201.0, 109.0, 62.0, 44.0, 25.0, 13.0, 7.0, 8.0, 6.0, 1.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57275390625, -0.5536651611328125, -0.534576416015625, -0.5154876708984375, -0.49639892578125, -0.4773101806640625, -0.458221435546875, -0.4391326904296875, -0.4200439453125, -0.4009552001953125, -0.381866455078125, -0.3627777099609375, -0.34368896484375, -0.3246002197265625, -0.305511474609375, -0.2864227294921875, -0.267333984375, -0.2482452392578125, -0.229156494140625, -0.2100677490234375, -0.19097900390625, -0.1718902587890625, -0.152801513671875, -0.1337127685546875, -0.1146240234375, -0.0955352783203125, -0.076446533203125, -0.0573577880859375, -0.03826904296875, -0.0191802978515625, -9.1552734375e-05, 0.0189971923828125, 0.0380859375, 0.0571746826171875, 0.076263427734375, 0.0953521728515625, 0.11444091796875, 0.1335296630859375, 0.152618408203125, 0.1717071533203125, 0.1907958984375, 0.2098846435546875, 0.228973388671875, 0.2480621337890625, 0.26715087890625, 0.2862396240234375, 0.305328369140625, 0.3244171142578125, 0.343505859375, 0.3625946044921875, 0.381683349609375, 0.4007720947265625, 0.41986083984375, 0.4389495849609375, 0.458038330078125, 0.4771270751953125, 0.4962158203125, 0.5153045654296875, 0.534393310546875, 0.5534820556640625, 0.57257080078125, 0.5916595458984375, 0.610748291015625, 0.6298370361328125, 0.64892578125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 8.0, 9.0, 11.0, 6.0, 21.0, 17.0, 20.0, 40.0, 40.0, 40.0, 62.0, 76.0, 95.0, 99.0, 87.0, 89.0, 59.0, 55.0, 43.0, 26.0, 27.0, 18.0, 11.0, 9.0, 7.0, 9.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6494140625, -0.6286773681640625, -0.607940673828125, -0.5872039794921875, -0.56646728515625, -0.5457305908203125, -0.524993896484375, -0.5042572021484375, -0.4835205078125, -0.4627838134765625, -0.442047119140625, -0.4213104248046875, -0.40057373046875, -0.3798370361328125, -0.359100341796875, -0.3383636474609375, -0.317626953125, -0.2968902587890625, -0.276153564453125, -0.2554168701171875, -0.23468017578125, -0.2139434814453125, -0.193206787109375, -0.1724700927734375, -0.1517333984375, -0.1309967041015625, -0.110260009765625, -0.0895233154296875, -0.06878662109375, -0.0480499267578125, -0.027313232421875, -0.0065765380859375, 0.01416015625, 0.0348968505859375, 0.055633544921875, 0.0763702392578125, 0.09710693359375, 0.1178436279296875, 0.138580322265625, 0.1593170166015625, 0.1800537109375, 0.2007904052734375, 0.221527099609375, 0.2422637939453125, 0.26300048828125, 0.2837371826171875, 0.304473876953125, 0.3252105712890625, 0.345947265625, 0.3666839599609375, 0.387420654296875, 0.4081573486328125, 0.42889404296875, 0.4496307373046875, 0.470367431640625, 0.4911041259765625, 0.5118408203125, 0.5325775146484375, 0.553314208984375, 0.5740509033203125, 0.59478759765625, 0.6155242919921875, 0.636260986328125, 0.6569976806640625, 0.677734375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 7.0, 36.0, 71.0, 136.0, 228.0, 224.0, 146.0, 86.0, 32.0, 19.0, 11.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.579538345336914, -6.029973030090332, -5.48040771484375, -4.930842399597168, -4.381277084350586, -3.831711530685425, -3.2821459770202637, -2.7325806617736816, -2.1830153465270996, -1.6334500312805176, -1.083884596824646, -0.5343191623687744, 0.015246152877807617, 0.5648114681243896, 1.1143770217895508, 1.6639423370361328, 2.213507652282715, 2.763072967529297, 3.312638282775879, 3.86220383644104, 4.411768913269043, 4.961334228515625, 5.510900020599365, 6.060465335845947, 6.610030651092529, 7.159595966339111, 7.709161281585693, 8.258727073669434, 8.808292388916016, 9.357857704162598, 9.90742301940918, 10.456988334655762, 11.006553649902344, 11.556118965148926, 12.105684280395508, 12.65524959564209, 13.204814910888672, 13.754380226135254, 14.303945541381836, 14.853511810302734, 15.403076171875, 15.952641487121582, 16.502206802368164, 17.051773071289062, 17.601337432861328, 18.150903701782227, 18.700468063354492, 19.25003433227539, 19.799598693847656, 20.349164962768555, 20.89872932434082, 21.44829559326172, 21.997859954833984, 22.547426223754883, 23.09699058532715, 23.646556854248047, 24.196123123168945, 24.745689392089844, 25.29525375366211, 25.844820022583008, 26.394384384155273, 26.943950653076172, 27.493515014648438, 28.043081283569336, 28.5926456451416]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 6.0, 2.0, 7.0, 4.0, 9.0, 12.0, 18.0, 25.0, 29.0, 24.0, 26.0, 56.0, 42.0, 53.0, 65.0, 48.0, 44.0, 52.0, 60.0, 59.0, 57.0, 50.0, 42.0, 36.0, 34.0, 23.0, 26.0, 23.0, 17.0, 11.0, 9.0, 9.0, 4.0, 7.0, 2.0, 4.0, 2.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.830204010009766, -11.503683090209961, -11.177162170410156, -10.850641250610352, -10.524120330810547, -10.197599411010742, -9.871078491210938, -9.544556617736816, -9.218035697937012, -8.891514778137207, -8.564993858337402, -8.238472938537598, -7.911951541900635, -7.58543062210083, -7.258909702301025, -6.9323883056640625, -6.605867862701416, -6.279346942901611, -5.952826023101807, -5.626304626464844, -5.299783706665039, -4.973262786865234, -4.64674186706543, -4.320220947265625, -3.993699789047241, -3.6671788692474365, -3.3406577110290527, -3.014136791229248, -2.6876158714294434, -2.3610947132110596, -2.034573793411255, -1.708052635192871, -1.3815317153930664, -1.0550106763839722, -0.7284896969795227, -0.40196871757507324, -0.075447678565979, 0.25107336044311523, 0.5775942802429199, 0.9041154384613037, 1.2306363582611084, 1.5571573972702026, 1.8836784362792969, 2.2101993560791016, 2.5367202758789062, 2.86324143409729, 3.1897623538970947, 3.5162835121154785, 3.842804431915283, 4.169325351715088, 4.495846271514893, 4.8223676681518555, 5.14888858795166, 5.475409507751465, 5.8019304275512695, 6.128451347351074, 6.454972267150879, 6.781493186950684, 7.108014106750488, 7.434535026550293, 7.761056423187256, 8.087577819824219, 8.414098739624023, 8.740619659423828, 9.067140579223633]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 7.0, 9.0, 15.0, 29.0, 45.0, 55.0, 129.0, 185.0, 534.0, 3824.0, 3831490.0, 354058.0, 2954.0, 481.0, 214.0, 94.0, 54.0, 42.0, 22.0, 20.0, 6.0, 7.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.724609375, -3.581085205078125, -3.43756103515625, -3.294036865234375, -3.1505126953125, -3.006988525390625, -2.86346435546875, -2.719940185546875, -2.576416015625, -2.432891845703125, -2.28936767578125, -2.145843505859375, -2.0023193359375, -1.858795166015625, -1.71527099609375, -1.571746826171875, -1.42822265625, -1.284698486328125, -1.14117431640625, -0.997650146484375, -0.8541259765625, -0.710601806640625, -0.56707763671875, -0.423553466796875, -0.280029296875, -0.136505126953125, 0.00701904296875, 0.150543212890625, 0.2940673828125, 0.437591552734375, 0.58111572265625, 0.724639892578125, 0.8681640625, 1.011688232421875, 1.15521240234375, 1.298736572265625, 1.4422607421875, 1.585784912109375, 1.72930908203125, 1.872833251953125, 2.016357421875, 2.159881591796875, 2.30340576171875, 2.446929931640625, 2.5904541015625, 2.733978271484375, 2.87750244140625, 3.021026611328125, 3.16455078125, 3.308074951171875, 3.45159912109375, 3.595123291015625, 3.7386474609375, 3.882171630859375, 4.02569580078125, 4.169219970703125, 4.312744140625, 4.456268310546875, 4.59979248046875, 4.743316650390625, 4.8868408203125, 5.030364990234375, 5.17388916015625, 5.317413330078125, 5.4609375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 8.0, 2.0, 1.0, 7.0, 10.0, 12.0, 20.0, 38.0, 30.0, 44.0, 51.0, 67.0, 77.0, 71.0, 77.0, 78.0, 76.0, 63.0, 54.0, 41.0, 47.0, 32.0, 40.0, 10.0, 9.0, 14.0, 3.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63134765625, -0.6131668090820312, -0.5949859619140625, -0.5768051147460938, -0.558624267578125, -0.5404434204101562, -0.5222625732421875, -0.5040817260742188, -0.48590087890625, -0.46772003173828125, -0.4495391845703125, -0.43135833740234375, -0.413177490234375, -0.39499664306640625, -0.3768157958984375, -0.35863494873046875, -0.3404541015625, -0.32227325439453125, -0.3040924072265625, -0.28591156005859375, -0.267730712890625, -0.24954986572265625, -0.2313690185546875, -0.21318817138671875, -0.19500732421875, -0.17682647705078125, -0.1586456298828125, -0.14046478271484375, -0.122283935546875, -0.10410308837890625, -0.0859222412109375, -0.06774139404296875, -0.049560546875, -0.03137969970703125, -0.0131988525390625, 0.00498199462890625, 0.023162841796875, 0.04134368896484375, 0.0595245361328125, 0.07770538330078125, 0.09588623046875, 0.11406707763671875, 0.1322479248046875, 0.15042877197265625, 0.168609619140625, 0.18679046630859375, 0.2049713134765625, 0.22315216064453125, 0.2413330078125, 0.25951385498046875, 0.2776947021484375, 0.29587554931640625, 0.314056396484375, 0.33223724365234375, 0.3504180908203125, 0.36859893798828125, 0.38677978515625, 0.40496063232421875, 0.4231414794921875, 0.44132232666015625, 0.459503173828125, 0.47768402099609375, 0.4958648681640625, 0.5140457153320312, 0.5322265625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 0.0, 4.0, 5.0, 2.0, 16.0, 12.0, 18.0, 18.0, 30.0, 36.0, 47.0, 68.0, 107.0, 149.0, 245.0, 394.0, 853.0, 2133.0, 7707.0, 51485.0, 3929039.0, 181067.0, 14463.0, 3559.0, 1277.0, 583.0, 292.0, 186.0, 112.0, 90.0, 73.0, 44.0, 39.0, 26.0, 27.0, 15.0, 16.0, 15.0, 8.0, 6.0, 3.0, 6.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.455078125, -1.40057373046875, -1.3460693359375, -1.29156494140625, -1.237060546875, -1.18255615234375, -1.1280517578125, -1.07354736328125, -1.01904296875, -0.96453857421875, -0.9100341796875, -0.85552978515625, -0.801025390625, -0.74652099609375, -0.6920166015625, -0.63751220703125, -0.5830078125, -0.52850341796875, -0.4739990234375, -0.41949462890625, -0.364990234375, -0.31048583984375, -0.2559814453125, -0.20147705078125, -0.14697265625, -0.09246826171875, -0.0379638671875, 0.01654052734375, 0.071044921875, 0.12554931640625, 0.1800537109375, 0.23455810546875, 0.2890625, 0.34356689453125, 0.3980712890625, 0.45257568359375, 0.507080078125, 0.56158447265625, 0.6160888671875, 0.67059326171875, 0.72509765625, 0.77960205078125, 0.8341064453125, 0.88861083984375, 0.943115234375, 0.99761962890625, 1.0521240234375, 1.10662841796875, 1.1611328125, 1.21563720703125, 1.2701416015625, 1.32464599609375, 1.379150390625, 1.43365478515625, 1.4881591796875, 1.54266357421875, 1.59716796875, 1.65167236328125, 1.7061767578125, 1.76068115234375, 1.815185546875, 1.86968994140625, 1.9241943359375, 1.97869873046875, 2.033203125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 10.0, 12.0, 27.0, 53.0, 181.0, 2955.0, 656.0, 94.0, 35.0, 18.0, 13.0, 13.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2259521484375, -0.2107410430908203, -0.19552993774414062, -0.18031883239746094, -0.16510772705078125, -0.14989662170410156, -0.13468551635742188, -0.11947441101074219, -0.1042633056640625, -0.08905220031738281, -0.07384109497070312, -0.05862998962402344, -0.04341888427734375, -0.028207778930664062, -0.012996673583984375, 0.0022144317626953125, 0.017425537109375, 0.03263664245605469, 0.047847747802734375, 0.06305885314941406, 0.07826995849609375, 0.09348106384277344, 0.10869216918945312, 0.12390327453613281, 0.1391143798828125, 0.1543254852294922, 0.16953659057617188, 0.18474769592285156, 0.19995880126953125, 0.21516990661621094, 0.23038101196289062, 0.2455921173095703, 0.26080322265625, 0.2760143280029297, 0.2912254333496094, 0.30643653869628906, 0.32164764404296875, 0.33685874938964844, 0.3520698547363281, 0.3672809600830078, 0.3824920654296875, 0.3977031707763672, 0.4129142761230469, 0.42812538146972656, 0.44333648681640625, 0.45854759216308594, 0.4737586975097656, 0.4889698028564453, 0.504180908203125, 0.5193920135498047, 0.5346031188964844, 0.5498142242431641, 0.5650253295898438, 0.5802364349365234, 0.5954475402832031, 0.6106586456298828, 0.6258697509765625, 0.6410808563232422, 0.6562919616699219, 0.6715030670166016, 0.6867141723632812, 0.7019252777099609, 0.7171363830566406, 0.7323474884033203, 0.74755859375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 19.0, 17.0, 61.0, 154.0, 258.0, 248.0, 144.0, 61.0, 27.0, 12.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1189324855804443, -1.0446792840957642, -0.970426082611084, -0.8961728811264038, -0.8219196796417236, -0.7476664781570435, -0.6734132766723633, -0.5991600751876831, -0.5249068737030029, -0.45065367221832275, -0.3764004707336426, -0.3021472692489624, -0.22789406776428223, -0.15364086627960205, -0.07938766479492188, -0.005134463310241699, 0.06911873817443848, 0.14337193965911865, 0.21762514114379883, 0.291878342628479, 0.3661315441131592, 0.44038474559783936, 0.5146379470825195, 0.5888911485671997, 0.6631443500518799, 0.7373975515365601, 0.8116507530212402, 0.8859039545059204, 0.9601571559906006, 1.0344103574752808, 1.108663558959961, 1.1829167604446411, 1.2571697235107422, 1.3314229249954224, 1.4056761264801025, 1.4799293279647827, 1.554182529449463, 1.628435730934143, 1.7026889324188232, 1.7769421339035034, 1.8511953353881836, 1.9254485368728638, 1.999701738357544, 2.0739550590515137, 2.1482081413269043, 2.222461223602295, 2.2967145442962646, 2.3709678649902344, 2.445220947265625, 2.5194740295410156, 2.5937273502349854, 2.667980670928955, 2.7422337532043457, 2.8164868354797363, 2.890740156173706, 2.964993476867676, 3.0392465591430664, 3.113499641418457, 3.1877529621124268, 3.2620062828063965, 3.336259365081787, 3.4105124473571777, 3.4847657680511475, 3.559019088745117, 3.633272171020508]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 5.0, 2.0, 3.0, 3.0, 3.0, 6.0, 13.0, 15.0, 15.0, 19.0, 20.0, 23.0, 22.0, 29.0, 35.0, 34.0, 38.0, 46.0, 42.0, 31.0, 45.0, 51.0, 53.0, 34.0, 28.0, 42.0, 33.0, 38.0, 36.0, 33.0, 33.0, 32.0, 32.0, 15.0, 12.0, 15.0, 15.0, 10.0, 11.0, 9.0, 6.0, 4.0, 5.0, 2.0, 4.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.6099852919578552, -0.5884954929351807, -0.5670056939125061, -0.5455158948898315, -0.524026095867157, -0.5025362968444824, -0.4810464680194855, -0.4595566689968109, -0.43806686997413635, -0.4165770709514618, -0.39508727192878723, -0.3735974431037903, -0.3521076440811157, -0.33061784505844116, -0.3091280460357666, -0.28763824701309204, -0.2661484479904175, -0.24465864896774292, -0.22316884994506836, -0.2016790360212326, -0.18018923699855804, -0.15869943797588348, -0.13720962405204773, -0.11571982502937317, -0.09423002600669861, -0.07274022698402405, -0.05125042051076889, -0.029760614037513733, -0.008270815014839172, 0.013218984007835388, 0.03470879793167114, 0.0561985969543457, 0.07768839597702026, 0.09917819499969482, 0.12066800147294998, 0.14215780794620514, 0.1636476069688797, 0.18513740599155426, 0.20662721991539001, 0.22811701893806458, 0.24960681796073914, 0.2710966169834137, 0.29258641600608826, 0.3140762448310852, 0.33556604385375977, 0.3570558428764343, 0.3785456418991089, 0.40003544092178345, 0.421525239944458, 0.44301503896713257, 0.46450483798980713, 0.4859946370124817, 0.5074844360351562, 0.5289742350578308, 0.5504640340805054, 0.5719538927078247, 0.5934436321258545, 0.614933431148529, 0.6364232301712036, 0.6579130291938782, 0.6794028282165527, 0.7008926272392273, 0.7223824262619019, 0.7438722848892212, 0.7653620839118958]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 7.0, 8.0, 7.0, 13.0, 31.0, 37.0, 60.0, 104.0, 193.0, 333.0, 658.0, 1306.0, 3318.0, 9904.0, 35580.0, 168408.0, 522625.0, 236642.0, 48880.0, 13014.0, 4123.0, 1640.0, 778.0, 358.0, 201.0, 119.0, 94.0, 43.0, 36.0, 12.0, 6.0, 9.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7861328125, -1.7329864501953125, -1.679840087890625, -1.6266937255859375, -1.57354736328125, -1.5204010009765625, -1.467254638671875, -1.4141082763671875, -1.3609619140625, -1.3078155517578125, -1.254669189453125, -1.2015228271484375, -1.14837646484375, -1.0952301025390625, -1.042083740234375, -0.9889373779296875, -0.935791015625, -0.8826446533203125, -0.829498291015625, -0.7763519287109375, -0.72320556640625, -0.6700592041015625, -0.616912841796875, -0.5637664794921875, -0.5106201171875, -0.4574737548828125, -0.404327392578125, -0.3511810302734375, -0.29803466796875, -0.2448883056640625, -0.191741943359375, -0.1385955810546875, -0.08544921875, -0.0323028564453125, 0.020843505859375, 0.0739898681640625, 0.12713623046875, 0.1802825927734375, 0.233428955078125, 0.2865753173828125, 0.3397216796875, 0.3928680419921875, 0.446014404296875, 0.4991607666015625, 0.55230712890625, 0.6054534912109375, 0.658599853515625, 0.7117462158203125, 0.764892578125, 0.8180389404296875, 0.871185302734375, 0.9243316650390625, 0.97747802734375, 1.0306243896484375, 1.083770751953125, 1.1369171142578125, 1.1900634765625, 1.2432098388671875, 1.296356201171875, 1.3495025634765625, 1.40264892578125, 1.4557952880859375, 1.508941650390625, 1.5620880126953125, 1.615234375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 6.0, 6.0, 8.0, 9.0, 12.0, 24.0, 33.0, 30.0, 31.0, 64.0, 66.0, 80.0, 80.0, 77.0, 63.0, 73.0, 63.0, 43.0, 59.0, 43.0, 37.0, 25.0, 23.0, 15.0, 9.0, 9.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62109375, -0.6026763916015625, -0.584259033203125, -0.5658416748046875, -0.54742431640625, -0.5290069580078125, -0.510589599609375, -0.4921722412109375, -0.4737548828125, -0.4553375244140625, -0.436920166015625, -0.4185028076171875, -0.40008544921875, -0.3816680908203125, -0.363250732421875, -0.3448333740234375, -0.326416015625, -0.3079986572265625, -0.289581298828125, -0.2711639404296875, -0.25274658203125, -0.2343292236328125, -0.215911865234375, -0.1974945068359375, -0.1790771484375, -0.1606597900390625, -0.142242431640625, -0.1238250732421875, -0.10540771484375, -0.0869903564453125, -0.068572998046875, -0.0501556396484375, -0.03173828125, -0.0133209228515625, 0.005096435546875, 0.0235137939453125, 0.04193115234375, 0.0603485107421875, 0.078765869140625, 0.0971832275390625, 0.1156005859375, 0.1340179443359375, 0.152435302734375, 0.1708526611328125, 0.18927001953125, 0.2076873779296875, 0.226104736328125, 0.2445220947265625, 0.262939453125, 0.2813568115234375, 0.299774169921875, 0.3181915283203125, 0.33660888671875, 0.3550262451171875, 0.373443603515625, 0.3918609619140625, 0.4102783203125, 0.4286956787109375, 0.447113037109375, 0.4655303955078125, 0.48394775390625, 0.5023651123046875, 0.520782470703125, 0.5391998291015625, 0.5576171875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 1.0, 2.0, 2.0, 5.0, 14.0, 13.0, 15.0, 19.0, 23.0, 44.0, 56.0, 74.0, 140.0, 265.0, 687.0, 1882.0, 7100.0, 38488.0, 435831.0, 509758.0, 43090.0, 7463.0, 2153.0, 737.0, 309.0, 139.0, 83.0, 50.0, 24.0, 18.0, 8.0, 19.0, 6.0, 7.0, 5.0, 6.0, 4.0, 8.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-2.5703125, -2.494781494140625, -2.41925048828125, -2.343719482421875, -2.2681884765625, -2.192657470703125, -2.11712646484375, -2.041595458984375, -1.966064453125, -1.890533447265625, -1.81500244140625, -1.739471435546875, -1.6639404296875, -1.588409423828125, -1.51287841796875, -1.437347412109375, -1.36181640625, -1.286285400390625, -1.21075439453125, -1.135223388671875, -1.0596923828125, -0.984161376953125, -0.90863037109375, -0.833099365234375, -0.757568359375, -0.682037353515625, -0.60650634765625, -0.530975341796875, -0.4554443359375, -0.379913330078125, -0.30438232421875, -0.228851318359375, -0.1533203125, -0.077789306640625, -0.00225830078125, 0.073272705078125, 0.1488037109375, 0.224334716796875, 0.29986572265625, 0.375396728515625, 0.450927734375, 0.526458740234375, 0.60198974609375, 0.677520751953125, 0.7530517578125, 0.828582763671875, 0.90411376953125, 0.979644775390625, 1.05517578125, 1.130706787109375, 1.20623779296875, 1.281768798828125, 1.3572998046875, 1.432830810546875, 1.50836181640625, 1.583892822265625, 1.659423828125, 1.734954833984375, 1.81048583984375, 1.886016845703125, 1.9615478515625, 2.037078857421875, 2.11260986328125, 2.188140869140625, 2.263671875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 7.0, 3.0, 5.0, 5.0, 5.0, 5.0, 12.0, 10.0, 10.0, 13.0, 28.0, 30.0, 33.0, 25.0, 32.0, 37.0, 30.0, 56.0, 58.0, 47.0, 46.0, 59.0, 64.0, 57.0, 41.0, 42.0, 38.0, 28.0, 38.0, 28.0, 23.0, 18.0, 16.0, 10.0, 5.0, 14.0, 5.0, 4.0, 6.0, 4.0, 3.0, 1.0, 2.0, 7.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.103515625, -2.0306396484375, -1.957763671875, -1.8848876953125, -1.81201171875, -1.7391357421875, -1.666259765625, -1.5933837890625, -1.5205078125, -1.4476318359375, -1.374755859375, -1.3018798828125, -1.22900390625, -1.1561279296875, -1.083251953125, -1.0103759765625, -0.9375, -0.8646240234375, -0.791748046875, -0.7188720703125, -0.64599609375, -0.5731201171875, -0.500244140625, -0.4273681640625, -0.3544921875, -0.2816162109375, -0.208740234375, -0.1358642578125, -0.06298828125, 0.0098876953125, 0.082763671875, 0.1556396484375, 0.228515625, 0.3013916015625, 0.374267578125, 0.4471435546875, 0.52001953125, 0.5928955078125, 0.665771484375, 0.7386474609375, 0.8115234375, 0.8843994140625, 0.957275390625, 1.0301513671875, 1.10302734375, 1.1759033203125, 1.248779296875, 1.3216552734375, 1.39453125, 1.4674072265625, 1.540283203125, 1.6131591796875, 1.68603515625, 1.7589111328125, 1.831787109375, 1.9046630859375, 1.9775390625, 2.0504150390625, 2.123291015625, 2.1961669921875, 2.26904296875, 2.3419189453125, 2.414794921875, 2.4876708984375, 2.560546875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 3.0, 6.0, 8.0, 9.0, 15.0, 12.0, 15.0, 23.0, 26.0, 57.0, 90.0, 135.0, 227.0, 428.0, 1102.0, 3609.0, 25205.0, 683987.0, 314792.0, 14398.0, 2613.0, 844.0, 378.0, 199.0, 124.0, 70.0, 47.0, 38.0, 32.0, 17.0, 14.0, 8.0, 8.0, 7.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.431640625, -1.3917388916015625, -1.351837158203125, -1.3119354248046875, -1.27203369140625, -1.2321319580078125, -1.192230224609375, -1.1523284912109375, -1.1124267578125, -1.0725250244140625, -1.032623291015625, -0.9927215576171875, -0.95281982421875, -0.9129180908203125, -0.873016357421875, -0.8331146240234375, -0.793212890625, -0.7533111572265625, -0.713409423828125, -0.6735076904296875, -0.63360595703125, -0.5937042236328125, -0.553802490234375, -0.5139007568359375, -0.4739990234375, -0.4340972900390625, -0.394195556640625, -0.3542938232421875, -0.31439208984375, -0.2744903564453125, -0.234588623046875, -0.1946868896484375, -0.15478515625, -0.1148834228515625, -0.074981689453125, -0.0350799560546875, 0.00482177734375, 0.0447235107421875, 0.084625244140625, 0.1245269775390625, 0.1644287109375, 0.2043304443359375, 0.244232177734375, 0.2841339111328125, 0.32403564453125, 0.3639373779296875, 0.403839111328125, 0.4437408447265625, 0.483642578125, 0.5235443115234375, 0.563446044921875, 0.6033477783203125, 0.64324951171875, 0.6831512451171875, 0.723052978515625, 0.7629547119140625, 0.8028564453125, 0.8427581787109375, 0.882659912109375, 0.9225616455078125, 0.96246337890625, 1.0023651123046875, 1.042266845703125, 1.0821685791015625, 1.1220703125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 5.0, 3.0, 8.0, 12.0, 36.0, 100.0, 183.0, 266.0, 195.0, 105.0, 49.0, 22.0, 11.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015664100646972656, -0.00014588609337806702, -0.00013513118028640747, -0.00012437626719474792, -0.00011362135410308838, -0.00010286644101142883, -9.211152791976929e-05, -8.135661482810974e-05, -7.06017017364502e-05, -5.984678864479065e-05, -4.9091875553131104e-05, -3.833696246147156e-05, -2.7582049369812012e-05, -1.6827136278152466e-05, -6.07222318649292e-06, 4.682689905166626e-06, 1.5437602996826172e-05, 2.6192516088485718e-05, 3.6947429180145264e-05, 4.770234227180481e-05, 5.8457255363464355e-05, 6.92121684551239e-05, 7.996708154678345e-05, 9.072199463844299e-05, 0.00010147690773010254, 0.00011223182082176208, 0.00012298673391342163, 0.00013374164700508118, 0.00014449656009674072, 0.00015525147318840027, 0.00016600638628005981, 0.00017676129937171936, 0.0001875162124633789, 0.00019827112555503845, 0.000209026038646698, 0.00021978095173835754, 0.0002305358648300171, 0.00024129077792167664, 0.0002520456910133362, 0.00026280060410499573, 0.0002735555171966553, 0.0002843104302883148, 0.00029506534337997437, 0.0003058202564716339, 0.00031657516956329346, 0.000327330082654953, 0.00033808499574661255, 0.0003488399088382721, 0.00035959482192993164, 0.0003703497350215912, 0.00038110464811325073, 0.0003918595612049103, 0.0004026144742965698, 0.00041336938738822937, 0.0004241243004798889, 0.00043487921357154846, 0.000445634126663208, 0.00045638903975486755, 0.0004671439528465271, 0.00047789886593818665, 0.0004886537790298462, 0.0004994086921215057, 0.0005101636052131653, 0.0005209185183048248, 0.0005316734313964844]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 8.0, 21.0, 13.0, 39.0, 59.0, 79.0, 147.0, 296.0, 604.0, 1346.0, 3932.0, 15815.0, 109237.0, 703685.0, 182521.0, 22563.0, 5019.0, 1679.0, 729.0, 318.0, 157.0, 95.0, 59.0, 48.0, 23.0, 18.0, 11.0, 11.0, 3.0, 2.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8505859375, -0.8245010375976562, -0.7984161376953125, -0.7723312377929688, -0.746246337890625, -0.7201614379882812, -0.6940765380859375, -0.6679916381835938, -0.64190673828125, -0.6158218383789062, -0.5897369384765625, -0.5636520385742188, -0.537567138671875, -0.5114822387695312, -0.4853973388671875, -0.45931243896484375, -0.4332275390625, -0.40714263916015625, -0.3810577392578125, -0.35497283935546875, -0.328887939453125, -0.30280303955078125, -0.2767181396484375, -0.25063323974609375, -0.22454833984375, -0.19846343994140625, -0.1723785400390625, -0.14629364013671875, -0.120208740234375, -0.09412384033203125, -0.0680389404296875, -0.04195404052734375, -0.015869140625, 0.01021575927734375, 0.0363006591796875, 0.06238555908203125, 0.088470458984375, 0.11455535888671875, 0.1406402587890625, 0.16672515869140625, 0.19281005859375, 0.21889495849609375, 0.2449798583984375, 0.27106475830078125, 0.297149658203125, 0.32323455810546875, 0.3493194580078125, 0.37540435791015625, 0.4014892578125, 0.42757415771484375, 0.4536590576171875, 0.47974395751953125, 0.505828857421875, 0.5319137573242188, 0.5579986572265625, 0.5840835571289062, 0.61016845703125, 0.6362533569335938, 0.6623382568359375, 0.6884231567382812, 0.714508056640625, 0.7405929565429688, 0.7666778564453125, 0.7927627563476562, 0.81884765625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 8.0, 6.0, 10.0, 19.0, 21.0, 16.0, 41.0, 42.0, 50.0, 56.0, 75.0, 94.0, 85.0, 90.0, 74.0, 58.0, 54.0, 42.0, 30.0, 22.0, 20.0, 18.0, 14.0, 7.0, 9.0, 8.0, 2.0, 3.0, 3.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.01953125, -0.9938125610351562, -0.9680938720703125, -0.9423751831054688, -0.916656494140625, -0.8909378051757812, -0.8652191162109375, -0.8395004272460938, -0.81378173828125, -0.7880630493164062, -0.7623443603515625, -0.7366256713867188, -0.710906982421875, -0.6851882934570312, -0.6594696044921875, -0.6337509155273438, -0.6080322265625, -0.5823135375976562, -0.5565948486328125, -0.5308761596679688, -0.505157470703125, -0.47943878173828125, -0.4537200927734375, -0.42800140380859375, -0.40228271484375, -0.37656402587890625, -0.3508453369140625, -0.32512664794921875, -0.299407958984375, -0.27368927001953125, -0.2479705810546875, -0.22225189208984375, -0.196533203125, -0.17081451416015625, -0.1450958251953125, -0.11937713623046875, -0.093658447265625, -0.06793975830078125, -0.0422210693359375, -0.01650238037109375, 0.00921630859375, 0.03493499755859375, 0.0606536865234375, 0.08637237548828125, 0.112091064453125, 0.13780975341796875, 0.1635284423828125, 0.18924713134765625, 0.2149658203125, 0.24068450927734375, 0.2664031982421875, 0.29212188720703125, 0.317840576171875, 0.34355926513671875, 0.3692779541015625, 0.39499664306640625, 0.42071533203125, 0.44643402099609375, 0.4721527099609375, 0.49787139892578125, 0.523590087890625, 0.5493087768554688, 0.5750274658203125, 0.6007461547851562, 0.62646484375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 6.0, 11.0, 21.0, 42.0, 68.0, 115.0, 187.0, 203.0, 155.0, 83.0, 58.0, 17.0, 15.0, 9.0, 3.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.257390975952148, -7.716111660003662, -7.174832344055176, -6.633553504943848, -6.092274188995361, -5.550994873046875, -5.009716033935547, -4.4684367179870605, -3.927157402038574, -3.385878086090088, -2.8445990085601807, -2.3033199310302734, -1.762040615081787, -1.2207612991333008, -0.6794822216033936, -0.13820314407348633, 0.403076171875, 0.9443553686141968, 1.4856345653533936, 2.026913642883301, 2.568192958831787, 3.1094722747802734, 3.6507513523101807, 4.192030429840088, 4.733309745788574, 5.2745890617370605, 5.815868377685547, 6.357147216796875, 6.898426532745361, 7.439705848693848, 7.980984687805176, 8.52226448059082, 9.063545227050781, 9.60482406616211, 10.146103858947754, 10.687382698059082, 11.228662490844727, 11.769941329956055, 12.311220169067383, 12.852499008178711, 13.393778800964355, 13.935057640075684, 14.476337432861328, 15.017616271972656, 15.558895111083984, 16.100173950195312, 16.641454696655273, 17.1827335357666, 17.72401237487793, 18.265291213989258, 18.806570053100586, 19.347850799560547, 19.889129638671875, 20.430408477783203, 20.97168731689453, 21.51296615600586, 22.054244995117188, 22.595523834228516, 23.136802673339844, 23.678083419799805, 24.219362258911133, 24.76064109802246, 25.30191993713379, 25.843198776245117, 26.384479522705078]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 7.0, 2.0, 4.0, 9.0, 10.0, 10.0, 10.0, 16.0, 15.0, 15.0, 29.0, 31.0, 25.0, 32.0, 46.0, 48.0, 60.0, 45.0, 61.0, 56.0, 55.0, 55.0, 43.0, 46.0, 32.0, 35.0, 28.0, 31.0, 25.0, 26.0, 15.0, 16.0, 15.0, 8.0, 7.0, 5.0, 6.0, 7.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-10.431926727294922, -10.109883308410645, -9.787839889526367, -9.46579647064209, -9.143753051757812, -8.821709632873535, -8.499666213989258, -8.177621841430664, -7.855578899383545, -7.533535480499268, -7.21149206161499, -6.889448642730713, -6.567404747009277, -6.245361328125, -5.923317909240723, -5.601274490356445, -5.279231071472168, -4.957187652587891, -4.635144233703613, -4.313100814819336, -3.9910571575164795, -3.669013738632202, -3.3469700813293457, -3.0249266624450684, -2.702883243560791, -2.3808398246765137, -2.0587964057922363, -1.7367527484893799, -1.4147093296051025, -1.0926659107208252, -0.7706223726272583, -0.4485788345336914, -0.12653446197509766, 0.19550901651382446, 0.5175524950027466, 0.8395959734916687, 1.1616394519805908, 1.4836828708648682, 1.805726408958435, 2.127769947052002, 2.4498133659362793, 2.7718567848205566, 3.093900203704834, 3.4159438610076904, 3.7379872798919678, 4.060030937194824, 4.382074356079102, 4.704117774963379, 5.026161193847656, 5.348204612731934, 5.670248031616211, 5.992291450500488, 6.314334869384766, 6.636378288269043, 6.9584221839904785, 7.280465602874756, 7.602509021759033, 7.9245524406433105, 8.246596336364746, 8.568639755249023, 8.8906831741333, 9.212726593017578, 9.534770011901855, 9.856813430786133, 10.17885684967041]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 5.0, 11.0, 11.0, 9.0, 18.0, 23.0, 41.0, 42.0, 73.0, 86.0, 137.0, 190.0, 341.0, 639.0, 1161.0, 2613.0, 7459.0, 32070.0, 450804.0, 3630011.0, 51864.0, 10027.0, 3304.0, 1434.0, 738.0, 402.0, 260.0, 151.0, 111.0, 67.0, 53.0, 35.0, 24.0, 15.0, 15.0, 3.0, 7.0, 6.0, 7.0, 6.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.33984375, -1.2967987060546875, -1.253753662109375, -1.2107086181640625, -1.16766357421875, -1.1246185302734375, -1.081573486328125, -1.0385284423828125, -0.9954833984375, -0.9524383544921875, -0.909393310546875, -0.8663482666015625, -0.82330322265625, -0.7802581787109375, -0.737213134765625, -0.6941680908203125, -0.651123046875, -0.6080780029296875, -0.565032958984375, -0.5219879150390625, -0.47894287109375, -0.4358978271484375, -0.392852783203125, -0.3498077392578125, -0.3067626953125, -0.2637176513671875, -0.220672607421875, -0.1776275634765625, -0.13458251953125, -0.0915374755859375, -0.048492431640625, -0.0054473876953125, 0.03759765625, 0.0806427001953125, 0.123687744140625, 0.1667327880859375, 0.20977783203125, 0.2528228759765625, 0.295867919921875, 0.3389129638671875, 0.3819580078125, 0.4250030517578125, 0.468048095703125, 0.5110931396484375, 0.55413818359375, 0.5971832275390625, 0.640228271484375, 0.6832733154296875, 0.726318359375, 0.7693634033203125, 0.812408447265625, 0.8554534912109375, 0.89849853515625, 0.9415435791015625, 0.984588623046875, 1.0276336669921875, 1.0706787109375, 1.1137237548828125, 1.156768798828125, 1.1998138427734375, 1.24285888671875, 1.2859039306640625, 1.328948974609375, 1.3719940185546875, 1.4150390625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 4.0, 4.0, 6.0, 9.0, 10.0, 19.0, 24.0, 32.0, 29.0, 37.0, 54.0, 71.0, 70.0, 72.0, 72.0, 73.0, 59.0, 66.0, 67.0, 41.0, 43.0, 26.0, 32.0, 11.0, 16.0, 11.0, 9.0, 5.0, 3.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.61962890625, -0.6006393432617188, -0.5816497802734375, -0.5626602172851562, -0.543670654296875, -0.5246810913085938, -0.5056915283203125, -0.48670196533203125, -0.46771240234375, -0.44872283935546875, -0.4297332763671875, -0.41074371337890625, -0.391754150390625, -0.37276458740234375, -0.3537750244140625, -0.33478546142578125, -0.3157958984375, -0.29680633544921875, -0.2778167724609375, -0.25882720947265625, -0.239837646484375, -0.22084808349609375, -0.2018585205078125, -0.18286895751953125, -0.16387939453125, -0.14488983154296875, -0.1259002685546875, -0.10691070556640625, -0.087921142578125, -0.06893157958984375, -0.0499420166015625, -0.03095245361328125, -0.011962890625, 0.00702667236328125, 0.0260162353515625, 0.04500579833984375, 0.063995361328125, 0.08298492431640625, 0.1019744873046875, 0.12096405029296875, 0.13995361328125, 0.15894317626953125, 0.1779327392578125, 0.19692230224609375, 0.215911865234375, 0.23490142822265625, 0.2538909912109375, 0.27288055419921875, 0.2918701171875, 0.31085968017578125, 0.3298492431640625, 0.34883880615234375, 0.367828369140625, 0.38681793212890625, 0.4058074951171875, 0.42479705810546875, 0.44378662109375, 0.46277618408203125, 0.4817657470703125, 0.5007553100585938, 0.519744873046875, 0.5387344360351562, 0.5577239990234375, 0.5767135620117188, 0.595703125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 8.0, 14.0, 14.0, 26.0, 23.0, 34.0, 66.0, 89.0, 129.0, 207.0, 292.0, 465.0, 755.0, 1319.0, 2437.0, 4739.0, 11404.0, 35264.0, 190888.0, 3537079.0, 333851.0, 48590.0, 14128.0, 5733.0, 2845.0, 1516.0, 814.0, 488.0, 359.0, 192.0, 162.0, 123.0, 58.0, 46.0, 31.0, 29.0, 23.0, 20.0, 13.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98291015625, -0.9518203735351562, -0.9207305908203125, -0.8896408081054688, -0.858551025390625, -0.8274612426757812, -0.7963714599609375, -0.7652816772460938, -0.73419189453125, -0.7031021118164062, -0.6720123291015625, -0.6409225463867188, -0.609832763671875, -0.5787429809570312, -0.5476531982421875, -0.5165634155273438, -0.4854736328125, -0.45438385009765625, -0.4232940673828125, -0.39220428466796875, -0.361114501953125, -0.33002471923828125, -0.2989349365234375, -0.26784515380859375, -0.23675537109375, -0.20566558837890625, -0.1745758056640625, -0.14348602294921875, -0.112396240234375, -0.08130645751953125, -0.0502166748046875, -0.01912689208984375, 0.011962890625, 0.04305267333984375, 0.0741424560546875, 0.10523223876953125, 0.136322021484375, 0.16741180419921875, 0.1985015869140625, 0.22959136962890625, 0.26068115234375, 0.29177093505859375, 0.3228607177734375, 0.35395050048828125, 0.385040283203125, 0.41613006591796875, 0.4472198486328125, 0.47830963134765625, 0.5093994140625, 0.5404891967773438, 0.5715789794921875, 0.6026687622070312, 0.633758544921875, 0.6648483276367188, 0.6959381103515625, 0.7270278930664062, 0.75811767578125, 0.7892074584960938, 0.8202972412109375, 0.8513870239257812, 0.882476806640625, 0.9135665893554688, 0.9446563720703125, 0.9757461547851562, 1.0068359375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 3.0, 5.0, 11.0, 16.0, 36.0, 50.0, 122.0, 366.0, 2429.0, 643.0, 194.0, 73.0, 48.0, 17.0, 15.0, 14.0, 5.0, 5.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.441162109375, -0.4276924133300781, -0.41422271728515625, -0.4007530212402344, -0.3872833251953125, -0.3738136291503906, -0.36034393310546875, -0.3468742370605469, -0.333404541015625, -0.3199348449707031, -0.30646514892578125, -0.2929954528808594, -0.2795257568359375, -0.2660560607910156, -0.25258636474609375, -0.23911666870117188, -0.22564697265625, -0.21217727661132812, -0.19870758056640625, -0.18523788452148438, -0.1717681884765625, -0.15829849243164062, -0.14482879638671875, -0.13135910034179688, -0.117889404296875, -0.10441970825195312, -0.09095001220703125, -0.07748031616210938, -0.0640106201171875, -0.050540924072265625, -0.03707122802734375, -0.023601531982421875, -0.0101318359375, 0.003337860107421875, 0.01680755615234375, 0.030277252197265625, 0.0437469482421875, 0.057216644287109375, 0.07068634033203125, 0.08415603637695312, 0.097625732421875, 0.11109542846679688, 0.12456512451171875, 0.13803482055664062, 0.1515045166015625, 0.16497421264648438, 0.17844390869140625, 0.19191360473632812, 0.20538330078125, 0.21885299682617188, 0.23232269287109375, 0.24579238891601562, 0.2592620849609375, 0.2727317810058594, 0.28620147705078125, 0.2996711730957031, 0.313140869140625, 0.3266105651855469, 0.34008026123046875, 0.3535499572753906, 0.3670196533203125, 0.3804893493652344, 0.39395904541015625, 0.4074287414550781, 0.4208984375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 13.0, 19.0, 49.0, 111.0, 166.0, 210.0, 184.0, 128.0, 66.0, 26.0, 16.0, 7.0, 4.0, 6.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.795786142349243, -2.716071128845215, -2.6363563537597656, -2.5566413402557373, -2.476926326751709, -2.3972113132476807, -2.3174962997436523, -2.237781524658203, -2.158066511154175, -2.0783514976501465, -1.9986366033554077, -1.918921709060669, -1.8392066955566406, -1.7594916820526123, -1.6797767877578735, -1.6000618934631348, -1.5203468799591064, -1.4406318664550781, -1.3609169721603394, -1.2812020778656006, -1.2014870643615723, -1.121772050857544, -1.0420571565628052, -0.9623422026634216, -0.8826272487640381, -0.8029122948646545, -0.723197340965271, -0.6434823870658875, -0.5637674331665039, -0.48405247926712036, -0.4043375253677368, -0.32462257146835327, -0.24490737915039062, -0.16519242525100708, -0.08547747135162354, -0.00576251745223999, 0.07395243644714355, 0.1536673903465271, 0.23338234424591064, 0.3130972981452942, 0.39281225204467773, 0.4725272059440613, 0.5522421598434448, 0.6319571137428284, 0.7116720676422119, 0.7913870215415955, 0.871101975440979, 0.9508169293403625, 1.030531883239746, 1.1102468967437744, 1.1899617910385132, 1.269676685333252, 1.3493916988372803, 1.4291067123413086, 1.5088216066360474, 1.5885365009307861, 1.6682515144348145, 1.7479665279388428, 1.8276814222335815, 1.9073963165283203, 1.9871113300323486, 2.066826343536377, 2.146541118621826, 2.2262561321258545, 2.305971145629883]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 4.0, 7.0, 5.0, 6.0, 15.0, 14.0, 16.0, 22.0, 19.0, 34.0, 28.0, 51.0, 44.0, 45.0, 45.0, 58.0, 46.0, 54.0, 49.0, 59.0, 58.0, 44.0, 30.0, 31.0, 30.0, 37.0, 28.0, 25.0, 20.0, 15.0, 18.0, 13.0, 8.0, 6.0, 6.0, 3.0, 2.0, 2.0, 3.0, 3.0], "bins": [-1.3957661390304565, -1.3625102043151855, -1.3292542695999146, -1.2959983348846436, -1.2627424001693726, -1.2294864654541016, -1.196230411529541, -1.16297447681427, -1.129718542098999, -1.096462607383728, -1.063206672668457, -1.029950737953186, -0.9966947436332703, -0.9634388089179993, -0.9301828742027283, -0.8969269394874573, -0.8636710047721863, -0.8304150700569153, -0.7971591353416443, -0.7639031410217285, -0.7306472063064575, -0.6973912715911865, -0.6641353368759155, -0.6308794021606445, -0.5976234674453735, -0.5643675327301025, -0.5311115980148315, -0.49785563349723816, -0.4645996689796448, -0.4313437342643738, -0.3980877995491028, -0.3648318648338318, -0.33157581090927124, -0.29831987619400024, -0.26506391167640686, -0.23180797696113586, -0.19855202734470367, -0.16529607772827148, -0.1320401430130005, -0.0987841933965683, -0.06552824378013611, -0.03227229788899422, 0.0009836480021476746, 0.03423959016799927, 0.06749553978443146, 0.10075148940086365, 0.13400742411613464, 0.16726337373256683, 0.20051932334899902, 0.2337752729654312, 0.2670312225818634, 0.3002871572971344, 0.3335431218147278, 0.3667990565299988, 0.4000549912452698, 0.43331092596054077, 0.46656689047813416, 0.49982282519340515, 0.5330787897109985, 0.5663347244262695, 0.5995906591415405, 0.6328465938568115, 0.6661025285720825, 0.6993585228919983, 0.7326144576072693]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 3.0, 2.0, 5.0, 5.0, 4.0, 11.0, 10.0, 23.0, 32.0, 26.0, 62.0, 83.0, 123.0, 203.0, 354.0, 643.0, 1161.0, 2348.0, 5681.0, 15951.0, 60004.0, 274011.0, 487122.0, 148860.0, 33915.0, 10147.0, 3818.0, 1791.0, 856.0, 512.0, 281.0, 167.0, 98.0, 60.0, 58.0, 39.0, 27.0, 15.0, 9.0, 9.0, 8.0, 7.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.44140625, -1.3981170654296875, -1.354827880859375, -1.3115386962890625, -1.26824951171875, -1.2249603271484375, -1.181671142578125, -1.1383819580078125, -1.0950927734375, -1.0518035888671875, -1.008514404296875, -0.9652252197265625, -0.92193603515625, -0.8786468505859375, -0.835357666015625, -0.7920684814453125, -0.748779296875, -0.7054901123046875, -0.662200927734375, -0.6189117431640625, -0.57562255859375, -0.5323333740234375, -0.489044189453125, -0.4457550048828125, -0.4024658203125, -0.3591766357421875, -0.315887451171875, -0.2725982666015625, -0.22930908203125, -0.1860198974609375, -0.142730712890625, -0.0994415283203125, -0.05615234375, -0.0128631591796875, 0.030426025390625, 0.0737152099609375, 0.11700439453125, 0.1602935791015625, 0.203582763671875, 0.2468719482421875, 0.2901611328125, 0.3334503173828125, 0.376739501953125, 0.4200286865234375, 0.46331787109375, 0.5066070556640625, 0.549896240234375, 0.5931854248046875, 0.636474609375, 0.6797637939453125, 0.723052978515625, 0.7663421630859375, 0.80963134765625, 0.8529205322265625, 0.896209716796875, 0.9394989013671875, 0.9827880859375, 1.0260772705078125, 1.069366455078125, 1.1126556396484375, 1.15594482421875, 1.1992340087890625, 1.242523193359375, 1.2858123779296875, 1.3291015625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 5.0, 5.0, 6.0, 5.0, 5.0, 5.0, 9.0, 15.0, 12.0, 24.0, 30.0, 39.0, 44.0, 56.0, 59.0, 59.0, 71.0, 72.0, 75.0, 58.0, 71.0, 66.0, 44.0, 40.0, 29.0, 30.0, 21.0, 12.0, 12.0, 5.0, 5.0, 4.0, 1.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.603515625, -0.5843887329101562, -0.5652618408203125, -0.5461349487304688, -0.527008056640625, -0.5078811645507812, -0.4887542724609375, -0.46962738037109375, -0.45050048828125, -0.43137359619140625, -0.4122467041015625, -0.39311981201171875, -0.373992919921875, -0.35486602783203125, -0.3357391357421875, -0.31661224365234375, -0.2974853515625, -0.27835845947265625, -0.2592315673828125, -0.24010467529296875, -0.220977783203125, -0.20185089111328125, -0.1827239990234375, -0.16359710693359375, -0.14447021484375, -0.12534332275390625, -0.1062164306640625, -0.08708953857421875, -0.067962646484375, -0.04883575439453125, -0.0297088623046875, -0.01058197021484375, 0.008544921875, 0.02767181396484375, 0.0467987060546875, 0.06592559814453125, 0.085052490234375, 0.10417938232421875, 0.1233062744140625, 0.14243316650390625, 0.16156005859375, 0.18068695068359375, 0.1998138427734375, 0.21894073486328125, 0.238067626953125, 0.25719451904296875, 0.2763214111328125, 0.29544830322265625, 0.3145751953125, 0.33370208740234375, 0.3528289794921875, 0.37195587158203125, 0.391082763671875, 0.41020965576171875, 0.4293365478515625, 0.44846343994140625, 0.46759033203125, 0.48671722412109375, 0.5058441162109375, 0.5249710083007812, 0.544097900390625, 0.5632247924804688, 0.5823516845703125, 0.6014785766601562, 0.62060546875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 8.0, 11.0, 13.0, 14.0, 19.0, 34.0, 56.0, 78.0, 172.0, 426.0, 1719.0, 12171.0, 322505.0, 686714.0, 21108.0, 2432.0, 545.0, 220.0, 111.0, 52.0, 42.0, 30.0, 17.0, 12.0, 8.0, 7.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.91796875, -2.810333251953125, -2.70269775390625, -2.595062255859375, -2.4874267578125, -2.379791259765625, -2.27215576171875, -2.164520263671875, -2.056884765625, -1.949249267578125, -1.84161376953125, -1.733978271484375, -1.6263427734375, -1.518707275390625, -1.41107177734375, -1.303436279296875, -1.19580078125, -1.088165283203125, -0.98052978515625, -0.872894287109375, -0.7652587890625, -0.657623291015625, -0.54998779296875, -0.442352294921875, -0.334716796875, -0.227081298828125, -0.11944580078125, -0.011810302734375, 0.0958251953125, 0.203460693359375, 0.31109619140625, 0.418731689453125, 0.5263671875, 0.634002685546875, 0.74163818359375, 0.849273681640625, 0.9569091796875, 1.064544677734375, 1.17218017578125, 1.279815673828125, 1.387451171875, 1.495086669921875, 1.60272216796875, 1.710357666015625, 1.8179931640625, 1.925628662109375, 2.03326416015625, 2.140899658203125, 2.24853515625, 2.356170654296875, 2.46380615234375, 2.571441650390625, 2.6790771484375, 2.786712646484375, 2.89434814453125, 3.001983642578125, 3.109619140625, 3.217254638671875, 3.32489013671875, 3.432525634765625, 3.5401611328125, 3.647796630859375, 3.75543212890625, 3.863067626953125, 3.970703125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 5.0, 5.0, 6.0, 7.0, 12.0, 6.0, 10.0, 15.0, 17.0, 21.0, 27.0, 34.0, 35.0, 39.0, 32.0, 50.0, 54.0, 53.0, 55.0, 53.0, 77.0, 44.0, 41.0, 58.0, 41.0, 38.0, 31.0, 23.0, 25.0, 17.0, 17.0, 11.0, 8.0, 2.0, 9.0, 6.0, 3.0, 1.0, 6.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.44921875, -2.36846923828125, -2.2877197265625, -2.20697021484375, -2.126220703125, -2.04547119140625, -1.9647216796875, -1.88397216796875, -1.80322265625, -1.72247314453125, -1.6417236328125, -1.56097412109375, -1.480224609375, -1.39947509765625, -1.3187255859375, -1.23797607421875, -1.1572265625, -1.07647705078125, -0.9957275390625, -0.91497802734375, -0.834228515625, -0.75347900390625, -0.6727294921875, -0.59197998046875, -0.51123046875, -0.43048095703125, -0.3497314453125, -0.26898193359375, -0.188232421875, -0.10748291015625, -0.0267333984375, 0.05401611328125, 0.134765625, 0.21551513671875, 0.2962646484375, 0.37701416015625, 0.457763671875, 0.53851318359375, 0.6192626953125, 0.70001220703125, 0.78076171875, 0.86151123046875, 0.9422607421875, 1.02301025390625, 1.103759765625, 1.18450927734375, 1.2652587890625, 1.34600830078125, 1.4267578125, 1.50750732421875, 1.5882568359375, 1.66900634765625, 1.749755859375, 1.83050537109375, 1.9112548828125, 1.99200439453125, 2.07275390625, 2.15350341796875, 2.2342529296875, 2.31500244140625, 2.395751953125, 2.47650146484375, 2.5572509765625, 2.63800048828125, 2.71875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 5.0, 10.0, 3.0, 6.0, 14.0, 20.0, 36.0, 46.0, 71.0, 118.0, 185.0, 442.0, 1101.0, 5194.0, 155884.0, 865083.0, 16898.0, 2149.0, 627.0, 257.0, 134.0, 99.0, 46.0, 42.0, 25.0, 18.0, 8.0, 13.0, 4.0, 3.0, 4.0, 4.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8505859375, -1.7965240478515625, -1.742462158203125, -1.6884002685546875, -1.63433837890625, -1.5802764892578125, -1.526214599609375, -1.4721527099609375, -1.4180908203125, -1.3640289306640625, -1.309967041015625, -1.2559051513671875, -1.20184326171875, -1.1477813720703125, -1.093719482421875, -1.0396575927734375, -0.985595703125, -0.9315338134765625, -0.877471923828125, -0.8234100341796875, -0.76934814453125, -0.7152862548828125, -0.661224365234375, -0.6071624755859375, -0.5531005859375, -0.4990386962890625, -0.444976806640625, -0.3909149169921875, -0.33685302734375, -0.2827911376953125, -0.228729248046875, -0.1746673583984375, -0.12060546875, -0.0665435791015625, -0.012481689453125, 0.0415802001953125, 0.09564208984375, 0.1497039794921875, 0.203765869140625, 0.2578277587890625, 0.3118896484375, 0.3659515380859375, 0.420013427734375, 0.4740753173828125, 0.52813720703125, 0.5821990966796875, 0.636260986328125, 0.6903228759765625, 0.744384765625, 0.7984466552734375, 0.852508544921875, 0.9065704345703125, 0.96063232421875, 1.0146942138671875, 1.068756103515625, 1.1228179931640625, 1.1768798828125, 1.2309417724609375, 1.285003662109375, 1.3390655517578125, 1.39312744140625, 1.4471893310546875, 1.501251220703125, 1.5553131103515625, 1.609375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 6.0, 1.0, 2.0, 7.0, 4.0, 8.0, 8.0, 21.0, 21.0, 21.0, 30.0, 41.0, 49.0, 55.0, 65.0, 71.0, 74.0, 62.0, 70.0, 73.0, 56.0, 49.0, 43.0, 33.0, 26.0, 25.0, 21.0, 14.0, 10.0, 12.0, 5.0, 2.0, 8.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.893013000488281e-05, -8.616596460342407e-05, -8.340179920196533e-05, -8.063763380050659e-05, -7.787346839904785e-05, -7.510930299758911e-05, -7.234513759613037e-05, -6.958097219467163e-05, -6.681680679321289e-05, -6.405264139175415e-05, -6.128847599029541e-05, -5.852431058883667e-05, -5.576014518737793e-05, -5.299597978591919e-05, -5.023181438446045e-05, -4.746764898300171e-05, -4.470348358154297e-05, -4.193931818008423e-05, -3.917515277862549e-05, -3.641098737716675e-05, -3.364682197570801e-05, -3.088265657424927e-05, -2.8118491172790527e-05, -2.5354325771331787e-05, -2.2590160369873047e-05, -1.9825994968414307e-05, -1.7061829566955566e-05, -1.4297664165496826e-05, -1.1533498764038086e-05, -8.769333362579346e-06, -6.0051679611206055e-06, -3.2410025596618652e-06, -4.76837158203125e-07, 2.2873282432556152e-06, 5.0514936447143555e-06, 7.815659046173096e-06, 1.0579824447631836e-05, 1.3343989849090576e-05, 1.6108155250549316e-05, 1.8872320652008057e-05, 2.1636486053466797e-05, 2.4400651454925537e-05, 2.7164816856384277e-05, 2.9928982257843018e-05, 3.269314765930176e-05, 3.54573130607605e-05, 3.822147846221924e-05, 4.098564386367798e-05, 4.374980926513672e-05, 4.651397466659546e-05, 4.92781400680542e-05, 5.204230546951294e-05, 5.480647087097168e-05, 5.757063627243042e-05, 6.033480167388916e-05, 6.30989670753479e-05, 6.586313247680664e-05, 6.862729787826538e-05, 7.139146327972412e-05, 7.415562868118286e-05, 7.69197940826416e-05, 7.968395948410034e-05, 8.244812488555908e-05, 8.521229028701782e-05, 8.797645568847656e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 11.0, 22.0, 22.0, 35.0, 67.0, 100.0, 179.0, 369.0, 817.0, 2689.0, 17500.0, 443496.0, 557287.0, 21212.0, 3016.0, 888.0, 373.0, 196.0, 95.0, 55.0, 40.0, 17.0, 21.0, 17.0, 9.0, 7.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1650390625, -1.12750244140625, -1.0899658203125, -1.05242919921875, -1.014892578125, -0.97735595703125, -0.9398193359375, -0.90228271484375, -0.86474609375, -0.82720947265625, -0.7896728515625, -0.75213623046875, -0.714599609375, -0.67706298828125, -0.6395263671875, -0.60198974609375, -0.564453125, -0.52691650390625, -0.4893798828125, -0.45184326171875, -0.414306640625, -0.37677001953125, -0.3392333984375, -0.30169677734375, -0.26416015625, -0.22662353515625, -0.1890869140625, -0.15155029296875, -0.114013671875, -0.07647705078125, -0.0389404296875, -0.00140380859375, 0.0361328125, 0.07366943359375, 0.1112060546875, 0.14874267578125, 0.186279296875, 0.22381591796875, 0.2613525390625, 0.29888916015625, 0.33642578125, 0.37396240234375, 0.4114990234375, 0.44903564453125, 0.486572265625, 0.52410888671875, 0.5616455078125, 0.59918212890625, 0.63671875, 0.67425537109375, 0.7117919921875, 0.74932861328125, 0.786865234375, 0.82440185546875, 0.8619384765625, 0.89947509765625, 0.93701171875, 0.97454833984375, 1.0120849609375, 1.04962158203125, 1.087158203125, 1.12469482421875, 1.1622314453125, 1.19976806640625, 1.2373046875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 7.0, 8.0, 5.0, 8.0, 21.0, 31.0, 62.0, 76.0, 116.0, 110.0, 147.0, 111.0, 103.0, 64.0, 48.0, 32.0, 19.0, 13.0, 10.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.462890625, -1.42742919921875, -1.3919677734375, -1.35650634765625, -1.321044921875, -1.28558349609375, -1.2501220703125, -1.21466064453125, -1.17919921875, -1.14373779296875, -1.1082763671875, -1.07281494140625, -1.037353515625, -1.00189208984375, -0.9664306640625, -0.93096923828125, -0.8955078125, -0.86004638671875, -0.8245849609375, -0.78912353515625, -0.753662109375, -0.71820068359375, -0.6827392578125, -0.64727783203125, -0.61181640625, -0.57635498046875, -0.5408935546875, -0.50543212890625, -0.469970703125, -0.43450927734375, -0.3990478515625, -0.36358642578125, -0.328125, -0.29266357421875, -0.2572021484375, -0.22174072265625, -0.186279296875, -0.15081787109375, -0.1153564453125, -0.07989501953125, -0.04443359375, -0.00897216796875, 0.0264892578125, 0.06195068359375, 0.097412109375, 0.13287353515625, 0.1683349609375, 0.20379638671875, 0.2392578125, 0.27471923828125, 0.3101806640625, 0.34564208984375, 0.381103515625, 0.41656494140625, 0.4520263671875, 0.48748779296875, 0.52294921875, 0.55841064453125, 0.5938720703125, 0.62933349609375, 0.664794921875, 0.70025634765625, 0.7357177734375, 0.77117919921875, 0.806640625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 11.0, 13.0, 21.0, 62.0, 103.0, 135.0, 164.0, 167.0, 124.0, 81.0, 51.0, 37.0, 14.0, 6.0, 4.0, 9.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.18783187866211, -20.7177677154541, -20.247703552246094, -19.777639389038086, -19.307575225830078, -18.83751106262207, -18.367446899414062, -17.897382736206055, -17.427318572998047, -16.95725440979004, -16.48719024658203, -16.017126083374023, -15.547061920166016, -15.076997756958008, -14.60693359375, -14.136869430541992, -13.666805267333984, -13.196741104125977, -12.726676940917969, -12.256612777709961, -11.786548614501953, -11.316484451293945, -10.846420288085938, -10.37635612487793, -9.906291007995605, -9.436226844787598, -8.96616268157959, -8.496098518371582, -8.026034355163574, -7.555970191955566, -7.085906028747559, -6.615841865539551, -6.145777702331543, -5.675713539123535, -5.205649375915527, -4.7355852127075195, -4.265521049499512, -3.795456647872925, -3.325392484664917, -2.855328321456909, -2.3852641582489014, -1.9151999950408936, -1.4451358318328857, -0.9750715494155884, -0.5050073862075806, -0.0349431037902832, 0.4351210594177246, 0.9051852226257324, 1.3752493858337402, 1.845313549041748, 2.315377712249756, 2.7854418754577637, 3.2555060386657715, 3.7255704402923584, 4.195634841918945, 4.665699005126953, 5.135763168334961, 5.605827331542969, 6.075891494750977, 6.545955657958984, 7.016019821166992, 7.486083984375, 7.956148147583008, 8.426212310791016, 8.896276473999023]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 3.0, 5.0, 12.0, 8.0, 14.0, 14.0, 7.0, 18.0, 26.0, 26.0, 29.0, 27.0, 48.0, 59.0, 65.0, 62.0, 51.0, 53.0, 64.0, 51.0, 39.0, 52.0, 36.0, 42.0, 32.0, 29.0, 16.0, 11.0, 21.0, 15.0, 13.0, 13.0, 6.0, 10.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.042323112487793, -9.700469017028809, -9.35861587524414, -9.016761779785156, -8.674907684326172, -8.333054542541504, -7.9912004470825195, -7.649346828460693, -7.307493209838867, -6.965639591217041, -6.623785972595215, -6.2819318771362305, -5.940078258514404, -5.598224639892578, -5.256370544433594, -4.914516925811768, -4.572663307189941, -4.230809688568115, -3.88895583152771, -3.5471019744873047, -3.2052483558654785, -2.8633947372436523, -2.521540880203247, -2.179687023162842, -1.8378334045410156, -1.4959796667099, -1.1541259288787842, -0.8122721910476685, -0.47041845321655273, -0.128564715385437, 0.2132890224456787, 0.555142879486084, 0.8969964981079102, 1.2388502359390259, 1.5807039737701416, 1.9225577116012573, 2.264411449432373, 2.606265068054199, 2.9481189250946045, 3.2899727821350098, 3.631826400756836, 3.973680019378662, 4.315533638000488, 4.657387733459473, 4.999241352081299, 5.341094970703125, 5.682949066162109, 6.0248026847839355, 6.366656303405762, 6.708509922027588, 7.050363540649414, 7.392217636108398, 7.734071254730225, 8.07592487335205, 8.417778968811035, 8.759632110595703, 9.101486206054688, 9.443340301513672, 9.78519344329834, 10.127047538757324, 10.468900680541992, 10.810754776000977, 11.152608871459961, 11.494462966918945, 11.836316108703613]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 2.0, 4.0, 9.0, 9.0, 14.0, 25.0, 30.0, 59.0, 86.0, 156.0, 366.0, 1066.0, 10249.0, 4161453.0, 18468.0, 1358.0, 412.0, 205.0, 118.0, 57.0, 54.0, 25.0, 14.0, 8.0, 8.0, 6.0, 7.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7421875, -5.5711669921875, -5.400146484375, -5.2291259765625, -5.05810546875, -4.8870849609375, -4.716064453125, -4.5450439453125, -4.3740234375, -4.2030029296875, -4.031982421875, -3.8609619140625, -3.68994140625, -3.5189208984375, -3.347900390625, -3.1768798828125, -3.005859375, -2.8348388671875, -2.663818359375, -2.4927978515625, -2.32177734375, -2.1507568359375, -1.979736328125, -1.8087158203125, -1.6376953125, -1.4666748046875, -1.295654296875, -1.1246337890625, -0.95361328125, -0.7825927734375, -0.611572265625, -0.4405517578125, -0.26953125, -0.0985107421875, 0.072509765625, 0.2435302734375, 0.41455078125, 0.5855712890625, 0.756591796875, 0.9276123046875, 1.0986328125, 1.2696533203125, 1.440673828125, 1.6116943359375, 1.78271484375, 1.9537353515625, 2.124755859375, 2.2957763671875, 2.466796875, 2.6378173828125, 2.808837890625, 2.9798583984375, 3.15087890625, 3.3218994140625, 3.492919921875, 3.6639404296875, 3.8349609375, 4.0059814453125, 4.177001953125, 4.3480224609375, 4.51904296875, 4.6900634765625, 4.861083984375, 5.0321044921875, 5.203125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 10.0, 9.0, 8.0, 17.0, 14.0, 22.0, 36.0, 46.0, 47.0, 71.0, 86.0, 81.0, 84.0, 85.0, 77.0, 73.0, 56.0, 47.0, 31.0, 19.0, 18.0, 14.0, 7.0, 8.0, 4.0, 7.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7587890625, -0.7330093383789062, -0.7072296142578125, -0.6814498901367188, -0.655670166015625, -0.6298904418945312, -0.6041107177734375, -0.5783309936523438, -0.55255126953125, -0.5267715454101562, -0.5009918212890625, -0.47521209716796875, -0.449432373046875, -0.42365264892578125, -0.3978729248046875, -0.37209320068359375, -0.3463134765625, -0.32053375244140625, -0.2947540283203125, -0.26897430419921875, -0.243194580078125, -0.21741485595703125, -0.1916351318359375, -0.16585540771484375, -0.14007568359375, -0.11429595947265625, -0.0885162353515625, -0.06273651123046875, -0.036956787109375, -0.01117706298828125, 0.0146026611328125, 0.04038238525390625, 0.066162109375, 0.09194183349609375, 0.1177215576171875, 0.14350128173828125, 0.169281005859375, 0.19506072998046875, 0.2208404541015625, 0.24662017822265625, 0.27239990234375, 0.29817962646484375, 0.3239593505859375, 0.34973907470703125, 0.375518798828125, 0.40129852294921875, 0.4270782470703125, 0.45285797119140625, 0.4786376953125, 0.5044174194335938, 0.5301971435546875, 0.5559768676757812, 0.581756591796875, 0.6075363159179688, 0.6333160400390625, 0.6590957641601562, 0.68487548828125, 0.7106552124023438, 0.7364349365234375, 0.7622146606445312, 0.787994384765625, 0.8137741088867188, 0.8395538330078125, 0.8653335571289062, 0.89111328125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 6.0, 9.0, 19.0, 19.0, 24.0, 19.0, 32.0, 49.0, 59.0, 90.0, 175.0, 283.0, 611.0, 1627.0, 5956.0, 53504.0, 4057124.0, 65111.0, 6404.0, 1721.0, 629.0, 310.0, 160.0, 107.0, 46.0, 55.0, 28.0, 26.0, 20.0, 13.0, 8.0, 5.0, 10.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0], "bins": [-3.171875, -3.0916290283203125, -3.011383056640625, -2.9311370849609375, -2.85089111328125, -2.7706451416015625, -2.690399169921875, -2.6101531982421875, -2.5299072265625, -2.4496612548828125, -2.369415283203125, -2.2891693115234375, -2.20892333984375, -2.1286773681640625, -2.048431396484375, -1.9681854248046875, -1.887939453125, -1.8076934814453125, -1.727447509765625, -1.6472015380859375, -1.56695556640625, -1.4867095947265625, -1.406463623046875, -1.3262176513671875, -1.2459716796875, -1.1657257080078125, -1.085479736328125, -1.0052337646484375, -0.92498779296875, -0.8447418212890625, -0.764495849609375, -0.6842498779296875, -0.60400390625, -0.5237579345703125, -0.443511962890625, -0.3632659912109375, -0.28302001953125, -0.2027740478515625, -0.122528076171875, -0.0422821044921875, 0.0379638671875, 0.1182098388671875, 0.198455810546875, 0.2787017822265625, 0.35894775390625, 0.4391937255859375, 0.519439697265625, 0.5996856689453125, 0.679931640625, 0.7601776123046875, 0.840423583984375, 0.9206695556640625, 1.00091552734375, 1.0811614990234375, 1.161407470703125, 1.2416534423828125, 1.3218994140625, 1.4021453857421875, 1.482391357421875, 1.5626373291015625, 1.64288330078125, 1.7231292724609375, 1.803375244140625, 1.8836212158203125, 1.9638671875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 4.0, 18.0, 37.0, 192.0, 3350.0, 337.0, 82.0, 29.0, 12.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.2841796875, -1.258819580078125, -1.23345947265625, -1.208099365234375, -1.1827392578125, -1.157379150390625, -1.13201904296875, -1.106658935546875, -1.081298828125, -1.055938720703125, -1.03057861328125, -1.005218505859375, -0.9798583984375, -0.954498291015625, -0.92913818359375, -0.903778076171875, -0.87841796875, -0.853057861328125, -0.82769775390625, -0.802337646484375, -0.7769775390625, -0.751617431640625, -0.72625732421875, -0.700897216796875, -0.675537109375, -0.650177001953125, -0.62481689453125, -0.599456787109375, -0.5740966796875, -0.548736572265625, -0.52337646484375, -0.498016357421875, -0.47265625, -0.447296142578125, -0.42193603515625, -0.396575927734375, -0.3712158203125, -0.345855712890625, -0.32049560546875, -0.295135498046875, -0.269775390625, -0.244415283203125, -0.21905517578125, -0.193695068359375, -0.1683349609375, -0.142974853515625, -0.11761474609375, -0.092254638671875, -0.06689453125, -0.041534423828125, -0.01617431640625, 0.009185791015625, 0.0345458984375, 0.059906005859375, 0.08526611328125, 0.110626220703125, 0.135986328125, 0.161346435546875, 0.18670654296875, 0.212066650390625, 0.2374267578125, 0.262786865234375, 0.28814697265625, 0.313507080078125, 0.3388671875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 7.0, 21.0, 44.0, 110.0, 189.0, 171.0, 185.0, 109.0, 77.0, 38.0, 29.0, 8.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.862631320953369, -2.7916030883789062, -2.7205750942230225, -2.6495471000671387, -2.578518867492676, -2.507490634918213, -2.436462640762329, -2.3654346466064453, -2.2944064140319824, -2.2233781814575195, -2.1523501873016357, -2.081322193145752, -2.010293960571289, -1.9392658472061157, -1.8682377338409424, -1.797209620475769, -1.7261815071105957, -1.6551533937454224, -1.584125280380249, -1.5130971670150757, -1.4420690536499023, -1.371040940284729, -1.3000128269195557, -1.2289847135543823, -1.157956600189209, -1.0869284868240356, -1.0159003734588623, -0.944872260093689, -0.8738441467285156, -0.8028160333633423, -0.731787919998169, -0.6607598066329956, -0.5897315740585327, -0.5187034606933594, -0.44767534732818604, -0.3766472339630127, -0.30561912059783936, -0.23459100723266602, -0.16356289386749268, -0.09253478050231934, -0.021506667137145996, 0.049521446228027344, 0.12054955959320068, 0.19157767295837402, 0.26260578632354736, 0.3336338996887207, 0.40466201305389404, 0.4756901264190674, 0.5467182397842407, 0.6177463531494141, 0.6887744665145874, 0.7598025798797607, 0.8308306932449341, 0.9018588066101074, 0.9728869199752808, 1.043915033340454, 1.1149431467056274, 1.1859712600708008, 1.2569993734359741, 1.3280274868011475, 1.3990556001663208, 1.4700837135314941, 1.5411118268966675, 1.6121399402618408, 1.6831680536270142]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 1.0, 13.0, 5.0, 17.0, 20.0, 15.0, 23.0, 28.0, 24.0, 39.0, 39.0, 34.0, 42.0, 48.0, 47.0, 45.0, 37.0, 50.0, 51.0, 39.0, 43.0, 48.0, 43.0, 36.0, 30.0, 36.0, 27.0, 26.0, 15.0, 21.0, 20.0, 11.0, 10.0, 8.0, 6.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.122253179550171, -1.0843738317489624, -1.046494483947754, -1.0086150169372559, -0.9707356691360474, -0.9328563213348389, -0.8949769735336304, -0.8570976257324219, -0.8192182183265686, -0.7813388705253601, -0.7434594631195068, -0.7055801153182983, -0.6677007675170898, -0.6298213601112366, -0.5919420123100281, -0.5540626049041748, -0.5161832571029663, -0.4783038794994354, -0.44042450189590454, -0.40254515409469604, -0.36466577649116516, -0.3267863988876343, -0.2889070510864258, -0.2510276734828949, -0.213148295879364, -0.17526891827583313, -0.13738955557346344, -0.09951018542051315, -0.061630815267562866, -0.023751437664031982, 0.014127925038337708, 0.0520072877407074, 0.08988678455352783, 0.12776616215705872, 0.1656455248594284, 0.2035248875617981, 0.24140426516532898, 0.27928364276885986, 0.31716299057006836, 0.35504236817359924, 0.3929217457771301, 0.430801123380661, 0.4686805009841919, 0.5065598487854004, 0.5444391965866089, 0.5823186039924622, 0.6201979517936707, 0.6580773591995239, 0.6959567070007324, 0.7338360548019409, 0.7717154622077942, 0.8095948100090027, 0.847474217414856, 0.8853535652160645, 0.923232913017273, 0.9611122608184814, 0.9989916682243347, 1.036871075630188, 1.0747504234313965, 1.112629771232605, 1.1505091190338135, 1.1883885860443115, 1.22626793384552, 1.2641472816467285, 1.302026629447937]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 4.0, 8.0, 17.0, 16.0, 21.0, 34.0, 48.0, 87.0, 146.0, 225.0, 363.0, 699.0, 1257.0, 2487.0, 5383.0, 14691.0, 55098.0, 298053.0, 510380.0, 117965.0, 25831.0, 8311.0, 3568.0, 1682.0, 950.0, 447.0, 283.0, 177.0, 102.0, 67.0, 45.0, 30.0, 26.0, 12.0, 7.0, 9.0, 4.0, 7.0, 3.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2099609375, -1.1699371337890625, -1.129913330078125, -1.0898895263671875, -1.04986572265625, -1.0098419189453125, -0.969818115234375, -0.9297943115234375, -0.8897705078125, -0.8497467041015625, -0.809722900390625, -0.7696990966796875, -0.72967529296875, -0.6896514892578125, -0.649627685546875, -0.6096038818359375, -0.569580078125, -0.5295562744140625, -0.489532470703125, -0.4495086669921875, -0.40948486328125, -0.3694610595703125, -0.329437255859375, -0.2894134521484375, -0.2493896484375, -0.2093658447265625, -0.169342041015625, -0.1293182373046875, -0.08929443359375, -0.0492706298828125, -0.009246826171875, 0.0307769775390625, 0.07080078125, 0.1108245849609375, 0.150848388671875, 0.1908721923828125, 0.23089599609375, 0.2709197998046875, 0.310943603515625, 0.3509674072265625, 0.3909912109375, 0.4310150146484375, 0.471038818359375, 0.5110626220703125, 0.55108642578125, 0.5911102294921875, 0.631134033203125, 0.6711578369140625, 0.711181640625, 0.7512054443359375, 0.791229248046875, 0.8312530517578125, 0.87127685546875, 0.9113006591796875, 0.951324462890625, 0.9913482666015625, 1.0313720703125, 1.0713958740234375, 1.111419677734375, 1.1514434814453125, 1.19146728515625, 1.2314910888671875, 1.271514892578125, 1.3115386962890625, 1.3515625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 2.0, 1.0, 7.0, 7.0, 6.0, 9.0, 6.0, 17.0, 20.0, 30.0, 29.0, 47.0, 54.0, 67.0, 70.0, 78.0, 85.0, 79.0, 68.0, 74.0, 67.0, 38.0, 44.0, 28.0, 17.0, 13.0, 14.0, 5.0, 4.0, 2.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.84912109375, -0.82379150390625, -0.7984619140625, -0.77313232421875, -0.747802734375, -0.72247314453125, -0.6971435546875, -0.67181396484375, -0.646484375, -0.62115478515625, -0.5958251953125, -0.57049560546875, -0.545166015625, -0.51983642578125, -0.4945068359375, -0.46917724609375, -0.44384765625, -0.41851806640625, -0.3931884765625, -0.36785888671875, -0.342529296875, -0.31719970703125, -0.2918701171875, -0.26654052734375, -0.2412109375, -0.21588134765625, -0.1905517578125, -0.16522216796875, -0.139892578125, -0.11456298828125, -0.0892333984375, -0.06390380859375, -0.03857421875, -0.01324462890625, 0.0120849609375, 0.03741455078125, 0.062744140625, 0.08807373046875, 0.1134033203125, 0.13873291015625, 0.1640625, 0.18939208984375, 0.2147216796875, 0.24005126953125, 0.265380859375, 0.29071044921875, 0.3160400390625, 0.34136962890625, 0.36669921875, 0.39202880859375, 0.4173583984375, 0.44268798828125, 0.468017578125, 0.49334716796875, 0.5186767578125, 0.54400634765625, 0.5693359375, 0.59466552734375, 0.6199951171875, 0.64532470703125, 0.670654296875, 0.69598388671875, 0.7213134765625, 0.74664306640625, 0.77197265625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 4.0, 7.0, 6.0, 11.0, 16.0, 24.0, 27.0, 39.0, 43.0, 79.0, 125.0, 200.0, 322.0, 621.0, 1509.0, 4917.0, 26302.0, 308866.0, 640025.0, 53411.0, 8043.0, 2132.0, 784.0, 379.0, 224.0, 129.0, 89.0, 63.0, 47.0, 26.0, 16.0, 12.0, 9.0, 9.0, 6.0, 3.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.57421875, -1.516265869140625, -1.45831298828125, -1.400360107421875, -1.3424072265625, -1.284454345703125, -1.22650146484375, -1.168548583984375, -1.110595703125, -1.052642822265625, -0.99468994140625, -0.936737060546875, -0.8787841796875, -0.820831298828125, -0.76287841796875, -0.704925537109375, -0.64697265625, -0.589019775390625, -0.53106689453125, -0.473114013671875, -0.4151611328125, -0.357208251953125, -0.29925537109375, -0.241302490234375, -0.183349609375, -0.125396728515625, -0.06744384765625, -0.009490966796875, 0.0484619140625, 0.106414794921875, 0.16436767578125, 0.222320556640625, 0.2802734375, 0.338226318359375, 0.39617919921875, 0.454132080078125, 0.5120849609375, 0.570037841796875, 0.62799072265625, 0.685943603515625, 0.743896484375, 0.801849365234375, 0.85980224609375, 0.917755126953125, 0.9757080078125, 1.033660888671875, 1.09161376953125, 1.149566650390625, 1.20751953125, 1.265472412109375, 1.32342529296875, 1.381378173828125, 1.4393310546875, 1.497283935546875, 1.55523681640625, 1.613189697265625, 1.671142578125, 1.729095458984375, 1.78704833984375, 1.845001220703125, 1.9029541015625, 1.960906982421875, 2.01885986328125, 2.076812744140625, 2.134765625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 5.0, 11.0, 9.0, 13.0, 19.0, 22.0, 22.0, 26.0, 30.0, 52.0, 44.0, 51.0, 59.0, 62.0, 57.0, 55.0, 40.0, 51.0, 47.0, 51.0, 57.0, 49.0, 29.0, 31.0, 19.0, 16.0, 14.0, 11.0, 9.0, 16.0, 8.0, 6.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.373046875, -2.28228759765625, -2.1915283203125, -2.10076904296875, -2.010009765625, -1.91925048828125, -1.8284912109375, -1.73773193359375, -1.64697265625, -1.55621337890625, -1.4654541015625, -1.37469482421875, -1.283935546875, -1.19317626953125, -1.1024169921875, -1.01165771484375, -0.9208984375, -0.83013916015625, -0.7393798828125, -0.64862060546875, -0.557861328125, -0.46710205078125, -0.3763427734375, -0.28558349609375, -0.19482421875, -0.10406494140625, -0.0133056640625, 0.07745361328125, 0.168212890625, 0.25897216796875, 0.3497314453125, 0.44049072265625, 0.53125, 0.62200927734375, 0.7127685546875, 0.80352783203125, 0.894287109375, 0.98504638671875, 1.0758056640625, 1.16656494140625, 1.25732421875, 1.34808349609375, 1.4388427734375, 1.52960205078125, 1.620361328125, 1.71112060546875, 1.8018798828125, 1.89263916015625, 1.9833984375, 2.07415771484375, 2.1649169921875, 2.25567626953125, 2.346435546875, 2.43719482421875, 2.5279541015625, 2.61871337890625, 2.70947265625, 2.80023193359375, 2.8909912109375, 2.98175048828125, 3.072509765625, 3.16326904296875, 3.2540283203125, 3.34478759765625, 3.435546875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 8.0, 16.0, 25.0, 25.0, 41.0, 82.0, 213.0, 431.0, 1264.0, 6113.0, 196469.0, 823715.0, 16738.0, 2118.0, 656.0, 296.0, 137.0, 70.0, 35.0, 21.0, 24.0, 20.0, 7.0, 7.0, 7.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.501953125, -1.4654922485351562, -1.4290313720703125, -1.3925704956054688, -1.356109619140625, -1.3196487426757812, -1.2831878662109375, -1.2467269897460938, -1.21026611328125, -1.1738052368164062, -1.1373443603515625, -1.1008834838867188, -1.064422607421875, -1.0279617309570312, -0.9915008544921875, -0.9550399780273438, -0.9185791015625, -0.8821182250976562, -0.8456573486328125, -0.8091964721679688, -0.772735595703125, -0.7362747192382812, -0.6998138427734375, -0.6633529663085938, -0.62689208984375, -0.5904312133789062, -0.5539703369140625, -0.5175094604492188, -0.481048583984375, -0.44458770751953125, -0.4081268310546875, -0.37166595458984375, -0.335205078125, -0.29874420166015625, -0.2622833251953125, -0.22582244873046875, -0.189361572265625, -0.15290069580078125, -0.1164398193359375, -0.07997894287109375, -0.04351806640625, -0.00705718994140625, 0.0294036865234375, 0.06586456298828125, 0.102325439453125, 0.13878631591796875, 0.1752471923828125, 0.21170806884765625, 0.2481689453125, 0.28462982177734375, 0.3210906982421875, 0.35755157470703125, 0.394012451171875, 0.43047332763671875, 0.4669342041015625, 0.5033950805664062, 0.53985595703125, 0.5763168334960938, 0.6127777099609375, 0.6492385864257812, 0.685699462890625, 0.7221603393554688, 0.7586212158203125, 0.7950820922851562, 0.83154296875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 7.0, 7.0, 7.0, 18.0, 12.0, 17.0, 22.0, 30.0, 38.0, 46.0, 62.0, 90.0, 88.0, 98.0, 86.0, 77.0, 58.0, 57.0, 40.0, 36.0, 20.0, 20.0, 16.0, 17.0, 5.0, 10.0, 3.0, 6.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0001112818717956543, -0.00010866299271583557, -0.00010604411363601685, -0.00010342523455619812, -0.0001008063554763794, -9.818747639656067e-05, -9.556859731674194e-05, -9.294971823692322e-05, -9.033083915710449e-05, -8.771196007728577e-05, -8.509308099746704e-05, -8.247420191764832e-05, -7.985532283782959e-05, -7.723644375801086e-05, -7.461756467819214e-05, -7.199868559837341e-05, -6.937980651855469e-05, -6.676092743873596e-05, -6.414204835891724e-05, -6.152316927909851e-05, -5.8904290199279785e-05, -5.628541111946106e-05, -5.3666532039642334e-05, -5.104765295982361e-05, -4.842877388000488e-05, -4.580989480018616e-05, -4.319101572036743e-05, -4.0572136640548706e-05, -3.795325756072998e-05, -3.5334378480911255e-05, -3.271549940109253e-05, -3.0096620321273804e-05, -2.7477741241455078e-05, -2.4858862161636353e-05, -2.2239983081817627e-05, -1.96211040019989e-05, -1.7002224922180176e-05, -1.438334584236145e-05, -1.1764466762542725e-05, -9.145587682723999e-06, -6.5267086029052734e-06, -3.907829523086548e-06, -1.2889504432678223e-06, 1.3299286365509033e-06, 3.948807716369629e-06, 6.5676867961883545e-06, 9.18656587600708e-06, 1.1805444955825806e-05, 1.4424324035644531e-05, 1.7043203115463257e-05, 1.9662082195281982e-05, 2.2280961275100708e-05, 2.4899840354919434e-05, 2.751871943473816e-05, 3.0137598514556885e-05, 3.275647759437561e-05, 3.5375356674194336e-05, 3.799423575401306e-05, 4.061311483383179e-05, 4.323199391365051e-05, 4.585087299346924e-05, 4.8469752073287964e-05, 5.108863115310669e-05, 5.3707510232925415e-05, 5.632638931274414e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 11.0, 11.0, 19.0, 20.0, 51.0, 80.0, 140.0, 287.0, 731.0, 2238.0, 11225.0, 232306.0, 764001.0, 31546.0, 3833.0, 1120.0, 451.0, 197.0, 116.0, 56.0, 26.0, 25.0, 10.0, 15.0, 11.0, 7.0, 5.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0], "bins": [-1.216796875, -1.1886367797851562, -1.1604766845703125, -1.1323165893554688, -1.104156494140625, -1.0759963989257812, -1.0478363037109375, -1.0196762084960938, -0.99151611328125, -0.9633560180664062, -0.9351959228515625, -0.9070358276367188, -0.878875732421875, -0.8507156372070312, -0.8225555419921875, -0.7943954467773438, -0.7662353515625, -0.7380752563476562, -0.7099151611328125, -0.6817550659179688, -0.653594970703125, -0.6254348754882812, -0.5972747802734375, -0.5691146850585938, -0.54095458984375, -0.5127944946289062, -0.4846343994140625, -0.45647430419921875, -0.428314208984375, -0.40015411376953125, -0.3719940185546875, -0.34383392333984375, -0.315673828125, -0.28751373291015625, -0.2593536376953125, -0.23119354248046875, -0.203033447265625, -0.17487335205078125, -0.1467132568359375, -0.11855316162109375, -0.09039306640625, -0.06223297119140625, -0.0340728759765625, -0.00591278076171875, 0.022247314453125, 0.05040740966796875, 0.0785675048828125, 0.10672760009765625, 0.1348876953125, 0.16304779052734375, 0.1912078857421875, 0.21936798095703125, 0.247528076171875, 0.27568817138671875, 0.3038482666015625, 0.33200836181640625, 0.36016845703125, 0.38832855224609375, 0.4164886474609375, 0.44464874267578125, 0.472808837890625, 0.5009689331054688, 0.5291290283203125, 0.5572891235351562, 0.58544921875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 6.0, 8.0, 15.0, 20.0, 22.0, 27.0, 40.0, 56.0, 85.0, 85.0, 67.0, 97.0, 96.0, 97.0, 67.0, 49.0, 48.0, 41.0, 25.0, 16.0, 13.0, 3.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.99951171875, -0.9766426086425781, -0.9537734985351562, -0.9309043884277344, -0.9080352783203125, -0.8851661682128906, -0.8622970581054688, -0.8394279479980469, -0.816558837890625, -0.7936897277832031, -0.7708206176757812, -0.7479515075683594, -0.7250823974609375, -0.7022132873535156, -0.6793441772460938, -0.6564750671386719, -0.63360595703125, -0.6107368469238281, -0.5878677368164062, -0.5649986267089844, -0.5421295166015625, -0.5192604064941406, -0.49639129638671875, -0.4735221862792969, -0.450653076171875, -0.4277839660644531, -0.40491485595703125, -0.3820457458496094, -0.3591766357421875, -0.3363075256347656, -0.31343841552734375, -0.2905693054199219, -0.2677001953125, -0.24483108520507812, -0.22196197509765625, -0.19909286499023438, -0.1762237548828125, -0.15335464477539062, -0.13048553466796875, -0.10761642456054688, -0.084747314453125, -0.061878204345703125, -0.03900909423828125, -0.016139984130859375, 0.0067291259765625, 0.029598236083984375, 0.05246734619140625, 0.07533645629882812, 0.09820556640625, 0.12107467651367188, 0.14394378662109375, 0.16681289672851562, 0.1896820068359375, 0.21255111694335938, 0.23542022705078125, 0.2582893371582031, 0.281158447265625, 0.3040275573730469, 0.32689666748046875, 0.3497657775878906, 0.3726348876953125, 0.3955039978027344, 0.41837310791015625, 0.4412422180175781, 0.464111328125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 19.0, 49.0, 138.0, 281.0, 305.0, 156.0, 33.0, 15.0, 5.0, 5.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.938005447387695, -31.27324104309082, -30.608478546142578, -29.943714141845703, -29.278949737548828, -28.614187240600586, -27.94942283630371, -27.28466033935547, -26.619895935058594, -25.95513153076172, -25.290369033813477, -24.6256046295166, -23.96084213256836, -23.296077728271484, -22.63131332397461, -21.966548919677734, -21.301786422729492, -20.637022018432617, -19.972259521484375, -19.3074951171875, -18.642730712890625, -17.977968215942383, -17.313203811645508, -16.648441314697266, -15.98367691040039, -15.318913459777832, -14.654150009155273, -13.989385604858398, -13.32462215423584, -12.659858703613281, -11.995094299316406, -11.330330848693848, -10.665567398071289, -10.00080394744873, -9.336040496826172, -8.671276092529297, -8.006512641906738, -7.34174919128418, -6.676985263824463, -6.012221336364746, -5.3474578857421875, -4.682694435119629, -4.017930507659912, -3.3531668186187744, -2.6884031295776367, -2.023639440536499, -1.3588757514953613, -0.6941118240356445, -0.029348373413085938, 0.6354153156280518, 1.3001790046691895, 1.9649426937103271, 2.629706382751465, 3.2944700717926025, 3.9592337608337402, 4.623997688293457, 5.288761138916016, 5.953524589538574, 6.618288516998291, 7.283052444458008, 7.947815895080566, 8.612579345703125, 9.27734375, 9.942107200622559, 10.606870651245117]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 4.0, 6.0, 7.0, 10.0, 14.0, 11.0, 15.0, 18.0, 13.0, 15.0, 24.0, 26.0, 35.0, 33.0, 40.0, 30.0, 50.0, 49.0, 46.0, 46.0, 60.0, 63.0, 46.0, 47.0, 47.0, 37.0, 30.0, 25.0, 29.0, 29.0, 19.0, 13.0, 10.0, 6.0, 8.0, 11.0, 2.0, 6.0, 5.0, 7.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.832784652709961, -8.520476341247559, -8.208168029785156, -7.895859718322754, -7.583551406860352, -7.271243095397949, -6.958934783935547, -6.6466264724731445, -6.334318161010742, -6.02200984954834, -5.7097015380859375, -5.397393226623535, -5.085084915161133, -4.7727766036987305, -4.460468292236328, -4.148159980773926, -3.8358516693115234, -3.523543357849121, -3.2112350463867188, -2.8989267349243164, -2.586618423461914, -2.2743101119995117, -1.9620018005371094, -1.649693489074707, -1.3373851776123047, -1.0250768661499023, -0.7127685546875, -0.40046024322509766, -0.08815193176269531, 0.22415637969970703, 0.5364646911621094, 0.8487730026245117, 1.161081314086914, 1.4733896255493164, 1.7856979370117188, 2.098006248474121, 2.4103145599365234, 2.722622871398926, 3.034931182861328, 3.3472394943237305, 3.659547805786133, 3.971856117248535, 4.2841644287109375, 4.59647274017334, 4.908781051635742, 5.2210893630981445, 5.533397674560547, 5.845705986022949, 6.158014297485352, 6.470322608947754, 6.782630920410156, 7.094939231872559, 7.407247543334961, 7.719555854797363, 8.031864166259766, 8.344172477722168, 8.65648078918457, 8.968789100646973, 9.281097412109375, 9.593405723571777, 9.90571403503418, 10.218022346496582, 10.530330657958984, 10.842638969421387, 11.154947280883789]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 8.0, 6.0, 6.0, 6.0, 12.0, 17.0, 20.0, 27.0, 49.0, 74.0, 137.0, 408.0, 2496.0, 104479.0, 4075231.0, 9825.0, 898.0, 250.0, 118.0, 68.0, 42.0, 28.0, 19.0, 8.0, 15.0, 9.0, 5.0, 2.0, 4.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.421875, -3.31890869140625, -3.2159423828125, -3.11297607421875, -3.010009765625, -2.90704345703125, -2.8040771484375, -2.70111083984375, -2.59814453125, -2.49517822265625, -2.3922119140625, -2.28924560546875, -2.186279296875, -2.08331298828125, -1.9803466796875, -1.87738037109375, -1.7744140625, -1.67144775390625, -1.5684814453125, -1.46551513671875, -1.362548828125, -1.25958251953125, -1.1566162109375, -1.05364990234375, -0.95068359375, -0.84771728515625, -0.7447509765625, -0.64178466796875, -0.538818359375, -0.43585205078125, -0.3328857421875, -0.22991943359375, -0.126953125, -0.02398681640625, 0.0789794921875, 0.18194580078125, 0.284912109375, 0.38787841796875, 0.4908447265625, 0.59381103515625, 0.69677734375, 0.79974365234375, 0.9027099609375, 1.00567626953125, 1.108642578125, 1.21160888671875, 1.3145751953125, 1.41754150390625, 1.5205078125, 1.62347412109375, 1.7264404296875, 1.82940673828125, 1.932373046875, 2.03533935546875, 2.1383056640625, 2.24127197265625, 2.34423828125, 2.44720458984375, 2.5501708984375, 2.65313720703125, 2.756103515625, 2.85906982421875, 2.9620361328125, 3.06500244140625, 3.16796875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 1.0, 4.0, 9.0, 13.0, 22.0, 30.0, 40.0, 54.0, 66.0, 70.0, 87.0, 80.0, 105.0, 103.0, 78.0, 65.0, 58.0, 46.0, 24.0, 13.0, 12.0, 8.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61474609375, -0.5855484008789062, -0.5563507080078125, -0.5271530151367188, -0.497955322265625, -0.46875762939453125, -0.4395599365234375, -0.41036224365234375, -0.38116455078125, -0.35196685791015625, -0.3227691650390625, -0.29357147216796875, -0.264373779296875, -0.23517608642578125, -0.2059783935546875, -0.17678070068359375, -0.1475830078125, -0.11838531494140625, -0.0891876220703125, -0.05998992919921875, -0.030792236328125, -0.00159454345703125, 0.0276031494140625, 0.05680084228515625, 0.08599853515625, 0.11519622802734375, 0.1443939208984375, 0.17359161376953125, 0.202789306640625, 0.23198699951171875, 0.2611846923828125, 0.29038238525390625, 0.319580078125, 0.34877777099609375, 0.3779754638671875, 0.40717315673828125, 0.436370849609375, 0.46556854248046875, 0.4947662353515625, 0.5239639282226562, 0.55316162109375, 0.5823593139648438, 0.6115570068359375, 0.6407546997070312, 0.669952392578125, 0.6991500854492188, 0.7283477783203125, 0.7575454711914062, 0.7867431640625, 0.8159408569335938, 0.8451385498046875, 0.8743362426757812, 0.903533935546875, 0.9327316284179688, 0.9619293212890625, 0.9911270141601562, 1.02032470703125, 1.0495223999023438, 1.0787200927734375, 1.1079177856445312, 1.137115478515625, 1.1663131713867188, 1.1955108642578125, 1.2247085571289062, 1.25390625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 11.0, 10.0, 4.0, 7.0, 9.0, 16.0, 23.0, 18.0, 20.0, 18.0, 17.0, 29.0, 22.0, 25.0, 20.0, 38.0, 47.0, 57.0, 199.0, 1085.0, 11509.0, 3902513.0, 272754.0, 4767.0, 592.0, 117.0, 49.0, 36.0, 33.0, 30.0, 31.0, 21.0, 21.0, 17.0, 20.0, 10.0, 21.0, 11.0, 11.0, 7.0, 11.0, 10.0, 7.0, 7.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.52734375, -2.442657470703125, -2.35797119140625, -2.273284912109375, -2.1885986328125, -2.103912353515625, -2.01922607421875, -1.934539794921875, -1.849853515625, -1.765167236328125, -1.68048095703125, -1.595794677734375, -1.5111083984375, -1.426422119140625, -1.34173583984375, -1.257049560546875, -1.17236328125, -1.087677001953125, -1.00299072265625, -0.918304443359375, -0.8336181640625, -0.748931884765625, -0.66424560546875, -0.579559326171875, -0.494873046875, -0.410186767578125, -0.32550048828125, -0.240814208984375, -0.1561279296875, -0.071441650390625, 0.01324462890625, 0.097930908203125, 0.1826171875, 0.267303466796875, 0.35198974609375, 0.436676025390625, 0.5213623046875, 0.606048583984375, 0.69073486328125, 0.775421142578125, 0.860107421875, 0.944793701171875, 1.02947998046875, 1.114166259765625, 1.1988525390625, 1.283538818359375, 1.36822509765625, 1.452911376953125, 1.53759765625, 1.622283935546875, 1.70697021484375, 1.791656494140625, 1.8763427734375, 1.961029052734375, 2.04571533203125, 2.130401611328125, 2.215087890625, 2.299774169921875, 2.38446044921875, 2.469146728515625, 2.5538330078125, 2.638519287109375, 2.72320556640625, 2.807891845703125, 2.892578125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 13.0, 49.0, 528.0, 3351.0, 120.0, 21.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.755859375, -3.6890640258789062, -3.6222686767578125, -3.5554733276367188, -3.488677978515625, -3.4218826293945312, -3.3550872802734375, -3.2882919311523438, -3.22149658203125, -3.1547012329101562, -3.0879058837890625, -3.0211105346679688, -2.954315185546875, -2.8875198364257812, -2.8207244873046875, -2.7539291381835938, -2.6871337890625, -2.6203384399414062, -2.5535430908203125, -2.4867477416992188, -2.419952392578125, -2.3531570434570312, -2.2863616943359375, -2.2195663452148438, -2.15277099609375, -2.0859756469726562, -2.0191802978515625, -1.9523849487304688, -1.885589599609375, -1.8187942504882812, -1.7519989013671875, -1.6852035522460938, -1.618408203125, -1.5516128540039062, -1.4848175048828125, -1.4180221557617188, -1.351226806640625, -1.2844314575195312, -1.2176361083984375, -1.1508407592773438, -1.08404541015625, -1.0172500610351562, -0.9504547119140625, -0.8836593627929688, -0.816864013671875, -0.7500686645507812, -0.6832733154296875, -0.6164779663085938, -0.5496826171875, -0.48288726806640625, -0.4160919189453125, -0.34929656982421875, -0.282501220703125, -0.21570587158203125, -0.1489105224609375, -0.08211517333984375, -0.01531982421875, 0.05147552490234375, 0.1182708740234375, 0.18506622314453125, 0.251861572265625, 0.31865692138671875, 0.3854522705078125, 0.45224761962890625, 0.51904296875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 7.0, 14.0, 13.0, 22.0, 41.0, 58.0, 81.0, 107.0, 151.0, 152.0, 124.0, 92.0, 56.0, 29.0, 11.0, 11.0, 7.0, 6.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1278927326202393, -3.0505025386810303, -2.9731123447418213, -2.8957221508026123, -2.8183319568634033, -2.7409417629241943, -2.6635515689849854, -2.5861616134643555, -2.5087714195251465, -2.4313812255859375, -2.3539910316467285, -2.2766008377075195, -2.1992106437683105, -2.1218204498291016, -2.0444302558898926, -1.9670401811599731, -1.8896498680114746, -1.8122596740722656, -1.7348694801330566, -1.6574792861938477, -1.5800890922546387, -1.5026988983154297, -1.4253088235855103, -1.3479186296463013, -1.2705284357070923, -1.1931382417678833, -1.1157480478286743, -1.0383578538894653, -0.9609677195549011, -0.8835775256156921, -0.8061873912811279, -0.728797197341919, -0.65140700340271, -0.574016809463501, -0.4966266453266144, -0.4192364811897278, -0.3418462872505188, -0.2644560933113098, -0.18706592917442322, -0.10967576503753662, -0.03228557109832764, 0.045104607939720154, 0.12249478697776794, 0.19988496601581573, 0.2772751450538635, 0.3546653389930725, 0.4320555031299591, 0.5094456672668457, 0.5868358612060547, 0.6642260551452637, 0.7416162490844727, 0.8190063834190369, 0.8963965773582458, 0.9737867712974548, 1.051176905632019, 1.128567099571228, 1.205957293510437, 1.283347487449646, 1.360737681388855, 1.438127875328064, 1.5155179500579834, 1.5929081439971924, 1.6702983379364014, 1.7476885318756104, 1.8250787258148193]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 2.0, 4.0, 6.0, 7.0, 7.0, 5.0, 8.0, 15.0, 16.0, 9.0, 13.0, 28.0, 21.0, 23.0, 24.0, 27.0, 50.0, 46.0, 39.0, 40.0, 47.0, 53.0, 37.0, 50.0, 47.0, 39.0, 30.0, 39.0, 39.0, 32.0, 34.0, 28.0, 28.0, 20.0, 16.0, 20.0, 11.0, 10.0, 12.0, 8.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.3001372814178467, -2.2286465167999268, -2.157155990600586, -2.085665225982666, -2.014174461364746, -1.9426838159561157, -1.8711931705474854, -1.7997024059295654, -1.7282116413116455, -1.6567209959030151, -1.5852302312850952, -1.5137395858764648, -1.442248821258545, -1.3707581758499146, -1.2992675304412842, -1.2277767658233643, -1.1562861204147339, -1.0847954750061035, -1.0133047103881836, -0.9418140649795532, -0.8703233003616333, -0.7988326549530029, -0.7273419499397278, -0.6558512449264526, -0.5843605399131775, -0.5128698348999023, -0.4413791298866272, -0.36988845467567444, -0.2983977496623993, -0.22690704464912415, -0.1554163694381714, -0.08392566442489624, -0.012434959411621094, 0.059055738151073456, 0.130546435713768, 0.20203712582588196, 0.2735278308391571, 0.34501853585243225, 0.416509211063385, 0.48799991607666016, 0.5594906210899353, 0.6309813261032104, 0.7024720311164856, 0.7739627361297607, 0.8454533815383911, 0.916944146156311, 0.9884347915649414, 1.0599255561828613, 1.1314162015914917, 1.202906847000122, 1.274397611618042, 1.3458882570266724, 1.4173790216445923, 1.4888696670532227, 1.5603604316711426, 1.631851077079773, 1.7033417224884033, 1.7748323678970337, 1.8463231325149536, 1.917813777923584, 1.989304542541504, 2.060795307159424, 2.1322858333587646, 2.2037765979766846, 2.2752673625946045]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 7.0, 5.0, 9.0, 11.0, 17.0, 24.0, 52.0, 70.0, 155.0, 279.0, 779.0, 2798.0, 16932.0, 222410.0, 719642.0, 74821.0, 7926.0, 1652.0, 514.0, 198.0, 94.0, 50.0, 45.0, 18.0, 14.0, 7.0, 4.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.166015625, -2.098968505859375, -2.03192138671875, -1.964874267578125, -1.8978271484375, -1.830780029296875, -1.76373291015625, -1.696685791015625, -1.629638671875, -1.562591552734375, -1.49554443359375, -1.428497314453125, -1.3614501953125, -1.294403076171875, -1.22735595703125, -1.160308837890625, -1.09326171875, -1.026214599609375, -0.95916748046875, -0.892120361328125, -0.8250732421875, -0.758026123046875, -0.69097900390625, -0.623931884765625, -0.556884765625, -0.489837646484375, -0.42279052734375, -0.355743408203125, -0.2886962890625, -0.221649169921875, -0.15460205078125, -0.087554931640625, -0.0205078125, 0.046539306640625, 0.11358642578125, 0.180633544921875, 0.2476806640625, 0.314727783203125, 0.38177490234375, 0.448822021484375, 0.515869140625, 0.582916259765625, 0.64996337890625, 0.717010498046875, 0.7840576171875, 0.851104736328125, 0.91815185546875, 0.985198974609375, 1.05224609375, 1.119293212890625, 1.18634033203125, 1.253387451171875, 1.3204345703125, 1.387481689453125, 1.45452880859375, 1.521575927734375, 1.588623046875, 1.655670166015625, 1.72271728515625, 1.789764404296875, 1.8568115234375, 1.923858642578125, 1.99090576171875, 2.057952880859375, 2.125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 7.0, 12.0, 15.0, 9.0, 10.0, 34.0, 42.0, 46.0, 66.0, 67.0, 54.0, 57.0, 66.0, 72.0, 93.0, 72.0, 54.0, 56.0, 43.0, 42.0, 29.0, 19.0, 5.0, 12.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61181640625, -0.5862350463867188, -0.5606536865234375, -0.5350723266601562, -0.509490966796875, -0.48390960693359375, -0.4583282470703125, -0.43274688720703125, -0.40716552734375, -0.38158416748046875, -0.3560028076171875, -0.33042144775390625, -0.304840087890625, -0.27925872802734375, -0.2536773681640625, -0.22809600830078125, -0.2025146484375, -0.17693328857421875, -0.1513519287109375, -0.12577056884765625, -0.100189208984375, -0.07460784912109375, -0.0490264892578125, -0.02344512939453125, 0.00213623046875, 0.02771759033203125, 0.0532989501953125, 0.07888031005859375, 0.104461669921875, 0.13004302978515625, 0.1556243896484375, 0.18120574951171875, 0.206787109375, 0.23236846923828125, 0.2579498291015625, 0.28353118896484375, 0.309112548828125, 0.33469390869140625, 0.3602752685546875, 0.38585662841796875, 0.41143798828125, 0.43701934814453125, 0.4626007080078125, 0.48818206787109375, 0.513763427734375, 0.5393447875976562, 0.5649261474609375, 0.5905075073242188, 0.6160888671875, 0.6416702270507812, 0.6672515869140625, 0.6928329467773438, 0.718414306640625, 0.7439956665039062, 0.7695770263671875, 0.7951583862304688, 0.82073974609375, 0.8463211059570312, 0.8719024658203125, 0.8974838256835938, 0.923065185546875, 0.9486465454101562, 0.9742279052734375, 0.9998092651367188, 1.025390625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 6.0, 7.0, 15.0, 17.0, 30.0, 32.0, 71.0, 99.0, 186.0, 449.0, 1155.0, 5331.0, 86610.0, 898241.0, 50502.0, 3958.0, 1002.0, 397.0, 183.0, 98.0, 51.0, 32.0, 22.0, 18.0, 21.0, 7.0, 2.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.318359375, -2.23382568359375, -2.1492919921875, -2.06475830078125, -1.980224609375, -1.89569091796875, -1.8111572265625, -1.72662353515625, -1.64208984375, -1.55755615234375, -1.4730224609375, -1.38848876953125, -1.303955078125, -1.21942138671875, -1.1348876953125, -1.05035400390625, -0.9658203125, -0.88128662109375, -0.7967529296875, -0.71221923828125, -0.627685546875, -0.54315185546875, -0.4586181640625, -0.37408447265625, -0.28955078125, -0.20501708984375, -0.1204833984375, -0.03594970703125, 0.048583984375, 0.13311767578125, 0.2176513671875, 0.30218505859375, 0.38671875, 0.47125244140625, 0.5557861328125, 0.64031982421875, 0.724853515625, 0.80938720703125, 0.8939208984375, 0.97845458984375, 1.06298828125, 1.14752197265625, 1.2320556640625, 1.31658935546875, 1.401123046875, 1.48565673828125, 1.5701904296875, 1.65472412109375, 1.7392578125, 1.82379150390625, 1.9083251953125, 1.99285888671875, 2.077392578125, 2.16192626953125, 2.2464599609375, 2.33099365234375, 2.41552734375, 2.50006103515625, 2.5845947265625, 2.66912841796875, 2.753662109375, 2.83819580078125, 2.9227294921875, 3.00726318359375, 3.091796875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 10.0, 5.0, 9.0, 19.0, 19.0, 22.0, 21.0, 25.0, 31.0, 36.0, 32.0, 47.0, 59.0, 59.0, 53.0, 45.0, 50.0, 31.0, 57.0, 49.0, 43.0, 44.0, 42.0, 28.0, 25.0, 24.0, 17.0, 17.0, 15.0, 8.0, 9.0, 11.0, 9.0, 4.0, 6.0, 7.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.21875, -2.14495849609375, -2.0711669921875, -1.99737548828125, -1.923583984375, -1.84979248046875, -1.7760009765625, -1.70220947265625, -1.62841796875, -1.55462646484375, -1.4808349609375, -1.40704345703125, -1.333251953125, -1.25946044921875, -1.1856689453125, -1.11187744140625, -1.0380859375, -0.96429443359375, -0.8905029296875, -0.81671142578125, -0.742919921875, -0.66912841796875, -0.5953369140625, -0.52154541015625, -0.44775390625, -0.37396240234375, -0.3001708984375, -0.22637939453125, -0.152587890625, -0.07879638671875, -0.0050048828125, 0.06878662109375, 0.142578125, 0.21636962890625, 0.2901611328125, 0.36395263671875, 0.437744140625, 0.51153564453125, 0.5853271484375, 0.65911865234375, 0.73291015625, 0.80670166015625, 0.8804931640625, 0.95428466796875, 1.028076171875, 1.10186767578125, 1.1756591796875, 1.24945068359375, 1.3232421875, 1.39703369140625, 1.4708251953125, 1.54461669921875, 1.618408203125, 1.69219970703125, 1.7659912109375, 1.83978271484375, 1.91357421875, 1.98736572265625, 2.0611572265625, 2.13494873046875, 2.208740234375, 2.28253173828125, 2.3563232421875, 2.43011474609375, 2.50390625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 2.0, 5.0, 7.0, 18.0, 30.0, 61.0, 113.0, 202.0, 536.0, 1623.0, 8227.0, 154819.0, 838781.0, 38523.0, 3926.0, 953.0, 365.0, 155.0, 90.0, 59.0, 21.0, 13.0, 5.0, 8.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98828125, -0.963134765625, -0.93798828125, -0.912841796875, -0.8876953125, -0.862548828125, -0.83740234375, -0.812255859375, -0.787109375, -0.761962890625, -0.73681640625, -0.711669921875, -0.6865234375, -0.661376953125, -0.63623046875, -0.611083984375, -0.5859375, -0.560791015625, -0.53564453125, -0.510498046875, -0.4853515625, -0.460205078125, -0.43505859375, -0.409912109375, -0.384765625, -0.359619140625, -0.33447265625, -0.309326171875, -0.2841796875, -0.259033203125, -0.23388671875, -0.208740234375, -0.18359375, -0.158447265625, -0.13330078125, -0.108154296875, -0.0830078125, -0.057861328125, -0.03271484375, -0.007568359375, 0.017578125, 0.042724609375, 0.06787109375, 0.093017578125, 0.1181640625, 0.143310546875, 0.16845703125, 0.193603515625, 0.21875, 0.243896484375, 0.26904296875, 0.294189453125, 0.3193359375, 0.344482421875, 0.36962890625, 0.394775390625, 0.419921875, 0.445068359375, 0.47021484375, 0.495361328125, 0.5205078125, 0.545654296875, 0.57080078125, 0.595947265625, 0.62109375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 5.0, 2.0, 6.0, 8.0, 7.0, 11.0, 8.0, 7.0, 14.0, 11.0, 14.0, 15.0, 20.0, 24.0, 28.0, 28.0, 30.0, 36.0, 49.0, 71.0, 81.0, 85.0, 77.0, 60.0, 56.0, 44.0, 34.0, 25.0, 21.0, 16.0, 23.0, 17.0, 14.0, 7.0, 4.0, 10.0, 3.0, 9.0, 11.0, 2.0, 3.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.711483001708984e-05, -6.490759551525116e-05, -6.270036101341248e-05, -6.049312651157379e-05, -5.828589200973511e-05, -5.607865750789642e-05, -5.387142300605774e-05, -5.1664188504219055e-05, -4.945695400238037e-05, -4.724971950054169e-05, -4.5042484998703e-05, -4.283525049686432e-05, -4.0628015995025635e-05, -3.842078149318695e-05, -3.6213546991348267e-05, -3.400631248950958e-05, -3.17990779876709e-05, -2.9591843485832214e-05, -2.738460898399353e-05, -2.5177374482154846e-05, -2.2970139980316162e-05, -2.0762905478477478e-05, -1.8555670976638794e-05, -1.634843647480011e-05, -1.4141201972961426e-05, -1.1933967471122742e-05, -9.726732969284058e-06, -7.5194984674453735e-06, -5.3122639656066895e-06, -3.1050294637680054e-06, -8.977949619293213e-07, 1.3094395399093628e-06, 3.516674041748047e-06, 5.723908543586731e-06, 7.931143045425415e-06, 1.0138377547264099e-05, 1.2345612049102783e-05, 1.4552846550941467e-05, 1.676008105278015e-05, 1.8967315554618835e-05, 2.117455005645752e-05, 2.3381784558296204e-05, 2.5589019060134888e-05, 2.7796253561973572e-05, 3.0003488063812256e-05, 3.221072256565094e-05, 3.4417957067489624e-05, 3.662519156932831e-05, 3.883242607116699e-05, 4.1039660573005676e-05, 4.324689507484436e-05, 4.5454129576683044e-05, 4.766136407852173e-05, 4.986859858036041e-05, 5.20758330821991e-05, 5.428306758403778e-05, 5.6490302085876465e-05, 5.869753658771515e-05, 6.090477108955383e-05, 6.311200559139252e-05, 6.53192400932312e-05, 6.752647459506989e-05, 6.973370909690857e-05, 7.194094359874725e-05, 7.414817810058594e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 7.0, 6.0, 9.0, 19.0, 44.0, 79.0, 226.0, 426.0, 1267.0, 6433.0, 153087.0, 854374.0, 28615.0, 2732.0, 740.0, 248.0, 123.0, 55.0, 23.0, 12.0, 10.0, 9.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.2421875, -1.2128067016601562, -1.1834259033203125, -1.1540451049804688, -1.124664306640625, -1.0952835083007812, -1.0659027099609375, -1.0365219116210938, -1.00714111328125, -0.9777603149414062, -0.9483795166015625, -0.9189987182617188, -0.889617919921875, -0.8602371215820312, -0.8308563232421875, -0.8014755249023438, -0.7720947265625, -0.7427139282226562, -0.7133331298828125, -0.6839523315429688, -0.654571533203125, -0.6251907348632812, -0.5958099365234375, -0.5664291381835938, -0.53704833984375, -0.5076675415039062, -0.4782867431640625, -0.44890594482421875, -0.419525146484375, -0.39014434814453125, -0.3607635498046875, -0.33138275146484375, -0.302001953125, -0.27262115478515625, -0.2432403564453125, -0.21385955810546875, -0.184478759765625, -0.15509796142578125, -0.1257171630859375, -0.09633636474609375, -0.06695556640625, -0.03757476806640625, -0.0081939697265625, 0.02118682861328125, 0.050567626953125, 0.07994842529296875, 0.1093292236328125, 0.13871002197265625, 0.1680908203125, 0.19747161865234375, 0.2268524169921875, 0.25623321533203125, 0.285614013671875, 0.31499481201171875, 0.3443756103515625, 0.37375640869140625, 0.40313720703125, 0.43251800537109375, 0.4618988037109375, 0.49127960205078125, 0.520660400390625, 0.5500411987304688, 0.5794219970703125, 0.6088027954101562, 0.63818359375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 8.0, 9.0, 7.0, 12.0, 12.0, 21.0, 18.0, 40.0, 44.0, 41.0, 67.0, 77.0, 98.0, 90.0, 83.0, 90.0, 67.0, 53.0, 47.0, 34.0, 19.0, 22.0, 10.0, 6.0, 7.0, 9.0, 1.0, 1.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77490234375, -0.7567977905273438, -0.7386932373046875, -0.7205886840820312, -0.702484130859375, -0.6843795776367188, -0.6662750244140625, -0.6481704711914062, -0.63006591796875, -0.6119613647460938, -0.5938568115234375, -0.5757522583007812, -0.557647705078125, -0.5395431518554688, -0.5214385986328125, -0.5033340454101562, -0.4852294921875, -0.46712493896484375, -0.4490203857421875, -0.43091583251953125, -0.412811279296875, -0.39470672607421875, -0.3766021728515625, -0.35849761962890625, -0.34039306640625, -0.32228851318359375, -0.3041839599609375, -0.28607940673828125, -0.267974853515625, -0.24987030029296875, -0.2317657470703125, -0.21366119384765625, -0.195556640625, -0.17745208740234375, -0.1593475341796875, -0.14124298095703125, -0.123138427734375, -0.10503387451171875, -0.0869293212890625, -0.06882476806640625, -0.05072021484375, -0.03261566162109375, -0.0145111083984375, 0.00359344482421875, 0.021697998046875, 0.03980255126953125, 0.0579071044921875, 0.07601165771484375, 0.0941162109375, 0.11222076416015625, 0.1303253173828125, 0.14842987060546875, 0.166534423828125, 0.18463897705078125, 0.2027435302734375, 0.22084808349609375, 0.23895263671875, 0.25705718994140625, 0.2751617431640625, 0.29326629638671875, 0.311370849609375, 0.32947540283203125, 0.3475799560546875, 0.36568450927734375, 0.3837890625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 8.0, 32.0, 120.0, 304.0, 303.0, 154.0, 50.0, 20.0, 10.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.424694061279297, -27.75035285949707, -27.076013565063477, -26.40167236328125, -25.727333068847656, -25.05299186706543, -24.378650665283203, -23.70431137084961, -23.029972076416016, -22.35563087463379, -21.681291580200195, -21.00695037841797, -20.332611083984375, -19.65826988220215, -18.983928680419922, -18.309589385986328, -17.6352481842041, -16.960906982421875, -16.28656768798828, -15.612226486206055, -14.937887191772461, -14.263545989990234, -13.589205741882324, -12.914865493774414, -12.240525245666504, -11.566184997558594, -10.891844749450684, -10.217504501342773, -9.543163299560547, -8.868824005126953, -8.194482803344727, -7.520142555236816, -6.845800399780273, -6.171460151672363, -5.497119903564453, -4.822779178619385, -4.148438930511475, -3.4740986824035645, -2.799757957458496, -2.125417709350586, -1.4510774612426758, -0.7767370939254761, -0.10239672660827637, 0.5719437599182129, 1.246284008026123, 1.9206242561340332, 2.5949649810791016, 3.2693052291870117, 3.943645477294922, 4.617985725402832, 5.292325973510742, 5.9666666984558105, 6.641006946563721, 7.315347194671631, 7.989687919616699, 8.66402816772461, 9.33836841583252, 10.01270866394043, 10.68704891204834, 11.36138916015625, 12.035730361938477, 12.71006965637207, 13.384410858154297, 14.058751106262207, 14.733091354370117]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 1.0, 1.0, 3.0, 5.0, 12.0, 13.0, 22.0, 19.0, 20.0, 24.0, 31.0, 40.0, 36.0, 46.0, 57.0, 53.0, 56.0, 53.0, 50.0, 49.0, 42.0, 52.0, 49.0, 36.0, 48.0, 30.0, 24.0, 26.0, 27.0, 17.0, 15.0, 11.0, 5.0, 5.0, 5.0, 6.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.631057739257812, -9.301653861999512, -8.972249984741211, -8.64284610748291, -8.31344223022461, -7.984038352966309, -7.654634475708008, -7.325230598449707, -6.995826721191406, -6.6664228439331055, -6.337018966674805, -6.007615089416504, -5.678211212158203, -5.348807334899902, -5.019403457641602, -4.689999580383301, -4.360596179962158, -4.031192302703857, -3.7017884254455566, -3.372384548187256, -3.042980670928955, -2.7135767936706543, -2.3841731548309326, -2.054769277572632, -1.725365400314331, -1.3959615230560303, -1.0665576457977295, -0.7371538877487183, -0.4077500104904175, -0.0783461332321167, 0.25105762481689453, 0.5804615020751953, 0.9098653793334961, 1.2392692565917969, 1.5686731338500977, 1.8980768918991089, 2.227480888366699, 2.556884765625, 2.8862884044647217, 3.2156922817230225, 3.5450961589813232, 3.874500036239624, 4.203903675079346, 4.5333075523376465, 4.862711429595947, 5.192115306854248, 5.521519184112549, 5.85092306137085, 6.18032693862915, 6.509730815887451, 6.839134693145752, 7.168538570404053, 7.4979424476623535, 7.827346324920654, 8.156749725341797, 8.486153602600098, 8.815557479858398, 9.1449613571167, 9.474365234375, 9.8037691116333, 10.133172988891602, 10.462576866149902, 10.791980743408203, 11.121384620666504, 11.450788497924805]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 11.0, 8.0, 8.0, 18.0, 25.0, 41.0, 48.0, 91.0, 195.0, 453.0, 1229.0, 4910.0, 41774.0, 3314457.0, 809687.0, 16960.0, 2841.0, 865.0, 286.0, 131.0, 77.0, 50.0, 35.0, 26.0, 13.0, 10.0, 4.0, 3.0, 4.0, 4.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3544921875, -1.3075103759765625, -1.260528564453125, -1.2135467529296875, -1.16656494140625, -1.1195831298828125, -1.072601318359375, -1.0256195068359375, -0.9786376953125, -0.9316558837890625, -0.884674072265625, -0.8376922607421875, -0.79071044921875, -0.7437286376953125, -0.696746826171875, -0.6497650146484375, -0.602783203125, -0.5558013916015625, -0.508819580078125, -0.4618377685546875, -0.41485595703125, -0.3678741455078125, -0.320892333984375, -0.2739105224609375, -0.2269287109375, -0.1799468994140625, -0.132965087890625, -0.0859832763671875, -0.03900146484375, 0.0079803466796875, 0.054962158203125, 0.1019439697265625, 0.14892578125, 0.1959075927734375, 0.242889404296875, 0.2898712158203125, 0.33685302734375, 0.3838348388671875, 0.430816650390625, 0.4777984619140625, 0.5247802734375, 0.5717620849609375, 0.618743896484375, 0.6657257080078125, 0.71270751953125, 0.7596893310546875, 0.806671142578125, 0.8536529541015625, 0.900634765625, 0.9476165771484375, 0.994598388671875, 1.0415802001953125, 1.08856201171875, 1.1355438232421875, 1.182525634765625, 1.2295074462890625, 1.2764892578125, 1.3234710693359375, 1.370452880859375, 1.4174346923828125, 1.46441650390625, 1.5113983154296875, 1.558380126953125, 1.6053619384765625, 1.65234375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 7.0, 10.0, 10.0, 13.0, 8.0, 19.0, 27.0, 24.0, 39.0, 34.0, 43.0, 44.0, 41.0, 50.0, 50.0, 61.0, 52.0, 58.0, 54.0, 38.0, 52.0, 44.0, 44.0, 30.0, 28.0, 28.0, 18.0, 15.0, 14.0, 16.0, 6.0, 7.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.6337890625, -0.6171379089355469, -0.6004867553710938, -0.5838356018066406, -0.5671844482421875, -0.5505332946777344, -0.5338821411132812, -0.5172309875488281, -0.500579833984375, -0.4839286804199219, -0.46727752685546875, -0.4506263732910156, -0.4339752197265625, -0.4173240661621094, -0.40067291259765625, -0.3840217590332031, -0.36737060546875, -0.3507194519042969, -0.33406829833984375, -0.3174171447753906, -0.3007659912109375, -0.2841148376464844, -0.26746368408203125, -0.2508125305175781, -0.234161376953125, -0.21751022338867188, -0.20085906982421875, -0.18420791625976562, -0.1675567626953125, -0.15090560913085938, -0.13425445556640625, -0.11760330200195312, -0.1009521484375, -0.08430099487304688, -0.06764984130859375, -0.050998687744140625, -0.0343475341796875, -0.017696380615234375, -0.00104522705078125, 0.015605926513671875, 0.032257080078125, 0.048908233642578125, 0.06555938720703125, 0.08221054077148438, 0.0988616943359375, 0.11551284790039062, 0.13216400146484375, 0.14881515502929688, 0.16546630859375, 0.18211746215820312, 0.19876861572265625, 0.21541976928710938, 0.2320709228515625, 0.24872207641601562, 0.26537322998046875, 0.2820243835449219, 0.298675537109375, 0.3153266906738281, 0.33197784423828125, 0.3486289978027344, 0.3652801513671875, 0.3819313049316406, 0.39858245849609375, 0.4152336120605469, 0.431884765625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 15.0, 47.0, 78.0, 155.0, 580.0, 68044.0, 4121791.0, 2990.0, 341.0, 140.0, 63.0, 29.0, 11.0, 5.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3984375, -4.25762939453125, -4.1168212890625, -3.97601318359375, -3.835205078125, -3.69439697265625, -3.5535888671875, -3.41278076171875, -3.27197265625, -3.13116455078125, -2.9903564453125, -2.84954833984375, -2.708740234375, -2.56793212890625, -2.4271240234375, -2.28631591796875, -2.1455078125, -2.00469970703125, -1.8638916015625, -1.72308349609375, -1.582275390625, -1.44146728515625, -1.3006591796875, -1.15985107421875, -1.01904296875, -0.87823486328125, -0.7374267578125, -0.59661865234375, -0.455810546875, -0.31500244140625, -0.1741943359375, -0.03338623046875, 0.107421875, 0.24822998046875, 0.3890380859375, 0.52984619140625, 0.670654296875, 0.81146240234375, 0.9522705078125, 1.09307861328125, 1.23388671875, 1.37469482421875, 1.5155029296875, 1.65631103515625, 1.797119140625, 1.93792724609375, 2.0787353515625, 2.21954345703125, 2.3603515625, 2.50115966796875, 2.6419677734375, 2.78277587890625, 2.923583984375, 3.06439208984375, 3.2052001953125, 3.34600830078125, 3.48681640625, 3.62762451171875, 3.7684326171875, 3.90924072265625, 4.050048828125, 4.19085693359375, 4.3316650390625, 4.47247314453125, 4.61328125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 8.0, 7.0, 16.0, 27.0, 58.0, 181.0, 914.0, 1950.0, 653.0, 169.0, 49.0, 26.0, 11.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88671875, -0.80902099609375, -0.7313232421875, -0.65362548828125, -0.575927734375, -0.49822998046875, -0.4205322265625, -0.34283447265625, -0.26513671875, -0.18743896484375, -0.1097412109375, -0.03204345703125, 0.045654296875, 0.12335205078125, 0.2010498046875, 0.27874755859375, 0.3564453125, 0.43414306640625, 0.5118408203125, 0.58953857421875, 0.667236328125, 0.74493408203125, 0.8226318359375, 0.90032958984375, 0.97802734375, 1.05572509765625, 1.1334228515625, 1.21112060546875, 1.288818359375, 1.36651611328125, 1.4442138671875, 1.52191162109375, 1.599609375, 1.67730712890625, 1.7550048828125, 1.83270263671875, 1.910400390625, 1.98809814453125, 2.0657958984375, 2.14349365234375, 2.22119140625, 2.29888916015625, 2.3765869140625, 2.45428466796875, 2.531982421875, 2.60968017578125, 2.6873779296875, 2.76507568359375, 2.8427734375, 2.92047119140625, 2.9981689453125, 3.07586669921875, 3.153564453125, 3.23126220703125, 3.3089599609375, 3.38665771484375, 3.46435546875, 3.54205322265625, 3.6197509765625, 3.69744873046875, 3.775146484375, 3.85284423828125, 3.9305419921875, 4.00823974609375, 4.0859375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 38.0, 100.0, 180.0, 244.0, 193.0, 121.0, 53.0, 25.0, 14.0, 7.0, 12.0, 6.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.732222557067871, -8.398841857910156, -8.065462112426758, -7.732081413269043, -7.3987016677856445, -7.06532096862793, -6.731940746307373, -6.398560523986816, -6.06518030166626, -5.731800079345703, -5.3984198570251465, -5.06503963470459, -4.731658935546875, -4.398279190063477, -4.064898490905762, -3.731518268585205, -3.3981380462646484, -3.064757823944092, -2.731377601623535, -2.3979971408843994, -2.0646169185638428, -1.7312366962432861, -1.3978562355041504, -1.0644760131835938, -0.7310957908630371, -0.3977155089378357, -0.06433522701263428, 0.2690451145172119, 0.6024253368377686, 0.9358055591583252, 1.269186019897461, 1.6025662422180176, 1.9359464645385742, 2.269326686859131, 2.6027069091796875, 2.9360873699188232, 3.26946759223938, 3.6028478145599365, 3.9362282752990723, 4.269608497619629, 4.6029887199401855, 4.936368942260742, 5.269749164581299, 5.6031293869018555, 5.93651008605957, 6.269889831542969, 6.603270530700684, 6.93665075302124, 7.270030975341797, 7.6034111976623535, 7.93679141998291, 8.270172119140625, 8.603551864624023, 8.936932563781738, 9.270313262939453, 9.603693008422852, 9.93707275390625, 10.270453453063965, 10.603833198547363, 10.937213897705078, 11.270593643188477, 11.603974342346191, 11.937355041503906, 12.270734786987305, 12.60411548614502]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 7.0, 3.0, 3.0, 9.0, 11.0, 10.0, 13.0, 16.0, 17.0, 20.0, 31.0, 30.0, 30.0, 25.0, 42.0, 42.0, 44.0, 46.0, 46.0, 54.0, 39.0, 58.0, 41.0, 41.0, 41.0, 35.0, 36.0, 35.0, 32.0, 23.0, 16.0, 21.0, 14.0, 14.0, 13.0, 8.0, 10.0, 11.0, 3.0, 7.0, 0.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.711890697479248, -4.555419445037842, -4.3989481925964355, -4.242476940155029, -4.086006164550781, -3.929534673690796, -3.7730636596679688, -3.6165924072265625, -3.4601211547851562, -3.30364990234375, -3.1471786499023438, -2.9907076358795166, -2.8342363834381104, -2.677765130996704, -2.521294116973877, -2.3648228645324707, -2.2083516120910645, -2.051880359649658, -1.8954092264175415, -1.7389380931854248, -1.5824668407440186, -1.4259955883026123, -1.2695244550704956, -1.113053321838379, -0.9565820693969727, -0.8001108765602112, -0.6436396837234497, -0.48716849088668823, -0.33069729804992676, -0.17422610521316528, -0.01775491237640381, 0.1387162208557129, 0.29518795013427734, 0.4516591429710388, 0.6081303358078003, 0.7646015286445618, 0.9210727214813232, 1.0775439739227295, 1.2340151071548462, 1.390486240386963, 1.5469574928283691, 1.7034287452697754, 1.859899878501892, 2.016371011734009, 2.172842264175415, 2.3293135166168213, 2.4857845306396484, 2.6422557830810547, 2.798727035522461, 2.955198287963867, 3.1116695404052734, 3.2681405544281006, 3.424611806869507, 3.581083059310913, 3.7375540733337402, 3.8940253257751465, 4.050496578216553, 4.206967830657959, 4.363439083099365, 4.5199103355407715, 4.6763811111450195, 4.832852363586426, 4.989323616027832, 5.145794868469238, 5.3022661209106445]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 7.0, 6.0, 10.0, 13.0, 14.0, 19.0, 32.0, 41.0, 50.0, 77.0, 115.0, 173.0, 283.0, 444.0, 754.0, 1188.0, 2091.0, 3552.0, 6615.0, 12515.0, 25088.0, 51888.0, 110361.0, 230238.0, 291543.0, 161858.0, 75238.0, 35902.0, 17622.0, 9018.0, 4897.0, 2736.0, 1619.0, 942.0, 571.0, 381.0, 227.0, 139.0, 102.0, 65.0, 36.0, 28.0, 18.0, 19.0, 9.0, 9.0, 3.0, 3.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.44921875, -0.43386077880859375, -0.4185028076171875, -0.40314483642578125, -0.387786865234375, -0.37242889404296875, -0.3570709228515625, -0.34171295166015625, -0.32635498046875, -0.31099700927734375, -0.2956390380859375, -0.28028106689453125, -0.264923095703125, -0.24956512451171875, -0.2342071533203125, -0.21884918212890625, -0.2034912109375, -0.18813323974609375, -0.1727752685546875, -0.15741729736328125, -0.142059326171875, -0.12670135498046875, -0.1113433837890625, -0.09598541259765625, -0.08062744140625, -0.06526947021484375, -0.0499114990234375, -0.03455352783203125, -0.019195556640625, -0.00383758544921875, 0.0115203857421875, 0.02687835693359375, 0.042236328125, 0.05759429931640625, 0.0729522705078125, 0.08831024169921875, 0.103668212890625, 0.11902618408203125, 0.1343841552734375, 0.14974212646484375, 0.16510009765625, 0.18045806884765625, 0.1958160400390625, 0.21117401123046875, 0.226531982421875, 0.24188995361328125, 0.2572479248046875, 0.27260589599609375, 0.2879638671875, 0.30332183837890625, 0.3186798095703125, 0.33403778076171875, 0.349395751953125, 0.36475372314453125, 0.3801116943359375, 0.39546966552734375, 0.41082763671875, 0.42618560791015625, 0.4415435791015625, 0.45690155029296875, 0.472259521484375, 0.48761749267578125, 0.5029754638671875, 0.5183334350585938, 0.53369140625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 6.0, 3.0, 4.0, 6.0, 7.0, 19.0, 13.0, 19.0, 31.0, 37.0, 41.0, 59.0, 41.0, 48.0, 45.0, 57.0, 55.0, 67.0, 60.0, 53.0, 63.0, 53.0, 41.0, 38.0, 26.0, 21.0, 26.0, 21.0, 17.0, 9.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.65380859375, -0.6359977722167969, -0.6181869506835938, -0.6003761291503906, -0.5825653076171875, -0.5647544860839844, -0.5469436645507812, -0.5291328430175781, -0.511322021484375, -0.4935111999511719, -0.47570037841796875, -0.4578895568847656, -0.4400787353515625, -0.4222679138183594, -0.40445709228515625, -0.3866462707519531, -0.36883544921875, -0.3510246276855469, -0.33321380615234375, -0.3154029846191406, -0.2975921630859375, -0.2797813415527344, -0.26197052001953125, -0.24415969848632812, -0.226348876953125, -0.20853805541992188, -0.19072723388671875, -0.17291641235351562, -0.1551055908203125, -0.13729476928710938, -0.11948394775390625, -0.10167312622070312, -0.0838623046875, -0.06605148315429688, -0.04824066162109375, -0.030429840087890625, -0.0126190185546875, 0.005191802978515625, 0.02300262451171875, 0.040813446044921875, 0.058624267578125, 0.07643508911132812, 0.09424591064453125, 0.11205673217773438, 0.1298675537109375, 0.14767837524414062, 0.16548919677734375, 0.18330001831054688, 0.20111083984375, 0.21892166137695312, 0.23673248291015625, 0.2545433044433594, 0.2723541259765625, 0.2901649475097656, 0.30797576904296875, 0.3257865905761719, 0.343597412109375, 0.3614082336425781, 0.37921905517578125, 0.3970298767089844, 0.4148406982421875, 0.4326515197753906, 0.45046234130859375, 0.4682731628417969, 0.486083984375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 4.0, 10.0, 7.0, 5.0, 19.0, 16.0, 25.0, 35.0, 46.0, 88.0, 121.0, 187.0, 306.0, 552.0, 913.0, 1765.0, 5179.0, 27455.0, 300327.0, 643400.0, 54743.0, 8239.0, 2376.0, 1089.0, 606.0, 324.0, 213.0, 151.0, 110.0, 70.0, 41.0, 38.0, 19.0, 13.0, 12.0, 13.0, 6.0, 13.0, 5.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-1.3779296875, -1.3350830078125, -1.292236328125, -1.2493896484375, -1.20654296875, -1.1636962890625, -1.120849609375, -1.0780029296875, -1.03515625, -0.9923095703125, -0.949462890625, -0.9066162109375, -0.86376953125, -0.8209228515625, -0.778076171875, -0.7352294921875, -0.6923828125, -0.6495361328125, -0.606689453125, -0.5638427734375, -0.52099609375, -0.4781494140625, -0.435302734375, -0.3924560546875, -0.349609375, -0.3067626953125, -0.263916015625, -0.2210693359375, -0.17822265625, -0.1353759765625, -0.092529296875, -0.0496826171875, -0.0068359375, 0.0360107421875, 0.078857421875, 0.1217041015625, 0.16455078125, 0.2073974609375, 0.250244140625, 0.2930908203125, 0.3359375, 0.3787841796875, 0.421630859375, 0.4644775390625, 0.50732421875, 0.5501708984375, 0.593017578125, 0.6358642578125, 0.6787109375, 0.7215576171875, 0.764404296875, 0.8072509765625, 0.85009765625, 0.8929443359375, 0.935791015625, 0.9786376953125, 1.021484375, 1.0643310546875, 1.107177734375, 1.1500244140625, 1.19287109375, 1.2357177734375, 1.278564453125, 1.3214111328125, 1.3642578125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 5.0, 10.0, 12.0, 10.0, 29.0, 29.0, 30.0, 29.0, 42.0, 56.0, 60.0, 49.0, 61.0, 74.0, 68.0, 67.0, 49.0, 55.0, 52.0, 44.0, 41.0, 35.0, 22.0, 15.0, 17.0, 12.0, 9.0, 5.0, 5.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1640625, -3.082794189453125, -3.00152587890625, -2.920257568359375, -2.8389892578125, -2.757720947265625, -2.67645263671875, -2.595184326171875, -2.513916015625, -2.432647705078125, -2.35137939453125, -2.270111083984375, -2.1888427734375, -2.107574462890625, -2.02630615234375, -1.945037841796875, -1.86376953125, -1.782501220703125, -1.70123291015625, -1.619964599609375, -1.5386962890625, -1.457427978515625, -1.37615966796875, -1.294891357421875, -1.213623046875, -1.132354736328125, -1.05108642578125, -0.969818115234375, -0.8885498046875, -0.807281494140625, -0.72601318359375, -0.644744873046875, -0.5634765625, -0.482208251953125, -0.40093994140625, -0.319671630859375, -0.2384033203125, -0.157135009765625, -0.07586669921875, 0.005401611328125, 0.086669921875, 0.167938232421875, 0.24920654296875, 0.330474853515625, 0.4117431640625, 0.493011474609375, 0.57427978515625, 0.655548095703125, 0.73681640625, 0.818084716796875, 0.89935302734375, 0.980621337890625, 1.0618896484375, 1.143157958984375, 1.22442626953125, 1.305694580078125, 1.386962890625, 1.468231201171875, 1.54949951171875, 1.630767822265625, 1.7120361328125, 1.793304443359375, 1.87457275390625, 1.955841064453125, 2.037109375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 7.0, 9.0, 12.0, 11.0, 25.0, 25.0, 52.0, 93.0, 247.0, 548.0, 1897.0, 12385.0, 358469.0, 654803.0, 16470.0, 2367.0, 619.0, 237.0, 119.0, 59.0, 30.0, 18.0, 14.0, 12.0, 5.0, 6.0, 6.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0556640625, -1.0255508422851562, -0.9954376220703125, -0.9653244018554688, -0.935211181640625, -0.9050979614257812, -0.8749847412109375, -0.8448715209960938, -0.81475830078125, -0.7846450805664062, -0.7545318603515625, -0.7244186401367188, -0.694305419921875, -0.6641921997070312, -0.6340789794921875, -0.6039657592773438, -0.5738525390625, -0.5437393188476562, -0.5136260986328125, -0.48351287841796875, -0.453399658203125, -0.42328643798828125, -0.3931732177734375, -0.36305999755859375, -0.33294677734375, -0.30283355712890625, -0.2727203369140625, -0.24260711669921875, -0.212493896484375, -0.18238067626953125, -0.1522674560546875, -0.12215423583984375, -0.092041015625, -0.06192779541015625, -0.0318145751953125, -0.00170135498046875, 0.028411865234375, 0.05852508544921875, 0.0886383056640625, 0.11875152587890625, 0.14886474609375, 0.17897796630859375, 0.2090911865234375, 0.23920440673828125, 0.269317626953125, 0.29943084716796875, 0.3295440673828125, 0.35965728759765625, 0.3897705078125, 0.41988372802734375, 0.4499969482421875, 0.48011016845703125, 0.510223388671875, 0.5403366088867188, 0.5704498291015625, 0.6005630493164062, 0.63067626953125, 0.6607894897460938, 0.6909027099609375, 0.7210159301757812, 0.751129150390625, 0.7812423706054688, 0.8113555908203125, 0.8414688110351562, 0.87158203125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 4.0, 6.0, 2.0, 0.0, 8.0, 7.0, 8.0, 7.0, 6.0, 10.0, 9.0, 11.0, 18.0, 17.0, 15.0, 24.0, 31.0, 35.0, 54.0, 68.0, 114.0, 108.0, 107.0, 74.0, 54.0, 36.0, 17.0, 21.0, 17.0, 15.0, 10.0, 14.0, 12.0, 10.0, 5.0, 6.0, 10.0, 2.0, 6.0, 5.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.749961853027344e-05, -8.472800254821777e-05, -8.195638656616211e-05, -7.918477058410645e-05, -7.641315460205078e-05, -7.364153861999512e-05, -7.086992263793945e-05, -6.809830665588379e-05, -6.532669067382812e-05, -6.255507469177246e-05, -5.97834587097168e-05, -5.701184272766113e-05, -5.424022674560547e-05, -5.1468610763549805e-05, -4.869699478149414e-05, -4.5925378799438477e-05, -4.315376281738281e-05, -4.038214683532715e-05, -3.7610530853271484e-05, -3.483891487121582e-05, -3.2067298889160156e-05, -2.9295682907104492e-05, -2.6524066925048828e-05, -2.3752450942993164e-05, -2.09808349609375e-05, -1.8209218978881836e-05, -1.5437602996826172e-05, -1.2665987014770508e-05, -9.894371032714844e-06, -7.12275505065918e-06, -4.351139068603516e-06, -1.5795230865478516e-06, 1.1920928955078125e-06, 3.9637088775634766e-06, 6.735324859619141e-06, 9.506940841674805e-06, 1.2278556823730469e-05, 1.5050172805786133e-05, 1.7821788787841797e-05, 2.059340476989746e-05, 2.3365020751953125e-05, 2.613663673400879e-05, 2.8908252716064453e-05, 3.167986869812012e-05, 3.445148468017578e-05, 3.7223100662231445e-05, 3.999471664428711e-05, 4.2766332626342773e-05, 4.553794860839844e-05, 4.83095645904541e-05, 5.1081180572509766e-05, 5.385279655456543e-05, 5.6624412536621094e-05, 5.939602851867676e-05, 6.216764450073242e-05, 6.493926048278809e-05, 6.771087646484375e-05, 7.048249244689941e-05, 7.325410842895508e-05, 7.602572441101074e-05, 7.87973403930664e-05, 8.156895637512207e-05, 8.434057235717773e-05, 8.71121883392334e-05, 8.988380432128906e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 6.0, 5.0, 12.0, 12.0, 19.0, 28.0, 40.0, 50.0, 66.0, 126.0, 204.0, 318.0, 548.0, 1078.0, 2820.0, 10175.0, 63174.0, 728697.0, 209250.0, 23144.0, 5164.0, 1802.0, 755.0, 414.0, 226.0, 147.0, 95.0, 63.0, 28.0, 30.0, 22.0, 3.0, 6.0, 7.0, 5.0, 5.0, 5.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6630859375, -0.6428375244140625, -0.622589111328125, -0.6023406982421875, -0.58209228515625, -0.5618438720703125, -0.541595458984375, -0.5213470458984375, -0.5010986328125, -0.4808502197265625, -0.460601806640625, -0.4403533935546875, -0.42010498046875, -0.3998565673828125, -0.379608154296875, -0.3593597412109375, -0.339111328125, -0.3188629150390625, -0.298614501953125, -0.2783660888671875, -0.25811767578125, -0.2378692626953125, -0.217620849609375, -0.1973724365234375, -0.1771240234375, -0.1568756103515625, -0.136627197265625, -0.1163787841796875, -0.09613037109375, -0.0758819580078125, -0.055633544921875, -0.0353851318359375, -0.01513671875, 0.0051116943359375, 0.025360107421875, 0.0456085205078125, 0.06585693359375, 0.0861053466796875, 0.106353759765625, 0.1266021728515625, 0.1468505859375, 0.1670989990234375, 0.187347412109375, 0.2075958251953125, 0.22784423828125, 0.2480926513671875, 0.268341064453125, 0.2885894775390625, 0.308837890625, 0.3290863037109375, 0.349334716796875, 0.3695831298828125, 0.38983154296875, 0.4100799560546875, 0.430328369140625, 0.4505767822265625, 0.4708251953125, 0.4910736083984375, 0.511322021484375, 0.5315704345703125, 0.55181884765625, 0.5720672607421875, 0.592315673828125, 0.6125640869140625, 0.6328125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 2.0, 9.0, 3.0, 17.0, 14.0, 21.0, 28.0, 49.0, 51.0, 77.0, 87.0, 101.0, 104.0, 101.0, 84.0, 64.0, 64.0, 42.0, 20.0, 27.0, 12.0, 11.0, 5.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.50927734375, -0.4863739013671875, -0.463470458984375, -0.4405670166015625, -0.41766357421875, -0.3947601318359375, -0.371856689453125, -0.3489532470703125, -0.3260498046875, -0.3031463623046875, -0.280242919921875, -0.2573394775390625, -0.23443603515625, -0.2115325927734375, -0.188629150390625, -0.1657257080078125, -0.142822265625, -0.1199188232421875, -0.097015380859375, -0.0741119384765625, -0.05120849609375, -0.0283050537109375, -0.005401611328125, 0.0175018310546875, 0.0404052734375, 0.0633087158203125, 0.086212158203125, 0.1091156005859375, 0.13201904296875, 0.1549224853515625, 0.177825927734375, 0.2007293701171875, 0.2236328125, 0.2465362548828125, 0.269439697265625, 0.2923431396484375, 0.31524658203125, 0.3381500244140625, 0.361053466796875, 0.3839569091796875, 0.4068603515625, 0.4297637939453125, 0.452667236328125, 0.4755706787109375, 0.49847412109375, 0.5213775634765625, 0.544281005859375, 0.5671844482421875, 0.590087890625, 0.6129913330078125, 0.635894775390625, 0.6587982177734375, 0.68170166015625, 0.7046051025390625, 0.727508544921875, 0.7504119873046875, 0.7733154296875, 0.7962188720703125, 0.819122314453125, 0.8420257568359375, 0.86492919921875, 0.8878326416015625, 0.910736083984375, 0.9336395263671875, 0.95654296875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 11.0, 17.0, 32.0, 59.0, 128.0, 205.0, 236.0, 166.0, 68.0, 33.0, 10.0, 10.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.92164421081543, -11.593828201293945, -11.266013145446777, -10.938197135925293, -10.610382080078125, -10.28256607055664, -9.954751014709473, -9.626935005187988, -9.29911994934082, -8.971303939819336, -8.643488883972168, -8.315672874450684, -7.987857818603516, -7.660041809082031, -7.332226276397705, -7.004410743713379, -6.6765947341918945, -6.348779201507568, -6.020963668823242, -5.693148136138916, -5.36533260345459, -5.0375165939331055, -4.709701061248779, -4.381885528564453, -4.054069995880127, -3.726254463195801, -3.3984389305114746, -3.0706231594085693, -2.742807626724243, -2.414992094039917, -2.0871763229370117, -1.7593607902526855, -1.431544303894043, -1.1037287712097168, -0.7759131193161011, -0.4480975270271301, -0.12028193473815918, 0.207533597946167, 0.5353492498397827, 0.8631649017333984, 1.1909804344177246, 1.5187959671020508, 1.8466116189956665, 2.1744272708892822, 2.5022428035736084, 2.8300583362579346, 3.15787410736084, 3.485689640045166, 3.813505172729492, 4.141320705413818, 4.4691362380981445, 4.796951770782471, 5.124767303466797, 5.452583312988281, 5.780398845672607, 6.108214378356934, 6.43602991104126, 6.763845443725586, 7.091660976409912, 7.419476509094238, 7.747292518615723, 8.07510757446289, 8.402923583984375, 8.73073959350586, 9.058554649353027]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 2.0, 2.0, 9.0, 4.0, 7.0, 14.0, 12.0, 17.0, 19.0, 24.0, 29.0, 21.0, 28.0, 26.0, 39.0, 46.0, 35.0, 50.0, 51.0, 65.0, 50.0, 40.0, 50.0, 48.0, 48.0, 44.0, 35.0, 32.0, 29.0, 19.0, 19.0, 20.0, 16.0, 14.0, 10.0, 7.0, 5.0, 4.0, 4.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.315830230712891, -6.0874199867248535, -5.859009742736816, -5.6305999755859375, -5.4021897315979, -5.173779487609863, -4.945369720458984, -4.716959476470947, -4.48854923248291, -4.260138988494873, -4.031728744506836, -3.803318977355957, -3.57490873336792, -3.346498489379883, -3.118088483810425, -2.889678478240967, -2.6612682342529297, -2.4328579902648926, -2.2044479846954346, -1.976037859916687, -1.7476277351379395, -1.519217610359192, -1.2908074855804443, -1.0623973608016968, -0.8339872360229492, -0.6055771112442017, -0.3771669864654541, -0.14875686168670654, 0.07965326309204102, 0.3080633878707886, 0.5364735126495361, 0.7648836374282837, 0.9932937622070312, 1.2217038869857788, 1.4501140117645264, 1.678524136543274, 1.9069342613220215, 2.1353445053100586, 2.3637545108795166, 2.5921645164489746, 2.8205747604370117, 3.048985004425049, 3.277395009994507, 3.505805015563965, 3.734215259552002, 3.962625503540039, 4.191035270690918, 4.419445514678955, 4.647855758666992, 4.876266002655029, 5.104676246643066, 5.333086013793945, 5.561496257781982, 5.7899065017700195, 6.018316268920898, 6.2467265129089355, 6.475136756896973, 6.70354700088501, 6.931957244873047, 7.160367012023926, 7.388777256011963, 7.6171875, 7.845597267150879, 8.074007987976074, 8.302417755126953]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 6.0, 1.0, 6.0, 11.0, 12.0, 17.0, 31.0, 30.0, 41.0, 65.0, 102.0, 160.0, 252.0, 652.0, 3046.0, 79145.0, 4073853.0, 33457.0, 2217.0, 500.0, 231.0, 127.0, 81.0, 59.0, 42.0, 35.0, 30.0, 18.0, 15.0, 10.0, 9.0, 10.0, 6.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.06640625, -2.002655029296875, -1.93890380859375, -1.875152587890625, -1.8114013671875, -1.747650146484375, -1.68389892578125, -1.620147705078125, -1.556396484375, -1.492645263671875, -1.42889404296875, -1.365142822265625, -1.3013916015625, -1.237640380859375, -1.17388916015625, -1.110137939453125, -1.04638671875, -0.982635498046875, -0.91888427734375, -0.855133056640625, -0.7913818359375, -0.727630615234375, -0.66387939453125, -0.600128173828125, -0.536376953125, -0.472625732421875, -0.40887451171875, -0.345123291015625, -0.2813720703125, -0.217620849609375, -0.15386962890625, -0.090118408203125, -0.0263671875, 0.037384033203125, 0.10113525390625, 0.164886474609375, 0.2286376953125, 0.292388916015625, 0.35614013671875, 0.419891357421875, 0.483642578125, 0.547393798828125, 0.61114501953125, 0.674896240234375, 0.7386474609375, 0.802398681640625, 0.86614990234375, 0.929901123046875, 0.99365234375, 1.057403564453125, 1.12115478515625, 1.184906005859375, 1.2486572265625, 1.312408447265625, 1.37615966796875, 1.439910888671875, 1.503662109375, 1.567413330078125, 1.63116455078125, 1.694915771484375, 1.7586669921875, 1.822418212890625, 1.88616943359375, 1.949920654296875, 2.013671875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 3.0, 6.0, 7.0, 9.0, 8.0, 14.0, 23.0, 25.0, 33.0, 44.0, 43.0, 58.0, 54.0, 37.0, 64.0, 60.0, 59.0, 64.0, 45.0, 57.0, 49.0, 47.0, 41.0, 34.0, 21.0, 23.0, 21.0, 17.0, 13.0, 6.0, 6.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6201171875, -0.6028976440429688, -0.5856781005859375, -0.5684585571289062, -0.551239013671875, -0.5340194702148438, -0.5167999267578125, -0.49958038330078125, -0.48236083984375, -0.46514129638671875, -0.4479217529296875, -0.43070220947265625, -0.413482666015625, -0.39626312255859375, -0.3790435791015625, -0.36182403564453125, -0.3446044921875, -0.32738494873046875, -0.3101654052734375, -0.29294586181640625, -0.275726318359375, -0.25850677490234375, -0.2412872314453125, -0.22406768798828125, -0.20684814453125, -0.18962860107421875, -0.1724090576171875, -0.15518951416015625, -0.137969970703125, -0.12075042724609375, -0.1035308837890625, -0.08631134033203125, -0.069091796875, -0.05187225341796875, -0.0346527099609375, -0.01743316650390625, -0.000213623046875, 0.01700592041015625, 0.0342254638671875, 0.05144500732421875, 0.06866455078125, 0.08588409423828125, 0.1031036376953125, 0.12032318115234375, 0.137542724609375, 0.15476226806640625, 0.1719818115234375, 0.18920135498046875, 0.2064208984375, 0.22364044189453125, 0.2408599853515625, 0.25807952880859375, 0.275299072265625, 0.29251861572265625, 0.3097381591796875, 0.32695770263671875, 0.34417724609375, 0.36139678955078125, 0.3786163330078125, 0.39583587646484375, 0.413055419921875, 0.43027496337890625, 0.4474945068359375, 0.46471405029296875, 0.48193359375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 7.0, 12.0, 23.0, 31.0, 74.0, 128.0, 372.0, 992.0, 3720.0, 30576.0, 2242693.0, 1881489.0, 28437.0, 3745.0, 1126.0, 432.0, 195.0, 117.0, 50.0, 28.0, 17.0, 7.0, 6.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0341796875, -0.9927825927734375, -0.951385498046875, -0.9099884033203125, -0.86859130859375, -0.8271942138671875, -0.785797119140625, -0.7444000244140625, -0.7030029296875, -0.6616058349609375, -0.620208740234375, -0.5788116455078125, -0.53741455078125, -0.4960174560546875, -0.454620361328125, -0.4132232666015625, -0.371826171875, -0.3304290771484375, -0.289031982421875, -0.2476348876953125, -0.20623779296875, -0.1648406982421875, -0.123443603515625, -0.0820465087890625, -0.0406494140625, 0.0007476806640625, 0.042144775390625, 0.0835418701171875, 0.12493896484375, 0.1663360595703125, 0.207733154296875, 0.2491302490234375, 0.29052734375, 0.3319244384765625, 0.373321533203125, 0.4147186279296875, 0.45611572265625, 0.4975128173828125, 0.538909912109375, 0.5803070068359375, 0.6217041015625, 0.6631011962890625, 0.704498291015625, 0.7458953857421875, 0.78729248046875, 0.8286895751953125, 0.870086669921875, 0.9114837646484375, 0.952880859375, 0.9942779541015625, 1.035675048828125, 1.0770721435546875, 1.11846923828125, 1.1598663330078125, 1.201263427734375, 1.2426605224609375, 1.2840576171875, 1.3254547119140625, 1.366851806640625, 1.4082489013671875, 1.44964599609375, 1.4910430908203125, 1.532440185546875, 1.5738372802734375, 1.615234375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 1.0, 14.0, 10.0, 20.0, 29.0, 44.0, 83.0, 143.0, 297.0, 470.0, 853.0, 849.0, 528.0, 345.0, 148.0, 74.0, 49.0, 29.0, 20.0, 16.0, 12.0, 10.0, 5.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.67529296875, -0.6483535766601562, -0.6214141845703125, -0.5944747924804688, -0.567535400390625, -0.5405960083007812, -0.5136566162109375, -0.48671722412109375, -0.45977783203125, -0.43283843994140625, -0.4058990478515625, -0.37895965576171875, -0.352020263671875, -0.32508087158203125, -0.2981414794921875, -0.27120208740234375, -0.2442626953125, -0.21732330322265625, -0.1903839111328125, -0.16344451904296875, -0.136505126953125, -0.10956573486328125, -0.0826263427734375, -0.05568695068359375, -0.02874755859375, -0.00180816650390625, 0.0251312255859375, 0.05207061767578125, 0.079010009765625, 0.10594940185546875, 0.1328887939453125, 0.15982818603515625, 0.186767578125, 0.21370697021484375, 0.2406463623046875, 0.26758575439453125, 0.294525146484375, 0.32146453857421875, 0.3484039306640625, 0.37534332275390625, 0.40228271484375, 0.42922210693359375, 0.4561614990234375, 0.48310089111328125, 0.510040283203125, 0.5369796752929688, 0.5639190673828125, 0.5908584594726562, 0.6177978515625, 0.6447372436523438, 0.6716766357421875, 0.6986160278320312, 0.725555419921875, 0.7524948120117188, 0.7794342041015625, 0.8063735961914062, 0.83331298828125, 0.8602523803710938, 0.8871917724609375, 0.9141311645507812, 0.941070556640625, 0.9680099487304688, 0.9949493408203125, 1.0218887329101562, 1.048828125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 9.0, 13.0, 46.0, 138.0, 298.0, 261.0, 139.0, 51.0, 18.0, 9.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.177643775939941, -10.840587615966797, -10.503532409667969, -10.166476249694824, -9.829421043395996, -9.492364883422852, -9.155309677124023, -8.818253517150879, -8.481197357177734, -8.14414119720459, -7.807085990905762, -7.470029830932617, -7.132974624633789, -6.7959184646606445, -6.458862781524658, -6.121807098388672, -5.784751892089844, -5.447696208953857, -5.110640525817871, -4.773584365844727, -4.436529159545898, -4.099472999572754, -3.7624173164367676, -3.4253616333007812, -3.088305950164795, -2.7512502670288086, -2.4141945838928223, -2.077138662338257, -1.7400829792022705, -1.4030272960662842, -1.0659713745117188, -0.7289156913757324, -0.3918609619140625, -0.054805219173431396, 0.2822505235671997, 0.6193063259124756, 0.9563620090484619, 1.2934176921844482, 1.6304736137390137, 1.967529296875, 2.3045849800109863, 2.6416406631469727, 2.978696346282959, 3.3157522678375244, 3.6528079509735107, 3.989863634109497, 4.3269195556640625, 4.663975238800049, 5.001030921936035, 5.3380866050720215, 5.675142288208008, 6.012198448181152, 6.3492536544799805, 6.686309814453125, 7.023365497589111, 7.360421180725098, 7.697476863861084, 8.03453254699707, 8.371588706970215, 8.708643913269043, 9.045700073242188, 9.382755279541016, 9.71981143951416, 10.056867599487305, 10.393922805786133]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 7.0, 9.0, 8.0, 10.0, 11.0, 15.0, 18.0, 19.0, 25.0, 38.0, 31.0, 50.0, 35.0, 49.0, 58.0, 63.0, 51.0, 51.0, 59.0, 50.0, 43.0, 59.0, 36.0, 40.0, 23.0, 29.0, 17.0, 24.0, 17.0, 13.0, 10.0, 12.0, 5.0, 4.0, 4.0, 1.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3171606063842773, -3.198147773742676, -3.079134941101074, -2.9601221084594727, -2.841109275817871, -2.7220964431762695, -2.603083372116089, -2.4840705394744873, -2.3650577068328857, -2.246044874191284, -2.1270320415496826, -2.008019208908081, -1.88900625705719, -1.7699934244155884, -1.6509804725646973, -1.5319676399230957, -1.4129548072814941, -1.2939419746398926, -1.174929141998291, -1.0559161901474, -0.9369033575057983, -0.8178905248641968, -0.6988776326179504, -0.5798647403717041, -0.46085190773010254, -0.3418390452861786, -0.22282618284225464, -0.10381332039833069, 0.015199542045593262, 0.13421237468719482, 0.25322526693344116, 0.3722381591796875, 0.49125099182128906, 0.6102638244628906, 0.729276716709137, 0.8482896089553833, 0.9673024415969849, 1.0863152742385864, 1.2053282260894775, 1.324341058731079, 1.4433538913726807, 1.5623667240142822, 1.6813795566558838, 1.800392508506775, 1.9194053411483765, 2.0384182929992676, 2.157431125640869, 2.2764439582824707, 2.3954567909240723, 2.514469623565674, 2.6334824562072754, 2.752495288848877, 2.8715081214904785, 2.99052095413208, 3.1095340251922607, 3.2285468578338623, 3.347559690475464, 3.4665725231170654, 3.585585355758667, 3.7045981884002686, 3.823611259460449, 3.942624092102051, 4.061636924743652, 4.180649757385254, 4.2996625900268555]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 8.0, 14.0, 22.0, 23.0, 48.0, 72.0, 122.0, 180.0, 288.0, 500.0, 884.0, 1531.0, 3061.0, 6115.0, 12971.0, 28954.0, 69718.0, 184203.0, 372254.0, 221355.0, 82687.0, 33937.0, 14899.0, 7006.0, 3490.0, 1775.0, 1022.0, 531.0, 333.0, 200.0, 118.0, 73.0, 54.0, 43.0, 27.0, 14.0, 7.0, 10.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5146484375, -0.49782562255859375, -0.4810028076171875, -0.46417999267578125, -0.447357177734375, -0.43053436279296875, -0.4137115478515625, -0.39688873291015625, -0.38006591796875, -0.36324310302734375, -0.3464202880859375, -0.32959747314453125, -0.312774658203125, -0.29595184326171875, -0.2791290283203125, -0.26230621337890625, -0.2454833984375, -0.22866058349609375, -0.2118377685546875, -0.19501495361328125, -0.178192138671875, -0.16136932373046875, -0.1445465087890625, -0.12772369384765625, -0.11090087890625, -0.09407806396484375, -0.0772552490234375, -0.06043243408203125, -0.043609619140625, -0.02678680419921875, -0.0099639892578125, 0.00685882568359375, 0.023681640625, 0.04050445556640625, 0.0573272705078125, 0.07415008544921875, 0.090972900390625, 0.10779571533203125, 0.1246185302734375, 0.14144134521484375, 0.15826416015625, 0.17508697509765625, 0.1919097900390625, 0.20873260498046875, 0.225555419921875, 0.24237823486328125, 0.2592010498046875, 0.27602386474609375, 0.2928466796875, 0.30966949462890625, 0.3264923095703125, 0.34331512451171875, 0.360137939453125, 0.37696075439453125, 0.3937835693359375, 0.41060638427734375, 0.42742919921875, 0.44425201416015625, 0.4610748291015625, 0.47789764404296875, 0.494720458984375, 0.5115432739257812, 0.5283660888671875, 0.5451889038085938, 0.56201171875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 5.0, 6.0, 12.0, 9.0, 13.0, 22.0, 23.0, 35.0, 39.0, 42.0, 42.0, 47.0, 60.0, 59.0, 51.0, 56.0, 61.0, 59.0, 49.0, 45.0, 42.0, 39.0, 36.0, 28.0, 22.0, 14.0, 24.0, 17.0, 13.0, 10.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.65234375, -0.6361732482910156, -0.6200027465820312, -0.6038322448730469, -0.5876617431640625, -0.5714912414550781, -0.5553207397460938, -0.5391502380371094, -0.522979736328125, -0.5068092346191406, -0.49063873291015625, -0.4744682312011719, -0.4582977294921875, -0.4421272277832031, -0.42595672607421875, -0.4097862243652344, -0.39361572265625, -0.3774452209472656, -0.36127471923828125, -0.3451042175292969, -0.3289337158203125, -0.3127632141113281, -0.29659271240234375, -0.2804222106933594, -0.264251708984375, -0.24808120727539062, -0.23191070556640625, -0.21574020385742188, -0.1995697021484375, -0.18339920043945312, -0.16722869873046875, -0.15105819702148438, -0.1348876953125, -0.11871719360351562, -0.10254669189453125, -0.08637619018554688, -0.0702056884765625, -0.054035186767578125, -0.03786468505859375, -0.021694183349609375, -0.005523681640625, 0.010646820068359375, 0.02681732177734375, 0.042987823486328125, 0.0591583251953125, 0.07532882690429688, 0.09149932861328125, 0.10766983032226562, 0.12384033203125, 0.14001083374023438, 0.15618133544921875, 0.17235183715820312, 0.1885223388671875, 0.20469284057617188, 0.22086334228515625, 0.23703384399414062, 0.253204345703125, 0.2693748474121094, 0.28554534912109375, 0.3017158508300781, 0.3178863525390625, 0.3340568542480469, 0.35022735595703125, 0.3663978576660156, 0.382568359375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 3.0, 3.0, 4.0, 3.0, 9.0, 5.0, 10.0, 16.0, 14.0, 25.0, 42.0, 63.0, 123.0, 236.0, 420.0, 939.0, 3167.0, 18487.0, 228553.0, 732422.0, 54635.0, 6549.0, 1515.0, 565.0, 328.0, 147.0, 78.0, 46.0, 30.0, 35.0, 24.0, 20.0, 4.0, 9.0, 4.0, 9.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.412109375, -1.3654022216796875, -1.318695068359375, -1.2719879150390625, -1.22528076171875, -1.1785736083984375, -1.131866455078125, -1.0851593017578125, -1.0384521484375, -0.9917449951171875, -0.945037841796875, -0.8983306884765625, -0.85162353515625, -0.8049163818359375, -0.758209228515625, -0.7115020751953125, -0.664794921875, -0.6180877685546875, -0.571380615234375, -0.5246734619140625, -0.47796630859375, -0.4312591552734375, -0.384552001953125, -0.3378448486328125, -0.2911376953125, -0.2444305419921875, -0.197723388671875, -0.1510162353515625, -0.10430908203125, -0.0576019287109375, -0.010894775390625, 0.0358123779296875, 0.08251953125, 0.1292266845703125, 0.175933837890625, 0.2226409912109375, 0.26934814453125, 0.3160552978515625, 0.362762451171875, 0.4094696044921875, 0.4561767578125, 0.5028839111328125, 0.549591064453125, 0.5962982177734375, 0.64300537109375, 0.6897125244140625, 0.736419677734375, 0.7831268310546875, 0.829833984375, 0.8765411376953125, 0.923248291015625, 0.9699554443359375, 1.01666259765625, 1.0633697509765625, 1.110076904296875, 1.1567840576171875, 1.2034912109375, 1.2501983642578125, 1.296905517578125, 1.3436126708984375, 1.39031982421875, 1.4370269775390625, 1.483734130859375, 1.5304412841796875, 1.5771484375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 7.0, 7.0, 7.0, 13.0, 12.0, 15.0, 24.0, 16.0, 25.0, 27.0, 39.0, 41.0, 44.0, 49.0, 54.0, 34.0, 52.0, 60.0, 59.0, 56.0, 41.0, 36.0, 40.0, 38.0, 39.0, 29.0, 28.0, 21.0, 16.0, 12.0, 7.0, 15.0, 5.0, 9.0, 8.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4267578125, -1.3730926513671875, -1.319427490234375, -1.2657623291015625, -1.21209716796875, -1.1584320068359375, -1.104766845703125, -1.0511016845703125, -0.9974365234375, -0.9437713623046875, -0.890106201171875, -0.8364410400390625, -0.78277587890625, -0.7291107177734375, -0.675445556640625, -0.6217803955078125, -0.568115234375, -0.5144500732421875, -0.460784912109375, -0.4071197509765625, -0.35345458984375, -0.2997894287109375, -0.246124267578125, -0.1924591064453125, -0.1387939453125, -0.0851287841796875, -0.031463623046875, 0.0222015380859375, 0.07586669921875, 0.1295318603515625, 0.183197021484375, 0.2368621826171875, 0.29052734375, 0.3441925048828125, 0.397857666015625, 0.4515228271484375, 0.50518798828125, 0.5588531494140625, 0.612518310546875, 0.6661834716796875, 0.7198486328125, 0.7735137939453125, 0.827178955078125, 0.8808441162109375, 0.93450927734375, 0.9881744384765625, 1.041839599609375, 1.0955047607421875, 1.149169921875, 1.2028350830078125, 1.256500244140625, 1.3101654052734375, 1.36383056640625, 1.4174957275390625, 1.471160888671875, 1.5248260498046875, 1.5784912109375, 1.6321563720703125, 1.685821533203125, 1.7394866943359375, 1.79315185546875, 1.8468170166015625, 1.900482177734375, 1.9541473388671875, 2.0078125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 4.0, 11.0, 8.0, 15.0, 18.0, 48.0, 80.0, 144.0, 295.0, 841.0, 3295.0, 25581.0, 689530.0, 308666.0, 16322.0, 2457.0, 673.0, 244.0, 128.0, 70.0, 38.0, 18.0, 17.0, 10.0, 7.0, 6.0, 6.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80126953125, -0.77691650390625, -0.7525634765625, -0.72821044921875, -0.703857421875, -0.67950439453125, -0.6551513671875, -0.63079833984375, -0.6064453125, -0.58209228515625, -0.5577392578125, -0.53338623046875, -0.509033203125, -0.48468017578125, -0.4603271484375, -0.43597412109375, -0.41162109375, -0.38726806640625, -0.3629150390625, -0.33856201171875, -0.314208984375, -0.28985595703125, -0.2655029296875, -0.24114990234375, -0.216796875, -0.19244384765625, -0.1680908203125, -0.14373779296875, -0.119384765625, -0.09503173828125, -0.0706787109375, -0.04632568359375, -0.02197265625, 0.00238037109375, 0.0267333984375, 0.05108642578125, 0.075439453125, 0.09979248046875, 0.1241455078125, 0.14849853515625, 0.1728515625, 0.19720458984375, 0.2215576171875, 0.24591064453125, 0.270263671875, 0.29461669921875, 0.3189697265625, 0.34332275390625, 0.36767578125, 0.39202880859375, 0.4163818359375, 0.44073486328125, 0.465087890625, 0.48944091796875, 0.5137939453125, 0.53814697265625, 0.5625, 0.58685302734375, 0.6112060546875, 0.63555908203125, 0.659912109375, 0.68426513671875, 0.7086181640625, 0.73297119140625, 0.75732421875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 4.0, 4.0, 2.0, 4.0, 2.0, 5.0, 5.0, 10.0, 11.0, 8.0, 11.0, 19.0, 21.0, 31.0, 24.0, 47.0, 87.0, 101.0, 116.0, 133.0, 95.0, 59.0, 50.0, 32.0, 31.0, 14.0, 15.0, 7.0, 8.0, 4.0, 11.0, 7.0, 7.0, 0.0, 3.0, 4.0, 1.0, 2.0, 4.0, 0.0, 1.0, 3.0, 4.0, 0.0, 1.0, 2.0], "bins": [-0.00011610984802246094, -0.00011296756565570831, -0.00010982528328895569, -0.00010668300092220306, -0.00010354071855545044, -0.00010039843618869781, -9.725615382194519e-05, -9.411387145519257e-05, -9.097158908843994e-05, -8.782930672168732e-05, -8.468702435493469e-05, -8.154474198818207e-05, -7.840245962142944e-05, -7.526017725467682e-05, -7.21178948879242e-05, -6.897561252117157e-05, -6.583333015441895e-05, -6.269104778766632e-05, -5.9548765420913696e-05, -5.640648305416107e-05, -5.326420068740845e-05, -5.012191832065582e-05, -4.69796359539032e-05, -4.3837353587150574e-05, -4.069507122039795e-05, -3.7552788853645325e-05, -3.44105064868927e-05, -3.1268224120140076e-05, -2.812594175338745e-05, -2.4983659386634827e-05, -2.1841377019882202e-05, -1.8699094653129578e-05, -1.5556812286376953e-05, -1.2414529919624329e-05, -9.272247552871704e-06, -6.12996518611908e-06, -2.987682819366455e-06, 1.5459954738616943e-07, 3.296881914138794e-06, 6.4391642808914185e-06, 9.581446647644043e-06, 1.2723729014396667e-05, 1.5866011381149292e-05, 1.9008293747901917e-05, 2.215057611465454e-05, 2.5292858481407166e-05, 2.843514084815979e-05, 3.1577423214912415e-05, 3.471970558166504e-05, 3.7861987948417664e-05, 4.100427031517029e-05, 4.414655268192291e-05, 4.728883504867554e-05, 5.043111741542816e-05, 5.3573399782180786e-05, 5.671568214893341e-05, 5.9857964515686035e-05, 6.300024688243866e-05, 6.614252924919128e-05, 6.928481161594391e-05, 7.242709398269653e-05, 7.556937634944916e-05, 7.871165871620178e-05, 8.18539410829544e-05, 8.499622344970703e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 2.0, 12.0, 14.0, 15.0, 34.0, 74.0, 101.0, 222.0, 563.0, 1607.0, 8075.0, 81383.0, 883263.0, 63775.0, 6899.0, 1471.0, 540.0, 240.0, 111.0, 51.0, 39.0, 22.0, 21.0, 11.0, 4.0, 3.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61865234375, -0.5933609008789062, -0.5680694580078125, -0.5427780151367188, -0.517486572265625, -0.49219512939453125, -0.4669036865234375, -0.44161224365234375, -0.41632080078125, -0.39102935791015625, -0.3657379150390625, -0.34044647216796875, -0.315155029296875, -0.28986358642578125, -0.2645721435546875, -0.23928070068359375, -0.2139892578125, -0.18869781494140625, -0.1634063720703125, -0.13811492919921875, -0.112823486328125, -0.08753204345703125, -0.0622406005859375, -0.03694915771484375, -0.01165771484375, 0.01363372802734375, 0.0389251708984375, 0.06421661376953125, 0.089508056640625, 0.11479949951171875, 0.1400909423828125, 0.16538238525390625, 0.190673828125, 0.21596527099609375, 0.2412567138671875, 0.26654815673828125, 0.291839599609375, 0.31713104248046875, 0.3424224853515625, 0.36771392822265625, 0.39300537109375, 0.41829681396484375, 0.4435882568359375, 0.46887969970703125, 0.494171142578125, 0.5194625854492188, 0.5447540283203125, 0.5700454711914062, 0.5953369140625, 0.6206283569335938, 0.6459197998046875, 0.6712112426757812, 0.696502685546875, 0.7217941284179688, 0.7470855712890625, 0.7723770141601562, 0.79766845703125, 0.8229598999023438, 0.8482513427734375, 0.8735427856445312, 0.898834228515625, 0.9241256713867188, 0.9494171142578125, 0.9747085571289062, 1.0]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 8.0, 8.0, 19.0, 16.0, 23.0, 41.0, 67.0, 88.0, 117.0, 137.0, 116.0, 90.0, 89.0, 52.0, 43.0, 20.0, 8.0, 9.0, 8.0, 6.0, 7.0, 3.0, 5.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.421630859375, -0.4038124084472656, -0.38599395751953125, -0.3681755065917969, -0.3503570556640625, -0.3325386047363281, -0.31472015380859375, -0.2969017028808594, -0.279083251953125, -0.2612648010253906, -0.24344635009765625, -0.22562789916992188, -0.2078094482421875, -0.18999099731445312, -0.17217254638671875, -0.15435409545898438, -0.13653564453125, -0.11871719360351562, -0.10089874267578125, -0.08308029174804688, -0.0652618408203125, -0.047443389892578125, -0.02962493896484375, -0.011806488037109375, 0.006011962890625, 0.023830413818359375, 0.04164886474609375, 0.059467315673828125, 0.0772857666015625, 0.09510421752929688, 0.11292266845703125, 0.13074111938476562, 0.1485595703125, 0.16637802124023438, 0.18419647216796875, 0.20201492309570312, 0.2198333740234375, 0.23765182495117188, 0.25547027587890625, 0.2732887268066406, 0.291107177734375, 0.3089256286621094, 0.32674407958984375, 0.3445625305175781, 0.3623809814453125, 0.3801994323730469, 0.39801788330078125, 0.4158363342285156, 0.43365478515625, 0.4514732360839844, 0.46929168701171875, 0.4871101379394531, 0.5049285888671875, 0.5227470397949219, 0.5405654907226562, 0.5583839416503906, 0.576202392578125, 0.5940208435058594, 0.6118392944335938, 0.6296577453613281, 0.6474761962890625, 0.6652946472167969, 0.6831130981445312, 0.7009315490722656, 0.71875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 12.0, 14.0, 89.0, 280.0, 397.0, 142.0, 36.0, 17.0, 8.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.032573699951172, -19.49614143371582, -18.9597110748291, -18.42327880859375, -17.8868465423584, -17.350414276123047, -16.813983917236328, -16.277551651000977, -15.741120338439941, -15.204689025878906, -14.668256759643555, -14.13182544708252, -13.595394134521484, -13.058961868286133, -12.522530555725098, -11.986099243164062, -11.449666976928711, -10.913235664367676, -10.376803398132324, -9.840372085571289, -9.303939819335938, -8.767508506774902, -8.231077194213867, -7.694645404815674, -7.1582136154174805, -6.621781826019287, -6.085350036621094, -5.548918724060059, -5.012486934661865, -4.476055145263672, -3.9396235942840576, -3.4031920433044434, -2.8667612075805664, -2.330329418182373, -1.7938978672027588, -1.257466197013855, -0.7210345268249512, -0.1846027374267578, 0.35182881355285645, 0.8882603645324707, 1.424692153930664, 1.9611238241195679, 2.4975554943084717, 3.033987045288086, 3.5704188346862793, 4.106850624084473, 4.643281936645508, 5.179713726043701, 5.7161455154418945, 6.252577304840088, 6.789009094238281, 7.325440406799316, 7.86187219619751, 8.398303985595703, 8.934735298156738, 9.471166610717773, 10.007598876953125, 10.54403018951416, 11.080462455749512, 11.616893768310547, 12.153326034545898, 12.689757347106934, 13.226188659667969, 13.76262092590332, 14.299052238464355]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 8.0, 6.0, 1.0, 6.0, 3.0, 9.0, 11.0, 5.0, 5.0, 13.0, 8.0, 16.0, 25.0, 24.0, 25.0, 28.0, 43.0, 34.0, 46.0, 40.0, 50.0, 51.0, 60.0, 47.0, 54.0, 48.0, 44.0, 35.0, 39.0, 36.0, 16.0, 26.0, 32.0, 17.0, 15.0, 9.0, 18.0, 13.0, 10.0, 7.0, 5.0, 5.0, 2.0, 5.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0], "bins": [-6.710257053375244, -6.521196365356445, -6.332135200500488, -6.1430745124816895, -5.954013824462891, -5.764952659606934, -5.575891971588135, -5.386831283569336, -5.197770118713379, -5.00870943069458, -4.819648265838623, -4.630587577819824, -4.441526889801025, -4.252466201782227, -4.0634050369262695, -3.8743443489074707, -3.685283660888672, -3.496222734451294, -3.307162046432495, -3.118101119995117, -2.9290404319763184, -2.7399795055389404, -2.5509185791015625, -2.3618578910827637, -2.1727969646453857, -1.9837361574172974, -1.794675350189209, -1.605614423751831, -1.4165536165237427, -1.2274928092956543, -1.0384318828582764, -0.849371075630188, -0.6603102684020996, -0.47124943137168884, -0.2821885943412781, -0.09312772750854492, 0.09593307971954346, 0.28499388694763184, 0.47405481338500977, 0.6631156206130981, 0.8521764278411865, 1.041237235069275, 1.2302980422973633, 1.4193589687347412, 1.6084197759628296, 1.797480583190918, 1.986541509628296, 2.175602436065674, 2.3646631240844727, 2.5537240505218506, 2.7427847385406494, 2.9318456649780273, 3.120906352996826, 3.309967279434204, 3.499028205871582, 3.688088893890381, 3.877149820327759, 4.066210746765137, 4.2552714347839355, 4.444332122802734, 4.633393287658691, 4.82245397567749, 5.011514663696289, 5.200575828552246, 5.389636516571045]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 1.0, 4.0, 7.0, 7.0, 14.0, 21.0, 31.0, 47.0, 52.0, 78.0, 145.0, 215.0, 351.0, 643.0, 1310.0, 2514.0, 5503.0, 14138.0, 51626.0, 353395.0, 2263969.0, 1291574.0, 159183.0, 31421.0, 9842.0, 4029.0, 1872.0, 985.0, 524.0, 287.0, 180.0, 112.0, 64.0, 37.0, 26.0, 21.0, 10.0, 11.0, 11.0, 10.0, 3.0, 4.0, 6.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.548828125, -0.5335006713867188, -0.5181732177734375, -0.5028457641601562, -0.487518310546875, -0.47219085693359375, -0.4568634033203125, -0.44153594970703125, -0.42620849609375, -0.41088104248046875, -0.3955535888671875, -0.38022613525390625, -0.364898681640625, -0.34957122802734375, -0.3342437744140625, -0.31891632080078125, -0.3035888671875, -0.28826141357421875, -0.2729339599609375, -0.25760650634765625, -0.242279052734375, -0.22695159912109375, -0.2116241455078125, -0.19629669189453125, -0.18096923828125, -0.16564178466796875, -0.1503143310546875, -0.13498687744140625, -0.119659423828125, -0.10433197021484375, -0.0890045166015625, -0.07367706298828125, -0.058349609375, -0.04302215576171875, -0.0276947021484375, -0.01236724853515625, 0.002960205078125, 0.01828765869140625, 0.0336151123046875, 0.04894256591796875, 0.06427001953125, 0.07959747314453125, 0.0949249267578125, 0.11025238037109375, 0.125579833984375, 0.14090728759765625, 0.1562347412109375, 0.17156219482421875, 0.1868896484375, 0.20221710205078125, 0.2175445556640625, 0.23287200927734375, 0.248199462890625, 0.26352691650390625, 0.2788543701171875, 0.29418182373046875, 0.30950927734375, 0.32483673095703125, 0.3401641845703125, 0.35549163818359375, 0.370819091796875, 0.38614654541015625, 0.4014739990234375, 0.41680145263671875, 0.43212890625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 5.0, 9.0, 12.0, 6.0, 22.0, 17.0, 23.0, 35.0, 46.0, 50.0, 34.0, 56.0, 57.0, 47.0, 52.0, 55.0, 50.0, 68.0, 60.0, 42.0, 51.0, 48.0, 39.0, 26.0, 25.0, 14.0, 17.0, 9.0, 8.0, 7.0, 5.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.6025390625, -0.5871658325195312, -0.5717926025390625, -0.5564193725585938, -0.541046142578125, -0.5256729125976562, -0.5102996826171875, -0.49492645263671875, -0.47955322265625, -0.46417999267578125, -0.4488067626953125, -0.43343353271484375, -0.418060302734375, -0.40268707275390625, -0.3873138427734375, -0.37194061279296875, -0.3565673828125, -0.34119415283203125, -0.3258209228515625, -0.31044769287109375, -0.295074462890625, -0.27970123291015625, -0.2643280029296875, -0.24895477294921875, -0.23358154296875, -0.21820831298828125, -0.2028350830078125, -0.18746185302734375, -0.172088623046875, -0.15671539306640625, -0.1413421630859375, -0.12596893310546875, -0.110595703125, -0.09522247314453125, -0.0798492431640625, -0.06447601318359375, -0.049102783203125, -0.03372955322265625, -0.0183563232421875, -0.00298309326171875, 0.01239013671875, 0.02776336669921875, 0.0431365966796875, 0.05850982666015625, 0.073883056640625, 0.08925628662109375, 0.1046295166015625, 0.12000274658203125, 0.1353759765625, 0.15074920654296875, 0.1661224365234375, 0.18149566650390625, 0.196868896484375, 0.21224212646484375, 0.2276153564453125, 0.24298858642578125, 0.25836181640625, 0.27373504638671875, 0.2891082763671875, 0.30448150634765625, 0.319854736328125, 0.33522796630859375, 0.3506011962890625, 0.36597442626953125, 0.38134765625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 4.0, 8.0, 9.0, 18.0, 17.0, 28.0, 51.0, 106.0, 202.0, 429.0, 897.0, 2580.0, 10862.0, 96306.0, 3045544.0, 986102.0, 41825.0, 6350.0, 1640.0, 609.0, 319.0, 149.0, 73.0, 70.0, 28.0, 15.0, 15.0, 11.0, 5.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76416015625, -0.7320938110351562, -0.7000274658203125, -0.6679611206054688, -0.635894775390625, -0.6038284301757812, -0.5717620849609375, -0.5396957397460938, -0.50762939453125, -0.47556304931640625, -0.4434967041015625, -0.41143035888671875, -0.379364013671875, -0.34729766845703125, -0.3152313232421875, -0.28316497802734375, -0.2510986328125, -0.21903228759765625, -0.1869659423828125, -0.15489959716796875, -0.122833251953125, -0.09076690673828125, -0.0587005615234375, -0.02663421630859375, 0.00543212890625, 0.03749847412109375, 0.0695648193359375, 0.10163116455078125, 0.133697509765625, 0.16576385498046875, 0.1978302001953125, 0.22989654541015625, 0.261962890625, 0.29402923583984375, 0.3260955810546875, 0.35816192626953125, 0.390228271484375, 0.42229461669921875, 0.4543609619140625, 0.48642730712890625, 0.51849365234375, 0.5505599975585938, 0.5826263427734375, 0.6146926879882812, 0.646759033203125, 0.6788253784179688, 0.7108917236328125, 0.7429580688476562, 0.7750244140625, 0.8070907592773438, 0.8391571044921875, 0.8712234497070312, 0.903289794921875, 0.9353561401367188, 0.9674224853515625, 0.9994888305664062, 1.03155517578125, 1.0636215209960938, 1.0956878662109375, 1.1277542114257812, 1.159820556640625, 1.1918869018554688, 1.2239532470703125, 1.2560195922851562, 1.2880859375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 10.0, 9.0, 5.0, 18.0, 22.0, 43.0, 40.0, 78.0, 149.0, 210.0, 414.0, 711.0, 786.0, 600.0, 364.0, 229.0, 130.0, 86.0, 57.0, 38.0, 20.0, 15.0, 15.0, 8.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1044921875, -1.0749893188476562, -1.0454864501953125, -1.0159835815429688, -0.986480712890625, -0.9569778442382812, -0.9274749755859375, -0.8979721069335938, -0.86846923828125, -0.8389663696289062, -0.8094635009765625, -0.7799606323242188, -0.750457763671875, -0.7209548950195312, -0.6914520263671875, -0.6619491577148438, -0.6324462890625, -0.6029434204101562, -0.5734405517578125, -0.5439376831054688, -0.514434814453125, -0.48493194580078125, -0.4554290771484375, -0.42592620849609375, -0.39642333984375, -0.36692047119140625, -0.3374176025390625, -0.30791473388671875, -0.278411865234375, -0.24890899658203125, -0.2194061279296875, -0.18990325927734375, -0.160400390625, -0.13089752197265625, -0.1013946533203125, -0.07189178466796875, -0.042388916015625, -0.01288604736328125, 0.0166168212890625, 0.04611968994140625, 0.07562255859375, 0.10512542724609375, 0.1346282958984375, 0.16413116455078125, 0.193634033203125, 0.22313690185546875, 0.2526397705078125, 0.28214263916015625, 0.3116455078125, 0.34114837646484375, 0.3706512451171875, 0.40015411376953125, 0.429656982421875, 0.45915985107421875, 0.4886627197265625, 0.5181655883789062, 0.54766845703125, 0.5771713256835938, 0.6066741943359375, 0.6361770629882812, 0.665679931640625, 0.6951828002929688, 0.7246856689453125, 0.7541885375976562, 0.78369140625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 14.0, 26.0, 83.0, 246.0, 312.0, 190.0, 71.0, 29.0, 11.0, 8.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.921965599060059, -14.498946189880371, -14.075926780700684, -13.65290641784668, -13.229887008666992, -12.806867599487305, -12.383848190307617, -11.96082878112793, -11.537809371948242, -11.114789962768555, -10.691770553588867, -10.26875114440918, -9.845730781555176, -9.422711372375488, -8.9996919631958, -8.576672554016113, -8.15365219116211, -7.730632781982422, -7.307612895965576, -6.884593486785889, -6.461573600769043, -6.0385541915893555, -5.615534782409668, -5.1925153732299805, -4.769495487213135, -4.346476078033447, -3.9234561920166016, -3.500436782836914, -3.0774171352386475, -2.654397487640381, -2.2313780784606934, -1.8083584308624268, -1.3853378295898438, -0.9623182415962219, -0.5392986536026001, -0.11627912521362305, 0.30674052238464355, 0.7297601699829102, 1.1527795791625977, 1.5757992267608643, 1.9988188743591309, 2.4218385219573975, 2.844858169555664, 3.2678775787353516, 3.690897226333618, 4.113916873931885, 4.536936283111572, 4.959956169128418, 5.3829755783081055, 5.805994987487793, 6.229014873504639, 6.652034282684326, 7.075054168701172, 7.498073577880859, 7.921092987060547, 8.344112396240234, 8.767131805419922, 9.19015121459961, 9.613170623779297, 10.036190032958984, 10.459210395812988, 10.882229804992676, 11.305249214172363, 11.72826862335205, 12.151288986206055]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 5.0, 3.0, 8.0, 3.0, 10.0, 18.0, 11.0, 13.0, 30.0, 29.0, 34.0, 35.0, 50.0, 45.0, 50.0, 52.0, 59.0, 70.0, 69.0, 56.0, 58.0, 41.0, 38.0, 41.0, 33.0, 31.0, 19.0, 21.0, 10.0, 21.0, 3.0, 5.0, 8.0, 6.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.285148620605469, -4.1447529792785645, -4.004356861114502, -3.8639612197875977, -3.7235655784606934, -3.58316969871521, -3.4427738189697266, -3.3023781776428223, -3.161982297897339, -3.0215864181518555, -2.881190776824951, -2.7407948970794678, -2.6003990173339844, -2.46000337600708, -2.3196074962615967, -2.1792116165161133, -2.038815975189209, -1.8984202146530151, -1.7580244541168213, -1.617628574371338, -1.477232813835144, -1.3368370532989502, -1.1964411735534668, -1.056045413017273, -0.9156496524810791, -0.7752538919448853, -0.6348580718040466, -0.4944622814655304, -0.35406649112701416, -0.2136707305908203, -0.07327491044998169, 0.06712090969085693, 0.20751619338989258, 0.3479119837284088, 0.48830777406692505, 0.6287035942077637, 0.7690993547439575, 0.9094951152801514, 1.0498909950256348, 1.1902867555618286, 1.3306825160980225, 1.4710782766342163, 1.6114740371704102, 1.7518699169158936, 1.8922656774520874, 2.0326614379882812, 2.1730573177337646, 2.313453197479248, 2.4538488388061523, 2.5942447185516357, 2.73464035987854, 2.8750362396240234, 3.0154318809509277, 3.155827760696411, 3.2962236404418945, 3.436619281768799, 3.5770151615142822, 3.7174110412597656, 3.85780668258667, 3.9982025623321533, 4.138598442077637, 4.278994083404541, 4.419389724731445, 4.559785842895508, 4.700181484222412]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 7.0, 10.0, 19.0, 30.0, 32.0, 49.0, 82.0, 171.0, 218.0, 423.0, 731.0, 1378.0, 2866.0, 5958.0, 13283.0, 32065.0, 80700.0, 201898.0, 347859.0, 214095.0, 85935.0, 33903.0, 14283.0, 6262.0, 2865.0, 1550.0, 827.0, 411.0, 250.0, 155.0, 86.0, 51.0, 25.0, 27.0, 18.0, 11.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.56591796875, -0.549041748046875, -0.53216552734375, -0.515289306640625, -0.4984130859375, -0.481536865234375, -0.46466064453125, -0.447784423828125, -0.430908203125, -0.414031982421875, -0.39715576171875, -0.380279541015625, -0.3634033203125, -0.346527099609375, -0.32965087890625, -0.312774658203125, -0.2958984375, -0.279022216796875, -0.26214599609375, -0.245269775390625, -0.2283935546875, -0.211517333984375, -0.19464111328125, -0.177764892578125, -0.160888671875, -0.144012451171875, -0.12713623046875, -0.110260009765625, -0.0933837890625, -0.076507568359375, -0.05963134765625, -0.042755126953125, -0.02587890625, -0.009002685546875, 0.00787353515625, 0.024749755859375, 0.0416259765625, 0.058502197265625, 0.07537841796875, 0.092254638671875, 0.109130859375, 0.126007080078125, 0.14288330078125, 0.159759521484375, 0.1766357421875, 0.193511962890625, 0.21038818359375, 0.227264404296875, 0.244140625, 0.261016845703125, 0.27789306640625, 0.294769287109375, 0.3116455078125, 0.328521728515625, 0.34539794921875, 0.362274169921875, 0.379150390625, 0.396026611328125, 0.41290283203125, 0.429779052734375, 0.4466552734375, 0.463531494140625, 0.48040771484375, 0.497283935546875, 0.51416015625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 9.0, 11.0, 10.0, 17.0, 23.0, 34.0, 30.0, 33.0, 46.0, 47.0, 63.0, 51.0, 51.0, 65.0, 58.0, 47.0, 63.0, 56.0, 41.0, 47.0, 40.0, 24.0, 27.0, 35.0, 14.0, 13.0, 12.0, 10.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.57275390625, -0.5576858520507812, -0.5426177978515625, -0.5275497436523438, -0.512481689453125, -0.49741363525390625, -0.4823455810546875, -0.46727752685546875, -0.45220947265625, -0.43714141845703125, -0.4220733642578125, -0.40700531005859375, -0.391937255859375, -0.37686920166015625, -0.3618011474609375, -0.34673309326171875, -0.3316650390625, -0.31659698486328125, -0.3015289306640625, -0.28646087646484375, -0.271392822265625, -0.25632476806640625, -0.2412567138671875, -0.22618865966796875, -0.21112060546875, -0.19605255126953125, -0.1809844970703125, -0.16591644287109375, -0.150848388671875, -0.13578033447265625, -0.1207122802734375, -0.10564422607421875, -0.090576171875, -0.07550811767578125, -0.0604400634765625, -0.04537200927734375, -0.030303955078125, -0.01523590087890625, -0.0001678466796875, 0.01490020751953125, 0.02996826171875, 0.04503631591796875, 0.0601043701171875, 0.07517242431640625, 0.090240478515625, 0.10530853271484375, 0.1203765869140625, 0.13544464111328125, 0.1505126953125, 0.16558074951171875, 0.1806488037109375, 0.19571685791015625, 0.210784912109375, 0.22585296630859375, 0.2409210205078125, 0.25598907470703125, 0.27105712890625, 0.28612518310546875, 0.3011932373046875, 0.31626129150390625, 0.331329345703125, 0.34639739990234375, 0.3614654541015625, 0.37653350830078125, 0.3916015625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 10.0, 11.0, 11.0, 15.0, 14.0, 21.0, 35.0, 52.0, 76.0, 113.0, 150.0, 247.0, 316.0, 452.0, 790.0, 1329.0, 2529.0, 7094.0, 32089.0, 265435.0, 650220.0, 68101.0, 11570.0, 3527.0, 1628.0, 904.0, 586.0, 354.0, 244.0, 181.0, 133.0, 74.0, 63.0, 45.0, 32.0, 21.0, 22.0, 15.0, 13.0, 5.0, 9.0, 4.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1103515625, -1.0723114013671875, -1.034271240234375, -0.9962310791015625, -0.95819091796875, -0.9201507568359375, -0.882110595703125, -0.8440704345703125, -0.8060302734375, -0.7679901123046875, -0.729949951171875, -0.6919097900390625, -0.65386962890625, -0.6158294677734375, -0.577789306640625, -0.5397491455078125, -0.501708984375, -0.4636688232421875, -0.425628662109375, -0.3875885009765625, -0.34954833984375, -0.3115081787109375, -0.273468017578125, -0.2354278564453125, -0.1973876953125, -0.1593475341796875, -0.121307373046875, -0.0832672119140625, -0.04522705078125, -0.0071868896484375, 0.030853271484375, 0.0688934326171875, 0.10693359375, 0.1449737548828125, 0.183013916015625, 0.2210540771484375, 0.25909423828125, 0.2971343994140625, 0.335174560546875, 0.3732147216796875, 0.4112548828125, 0.4492950439453125, 0.487335205078125, 0.5253753662109375, 0.56341552734375, 0.6014556884765625, 0.639495849609375, 0.6775360107421875, 0.715576171875, 0.7536163330078125, 0.791656494140625, 0.8296966552734375, 0.86773681640625, 0.9057769775390625, 0.943817138671875, 0.9818572998046875, 1.0198974609375, 1.0579376220703125, 1.095977783203125, 1.1340179443359375, 1.17205810546875, 1.2100982666015625, 1.248138427734375, 1.2861785888671875, 1.32421875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 6.0, 8.0, 10.0, 20.0, 17.0, 28.0, 34.0, 33.0, 37.0, 52.0, 59.0, 50.0, 73.0, 64.0, 61.0, 44.0, 53.0, 56.0, 43.0, 55.0, 23.0, 35.0, 30.0, 28.0, 17.0, 14.0, 12.0, 13.0, 8.0, 5.0, 5.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.10546875, -2.033660888671875, -1.96185302734375, -1.890045166015625, -1.8182373046875, -1.746429443359375, -1.67462158203125, -1.602813720703125, -1.531005859375, -1.459197998046875, -1.38739013671875, -1.315582275390625, -1.2437744140625, -1.171966552734375, -1.10015869140625, -1.028350830078125, -0.95654296875, -0.884735107421875, -0.81292724609375, -0.741119384765625, -0.6693115234375, -0.597503662109375, -0.52569580078125, -0.453887939453125, -0.382080078125, -0.310272216796875, -0.23846435546875, -0.166656494140625, -0.0948486328125, -0.023040771484375, 0.04876708984375, 0.120574951171875, 0.1923828125, 0.264190673828125, 0.33599853515625, 0.407806396484375, 0.4796142578125, 0.551422119140625, 0.62322998046875, 0.695037841796875, 0.766845703125, 0.838653564453125, 0.91046142578125, 0.982269287109375, 1.0540771484375, 1.125885009765625, 1.19769287109375, 1.269500732421875, 1.34130859375, 1.413116455078125, 1.48492431640625, 1.556732177734375, 1.6285400390625, 1.700347900390625, 1.77215576171875, 1.843963623046875, 1.915771484375, 1.987579345703125, 2.05938720703125, 2.131195068359375, 2.2030029296875, 2.274810791015625, 2.34661865234375, 2.418426513671875, 2.490234375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 6.0, 4.0, 13.0, 11.0, 7.0, 18.0, 27.0, 29.0, 61.0, 90.0, 136.0, 190.0, 304.0, 475.0, 888.0, 1810.0, 4485.0, 13878.0, 58552.0, 492170.0, 396822.0, 56380.0, 13699.0, 4442.0, 1779.0, 836.0, 512.0, 290.0, 184.0, 117.0, 103.0, 67.0, 47.0, 34.0, 28.0, 17.0, 12.0, 7.0, 9.0, 5.0, 7.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.448974609375, -0.4349403381347656, -0.42090606689453125, -0.4068717956542969, -0.3928375244140625, -0.3788032531738281, -0.36476898193359375, -0.3507347106933594, -0.336700439453125, -0.3226661682128906, -0.30863189697265625, -0.2945976257324219, -0.2805633544921875, -0.2665290832519531, -0.25249481201171875, -0.23846054077148438, -0.22442626953125, -0.21039199829101562, -0.19635772705078125, -0.18232345581054688, -0.1682891845703125, -0.15425491333007812, -0.14022064208984375, -0.12618637084960938, -0.112152099609375, -0.09811782836914062, -0.08408355712890625, -0.07004928588867188, -0.0560150146484375, -0.041980743408203125, -0.02794647216796875, -0.013912200927734375, 0.0001220703125, 0.014156341552734375, 0.02819061279296875, 0.042224884033203125, 0.0562591552734375, 0.07029342651367188, 0.08432769775390625, 0.09836196899414062, 0.112396240234375, 0.12643051147460938, 0.14046478271484375, 0.15449905395507812, 0.1685333251953125, 0.18256759643554688, 0.19660186767578125, 0.21063613891601562, 0.22467041015625, 0.23870468139648438, 0.25273895263671875, 0.2667732238769531, 0.2808074951171875, 0.2948417663574219, 0.30887603759765625, 0.3229103088378906, 0.336944580078125, 0.3509788513183594, 0.36501312255859375, 0.3790473937988281, 0.3930816650390625, 0.4071159362792969, 0.42115020751953125, 0.4351844787597656, 0.44921875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 8.0, 8.0, 4.0, 13.0, 5.0, 10.0, 19.0, 28.0, 27.0, 30.0, 28.0, 50.0, 58.0, 104.0, 108.0, 91.0, 80.0, 70.0, 38.0, 31.0, 33.0, 21.0, 21.0, 18.0, 24.0, 17.0, 11.0, 7.0, 5.0, 4.0, 4.0, 4.0, 4.0, 4.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00012624263763427734, -0.00012251082807779312, -0.0001187790185213089, -0.00011504720896482468, -0.00011131539940834045, -0.00010758358985185623, -0.00010385178029537201, -0.00010011997073888779, -9.638816118240356e-05, -9.265635162591934e-05, -8.892454206943512e-05, -8.51927325129509e-05, -8.146092295646667e-05, -7.772911339998245e-05, -7.399730384349823e-05, -7.026549428701401e-05, -6.653368473052979e-05, -6.280187517404556e-05, -5.907006561756134e-05, -5.533825606107712e-05, -5.1606446504592896e-05, -4.787463694810867e-05, -4.414282739162445e-05, -4.041101783514023e-05, -3.6679208278656006e-05, -3.2947398722171783e-05, -2.921558916568756e-05, -2.548377960920334e-05, -2.1751970052719116e-05, -1.8020160496234894e-05, -1.4288350939750671e-05, -1.0556541383266449e-05, -6.8247318267822266e-06, -3.092922270298004e-06, 6.388872861862183e-07, 4.370696842670441e-06, 8.102506399154663e-06, 1.1834315955638885e-05, 1.5566125512123108e-05, 1.929793506860733e-05, 2.3029744625091553e-05, 2.6761554181575775e-05, 3.0493363738059998e-05, 3.422517329454422e-05, 3.795698285102844e-05, 4.1688792407512665e-05, 4.542060196399689e-05, 4.915241152048111e-05, 5.288422107696533e-05, 5.6616030633449554e-05, 6.034784018993378e-05, 6.4079649746418e-05, 6.781145930290222e-05, 7.154326885938644e-05, 7.527507841587067e-05, 7.900688797235489e-05, 8.273869752883911e-05, 8.647050708532333e-05, 9.020231664180756e-05, 9.393412619829178e-05, 9.7665935754776e-05, 0.00010139774531126022, 0.00010512955486774445, 0.00010886136442422867, 0.00011259317398071289]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 8.0, 15.0, 17.0, 36.0, 33.0, 44.0, 60.0, 122.0, 159.0, 247.0, 387.0, 592.0, 1204.0, 2549.0, 6524.0, 23513.0, 135396.0, 744709.0, 102789.0, 19233.0, 5838.0, 2336.0, 1147.0, 572.0, 344.0, 227.0, 112.0, 115.0, 62.0, 46.0, 19.0, 18.0, 19.0, 17.0, 13.0, 4.0, 8.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58154296875, -0.56414794921875, -0.5467529296875, -0.52935791015625, -0.511962890625, -0.49456787109375, -0.4771728515625, -0.45977783203125, -0.4423828125, -0.42498779296875, -0.4075927734375, -0.39019775390625, -0.372802734375, -0.35540771484375, -0.3380126953125, -0.32061767578125, -0.30322265625, -0.28582763671875, -0.2684326171875, -0.25103759765625, -0.233642578125, -0.21624755859375, -0.1988525390625, -0.18145751953125, -0.1640625, -0.14666748046875, -0.1292724609375, -0.11187744140625, -0.094482421875, -0.07708740234375, -0.0596923828125, -0.04229736328125, -0.02490234375, -0.00750732421875, 0.0098876953125, 0.02728271484375, 0.044677734375, 0.06207275390625, 0.0794677734375, 0.09686279296875, 0.1142578125, 0.13165283203125, 0.1490478515625, 0.16644287109375, 0.183837890625, 0.20123291015625, 0.2186279296875, 0.23602294921875, 0.25341796875, 0.27081298828125, 0.2882080078125, 0.30560302734375, 0.322998046875, 0.34039306640625, 0.3577880859375, 0.37518310546875, 0.392578125, 0.40997314453125, 0.4273681640625, 0.44476318359375, 0.462158203125, 0.47955322265625, 0.4969482421875, 0.51434326171875, 0.53173828125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 3.0, 1.0, 6.0, 5.0, 6.0, 10.0, 10.0, 18.0, 23.0, 21.0, 29.0, 40.0, 48.0, 65.0, 98.0, 95.0, 117.0, 78.0, 66.0, 51.0, 46.0, 36.0, 37.0, 22.0, 17.0, 8.0, 17.0, 4.0, 5.0, 3.0, 4.0, 4.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5078125, -0.49289703369140625, -0.4779815673828125, -0.46306610107421875, -0.448150634765625, -0.43323516845703125, -0.4183197021484375, -0.40340423583984375, -0.38848876953125, -0.37357330322265625, -0.3586578369140625, -0.34374237060546875, -0.328826904296875, -0.31391143798828125, -0.2989959716796875, -0.28408050537109375, -0.2691650390625, -0.25424957275390625, -0.2393341064453125, -0.22441864013671875, -0.209503173828125, -0.19458770751953125, -0.1796722412109375, -0.16475677490234375, -0.14984130859375, -0.13492584228515625, -0.1200103759765625, -0.10509490966796875, -0.090179443359375, -0.07526397705078125, -0.0603485107421875, -0.04543304443359375, -0.030517578125, -0.01560211181640625, -0.0006866455078125, 0.01422882080078125, 0.029144287109375, 0.04405975341796875, 0.0589752197265625, 0.07389068603515625, 0.08880615234375, 0.10372161865234375, 0.1186370849609375, 0.13355255126953125, 0.148468017578125, 0.16338348388671875, 0.1782989501953125, 0.19321441650390625, 0.2081298828125, 0.22304534912109375, 0.2379608154296875, 0.25287628173828125, 0.267791748046875, 0.28270721435546875, 0.2976226806640625, 0.31253814697265625, 0.32745361328125, 0.34236907958984375, 0.3572845458984375, 0.37220001220703125, 0.387115478515625, 0.40203094482421875, 0.4169464111328125, 0.43186187744140625, 0.44677734375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 6.0, 7.0, 19.0, 81.0, 288.0, 380.0, 147.0, 38.0, 15.0, 8.0, 5.0, 1.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.554574966430664, -10.004039764404297, -9.45350456237793, -8.902968406677246, -8.352433204650879, -7.801898002624512, -7.251362323760986, -6.700826644897461, -6.150291442871094, -5.599756240844727, -5.049220561981201, -4.498684883117676, -3.9481496810913086, -3.3976142406463623, -2.847078800201416, -2.2965433597564697, -1.7460079193115234, -1.1954724788665771, -0.6449370384216309, -0.09440159797668457, 0.4561338424682617, 1.006669282913208, 1.5572047233581543, 2.1077401638031006, 2.658275604248047, 3.208811044692993, 3.7593464851379395, 4.309882164001465, 4.860417366027832, 5.410952568054199, 5.961488246917725, 6.51202392578125, 7.062559127807617, 7.613094329833984, 8.163629531860352, 8.714165687561035, 9.264700889587402, 9.81523609161377, 10.365772247314453, 10.91630744934082, 11.466842651367188, 12.017377853393555, 12.567913055419922, 13.118449211120605, 13.668984413146973, 14.21951961517334, 14.770055770874023, 15.32059097290039, 15.871126174926758, 16.421661376953125, 16.972196578979492, 17.52273178100586, 18.07326889038086, 18.623804092407227, 19.174339294433594, 19.72487449645996, 20.275409698486328, 20.825944900512695, 21.376480102539062, 21.92701530456543, 22.477550506591797, 23.028087615966797, 23.578622817993164, 24.12915802001953, 24.6796932220459]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 3.0, 3.0, 7.0, 12.0, 8.0, 18.0, 22.0, 17.0, 28.0, 26.0, 30.0, 28.0, 30.0, 43.0, 40.0, 64.0, 46.0, 60.0, 73.0, 55.0, 49.0, 37.0, 35.0, 34.0, 28.0, 35.0, 26.0, 23.0, 23.0, 23.0, 17.0, 13.0, 9.0, 3.0, 4.0, 10.0, 4.0, 2.0, 1.0, 5.0, 2.0, 0.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.155106544494629, -5.951432704925537, -5.747758865356445, -5.544084548950195, -5.3404107093811035, -5.136736869812012, -4.93306303024292, -4.729389190673828, -4.525714874267578, -4.322041034698486, -4.1183671951293945, -3.9146931171417236, -3.7110190391540527, -3.507345199584961, -3.303671360015869, -3.0999972820281982, -2.8963234424591064, -2.6926496028900146, -2.4889755249023438, -2.285301685333252, -2.081627607345581, -1.8779537677764893, -1.674279808998108, -1.4706058502197266, -1.2669318914413452, -1.0632579326629639, -0.8595839738845825, -0.655910074710846, -0.4522361159324646, -0.24856221675872803, -0.04488825798034668, 0.15878570079803467, 0.362459659576416, 0.5661336183547974, 0.7698075771331787, 0.9734814763069153, 1.1771554946899414, 1.3808293342590332, 1.5845032930374146, 1.788177251815796, 1.9918512105941772, 2.1955251693725586, 2.3991990089416504, 2.6028730869293213, 2.806546926498413, 3.010221004486084, 3.213894844055176, 3.4175686836242676, 3.6212427616119385, 3.8249166011810303, 4.028590679168701, 4.232264518737793, 4.435938358306885, 4.639612197875977, 4.843286514282227, 5.046960353851318, 5.25063419342041, 5.454308032989502, 5.657981872558594, 5.861656188964844, 6.0653300285339355, 6.269003868103027, 6.472677707672119, 6.676351547241211, 6.880025863647461]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 7.0, 9.0, 10.0, 19.0, 22.0, 31.0, 47.0, 39.0, 86.0, 167.0, 255.0, 479.0, 826.0, 1586.0, 3318.0, 9366.0, 41660.0, 392919.0, 2612980.0, 1004397.0, 97092.0, 18355.0, 5624.0, 2333.0, 1133.0, 618.0, 343.0, 197.0, 133.0, 67.0, 46.0, 33.0, 28.0, 12.0, 9.0, 5.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.45263671875, -0.4362945556640625, -0.419952392578125, -0.4036102294921875, -0.38726806640625, -0.3709259033203125, -0.354583740234375, -0.3382415771484375, -0.3218994140625, -0.3055572509765625, -0.289215087890625, -0.2728729248046875, -0.25653076171875, -0.2401885986328125, -0.223846435546875, -0.2075042724609375, -0.191162109375, -0.1748199462890625, -0.158477783203125, -0.1421356201171875, -0.12579345703125, -0.1094512939453125, -0.093109130859375, -0.0767669677734375, -0.0604248046875, -0.0440826416015625, -0.027740478515625, -0.0113983154296875, 0.00494384765625, 0.0212860107421875, 0.037628173828125, 0.0539703369140625, 0.0703125, 0.0866546630859375, 0.102996826171875, 0.1193389892578125, 0.13568115234375, 0.1520233154296875, 0.168365478515625, 0.1847076416015625, 0.2010498046875, 0.2173919677734375, 0.233734130859375, 0.2500762939453125, 0.26641845703125, 0.2827606201171875, 0.299102783203125, 0.3154449462890625, 0.331787109375, 0.3481292724609375, 0.364471435546875, 0.3808135986328125, 0.39715576171875, 0.4134979248046875, 0.429840087890625, 0.4461822509765625, 0.4625244140625, 0.4788665771484375, 0.495208740234375, 0.5115509033203125, 0.52789306640625, 0.5442352294921875, 0.560577392578125, 0.5769195556640625, 0.59326171875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 5.0, 11.0, 10.0, 12.0, 17.0, 20.0, 35.0, 28.0, 33.0, 36.0, 62.0, 50.0, 63.0, 51.0, 64.0, 52.0, 45.0, 60.0, 37.0, 59.0, 33.0, 33.0, 41.0, 15.0, 33.0, 26.0, 17.0, 17.0, 9.0, 9.0, 7.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5244140625, -0.50994873046875, -0.4954833984375, -0.48101806640625, -0.466552734375, -0.45208740234375, -0.4376220703125, -0.42315673828125, -0.40869140625, -0.39422607421875, -0.3797607421875, -0.36529541015625, -0.350830078125, -0.33636474609375, -0.3218994140625, -0.30743408203125, -0.29296875, -0.27850341796875, -0.2640380859375, -0.24957275390625, -0.235107421875, -0.22064208984375, -0.2061767578125, -0.19171142578125, -0.17724609375, -0.16278076171875, -0.1483154296875, -0.13385009765625, -0.119384765625, -0.10491943359375, -0.0904541015625, -0.07598876953125, -0.0615234375, -0.04705810546875, -0.0325927734375, -0.01812744140625, -0.003662109375, 0.01080322265625, 0.0252685546875, 0.03973388671875, 0.05419921875, 0.06866455078125, 0.0831298828125, 0.09759521484375, 0.112060546875, 0.12652587890625, 0.1409912109375, 0.15545654296875, 0.169921875, 0.18438720703125, 0.1988525390625, 0.21331787109375, 0.227783203125, 0.24224853515625, 0.2567138671875, 0.27117919921875, 0.28564453125, 0.30010986328125, 0.3145751953125, 0.32904052734375, 0.343505859375, 0.35797119140625, 0.3724365234375, 0.38690185546875, 0.4013671875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 12.0, 6.0, 10.0, 18.0, 17.0, 22.0, 35.0, 60.0, 59.0, 99.0, 189.0, 253.0, 503.0, 997.0, 2595.0, 10800.0, 91995.0, 3247505.0, 799848.0, 30432.0, 5268.0, 1754.0, 739.0, 403.0, 214.0, 123.0, 91.0, 65.0, 36.0, 35.0, 35.0, 13.0, 15.0, 12.0, 7.0, 7.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77001953125, -0.7389602661132812, -0.7079010009765625, -0.6768417358398438, -0.645782470703125, -0.6147232055664062, -0.5836639404296875, -0.5526046752929688, -0.52154541015625, -0.49048614501953125, -0.4594268798828125, -0.42836761474609375, -0.397308349609375, -0.36624908447265625, -0.3351898193359375, -0.30413055419921875, -0.2730712890625, -0.24201202392578125, -0.2109527587890625, -0.17989349365234375, -0.148834228515625, -0.11777496337890625, -0.0867156982421875, -0.05565643310546875, -0.02459716796875, 0.00646209716796875, 0.0375213623046875, 0.06858062744140625, 0.099639892578125, 0.13069915771484375, 0.1617584228515625, 0.19281768798828125, 0.223876953125, 0.25493621826171875, 0.2859954833984375, 0.31705474853515625, 0.348114013671875, 0.37917327880859375, 0.4102325439453125, 0.44129180908203125, 0.47235107421875, 0.5034103393554688, 0.5344696044921875, 0.5655288696289062, 0.596588134765625, 0.6276473999023438, 0.6587066650390625, 0.6897659301757812, 0.7208251953125, 0.7518844604492188, 0.7829437255859375, 0.8140029907226562, 0.845062255859375, 0.8761215209960938, 0.9071807861328125, 0.9382400512695312, 0.96929931640625, 1.0003585815429688, 1.0314178466796875, 1.0624771118164062, 1.093536376953125, 1.1245956420898438, 1.1556549072265625, 1.1867141723632812, 1.2177734375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 5.0, 4.0, 7.0, 12.0, 13.0, 10.0, 28.0, 50.0, 80.0, 134.0, 280.0, 563.0, 862.0, 825.0, 553.0, 314.0, 141.0, 76.0, 37.0, 27.0, 11.0, 15.0, 9.0, 7.0, 6.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.1279296875, -1.097503662109375, -1.06707763671875, -1.036651611328125, -1.0062255859375, -0.975799560546875, -0.94537353515625, -0.914947509765625, -0.884521484375, -0.854095458984375, -0.82366943359375, -0.793243408203125, -0.7628173828125, -0.732391357421875, -0.70196533203125, -0.671539306640625, -0.64111328125, -0.610687255859375, -0.58026123046875, -0.549835205078125, -0.5194091796875, -0.488983154296875, -0.45855712890625, -0.428131103515625, -0.397705078125, -0.367279052734375, -0.33685302734375, -0.306427001953125, -0.2760009765625, -0.245574951171875, -0.21514892578125, -0.184722900390625, -0.154296875, -0.123870849609375, -0.09344482421875, -0.063018798828125, -0.0325927734375, -0.002166748046875, 0.02825927734375, 0.058685302734375, 0.089111328125, 0.119537353515625, 0.14996337890625, 0.180389404296875, 0.2108154296875, 0.241241455078125, 0.27166748046875, 0.302093505859375, 0.33251953125, 0.362945556640625, 0.39337158203125, 0.423797607421875, 0.4542236328125, 0.484649658203125, 0.51507568359375, 0.545501708984375, 0.575927734375, 0.606353759765625, 0.63677978515625, 0.667205810546875, 0.6976318359375, 0.728057861328125, 0.75848388671875, 0.788909912109375, 0.8193359375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 5.0, 6.0, 17.0, 62.0, 164.0, 286.0, 257.0, 119.0, 48.0, 14.0, 7.0, 7.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.306276321411133, -18.91156578063965, -18.516855239868164, -18.12214469909668, -17.727434158325195, -17.33272361755371, -16.93801498413086, -16.543304443359375, -16.14859390258789, -15.753883361816406, -15.359172821044922, -14.964462280273438, -14.56975269317627, -14.175042152404785, -13.7803316116333, -13.385621070861816, -12.990909576416016, -12.596199035644531, -12.201488494873047, -11.806777954101562, -11.412068367004395, -11.01735782623291, -10.622647285461426, -10.227936744689941, -9.833227157592773, -9.438516616821289, -9.043806076049805, -8.64909553527832, -8.254385948181152, -7.859675407409668, -7.464964866638184, -7.070254325866699, -6.675543785095215, -6.2808332443237305, -5.886123180389404, -5.49141263961792, -5.0967020988464355, -4.701992034912109, -4.307281494140625, -3.9125709533691406, -3.5178606510162354, -3.12315034866333, -2.7284398078918457, -2.3337295055389404, -1.9390190839767456, -1.5443086624145508, -1.1495983600616455, -0.7548878192901611, -0.36017751693725586, 0.03453287482261658, 0.429243266582489, 0.8239536285400391, 1.2186640501022339, 1.6133744716644287, 2.008084774017334, 2.4027953147888184, 2.7975056171417236, 3.192215919494629, 3.5869264602661133, 3.9816367626190186, 4.376347064971924, 4.771057605743408, 5.165767669677734, 5.560478210449219, 5.955188751220703]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 7.0, 7.0, 11.0, 17.0, 20.0, 19.0, 32.0, 27.0, 32.0, 42.0, 36.0, 37.0, 39.0, 46.0, 45.0, 45.0, 51.0, 44.0, 52.0, 45.0, 53.0, 37.0, 37.0, 41.0, 27.0, 33.0, 17.0, 22.0, 7.0, 12.0, 11.0, 11.0, 13.0, 7.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.402264356613159, -3.2911269664764404, -3.179989814758301, -3.068852424621582, -2.9577150344848633, -2.8465776443481445, -2.735440492630005, -2.624303102493286, -2.5131659507751465, -2.4020285606384277, -2.290891408920288, -2.1797540187835693, -2.0686166286468506, -1.9574793577194214, -1.8463420867919922, -1.7352046966552734, -1.6240673065185547, -1.5129300355911255, -1.4017926454544067, -1.2906553745269775, -1.1795179843902588, -1.0683807134628296, -0.9572434425354004, -0.8461061120033264, -0.7349687814712524, -0.6238314509391785, -0.5126941204071045, -0.4015568494796753, -0.2904195189476013, -0.17928218841552734, -0.06814491748809814, 0.04299241304397583, 0.1541297435760498, 0.2652670741081238, 0.37640437483787537, 0.48754167556762695, 0.5986790060997009, 0.7098163366317749, 0.8209536075592041, 0.9320909380912781, 1.043228268623352, 1.1543655395507812, 1.2655029296875, 1.3766402006149292, 1.4877774715423584, 1.5989148616790771, 1.7100521326065063, 1.8211894035339355, 1.9323267936706543, 2.043464183807373, 2.1546013355255127, 2.2657387256622314, 2.37687611579895, 2.48801326751709, 2.5991506576538086, 2.7102880477905273, 2.821425437927246, 2.932562828063965, 3.0436999797821045, 3.1548373699188232, 3.265974760055542, 3.3771119117736816, 3.4882493019104004, 3.599386692047119, 3.710523843765259]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 2.0, 5.0, 13.0, 13.0, 16.0, 28.0, 28.0, 35.0, 69.0, 103.0, 174.0, 288.0, 598.0, 1272.0, 2741.0, 6772.0, 19380.0, 66915.0, 260600.0, 468065.0, 157680.0, 41799.0, 13012.0, 4838.0, 2038.0, 995.0, 456.0, 258.0, 115.0, 83.0, 42.0, 33.0, 24.0, 15.0, 15.0, 12.0, 5.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.69921875, -0.6761550903320312, -0.6530914306640625, -0.6300277709960938, -0.606964111328125, -0.5839004516601562, -0.5608367919921875, -0.5377731323242188, -0.51470947265625, -0.49164581298828125, -0.4685821533203125, -0.44551849365234375, -0.422454833984375, -0.39939117431640625, -0.3763275146484375, -0.35326385498046875, -0.3302001953125, -0.30713653564453125, -0.2840728759765625, -0.26100921630859375, -0.237945556640625, -0.21488189697265625, -0.1918182373046875, -0.16875457763671875, -0.14569091796875, -0.12262725830078125, -0.0995635986328125, -0.07649993896484375, -0.053436279296875, -0.03037261962890625, -0.0073089599609375, 0.01575469970703125, 0.038818359375, 0.06188201904296875, 0.0849456787109375, 0.10800933837890625, 0.131072998046875, 0.15413665771484375, 0.1772003173828125, 0.20026397705078125, 0.22332763671875, 0.24639129638671875, 0.2694549560546875, 0.29251861572265625, 0.315582275390625, 0.33864593505859375, 0.3617095947265625, 0.38477325439453125, 0.4078369140625, 0.43090057373046875, 0.4539642333984375, 0.47702789306640625, 0.500091552734375, 0.5231552124023438, 0.5462188720703125, 0.5692825317382812, 0.59234619140625, 0.6154098510742188, 0.6384735107421875, 0.6615371704101562, 0.684600830078125, 0.7076644897460938, 0.7307281494140625, 0.7537918090820312, 0.77685546875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 5.0, 5.0, 9.0, 9.0, 21.0, 15.0, 26.0, 38.0, 39.0, 41.0, 48.0, 46.0, 61.0, 53.0, 62.0, 63.0, 52.0, 55.0, 48.0, 44.0, 48.0, 40.0, 46.0, 27.0, 16.0, 18.0, 21.0, 18.0, 9.0, 6.0, 3.0, 5.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5419921875, -0.5274887084960938, -0.5129852294921875, -0.49848175048828125, -0.483978271484375, -0.46947479248046875, -0.4549713134765625, -0.44046783447265625, -0.42596435546875, -0.41146087646484375, -0.3969573974609375, -0.38245391845703125, -0.367950439453125, -0.35344696044921875, -0.3389434814453125, -0.32444000244140625, -0.3099365234375, -0.29543304443359375, -0.2809295654296875, -0.26642608642578125, -0.251922607421875, -0.23741912841796875, -0.2229156494140625, -0.20841217041015625, -0.19390869140625, -0.17940521240234375, -0.1649017333984375, -0.15039825439453125, -0.135894775390625, -0.12139129638671875, -0.1068878173828125, -0.09238433837890625, -0.077880859375, -0.06337738037109375, -0.0488739013671875, -0.03437042236328125, -0.019866943359375, -0.00536346435546875, 0.0091400146484375, 0.02364349365234375, 0.03814697265625, 0.05265045166015625, 0.0671539306640625, 0.08165740966796875, 0.096160888671875, 0.11066436767578125, 0.1251678466796875, 0.13967132568359375, 0.1541748046875, 0.16867828369140625, 0.1831817626953125, 0.19768524169921875, 0.212188720703125, 0.22669219970703125, 0.2411956787109375, 0.25569915771484375, 0.27020263671875, 0.28470611572265625, 0.2992095947265625, 0.31371307373046875, 0.328216552734375, 0.34272003173828125, 0.3572235107421875, 0.37172698974609375, 0.38623046875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 7.0, 3.0, 4.0, 7.0, 9.0, 12.0, 16.0, 22.0, 37.0, 47.0, 71.0, 107.0, 166.0, 215.0, 434.0, 712.0, 1447.0, 3507.0, 14883.0, 132315.0, 794263.0, 83244.0, 11024.0, 2969.0, 1309.0, 659.0, 362.0, 243.0, 150.0, 102.0, 76.0, 41.0, 24.0, 28.0, 7.0, 10.0, 6.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4677734375, -1.4195098876953125, -1.371246337890625, -1.3229827880859375, -1.27471923828125, -1.2264556884765625, -1.178192138671875, -1.1299285888671875, -1.0816650390625, -1.0334014892578125, -0.985137939453125, -0.9368743896484375, -0.88861083984375, -0.8403472900390625, -0.792083740234375, -0.7438201904296875, -0.695556640625, -0.6472930908203125, -0.599029541015625, -0.5507659912109375, -0.50250244140625, -0.4542388916015625, -0.405975341796875, -0.3577117919921875, -0.3094482421875, -0.2611846923828125, -0.212921142578125, -0.1646575927734375, -0.11639404296875, -0.0681304931640625, -0.019866943359375, 0.0283966064453125, 0.07666015625, 0.1249237060546875, 0.173187255859375, 0.2214508056640625, 0.26971435546875, 0.3179779052734375, 0.366241455078125, 0.4145050048828125, 0.4627685546875, 0.5110321044921875, 0.559295654296875, 0.6075592041015625, 0.65582275390625, 0.7040863037109375, 0.752349853515625, 0.8006134033203125, 0.848876953125, 0.8971405029296875, 0.945404052734375, 0.9936676025390625, 1.04193115234375, 1.0901947021484375, 1.138458251953125, 1.1867218017578125, 1.2349853515625, 1.2832489013671875, 1.331512451171875, 1.3797760009765625, 1.42803955078125, 1.4763031005859375, 1.524566650390625, 1.5728302001953125, 1.62109375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 5.0, 4.0, 5.0, 4.0, 14.0, 13.0, 17.0, 11.0, 12.0, 25.0, 14.0, 28.0, 29.0, 39.0, 40.0, 44.0, 47.0, 43.0, 43.0, 53.0, 65.0, 47.0, 54.0, 39.0, 39.0, 40.0, 26.0, 31.0, 37.0, 30.0, 17.0, 16.0, 20.0, 11.0, 15.0, 8.0, 1.0, 4.0, 5.0, 0.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.66015625, -1.6114654541015625, -1.562774658203125, -1.5140838623046875, -1.46539306640625, -1.4167022705078125, -1.368011474609375, -1.3193206787109375, -1.2706298828125, -1.2219390869140625, -1.173248291015625, -1.1245574951171875, -1.07586669921875, -1.0271759033203125, -0.978485107421875, -0.9297943115234375, -0.881103515625, -0.8324127197265625, -0.783721923828125, -0.7350311279296875, -0.68634033203125, -0.6376495361328125, -0.588958740234375, -0.5402679443359375, -0.4915771484375, -0.4428863525390625, -0.394195556640625, -0.3455047607421875, -0.29681396484375, -0.2481231689453125, -0.199432373046875, -0.1507415771484375, -0.10205078125, -0.0533599853515625, -0.004669189453125, 0.0440216064453125, 0.09271240234375, 0.1414031982421875, 0.190093994140625, 0.2387847900390625, 0.2874755859375, 0.3361663818359375, 0.384857177734375, 0.4335479736328125, 0.48223876953125, 0.5309295654296875, 0.579620361328125, 0.6283111572265625, 0.677001953125, 0.7256927490234375, 0.774383544921875, 0.8230743408203125, 0.87176513671875, 0.9204559326171875, 0.969146728515625, 1.0178375244140625, 1.0665283203125, 1.1152191162109375, 1.163909912109375, 1.2126007080078125, 1.26129150390625, 1.3099822998046875, 1.358673095703125, 1.4073638916015625, 1.4560546875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 5.0, 6.0, 6.0, 18.0, 20.0, 16.0, 23.0, 40.0, 45.0, 71.0, 102.0, 160.0, 212.0, 371.0, 672.0, 1463.0, 3482.0, 9653.0, 33703.0, 182703.0, 709475.0, 76827.0, 18772.0, 5907.0, 2288.0, 1039.0, 540.0, 294.0, 208.0, 101.0, 80.0, 66.0, 47.0, 31.0, 23.0, 22.0, 15.0, 10.0, 12.0, 6.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.50048828125, -0.4827880859375, -0.465087890625, -0.4473876953125, -0.4296875, -0.4119873046875, -0.394287109375, -0.3765869140625, -0.35888671875, -0.3411865234375, -0.323486328125, -0.3057861328125, -0.2880859375, -0.2703857421875, -0.252685546875, -0.2349853515625, -0.21728515625, -0.1995849609375, -0.181884765625, -0.1641845703125, -0.146484375, -0.1287841796875, -0.111083984375, -0.0933837890625, -0.07568359375, -0.0579833984375, -0.040283203125, -0.0225830078125, -0.0048828125, 0.0128173828125, 0.030517578125, 0.0482177734375, 0.06591796875, 0.0836181640625, 0.101318359375, 0.1190185546875, 0.13671875, 0.1544189453125, 0.172119140625, 0.1898193359375, 0.20751953125, 0.2252197265625, 0.242919921875, 0.2606201171875, 0.2783203125, 0.2960205078125, 0.313720703125, 0.3314208984375, 0.34912109375, 0.3668212890625, 0.384521484375, 0.4022216796875, 0.419921875, 0.4376220703125, 0.455322265625, 0.4730224609375, 0.49072265625, 0.5084228515625, 0.526123046875, 0.5438232421875, 0.5615234375, 0.5792236328125, 0.596923828125, 0.6146240234375, 0.63232421875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 8.0, 4.0, 5.0, 5.0, 10.0, 14.0, 17.0, 19.0, 25.0, 33.0, 36.0, 62.0, 120.0, 148.0, 168.0, 99.0, 53.0, 47.0, 37.0, 9.0, 12.0, 15.0, 14.0, 14.0, 10.0, 7.0, 5.0, 4.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00017511844635009766, -0.000169459730386734, -0.00016380101442337036, -0.00015814229846000671, -0.00015248358249664307, -0.00014682486653327942, -0.00014116615056991577, -0.00013550743460655212, -0.00012984871864318848, -0.00012419000267982483, -0.00011853128671646118, -0.00011287257075309753, -0.00010721385478973389, -0.00010155513882637024, -9.589642286300659e-05, -9.023770689964294e-05, -8.45789909362793e-05, -7.892027497291565e-05, -7.3261559009552e-05, -6.760284304618835e-05, -6.194412708282471e-05, -5.628541111946106e-05, -5.062669515609741e-05, -4.4967979192733765e-05, -3.930926322937012e-05, -3.365054726600647e-05, -2.7991831302642822e-05, -2.2333115339279175e-05, -1.6674399375915527e-05, -1.101568341255188e-05, -5.356967449188232e-06, 3.0174851417541504e-07, 5.9604644775390625e-06, 1.161918044090271e-05, 1.7277896404266357e-05, 2.2936612367630005e-05, 2.8595328330993652e-05, 3.42540442943573e-05, 3.991276025772095e-05, 4.5571476221084595e-05, 5.123019218444824e-05, 5.688890814781189e-05, 6.254762411117554e-05, 6.820634007453918e-05, 7.386505603790283e-05, 7.952377200126648e-05, 8.518248796463013e-05, 9.084120392799377e-05, 9.649991989135742e-05, 0.00010215863585472107, 0.00010781735181808472, 0.00011347606778144836, 0.00011913478374481201, 0.00012479349970817566, 0.0001304522156715393, 0.00013611093163490295, 0.0001417696475982666, 0.00014742836356163025, 0.0001530870795249939, 0.00015874579548835754, 0.0001644045114517212, 0.00017006322741508484, 0.00017572194337844849, 0.00018138065934181213, 0.00018703937530517578]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 11.0, 7.0, 30.0, 22.0, 33.0, 57.0, 68.0, 121.0, 164.0, 238.0, 405.0, 734.0, 1487.0, 3613.0, 11162.0, 45012.0, 325754.0, 584187.0, 54629.0, 13115.0, 4140.0, 1642.0, 738.0, 425.0, 244.0, 157.0, 103.0, 62.0, 59.0, 30.0, 27.0, 26.0, 11.0, 9.0, 10.0, 7.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.55810546875, -0.5401382446289062, -0.5221710205078125, -0.5042037963867188, -0.486236572265625, -0.46826934814453125, -0.4503021240234375, -0.43233489990234375, -0.41436767578125, -0.39640045166015625, -0.3784332275390625, -0.36046600341796875, -0.342498779296875, -0.32453155517578125, -0.3065643310546875, -0.28859710693359375, -0.2706298828125, -0.25266265869140625, -0.2346954345703125, -0.21672821044921875, -0.198760986328125, -0.18079376220703125, -0.1628265380859375, -0.14485931396484375, -0.12689208984375, -0.10892486572265625, -0.0909576416015625, -0.07299041748046875, -0.055023193359375, -0.03705596923828125, -0.0190887451171875, -0.00112152099609375, 0.016845703125, 0.03481292724609375, 0.0527801513671875, 0.07074737548828125, 0.088714599609375, 0.10668182373046875, 0.1246490478515625, 0.14261627197265625, 0.16058349609375, 0.17855072021484375, 0.1965179443359375, 0.21448516845703125, 0.232452392578125, 0.25041961669921875, 0.2683868408203125, 0.28635406494140625, 0.3043212890625, 0.32228851318359375, 0.3402557373046875, 0.35822296142578125, 0.376190185546875, 0.39415740966796875, 0.4121246337890625, 0.43009185791015625, 0.44805908203125, 0.46602630615234375, 0.4839935302734375, 0.5019607543945312, 0.519927978515625, 0.5378952026367188, 0.5558624267578125, 0.5738296508789062, 0.591796875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 0.0, 5.0, 4.0, 6.0, 6.0, 4.0, 13.0, 14.0, 20.0, 24.0, 34.0, 29.0, 44.0, 64.0, 105.0, 119.0, 119.0, 85.0, 85.0, 47.0, 44.0, 38.0, 17.0, 18.0, 9.0, 10.0, 7.0, 8.0, 8.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.67578125, -0.6580238342285156, -0.6402664184570312, -0.6225090026855469, -0.6047515869140625, -0.5869941711425781, -0.5692367553710938, -0.5514793395996094, -0.533721923828125, -0.5159645080566406, -0.49820709228515625, -0.4804496765136719, -0.4626922607421875, -0.4449348449707031, -0.42717742919921875, -0.4094200134277344, -0.39166259765625, -0.3739051818847656, -0.35614776611328125, -0.3383903503417969, -0.3206329345703125, -0.3028755187988281, -0.28511810302734375, -0.2673606872558594, -0.249603271484375, -0.23184585571289062, -0.21408843994140625, -0.19633102416992188, -0.1785736083984375, -0.16081619262695312, -0.14305877685546875, -0.12530136108398438, -0.1075439453125, -0.08978652954101562, -0.07202911376953125, -0.054271697998046875, -0.0365142822265625, -0.018756866455078125, -0.00099945068359375, 0.016757965087890625, 0.034515380859375, 0.052272796630859375, 0.07003021240234375, 0.08778762817382812, 0.1055450439453125, 0.12330245971679688, 0.14105987548828125, 0.15881729125976562, 0.17657470703125, 0.19433212280273438, 0.21208953857421875, 0.22984695434570312, 0.2476043701171875, 0.2653617858886719, 0.28311920166015625, 0.3008766174316406, 0.318634033203125, 0.3363914489746094, 0.35414886474609375, 0.3719062805175781, 0.3896636962890625, 0.4074211120605469, 0.42517852783203125, 0.4429359436035156, 0.460693359375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 8.0, 14.0, 48.0, 171.0, 397.0, 272.0, 59.0, 14.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.543594360351562, -22.92159080505371, -22.29958724975586, -21.677583694458008, -21.055580139160156, -20.433574676513672, -19.81157112121582, -19.18956756591797, -18.567564010620117, -17.945560455322266, -17.323556900024414, -16.701553344726562, -16.079547882080078, -15.457545280456543, -14.835540771484375, -14.213537216186523, -13.591533660888672, -12.96953010559082, -12.347526550292969, -11.7255220413208, -11.10351848602295, -10.481514930725098, -9.85951042175293, -9.237506866455078, -8.615503311157227, -7.993499755859375, -7.371495723724365, -6.7494916915893555, -6.127488136291504, -5.505484580993652, -4.883480548858643, -4.261476516723633, -3.6394710540771484, -3.0174672603607178, -2.395463466644287, -1.7734596729278564, -1.1514558792114258, -0.5294520854949951, 0.09255170822143555, 0.7145557403564453, 1.3365592956542969, 1.9585630893707275, 2.580566883087158, 3.202570676803589, 3.8245744705200195, 4.446578025817871, 5.068582057952881, 5.690586090087891, 6.312589645385742, 6.934593200683594, 7.5565972328186035, 8.178601264953613, 8.800604820251465, 9.422608375549316, 10.044612884521484, 10.666616439819336, 11.288619995117188, 11.910623550415039, 12.53262710571289, 13.154631614685059, 13.77663516998291, 14.398638725280762, 15.02064323425293, 15.642646789550781, 16.264650344848633]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 6.0, 3.0, 6.0, 3.0, 12.0, 7.0, 14.0, 16.0, 23.0, 26.0, 17.0, 15.0, 15.0, 26.0, 39.0, 28.0, 52.0, 54.0, 57.0, 74.0, 80.0, 63.0, 45.0, 37.0, 47.0, 31.0, 22.0, 27.0, 32.0, 26.0, 19.0, 8.0, 16.0, 18.0, 8.0, 10.0, 7.0, 5.0, 1.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.54152774810791, -4.343632698059082, -4.145737648010254, -3.947842836380005, -3.749948024749756, -3.5520529747009277, -3.3541579246520996, -3.1562628746032715, -2.9583680629730225, -2.7604730129241943, -2.5625782012939453, -2.364683151245117, -2.166788101196289, -1.96889328956604, -1.770998239517212, -1.5731033086776733, -1.3752083778381348, -1.1773134469985962, -0.9794184565544128, -0.7815234661102295, -0.5836285352706909, -0.38573360443115234, -0.18783855438232422, 0.010056376457214355, 0.20795130729675293, 0.4058462679386139, 0.6037412285804749, 0.8016362190246582, 0.9995311498641968, 1.1974260807037354, 1.3953211307525635, 1.593216061592102, 1.7911109924316406, 1.9890059232711792, 2.1869008541107178, 2.384795904159546, 2.582690715789795, 2.780585765838623, 2.978480815887451, 3.1763758659362793, 3.3742706775665283, 3.5721657276153564, 3.7700605392456055, 3.9679555892944336, 4.165850639343262, 4.36374568939209, 4.561640739440918, 4.759535312652588, 4.957430362701416, 5.155325412750244, 5.353220462799072, 5.551115036010742, 5.74901008605957, 5.946905136108398, 6.144800186157227, 6.342695236206055, 6.540590286254883, 6.738485336303711, 6.936380386352539, 7.134275436401367, 7.332170009613037, 7.530065059661865, 7.727960109710693, 7.9258551597595215, 8.123749732971191]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 13.0, 21.0, 22.0, 39.0, 63.0, 114.0, 199.0, 374.0, 871.0, 2181.0, 7644.0, 52512.0, 1745658.0, 2298655.0, 71300.0, 9696.0, 2864.0, 1020.0, 489.0, 241.0, 131.0, 71.0, 45.0, 16.0, 16.0, 10.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6669921875, -0.6403656005859375, -0.613739013671875, -0.5871124267578125, -0.56048583984375, -0.5338592529296875, -0.507232666015625, -0.4806060791015625, -0.4539794921875, -0.4273529052734375, -0.400726318359375, -0.3740997314453125, -0.34747314453125, -0.3208465576171875, -0.294219970703125, -0.2675933837890625, -0.240966796875, -0.2143402099609375, -0.187713623046875, -0.1610870361328125, -0.13446044921875, -0.1078338623046875, -0.081207275390625, -0.0545806884765625, -0.0279541015625, -0.0013275146484375, 0.025299072265625, 0.0519256591796875, 0.07855224609375, 0.1051788330078125, 0.131805419921875, 0.1584320068359375, 0.18505859375, 0.2116851806640625, 0.238311767578125, 0.2649383544921875, 0.29156494140625, 0.3181915283203125, 0.344818115234375, 0.3714447021484375, 0.3980712890625, 0.4246978759765625, 0.451324462890625, 0.4779510498046875, 0.50457763671875, 0.5312042236328125, 0.557830810546875, 0.5844573974609375, 0.611083984375, 0.6377105712890625, 0.664337158203125, 0.6909637451171875, 0.71759033203125, 0.7442169189453125, 0.770843505859375, 0.7974700927734375, 0.8240966796875, 0.8507232666015625, 0.877349853515625, 0.9039764404296875, 0.93060302734375, 0.9572296142578125, 0.983856201171875, 1.0104827880859375, 1.037109375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 7.0, 17.0, 15.0, 18.0, 16.0, 30.0, 42.0, 56.0, 60.0, 57.0, 63.0, 73.0, 73.0, 64.0, 61.0, 58.0, 54.0, 56.0, 55.0, 36.0, 17.0, 24.0, 20.0, 6.0, 11.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.576171875, -0.5590133666992188, -0.5418548583984375, -0.5246963500976562, -0.507537841796875, -0.49037933349609375, -0.4732208251953125, -0.45606231689453125, -0.43890380859375, -0.42174530029296875, -0.4045867919921875, -0.38742828369140625, -0.370269775390625, -0.35311126708984375, -0.3359527587890625, -0.31879425048828125, -0.3016357421875, -0.28447723388671875, -0.2673187255859375, -0.25016021728515625, -0.233001708984375, -0.21584320068359375, -0.1986846923828125, -0.18152618408203125, -0.16436767578125, -0.14720916748046875, -0.1300506591796875, -0.11289215087890625, -0.095733642578125, -0.07857513427734375, -0.0614166259765625, -0.04425811767578125, -0.027099609375, -0.00994110107421875, 0.0072174072265625, 0.02437591552734375, 0.041534423828125, 0.05869293212890625, 0.0758514404296875, 0.09300994873046875, 0.11016845703125, 0.12732696533203125, 0.1444854736328125, 0.16164398193359375, 0.178802490234375, 0.19596099853515625, 0.2131195068359375, 0.23027801513671875, 0.2474365234375, 0.26459503173828125, 0.2817535400390625, 0.29891204833984375, 0.316070556640625, 0.33322906494140625, 0.3503875732421875, 0.36754608154296875, 0.38470458984375, 0.40186309814453125, 0.4190216064453125, 0.43618011474609375, 0.453338623046875, 0.47049713134765625, 0.4876556396484375, 0.5048141479492188, 0.52197265625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 5.0, 11.0, 9.0, 13.0, 28.0, 43.0, 76.0, 158.0, 302.0, 879.0, 3308.0, 30162.0, 4009570.0, 140636.0, 6514.0, 1595.0, 498.0, 194.0, 118.0, 72.0, 37.0, 27.0, 8.0, 7.0, 5.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8515625, -1.7869873046875, -1.722412109375, -1.6578369140625, -1.59326171875, -1.5286865234375, -1.464111328125, -1.3995361328125, -1.3349609375, -1.2703857421875, -1.205810546875, -1.1412353515625, -1.07666015625, -1.0120849609375, -0.947509765625, -0.8829345703125, -0.818359375, -0.7537841796875, -0.689208984375, -0.6246337890625, -0.56005859375, -0.4954833984375, -0.430908203125, -0.3663330078125, -0.3017578125, -0.2371826171875, -0.172607421875, -0.1080322265625, -0.04345703125, 0.0211181640625, 0.085693359375, 0.1502685546875, 0.21484375, 0.2794189453125, 0.343994140625, 0.4085693359375, 0.47314453125, 0.5377197265625, 0.602294921875, 0.6668701171875, 0.7314453125, 0.7960205078125, 0.860595703125, 0.9251708984375, 0.98974609375, 1.0543212890625, 1.118896484375, 1.1834716796875, 1.248046875, 1.3126220703125, 1.377197265625, 1.4417724609375, 1.50634765625, 1.5709228515625, 1.635498046875, 1.7000732421875, 1.7646484375, 1.8292236328125, 1.893798828125, 1.9583740234375, 2.02294921875, 2.0875244140625, 2.152099609375, 2.2166748046875, 2.28125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 3.0, 5.0, 5.0, 8.0, 18.0, 26.0, 37.0, 68.0, 176.0, 375.0, 758.0, 1041.0, 776.0, 380.0, 184.0, 90.0, 46.0, 17.0, 17.0, 8.0, 10.0, 6.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0224609375, -0.987884521484375, -0.95330810546875, -0.918731689453125, -0.8841552734375, -0.849578857421875, -0.81500244140625, -0.780426025390625, -0.745849609375, -0.711273193359375, -0.67669677734375, -0.642120361328125, -0.6075439453125, -0.572967529296875, -0.53839111328125, -0.503814697265625, -0.46923828125, -0.434661865234375, -0.40008544921875, -0.365509033203125, -0.3309326171875, -0.296356201171875, -0.26177978515625, -0.227203369140625, -0.192626953125, -0.158050537109375, -0.12347412109375, -0.088897705078125, -0.0543212890625, -0.019744873046875, 0.01483154296875, 0.049407958984375, 0.083984375, 0.118560791015625, 0.15313720703125, 0.187713623046875, 0.2222900390625, 0.256866455078125, 0.29144287109375, 0.326019287109375, 0.360595703125, 0.395172119140625, 0.42974853515625, 0.464324951171875, 0.4989013671875, 0.533477783203125, 0.56805419921875, 0.602630615234375, 0.63720703125, 0.671783447265625, 0.70635986328125, 0.740936279296875, 0.7755126953125, 0.810089111328125, 0.84466552734375, 0.879241943359375, 0.913818359375, 0.948394775390625, 0.98297119140625, 1.017547607421875, 1.0521240234375, 1.086700439453125, 1.12127685546875, 1.155853271484375, 1.1904296875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 13.0, 29.0, 95.0, 338.0, 364.0, 104.0, 30.0, 14.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.368759155273438, -16.82703399658203, -16.285308837890625, -15.743585586547852, -15.201860427856445, -14.660135269165039, -14.11841106414795, -13.57668685913086, -13.034961700439453, -12.493236541748047, -11.951512336730957, -11.409788131713867, -10.868062973022461, -10.326337814331055, -9.784613609313965, -9.242889404296875, -8.701164245605469, -8.159439086914062, -7.617714881896973, -7.075990200042725, -6.534265518188477, -5.9925408363342285, -5.4508161544799805, -4.909091472625732, -4.367366790771484, -3.8256421089172363, -3.2839174270629883, -2.7421927452087402, -2.200468063354492, -1.6587433815002441, -1.117018699645996, -0.575294017791748, -0.0335693359375, 0.508155345916748, 1.049880027770996, 1.5916047096252441, 2.133329391479492, 2.6750540733337402, 3.2167787551879883, 3.7585034370422363, 4.300228118896484, 4.841952800750732, 5.3836774826049805, 5.9254021644592285, 6.467126846313477, 7.008851528167725, 7.550576210021973, 8.092300415039062, 8.634025573730469, 9.175750732421875, 9.717474937438965, 10.259199142456055, 10.800924301147461, 11.342649459838867, 11.884373664855957, 12.426097869873047, 12.967823028564453, 13.50954818725586, 14.05127239227295, 14.592996597290039, 15.134721755981445, 15.676446914672852, 16.218170166015625, 16.75989532470703, 17.301620483398438]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 9.0, 8.0, 7.0, 15.0, 29.0, 29.0, 51.0, 59.0, 61.0, 80.0, 104.0, 94.0, 72.0, 64.0, 73.0, 60.0, 53.0, 33.0, 27.0, 18.0, 19.0, 20.0, 7.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.5304436683654785, -6.347877025604248, -6.165310382843018, -5.982743263244629, -5.800176620483398, -5.617609977722168, -5.4350433349609375, -5.252476692199707, -5.069910049438477, -4.887343406677246, -4.704776763916016, -4.522210121154785, -4.3396430015563965, -4.157076358795166, -3.9745097160339355, -3.791943073272705, -3.6093759536743164, -3.426809310913086, -3.2442424297332764, -3.061675786972046, -2.8791089057922363, -2.696542263031006, -2.5139756202697754, -2.331408977508545, -2.1488420963287354, -1.9662753343582153, -1.7837085723876953, -1.6011419296264648, -1.4185751676559448, -1.2360084056854248, -1.0534417629241943, -0.8708750009536743, -0.6883087158203125, -0.5057419538497925, -0.32317525148391724, -0.140608549118042, 0.04195821285247803, 0.22452497482299805, 0.4070916175842285, 0.5896583795547485, 0.7722251415252686, 0.9547919034957886, 1.1373586654663086, 1.319925308227539, 1.502492070198059, 1.685058832168579, 1.8676254749298096, 2.050192356109619, 2.2327589988708496, 2.41532564163208, 2.5978925228118896, 2.78045916557312, 2.9630260467529297, 3.14559268951416, 3.3281593322753906, 3.510725975036621, 3.6932928562164307, 3.875859498977661, 4.058426380157471, 4.240993022918701, 4.423559665679932, 4.60612678527832, 4.788693428039551, 4.971260070800781, 5.153826713562012]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 2.0, 4.0, 7.0, 7.0, 15.0, 23.0, 25.0, 33.0, 51.0, 79.0, 164.0, 374.0, 951.0, 2797.0, 11195.0, 71103.0, 518851.0, 384164.0, 46951.0, 8103.0, 2260.0, 695.0, 306.0, 172.0, 79.0, 37.0, 36.0, 21.0, 11.0, 11.0, 12.0, 6.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1025390625, -1.0709457397460938, -1.0393524169921875, -1.0077590942382812, -0.976165771484375, -0.9445724487304688, -0.9129791259765625, -0.8813858032226562, -0.84979248046875, -0.8181991577148438, -0.7866058349609375, -0.7550125122070312, -0.723419189453125, -0.6918258666992188, -0.6602325439453125, -0.6286392211914062, -0.5970458984375, -0.5654525756835938, -0.5338592529296875, -0.5022659301757812, -0.470672607421875, -0.43907928466796875, -0.4074859619140625, -0.37589263916015625, -0.34429931640625, -0.31270599365234375, -0.2811126708984375, -0.24951934814453125, -0.217926025390625, -0.18633270263671875, -0.1547393798828125, -0.12314605712890625, -0.091552734375, -0.05995941162109375, -0.0283660888671875, 0.00322723388671875, 0.034820556640625, 0.06641387939453125, 0.0980072021484375, 0.12960052490234375, 0.16119384765625, 0.19278717041015625, 0.2243804931640625, 0.25597381591796875, 0.287567138671875, 0.31916046142578125, 0.3507537841796875, 0.38234710693359375, 0.4139404296875, 0.44553375244140625, 0.4771270751953125, 0.5087203979492188, 0.540313720703125, 0.5719070434570312, 0.6035003662109375, 0.6350936889648438, 0.66668701171875, 0.6982803344726562, 0.7298736572265625, 0.7614669799804688, 0.793060302734375, 0.8246536254882812, 0.8562469482421875, 0.8878402709960938, 0.91943359375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 7.0, 4.0, 8.0, 15.0, 26.0, 21.0, 31.0, 35.0, 56.0, 48.0, 63.0, 83.0, 64.0, 64.0, 57.0, 73.0, 56.0, 50.0, 55.0, 46.0, 30.0, 25.0, 22.0, 22.0, 18.0, 9.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.646484375, -0.6292762756347656, -0.6120681762695312, -0.5948600769042969, -0.5776519775390625, -0.5604438781738281, -0.5432357788085938, -0.5260276794433594, -0.508819580078125, -0.4916114807128906, -0.47440338134765625, -0.4571952819824219, -0.4399871826171875, -0.4227790832519531, -0.40557098388671875, -0.3883628845214844, -0.37115478515625, -0.3539466857910156, -0.33673858642578125, -0.3195304870605469, -0.3023223876953125, -0.2851142883300781, -0.26790618896484375, -0.2506980895996094, -0.233489990234375, -0.21628189086914062, -0.19907379150390625, -0.18186569213867188, -0.1646575927734375, -0.14744949340820312, -0.13024139404296875, -0.11303329467773438, -0.0958251953125, -0.07861709594726562, -0.06140899658203125, -0.044200897216796875, -0.0269927978515625, -0.009784698486328125, 0.00742340087890625, 0.024631500244140625, 0.041839599609375, 0.059047698974609375, 0.07625579833984375, 0.09346389770507812, 0.1106719970703125, 0.12788009643554688, 0.14508819580078125, 0.16229629516601562, 0.17950439453125, 0.19671249389648438, 0.21392059326171875, 0.23112869262695312, 0.2483367919921875, 0.2655448913574219, 0.28275299072265625, 0.2999610900878906, 0.317169189453125, 0.3343772888183594, 0.35158538818359375, 0.3687934875488281, 0.3860015869140625, 0.4032096862792969, 0.42041778564453125, 0.4376258850097656, 0.454833984375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 8.0, 8.0, 16.0, 21.0, 13.0, 26.0, 33.0, 42.0, 52.0, 87.0, 148.0, 242.0, 460.0, 1211.0, 3974.0, 18847.0, 138669.0, 727365.0, 132929.0, 18204.0, 3919.0, 1155.0, 453.0, 213.0, 143.0, 87.0, 53.0, 54.0, 23.0, 21.0, 16.0, 14.0, 8.0, 8.0, 8.0, 8.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2021484375, -1.1692047119140625, -1.136260986328125, -1.1033172607421875, -1.07037353515625, -1.0374298095703125, -1.004486083984375, -0.9715423583984375, -0.9385986328125, -0.9056549072265625, -0.872711181640625, -0.8397674560546875, -0.80682373046875, -0.7738800048828125, -0.740936279296875, -0.7079925537109375, -0.675048828125, -0.6421051025390625, -0.609161376953125, -0.5762176513671875, -0.54327392578125, -0.5103302001953125, -0.477386474609375, -0.4444427490234375, -0.4114990234375, -0.3785552978515625, -0.345611572265625, -0.3126678466796875, -0.27972412109375, -0.2467803955078125, -0.213836669921875, -0.1808929443359375, -0.14794921875, -0.1150054931640625, -0.082061767578125, -0.0491180419921875, -0.01617431640625, 0.0167694091796875, 0.049713134765625, 0.0826568603515625, 0.1156005859375, 0.1485443115234375, 0.181488037109375, 0.2144317626953125, 0.24737548828125, 0.2803192138671875, 0.313262939453125, 0.3462066650390625, 0.379150390625, 0.4120941162109375, 0.445037841796875, 0.4779815673828125, 0.51092529296875, 0.5438690185546875, 0.576812744140625, 0.6097564697265625, 0.6427001953125, 0.6756439208984375, 0.708587646484375, 0.7415313720703125, 0.77447509765625, 0.8074188232421875, 0.840362548828125, 0.8733062744140625, 0.90625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 7.0, 9.0, 9.0, 7.0, 11.0, 16.0, 16.0, 21.0, 27.0, 30.0, 41.0, 40.0, 41.0, 57.0, 50.0, 50.0, 63.0, 60.0, 64.0, 55.0, 34.0, 41.0, 41.0, 51.0, 28.0, 27.0, 19.0, 20.0, 21.0, 8.0, 12.0, 4.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.791015625, -1.7397003173828125, -1.688385009765625, -1.6370697021484375, -1.58575439453125, -1.5344390869140625, -1.483123779296875, -1.4318084716796875, -1.3804931640625, -1.3291778564453125, -1.277862548828125, -1.2265472412109375, -1.17523193359375, -1.1239166259765625, -1.072601318359375, -1.0212860107421875, -0.969970703125, -0.9186553955078125, -0.867340087890625, -0.8160247802734375, -0.76470947265625, -0.7133941650390625, -0.662078857421875, -0.6107635498046875, -0.5594482421875, -0.5081329345703125, -0.456817626953125, -0.4055023193359375, -0.35418701171875, -0.3028717041015625, -0.251556396484375, -0.2002410888671875, -0.14892578125, -0.0976104736328125, -0.046295166015625, 0.0050201416015625, 0.05633544921875, 0.1076507568359375, 0.158966064453125, 0.2102813720703125, 0.2615966796875, 0.3129119873046875, 0.364227294921875, 0.4155426025390625, 0.46685791015625, 0.5181732177734375, 0.569488525390625, 0.6208038330078125, 0.672119140625, 0.7234344482421875, 0.774749755859375, 0.8260650634765625, 0.87738037109375, 0.9286956787109375, 0.980010986328125, 1.0313262939453125, 1.0826416015625, 1.1339569091796875, 1.185272216796875, 1.2365875244140625, 1.28790283203125, 1.3392181396484375, 1.390533447265625, 1.4418487548828125, 1.4931640625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 17.0, 40.0, 44.0, 75.0, 152.0, 388.0, 755.0, 2002.0, 5749.0, 20813.0, 116107.0, 711300.0, 154305.0, 26051.0, 6767.0, 2319.0, 881.0, 382.0, 174.0, 95.0, 51.0, 33.0, 20.0, 9.0, 6.0, 0.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.393798828125, -0.38240814208984375, -0.3710174560546875, -0.35962677001953125, -0.348236083984375, -0.33684539794921875, -0.3254547119140625, -0.31406402587890625, -0.30267333984375, -0.29128265380859375, -0.2798919677734375, -0.26850128173828125, -0.257110595703125, -0.24571990966796875, -0.2343292236328125, -0.22293853759765625, -0.2115478515625, -0.20015716552734375, -0.1887664794921875, -0.17737579345703125, -0.165985107421875, -0.15459442138671875, -0.1432037353515625, -0.13181304931640625, -0.12042236328125, -0.10903167724609375, -0.0976409912109375, -0.08625030517578125, -0.074859619140625, -0.06346893310546875, -0.0520782470703125, -0.04068756103515625, -0.029296875, -0.01790618896484375, -0.0065155029296875, 0.00487518310546875, 0.016265869140625, 0.02765655517578125, 0.0390472412109375, 0.05043792724609375, 0.06182861328125, 0.07321929931640625, 0.0846099853515625, 0.09600067138671875, 0.107391357421875, 0.11878204345703125, 0.1301727294921875, 0.14156341552734375, 0.1529541015625, 0.16434478759765625, 0.1757354736328125, 0.18712615966796875, 0.198516845703125, 0.20990753173828125, 0.2212982177734375, 0.23268890380859375, 0.24407958984375, 0.25547027587890625, 0.2668609619140625, 0.27825164794921875, 0.289642333984375, 0.30103302001953125, 0.3124237060546875, 0.32381439208984375, 0.335205078125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 11.0, 8.0, 15.0, 23.0, 38.0, 57.0, 87.0, 124.0, 161.0, 130.0, 117.0, 81.0, 42.0, 30.0, 24.0, 9.0, 9.0, 4.0, 4.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00014090538024902344, -0.00013726204633712769, -0.00013361871242523193, -0.00012997537851333618, -0.00012633204460144043, -0.00012268871068954468, -0.00011904537677764893, -0.00011540204286575317, -0.00011175870895385742, -0.00010811537504196167, -0.00010447204113006592, -0.00010082870721817017, -9.718537330627441e-05, -9.354203939437866e-05, -8.989870548248291e-05, -8.625537157058716e-05, -8.26120376586914e-05, -7.896870374679565e-05, -7.53253698348999e-05, -7.168203592300415e-05, -6.80387020111084e-05, -6.439536809921265e-05, -6.0752034187316895e-05, -5.710870027542114e-05, -5.346536636352539e-05, -4.982203245162964e-05, -4.617869853973389e-05, -4.2535364627838135e-05, -3.889203071594238e-05, -3.524869680404663e-05, -3.160536289215088e-05, -2.7962028980255127e-05, -2.4318695068359375e-05, -2.0675361156463623e-05, -1.703202724456787e-05, -1.3388693332672119e-05, -9.745359420776367e-06, -6.102025508880615e-06, -2.4586915969848633e-06, 1.1846423149108887e-06, 4.827976226806641e-06, 8.471310138702393e-06, 1.2114644050598145e-05, 1.5757977962493896e-05, 1.940131187438965e-05, 2.30446457862854e-05, 2.6687979698181152e-05, 3.0331313610076904e-05, 3.3974647521972656e-05, 3.761798143386841e-05, 4.126131534576416e-05, 4.490464925765991e-05, 4.8547983169555664e-05, 5.2191317081451416e-05, 5.583465099334717e-05, 5.947798490524292e-05, 6.312131881713867e-05, 6.676465272903442e-05, 7.040798664093018e-05, 7.405132055282593e-05, 7.769465446472168e-05, 8.133798837661743e-05, 8.498132228851318e-05, 8.862465620040894e-05, 9.226799011230469e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 11.0, 14.0, 21.0, 27.0, 56.0, 131.0, 215.0, 518.0, 1395.0, 4669.0, 18099.0, 102527.0, 712500.0, 171754.0, 27174.0, 6401.0, 1810.0, 669.0, 279.0, 104.0, 65.0, 40.0, 29.0, 14.0, 16.0, 9.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.421630859375, -0.4090919494628906, -0.39655303955078125, -0.3840141296386719, -0.3714752197265625, -0.3589363098144531, -0.34639739990234375, -0.3338584899902344, -0.321319580078125, -0.3087806701660156, -0.29624176025390625, -0.2837028503417969, -0.2711639404296875, -0.2586250305175781, -0.24608612060546875, -0.23354721069335938, -0.22100830078125, -0.20846939086914062, -0.19593048095703125, -0.18339157104492188, -0.1708526611328125, -0.15831375122070312, -0.14577484130859375, -0.13323593139648438, -0.120697021484375, -0.10815811157226562, -0.09561920166015625, -0.08308029174804688, -0.0705413818359375, -0.058002471923828125, -0.04546356201171875, -0.032924652099609375, -0.0203857421875, -0.007846832275390625, 0.00469207763671875, 0.017230987548828125, 0.0297698974609375, 0.042308807373046875, 0.05484771728515625, 0.06738662719726562, 0.079925537109375, 0.09246444702148438, 0.10500335693359375, 0.11754226684570312, 0.1300811767578125, 0.14262008666992188, 0.15515899658203125, 0.16769790649414062, 0.18023681640625, 0.19277572631835938, 0.20531463623046875, 0.21785354614257812, 0.2303924560546875, 0.24293136596679688, 0.25547027587890625, 0.2680091857910156, 0.280548095703125, 0.2930870056152344, 0.30562591552734375, 0.3181648254394531, 0.3307037353515625, 0.3432426452636719, 0.35578155517578125, 0.3683204650878906, 0.380859375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 3.0, 7.0, 5.0, 7.0, 7.0, 12.0, 9.0, 22.0, 40.0, 32.0, 49.0, 54.0, 80.0, 92.0, 84.0, 82.0, 76.0, 77.0, 71.0, 35.0, 31.0, 23.0, 25.0, 18.0, 13.0, 8.0, 8.0, 4.0, 3.0, 4.0, 2.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.265869140625, -0.2559852600097656, -0.24610137939453125, -0.23621749877929688, -0.2263336181640625, -0.21644973754882812, -0.20656585693359375, -0.19668197631835938, -0.186798095703125, -0.17691421508789062, -0.16703033447265625, -0.15714645385742188, -0.1472625732421875, -0.13737869262695312, -0.12749481201171875, -0.11761093139648438, -0.10772705078125, -0.09784317016601562, -0.08795928955078125, -0.07807540893554688, -0.0681915283203125, -0.058307647705078125, -0.04842376708984375, -0.038539886474609375, -0.028656005859375, -0.018772125244140625, -0.00888824462890625, 0.000995635986328125, 0.0108795166015625, 0.020763397216796875, 0.03064727783203125, 0.040531158447265625, 0.0504150390625, 0.060298919677734375, 0.07018280029296875, 0.08006668090820312, 0.0899505615234375, 0.09983444213867188, 0.10971832275390625, 0.11960220336914062, 0.129486083984375, 0.13936996459960938, 0.14925384521484375, 0.15913772583007812, 0.1690216064453125, 0.17890548706054688, 0.18878936767578125, 0.19867324829101562, 0.20855712890625, 0.21844100952148438, 0.22832489013671875, 0.23820877075195312, 0.2480926513671875, 0.2579765319824219, 0.26786041259765625, 0.2777442932128906, 0.287628173828125, 0.2975120544433594, 0.30739593505859375, 0.3172798156738281, 0.3271636962890625, 0.3370475769042969, 0.34693145751953125, 0.3568153381347656, 0.36669921875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 4.0, 4.0, 4.0, 15.0, 33.0, 74.0, 161.0, 359.0, 216.0, 81.0, 31.0, 11.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.750744819641113, -11.403002738952637, -11.05526065826416, -10.707518577575684, -10.359776496887207, -10.01203441619873, -9.664291381835938, -9.316549301147461, -8.968807220458984, -8.621065139770508, -8.273323059082031, -7.925580978393555, -7.577838897705078, -7.230096817016602, -6.882354259490967, -6.53461217880249, -6.186870574951172, -5.839128494262695, -5.491386413574219, -5.143644332885742, -4.795902252197266, -4.448160171508789, -4.100417613983154, -3.7526755332946777, -3.404933452606201, -3.0571913719177246, -2.709449291229248, -2.3617069721221924, -2.013964891433716, -1.6662228107452393, -1.3184804916381836, -0.970738410949707, -0.6229953765869141, -0.2752532362937927, 0.07248890399932861, 0.4202311038970947, 0.7679731845855713, 1.1157152652740479, 1.4634575843811035, 1.81119966506958, 2.1589417457580566, 2.506683826446533, 2.8544259071350098, 3.2021682262420654, 3.549910306930542, 3.8976523876190186, 4.245394706726074, 4.593136787414551, 4.940878868103027, 5.288620948791504, 5.6363630294799805, 5.984105110168457, 6.331847190856934, 6.67958927154541, 7.027331829071045, 7.3750739097595215, 7.722815990447998, 8.070558547973633, 8.41830062866211, 8.766042709350586, 9.113784790039062, 9.461526870727539, 9.809268951416016, 10.157011032104492, 10.504753112792969]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 5.0, 2.0, 6.0, 5.0, 11.0, 4.0, 15.0, 13.0, 22.0, 32.0, 36.0, 38.0, 48.0, 41.0, 59.0, 81.0, 85.0, 94.0, 94.0, 52.0, 33.0, 41.0, 25.0, 35.0, 22.0, 21.0, 21.0, 20.0, 11.0, 16.0, 7.0, 3.0, 2.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6579790115356445, -4.439215183258057, -4.220451831817627, -4.001688003540039, -3.782924175262451, -3.5641605854034424, -3.3453969955444336, -3.1266331672668457, -2.907869338989258, -2.689105749130249, -2.470341920852661, -2.2515783309936523, -2.0328145027160645, -1.8140509128570557, -1.5952872037887573, -1.376523494720459, -1.1577599048614502, -0.9389961957931519, -0.7202324867248535, -0.5014688372612, -0.2827051281929016, -0.06394147872924805, 0.1548222303390503, 0.37358593940734863, 0.592349648475647, 0.8111133575439453, 1.0298770666122437, 1.248640775680542, 1.4674043655395508, 1.6861680746078491, 1.9049317836761475, 2.1236953735351562, 2.342459201812744, 2.561222791671753, 2.779986619949341, 2.9987502098083496, 3.2175140380859375, 3.4362776279449463, 3.655041217803955, 3.873805046081543, 4.092568874359131, 4.311332702636719, 4.530096054077148, 4.748859882354736, 4.967623710632324, 5.186387062072754, 5.405150890350342, 5.62391471862793, 5.842678070068359, 6.061441898345947, 6.280205249786377, 6.498969078063965, 6.717732906341553, 6.936496734619141, 7.15526008605957, 7.374023914337158, 7.592787742614746, 7.811551570892334, 8.030315399169922, 8.249078750610352, 8.467842102050781, 8.686606407165527, 8.905369758605957, 9.124134063720703, 9.342897415161133]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 4.0, 11.0, 10.0, 31.0, 47.0, 66.0, 106.0, 187.0, 324.0, 574.0, 1224.0, 2546.0, 6785.0, 27647.0, 266295.0, 2737447.0, 1055147.0, 75120.0, 13300.0, 4047.0, 1545.0, 743.0, 435.0, 241.0, 125.0, 95.0, 57.0, 35.0, 21.0, 14.0, 15.0, 11.0, 4.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.6171875, -0.5983428955078125, -0.579498291015625, -0.5606536865234375, -0.54180908203125, -0.5229644775390625, -0.504119873046875, -0.4852752685546875, -0.4664306640625, -0.4475860595703125, -0.428741455078125, -0.4098968505859375, -0.39105224609375, -0.3722076416015625, -0.353363037109375, -0.3345184326171875, -0.315673828125, -0.2968292236328125, -0.277984619140625, -0.2591400146484375, -0.24029541015625, -0.2214508056640625, -0.202606201171875, -0.1837615966796875, -0.1649169921875, -0.1460723876953125, -0.127227783203125, -0.1083831787109375, -0.08953857421875, -0.0706939697265625, -0.051849365234375, -0.0330047607421875, -0.01416015625, 0.0046844482421875, 0.023529052734375, 0.0423736572265625, 0.06121826171875, 0.0800628662109375, 0.098907470703125, 0.1177520751953125, 0.1365966796875, 0.1554412841796875, 0.174285888671875, 0.1931304931640625, 0.21197509765625, 0.2308197021484375, 0.249664306640625, 0.2685089111328125, 0.287353515625, 0.3061981201171875, 0.325042724609375, 0.3438873291015625, 0.36273193359375, 0.3815765380859375, 0.400421142578125, 0.4192657470703125, 0.4381103515625, 0.4569549560546875, 0.475799560546875, 0.4946441650390625, 0.51348876953125, 0.5323333740234375, 0.551177978515625, 0.5700225830078125, 0.5888671875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 13.0, 19.0, 11.0, 26.0, 30.0, 38.0, 35.0, 55.0, 47.0, 60.0, 56.0, 61.0, 58.0, 70.0, 58.0, 53.0, 41.0, 47.0, 38.0, 34.0, 34.0, 22.0, 20.0, 23.0, 18.0, 8.0, 8.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.53759765625, -0.5225715637207031, -0.5075454711914062, -0.4925193786621094, -0.4774932861328125, -0.4624671936035156, -0.44744110107421875, -0.4324150085449219, -0.417388916015625, -0.4023628234863281, -0.38733673095703125, -0.3723106384277344, -0.3572845458984375, -0.3422584533691406, -0.32723236083984375, -0.3122062683105469, -0.29718017578125, -0.2821540832519531, -0.26712799072265625, -0.2521018981933594, -0.2370758056640625, -0.22204971313476562, -0.20702362060546875, -0.19199752807617188, -0.176971435546875, -0.16194534301757812, -0.14691925048828125, -0.13189315795898438, -0.1168670654296875, -0.10184097290039062, -0.08681488037109375, -0.07178878784179688, -0.0567626953125, -0.041736602783203125, -0.02671051025390625, -0.011684417724609375, 0.0033416748046875, 0.018367767333984375, 0.03339385986328125, 0.048419952392578125, 0.063446044921875, 0.07847213745117188, 0.09349822998046875, 0.10852432250976562, 0.1235504150390625, 0.13857650756835938, 0.15360260009765625, 0.16862869262695312, 0.18365478515625, 0.19868087768554688, 0.21370697021484375, 0.22873306274414062, 0.2437591552734375, 0.2587852478027344, 0.27381134033203125, 0.2888374328613281, 0.303863525390625, 0.3188896179199219, 0.33391571044921875, 0.3489418029785156, 0.3639678955078125, 0.3789939880371094, 0.39402008056640625, 0.4090461730957031, 0.424072265625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 12.0, 19.0, 37.0, 74.0, 218.0, 606.0, 5628.0, 4130992.0, 54892.0, 1222.0, 354.0, 125.0, 62.0, 26.0, 12.0, 7.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.490234375, -3.386688232421875, -3.28314208984375, -3.179595947265625, -3.0760498046875, -2.972503662109375, -2.86895751953125, -2.765411376953125, -2.661865234375, -2.558319091796875, -2.45477294921875, -2.351226806640625, -2.2476806640625, -2.144134521484375, -2.04058837890625, -1.937042236328125, -1.83349609375, -1.729949951171875, -1.62640380859375, -1.522857666015625, -1.4193115234375, -1.315765380859375, -1.21221923828125, -1.108673095703125, -1.005126953125, -0.901580810546875, -0.79803466796875, -0.694488525390625, -0.5909423828125, -0.487396240234375, -0.38385009765625, -0.280303955078125, -0.1767578125, -0.073211669921875, 0.03033447265625, 0.133880615234375, 0.2374267578125, 0.340972900390625, 0.44451904296875, 0.548065185546875, 0.651611328125, 0.755157470703125, 0.85870361328125, 0.962249755859375, 1.0657958984375, 1.169342041015625, 1.27288818359375, 1.376434326171875, 1.47998046875, 1.583526611328125, 1.68707275390625, 1.790618896484375, 1.8941650390625, 1.997711181640625, 2.10125732421875, 2.204803466796875, 2.308349609375, 2.411895751953125, 2.51544189453125, 2.618988037109375, 2.7225341796875, 2.826080322265625, 2.92962646484375, 3.033172607421875, 3.13671875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 6.0, 11.0, 10.0, 9.0, 21.0, 39.0, 47.0, 121.0, 238.0, 395.0, 713.0, 852.0, 673.0, 426.0, 216.0, 115.0, 74.0, 33.0, 21.0, 16.0, 8.0, 9.0, 7.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69140625, -0.664276123046875, -0.63714599609375, -0.610015869140625, -0.5828857421875, -0.555755615234375, -0.52862548828125, -0.501495361328125, -0.474365234375, -0.447235107421875, -0.42010498046875, -0.392974853515625, -0.3658447265625, -0.338714599609375, -0.31158447265625, -0.284454345703125, -0.25732421875, -0.230194091796875, -0.20306396484375, -0.175933837890625, -0.1488037109375, -0.121673583984375, -0.09454345703125, -0.067413330078125, -0.040283203125, -0.013153076171875, 0.01397705078125, 0.041107177734375, 0.0682373046875, 0.095367431640625, 0.12249755859375, 0.149627685546875, 0.1767578125, 0.203887939453125, 0.23101806640625, 0.258148193359375, 0.2852783203125, 0.312408447265625, 0.33953857421875, 0.366668701171875, 0.393798828125, 0.420928955078125, 0.44805908203125, 0.475189208984375, 0.5023193359375, 0.529449462890625, 0.55657958984375, 0.583709716796875, 0.61083984375, 0.637969970703125, 0.66510009765625, 0.692230224609375, 0.7193603515625, 0.746490478515625, 0.77362060546875, 0.800750732421875, 0.827880859375, 0.855010986328125, 0.88214111328125, 0.909271240234375, 0.9364013671875, 0.963531494140625, 0.99066162109375, 1.017791748046875, 1.044921875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 4.0, 10.0, 12.0, 19.0, 26.0, 62.0, 90.0, 146.0, 150.0, 170.0, 122.0, 72.0, 39.0, 26.0, 20.0, 10.0, 8.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.930845260620117, -3.7311618328094482, -3.5314786434173584, -3.3317952156066895, -3.1321120262145996, -2.9324285984039307, -2.7327451705932617, -2.533061981201172, -2.333378553390503, -2.133695125579834, -1.9340119361877441, -1.7343285083770752, -1.5346451997756958, -1.3349618911743164, -1.1352784633636475, -0.9355951547622681, -0.7359118461608887, -0.5362285375595093, -0.3365451693534851, -0.13686180114746094, 0.06282150745391846, 0.26250481605529785, 0.4621882438659668, 0.6618715524673462, 0.8615548610687256, 1.061238169670105, 1.2609214782714844, 1.4606049060821533, 1.6602882146835327, 1.859971523284912, 2.059654951095581, 2.25933837890625, 2.45902156829834, 2.658704996109009, 2.8583881855010986, 3.0580716133117676, 3.2577548027038574, 3.4574382305145264, 3.6571216583251953, 3.856804847717285, 4.056488037109375, 4.256171226501465, 4.455854892730713, 4.655538082122803, 4.855221271514893, 5.054904937744141, 5.2545881271362305, 5.45427131652832, 5.653954982757568, 5.853638172149658, 6.053321838378906, 6.253005027770996, 6.452688217163086, 6.652371406555176, 6.852055072784424, 7.051738262176514, 7.251421928405762, 7.451105117797852, 7.6507887840271, 7.8504719734191895, 8.050155639648438, 8.249838829040527, 8.449522018432617, 8.649205207824707, 8.848888397216797]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 1.0, 4.0, 7.0, 8.0, 17.0, 19.0, 21.0, 27.0, 35.0, 46.0, 61.0, 53.0, 83.0, 75.0, 84.0, 90.0, 72.0, 69.0, 63.0, 45.0, 34.0, 19.0, 19.0, 17.0, 12.0, 7.0, 4.0, 9.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.112256050109863, -5.954841136932373, -5.797426223754883, -5.640011787414551, -5.4825968742370605, -5.32518196105957, -5.16776704788208, -5.01035213470459, -4.852937698364258, -4.695522785186768, -4.538107872009277, -4.380693435668945, -4.223278522491455, -4.065863609313965, -3.9084486961364746, -3.7510337829589844, -3.593618869781494, -3.436203956604004, -3.2787892818450928, -3.1213743686676025, -2.9639596939086914, -2.806544780731201, -2.649129867553711, -2.4917149543762207, -2.3343002796173096, -2.1768853664398193, -2.019470691680908, -1.862055778503418, -1.7046409845352173, -1.5472261905670166, -1.3898112773895264, -1.2323964834213257, -1.074981927871704, -0.9175671339035034, -0.760152280330658, -0.6027374267578125, -0.4453226327896118, -0.28790783882141113, -0.13049298524856567, 0.026921868324279785, 0.18433666229248047, 0.34175148606300354, 0.4991663098335266, 0.6565811634063721, 0.8139959573745728, 0.9714107513427734, 1.1288256645202637, 1.2862404584884644, 1.443655252456665, 1.6010700464248657, 1.7584848403930664, 1.9158997535705566, 2.073314666748047, 2.230729341506958, 2.3881442546844482, 2.5455589294433594, 2.7029738426208496, 2.86038875579834, 3.017803430557251, 3.175218343734741, 3.3326330184936523, 3.4900479316711426, 3.647462844848633, 3.804877758026123, 3.962292432785034]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 6.0, 8.0, 6.0, 10.0, 15.0, 26.0, 64.0, 102.0, 225.0, 577.0, 1541.0, 5447.0, 25357.0, 174129.0, 660184.0, 151080.0, 22607.0, 4890.0, 1379.0, 494.0, 205.0, 89.0, 52.0, 28.0, 16.0, 12.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0068359375, -0.9748382568359375, -0.942840576171875, -0.9108428955078125, -0.87884521484375, -0.8468475341796875, -0.814849853515625, -0.7828521728515625, -0.7508544921875, -0.7188568115234375, -0.686859130859375, -0.6548614501953125, -0.62286376953125, -0.5908660888671875, -0.558868408203125, -0.5268707275390625, -0.494873046875, -0.4628753662109375, -0.430877685546875, -0.3988800048828125, -0.36688232421875, -0.3348846435546875, -0.302886962890625, -0.2708892822265625, -0.2388916015625, -0.2068939208984375, -0.174896240234375, -0.1428985595703125, -0.11090087890625, -0.0789031982421875, -0.046905517578125, -0.0149078369140625, 0.01708984375, 0.0490875244140625, 0.081085205078125, 0.1130828857421875, 0.14508056640625, 0.1770782470703125, 0.209075927734375, 0.2410736083984375, 0.2730712890625, 0.3050689697265625, 0.337066650390625, 0.3690643310546875, 0.40106201171875, 0.4330596923828125, 0.465057373046875, 0.4970550537109375, 0.529052734375, 0.5610504150390625, 0.593048095703125, 0.6250457763671875, 0.65704345703125, 0.6890411376953125, 0.721038818359375, 0.7530364990234375, 0.7850341796875, 0.8170318603515625, 0.849029541015625, 0.8810272216796875, 0.91302490234375, 0.9450225830078125, 0.977020263671875, 1.0090179443359375, 1.041015625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 10.0, 13.0, 18.0, 26.0, 22.0, 24.0, 40.0, 40.0, 51.0, 49.0, 60.0, 65.0, 56.0, 54.0, 57.0, 55.0, 45.0, 50.0, 44.0, 32.0, 51.0, 27.0, 24.0, 23.0, 21.0, 9.0, 10.0, 7.0, 8.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.54833984375, -0.5329666137695312, -0.5175933837890625, -0.5022201538085938, -0.486846923828125, -0.47147369384765625, -0.4561004638671875, -0.44072723388671875, -0.42535400390625, -0.40998077392578125, -0.3946075439453125, -0.37923431396484375, -0.363861083984375, -0.34848785400390625, -0.3331146240234375, -0.31774139404296875, -0.3023681640625, -0.28699493408203125, -0.2716217041015625, -0.25624847412109375, -0.240875244140625, -0.22550201416015625, -0.2101287841796875, -0.19475555419921875, -0.17938232421875, -0.16400909423828125, -0.1486358642578125, -0.13326263427734375, -0.117889404296875, -0.10251617431640625, -0.0871429443359375, -0.07176971435546875, -0.056396484375, -0.04102325439453125, -0.0256500244140625, -0.01027679443359375, 0.005096435546875, 0.02046966552734375, 0.0358428955078125, 0.05121612548828125, 0.06658935546875, 0.08196258544921875, 0.0973358154296875, 0.11270904541015625, 0.128082275390625, 0.14345550537109375, 0.1588287353515625, 0.17420196533203125, 0.1895751953125, 0.20494842529296875, 0.2203216552734375, 0.23569488525390625, 0.251068115234375, 0.26644134521484375, 0.2818145751953125, 0.29718780517578125, 0.31256103515625, 0.32793426513671875, 0.3433074951171875, 0.35868072509765625, 0.374053955078125, 0.38942718505859375, 0.4048004150390625, 0.42017364501953125, 0.435546875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 7.0, 5.0, 6.0, 7.0, 9.0, 5.0, 15.0, 20.0, 20.0, 31.0, 40.0, 46.0, 67.0, 99.0, 126.0, 202.0, 269.0, 415.0, 737.0, 1402.0, 3131.0, 9892.0, 41539.0, 274627.0, 627804.0, 65882.0, 13835.0, 4257.0, 1742.0, 857.0, 462.0, 316.0, 195.0, 123.0, 105.0, 50.0, 53.0, 37.0, 27.0, 20.0, 16.0, 17.0, 13.0, 12.0, 9.0, 3.0, 2.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.92822265625, -0.90020751953125, -0.8721923828125, -0.84417724609375, -0.816162109375, -0.78814697265625, -0.7601318359375, -0.73211669921875, -0.7041015625, -0.67608642578125, -0.6480712890625, -0.62005615234375, -0.592041015625, -0.56402587890625, -0.5360107421875, -0.50799560546875, -0.47998046875, -0.45196533203125, -0.4239501953125, -0.39593505859375, -0.367919921875, -0.33990478515625, -0.3118896484375, -0.28387451171875, -0.255859375, -0.22784423828125, -0.1998291015625, -0.17181396484375, -0.143798828125, -0.11578369140625, -0.0877685546875, -0.05975341796875, -0.03173828125, -0.00372314453125, 0.0242919921875, 0.05230712890625, 0.080322265625, 0.10833740234375, 0.1363525390625, 0.16436767578125, 0.1923828125, 0.22039794921875, 0.2484130859375, 0.27642822265625, 0.304443359375, 0.33245849609375, 0.3604736328125, 0.38848876953125, 0.41650390625, 0.44451904296875, 0.4725341796875, 0.50054931640625, 0.528564453125, 0.55657958984375, 0.5845947265625, 0.61260986328125, 0.640625, 0.66864013671875, 0.6966552734375, 0.72467041015625, 0.752685546875, 0.78070068359375, 0.8087158203125, 0.83673095703125, 0.86474609375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 1.0, 4.0, 4.0, 13.0, 10.0, 15.0, 15.0, 17.0, 22.0, 29.0, 26.0, 43.0, 33.0, 59.0, 54.0, 61.0, 72.0, 70.0, 66.0, 61.0, 40.0, 43.0, 38.0, 41.0, 25.0, 30.0, 29.0, 18.0, 19.0, 5.0, 7.0, 10.0, 10.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3759765625, -1.3220062255859375, -1.268035888671875, -1.2140655517578125, -1.16009521484375, -1.1061248779296875, -1.052154541015625, -0.9981842041015625, -0.9442138671875, -0.8902435302734375, -0.836273193359375, -0.7823028564453125, -0.72833251953125, -0.6743621826171875, -0.620391845703125, -0.5664215087890625, -0.512451171875, -0.4584808349609375, -0.404510498046875, -0.3505401611328125, -0.29656982421875, -0.2425994873046875, -0.188629150390625, -0.1346588134765625, -0.0806884765625, -0.0267181396484375, 0.027252197265625, 0.0812225341796875, 0.13519287109375, 0.1891632080078125, 0.243133544921875, 0.2971038818359375, 0.35107421875, 0.4050445556640625, 0.459014892578125, 0.5129852294921875, 0.56695556640625, 0.6209259033203125, 0.674896240234375, 0.7288665771484375, 0.7828369140625, 0.8368072509765625, 0.890777587890625, 0.9447479248046875, 0.99871826171875, 1.0526885986328125, 1.106658935546875, 1.1606292724609375, 1.214599609375, 1.2685699462890625, 1.322540283203125, 1.3765106201171875, 1.43048095703125, 1.4844512939453125, 1.538421630859375, 1.5923919677734375, 1.6463623046875, 1.7003326416015625, 1.754302978515625, 1.8082733154296875, 1.86224365234375, 1.9162139892578125, 1.970184326171875, 2.0241546630859375, 2.078125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 5.0, 5.0, 13.0, 13.0, 12.0, 32.0, 42.0, 67.0, 114.0, 198.0, 386.0, 803.0, 1940.0, 4965.0, 14406.0, 54615.0, 662181.0, 252061.0, 38608.0, 11220.0, 3807.0, 1526.0, 720.0, 361.0, 163.0, 103.0, 75.0, 30.0, 27.0, 21.0, 13.0, 10.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.361572265625, -0.3494720458984375, -0.337371826171875, -0.3252716064453125, -0.31317138671875, -0.3010711669921875, -0.288970947265625, -0.2768707275390625, -0.2647705078125, -0.2526702880859375, -0.240570068359375, -0.2284698486328125, -0.21636962890625, -0.2042694091796875, -0.192169189453125, -0.1800689697265625, -0.16796875, -0.1558685302734375, -0.143768310546875, -0.1316680908203125, -0.11956787109375, -0.1074676513671875, -0.095367431640625, -0.0832672119140625, -0.0711669921875, -0.0590667724609375, -0.046966552734375, -0.0348663330078125, -0.02276611328125, -0.0106658935546875, 0.001434326171875, 0.0135345458984375, 0.025634765625, 0.0377349853515625, 0.049835205078125, 0.0619354248046875, 0.07403564453125, 0.0861358642578125, 0.098236083984375, 0.1103363037109375, 0.1224365234375, 0.1345367431640625, 0.146636962890625, 0.1587371826171875, 0.17083740234375, 0.1829376220703125, 0.195037841796875, 0.2071380615234375, 0.21923828125, 0.2313385009765625, 0.243438720703125, 0.2555389404296875, 0.26763916015625, 0.2797393798828125, 0.291839599609375, 0.3039398193359375, 0.3160400390625, 0.3281402587890625, 0.340240478515625, 0.3523406982421875, 0.36444091796875, 0.3765411376953125, 0.388641357421875, 0.4007415771484375, 0.412841796875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 2.0, 10.0, 9.0, 8.0, 10.0, 18.0, 25.0, 30.0, 56.0, 83.0, 146.0, 147.0, 147.0, 91.0, 68.0, 35.0, 32.0, 24.0, 7.0, 14.0, 3.0, 7.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.751319885253906e-05, -9.409245103597641e-05, -9.067170321941376e-05, -8.72509554028511e-05, -8.383020758628845e-05, -8.04094597697258e-05, -7.698871195316315e-05, -7.35679641366005e-05, -7.014721632003784e-05, -6.672646850347519e-05, -6.330572068691254e-05, -5.9884972870349884e-05, -5.646422505378723e-05, -5.304347723722458e-05, -4.9622729420661926e-05, -4.6201981604099274e-05, -4.278123378753662e-05, -3.936048597097397e-05, -3.5939738154411316e-05, -3.251899033784866e-05, -2.909824252128601e-05, -2.5677494704723358e-05, -2.2256746888160706e-05, -1.8835999071598053e-05, -1.54152512550354e-05, -1.1994503438472748e-05, -8.573755621910095e-06, -5.153007805347443e-06, -1.73225998878479e-06, 1.6884878277778625e-06, 5.109235644340515e-06, 8.529983460903168e-06, 1.195073127746582e-05, 1.5371479094028473e-05, 1.8792226910591125e-05, 2.2212974727153778e-05, 2.563372254371643e-05, 2.9054470360279083e-05, 3.2475218176841736e-05, 3.589596599340439e-05, 3.931671380996704e-05, 4.2737461626529694e-05, 4.6158209443092346e-05, 4.9578957259655e-05, 5.299970507621765e-05, 5.6420452892780304e-05, 5.9841200709342957e-05, 6.326194852590561e-05, 6.668269634246826e-05, 7.010344415903091e-05, 7.352419197559357e-05, 7.694493979215622e-05, 8.036568760871887e-05, 8.378643542528152e-05, 8.720718324184418e-05, 9.062793105840683e-05, 9.404867887496948e-05, 9.746942669153214e-05, 0.00010089017450809479, 0.00010431092232465744, 0.00010773167014122009, 0.00011115241795778275, 0.0001145731657743454, 0.00011799391359090805, 0.0001214146614074707]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 4.0, 5.0, 4.0, 17.0, 25.0, 18.0, 45.0, 91.0, 157.0, 335.0, 684.0, 1711.0, 5207.0, 20536.0, 114336.0, 788014.0, 92194.0, 17499.0, 4711.0, 1561.0, 696.0, 330.0, 153.0, 81.0, 62.0, 32.0, 23.0, 10.0, 8.0, 6.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46240234375, -0.448577880859375, -0.43475341796875, -0.420928955078125, -0.4071044921875, -0.393280029296875, -0.37945556640625, -0.365631103515625, -0.351806640625, -0.337982177734375, -0.32415771484375, -0.310333251953125, -0.2965087890625, -0.282684326171875, -0.26885986328125, -0.255035400390625, -0.2412109375, -0.227386474609375, -0.21356201171875, -0.199737548828125, -0.1859130859375, -0.172088623046875, -0.15826416015625, -0.144439697265625, -0.130615234375, -0.116790771484375, -0.10296630859375, -0.089141845703125, -0.0753173828125, -0.061492919921875, -0.04766845703125, -0.033843994140625, -0.02001953125, -0.006195068359375, 0.00762939453125, 0.021453857421875, 0.0352783203125, 0.049102783203125, 0.06292724609375, 0.076751708984375, 0.090576171875, 0.104400634765625, 0.11822509765625, 0.132049560546875, 0.1458740234375, 0.159698486328125, 0.17352294921875, 0.187347412109375, 0.201171875, 0.214996337890625, 0.22882080078125, 0.242645263671875, 0.2564697265625, 0.270294189453125, 0.28411865234375, 0.297943115234375, 0.311767578125, 0.325592041015625, 0.33941650390625, 0.353240966796875, 0.3670654296875, 0.380889892578125, 0.39471435546875, 0.408538818359375, 0.42236328125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 6.0, 4.0, 6.0, 5.0, 18.0, 17.0, 24.0, 21.0, 46.0, 54.0, 84.0, 129.0, 122.0, 139.0, 86.0, 68.0, 43.0, 23.0, 19.0, 18.0, 26.0, 9.0, 6.0, 5.0, 5.0, 6.0, 4.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.353759765625, -0.34255218505859375, -0.3313446044921875, -0.32013702392578125, -0.308929443359375, -0.29772186279296875, -0.2865142822265625, -0.27530670166015625, -0.26409912109375, -0.25289154052734375, -0.2416839599609375, -0.23047637939453125, -0.219268798828125, -0.20806121826171875, -0.1968536376953125, -0.18564605712890625, -0.1744384765625, -0.16323089599609375, -0.1520233154296875, -0.14081573486328125, -0.129608154296875, -0.11840057373046875, -0.1071929931640625, -0.09598541259765625, -0.08477783203125, -0.07357025146484375, -0.0623626708984375, -0.05115509033203125, -0.039947509765625, -0.02873992919921875, -0.0175323486328125, -0.00632476806640625, 0.0048828125, 0.01609039306640625, 0.0272979736328125, 0.03850555419921875, 0.049713134765625, 0.06092071533203125, 0.0721282958984375, 0.08333587646484375, 0.09454345703125, 0.10575103759765625, 0.1169586181640625, 0.12816619873046875, 0.139373779296875, 0.15058135986328125, 0.1617889404296875, 0.17299652099609375, 0.1842041015625, 0.19541168212890625, 0.2066192626953125, 0.21782684326171875, 0.229034423828125, 0.24024200439453125, 0.2514495849609375, 0.26265716552734375, 0.27386474609375, 0.28507232666015625, 0.2962799072265625, 0.30748748779296875, 0.318695068359375, 0.32990264892578125, 0.3411102294921875, 0.35231781005859375, 0.363525390625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 7.0, 16.0, 39.0, 72.0, 113.0, 314.0, 214.0, 110.0, 47.0, 24.0, 16.0, 9.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.36539363861084, -8.085188865661621, -7.804985046386719, -7.5247802734375, -7.2445759773254395, -6.964371681213379, -6.68416690826416, -6.4039626121521, -6.123758316040039, -5.8435540199279785, -5.563349723815918, -5.283144950866699, -5.002940654754639, -4.722736358642578, -4.442531585693359, -4.162327289581299, -3.8821229934692383, -3.6019186973571777, -3.321714162826538, -3.0415096282958984, -2.761305332183838, -2.4811010360717773, -2.2008965015411377, -1.9206920862197876, -1.6404876708984375, -1.3602832555770874, -1.0800788402557373, -0.7998744249343872, -0.5196700096130371, -0.239465594291687, 0.040738821029663086, 0.3209432363510132, 0.6011476516723633, 0.8813520669937134, 1.1615564823150635, 1.4417608976364136, 1.7219653129577637, 2.002169609069824, 2.282374143600464, 2.5625786781311035, 2.842782974243164, 3.1229872703552246, 3.4031918048858643, 3.683396339416504, 3.9636006355285645, 4.243804931640625, 4.524009704589844, 4.804214000701904, 5.084418296813965, 5.364622592926025, 5.644826889038086, 5.925031661987305, 6.205235958099365, 6.485440254211426, 6.7656450271606445, 7.045849323272705, 7.326053619384766, 7.606257915496826, 7.886462211608887, 8.166666984558105, 8.446870803833008, 8.727075576782227, 9.007280349731445, 9.287484169006348, 9.567688941955566]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 4.0, 4.0, 6.0, 8.0, 7.0, 4.0, 7.0, 5.0, 11.0, 12.0, 13.0, 11.0, 19.0, 22.0, 20.0, 19.0, 11.0, 29.0, 38.0, 33.0, 26.0, 52.0, 59.0, 61.0, 83.0, 64.0, 51.0, 37.0, 27.0, 34.0, 28.0, 23.0, 28.0, 18.0, 20.0, 19.0, 12.0, 15.0, 17.0, 4.0, 3.0, 9.0, 5.0, 4.0, 5.0, 4.0, 3.0, 0.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0], "bins": [-4.5683135986328125, -4.434481143951416, -4.300649166107178, -4.166816711425781, -4.032984256744385, -3.8991520404815674, -3.76531982421875, -3.6314873695373535, -3.497655153274536, -3.3638229370117188, -3.2299904823303223, -3.096158266067505, -2.9623260498046875, -2.828493595123291, -2.6946613788604736, -2.5608291625976562, -2.4269967079162598, -2.2931644916534424, -2.159332036972046, -2.0254998207092285, -1.8916674852371216, -1.7578351497650146, -1.6240029335021973, -1.4901705980300903, -1.3563382625579834, -1.2225059270858765, -1.0886735916137695, -0.9548413753509521, -0.8210090398788452, -0.6871767044067383, -0.5533444285392761, -0.41951215267181396, -0.28567981719970703, -0.15184751152992249, -0.01801520586013794, 0.1158170998096466, 0.24964940547943115, 0.3834817409515381, 0.5173140168190002, 0.6511462926864624, 0.7849786281585693, 0.9188109636306763, 1.0526432991027832, 1.1864755153656006, 1.3203078508377075, 1.4541401863098145, 1.5879724025726318, 1.7218047380447388, 1.8556370735168457, 1.9894694089889526, 2.1233017444610596, 2.257133960723877, 2.3909664154052734, 2.524798631668091, 2.658630847930908, 2.7924633026123047, 2.926295518875122, 3.0601277351379395, 3.193960189819336, 3.3277924060821533, 3.4616246223449707, 3.595457077026367, 3.7292892932891846, 3.863121509552002, 3.9969539642333984]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 7.0, 8.0, 15.0, 24.0, 34.0, 50.0, 81.0, 124.0, 225.0, 358.0, 713.0, 1527.0, 4907.0, 32114.0, 1100926.0, 2935894.0, 103257.0, 9543.0, 2432.0, 930.0, 457.0, 264.0, 152.0, 93.0, 65.0, 29.0, 15.0, 10.0, 9.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9404296875, -0.9102706909179688, -0.8801116943359375, -0.8499526977539062, -0.819793701171875, -0.7896347045898438, -0.7594757080078125, -0.7293167114257812, -0.69915771484375, -0.6689987182617188, -0.6388397216796875, -0.6086807250976562, -0.578521728515625, -0.5483627319335938, -0.5182037353515625, -0.48804473876953125, -0.4578857421875, -0.42772674560546875, -0.3975677490234375, -0.36740875244140625, -0.337249755859375, -0.30709075927734375, -0.2769317626953125, -0.24677276611328125, -0.21661376953125, -0.18645477294921875, -0.1562957763671875, -0.12613677978515625, -0.095977783203125, -0.06581878662109375, -0.0356597900390625, -0.00550079345703125, 0.024658203125, 0.05481719970703125, 0.0849761962890625, 0.11513519287109375, 0.145294189453125, 0.17545318603515625, 0.2056121826171875, 0.23577117919921875, 0.26593017578125, 0.29608917236328125, 0.3262481689453125, 0.35640716552734375, 0.386566162109375, 0.41672515869140625, 0.4468841552734375, 0.47704315185546875, 0.5072021484375, 0.5373611450195312, 0.5675201416015625, 0.5976791381835938, 0.627838134765625, 0.6579971313476562, 0.6881561279296875, 0.7183151245117188, 0.74847412109375, 0.7786331176757812, 0.8087921142578125, 0.8389511108398438, 0.869110107421875, 0.8992691040039062, 0.9294281005859375, 0.9595870971679688, 0.98974609375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 8.0, 7.0, 7.0, 11.0, 12.0, 29.0, 24.0, 35.0, 28.0, 52.0, 50.0, 63.0, 61.0, 57.0, 62.0, 57.0, 50.0, 46.0, 36.0, 41.0, 59.0, 39.0, 37.0, 30.0, 25.0, 15.0, 10.0, 20.0, 11.0, 7.0, 7.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5546875, -0.5394058227539062, -0.5241241455078125, -0.5088424682617188, -0.493560791015625, -0.47827911376953125, -0.4629974365234375, -0.44771575927734375, -0.43243408203125, -0.41715240478515625, -0.4018707275390625, -0.38658905029296875, -0.371307373046875, -0.35602569580078125, -0.3407440185546875, -0.32546234130859375, -0.3101806640625, -0.29489898681640625, -0.2796173095703125, -0.26433563232421875, -0.249053955078125, -0.23377227783203125, -0.2184906005859375, -0.20320892333984375, -0.18792724609375, -0.17264556884765625, -0.1573638916015625, -0.14208221435546875, -0.126800537109375, -0.11151885986328125, -0.0962371826171875, -0.08095550537109375, -0.065673828125, -0.05039215087890625, -0.0351104736328125, -0.01982879638671875, -0.004547119140625, 0.01073455810546875, 0.0260162353515625, 0.04129791259765625, 0.05657958984375, 0.07186126708984375, 0.0871429443359375, 0.10242462158203125, 0.117706298828125, 0.13298797607421875, 0.1482696533203125, 0.16355133056640625, 0.1788330078125, 0.19411468505859375, 0.2093963623046875, 0.22467803955078125, 0.239959716796875, 0.25524139404296875, 0.2705230712890625, 0.28580474853515625, 0.30108642578125, 0.31636810302734375, 0.3316497802734375, 0.34693145751953125, 0.362213134765625, 0.37749481201171875, 0.3927764892578125, 0.40805816650390625, 0.42333984375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 6.0, 8.0, 11.0, 21.0, 42.0, 87.0, 173.0, 301.0, 649.0, 2000.0, 56216.0, 4120245.0, 12409.0, 1212.0, 446.0, 228.0, 100.0, 64.0, 31.0, 17.0, 10.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.439453125, -3.3448486328125, -3.250244140625, -3.1556396484375, -3.06103515625, -2.9664306640625, -2.871826171875, -2.7772216796875, -2.6826171875, -2.5880126953125, -2.493408203125, -2.3988037109375, -2.30419921875, -2.2095947265625, -2.114990234375, -2.0203857421875, -1.92578125, -1.8311767578125, -1.736572265625, -1.6419677734375, -1.54736328125, -1.4527587890625, -1.358154296875, -1.2635498046875, -1.1689453125, -1.0743408203125, -0.979736328125, -0.8851318359375, -0.79052734375, -0.6959228515625, -0.601318359375, -0.5067138671875, -0.412109375, -0.3175048828125, -0.222900390625, -0.1282958984375, -0.03369140625, 0.0609130859375, 0.155517578125, 0.2501220703125, 0.3447265625, 0.4393310546875, 0.533935546875, 0.6285400390625, 0.72314453125, 0.8177490234375, 0.912353515625, 1.0069580078125, 1.1015625, 1.1961669921875, 1.290771484375, 1.3853759765625, 1.47998046875, 1.5745849609375, 1.669189453125, 1.7637939453125, 1.8583984375, 1.9530029296875, 2.047607421875, 2.1422119140625, 2.23681640625, 2.3314208984375, 2.426025390625, 2.5206298828125, 2.615234375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 9.0, 15.0, 30.0, 77.0, 183.0, 639.0, 1628.0, 1060.0, 295.0, 77.0, 41.0, 15.0, 7.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6484375, -2.5833892822265625, -2.518341064453125, -2.4532928466796875, -2.38824462890625, -2.3231964111328125, -2.258148193359375, -2.1930999755859375, -2.1280517578125, -2.0630035400390625, -1.997955322265625, -1.9329071044921875, -1.86785888671875, -1.8028106689453125, -1.737762451171875, -1.6727142333984375, -1.607666015625, -1.5426177978515625, -1.477569580078125, -1.4125213623046875, -1.34747314453125, -1.2824249267578125, -1.217376708984375, -1.1523284912109375, -1.0872802734375, -1.0222320556640625, -0.957183837890625, -0.8921356201171875, -0.82708740234375, -0.7620391845703125, -0.696990966796875, -0.6319427490234375, -0.56689453125, -0.5018463134765625, -0.436798095703125, -0.3717498779296875, -0.30670166015625, -0.2416534423828125, -0.176605224609375, -0.1115570068359375, -0.0465087890625, 0.0185394287109375, 0.083587646484375, 0.1486358642578125, 0.21368408203125, 0.2787322998046875, 0.343780517578125, 0.4088287353515625, 0.473876953125, 0.5389251708984375, 0.603973388671875, 0.6690216064453125, 0.73406982421875, 0.7991180419921875, 0.864166259765625, 0.9292144775390625, 0.9942626953125, 1.0593109130859375, 1.124359130859375, 1.1894073486328125, 1.25445556640625, 1.3195037841796875, 1.384552001953125, 1.4496002197265625, 1.5146484375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 13.0, 9.0, 19.0, 29.0, 56.0, 115.0, 198.0, 264.0, 175.0, 71.0, 26.0, 10.0, 9.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-20.52092933654785, -20.139076232910156, -19.75722312927246, -19.375370025634766, -18.99351692199707, -18.611663818359375, -18.229808807373047, -17.847957611083984, -17.466102600097656, -17.08424949645996, -16.702396392822266, -16.32054328918457, -15.938689231872559, -15.556836128234863, -15.174983024597168, -14.793129920959473, -14.411277770996094, -14.029424667358398, -13.647571563720703, -13.265718460083008, -12.883864402770996, -12.5020112991333, -12.120158195495605, -11.73830509185791, -11.356451034545898, -10.974597930908203, -10.592744827270508, -10.210891723632812, -9.8290376663208, -9.447184562683105, -9.06533145904541, -8.683478355407715, -8.301624298095703, -7.919771194458008, -7.537917613983154, -7.156064510345459, -6.774211406707764, -6.39235782623291, -6.010504722595215, -5.6286516189575195, -5.246798515319824, -4.864945411682129, -4.483091831207275, -4.10123872756958, -3.7193856239318848, -3.3375322818756104, -2.955678939819336, -2.5738258361816406, -2.1919727325439453, -1.8101195096969604, -1.4282662868499756, -1.0464129447937012, -0.6645597219467163, -0.28270649909973145, 0.09914684295654297, 0.4809999465942383, 0.8628532886505127, 1.2447065114974976, 1.6265597343444824, 2.008413076400757, 2.3902664184570312, 2.7721195220947266, 3.153972864151001, 3.5358259677886963, 3.9176793098449707]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 5.0, 0.0, 7.0, 8.0, 9.0, 7.0, 14.0, 17.0, 17.0, 22.0, 25.0, 28.0, 20.0, 43.0, 41.0, 43.0, 39.0, 50.0, 46.0, 39.0, 48.0, 58.0, 42.0, 37.0, 36.0, 39.0, 35.0, 32.0, 24.0, 43.0, 26.0, 20.0, 13.0, 14.0, 14.0, 9.0, 7.0, 6.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.515741348266602, -4.367719650268555, -4.219698429107666, -4.071676731109619, -3.9236552715301514, -3.7756338119506836, -3.6276121139526367, -3.479590654373169, -3.331569194793701, -3.1835477352142334, -3.0355262756347656, -2.8875045776367188, -2.739483118057251, -2.591461658477783, -2.4434399604797363, -2.2954185009002686, -2.147397041320801, -1.999375581741333, -1.8513540029525757, -1.7033324241638184, -1.5553109645843506, -1.4072895050048828, -1.2592679262161255, -1.1112463474273682, -0.9632248878479004, -0.8152033686637878, -0.6671818494796753, -0.5191603302955627, -0.3711388111114502, -0.22311729192733765, -0.0750957727432251, 0.07292580604553223, 0.2209467887878418, 0.36896830797195435, 0.5169898271560669, 0.6650113463401794, 0.813032865524292, 0.9610543847084045, 1.109075903892517, 1.2570974826812744, 1.4051189422607422, 1.55314040184021, 1.7011619806289673, 1.8491835594177246, 1.9972050189971924, 2.14522647857666, 2.293248176574707, 2.441269636154175, 2.5892910957336426, 2.7373125553131104, 2.885334014892578, 3.033355712890625, 3.1813771724700928, 3.3293986320495605, 3.4774203300476074, 3.625441789627075, 3.773463249206543, 3.9214847087860107, 4.0695061683654785, 4.217527866363525, 4.365549087524414, 4.513570785522461, 4.661592483520508, 4.809614181518555, 4.957635402679443]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 10.0, 5.0, 16.0, 17.0, 26.0, 49.0, 67.0, 114.0, 219.0, 397.0, 761.0, 1440.0, 3102.0, 6902.0, 16414.0, 44941.0, 140110.0, 413536.0, 285258.0, 85304.0, 28873.0, 11473.0, 4803.0, 2292.0, 1118.0, 577.0, 300.0, 167.0, 111.0, 51.0, 34.0, 21.0, 20.0, 10.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.5869140625, -0.5690155029296875, -0.551116943359375, -0.5332183837890625, -0.51531982421875, -0.4974212646484375, -0.479522705078125, -0.4616241455078125, -0.4437255859375, -0.4258270263671875, -0.407928466796875, -0.3900299072265625, -0.37213134765625, -0.3542327880859375, -0.336334228515625, -0.3184356689453125, -0.300537109375, -0.2826385498046875, -0.264739990234375, -0.2468414306640625, -0.22894287109375, -0.2110443115234375, -0.193145751953125, -0.1752471923828125, -0.1573486328125, -0.1394500732421875, -0.121551513671875, -0.1036529541015625, -0.08575439453125, -0.0678558349609375, -0.049957275390625, -0.0320587158203125, -0.01416015625, 0.0037384033203125, 0.021636962890625, 0.0395355224609375, 0.05743408203125, 0.0753326416015625, 0.093231201171875, 0.1111297607421875, 0.1290283203125, 0.1469268798828125, 0.164825439453125, 0.1827239990234375, 0.20062255859375, 0.2185211181640625, 0.236419677734375, 0.2543182373046875, 0.272216796875, 0.2901153564453125, 0.308013916015625, 0.3259124755859375, 0.34381103515625, 0.3617095947265625, 0.379608154296875, 0.3975067138671875, 0.4154052734375, 0.4333038330078125, 0.451202392578125, 0.4691009521484375, 0.48699951171875, 0.5048980712890625, 0.522796630859375, 0.5406951904296875, 0.55859375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 11.0, 7.0, 15.0, 19.0, 22.0, 19.0, 22.0, 24.0, 39.0, 40.0, 33.0, 48.0, 48.0, 49.0, 33.0, 53.0, 52.0, 56.0, 38.0, 54.0, 42.0, 33.0, 42.0, 37.0, 27.0, 26.0, 21.0, 14.0, 13.0, 14.0, 9.0, 11.0, 7.0, 9.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.52392578125, -0.5098114013671875, -0.495697021484375, -0.4815826416015625, -0.46746826171875, -0.4533538818359375, -0.439239501953125, -0.4251251220703125, -0.4110107421875, -0.3968963623046875, -0.382781982421875, -0.3686676025390625, -0.35455322265625, -0.3404388427734375, -0.326324462890625, -0.3122100830078125, -0.298095703125, -0.2839813232421875, -0.269866943359375, -0.2557525634765625, -0.24163818359375, -0.2275238037109375, -0.213409423828125, -0.1992950439453125, -0.1851806640625, -0.1710662841796875, -0.156951904296875, -0.1428375244140625, -0.12872314453125, -0.1146087646484375, -0.100494384765625, -0.0863800048828125, -0.072265625, -0.0581512451171875, -0.044036865234375, -0.0299224853515625, -0.01580810546875, -0.0016937255859375, 0.012420654296875, 0.0265350341796875, 0.0406494140625, 0.0547637939453125, 0.068878173828125, 0.0829925537109375, 0.09710693359375, 0.1112213134765625, 0.125335693359375, 0.1394500732421875, 0.153564453125, 0.1676788330078125, 0.181793212890625, 0.1959075927734375, 0.21002197265625, 0.2241363525390625, 0.238250732421875, 0.2523651123046875, 0.2664794921875, 0.2805938720703125, 0.294708251953125, 0.3088226318359375, 0.32293701171875, 0.3370513916015625, 0.351165771484375, 0.3652801513671875, 0.37939453125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 7.0, 7.0, 18.0, 11.0, 23.0, 32.0, 46.0, 72.0, 76.0, 128.0, 188.0, 303.0, 475.0, 837.0, 1796.0, 6161.0, 39020.0, 718239.0, 251455.0, 22051.0, 4274.0, 1395.0, 679.0, 421.0, 245.0, 174.0, 129.0, 87.0, 56.0, 42.0, 31.0, 21.0, 15.0, 9.0, 10.0, 4.0, 9.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3125, -1.27374267578125, -1.2349853515625, -1.19622802734375, -1.157470703125, -1.11871337890625, -1.0799560546875, -1.04119873046875, -1.00244140625, -0.96368408203125, -0.9249267578125, -0.88616943359375, -0.847412109375, -0.80865478515625, -0.7698974609375, -0.73114013671875, -0.6923828125, -0.65362548828125, -0.6148681640625, -0.57611083984375, -0.537353515625, -0.49859619140625, -0.4598388671875, -0.42108154296875, -0.38232421875, -0.34356689453125, -0.3048095703125, -0.26605224609375, -0.227294921875, -0.18853759765625, -0.1497802734375, -0.11102294921875, -0.072265625, -0.03350830078125, 0.0052490234375, 0.04400634765625, 0.082763671875, 0.12152099609375, 0.1602783203125, 0.19903564453125, 0.23779296875, 0.27655029296875, 0.3153076171875, 0.35406494140625, 0.392822265625, 0.43157958984375, 0.4703369140625, 0.50909423828125, 0.5478515625, 0.58660888671875, 0.6253662109375, 0.66412353515625, 0.702880859375, 0.74163818359375, 0.7803955078125, 0.81915283203125, 0.85791015625, 0.89666748046875, 0.9354248046875, 0.97418212890625, 1.012939453125, 1.05169677734375, 1.0904541015625, 1.12921142578125, 1.16796875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 2.0, 6.0, 9.0, 12.0, 9.0, 14.0, 12.0, 16.0, 16.0, 20.0, 33.0, 24.0, 30.0, 35.0, 53.0, 47.0, 54.0, 58.0, 43.0, 70.0, 65.0, 44.0, 50.0, 42.0, 40.0, 26.0, 25.0, 32.0, 19.0, 17.0, 12.0, 12.0, 10.0, 9.0, 10.0, 5.0, 4.0, 3.0, 8.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5625, -1.5084228515625, -1.454345703125, -1.4002685546875, -1.34619140625, -1.2921142578125, -1.238037109375, -1.1839599609375, -1.1298828125, -1.0758056640625, -1.021728515625, -0.9676513671875, -0.91357421875, -0.8594970703125, -0.805419921875, -0.7513427734375, -0.697265625, -0.6431884765625, -0.589111328125, -0.5350341796875, -0.48095703125, -0.4268798828125, -0.372802734375, -0.3187255859375, -0.2646484375, -0.2105712890625, -0.156494140625, -0.1024169921875, -0.04833984375, 0.0057373046875, 0.059814453125, 0.1138916015625, 0.16796875, 0.2220458984375, 0.276123046875, 0.3302001953125, 0.38427734375, 0.4383544921875, 0.492431640625, 0.5465087890625, 0.6005859375, 0.6546630859375, 0.708740234375, 0.7628173828125, 0.81689453125, 0.8709716796875, 0.925048828125, 0.9791259765625, 1.033203125, 1.0872802734375, 1.141357421875, 1.1954345703125, 1.24951171875, 1.3035888671875, 1.357666015625, 1.4117431640625, 1.4658203125, 1.5198974609375, 1.573974609375, 1.6280517578125, 1.68212890625, 1.7362060546875, 1.790283203125, 1.8443603515625, 1.8984375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 5.0, 5.0, 7.0, 7.0, 2.0, 14.0, 22.0, 38.0, 51.0, 84.0, 154.0, 305.0, 787.0, 2486.0, 12566.0, 177544.0, 826264.0, 22394.0, 3909.0, 1073.0, 365.0, 180.0, 98.0, 62.0, 36.0, 25.0, 12.0, 17.0, 13.0, 4.0, 8.0, 1.0, 4.0, 3.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6943359375, -0.6727371215820312, -0.6511383056640625, -0.6295394897460938, -0.607940673828125, -0.5863418579101562, -0.5647430419921875, -0.5431442260742188, -0.52154541015625, -0.49994659423828125, -0.4783477783203125, -0.45674896240234375, -0.435150146484375, -0.41355133056640625, -0.3919525146484375, -0.37035369873046875, -0.3487548828125, -0.32715606689453125, -0.3055572509765625, -0.28395843505859375, -0.262359619140625, -0.24076080322265625, -0.2191619873046875, -0.19756317138671875, -0.17596435546875, -0.15436553955078125, -0.1327667236328125, -0.11116790771484375, -0.089569091796875, -0.06797027587890625, -0.0463714599609375, -0.02477264404296875, -0.003173828125, 0.01842498779296875, 0.0400238037109375, 0.06162261962890625, 0.083221435546875, 0.10482025146484375, 0.1264190673828125, 0.14801788330078125, 0.16961669921875, 0.19121551513671875, 0.2128143310546875, 0.23441314697265625, 0.256011962890625, 0.27761077880859375, 0.2992095947265625, 0.32080841064453125, 0.3424072265625, 0.36400604248046875, 0.3856048583984375, 0.40720367431640625, 0.428802490234375, 0.45040130615234375, 0.4720001220703125, 0.49359893798828125, 0.51519775390625, 0.5367965698242188, 0.5583953857421875, 0.5799942016601562, 0.601593017578125, 0.6231918334960938, 0.6447906494140625, 0.6663894653320312, 0.68798828125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 9.0, 8.0, 10.0, 12.0, 23.0, 29.0, 77.0, 149.0, 210.0, 186.0, 91.0, 44.0, 36.0, 24.0, 14.0, 9.0, 7.0, 6.0, 6.0, 2.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00014162063598632812, -0.00013650953769683838, -0.00013139843940734863, -0.0001262873411178589, -0.00012117624282836914, -0.0001160651445388794, -0.00011095404624938965, -0.0001058429479598999, -0.00010073184967041016, -9.562075138092041e-05, -9.050965309143066e-05, -8.539855480194092e-05, -8.028745651245117e-05, -7.517635822296143e-05, -7.006525993347168e-05, -6.495416164398193e-05, -5.984306335449219e-05, -5.473196506500244e-05, -4.9620866775512695e-05, -4.450976848602295e-05, -3.93986701965332e-05, -3.428757190704346e-05, -2.917647361755371e-05, -2.4065375328063965e-05, -1.895427703857422e-05, -1.3843178749084473e-05, -8.732080459594727e-06, -3.6209821701049805e-06, 1.4901161193847656e-06, 6.601214408874512e-06, 1.1712312698364258e-05, 1.6823410987854004e-05, 2.193450927734375e-05, 2.7045607566833496e-05, 3.215670585632324e-05, 3.726780414581299e-05, 4.2378902435302734e-05, 4.749000072479248e-05, 5.2601099014282227e-05, 5.771219730377197e-05, 6.282329559326172e-05, 6.793439388275146e-05, 7.304549217224121e-05, 7.815659046173096e-05, 8.32676887512207e-05, 8.837878704071045e-05, 9.34898853302002e-05, 9.860098361968994e-05, 0.00010371208190917969, 0.00010882318019866943, 0.00011393427848815918, 0.00011904537677764893, 0.00012415647506713867, 0.00012926757335662842, 0.00013437867164611816, 0.0001394897699356079, 0.00014460086822509766, 0.0001497119665145874, 0.00015482306480407715, 0.0001599341630935669, 0.00016504526138305664, 0.0001701563596725464, 0.00017526745796203613, 0.00018037855625152588, 0.00018548965454101562]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 3.0, 8.0, 25.0, 22.0, 38.0, 63.0, 121.0, 242.0, 506.0, 1219.0, 4132.0, 20390.0, 686378.0, 311808.0, 17871.0, 3595.0, 1149.0, 471.0, 225.0, 106.0, 66.0, 34.0, 18.0, 13.0, 14.0, 8.0, 5.0, 8.0, 2.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65576171875, -0.6364517211914062, -0.6171417236328125, -0.5978317260742188, -0.578521728515625, -0.5592117309570312, -0.5399017333984375, -0.5205917358398438, -0.50128173828125, -0.48197174072265625, -0.4626617431640625, -0.44335174560546875, -0.424041748046875, -0.40473175048828125, -0.3854217529296875, -0.36611175537109375, -0.3468017578125, -0.32749176025390625, -0.3081817626953125, -0.28887176513671875, -0.269561767578125, -0.25025177001953125, -0.2309417724609375, -0.21163177490234375, -0.19232177734375, -0.17301177978515625, -0.1537017822265625, -0.13439178466796875, -0.115081787109375, -0.09577178955078125, -0.0764617919921875, -0.05715179443359375, -0.037841796875, -0.01853179931640625, 0.0007781982421875, 0.02008819580078125, 0.039398193359375, 0.05870819091796875, 0.0780181884765625, 0.09732818603515625, 0.11663818359375, 0.13594818115234375, 0.1552581787109375, 0.17456817626953125, 0.193878173828125, 0.21318817138671875, 0.2324981689453125, 0.25180816650390625, 0.2711181640625, 0.29042816162109375, 0.3097381591796875, 0.32904815673828125, 0.348358154296875, 0.36766815185546875, 0.3869781494140625, 0.40628814697265625, 0.42559814453125, 0.44490814208984375, 0.4642181396484375, 0.48352813720703125, 0.502838134765625, 0.5221481323242188, 0.5414581298828125, 0.5607681274414062, 0.580078125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 8.0, 14.0, 9.0, 24.0, 18.0, 34.0, 57.0, 64.0, 98.0, 146.0, 184.0, 105.0, 59.0, 47.0, 35.0, 24.0, 16.0, 12.0, 8.0, 4.0, 7.0, 7.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.418701171875, -0.4032325744628906, -0.38776397705078125, -0.3722953796386719, -0.3568267822265625, -0.3413581848144531, -0.32588958740234375, -0.3104209899902344, -0.294952392578125, -0.2794837951660156, -0.26401519775390625, -0.24854660034179688, -0.2330780029296875, -0.21760940551757812, -0.20214080810546875, -0.18667221069335938, -0.17120361328125, -0.15573501586914062, -0.14026641845703125, -0.12479782104492188, -0.1093292236328125, -0.09386062622070312, -0.07839202880859375, -0.06292343139648438, -0.047454833984375, -0.031986236572265625, -0.01651763916015625, -0.001049041748046875, 0.0144195556640625, 0.029888153076171875, 0.04535675048828125, 0.060825347900390625, 0.0762939453125, 0.09176254272460938, 0.10723114013671875, 0.12269973754882812, 0.1381683349609375, 0.15363693237304688, 0.16910552978515625, 0.18457412719726562, 0.200042724609375, 0.21551132202148438, 0.23097991943359375, 0.24644851684570312, 0.2619171142578125, 0.2773857116699219, 0.29285430908203125, 0.3083229064941406, 0.32379150390625, 0.3392601013183594, 0.35472869873046875, 0.3701972961425781, 0.3856658935546875, 0.4011344909667969, 0.41660308837890625, 0.4320716857910156, 0.447540283203125, 0.4630088806152344, 0.47847747802734375, 0.4939460754394531, 0.5094146728515625, 0.5248832702636719, 0.5403518676757812, 0.5558204650878906, 0.5712890625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 14.0, 55.0, 225.0, 503.0, 138.0, 34.0, 16.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.36214828491211, -10.771464347839355, -10.180779457092285, -9.590095520019531, -8.999411582946777, -8.408727645874023, -7.818042755126953, -7.227358818054199, -6.636674404144287, -6.045989990234375, -5.455306053161621, -4.864621639251709, -4.273937225341797, -3.683253288269043, -3.092568874359131, -2.501884937286377, -1.9112005233764648, -1.3205163478851318, -0.7298320531845093, -0.13914775848388672, 0.4515364170074463, 1.0422205924987793, 1.6329050064086914, 2.2235889434814453, 2.8142733573913574, 3.4049575328826904, 3.9956417083740234, 4.5863261222839355, 5.177010536193848, 5.767694473266602, 6.358378887176514, 6.949062824249268, 7.53974723815918, 8.130431175231934, 8.721116065979004, 9.311800003051758, 9.902483940124512, 10.493167877197266, 11.083852767944336, 11.67453670501709, 12.265220642089844, 12.855904579162598, 13.446589469909668, 14.037273406982422, 14.627957344055176, 15.21864128112793, 15.809326171875, 16.400009155273438, 16.99069595336914, 17.58138084411621, 18.17206382751465, 18.76274871826172, 19.35343360900879, 19.944116592407227, 20.534801483154297, 21.125484466552734, 21.716169357299805, 22.306854248046875, 22.897537231445312, 23.488222122192383, 24.078907012939453, 24.66958999633789, 25.26027488708496, 25.85095977783203, 26.44164276123047]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 0.0, 4.0, 2.0, 3.0, 5.0, 10.0, 5.0, 10.0, 10.0, 14.0, 8.0, 8.0, 16.0, 19.0, 16.0, 18.0, 21.0, 23.0, 21.0, 43.0, 41.0, 62.0, 64.0, 76.0, 61.0, 66.0, 58.0, 29.0, 28.0, 33.0, 33.0, 25.0, 22.0, 24.0, 21.0, 19.0, 19.0, 12.0, 9.0, 7.0, 6.0, 7.0, 5.0, 2.0, 6.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-6.698087692260742, -6.502269268035889, -6.306451320648193, -6.11063289642334, -5.9148149490356445, -5.718996524810791, -5.523178577423096, -5.327360153198242, -5.131542205810547, -4.935723781585693, -4.739905834197998, -4.5440874099731445, -4.348269462585449, -4.152451038360596, -3.9566330909729004, -3.760814666748047, -3.5649964809417725, -3.369178295135498, -3.1733601093292236, -2.977541923522949, -2.781723737716675, -2.5859055519104004, -2.390087127685547, -2.1942691802978516, -1.9984508752822876, -1.8026326894760132, -1.6068145036697388, -1.4109961986541748, -1.2151780128479004, -1.019359827041626, -0.8235416412353516, -0.6277234554290771, -0.43190526962280273, -0.23608706891536713, -0.04026886820793152, 0.15554934740066528, 0.3513675332069397, 0.5471857190132141, 0.7430039644241333, 0.9388221502304077, 1.1346403360366821, 1.3304585218429565, 1.526276707649231, 1.722095012664795, 1.9179131984710693, 2.1137313842773438, 2.309549570083618, 2.5053677558898926, 2.701185941696167, 2.8970041275024414, 3.092822313308716, 3.2886404991149902, 3.4844586849212646, 3.680276870727539, 3.8760952949523926, 4.071913242340088, 4.267731666564941, 4.463550090789795, 4.65936803817749, 4.855186462402344, 5.051004409790039, 5.246822834014893, 5.442640781402588, 5.638459205627441, 5.834277153015137]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 8.0, 10.0, 11.0, 19.0, 28.0, 20.0, 60.0, 92.0, 112.0, 171.0, 279.0, 431.0, 736.0, 1460.0, 2929.0, 6118.0, 15822.0, 58621.0, 365957.0, 1813143.0, 1566996.0, 286600.0, 49870.0, 13810.0, 5424.0, 2524.0, 1295.0, 717.0, 395.0, 237.0, 126.0, 93.0, 56.0, 35.0, 24.0, 15.0, 15.0, 8.0, 6.0, 8.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.845703125, -0.8221664428710938, -0.7986297607421875, -0.7750930786132812, -0.751556396484375, -0.7280197143554688, -0.7044830322265625, -0.6809463500976562, -0.65740966796875, -0.6338729858398438, -0.6103363037109375, -0.5867996215820312, -0.563262939453125, -0.5397262573242188, -0.5161895751953125, -0.49265289306640625, -0.4691162109375, -0.44557952880859375, -0.4220428466796875, -0.39850616455078125, -0.374969482421875, -0.35143280029296875, -0.3278961181640625, -0.30435943603515625, -0.28082275390625, -0.25728607177734375, -0.2337493896484375, -0.21021270751953125, -0.186676025390625, -0.16313934326171875, -0.1396026611328125, -0.11606597900390625, -0.092529296875, -0.06899261474609375, -0.0454559326171875, -0.02191925048828125, 0.001617431640625, 0.02515411376953125, 0.0486907958984375, 0.07222747802734375, 0.09576416015625, 0.11930084228515625, 0.1428375244140625, 0.16637420654296875, 0.189910888671875, 0.21344757080078125, 0.2369842529296875, 0.26052093505859375, 0.2840576171875, 0.30759429931640625, 0.3311309814453125, 0.35466766357421875, 0.378204345703125, 0.40174102783203125, 0.4252777099609375, 0.44881439208984375, 0.47235107421875, 0.49588775634765625, 0.5194244384765625, 0.5429611206054688, 0.566497802734375, 0.5900344848632812, 0.6135711669921875, 0.6371078491210938, 0.66064453125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 5.0, 14.0, 12.0, 15.0, 16.0, 22.0, 37.0, 24.0, 32.0, 26.0, 50.0, 43.0, 52.0, 57.0, 54.0, 55.0, 49.0, 38.0, 43.0, 42.0, 44.0, 38.0, 40.0, 26.0, 32.0, 33.0, 18.0, 10.0, 10.0, 14.0, 11.0, 8.0, 7.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.5244140625, -0.5102043151855469, -0.49599456787109375, -0.4817848205566406, -0.4675750732421875, -0.4533653259277344, -0.43915557861328125, -0.4249458312988281, -0.410736083984375, -0.3965263366699219, -0.38231658935546875, -0.3681068420410156, -0.3538970947265625, -0.3396873474121094, -0.32547760009765625, -0.3112678527832031, -0.29705810546875, -0.2828483581542969, -0.26863861083984375, -0.2544288635253906, -0.2402191162109375, -0.22600936889648438, -0.21179962158203125, -0.19758987426757812, -0.183380126953125, -0.16917037963867188, -0.15496063232421875, -0.14075088500976562, -0.1265411376953125, -0.11233139038085938, -0.09812164306640625, -0.08391189575195312, -0.0697021484375, -0.055492401123046875, -0.04128265380859375, -0.027072906494140625, -0.0128631591796875, 0.001346588134765625, 0.01555633544921875, 0.029766082763671875, 0.043975830078125, 0.058185577392578125, 0.07239532470703125, 0.08660507202148438, 0.1008148193359375, 0.11502456665039062, 0.12923431396484375, 0.14344406127929688, 0.15765380859375, 0.17186355590820312, 0.18607330322265625, 0.20028305053710938, 0.2144927978515625, 0.22870254516601562, 0.24291229248046875, 0.2571220397949219, 0.271331787109375, 0.2855415344238281, 0.29975128173828125, 0.3139610290527344, 0.3281707763671875, 0.3423805236816406, 0.35659027099609375, 0.3708000183105469, 0.385009765625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 6.0, 3.0, 7.0, 15.0, 23.0, 37.0, 51.0, 80.0, 180.0, 387.0, 862.0, 2223.0, 12339.0, 3749492.0, 418850.0, 6767.0, 1684.0, 671.0, 286.0, 143.0, 59.0, 28.0, 32.0, 15.0, 16.0, 6.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.11328125, -3.995269775390625, -3.87725830078125, -3.759246826171875, -3.6412353515625, -3.523223876953125, -3.40521240234375, -3.287200927734375, -3.169189453125, -3.051177978515625, -2.93316650390625, -2.815155029296875, -2.6971435546875, -2.579132080078125, -2.46112060546875, -2.343109130859375, -2.22509765625, -2.107086181640625, -1.98907470703125, -1.871063232421875, -1.7530517578125, -1.635040283203125, -1.51702880859375, -1.399017333984375, -1.281005859375, -1.162994384765625, -1.04498291015625, -0.926971435546875, -0.8089599609375, -0.690948486328125, -0.57293701171875, -0.454925537109375, -0.3369140625, -0.218902587890625, -0.10089111328125, 0.017120361328125, 0.1351318359375, 0.253143310546875, 0.37115478515625, 0.489166259765625, 0.607177734375, 0.725189208984375, 0.84320068359375, 0.961212158203125, 1.0792236328125, 1.197235107421875, 1.31524658203125, 1.433258056640625, 1.55126953125, 1.669281005859375, 1.78729248046875, 1.905303955078125, 2.0233154296875, 2.141326904296875, 2.25933837890625, 2.377349853515625, 2.495361328125, 2.613372802734375, 2.73138427734375, 2.849395751953125, 2.9674072265625, 3.085418701171875, 3.20343017578125, 3.321441650390625, 3.439453125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 7.0, 14.0, 31.0, 51.0, 106.0, 207.0, 465.0, 840.0, 997.0, 638.0, 322.0, 199.0, 89.0, 50.0, 27.0, 15.0, 9.0, 11.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9609375, -3.8771820068359375, -3.793426513671875, -3.7096710205078125, -3.62591552734375, -3.5421600341796875, -3.458404541015625, -3.3746490478515625, -3.2908935546875, -3.2071380615234375, -3.123382568359375, -3.0396270751953125, -2.95587158203125, -2.8721160888671875, -2.788360595703125, -2.7046051025390625, -2.620849609375, -2.5370941162109375, -2.453338623046875, -2.3695831298828125, -2.28582763671875, -2.2020721435546875, -2.118316650390625, -2.0345611572265625, -1.9508056640625, -1.8670501708984375, -1.783294677734375, -1.6995391845703125, -1.61578369140625, -1.5320281982421875, -1.448272705078125, -1.3645172119140625, -1.28076171875, -1.1970062255859375, -1.113250732421875, -1.0294952392578125, -0.94573974609375, -0.8619842529296875, -0.778228759765625, -0.6944732666015625, -0.6107177734375, -0.5269622802734375, -0.443206787109375, -0.3594512939453125, -0.27569580078125, -0.1919403076171875, -0.108184814453125, -0.0244293212890625, 0.059326171875, 0.1430816650390625, 0.226837158203125, 0.3105926513671875, 0.39434814453125, 0.4781036376953125, 0.561859130859375, 0.6456146240234375, 0.7293701171875, 0.8131256103515625, 0.896881103515625, 0.9806365966796875, 1.06439208984375, 1.1481475830078125, 1.231903076171875, 1.3156585693359375, 1.3994140625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 6.0, 7.0, 7.0, 8.0, 12.0, 22.0, 22.0, 45.0, 71.0, 129.0, 145.0, 144.0, 138.0, 88.0, 52.0, 30.0, 20.0, 9.0, 10.0, 4.0, 5.0, 6.0, 1.0, 5.0, 3.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.983972549438477, -9.551544189453125, -9.119115829467773, -8.686687469482422, -8.254258155822754, -7.821829795837402, -7.389401435852051, -6.956973075866699, -6.524544715881348, -6.092116355895996, -5.659687519073486, -5.227259159088135, -4.794830799102783, -4.362401962280273, -3.929973602294922, -3.4975452423095703, -3.0651164054870605, -2.63268780708313, -2.2002594470977783, -1.7678308486938477, -1.3354023694992065, -0.9029738903045654, -0.47054529190063477, -0.0381169319152832, 0.39431166648864746, 0.8267401456832886, 1.2591686248779297, 1.6915972232818604, 2.124025821685791, 2.5564541816711426, 2.9888827800750732, 3.421311140060425, 3.8537397384643555, 4.286168098449707, 4.718596935272217, 5.151025295257568, 5.58345365524292, 6.01588249206543, 6.448310852050781, 6.880739212036133, 7.313167572021484, 7.745595932006836, 8.178024291992188, 8.610452651977539, 9.042881965637207, 9.475310325622559, 9.90773868560791, 10.340167045593262, 10.77259635925293, 11.205024719238281, 11.637453079223633, 12.069881439208984, 12.502310752868652, 12.934739112854004, 13.367167472839355, 13.799595832824707, 14.232024192810059, 14.66445255279541, 15.096880912780762, 15.52931022644043, 15.961738586425781, 16.394166946411133, 16.826595306396484, 17.259023666381836, 17.691452026367188]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 2.0, 6.0, 4.0, 5.0, 8.0, 7.0, 8.0, 16.0, 14.0, 19.0, 16.0, 37.0, 44.0, 44.0, 39.0, 49.0, 56.0, 72.0, 62.0, 63.0, 61.0, 46.0, 36.0, 40.0, 31.0, 36.0, 35.0, 30.0, 12.0, 18.0, 12.0, 17.0, 5.0, 6.0, 10.0, 6.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-9.444842338562012, -9.149336814880371, -8.85383129119873, -8.55832576751709, -8.26282024383545, -7.967314720153809, -7.67180871963501, -7.376303195953369, -7.0807976722717285, -6.785292148590088, -6.489786624908447, -6.194281101226807, -5.898775100708008, -5.603269577026367, -5.307764053344727, -5.012258529663086, -4.716753005981445, -4.421247482299805, -4.125741958618164, -3.8302361965179443, -3.5347306728363037, -3.239225149154663, -2.9437193870544434, -2.6482138633728027, -2.352708339691162, -2.0572028160095215, -1.7616971731185913, -1.4661915302276611, -1.1706860065460205, -0.8751804828643799, -0.5796748399734497, -0.28416919708251953, 0.011335372924804688, 0.3068409562110901, 0.6023465394973755, 0.8978521227836609, 1.1933577060699463, 1.488863229751587, 1.784368872642517, 2.0798745155334473, 2.375380039215088, 2.6708855628967285, 2.966391086578369, 3.261896848678589, 3.5574023723602295, 3.85290789604187, 4.14841365814209, 4.4439191818237305, 4.739424705505371, 5.034930229187012, 5.330435752868652, 5.625941276550293, 5.921446800231934, 6.216952323913574, 6.512458324432373, 6.807963848114014, 7.103469371795654, 7.398974895477295, 7.6944804191589355, 7.989985942840576, 8.285491943359375, 8.580997467041016, 8.876502990722656, 9.172008514404297, 9.467514038085938]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 11.0, 9.0, 23.0, 23.0, 47.0, 58.0, 110.0, 175.0, 304.0, 646.0, 1355.0, 3069.0, 8959.0, 32996.0, 198574.0, 676608.0, 95125.0, 20009.0, 6010.0, 2300.0, 1004.0, 469.0, 275.0, 135.0, 95.0, 55.0, 27.0, 23.0, 20.0, 7.0, 13.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98974609375, -0.9617233276367188, -0.9337005615234375, -0.9056777954101562, -0.877655029296875, -0.8496322631835938, -0.8216094970703125, -0.7935867309570312, -0.76556396484375, -0.7375411987304688, -0.7095184326171875, -0.6814956665039062, -0.653472900390625, -0.6254501342773438, -0.5974273681640625, -0.5694046020507812, -0.5413818359375, -0.5133590698242188, -0.4853363037109375, -0.45731353759765625, -0.429290771484375, -0.40126800537109375, -0.3732452392578125, -0.34522247314453125, -0.31719970703125, -0.28917694091796875, -0.2611541748046875, -0.23313140869140625, -0.205108642578125, -0.17708587646484375, -0.1490631103515625, -0.12104034423828125, -0.093017578125, -0.06499481201171875, -0.0369720458984375, -0.00894927978515625, 0.019073486328125, 0.04709625244140625, 0.0751190185546875, 0.10314178466796875, 0.13116455078125, 0.15918731689453125, 0.1872100830078125, 0.21523284912109375, 0.243255615234375, 0.27127838134765625, 0.2993011474609375, 0.32732391357421875, 0.3553466796875, 0.38336944580078125, 0.4113922119140625, 0.43941497802734375, 0.467437744140625, 0.49546051025390625, 0.5234832763671875, 0.5515060424804688, 0.57952880859375, 0.6075515747070312, 0.6355743408203125, 0.6635971069335938, 0.691619873046875, 0.7196426391601562, 0.7476654052734375, 0.7756881713867188, 0.8037109375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 3.0, 5.0, 5.0, 7.0, 10.0, 15.0, 16.0, 20.0, 29.0, 32.0, 28.0, 39.0, 45.0, 55.0, 63.0, 59.0, 70.0, 49.0, 65.0, 46.0, 60.0, 36.0, 43.0, 31.0, 35.0, 26.0, 22.0, 16.0, 19.0, 12.0, 12.0, 9.0, 6.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.658203125, -0.6383132934570312, -0.6184234619140625, -0.5985336303710938, -0.578643798828125, -0.5587539672851562, -0.5388641357421875, -0.5189743041992188, -0.49908447265625, -0.47919464111328125, -0.4593048095703125, -0.43941497802734375, -0.419525146484375, -0.39963531494140625, -0.3797454833984375, -0.35985565185546875, -0.3399658203125, -0.32007598876953125, -0.3001861572265625, -0.28029632568359375, -0.260406494140625, -0.24051666259765625, -0.2206268310546875, -0.20073699951171875, -0.18084716796875, -0.16095733642578125, -0.1410675048828125, -0.12117767333984375, -0.101287841796875, -0.08139801025390625, -0.0615081787109375, -0.04161834716796875, -0.021728515625, -0.00183868408203125, 0.0180511474609375, 0.03794097900390625, 0.057830810546875, 0.07772064208984375, 0.0976104736328125, 0.11750030517578125, 0.13739013671875, 0.15727996826171875, 0.1771697998046875, 0.19705963134765625, 0.216949462890625, 0.23683929443359375, 0.2567291259765625, 0.27661895751953125, 0.2965087890625, 0.31639862060546875, 0.3362884521484375, 0.35617828369140625, 0.376068115234375, 0.39595794677734375, 0.4158477783203125, 0.43573760986328125, 0.45562744140625, 0.47551727294921875, 0.4954071044921875, 0.5152969360351562, 0.535186767578125, 0.5550765991210938, 0.5749664306640625, 0.5948562622070312, 0.61474609375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 8.0, 8.0, 12.0, 14.0, 24.0, 27.0, 52.0, 59.0, 98.0, 196.0, 351.0, 652.0, 1933.0, 10657.0, 602904.0, 417660.0, 10394.0, 1957.0, 653.0, 344.0, 168.0, 114.0, 81.0, 41.0, 35.0, 20.0, 19.0, 16.0, 17.0, 8.0, 5.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.626953125, -1.5790863037109375, -1.531219482421875, -1.4833526611328125, -1.43548583984375, -1.3876190185546875, -1.339752197265625, -1.2918853759765625, -1.2440185546875, -1.1961517333984375, -1.148284912109375, -1.1004180908203125, -1.05255126953125, -1.0046844482421875, -0.956817626953125, -0.9089508056640625, -0.861083984375, -0.8132171630859375, -0.765350341796875, -0.7174835205078125, -0.66961669921875, -0.6217498779296875, -0.573883056640625, -0.5260162353515625, -0.4781494140625, -0.4302825927734375, -0.382415771484375, -0.3345489501953125, -0.28668212890625, -0.2388153076171875, -0.190948486328125, -0.1430816650390625, -0.09521484375, -0.0473480224609375, 0.000518798828125, 0.0483856201171875, 0.09625244140625, 0.1441192626953125, 0.191986083984375, 0.2398529052734375, 0.2877197265625, 0.3355865478515625, 0.383453369140625, 0.4313201904296875, 0.47918701171875, 0.5270538330078125, 0.574920654296875, 0.6227874755859375, 0.670654296875, 0.7185211181640625, 0.766387939453125, 0.8142547607421875, 0.86212158203125, 0.9099884033203125, 0.957855224609375, 1.0057220458984375, 1.0535888671875, 1.1014556884765625, 1.149322509765625, 1.1971893310546875, 1.24505615234375, 1.2929229736328125, 1.340789794921875, 1.3886566162109375, 1.4365234375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 5.0, 2.0, 7.0, 6.0, 7.0, 8.0, 6.0, 19.0, 13.0, 25.0, 20.0, 26.0, 37.0, 43.0, 38.0, 49.0, 74.0, 79.0, 102.0, 85.0, 54.0, 45.0, 40.0, 41.0, 26.0, 24.0, 20.0, 12.0, 24.0, 10.0, 15.0, 11.0, 11.0, 1.0, 4.0, 1.0, 3.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.240234375, -2.16387939453125, -2.0875244140625, -2.01116943359375, -1.934814453125, -1.85845947265625, -1.7821044921875, -1.70574951171875, -1.62939453125, -1.55303955078125, -1.4766845703125, -1.40032958984375, -1.323974609375, -1.24761962890625, -1.1712646484375, -1.09490966796875, -1.0185546875, -0.94219970703125, -0.8658447265625, -0.78948974609375, -0.713134765625, -0.63677978515625, -0.5604248046875, -0.48406982421875, -0.40771484375, -0.33135986328125, -0.2550048828125, -0.17864990234375, -0.102294921875, -0.02593994140625, 0.0504150390625, 0.12677001953125, 0.203125, 0.27947998046875, 0.3558349609375, 0.43218994140625, 0.508544921875, 0.58489990234375, 0.6612548828125, 0.73760986328125, 0.81396484375, 0.89031982421875, 0.9666748046875, 1.04302978515625, 1.119384765625, 1.19573974609375, 1.2720947265625, 1.34844970703125, 1.4248046875, 1.50115966796875, 1.5775146484375, 1.65386962890625, 1.730224609375, 1.80657958984375, 1.8829345703125, 1.95928955078125, 2.03564453125, 2.11199951171875, 2.1883544921875, 2.26470947265625, 2.341064453125, 2.41741943359375, 2.4937744140625, 2.57012939453125, 2.646484375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 11.0, 9.0, 7.0, 12.0, 28.0, 33.0, 40.0, 88.0, 140.0, 330.0, 787.0, 2357.0, 12511.0, 779450.0, 238475.0, 10625.0, 2213.0, 727.0, 303.0, 150.0, 96.0, 46.0, 28.0, 18.0, 19.0, 12.0, 8.0, 7.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2181396484375, -0.20863914489746094, -0.19913864135742188, -0.1896381378173828, -0.18013763427734375, -0.1706371307373047, -0.16113662719726562, -0.15163612365722656, -0.1421356201171875, -0.13263511657714844, -0.12313461303710938, -0.11363410949707031, -0.10413360595703125, -0.09463310241699219, -0.08513259887695312, -0.07563209533691406, -0.066131591796875, -0.05663108825683594, -0.047130584716796875, -0.03763008117675781, -0.02812957763671875, -0.018629074096679688, -0.009128570556640625, 0.0003719329833984375, 0.0098724365234375, 0.019372940063476562, 0.028873443603515625, 0.03837394714355469, 0.04787445068359375, 0.05737495422363281, 0.06687545776367188, 0.07637596130371094, 0.08587646484375, 0.09537696838378906, 0.10487747192382812, 0.11437797546386719, 0.12387847900390625, 0.1333789825439453, 0.14287948608398438, 0.15237998962402344, 0.1618804931640625, 0.17138099670410156, 0.18088150024414062, 0.1903820037841797, 0.19988250732421875, 0.2093830108642578, 0.21888351440429688, 0.22838401794433594, 0.237884521484375, 0.24738502502441406, 0.2568855285644531, 0.2663860321044922, 0.27588653564453125, 0.2853870391845703, 0.2948875427246094, 0.30438804626464844, 0.3138885498046875, 0.32338905334472656, 0.3328895568847656, 0.3423900604248047, 0.35189056396484375, 0.3613910675048828, 0.3708915710449219, 0.38039207458496094, 0.389892578125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 6.0, 11.0, 5.0, 9.0, 19.0, 24.0, 19.0, 29.0, 37.0, 57.0, 73.0, 82.0, 83.0, 93.0, 104.0, 77.0, 64.0, 40.0, 34.0, 27.0, 13.0, 17.0, 11.0, 9.0, 8.0, 7.0, 5.0, 5.0, 3.0, 3.0, 4.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-4.470348358154297e-05, -4.343502223491669e-05, -4.2166560888290405e-05, -4.0898099541664124e-05, -3.962963819503784e-05, -3.836117684841156e-05, -3.709271550178528e-05, -3.5824254155158997e-05, -3.4555792808532715e-05, -3.328733146190643e-05, -3.201887011528015e-05, -3.075040876865387e-05, -2.9481947422027588e-05, -2.8213486075401306e-05, -2.6945024728775024e-05, -2.5676563382148743e-05, -2.440810203552246e-05, -2.313964068889618e-05, -2.1871179342269897e-05, -2.0602717995643616e-05, -1.9334256649017334e-05, -1.8065795302391052e-05, -1.679733395576477e-05, -1.552887260913849e-05, -1.4260411262512207e-05, -1.2991949915885925e-05, -1.1723488569259644e-05, -1.0455027222633362e-05, -9.18656587600708e-06, -7.918104529380798e-06, -6.649643182754517e-06, -5.381181836128235e-06, -4.112720489501953e-06, -2.8442591428756714e-06, -1.5757977962493896e-06, -3.073364496231079e-07, 9.611248970031738e-07, 2.2295862436294556e-06, 3.4980475902557373e-06, 4.766508936882019e-06, 6.034970283508301e-06, 7.3034316301345825e-06, 8.571892976760864e-06, 9.840354323387146e-06, 1.1108815670013428e-05, 1.237727701663971e-05, 1.3645738363265991e-05, 1.4914199709892273e-05, 1.6182661056518555e-05, 1.7451122403144836e-05, 1.8719583749771118e-05, 1.99880450963974e-05, 2.125650644302368e-05, 2.2524967789649963e-05, 2.3793429136276245e-05, 2.5061890482902527e-05, 2.633035182952881e-05, 2.759881317615509e-05, 2.8867274522781372e-05, 3.0135735869407654e-05, 3.1404197216033936e-05, 3.267265856266022e-05, 3.39411199092865e-05, 3.520958125591278e-05, 3.647804260253906e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 12.0, 6.0, 16.0, 19.0, 35.0, 50.0, 60.0, 93.0, 154.0, 264.0, 439.0, 877.0, 1908.0, 4389.0, 13158.0, 61755.0, 868023.0, 73574.0, 14731.0, 4839.0, 1914.0, 1001.0, 480.0, 270.0, 175.0, 94.0, 70.0, 34.0, 28.0, 19.0, 18.0, 14.0, 5.0, 3.0, 4.0, 8.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1766357421875, -0.1706562042236328, -0.16467666625976562, -0.15869712829589844, -0.15271759033203125, -0.14673805236816406, -0.14075851440429688, -0.1347789764404297, -0.1287994384765625, -0.12281990051269531, -0.11684036254882812, -0.11086082458496094, -0.10488128662109375, -0.09890174865722656, -0.09292221069335938, -0.08694267272949219, -0.080963134765625, -0.07498359680175781, -0.06900405883789062, -0.06302452087402344, -0.05704498291015625, -0.05106544494628906, -0.045085906982421875, -0.03910636901855469, -0.0331268310546875, -0.027147293090820312, -0.021167755126953125, -0.015188217163085938, -0.00920867919921875, -0.0032291412353515625, 0.002750396728515625, 0.008729934692382812, 0.01470947265625, 0.020689010620117188, 0.026668548583984375, 0.03264808654785156, 0.03862762451171875, 0.04460716247558594, 0.050586700439453125, 0.05656623840332031, 0.0625457763671875, 0.06852531433105469, 0.07450485229492188, 0.08048439025878906, 0.08646392822265625, 0.09244346618652344, 0.09842300415039062, 0.10440254211425781, 0.110382080078125, 0.11636161804199219, 0.12234115600585938, 0.12832069396972656, 0.13430023193359375, 0.14027976989746094, 0.14625930786132812, 0.1522388458251953, 0.1582183837890625, 0.1641979217529297, 0.17017745971679688, 0.17615699768066406, 0.18213653564453125, 0.18811607360839844, 0.19409561157226562, 0.2000751495361328, 0.2060546875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 5.0, 3.0, 1.0, 4.0, 3.0, 5.0, 4.0, 4.0, 4.0, 7.0, 16.0, 21.0, 26.0, 37.0, 58.0, 93.0, 166.0, 143.0, 116.0, 85.0, 53.0, 45.0, 27.0, 18.0, 14.0, 7.0, 8.0, 8.0, 2.0, 2.0, 7.0, 5.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.249267578125, -0.24073028564453125, -0.2321929931640625, -0.22365570068359375, -0.215118408203125, -0.20658111572265625, -0.1980438232421875, -0.18950653076171875, -0.18096923828125, -0.17243194580078125, -0.1638946533203125, -0.15535736083984375, -0.146820068359375, -0.13828277587890625, -0.1297454833984375, -0.12120819091796875, -0.1126708984375, -0.10413360595703125, -0.0955963134765625, -0.08705902099609375, -0.078521728515625, -0.06998443603515625, -0.0614471435546875, -0.05290985107421875, -0.04437255859375, -0.03583526611328125, -0.0272979736328125, -0.01876068115234375, -0.010223388671875, -0.00168609619140625, 0.0068511962890625, 0.01538848876953125, 0.02392578125, 0.03246307373046875, 0.0410003662109375, 0.04953765869140625, 0.058074951171875, 0.06661224365234375, 0.0751495361328125, 0.08368682861328125, 0.09222412109375, 0.10076141357421875, 0.1092987060546875, 0.11783599853515625, 0.126373291015625, 0.13491058349609375, 0.1434478759765625, 0.15198516845703125, 0.1605224609375, 0.16905975341796875, 0.1775970458984375, 0.18613433837890625, 0.194671630859375, 0.20320892333984375, 0.2117462158203125, 0.22028350830078125, 0.22882080078125, 0.23735809326171875, 0.2458953857421875, 0.25443267822265625, 0.262969970703125, 0.27150726318359375, 0.2800445556640625, 0.28858184814453125, 0.297119140625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 4.0, 11.0, 42.0, 150.0, 594.0, 138.0, 39.0, 17.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.80231475830078, -16.2125301361084, -15.622745513916016, -15.032960891723633, -14.44317626953125, -13.853391647338867, -13.2636079788208, -12.673823356628418, -12.084038734436035, -11.494254112243652, -10.90446949005127, -10.314684867858887, -9.72490119934082, -9.135116577148438, -8.545331954956055, -7.955547332763672, -7.365762710571289, -6.775978088378906, -6.186193466186523, -5.596409320831299, -5.006624698638916, -4.416840076446533, -3.8270556926727295, -3.237271308898926, -2.647486686706543, -2.05770206451416, -1.4679176807403564, -0.8781331777572632, -0.2883486747741699, 0.3014359474182129, 0.8912203311920166, 1.4810047149658203, 2.0707874298095703, 2.660572052001953, 3.250356435775757, 3.8401408195495605, 4.429925441741943, 5.019710063934326, 5.609494209289551, 6.199278831481934, 6.789063453674316, 7.378848075866699, 7.968632698059082, 8.558417320251465, 9.148200988769531, 9.737985610961914, 10.327770233154297, 10.91755485534668, 11.507339477539062, 12.097124099731445, 12.686908721923828, 13.276693344116211, 13.866477966308594, 14.456262588500977, 15.046046257019043, 15.635830879211426, 16.225616455078125, 16.815401077270508, 17.40518569946289, 17.994970321655273, 18.584754943847656, 19.17453956604004, 19.764324188232422, 20.354106903076172, 20.943891525268555]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 3.0, 7.0, 11.0, 9.0, 16.0, 23.0, 15.0, 19.0, 23.0, 32.0, 42.0, 69.0, 101.0, 135.0, 133.0, 87.0, 52.0, 38.0, 33.0, 22.0, 18.0, 17.0, 21.0, 14.0, 12.0, 5.0, 9.0, 6.0, 7.0, 6.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.367238998413086, -9.098390579223633, -8.82954216003418, -8.560693740844727, -8.291845321655273, -8.02299690246582, -7.754148960113525, -7.485300540924072, -7.216452598571777, -6.947604179382324, -6.678755760192871, -6.409907341003418, -6.141059398651123, -5.87221097946167, -5.603362560272217, -5.334514141082764, -5.0656657218933105, -4.796817302703857, -4.527968883514404, -4.259120941162109, -3.9902725219726562, -3.721424102783203, -3.45257568359375, -3.183727264404297, -2.914879083633423, -2.6460306644439697, -2.3771824836730957, -2.1083340644836426, -1.839485764503479, -1.5706374645233154, -1.3017890453338623, -1.0329407453536987, -0.7640924453735352, -0.4952441155910492, -0.22639578580856323, 0.04245257377624512, 0.3113008737564087, 0.5801491737365723, 0.8489975929260254, 1.117845892906189, 1.3866941928863525, 1.6555424928665161, 1.9243907928466797, 2.193239212036133, 2.462087631225586, 2.73093581199646, 2.999784231185913, 3.268632411956787, 3.5374808311462402, 3.8063292503356934, 4.0751776695251465, 4.344025611877441, 4.6128740310668945, 4.881722450256348, 5.150570869445801, 5.419419288635254, 5.688267707824707, 5.95711612701416, 6.225964546203613, 6.494812965393066, 6.763660907745361, 7.0325093269348145, 7.301357746124268, 7.570206165313721, 7.839054107666016]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 3.0, 8.0, 9.0, 19.0, 19.0, 17.0, 38.0, 28.0, 40.0, 45.0, 42.0, 79.0, 265.0, 94.0, 54.0, 42.0, 28.0, 35.0, 20.0, 21.0, 19.0, 15.0, 13.0, 9.0, 5.0, 7.0, 5.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6279296875, -0.6074142456054688, -0.5868988037109375, -0.5663833618164062, -0.545867919921875, -0.5253524780273438, -0.5048370361328125, -0.48432159423828125, -0.46380615234375, -0.44329071044921875, -0.4227752685546875, -0.40225982666015625, -0.381744384765625, -0.36122894287109375, -0.3407135009765625, -0.32019805908203125, -0.2996826171875, -0.27916717529296875, -0.2586517333984375, -0.23813629150390625, -0.217620849609375, -0.19710540771484375, -0.1765899658203125, -0.15607452392578125, -0.13555908203125, -0.11504364013671875, -0.0945281982421875, -0.07401275634765625, -0.053497314453125, -0.03298187255859375, -0.0124664306640625, 0.00804901123046875, 0.028564453125, 0.04907989501953125, 0.0695953369140625, 0.09011077880859375, 0.110626220703125, 0.13114166259765625, 0.1516571044921875, 0.17217254638671875, 0.19268798828125, 0.21320343017578125, 0.2337188720703125, 0.25423431396484375, 0.274749755859375, 0.29526519775390625, 0.3157806396484375, 0.33629608154296875, 0.3568115234375, 0.37732696533203125, 0.3978424072265625, 0.41835784912109375, 0.438873291015625, 0.45938873291015625, 0.4799041748046875, 0.5004196166992188, 0.52093505859375, 0.5414505004882812, 0.5619659423828125, 0.5824813842773438, 0.602996826171875, 0.6235122680664062, 0.6440277099609375, 0.6645431518554688, 0.68505859375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 6.0, 11.0, 0.0, 10.0, 7.0, 11.0, 15.0, 22.0, 31.0, 47.0, 108.0, 146.0, 326.0, 963.0, 5676.0, 8343872.0, 33906.0, 2392.0, 560.0, 221.0, 96.0, 65.0, 30.0, 13.0, 14.0, 14.0, 5.0, 9.0, 4.0, 6.0, 1.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.962745189666748, -6.750376224517822, -6.538007736206055, -6.325638771057129, -6.113269805908203, -5.900900840759277, -5.688531875610352, -5.476163387298584, -5.263794422149658, -5.051425457000732, -4.839056968688965, -4.626688003540039, -4.414319038391113, -4.2019500732421875, -3.989581346511841, -3.777212619781494, -3.5648436546325684, -3.3524746894836426, -3.140105962753296, -2.927737236022949, -2.7153682708740234, -2.5029993057250977, -2.290630578994751, -2.0782618522644043, -1.8658928871154785, -1.6535240411758423, -1.441155195236206, -1.2287863492965698, -1.0164175033569336, -0.8040486574172974, -0.5916798114776611, -0.3793109655380249, -0.16694164276123047, 0.04542720317840576, 0.257796049118042, 0.4701648950576782, 0.6825337409973145, 0.8949025869369507, 1.107271432876587, 1.3196402788162231, 1.5320091247558594, 1.7443779706954956, 1.9567468166351318, 2.1691155433654785, 2.3814845085144043, 2.59385347366333, 2.8062222003936768, 3.0185909271240234, 3.230959892272949, 3.443328857421875, 3.6556975841522217, 3.8680663108825684, 4.080435276031494, 4.29280424118042, 4.5051727294921875, 4.717541694641113, 4.929910659790039, 5.142279624938965, 5.354648590087891, 5.567017078399658, 5.779386043548584, 5.99175500869751, 6.204123497009277, 6.416492462158203, 6.628861427307129]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 4.0, 4.0, 2.0, 5.0, 4.0, 2.0, 2.0, 8.0, 7.0, 6.0, 1.0, 8.0, 1.0, 4.0, 7.0, 5.0, 4.0, 3.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-9.03990364074707, -8.761964797973633, -8.484025955200195, -8.206087112426758, -7.928147792816162, -7.650208950042725, -7.372270107269287, -7.09433126449585, -6.816391944885254, -6.538453102111816, -6.260514259338379, -5.982575416564941, -5.704636096954346, -5.426697254180908, -5.148758411407471, -4.870819568634033, -4.592880725860596, -4.314941883087158, -4.037003040313721, -3.759063959121704, -3.4811248779296875, -3.20318603515625, -2.9252471923828125, -2.647308349609375, -2.3693692684173584, -2.091430425643921, -1.8134913444519043, -1.5355525016784668, -1.2576135396957397, -0.9796745777130127, -0.7017357349395752, -0.42379677295684814, -0.1458578109741211, 0.13208112120628357, 0.41002005338668823, 0.6879589557647705, 0.9658979177474976, 1.2438368797302246, 1.521775722503662, 1.7997146844863892, 2.077653646469116, 2.3555924892425537, 2.6335315704345703, 2.911470413208008, 3.1894092559814453, 3.467348337173462, 3.7452871799468994, 4.023226261138916, 4.3011651039123535, 4.579103946685791, 4.8570427894592285, 5.134982109069824, 5.412920951843262, 5.690859794616699, 5.968798637390137, 6.246737480163574, 6.524676322937012, 6.802615165710449, 7.080554008483887, 7.358492851257324, 7.63643217086792, 7.914371013641357, 8.192310333251953, 8.47024917602539, 8.748188018798828]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 7.0, 11.0, 18.0, 23.0, 31.0, 51.0, 46.0, 61.0, 69.0, 96.0, 106.0, 98.0, 70.0, 78.0, 44.0, 44.0, 33.0, 29.0, 17.0, 11.0, 12.0, 8.0, 9.0, 11.0, 3.0, 1.0, 2.0, 0.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.367431640625, -0.3561363220214844, -0.34484100341796875, -0.3335456848144531, -0.3222503662109375, -0.3109550476074219, -0.29965972900390625, -0.2883644104003906, -0.277069091796875, -0.2657737731933594, -0.25447845458984375, -0.24318313598632812, -0.2318878173828125, -0.22059249877929688, -0.20929718017578125, -0.19800186157226562, -0.18670654296875, -0.17541122436523438, -0.16411590576171875, -0.15282058715820312, -0.1415252685546875, -0.13022994995117188, -0.11893463134765625, -0.10763931274414062, -0.096343994140625, -0.08504867553710938, -0.07375335693359375, -0.062458038330078125, -0.0511627197265625, -0.039867401123046875, -0.02857208251953125, -0.017276763916015625, -0.0059814453125, 0.005313873291015625, 0.01660919189453125, 0.027904510498046875, 0.0391998291015625, 0.050495147705078125, 0.06179046630859375, 0.07308578491210938, 0.084381103515625, 0.09567642211914062, 0.10697174072265625, 0.11826705932617188, 0.1295623779296875, 0.14085769653320312, 0.15215301513671875, 0.16344833374023438, 0.17474365234375, 0.18603897094726562, 0.19733428955078125, 0.20862960815429688, 0.2199249267578125, 0.23122024536132812, 0.24251556396484375, 0.2538108825683594, 0.265106201171875, 0.2764015197753906, 0.28769683837890625, 0.2989921569824219, 0.3102874755859375, 0.3215827941894531, 0.33287811279296875, 0.3441734313964844, 0.35546875]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 10.0, 11.0, 16.0, 27.0, 35.0, 91.0, 104.0, 210.0, 406.0, 850.0, 2135.0, 5991.0, 20478.0, 78782.0, 229885.0, 133979.0, 35539.0, 10052.0, 3286.0, 1249.0, 524.0, 277.0, 140.0, 66.0, 59.0, 20.0, 17.0, 12.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.685546875, -3.557098388671875, -3.42864990234375, -3.300201416015625, -3.1717529296875, -3.043304443359375, -2.91485595703125, -2.786407470703125, -2.657958984375, -2.529510498046875, -2.40106201171875, -2.272613525390625, -2.1441650390625, -2.015716552734375, -1.88726806640625, -1.758819580078125, -1.63037109375, -1.501922607421875, -1.37347412109375, -1.245025634765625, -1.1165771484375, -0.988128662109375, -0.85968017578125, -0.731231689453125, -0.602783203125, -0.474334716796875, -0.34588623046875, -0.217437744140625, -0.0889892578125, 0.039459228515625, 0.16790771484375, 0.296356201171875, 0.4248046875, 0.553253173828125, 0.68170166015625, 0.810150146484375, 0.9385986328125, 1.067047119140625, 1.19549560546875, 1.323944091796875, 1.452392578125, 1.580841064453125, 1.70928955078125, 1.837738037109375, 1.9661865234375, 2.094635009765625, 2.22308349609375, 2.351531982421875, 2.47998046875, 2.608428955078125, 2.73687744140625, 2.865325927734375, 2.9937744140625, 3.122222900390625, 3.25067138671875, 3.379119873046875, 3.507568359375, 3.636016845703125, 3.76446533203125, 3.892913818359375, 4.0213623046875, 4.149810791015625, 4.27825927734375, 4.406707763671875, 4.53515625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 6.0, 4.0, 10.0, 11.0, 10.0, 9.0, 15.0, 27.0, 36.0, 38.0, 49.0, 51.0, 71.0, 73.0, 69.0, 81.0, 83.0, 66.0, 59.0, 46.0, 49.0, 34.0, 31.0, 22.0, 17.0, 7.0, 9.0, 5.0, 4.0, 3.0, 8.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55615234375, -0.5337905883789062, -0.5114288330078125, -0.48906707763671875, -0.466705322265625, -0.44434356689453125, -0.4219818115234375, -0.39962005615234375, -0.37725830078125, -0.35489654541015625, -0.3325347900390625, -0.31017303466796875, -0.287811279296875, -0.26544952392578125, -0.2430877685546875, -0.22072601318359375, -0.1983642578125, -0.17600250244140625, -0.1536407470703125, -0.13127899169921875, -0.108917236328125, -0.08655548095703125, -0.0641937255859375, -0.04183197021484375, -0.01947021484375, 0.00289154052734375, 0.0252532958984375, 0.04761505126953125, 0.069976806640625, 0.09233856201171875, 0.1147003173828125, 0.13706207275390625, 0.159423828125, 0.18178558349609375, 0.2041473388671875, 0.22650909423828125, 0.248870849609375, 0.27123260498046875, 0.2935943603515625, 0.31595611572265625, 0.33831787109375, 0.36067962646484375, 0.3830413818359375, 0.40540313720703125, 0.427764892578125, 0.45012664794921875, 0.4724884033203125, 0.49485015869140625, 0.5172119140625, 0.5395736694335938, 0.5619354248046875, 0.5842971801757812, 0.606658935546875, 0.6290206909179688, 0.6513824462890625, 0.6737442016601562, 0.69610595703125, 0.7184677124023438, 0.7408294677734375, 0.7631912231445312, 0.785552978515625, 0.8079147338867188, 0.8302764892578125, 0.8526382446289062, 0.875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 9.0, 11.0, 18.0, 37.0, 93.0, 127.0, 106.0, 34.0, 23.0, 13.0, 5.0, 3.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7304370403289795, -2.5282552242279053, -2.326073408126831, -2.1238913536071777, -1.9217095375061035, -1.7195277214050293, -1.517345905303955, -1.3151639699935913, -1.112982153892517, -0.9108002781867981, -0.7086184024810791, -0.5064365863800049, -0.3042547106742859, -0.1020728349685669, 0.10010898113250732, 0.3022909164428711, 0.5044727325439453, 0.7066546082496643, 0.9088364839553833, 1.1110183000564575, 1.3132002353668213, 1.5153820514678955, 1.7175638675689697, 1.9197458028793335, 2.1219277381896973, 2.3241095542907715, 2.5262913703918457, 2.72847318649292, 2.9306552410125732, 3.1328370571136475, 3.3350188732147217, 3.537200927734375, 3.739382266998291, 3.9415640830993652, 4.1437458992004395, 4.345927715301514, 4.548109531402588, 4.75029182434082, 4.9524736404418945, 5.154655456542969, 5.356837272644043, 5.559019088745117, 5.761200904846191, 5.963382720947266, 6.16556453704834, 6.367746353149414, 6.569928169250488, 6.772110462188721, 6.974291801452637, 7.176473617553711, 7.378655433654785, 7.580837249755859, 7.783019065856934, 7.985200881958008, 8.187382698059082, 8.389564514160156, 8.591747283935547, 8.793929100036621, 8.996110916137695, 9.19829273223877, 9.400474548339844, 9.602656364440918, 9.804838180541992, 10.007019996643066, 10.20920181274414]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 3.0, 6.0, 12.0, 23.0, 16.0, 37.0, 51.0, 68.0, 77.0, 48.0, 41.0, 29.0, 9.0, 8.0, 5.0, 1.0, 4.0, 0.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.290059804916382, -2.211210250854492, -2.1323606967926025, -2.053511142730713, -1.9746617078781128, -1.8958121538162231, -1.816962718963623, -1.7381131649017334, -1.6592636108398438, -1.580414056777954, -1.5015645027160645, -1.4227150678634644, -1.3438655138015747, -1.265015959739685, -1.186166524887085, -1.1073169708251953, -1.0284674167633057, -0.949617862701416, -0.8707683682441711, -0.7919188737869263, -0.7130693197250366, -0.634219765663147, -0.5553702712059021, -0.4765207767486572, -0.3976712226867676, -0.3188216984272003, -0.23997217416763306, -0.1611226499080658, -0.08227312564849854, -0.0034236013889312744, 0.07542592287063599, 0.15427541732788086, 0.2331252098083496, 0.31197473406791687, 0.39082425832748413, 0.4696737825870514, 0.5485233068466187, 0.6273728609085083, 0.7062223553657532, 0.785071849822998, 0.8639214038848877, 0.9427709579467773, 1.021620512008667, 1.100469946861267, 1.1793195009231567, 1.2581690549850464, 1.3370184898376465, 1.4158680438995361, 1.4947175979614258, 1.5735671520233154, 1.652416706085205, 1.7312661409378052, 1.8101156949996948, 1.8889652490615845, 1.9678146839141846, 2.046664237976074, 2.125513792037964, 2.2043633460998535, 2.283212900161743, 2.362062454223633, 2.4409117698669434, 2.519761323928833, 2.5986108779907227, 2.6774604320526123, 2.756309986114502]}, "eval/loss": 4.352957248687744, "eval/wer": 1.7716977389924633, "eval/runtime": 602.6395, "eval/samples_per_second": 4.384, "eval/steps_per_second": 0.549} \ No newline at end of file